| // Copyright (c) 2006-2008 The Chromium Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #ifndef NET_BASE_NET_UTIL_H__ |
| #define NET_BASE_NET_UTIL_H__ |
| |
| #include "build/build_config.h" |
| |
| #ifdef OS_WIN |
| #include <windows.h> |
| #endif |
| |
| #include <string> |
| #include <set> |
| |
| #include "base/basictypes.h" |
| #include "base/string16.h" |
| #include "net/base/escape.h" |
| |
| struct addrinfo; |
| class FilePath; |
| class GURL; |
| |
| namespace base { |
| class Time; |
| } |
| |
| namespace url_canon { |
| struct CanonHostInfo; |
| } |
| |
| namespace url_parse { |
| struct Parsed; |
| } |
| |
| namespace net { |
| |
| // Holds a list of ports that should be accepted despite bans. |
| extern std::set<int> explicitly_allowed_ports; |
| |
| // Given the full path to a file name, creates a file: URL. The returned URL |
| // may not be valid if the input is malformed. |
| GURL FilePathToFileURL(const FilePath& path); |
| |
| // Converts a file: URL back to a filename that can be passed to the OS. The |
| // file URL must be well-formed (GURL::is_valid() must return true); we don't |
| // handle degenerate cases here. Returns true on success, false if it isn't a |
| // valid file URL. On failure, *file_path will be empty. |
| bool FileURLToFilePath(const GURL& url, FilePath* file_path); |
| |
| // Splits an input of the form <host>[":"<port>] into its consitituent parts. |
| // Saves the result into |*host| and |*port|. If the input did not have |
| // the optional port, sets |*port| to -1. |
| // Returns true if the parsing was successful, false otherwise. |
| // The returned host is NOT canonicalized, and may be invalid. If <host> is |
| // an IPv6 literal address, the returned host includes the square brackets. |
| bool ParseHostAndPort(std::string::const_iterator host_and_port_begin, |
| std::string::const_iterator host_and_port_end, |
| std::string* host, |
| int* port); |
| bool ParseHostAndPort(const std::string& host_and_port, |
| std::string* host, |
| int* port); |
| |
| // Returns a host:port string for the given URL. |
| std::string GetHostAndPort(const GURL& url); |
| |
| // Returns a host[:port] string for the given URL, where the port is omitted |
| // if it is the default for the URL's scheme. |
| std::string GetHostAndOptionalPort(const GURL& url); |
| |
| // Returns the string representation of an address, like "192.168.0.1". |
| // Returns empty string on failure. |
| std::string NetAddressToString(const struct addrinfo* net_address); |
| |
| // Returns the hostname of the current system. Returns empty string on failure. |
| std::string GetHostName(); |
| |
| // Extracts the unescaped username/password from |url|, saving the results |
| // into |*username| and |*password|. |
| void GetIdentityFromURL(const GURL& url, |
| std::wstring* username, |
| std::wstring* password); |
| |
| // Return the value of the HTTP response header with name 'name'. 'headers' |
| // should be in the format that URLRequest::GetResponseHeaders() returns. |
| // Returns the empty string if the header is not found. |
| std::wstring GetSpecificHeader(const std::wstring& headers, |
| const std::wstring& name); |
| std::string GetSpecificHeader(const std::string& headers, |
| const std::string& name); |
| |
| // Return the value of the HTTP response header field's parameter named |
| // 'param_name'. Returns the empty string if the parameter is not found or is |
| // improperly formatted. |
| std::wstring GetHeaderParamValue(const std::wstring& field, |
| const std::wstring& param_name); |
| std::string GetHeaderParamValue(const std::string& field, |
| const std::string& param_name); |
| |
| // Return the filename extracted from Content-Disposition header. The following |
| // formats are tried in order listed below: |
| // |
| // 1. RFC 2047 |
| // 2. Raw-8bit-characters : |
| // a. UTF-8, b. referrer_charset, c. default os codepage. |
| // 3. %-escaped UTF-8. |
| // |
| // In step 2, if referrer_charset is empty(i.e. unknown), 2b is skipped. |
| // In step 3, the fallback charsets tried in step 2 are not tried. We |
| // can consider doing that later. |
| // |
| // When a param value is ASCII, but is not in format #1 or format #3 above, |
| // it is returned as it is unless it's pretty close to two supported |
| // formats but not well-formed. In that case, an empty string is returned. |
| // |
| // In any case, a caller must check for the empty return value and resort to |
| // another means to get a filename (e.g. url). |
| // |
| // This function does not do any escaping and callers are responsible for |
| // escaping 'unsafe' characters (e.g. (back)slash, colon) as they see fit. |
| // |
| // TODO(jungshik): revisit this issue. At the moment, the only caller |
| // net_util::GetSuggestedFilename and it calls ReplaceIllegalCharacters. The |
| // other caller is a unit test. Need to figure out expose this function only to |
| // net_util_unittest. |
| // |
| std::wstring GetFileNameFromCD(const std::string& header, |
| const std::string& referrer_charset); |
| |
| // Converts the given host name to unicode characters, APPENDING them to the |
| // the given output string. This can be called for any host name, if the |
| // input is not IDN or is invalid in some way, we'll just append the ASCII |
| // source to the output so it is still usable. |
| // |
| // The input should be the canonicalized ASCII host name from GURL. This |
| // function does NOT accept UTF-8! Its length must also be given (this is |
| // designed to work on the substring of the host out of a URL spec). |
| // |
| // |languages| is a comma separated list of ISO 639 language codes. It |
| // is used to determine whether a hostname is 'comprehensible' to a user |
| // who understands languages listed. |host| will be converted to a |
| // human-readable form (Unicode) ONLY when each component of |host| is |
| // regarded as 'comprehensible'. Scipt-mixing is not allowed except that |
| // Latin letters in the ASCII range can be mixed with a limited set of |
| // script-language pairs (currently Han, Kana and Hangul for zh,ja and ko). |
| // When |languages| is empty, even that mixing is not allowed. |
| void IDNToUnicode(const char* host, |
| int host_len, |
| const std::wstring& languages, |
| std::wstring* out); |
| |
| // Canonicalizes |host| and returns it. Also fills |host_info| with |
| // IP address information. |host_info| must not be NULL. |
| std::string CanonicalizeHost(const std::string& host, |
| url_canon::CanonHostInfo* host_info); |
| std::string CanonicalizeHost(const std::wstring& host, |
| url_canon::CanonHostInfo* host_info); |
| |
| // Call these functions to get the html snippet for a directory listing. |
| // The return values of both functions are in UTF-8. |
| std::string GetDirectoryListingHeader(const string16& title); |
| |
| // Given the name of a file in a directory (ftp or local) and |
| // other information (is_dir, size, modification time), it returns |
| // the html snippet to add the entry for the file to the directory listing. |
| // Currently, it's a script tag containing a call to a Javascript function |
| // |addRow|. |
| // |
| // Its 1st parameter is derived from |name| and is the Javascript-string |
| // escaped form of |name| (i.e \uXXXX). The 2nd parameter is the url-escaped |
| // |raw_bytes| if it's not empty. If empty, the 2nd parameter is the |
| // url-escaped |name| in UTF-8. |
| std::string GetDirectoryListingEntry(const string16& name, |
| const std::string& raw_bytes, |
| bool is_dir, int64 size, |
| base::Time modified); |
| |
| // If text starts with "www." it is removed, otherwise text is returned |
| // unmodified. |
| std::wstring StripWWW(const std::wstring& text); |
| |
| // Gets the filename from the raw Content-Disposition header (as read from the |
| // network). Otherwise uses the last path component name or hostname from |
| // |url|. Note: it's possible for the suggested filename to be empty (e.g., |
| // file:///). referrer_charset is used as one of charsets |
| // to interpret a raw 8bit string in C-D header (after interpreting |
| // as UTF-8 fails). See the comment for GetFilenameFromCD for more details. |
| std::wstring GetSuggestedFilename(const GURL& url, |
| const std::string& content_disposition, |
| const std::string& referrer_charset, |
| const std::wstring& default_name); |
| |
| // Checks the given port against a list of ports which are restricted by |
| // default. Returns true if the port is allowed, false if it is restricted. |
| bool IsPortAllowedByDefault(int port); |
| |
| // Checks the given port against a list of ports which are restricted by the |
| // FTP protocol. Returns true if the port is allowed, false if it is |
| // restricted. |
| bool IsPortAllowedByFtp(int port); |
| |
| // Check if banned |port| has been overriden by an entry in |
| // |explicitly_allowed_ports_|. |
| bool IsPortAllowedByOverride(int port); |
| |
| // Set socket to non-blocking mode |
| int SetNonBlocking(int fd); |
| |
| // Appends the given part of the original URL to the output string formatted for |
| // the user. The given parsed structure will be updated. The host name formatter |
| // also takes the same accept languages component as ElideURL. |new_parsed| may |
| // be null. |
| void AppendFormattedHost(const GURL& url, const std::wstring& languages, |
| std::wstring* output, url_parse::Parsed* new_parsed); |
| |
| // Creates a string representation of |url|. The IDN host name may |
| // be in Unicode if |languages| accepts the Unicode representation. |
| // If |omit_username_password| is true, the username and the password are |
| // omitted. |unescape_rules| defines how to clean the URL for human readability. |
| // You will generally want |UnescapeRule::SPACES| for display to the user if you |
| // can handle spaces, or |UnescapeRule::NORMAL| if not. If the path part and the |
| // query part seem to be encoded in %-encoded UTF-8, decodes %-encoding and |
| // UTF-8. |new_parsed| will have parsing parameters of the resultant URL. |
| // |prefix_end| will be the length before the hostname of the resultant URL. |
| // |new_parsed| and |prefix_end| may be NULL. |
| std::wstring FormatUrl(const GURL& url, |
| const std::wstring& languages, |
| bool omit_username_password, |
| UnescapeRule::Type unescape_rules, |
| url_parse::Parsed* new_parsed, |
| size_t* prefix_end); |
| |
| // Creates a string representation of |url| for display to the user. |
| // This is a shorthand of the above function with omit_username_password=true, |
| // unescape=SPACES, new_parsed=NULL, and prefix_end=NULL. |
| inline std::wstring FormatUrl(const GURL& url, const std::wstring& languages) { |
| return FormatUrl(url, languages, true, UnescapeRule::SPACES, NULL, NULL); |
| } |
| |
| // Strip the portions of |url| that aren't core to the network request. |
| // - user name / password |
| // - reference section |
| GURL SimplifyUrlForRequest(const GURL& url); |
| |
| void SetExplicitlyAllowedPorts(const std::wstring& allowed_ports); |
| |
| } // namespace net |
| |
| #endif // NET_BASE_NET_UTIL_H__ |