Dillo v3.2.0
|
Parse and normalize all URL's inside Dillo. More...
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include "url.h"
#include "hsts.h"
#include "misc.h"
#include "msg.h"
Go to the source code of this file.
Macros | |
#define | URL_STR_FIELD_CMP(s1, s2) (s1) && (s2) ? strcmp(s1,s2) : !(s1) && !(s2) ? 0 : (s1) ? 1 : -1 |
#define | URL_STR_FIELD_I_CMP(s1, s2) (s1) && (s2) ? dStrAsciiCasecmp(s1,s2) : !(s1) && !(s2) ? 0 : (s1) ? 1 : -1 |
Functions | |
char * | a_Url_str (const DilloUrl *u) |
Return the url as a string. | |
const char * | a_Url_hostname (const DilloUrl *u) |
Return the hostname as a string. | |
static DilloUrl * | Url_object_new (const char *uri_str) |
Create a DilloUrl object and initialize it. | |
void | a_Url_free (DilloUrl *url) |
Free a DilloUrl. | |
static Dstr * | Url_resolve_relative (const char *RelStr, const char *BaseStr) |
Resolve the URL as RFC3986 suggests. | |
DilloUrl * | a_Url_new (const char *url_str, const char *base_url) |
Transform (and resolve) an URL string into the respective DilloURL. | |
DilloUrl * | a_Url_dup (const DilloUrl *ori) |
Duplicate a Url structure. | |
int | a_Url_cmp (const DilloUrl *A, const DilloUrl *B) |
Compare two Url's to check if they're the same, or which one is bigger. | |
void | a_Url_set_flags (DilloUrl *u, int flags) |
Set DilloUrl flags. | |
void | a_Url_set_data (DilloUrl *u, Dstr **data) |
Set DilloUrl data (like POST info, etc.) | |
void | a_Url_set_ismap_coords (DilloUrl *u, char *coord_str) |
Set DilloUrl ismap coordinates. | |
static int | Url_decode_hex_octet (const char *s) |
Given an hex octet (e.g., e3, 2F, 20), return the corresponding character if the octet is valid, and -1 otherwise. | |
char * | a_Url_decode_hex_str (const char *str) |
Parse possible hexadecimal octets in the URI path. | |
char * | a_Url_encode_hex_str (const char *str) |
Urlencode 'str'. | |
char * | a_Url_string_strip_delimiters (const char *str) |
RFC-3986 suggests this stripping when "importing" URLs from other media. | |
int | a_Url_host_type (const char *host) |
What type of host is this? | |
static uint_t | Url_host_public_internal_dots (const char *host) |
How many internal dots are in the public portion of this hostname?. | |
static const char * | Url_host_find_public_suffix (const char *host) |
Given a URL host string, return the portion that is public. | |
bool_t | a_Url_same_organization (const DilloUrl *u1, const DilloUrl *u2) |
Variables | |
static const char * | HEX = "0123456789ABCDEF" |
Parse and normalize all URL's inside Dillo.
Definition in file url.c.
#define URL_STR_FIELD_CMP | ( | s1, | |
s2 | |||
) | (s1) && (s2) ? strcmp(s1,s2) : !(s1) && !(s2) ? 0 : (s1) ? 1 : -1 |
#define URL_STR_FIELD_I_CMP | ( | s1, | |
s2 | |||
) | (s1) && (s2) ? dStrAsciiCasecmp(s1,s2) : !(s1) && !(s2) ? 0 : (s1) ? 1 : -1 |
Compare two Url's to check if they're the same, or which one is bigger.
The fields which are compared here are: <scheme>, <authority>, <path>, <query> and <data> Other fields are left for the caller to check
Return value: 0 if equal, > 0 if A > B, < 0 if A < B.
Note: this function defines a sorting order different from strcmp!
Definition at line 506 of file url.c.
References DilloUrl::authority, DilloUrl::data, dReturn_val_if_fail, dStr_cmp(), DilloUrl::path, DilloUrl::query, DilloUrl::scheme, URL_STR_FIELD_CMP, and URL_STR_FIELD_I_CMP.
Referenced by a_Bw_add_url(), a_Bw_get_url_doc(), a_Capi_conn_abort_by_url(), a_History_add_url(), a_History_get_title_by_url(), a_History_set_title_by_url(), a_Nav_cancel_expect_if_eq(), a_Nav_push(), Cache_entry_by_url_cmp(), Cache_entry_cmp(), Dicache_entry_cmp(), Html_tag_open_meta(), DilloHtml::loadImages(), and Nav_open_url().
char * a_Url_decode_hex_str | ( | const char * | str | ) |
Parse possible hexadecimal octets in the URI path.
Returns a new allocated string.
Definition at line 586 of file url.c.
References dNew, dRealloc(), dStrdup(), and Url_decode_hex_octet().
Duplicate a Url structure.
Definition at line 477 of file url.c.
References DilloUrl::data, dReturn_val_if_fail, dStr_append_l(), dStr_new(), dStr_sized_new(), DilloUrl::flags, DilloUrl::illegal_chars, DilloUrl::illegal_chars_spc, DilloUrl::ismap_url_len, DilloUrl::port, URL_DATA, Url_object_new(), URL_STR, URL_STR_, and DilloUrl::url_string.
Referenced by a_Bw_add_url(), a_Bw_expect(), a_Capi_set_vsource_url(), a_History_add_url(), a_Http_init(), a_Menu_bugmeter_popup(), a_Menu_form_popup(), a_Menu_image_popup(), a_Menu_link_popup(), a_Menu_page_popup(), a_Nav_expect_done(), a_Nav_redirection0(), a_Web_new(), DilloHtml::addCssUrl(), Auth_do_auth_dialog(), Cache_auth_entry(), Cache_entry_init(), Cache_process_queue(), Capi_conn_new(), Dicache_add_entry(), DilloHtml::DilloHtml(), Html_tag_open_form(), Html_tag_open_isindex(), Http_get(), Nav_reload_callback(), Nav_repush(), StyleEngine::StyleEngine(), Tls_conn_new(), and Tls_conn_new().
char * a_Url_encode_hex_str | ( | const char * | str | ) |
Urlencode 'str'.
-RL :: According to the RFC 1738, only alphanumerics, the special characters "$-_.+!*'(),", and reserved characters ";/?:@=&" used for their reserved purposes may be used unencoded within a URL. We'll escape everything but alphanumeric and "-_.*" (as lynx). –Jcid
Note: the content type "application/x-www-form-urlencoded" is used: i.e., ' ' -> '+' and '
' -> CR LF (see HTML 4.01, Sec. 17.13.4)
Definition at line 620 of file url.c.
References d_isascii, dIsalnum, dNew, and HEX.
Referenced by Menu_bugmeter_validate(), and UIcmd_make_search_str().
void a_Url_free | ( | DilloUrl * | url | ) |
Free a DilloUrl.
Do nothing if the argument is NULL
Definition at line 208 of file url.c.
References DilloUrl::authority, DilloUrl::buffer, DilloUrl::data, dFree(), dStr_free(), DilloUrl::hostname, TRUE, and DilloUrl::url_string.
Referenced by a_Bw_cancel_expect(), a_Bw_cleanup(), a_Bw_expect(), a_Bw_free(), a_Cache_init(), a_Capi_set_vsource_url(), a_Dicache_freeall(), a_History_freeall(), a_Http_freeall(), a_Menu_bugmeter_popup(), a_Menu_file_popup(), a_Menu_form_popup(), a_Menu_image_popup(), a_Menu_link_popup(), a_Menu_page_popup(), a_Nav_expect_done(), a_Nav_redirection0(), a_Prefs_freeall(), a_UIcmd_book(), a_UIcmd_open_file(), a_UIcmd_open_urlstr(), a_UIcmd_view_page_source(), a_Web_free(), StyleEngine::apply(), Auth_do_auth_dialog(), Cache_auth_callback(), Cache_entry_free(), Cache_process_queue(), Cache_redirect(), Cache_savelink_cb(), Capi_conn_unref(), Dicache_remove(), Html_tag_content_img(), Html_tag_content_map(), Html_tag_open_base(), Html_tag_open_form(), Html_tag_open_isindex(), Html_tag_open_link(), Html_tag_open_meta(), Html_tag_open_object(), Http_socket_free(), main(), Nav_redirection0_callback(), Nav_reload_callback(), Nav_repush(), CssParser::parseImport(), parseOption(), CssParser::parseUrl(), Tls_close_by_key(), Tls_close_by_key(), Url_resolve_relative(), DilloHtml::~DilloHtml(), and StyleEngine::~StyleEngine().
int a_Url_host_type | ( | const char * | host | ) |
What type of host is this?
Definition at line 683 of file url.c.
References URL_HOST_ERROR, URL_HOST_IPV4, URL_HOST_IPV6, and URL_HOST_NAME.
Referenced by a_Tls_openssl_connect(), Cache_parse_header(), Tls_cert_authorities_print_summary(), and Url_host_find_public_suffix().
const char * a_Url_hostname | ( | const DilloUrl * | u | ) |
Return the hostname as a string.
(initializing 'hostname' and 'port' fields if necessary) Note: a similar approach can be taken for user:password auth.
Definition at line 98 of file url.c.
References DilloUrl::authority, dStrAsciiCasecmp(), dStrndup(), DilloUrl::hostname, DilloUrl::port, DilloUrl::scheme, URL_HTTP_PORT, and URL_HTTPS_PORT.
Referenced by a_Url_new().
DilloUrl * a_Url_new | ( | const char * | url_str, |
const char * | base_url | ||
) |
Transform (and resolve) an URL string into the respective DilloURL.
If URL = "http://dillo.sf.net:8080/index.html?long#part2" then the resulting DilloURL should be:
Return NULL if URL is badly formed.
Definition at line 371 of file url.c.
References _MSG, a_Hsts_require_https(), a_Url_hostname(), DilloUrl::authority, DilloUrl::data, dFree(), dNew, dStr_free(), dStr_new(), dStrAsciiCasecmp(), dStrconcat(), FALSE, HEX, DilloPrefs::http_force_https, DilloPrefs::http_strict_transport_security, DilloUrl::illegal_chars, DilloUrl::illegal_chars_spc, DilloUrl::port, prefs, DilloUrl::scheme, Dstr::str, TRUE, URL_HTTP_PORT, URL_HTTPS_PORT, Url_object_new(), Url_resolve_relative(), and DilloUrl::url_string.
Referenced by a_Cache_init(), a_Html_url_new(), a_Http_init(), a_Prefs_init(), a_UIcmd_book(), a_UIcmd_open_file(), a_UIcmd_open_urlstr(), a_UIcmd_view_page_source(), StyleEngine::apply(), Cache_parse_header(), Cache_redirect(), makeStartUrl(), parseOption(), and CssParser::parseUrl().
Definition at line 798 of file url.c.
References dStrAsciiCasecmp(), FALSE, TRUE, URL_HOST, and Url_host_find_public_suffix().
Referenced by a_Cookies_get_query(), a_Domain_permit(), and Cache_parse_header().
Set DilloUrl data (like POST info, etc.)
Definition at line 536 of file url.c.
References DilloUrl::data, and dStr_free().
void a_Url_set_flags | ( | DilloUrl * | u, |
int | flags | ||
) |
Set DilloUrl flags.
Definition at line 527 of file url.c.
References DilloUrl::flags.
Referenced by a_Capi_open_url(), a_Nav_expect_done(), a_Nav_redirection0(), Cache_redirect(), Html_tag_open_base(), makeStartUrl(), Nav_reload_callback(), and Nav_repush().
void a_Url_set_ismap_coords | ( | DilloUrl * | u, |
char * | coord_str | ||
) |
Set DilloUrl ismap coordinates.
(this is optimized for not hogging the CPU)
Definition at line 549 of file url.c.
References dReturn_if_fail, dStr_append(), dStr_truncate(), DilloUrl::ismap_url_len, Dstr::len, DilloUrl::query, Dstr::str, URL_STR_, and DilloUrl::url_string.
Referenced by Html_set_link_coordinates().
char * a_Url_str | ( | const DilloUrl * | u | ) |
Return the url as a string.
(initializing 'url_string' field if necessary)
Definition at line 66 of file url.c.
References DilloUrl::authority, dReturn_val_if_fail, dStr_sized_new(), dStr_sprintf(), DilloUrl::fragment, DilloUrl::path, DilloUrl::query, DilloUrl::scheme, Dstr::str, and DilloUrl::url_string.
Referenced by DilloHtml::HtmlLinkReceiver::click(), CssParser::parseImport(), and CssParser::parseUrl().
char * a_Url_string_strip_delimiters | ( | const char * | str | ) |
RFC-3986 suggests this stripping when "importing" URLs from other media.
Strip: "URL:", enclosing < >, and embedded whitespace. (We also strip illegal chars: 00-1F and 7F-FF)
Definition at line 658 of file url.c.
References dStrdup().
Referenced by a_UIcmd_open_urlstr(), and makeStartUrl().
|
static |
Given an hex octet (e.g., e3, 2F, 20), return the corresponding character if the octet is valid, and -1 otherwise.
Definition at line 568 of file url.c.
Referenced by a_Url_decode_hex_str().
|
static |
Given a URL host string, return the portion that is public.
i.e., the domain that is in a registry outside the organization. For 'www.dillo.org', that would be 'dillo.org'.
Definition at line 762 of file url.c.
References _MSG, a_Url_host_type(), URL_HOST_NAME, and Url_host_public_internal_dots().
Referenced by a_Url_same_organization().
|
static |
How many internal dots are in the public portion of this hostname?.
e.g., for "www.dillo.org", it is one because everything under "dillo.org", as a .org domain, is part of one organization.
Of course this is only a simple and imperfect approximation of organizational boundaries.
Definition at line 711 of file url.c.
References _MSG, and dStrnAsciiCasecmp().
Referenced by Url_host_find_public_suffix().
|
static |
Create a DilloUrl object and initialize it.
(buffer, scheme, authority, path, query and fragment).
Definition at line 137 of file url.c.
References DilloUrl::authority, DilloUrl::buffer, dNew, dNew0, dReturn_val_if_fail, dStrstrip(), DilloUrl::flags, DilloUrl::fragment, MAX, DilloUrl::path, DilloUrl::query, DilloUrl::scheme, and URL_Get.
Referenced by a_Url_dup(), a_Url_new(), and Url_resolve_relative().
|
static |
Resolve the URL as RFC3986 suggests.
Definition at line 224 of file url.c.
References a_Url_free(), DilloUrl::authority, DilloUrl::buffer, dStr_append(), dStr_append_c(), dStr_erase(), dStr_free(), dStr_sized_new(), dStr_truncate(), DilloUrl::fragment, Dstr::len, DilloUrl::path, DilloUrl::query, DilloUrl::scheme, Dstr::str, TRUE, and Url_object_new().
Referenced by a_Url_new().
|
static |
Definition at line 54 of file url.c.
Referenced by a_Url_encode_hex_str(), a_Url_new(), and dStr_printable().