2011-09-21 18:36:42 +04:00
|
|
|
/*
|
|
|
|
* Copyright 2011 Michael Drake <tlsa@netsurf-browser.org>
|
|
|
|
*
|
|
|
|
* This file is part of NetSurf, http://www.netsurf-browser.org/
|
|
|
|
*
|
|
|
|
* NetSurf is free software; you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation; version 2 of the License.
|
|
|
|
*
|
|
|
|
* NetSurf is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/** \file
|
|
|
|
* NetSurf URL handling (interface).
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef _NETSURF_UTILS_NSURL_H_
|
|
|
|
#define _NETSURF_UTILS_NSURL_H_
|
|
|
|
|
2011-09-27 01:50:16 +04:00
|
|
|
#include <libwapcaplet/libwapcaplet.h>
|
2011-09-21 18:36:42 +04:00
|
|
|
#include "utils/errors.h"
|
|
|
|
|
|
|
|
|
|
|
|
/** NetSurf URL object */
|
|
|
|
typedef struct nsurl nsurl;
|
|
|
|
|
|
|
|
|
|
|
|
typedef enum nsurl_component {
|
|
|
|
NSURL_SCHEME = (1 << 0),
|
|
|
|
NSURL_USERNAME = (1 << 1),
|
|
|
|
NSURL_PASSWORD = (1 << 2),
|
|
|
|
NSURL_CREDENTIALS = NSURL_USERNAME | NSURL_PASSWORD,
|
|
|
|
NSURL_HOST = (1 << 3),
|
|
|
|
NSURL_PORT = (1 << 4),
|
|
|
|
NSURL_AUTHORITY = NSURL_CREDENTIALS | NSURL_HOST | NSURL_PORT,
|
|
|
|
NSURL_PATH = (1 << 5),
|
|
|
|
NSURL_QUERY = (1 << 6),
|
|
|
|
NSURL_COMPLETE = NSURL_SCHEME | NSURL_AUTHORITY |
|
|
|
|
NSURL_PATH | NSURL_QUERY,
|
|
|
|
NSURL_FRAGMENT = (1 << 7),
|
|
|
|
NSURL_WITH_FRAGMENT = NSURL_COMPLETE | NSURL_FRAGMENT
|
|
|
|
} nsurl_component;
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Create a NetSurf URL object from a URL string
|
|
|
|
*
|
|
|
|
* \param url_s String to create NetSurf URL from
|
|
|
|
* \param url Returns a NetSurf URL
|
|
|
|
* \return NSERROR_OK on success, appropriate error otherwise
|
|
|
|
*
|
|
|
|
* If return value != NSERROR_OK, nothing will be returned in url.
|
|
|
|
*
|
2015-07-09 17:02:51 +03:00
|
|
|
* It is up to the client to call nsurl_unref when they are finished with
|
2011-09-21 18:36:42 +04:00
|
|
|
* the created object.
|
|
|
|
*/
|
2011-12-04 15:12:17 +04:00
|
|
|
nserror nsurl_create(const char * const url_s, nsurl **url);
|
2011-09-21 18:36:42 +04:00
|
|
|
|
|
|
|
|
|
|
|
/**
|
2011-09-22 20:28:46 +04:00
|
|
|
* Increment the reference count to a NetSurf URL object
|
2011-09-21 18:36:42 +04:00
|
|
|
*
|
2011-09-22 20:28:46 +04:00
|
|
|
* \param url NetSurf URL to create another reference to
|
|
|
|
* \return The NetSurf URL pointer to use as the copy
|
|
|
|
*
|
|
|
|
* Use this when copying a NetSurf URL into a persistent data structure.
|
|
|
|
*/
|
|
|
|
nsurl *nsurl_ref(nsurl *url);
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Drop a reference to a NetSurf URL object
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL to drop reference to
|
|
|
|
*
|
|
|
|
* When the reference count reaches zero then the NetSurf URL will be destroyed
|
2011-09-21 18:36:42 +04:00
|
|
|
*/
|
2011-09-22 20:28:46 +04:00
|
|
|
void nsurl_unref(nsurl *url);
|
2011-09-21 18:36:42 +04:00
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Compare two URLs
|
|
|
|
*
|
|
|
|
* \param url1 First NetSurf URL
|
|
|
|
* \param url2 Second NetSurf URL
|
|
|
|
* \param parts The URL components to be compared
|
2014-11-13 02:27:13 +03:00
|
|
|
* \return true on match else false
|
2011-09-21 18:36:42 +04:00
|
|
|
*
|
|
|
|
*/
|
2011-09-26 18:57:45 +04:00
|
|
|
bool nsurl_compare(const nsurl *url1, const nsurl *url2, nsurl_component parts);
|
2011-09-21 18:36:42 +04:00
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Get URL (section) as a string, from a NetSurf URL object
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL
|
|
|
|
* \param parts The required URL components.
|
|
|
|
* \param url_s Returns a url string
|
|
|
|
* \param url_l Returns length of url_s
|
|
|
|
* \return NSERROR_OK on success, appropriate error otherwise
|
|
|
|
*
|
|
|
|
* If return value != NSERROR_OK, nothing will be returned in url_s or url_l.
|
|
|
|
*
|
|
|
|
* The string returned in url_s is owned by the client and it is up to them
|
|
|
|
* to free it. It includes a trailing '\0'.
|
|
|
|
*
|
|
|
|
* The length returned in url_l excludes the trailing '\0'.
|
|
|
|
*
|
|
|
|
* That the required URL components be consecutive is not enforced, however,
|
|
|
|
* non-consecutive URL components generally make no sense. The exception
|
|
|
|
* is removal of credentials from a URL, such as for display in browser
|
|
|
|
* window URL bar. 'NSURL_COMPLETE &~ NSURL_PASSWORD' would remove the
|
|
|
|
* password from a complete URL.
|
|
|
|
*/
|
|
|
|
nserror nsurl_get(const nsurl *url, nsurl_component parts,
|
|
|
|
char **url_s, size_t *url_l);
|
|
|
|
|
|
|
|
|
2011-09-27 01:50:16 +04:00
|
|
|
/**
|
|
|
|
* Get part of a URL as a lwc_string, from a NetSurf URL object
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL object
|
|
|
|
* \param part The URL component required
|
|
|
|
* \return the required component as an lwc_string, or NULL
|
|
|
|
*
|
|
|
|
* The caller owns the returned lwc_string and should call lwc_string_unref
|
|
|
|
* when they are done with it.
|
|
|
|
*
|
|
|
|
* The valid values for the part parameter are:
|
|
|
|
* NSURL_SCHEME
|
|
|
|
* NSURL_USERNAME
|
|
|
|
* NSURL_PASSWORD
|
|
|
|
* NSURL_HOST
|
|
|
|
* NSURL_PORT
|
|
|
|
* NSURL_PATH
|
|
|
|
* NSURL_QUERY
|
|
|
|
* NSURL_FRAGMENT
|
|
|
|
*/
|
2011-09-27 12:18:32 +04:00
|
|
|
lwc_string *nsurl_get_component(const nsurl *url, nsurl_component part);
|
2011-09-27 01:50:16 +04:00
|
|
|
|
|
|
|
|
2011-09-26 17:27:20 +04:00
|
|
|
/**
|
|
|
|
* Enquire about the existence of componenets in a given URL
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL object
|
|
|
|
* \param part The URL components confirm existence of
|
|
|
|
* \return true iff the component in question exists in url
|
|
|
|
*
|
|
|
|
* The valid values for the part parameter are:
|
|
|
|
* NSURL_SCHEME
|
|
|
|
* NSURL_USERNAME
|
|
|
|
* NSURL_PASSWORD
|
|
|
|
* NSURL_CREDENTIALS
|
|
|
|
* NSURL_HOST
|
|
|
|
* NSURL_PORT
|
|
|
|
* NSURL_PATH
|
|
|
|
* NSURL_QUERY
|
|
|
|
* NSURL_FRAGMENT
|
|
|
|
*/
|
2011-11-27 22:32:06 +04:00
|
|
|
bool nsurl_has_component(const nsurl *url, nsurl_component part);
|
2011-09-26 17:27:20 +04:00
|
|
|
|
|
|
|
|
2011-09-22 20:28:46 +04:00
|
|
|
/**
|
2011-09-26 16:19:35 +04:00
|
|
|
* Access a NetSurf URL object as a string
|
2011-09-22 20:28:46 +04:00
|
|
|
*
|
|
|
|
* \param url NetSurf URL to retrieve a string pointer for.
|
|
|
|
* \return the required string
|
|
|
|
*
|
2011-09-23 00:28:26 +04:00
|
|
|
* The returned string is owned by the NetSurf URL object. It will die
|
2011-09-22 20:28:46 +04:00
|
|
|
* with the NetSurf URL object. Keep a reference to the URL if you need it.
|
|
|
|
*
|
2011-09-26 16:19:35 +04:00
|
|
|
* The returned string has a trailing '\0'.
|
2011-09-22 20:28:46 +04:00
|
|
|
*/
|
2011-09-26 16:19:35 +04:00
|
|
|
const char *nsurl_access(const nsurl *url);
|
2011-09-22 20:28:46 +04:00
|
|
|
|
|
|
|
|
2018-08-09 17:35:24 +03:00
|
|
|
/**
|
|
|
|
* Variant of \ref nsurl_access for logging.
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL to retrieve a string pointer for.
|
|
|
|
* \return the required string
|
|
|
|
*
|
|
|
|
* This will not necessarily return the actual nsurl's URL, but something
|
|
|
|
* that is suitable for recording to logs. E.g. URLs with the `data` scheme
|
|
|
|
* will return a simple place holder, to avoid repeatedly dumping loads of data.
|
|
|
|
*
|
|
|
|
* The returned string is owned by the NetSurf URL object. It will die
|
|
|
|
* with the NetSurf URL object. Keep a reference to the URL if you need it.
|
|
|
|
*
|
|
|
|
* The returned string has a trailing '\0'.
|
|
|
|
*/
|
|
|
|
const char *nsurl_access_log(const nsurl *url);
|
|
|
|
|
|
|
|
|
2015-07-17 21:18:20 +03:00
|
|
|
/**
|
2015-10-25 12:03:20 +03:00
|
|
|
* Get a UTF-8 string (for human readable IDNs) from a NetSurf URL object
|
2015-07-17 21:18:20 +03:00
|
|
|
*
|
2015-07-26 20:09:25 +03:00
|
|
|
* \param url NetSurf URL object
|
2015-07-23 02:05:22 +03:00
|
|
|
* \param url_s Returns a url string
|
|
|
|
* \param url_l Returns length of url_s
|
|
|
|
* \return NSERROR_OK on success, appropriate error otherwise
|
|
|
|
*
|
|
|
|
* If return value != NSERROR_OK, nothing will be returned in url_s or url_l.
|
2015-07-17 21:18:20 +03:00
|
|
|
*
|
2015-07-23 02:05:22 +03:00
|
|
|
* The string returned in url_s is owned by the client and it is up to them
|
|
|
|
* to free it. It includes a trailing '\0'.
|
2015-07-17 21:18:20 +03:00
|
|
|
*
|
2015-07-23 02:05:22 +03:00
|
|
|
* The length returned in url_l excludes the trailing '\0'.
|
2015-07-17 21:18:20 +03:00
|
|
|
*/
|
2015-10-25 12:03:20 +03:00
|
|
|
nserror nsurl_get_utf8(const nsurl *url, char **url_s, size_t *url_l);
|
2015-07-17 21:18:20 +03:00
|
|
|
|
|
|
|
|
2012-10-24 21:22:45 +04:00
|
|
|
/**
|
|
|
|
* Access a URL's path leaf as a string
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL to retrieve a string pointer for.
|
|
|
|
* \return the required string
|
|
|
|
*
|
|
|
|
* The returned string is owned by the NetSurf URL object. It will die
|
|
|
|
* with the NetSurf URL object. Keep a reference to the URL if you need it.
|
|
|
|
*
|
|
|
|
* The returned string has a trailing '\0'.
|
|
|
|
*/
|
|
|
|
const char *nsurl_access_leaf(const nsurl *url);
|
|
|
|
|
|
|
|
|
2011-10-08 16:03:54 +04:00
|
|
|
/**
|
|
|
|
* Find the length of a NetSurf URL object's URL, as returned by nsurl_access
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL to find length of.
|
|
|
|
* \return the required string
|
|
|
|
*
|
|
|
|
* The returned length excludes the trailing '\0'.
|
|
|
|
*/
|
|
|
|
size_t nsurl_length(const nsurl *url);
|
|
|
|
|
|
|
|
|
2013-05-17 15:25:04 +04:00
|
|
|
/**
|
|
|
|
* Get a URL's hash value
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL get hash value for.
|
|
|
|
* \return the hash value
|
|
|
|
*/
|
|
|
|
uint32_t nsurl_hash(const nsurl *url);
|
|
|
|
|
|
|
|
|
2011-09-21 18:36:42 +04:00
|
|
|
/**
|
|
|
|
* Join a base url to a relative link part, creating a new NetSurf URL object
|
|
|
|
*
|
|
|
|
* \param base NetSurf URL containing the base to join rel to
|
|
|
|
* \param rel String containing the relative link part
|
|
|
|
* \param joined Returns joined NetSurf URL
|
|
|
|
* \return NSERROR_OK on success, appropriate error otherwise
|
|
|
|
*
|
|
|
|
* If return value != NSERROR_OK, nothing will be returned in join.
|
|
|
|
*
|
2015-07-09 17:02:51 +03:00
|
|
|
* It is up to the client to call nsurl_unref when they are finished with
|
2011-09-21 18:36:42 +04:00
|
|
|
* the created object.
|
|
|
|
*/
|
|
|
|
nserror nsurl_join(const nsurl *base, const char *rel, nsurl **joined);
|
|
|
|
|
2011-09-28 15:26:10 +04:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Create a NetSurf URL object without a fragment from a NetSurf URL
|
|
|
|
*
|
2011-10-28 23:18:14 +04:00
|
|
|
* \param url NetSurf URL to create new NetSurf URL from
|
2011-09-28 15:26:10 +04:00
|
|
|
* \param no_frag Returns new NetSurf URL without fragment
|
|
|
|
* \return NSERROR_OK on success, appropriate error otherwise
|
|
|
|
*
|
|
|
|
* If return value != NSERROR_OK, nothing will be returned in no_frag.
|
|
|
|
*
|
2015-07-09 17:02:51 +03:00
|
|
|
* It is up to the client to call nsurl_unref when they are finished with
|
2011-09-28 15:26:10 +04:00
|
|
|
* the created object.
|
|
|
|
*/
|
|
|
|
nserror nsurl_defragment(const nsurl *url, nsurl **no_frag);
|
|
|
|
|
2011-10-28 23:18:14 +04:00
|
|
|
|
|
|
|
/**
|
|
|
|
* Create a NetSurf URL object, adding a fragment to an existing URL object
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL to create new NetSurf URL from
|
|
|
|
* \param frag Fragment to add
|
|
|
|
* \param new_url Returns new NetSurf URL without fragment
|
|
|
|
* \return NSERROR_OK on success, appropriate error otherwise
|
|
|
|
*
|
|
|
|
* If return value != NSERROR_OK, nothing will be returned in new_url.
|
|
|
|
*
|
2015-07-09 17:02:51 +03:00
|
|
|
* It is up to the client to call nsurl_unref when they are finished with
|
2011-10-28 23:18:14 +04:00
|
|
|
* the created object.
|
|
|
|
*
|
|
|
|
* Any fragment in url is replaced with frag in new_url.
|
|
|
|
*/
|
|
|
|
nserror nsurl_refragment(const nsurl *url, lwc_string *frag, nsurl **new_url);
|
|
|
|
|
2012-10-06 17:06:38 +04:00
|
|
|
|
2012-10-11 22:23:22 +04:00
|
|
|
/**
|
|
|
|
* Create a NetSurf URL object, with query string replaced
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL to create new NetSurf URL from
|
|
|
|
* \param query Query string to use
|
|
|
|
* \param new_url Returns new NetSurf URL with query string provided
|
|
|
|
* \return NSERROR_OK on success, appropriate error otherwise
|
|
|
|
*
|
|
|
|
* If return value != NSERROR_OK, nothing will be returned in new_url.
|
|
|
|
*
|
2015-07-09 17:02:51 +03:00
|
|
|
* It is up to the client to call nsurl_unref when they are finished with
|
2012-10-11 22:23:22 +04:00
|
|
|
* the created object.
|
|
|
|
*
|
|
|
|
* Any query component in url is replaced with query in new_url.
|
2018-09-26 11:39:09 +03:00
|
|
|
*
|
|
|
|
* Passing the empty string as a replacement will result in the query
|
|
|
|
* component being removed.
|
2012-10-11 22:23:22 +04:00
|
|
|
*/
|
|
|
|
nserror nsurl_replace_query(const nsurl *url, const char *query,
|
|
|
|
nsurl **new_url);
|
|
|
|
|
|
|
|
|
2018-04-22 05:59:44 +03:00
|
|
|
/**
|
|
|
|
* Create a NetSurf URL object, with scheme replaced
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL to create new NetSurf URL from
|
|
|
|
* \param scheme Scheme to use
|
|
|
|
* \param new_url Returns new NetSurf URL with scheme provided
|
|
|
|
* \return NSERROR_OK on success, appropriate error otherwise
|
|
|
|
*
|
|
|
|
* If return value != NSERROR_OK, nothing will be returned in new_url.
|
|
|
|
*
|
|
|
|
* It is up to the client to call nsurl_unref when they are finished with
|
|
|
|
* the created object.
|
|
|
|
*
|
|
|
|
* Any scheme component in url is replaced with scheme in new_url.
|
|
|
|
*/
|
|
|
|
nserror nsurl_replace_scheme(const nsurl *url, lwc_string *scheme,
|
|
|
|
nsurl **new_url);
|
|
|
|
|
|
|
|
|
2014-10-31 01:26:03 +03:00
|
|
|
/**
|
|
|
|
* Attempt to find a nice filename for a URL.
|
|
|
|
*
|
|
|
|
* \param url A NetSurf URL object to create a filename from
|
|
|
|
* \param result Updated to caller-owned string with filename
|
|
|
|
* \param remove_extensions remove any extensions from the filename
|
|
|
|
* \return NSERROR_OK on success, appropriate error otherwise
|
|
|
|
*
|
|
|
|
* Caller must ensure string result string is freed, if NSERROR_OK returned.
|
|
|
|
*/
|
|
|
|
nserror nsurl_nice(const nsurl *url, char **result, bool remove_extensions);
|
|
|
|
|
|
|
|
|
2012-10-06 17:06:38 +04:00
|
|
|
/**
|
|
|
|
* Create a NetSurf URL object for URL with parent location of an existing URL.
|
|
|
|
*
|
|
|
|
* \param url NetSurf URL to create new NetSurf URL from
|
|
|
|
* \param new_url Returns new NetSurf URL with parent URL path
|
|
|
|
* \return NSERROR_OK on success, appropriate error otherwise
|
|
|
|
*
|
|
|
|
* If return value != NSERROR_OK, nothing will be returned in new_url.
|
|
|
|
*
|
2015-07-09 17:02:51 +03:00
|
|
|
* It is up to the client to call nsurl_unref when they are finished with
|
2012-10-06 17:06:38 +04:00
|
|
|
* the created object.
|
|
|
|
*
|
|
|
|
* As well as stripping top most path segment, query and fragments are stripped.
|
|
|
|
*/
|
|
|
|
nserror nsurl_parent(const nsurl *url, nsurl **new_url);
|
|
|
|
|
2011-09-21 18:36:42 +04:00
|
|
|
#endif
|