2 * UCW Library -- URL Functions
4 * (c) 1997--2004 Martin Mares <mj@ucw.cz>
5 * (c) 2001 Robert Spalek <robert@ucw.cz>
7 * This software may be freely distributed and used according to the terms
8 * of the GNU Lesser General Public License.
14 #define MAX_URL_SIZE 1024
16 /* Non-control meanings of control characters */
18 #define NCC_SEMICOLON 1
28 #define NCC_CHARS " ;/?:@=&#"
30 /* Remove/Introduce '%' escapes */
32 int url_deescape(byte *s, byte *d);
33 int url_enescape(byte *s, byte *d);
35 /* URL splitting and normalization */
43 uns port; /* ~0 if unspec */
48 int url_split(byte *s, struct url *u, byte *d);
49 int url_normalize(struct url *u, struct url *b);
50 int url_canonicalize(struct url *u);
51 int url_pack(struct url *u, byte *d);
52 int url_canon_split_rel(byte *url, byte *buf1, byte *buf2, struct url *u, struct url *base);
53 int url_auto_canonicalize_rel(byte *src, byte *dst, struct url *base);
54 uns identify_protocol(byte *p);
55 int url_has_repeated_component(byte *url);
57 static inline int url_canon_split(byte *url, byte *buf1, byte *buf2, struct url *u)
58 { return url_canon_split_rel(url, buf1, buf2, u, NULL); }
60 static inline int url_auto_canonicalize(byte *src, byte *dst)
61 { return url_auto_canonicalize_rel(src, dst, NULL); }
67 #define URL_ERR_TOO_LONG 1
68 #define URL_ERR_INVALID_CHAR 2
69 #define URL_ERR_INVALID_ESCAPE 3
70 #define URL_ERR_INVALID_ESCAPED_CHAR 4
71 #define URL_ERR_INVALID_PORT 5
72 #define URL_ERR_REL_NOTHING 6
73 #define URL_ERR_UNKNOWN_PROTOCOL 7
74 #define URL_SYNTAX_ERROR 8
75 #define URL_PATH_UNDERFLOW 9
77 #define URL_PROTO_UNKNOWN 0
78 #define URL_PROTO_HTTP 1
79 #define URL_PROTO_FTP 2
80 #define URL_PROTO_FILE 3
81 #define URL_PROTO_MAX 4
83 #define URL_PNAMES { "unknown", "http", "ftp", "file" }
84 #define URL_DEFPORTS { ~0, 80, 21, 0 }
85 #define URL_PATH_FLAGS { 0, 1, 1, 1 }
87 extern byte *url_proto_names[];