Browse Source

Much, much smaller. :)

tags/v0.9.3
Michael Brown 19 years ago
parent
commit
c1253d2219
1 changed file with 50 additions and 123 deletions
  1. 50
    123
      src/core/url.c

+ 50
- 123
src/core/url.c View File

@@ -1,144 +1,71 @@
1
-#include "stdlib.h"
2 1
 #include "string.h"
3
-#include "proto.h"
4
-#include "resolv.h"
5 2
 #include "url.h"
6 3
 
7
-static struct protocol protocols[0] __protocol_start;
8
-static struct protocol default_protocols[0] __default_protocol_start;
9
-static struct protocol protocols_end[0] __protocol_end;
10
-
11 4
 /*
12
- * Parse protocol portion of a URL.  Return 0 if no "proto://" is
13
- * present.
5
+ * Parse a URL string into its constituent parts.
14 6
  *
15
- */
16
-static inline int parse_protocol ( struct url_info *info, const char **p ) {
17
-	const char *q = *p;
18
-
19
-	info->protocol = q;
20
-	for ( ; *q ; q++ ) {
21
-		if ( memcmp ( q, "://", 3 ) == 0 ) {
22
-			info->protocol_len = q - info->protocol;
23
-			*p = q + 3;
24
-			return 1;
25
-		}
26
-	}
27
-	return 0;
28
-}
29
-
30
-/*
31
- * Parse the host:port portion of a URL.  Also fills in sin_port.
7
+ * We accept URLs of the form
32 8
  *
33
- */
34
-static inline void parse_host_port ( struct url_info *info, const char **p ) {
35
-	info->host = *p;
36
-	for ( ; **p && ( **p != '/' ) ; (*p)++ ) {
37
-		if ( **p == ':' ) {
38
-			info->host_len = *p - info->host;
39
-			info->port = ++(*p);
40
-			info->sin.sin_port = strtoul ( *p, p, 10 );
41
-			info->port_len = *p - info->port;
42
-			return;
43
-		}
44
-	}
45
-	/* No ':' separator seen; it's all the host part */
46
-	info->host_len = *p - info->host;
47
-}
48
-
49
-/*
50
- * Identify the protocol
9
+ *   [protocol://[host][:port]/]path/to/file
10
+ *
11
+ * Nothing is returned: parsing only splits the string and cannot fail.
12
+ * The URL string will be modified by having NULs inserted after
13
+ * "protocol", "host" and "port".  The original URL can be
14
+ * reconstructed by calling unparse_url.
51 15
  *
52 16
  */
53
-static inline int identify_protocol ( struct url_info *info ) {
54
-	struct protocol *proto;
17
+void parse_url ( struct url_info *info, char *url ) {
18
+	char *p;
55 19
 
56
-	if ( info->protocol_len ) {
57
-		char *terminator;
58
-		char temp;
20
+	/* Zero the structure */
21
+	memset ( info, 0, sizeof ( *info ) );
59 22
 
60
-		/* Explicitly specified protocol */
61
-		terminator = ( char * ) &info->protocol[info->protocol_len];
62
-		temp = *terminator;
63
-		*terminator = '\0';
64
-		for ( proto = protocols ; proto < protocols_end ; proto++ ) {
65
-			if ( memcmp ( proto->name, info->protocol,
66
-				      info->protocol_len + 1 ) == 0 ) {
67
-				info->proto = proto;
23
+	/* Search for a protocol delimiter */
24
+	for ( p = url ; *p ; p++ ) {
25
+		if ( memcmp ( p, "://", 3 ) != 0 )
26
+			continue;
27
+
28
+		/* URL has an explicit protocol */
29
+		info->protocol = url;
30
+		*p = '\0';
31
+		p += 3;
32
+		info->host = p;
33
+
34
+		/* Search for port or file delimiter */
35
+		for ( ; *p ; p++ ) {
36
+			if ( *p == ':' ) {
37
+				*p = '\0';
38
+				info->port = p + 1;
39
+				continue;
40
+			}
41
+			if ( *p == '/' ) {
42
+				*(p++) = '\0';
68 43
 				break;
69 44
 			}
70 45
 		}
71
-		*terminator = temp;
72
-	} else {
73
-		/* No explicitly specified protocol */
74
-		if ( default_protocols < protocols_end )
75
-			info->proto = default_protocols;
46
+		info->file = p;
47
+		return;
76 48
 	}
77
-	return ( ( int ) info->proto ); /* NULL indicates failure */
78
-}
79 49
 
80
-/*
81
- * Resolve the host portion of the URL
82
- *
83
- */
84
-static inline int resolve_host ( struct url_info *info ) {
85
-	char *terminator;
86
-	char temp;
87
-	int success;
88
-
89
-	if ( ! info->host_len ) {
90
-		/* No host specified - leave sin.sin_addr empty to
91
-		 * indicate use of DHCP-supplied next-server
92
-		 */
93
-		return 1;
94
-	}
95
-
96
-	terminator = ( char * ) &info->host[info->host_len];
97
-	temp = *terminator;
98
-	*terminator = '\0';
99
-	success = resolv ( &info->sin.sin_addr, info->host );
100
-	*terminator = temp;
101
-	return success;
50
+	/* URL has no explicit protocol; is just a filename */
51
+	info->file = url;
102 52
 }
103 53
 
104 54
 /*
105
- * Parse a URL string into its constituent parts.  Perform name
106
- * resolution if required (and if resolver code is linked in), and
107
- * identify the protocol.
108
- *
109
- * We accept URLs of the form
110
- *
111
- *   [protocol://[host][:port]/]path/to/file
112
- *
113
- * We return true for success, 0 for failure (e.g. unknown protocol).
114
- * Note that the "/" before path/to/file *will* be counted as part of
115
- * the filename, if it is present.
55
+ * Restore a parsed URL to its original pristine form.
116 56
  *
117 57
  */
118
-int parse_url ( struct url_info *info, const char *url ) {
119
-	const char *p;
120
-
121
-	/* Fill in initial values */
122
-	memset ( info, 0, sizeof ( *info ) );
123
-	info->url = url;
124
-	info->protocol = url;
125
-	info->host = url;
126
-	info->port = url;
127
-	info->file = url;
128
-
129
-	/* Split the URL into substrings, and fill in sin.sin_port */
130
-	p = url;
131
-	if ( parse_protocol ( info, &p ) )
132
-		parse_host_port ( info, &p );
133
-	info->file = p;
134
-
135
-	/* Identify the protocol */
136
-	if ( ! identify_protocol ( info ) )
137
-		return 0;
138
-
139
-	/* Resolve the host name to an IP address */
140
-	if ( ! resolve_host ( info ) )
141
-		return 0;
142
-
143
-	return 1;
58
+char * unparse_url ( struct url_info *info ) {
59
+	if ( info->protocol ) {
60
+		/* URL had a protocol: fill in the deleted separators */
61
+		info->file[-1] = '/';
62
+		if ( info->port ) {
63
+			info->port[-1] = ':';
64
+		}
65
+		info->host[-3] = ':';
66
+		return info->protocol;
67
+	} else {
68
+		/* URL had no protocol; was just a filename */
69
+		return info->file;
70
+	}
144 71
 }

Loading…
Cancel
Save