/*
 * Report whether `ch` may appear in a URL scheme.
 *
 * first_flag: non-zero when `ch` is the first character of the scheme.
 * ch:         the character to test, as an int; values <= 0 are rejected.
 *
 * Returns 1 if the character is acceptable at that position, 0 otherwise.
 */
int is_urlschemechar(int first_flag, int ch)
{
	/*
	 * The set of valid URL schemes, as per STD66 (RFC3986) is
	 * '[A-Za-z][A-Za-z0-9+.-]*'. But use a slightly looser check
	 * of '[A-Za-z0-9][A-Za-z0-9+.-]*' because an earlier version
	 * of the check used '[A-Za-z0-9]+', so as not to break any
	 * remote helpers.
	 */
	int alphanumeric, special;

	/* Guard against non-positive values before calling isalnum(). */
	alphanumeric = ch > 0 && isalnum(ch);
	special = ch == '+' || ch == '-' || ch == '.';

	/* '+', '-' and '.' are only allowed after the first character. */
	return alphanumeric || (!first_flag && special);
}
/*
 * Decide whether `url` looks like "<scheme>://...".
 *
 * The text before the first '/' must be a non-empty scheme made of
 * characters accepted by is_urlschemechar(), followed by ':', and the
 * first '/' must itself be followed by another '/'.
 *
 * Returns 1 when the string passes these checks, 0 otherwise
 * (including when `url` is NULL).
 *
 * NOTE(review): the early "return 0" statements, the cursor
 * initialisation/increment and the final "return 1" were not present in
 * the damaged listing this was restored from; they follow from the
 * comments and conditions that were. Confirm against the upstream file.
 */
int is_url(const char *url)
{
	const char *url2, *first_slash;

	if (!url)
		return 0;
	url2 = url;
	first_slash = strchr(url, '/');

	/* Input with no slash at all or slash first can't be URL. */
	if (!first_slash || first_slash == url)
		return 0;
	/* Character before must be : and next must be /. */
	if (first_slash[-1] != ':' || first_slash[1] != '/')
		return 0;
	/* There must be something before the :// */
	if (first_slash == url + 1)
		return 0;
	/*
	 * Check all characters up to first slash - 1, i.e. everything
	 * before the ':'. Only scheme characters are allowed.
	 */
	while (url2 < first_slash - 1) {
		/* Cast avoids passing a negative value for high-bit bytes. */
		if (!is_urlschemechar(url2 == url, (unsigned char)*url2))
			return 0;
		url2++;
	}

	/* Valid enough. */
	return 1;
}
/*
 * Decode the two hexadecimal digits at `q` (the part of a "%XX" escape
 * after the '%') into a byte value.
 *
 * Returns the decoded value (0..255), or -1 if either of the two
 * characters is not a hex digit. A NUL terminator is not a hex digit,
 * so a truncated escape stops at the NUL and yields -1 without reading
 * past it.
 *
 * NOTE(review): the accumulation statements and the error return were
 * not present in the damaged listing this was restored from; they are
 * inferred from the visible digit-range tests. Confirm against upstream.
 */
static int url_decode_char(const char *q)
{
	int i;
	unsigned char val = 0;

	for (i = 0; i < 2; i++) {
		unsigned char c = *q++;

		/* Make room for the next nibble. */
		val <<= 4;
		if (c >= '0' && c <= '9')
			val += c - '0';
		else if (c >= 'a' && c <= 'f')
			val += c - 'a' + 10;
		else if (c >= 'A' && c <= 'F')
			val += c - 'A' + 10;
		else
			return -1;
	}
	return val;
}
70 static char *url_decode_internal(const char **query
, const char *stop_at
)
72 const char *q
= *query
;
75 strbuf_init(&out
, 16);
81 if (stop_at
&& strchr(stop_at
, c
)) {
87 int val
= url_decode_char(q
+ 1);
89 strbuf_addch(&out
, val
);
96 strbuf_addch(&out
, ' ');
98 strbuf_addch(&out
, c
);
102 return strbuf_detach(&out
, NULL
);
105 char *url_decode(const char *url
)
107 return url_decode_internal(&url
, NULL
);
/*
 * Decode a parameter name from *query via url_decode_internal(), using
 * '&' and '=' as the stop characters. `query` is passed through as the
 * helper's in/out cursor.
 */
char *url_decode_parameter_name(const char **query)
{
	return url_decode_internal(query, "&=");
}
/*
 * Decode a parameter value from *query via url_decode_internal(), using
 * '&' as the only stop character. `query` is passed through as the
 * helper's in/out cursor.
 */
char *url_decode_parameter_value(const char **query)
{
	return url_decode_internal(query, "&");
}