;;; url-parse.el --- Uniform Resource Locator parser

;; Copyright (C) 1996, 1997, 1998, 1999, 2004,
;; 2005, 2006, 2007, 2008, 2009 Free Software Foundation, Inc.

;; Keywords: comm, data, processes

;; This file is part of GNU Emacs.

;; GNU Emacs is free software: you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation, either version 3 of the License, or
;; (at your option) any later version.

;; GNU Emacs is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.

;; You should have received a copy of the GNU General Public License
;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
28 (eval-when-compile (require 'cl
))
30 (autoload 'url-scheme-get-property
"url-methods")
;; Parsed representation of a URL.  The only constructor is the
;; positional `url-parse-make-urlobj'; the default keyword constructor
;; and the copier are suppressed.  Slot accessors are `url-type',
;; `url-user', `url-password', `url-host', `url-portspec',
;; `url-filename', `url-target', `url-attributes' and `url-fullness'.
(defstruct (url
            (:constructor nil)
            (:constructor url-parse-make-urlobj
                          (&optional type user password host portspec filename
                                     target attributes fullness))
            (:copier nil))
  type user password host portspec filename target attributes fullness)
(defsubst url-port (urlobj)
  "Return the port of URLOBJ.
This is the PORTSPEC slot when it is non-nil.  Otherwise, if the
FULLNESS slot is non-nil, it is the `default-port' property that
`url-scheme-get-property' reports for the TYPE of URLOBJ.
Otherwise it is nil."
  (let ((explicit-port (url-portspec urlobj)))
    (cond
     ;; A single-element clause returns the tested value itself.
     (explicit-port)
     ((url-fullness urlobj)
      (url-scheme-get-property (url-type urlobj) 'default-port)))))
;; Make `url-port' a valid `setf' place: storing PORT into
;; (url-port URLOBJ) expands to storing it into the PORTSPEC slot.
(defsetf url-port (urlobj) (port)
  (list 'setf (list 'url-portspec urlobj) port))
(defun url-recreate-url (urlobj)
  "Recreate a URL string from the parsed URLOBJ.
The pieces are concatenated in this order: the type followed by
\":\", then \"//\" if there is a host, the user (with \":\" and the
password, if any) followed by \"@\", the host, \":\" and the port if
the port differs from the scheme's `default-port' property, the
filename (or \"/\" if it is nil), the attributes as produced by
`url-recreate-url-attributes', and \"#\" with the target if any."
  (concat (url-type urlobj) ":" (if (url-host urlobj) "//" "")
          ;; Userinfo is emitted only when a user is present, and is
          ;; always terminated by "@" so it cannot run into the host.
          (if (url-user urlobj)
              (concat (url-user urlobj)
                      (if (url-password urlobj)
                          (concat ":" (url-password urlobj)))
                      "@"))
          (url-host urlobj)
          ;; Leave the port out when it is the scheme's default.
          (if (and (url-port urlobj)
                   (not (equal (url-port urlobj)
                               (url-scheme-get-property (url-type urlobj)
                                                        'default-port))))
              (format ":%d" (url-port urlobj)))
          (or (url-filename urlobj) "/")
          (url-recreate-url-attributes urlobj)
          (if (url-target urlobj)
              (concat "#" (url-target urlobj)))))
(defun url-recreate-url-attributes (urlobj)
  "Recreate the attributes of an URL string from the parsed URLOBJ.
Return nil when URLOBJ has no attributes.  Otherwise return a
string that starts with \";\" and lists the attributes separated
by \";\".  Each attribute is a cons cell: it is written as
\"NAME=VALUE\" when its cdr is non-nil and as \"NAME\" otherwise."
  (when (url-attributes urlobj)
    ;; The leading ";" separates the attribute list from the filename
    ;; that precedes it in the recreated URL.
    (concat ";"
            (mapconcat (lambda (x)
                         (if (cdr x)
                             (concat (car x) "=" (cdr x))
                           ;; A valueless attribute gets no "=".
                           (car x)))
                       (url-attributes urlobj) ";"))))
(defun url-generic-parse-url (url)
  "Return an URL-struct of the parts of URL.
The CL-style struct contains the following fields:
TYPE USER PASSWORD HOST PORTSPEC FILENAME TARGET ATTRIBUTES FULLNESS.

A nil URL yields an empty struct.  A URL that does not match
`url-nonrelative-link', or whose first character is \"/\", is
stored unparsed in the FILENAME field with all other fields nil.
Any other URL is split into its components in a temporary buffer."
  (cond
   ((null url)
    (url-parse-make-urlobj))
   ((or (not (string-match url-nonrelative-link url))
        (= ?/ (string-to-char url)))
    ;; This isn't correct, as a relative URL can be a fragment link
    ;; (e.g. "#foo") and many other things (see section 4.2).
    ;; However, let's not fix something that isn't broken, especially
    ;; when close to a release.
    (url-parse-make-urlobj nil nil nil nil nil url))
   (t
    (with-temp-buffer
      (set-syntax-table url-parse-syntax-table)
      (let ((save-pos nil)
            (prot nil)
            (user nil)
            (pass nil)
            (host nil)
            (port nil)
            (file nil)
            (refs nil)
            (attr nil)
            (full nil)
            (inhibit-read-only t))
        (insert url)
        (goto-char (point-min))
        (setq save-pos (point))

        ;; Scheme: everything up to the ":" separator, lower-cased.
        (unless (looking-at "//")
          (skip-chars-forward "a-zA-Z+.\\-")
          (downcase-region save-pos (point))
          (setq prot (buffer-substring save-pos (point)))
          (skip-chars-forward ":")
          (setq save-pos (point)))

        ;; Authority: "//" [user[:password]@] host [:port], ending at
        ;; the next "/".
        (when (looking-at "//")
          (setq full t)
          (forward-char 2)
          (setq save-pos (point))
          (skip-chars-forward "^/")
          (setq host (buffer-substring save-pos (point)))
          (if (string-match "^\\([^@]+\\)@" host)
              (setq user (match-string 1 host)
                    host (substring host (match-end 0) nil)))
          (if (and user (string-match "\\([^:]+\\):\\(.*\\)" user))
              (setq pass (match-string 2 user)
                    user (match-string 1 user)))
          ;; This gives wrong results for IPv6 literal addresses.
          (if (string-match ":\\([0-9+]+\\)" host)
              (setq port (string-to-number (match-string 1 host))
                    host (substring host 0 (match-beginning 0))))
          ;; Drop a trailing ":" that had no port number after it.
          (if (string-match ":$" host)
              (setq host (substring host 0 (match-beginning 0))))
          (setq host (downcase host)))

        ;; Fall back to the scheme's default port only when the URL
        ;; did not carry an explicit one.
        (if (not port)
            (setq port (url-scheme-get-property prot 'default-port)))

        ;; Gross hack to preserve ';' in data URLs
        (setq save-pos (point))

        (if (string= "data" prot)
            (goto-char (point-max))
          ;; Now check for references
          (skip-chars-forward "^#")
          (unless (eobp)
            (let ((fragment-start (point)))
              (skip-chars-forward "#")
              (setq refs (buffer-substring (point) (point-max)))
              ;; Remove the fragment so that it cannot end up in the
              ;; attributes or the filename extracted below.
              (delete-region fragment-start (point-max))))
          (goto-char save-pos)
          (skip-chars-forward "^;")
          (unless (eobp)
            (setq attr (url-parse-args (buffer-substring (point) (point-max))
                                       t)
                  attr (nreverse attr))))

        ;; Whatever lies between the end of the authority and point
        ;; is the filename.
        (setq file (buffer-substring save-pos (point)))
        (if (and host (string-match "%[0-9][0-9]" host))
            (setq host (url-unhex-string host)))
        (url-parse-make-urlobj
         prot user pass host port file refs attr full))))))
;; arch-tag: f338325f-71ab-4bee-93cc-78fb9a03d403
;;; url-parse.el ends here