1 ;;; nnwfm.el --- interfacing with a web forum
3 ;; Copyright (C) 2000, 2002, 2003, 2004, 2005,
4 ;; 2006, 2007, 2008 Free Software Foundation, Inc.
6 ;; Author: Lars Magne Ingebrigtsen <larsi@gnus.org>
9 ;; This file is part of GNU Emacs.
11 ;; GNU Emacs is free software; you can redistribute it and/or modify
12 ;; it under the terms of the GNU General Public License as published by
13 ;; the Free Software Foundation; either version 3, or (at your option)
16 ;; GNU Emacs is distributed in the hope that it will be useful,
17 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
18 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19 ;; GNU General Public License for more details.
21 ;; You should have received a copy of the GNU General Public License
22 ;; along with GNU Emacs; see the file COPYING. If not, write to the
23 ;; Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
24 ;; Boston, MA 02110-1301, USA.
28 ;; Note: You need to have `url' and `w3' installed for this
33 (eval-when-compile (require 'cl
))
43 (autoload 'w3-parse-buffer
"w3-parse")
47 (defvoo nnwfm-directory
(nnheader-concat gnus-directory
"wfm/")
48 "Where nnwfm will save its files.")
50 (defvoo nnwfm-address
""
51 "The address of the Ultimate bulletin board.")
53 ;;; Internal variables
55 (defvar nnwfm-groups-alist nil
)
56 (defvoo nnwfm-groups nil
)
57 (defvoo nnwfm-headers nil
)
58 (defvoo nnwfm-articles nil
)
59 (defvar nnwfm-table-regexp
60 "postings.*editpost\\|forumdisplay\\|Forum[0-9]+/HTML\\|getbio")
62 ;;; Interface functions
64 (nnoo-define-basics nnwfm
)
66 (deffoo nnwfm-retrieve-headers
(articles &optional group server fetch-old
)
67 (nnwfm-possibly-change-server group server
)
68 (unless gnus-nov-is-evil
69 (let* ((last (car (last articles
)))
72 (entry (assoc group nnwfm-groups
))
74 (topics (nth 4 entry
))
75 (mapping (nth 5 entry
))
76 (old-total (or (nth 6 entry
) 1))
77 (nnwfm-table-regexp "Thread.asp")
78 headers article subject score from date lines parent point
79 contents tinfo fetchers map elem a href garticles topic old-max
80 inc datel table string current-page total-contents pages
81 farticles forum-contents parse furl-fetched mmap farticle
82 thread-id tables hstuff bstuff time
)
84 (while (and (setq article
(car articles
))
87 (or (> article
(caar map
))
88 (< (cadar map
) (caar map
))))
90 (when (setq mmap
(car map
))
93 (<= article
(nth 1 mmap
)))
94 ;; Do we already have a fetcher for this topic?
95 (if (setq elem
(assq (nth 2 mmap
) fetchers
))
96 ;; Yes, so we just add the spec to the end.
97 (nconc elem
(list (cons article
98 (+ (nth 3 mmap
) (incf farticle
)))))
99 ;; No, so we add a new one.
100 (push (list (nth 2 mmap
)
102 (+ (nth 3 mmap
) (incf farticle
))))
105 (setq article
(car articles
)))))
106 ;; Now we have the mapping from/to Gnus/nnwfm article numbers,
107 ;; so we start fetching the topics that we need to satisfy the
111 (set-buffer nntp-server-buffer
)
113 (setq nnwfm-articles nil
)
114 (mm-with-unibyte-buffer
115 (dolist (elem fetchers
)
117 (setq subject
(nth 2 (assq (car elem
) topics
))
118 thread-id
(nth 0 (assq (car elem
) topics
)))
120 (concat nnwfm-address
121 (format "Item.asp?GroupID=%d&ThreadID=%d" sid
123 (goto-char (point-min))
129 (w3-parse-buffer (current-buffer)))))))))
130 (setq tables
(cdr (caddar (memq (assq 'div tables
) tables
))))
132 (dolist (table tables
)
133 (when (eq (car table
) 'table
)
134 (setq table
(caddar (caddar (caddr table
)))
135 hstuff
(delete ":link" (nnweb-text (car table
)))
136 bstuff
(car (caddar (cdr table
)))
139 (setq time
(nnwfm-date-to-time (nth 2 hstuff
)))
140 (push (list from time bstuff
) contents
))))
141 (setq contents
(nreverse contents
))
142 (dolist (art (cdr elem
))
143 (push (list (car art
)
144 (nth (1- (cdr art
)) contents
)
148 (sort nnwfm-articles
'car-less-than-car
))
149 ;; Now we have all the articles, conveniently in an alist
150 ;; where the key is the Gnus article number.
151 (dolist (articlef nnwfm-articles
)
152 (setq article
(nth 0 articlef
)
153 contents
(nth 1 articlef
)
154 subject
(nth 2 articlef
))
155 (setq from
(nth 0 contents
)
156 date
(message-make-date (nth 1 contents
)))
160 (make-full-mail-header
163 (concat "<" (number-to-string sid
) "%"
164 (number-to-string article
)
167 (/ (length (mapconcat 'identity
(nnweb-text (nth 2 contents
)) ""))
171 (setq nnwfm-headers
(sort headers
'car-less-than-car
))
173 (set-buffer nntp-server-buffer
)
174 (mm-with-unibyte-current-buffer
176 (dolist (header nnwfm-headers
)
177 (nnheader-insert-nov (cdr header
))))))
180 (deffoo nnwfm-request-group
(group &optional server dont-check
)
181 (nnwfm-possibly-change-server nil server
)
182 (when (not nnwfm-groups
)
183 (nnwfm-request-list))
185 (nnwfm-create-mapping group
))
186 (let ((elem (assoc group nnwfm-groups
)))
189 (nnheader-report 'nnwfm
"Group does not exist"))
191 (nnheader-report 'nnwfm
"Opened group %s" group
)
193 "211 %d %d %d %s\n" (cadr elem
) 1 (cadr elem
)
194 (prin1-to-string group
))))))
196 (deffoo nnwfm-request-close
()
197 (setq nnwfm-groups-alist nil
200 (deffoo nnwfm-request-article
(article &optional group server buffer
)
201 (nnwfm-possibly-change-server group server
)
202 (let ((contents (cdr (assq article nnwfm-articles
))))
203 (when (setq contents
(nth 2 (car contents
)))
205 (set-buffer (or buffer nntp-server-buffer
))
207 (nnweb-insert-html contents
)
208 (goto-char (point-min))
209 (insert "Content-Type: text/html\nMIME-Version: 1.0\n")
210 (let ((header (cdr (assq article nnwfm-headers
))))
211 (mm-with-unibyte-current-buffer
212 (nnheader-insert-header header
)))
213 (nnheader-report 'nnwfm
"Fetched article %s" article
)
214 (cons group article
)))))
216 (deffoo nnwfm-request-list
(&optional server
)
217 (nnwfm-possibly-change-server nil server
)
218 (mm-with-unibyte-buffer
220 (if (string-match "/$" nnwfm-address
)
221 (concat nnwfm-address
"Group.asp")
223 (let* ((nnwfm-table-regexp "Thread.asp")
224 (contents (w3-parse-buffer (current-buffer)))
225 sid elem description articles a href group forum
227 (dolist (row (cdr (nth 2 (car (nth 2 (nnwfm-find-forum-table
229 (setq row
(nth 2 row
))
230 (when (setq a
(nnweb-parse-find 'a row
))
231 (setq group
(car (last (nnweb-text a
)))
232 href
(cdr (assq 'href
(nth 1 a
))))
233 (setq description
(car (last (nnweb-text (nth 1 row
)))))
236 (gnus-replace-in-string
237 (car (last (nnweb-text (nth 3 row
)))) "," "")))
239 (string-match "GroupId=\\([0-9]+\\)" href
))
240 (setq forum
(string-to-number (match-string 1 href
)))
241 (if (setq elem
(assoc group nnwfm-groups
))
242 (setcar (cdr elem
) articles
)
243 (push (list group articles forum description nil nil nil nil
)
246 (nnwfm-generate-active)
249 (deffoo nnwfm-request-newgroups
(date &optional server
)
250 (nnwfm-possibly-change-server nil server
)
251 (nnwfm-generate-active)
254 (nnoo-define-skeleton nnwfm
)
256 ;;; Internal functions
258 (defun nnwfm-new-threads-p (group time
)
259 "See whether we want to fetch the threads for GROUP written before TIME."
260 (let ((old-time (nth 7 (assoc group nnwfm-groups
))))
262 (time-less-p old-time time
))))
264 (defun nnwfm-create-mapping (group)
265 (let* ((entry (assoc group nnwfm-groups
))
267 (topics (nth 4 entry
))
268 (mapping (nth 5 entry
))
269 (old-total (or (nth 6 entry
) 1))
270 (current-time (current-time))
271 (nnwfm-table-regexp "Thread.asp")
272 (furls (list (concat nnwfm-address
273 (format "Thread.asp?GroupId=%d" sid
))))
275 contents forum-contents a subject href
276 garticles topic tinfo old-max inc parse elem date
278 (mm-with-unibyte-buffer
281 (push (car furls
) fetched-urls
)
282 (mm-url-insert (pop furls
))
283 (goto-char (point-min))
284 (while (re-search-forward " wr(" nil t
)
286 (setq elem
(message-tokenize-header
287 (gnus-replace-in-string
295 (string-to-number (nth 1 elem
))
296 (gnus-replace-in-string (nth 2 elem
) "\"" "")
297 (string-to-number (nth 5 elem
)))
299 (when (re-search-forward "href=\"\\(Thread.*DateLast=\\([^\"]+\\)\\)"
301 (setq url
(match-string 1)
302 time
(nnwfm-date-to-time (gnus-url-unhex-string
304 (when (and (nnwfm-new-threads-p group time
)
308 (mm-url-decode-entities-string url
)))
311 ;; The main idea here is to map Gnus article numbers to
312 ;; nnwfm article numbers. Say there are three topics in
313 ;; this forum, the first with 4 articles, the seconds with 2,
314 ;; and the third with 1. Then this will translate into 7 Gnus
315 ;; article numbers, where 1-4 comes from the first topic, 5-6
316 ;; from the second and 7 from the third. Now, then next time
317 ;; the group is entered, there's 2 new articles in topic one
318 ;; and 1 in topic three. Then Gnus article number 8-9 be 5-6
319 ;; in topic one and 10 will be the 2 in topic three.
320 (dolist (elem (nreverse forum-contents
))
321 (setq subject
(nth 1 elem
)
323 garticles
(nth 2 elem
))
324 (if (setq tinfo
(assq topic topics
))
326 (setq old-max
(cadr tinfo
))
327 (setcar (cdr tinfo
) garticles
))
329 (push (list topic garticles subject
) topics
)
330 (setcar (nthcdr 4 entry
) topics
))
331 (when (not (= old-max garticles
))
332 (setq inc
(- garticles old-max
))
333 (setq mapping
(nconc mapping
336 old-total
(1- (incf old-total inc
))
337 topic
(1+ old-max
)))))
339 (setcar (nthcdr 5 entry
) mapping
)
340 (setcar (nthcdr 6 entry
) old-total
))))
341 (setcar (nthcdr 7 entry
) current-time
)
342 (setcar (nthcdr 1 entry
) (1- old-total
))
346 (defun nnwfm-possibly-change-server (&optional group server
)
349 (not (nnwfm-server-opened server
)))
350 (nnwfm-open-server server
))
351 (unless nnwfm-groups-alist
353 (setq nnwfm-groups
(cdr (assoc nnwfm-address
354 nnwfm-groups-alist
)))))
356 (deffoo nnwfm-open-server
(server &optional defs connectionless
)
357 (nnheader-init-server-buffer)
358 (if (nnwfm-server-opened server
)
360 (unless (assq 'nnwfm-address defs
)
361 (setq defs
(append defs
(list (list 'nnwfm-address server
)))))
362 (nnoo-change-server 'nnwfm server defs
)))
364 (defun nnwfm-read-groups ()
365 (setq nnwfm-groups-alist nil
)
366 (let ((file (expand-file-name "groups" nnwfm-directory
)))
367 (when (file-exists-p file
)
368 (mm-with-unibyte-buffer
369 (insert-file-contents file
)
370 (goto-char (point-min))
371 (setq nnwfm-groups-alist
(read (current-buffer)))))))
373 (defun nnwfm-write-groups ()
374 (setq nnwfm-groups-alist
375 (delq (assoc nnwfm-address nnwfm-groups-alist
)
377 (push (cons nnwfm-address nnwfm-groups
)
379 (with-temp-file (expand-file-name "groups" nnwfm-directory
)
380 (prin1 nnwfm-groups-alist
(current-buffer))))
382 (defun nnwfm-init (server)
383 "Initialize buffers and such."
384 (unless (file-exists-p nnwfm-directory
)
385 (gnus-make-directory nnwfm-directory
)))
387 (defun nnwfm-generate-active ()
389 (set-buffer nntp-server-buffer
)
391 (dolist (elem nnwfm-groups
)
392 (insert (prin1-to-string (car elem
))
393 " " (number-to-string (cadr elem
)) " 1 y\n"))))
395 (defun nnwfm-find-forum-table (contents)
397 (nnwfm-find-forum-table-1 contents
)))
399 (defun nnwfm-find-forum-table-1 (contents)
400 (dolist (element contents
)
401 (unless (stringp element
)
402 (when (and (eq (car element
) 'table
)
403 (nnwfm-forum-table-p element
))
404 (throw 'found element
))
405 (when (nth 2 element
)
406 (nnwfm-find-forum-table-1 (nth 2 element
))))))
408 (defun nnwfm-forum-table-p (parse)
409 (when (not (apply 'gnus-or
412 (nnweb-parse-find 'table p
))
414 (let ((href (cdr (assq 'href
(nth 1 (nnweb-parse-find 'a parse
20)))))
416 (when (and href
(string-match nnwfm-table-regexp href
))
419 (defun nnwfm-date-to-time (date)
420 (let ((time (mapcar #'string-to-number
(split-string date
"[\\.\\+ :]"))))
421 (encode-time 0 (nth 4 time
) (nth 3 time
)
422 (nth 0 time
) (nth 1 time
)
423 (if (< (nth 2 time
) 70)
424 (+ 2000 (nth 2 time
))
425 (+ 1900 (nth 2 time
))))))
430 ;; coding: iso-8859-1
433 ;;; arch-tag: d813966a-4211-4557-ad11-d1ac2bc86536
434 ;;; nnwfm.el ends here