* textmodes/two-column.el (2C-split):
[bpt/emacs.git] / lisp / net / newst-backend.el
1 ;;; newst-backend.el --- Retrieval backend for newsticker.
2
3 ;; Copyright (C) 2003, 2004, 2005, 2006, 2007, 2008, 2009
4 ;; Free Software Foundation, Inc.
5
6 ;; Author: Ulf Jasper <ulf.jasper@web.de>
7 ;; Filename: newst-backend.el
8 ;; URL: http://www.nongnu.org/newsticker
9 ;; Keywords: News, RSS, Atom
10 ;; Time-stamp: "23. Januar 2009, 19:39:22 (ulf)"
11
12 ;; ======================================================================
13
14 ;; This file is part of GNU Emacs.
15
16 ;; GNU Emacs is free software: you can redistribute it and/or modify
17 ;; it under the terms of the GNU General Public License as published by
18 ;; the Free Software Foundation, either version 3 of the License, or
19 ;; (at your option) any later version.
20
21 ;; GNU Emacs is distributed in the hope that it will be useful,
22 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
23 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
24 ;; GNU General Public License for more details.
25
26 ;; You should have received a copy of the GNU General Public License
27 ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
28
29 ;; ======================================================================
30
31 ;;; Commentary:
32
33 ;; See newsticker.el
34
35 ;; ======================================================================
36 ;;; Code:
37
38 (require 'derived)
39 (require 'xml)
40
;; Silence byte-compiler warnings about free variables.  These keymaps
;; are presumably defined by the w3 and w3m packages (inferred from the
;; names); they are only declared here, no value is assigned.
(defvar w3-mode-map)
(defvar w3m-minor-mode-map)
44
45
(defvar newsticker--retrieval-timer-list nil
  "Alist of the timers used for news retrieval.
Each element is a cons cell of the form (FEED-NAME . TIMER).")

(defvar newsticker--download-logos nil
  "Non-nil means download feed logos when they are available.")

(defvar newsticker--sentinel-callback nil
  "Function called at the end of `newsticker--sentinel'.")
55
;;;###autoload
(defun newsticker-running-p ()
  "Return t if newsticker is running, nil otherwise.
Newsticker counts as running as long as
`newsticker--retrieval-timer-list' contains at least one entry."
  (not (null newsticker--retrieval-timer-list)))
62
63 ;; ======================================================================
64 ;;; Customization
65 ;; ======================================================================
(defgroup newsticker nil
  "Aggregator for RSS and Atom news feeds."
  :group 'applications)
69
(defconst newsticker--raw-url-list-defaults
  ;; Every entry is (LABEL URL [START-TIME [INTERVAL]]).
  '(("CNET News.com"
     "http://export.cnet.com/export/feeds/news/rss/1,11176,,00.xml")
    ("Debian Security Advisories"
     "http://www.debian.org/security/dsa.en.rdf")
    ("Debian Security Advisories - Long format"
     "http://www.debian.org/security/dsa-long.en.rdf")
    ("Emacs Wiki"
     "http://www.emacswiki.org/cgi-bin/wiki.pl?action=rss" nil 3600)
    ("Freshmeat.net"
     "http://freshmeat.net/index.atom")
    ("Kuro5hin.org"
     "http://www.kuro5hin.org/backend.rdf")
    ("LWN (Linux Weekly News)"
     "http://lwn.net/headlines/rss")
    ("NY Times: Technology"
     "http://partners.userland.com/nytRss/technology.xml")
    ("NY Times"
     "http://partners.userland.com/nytRss/nytHomepage.xml")
    ("Quote of the day"
     "http://www.quotationspage.com/data/qotd.rss" "07:00" 86400)
    ("The Register"
     "http://www.theregister.co.uk/tonys/slashdot.rdf")
    ;; /. will ban you if under 3600 seconds!
    ("slashdot"
     "http://slashdot.org/index.rss" nil 3600)
    ("Wired News"
     "http://www.wired.com/news_drop/netcenter/netcenter.rdf")
    ("Heise News (german)"
     "http://www.heise.de/newsticker/heise.rdf")
    ("Tagesschau (german)"
     "http://www.tagesschau.de/newsticker.rdf" nil 1800)
    ("Telepolis (german)"
     "http://www.heise.de/tp/news.rdf"))
  "Default URL list in raw form.
Each entry is converted by `newsticker--splicer' and spliced into
the customization type of `newsticker-url-list-defaults'.")
113
(defun newsticker--splicer (item)
  "Convert ITEM for splicing into `newsticker-url-list-defaults'.
ITEM is a feed specification whose first element is the feed label.
Return a customization type of the form
  (list :tag LABEL (const LABEL) (const ELT) ...)
with one `const' for the label and one for every further element
of ITEM."
  (let ((label (car item)))
    ;; Consing LABEL onto the tail keeps the (const LABEL) entry even
    ;; when ITEM itself is empty.
    (append (list 'list :tag label)
            (mapcar (lambda (value) (list 'const value))
                    (cons label (cdr item))))))
122
(defun newsticker--set-customvar-retrieval (symbol value)
  "Set retrieval related newsticker-variable SYMBOL value to VALUE.
Calls all actions which are necessary in order to make the new
value effective:

- If SYMBOL is not bound yet or VALUE equals its current value,
  the value is stored and nothing else happens.
- If SYMBOL is `newsticker-retrieval-interval', a running
  newsticker is stopped and started again.
- If SYMBOL is `newsticker-url-list-defaults' or
  `newsticker-url-list', feeds which are no longer contained in
  VALUE are stopped and new or changed feeds are (re)started.  If
  there are no new or changed feeds
  `newsticker--sentinel-callback' is called, if it is set.

This is meant to be used as `:set' function of a `defcustom' and
therefore operates on the default value of SYMBOL."
  (if (or (not (default-boundp symbol))
          (equal (default-value symbol) value))
      ;; Initial definition or unchanged value: just store it.
      (set-default symbol value)
    ;; something must have changed
    (let ((old-value (default-value symbol))
          (new-or-changed-feeds nil)
          (removed-feeds nil))
      (if (eq symbol 'newsticker-retrieval-interval)
          (progn
            ;; The new interval must be in place before the timers
            ;; are created again.
            (set-default symbol value)
            (when (newsticker-running-p)
              (message "Restarting newsticker")
              (newsticker-stop)
              (newsticker-start)))
        (when (memq symbol '(newsticker-url-list-defaults newsticker-url-list))
          (dolist (elt value)
            (unless (member elt old-value)
              (setq new-or-changed-feeds (cons elt new-or-changed-feeds))))
          (dolist (elt old-value)
            (unless (member elt value)
              (setq removed-feeds (cons elt removed-feeds)))))
        (dolist (feed removed-feeds)
          (message "Stopping feed `%s'" (car feed))
          (newsticker--stop-feed (car feed)))
        (dolist (feed new-or-changed-feeds)
          (message "Starting feed `%s'" (car feed))
          ;; A changed feed may still have a timer with its old settings.
          (newsticker--stop-feed (car feed))
          (newsticker--start-feed feed))
        (unless new-or-changed-feeds
          (when newsticker--sentinel-callback
            (funcall newsticker--sentinel-callback))))
      (set-default symbol value))))
161
162 ;; ======================================================================
163 ;; retrieval
(defgroup newsticker-retrieval nil
  "Settings for the retrieval of news."
  :group 'newsticker)
167
(defcustom newsticker-url-list-defaults
  '(("Emacs Wiki"
     "http://www.emacswiki.org/cgi-bin/wiki.pl?action=rss"
     nil
     3600))
  "A customizable list of news feeds to select from.
These were mostly extracted from the Radio Community Server at
http://subhonker6.userland.com/rcsPublic/rssHotlist.

You may add other entries in `newsticker-url-list'."
  ;; The type offers one checkbox per entry of
  ;; `newsticker--raw-url-list-defaults'.  The function is quoted with
  ;; #' -- the original used a stray backquote here.
  :type `(set ,@(mapcar #'newsticker--splicer
                        newsticker--raw-url-list-defaults))
  :set 'newsticker--set-customvar-retrieval
  :group 'newsticker-retrieval)
182
(defcustom newsticker-url-list nil
  "The news feeds which you like to watch.

These feeds are used in addition to the ones selected by
customizing `newsticker-url-list-defaults'.

This is an alist.  Each element consists of two items: a LABEL and a URL,
optionally followed by a START-TIME, INTERVAL specifier and WGET-ARGUMENTS.

The LABEL gives the name of the news feed.  It can be an arbitrary string.

The URL gives the location of the news feed.  It must point to a valid
RSS or Atom file.  The file is retrieved with the method selected by
`newsticker-retrieval-method'.

URL may also be a function which returns news data.  In this case
`newsticker-retrieval-method' etc. are ignored for this feed.

The START-TIME can be either a string, or nil.  If it is a string it
specifies a fixed time at which this feed shall be retrieved for the
first time.  (Examples: \"11:00pm\", \"23:00\".)  If it is nil (or
unspecified), this feed will be retrieved immediately after calling
`newsticker-start'.

The INTERVAL specifies the time between retrievals for this feed.  If it
is nil (or unspecified) the default interval value as set in
`newsticker-retrieval-interval' is used.

\(newsticker.el calls `run-at-time'.  The newsticker-parameters START-TIME
and INTERVAL correspond to the `run-at-time'-parameters TIME and REPEAT.)

WGET-ARGUMENTS specifies arguments for wget (see `newsticker-wget-name')
which apply for this feed only, overriding the value of
`newsticker-wget-arguments'."
  :type '(repeat (list :tag "News feed"
                       (string :tag "Label")
                       (choice :tag "URI"
                               (string :tag "String")
                               (function :tag "Function"))
                       (choice :tag "Start"
                               (const   :tag "Default" nil)
                               (string  :tag "Fixed Time"))
                       (choice :tag "Interval"
                               (const   :tag "Default" nil)
                               (const   :tag "Hourly" 3600)
                               (const   :tag "Daily" 86400)
                               (const   :tag "Weekly" 604800)
                               (integer :tag "Interval"))
                       (choice :tag "Wget Arguments"
                               (const  :tag "Default arguments" nil)
                               (repeat :tag "Special arguments" string))))
  :set 'newsticker--set-customvar-retrieval
  :group 'newsticker-retrieval)
236
(defcustom newsticker-retrieval-method 'intern
  "Method for retrieving news from the web, either `intern' or `extern'.
The default value `intern' uses the built-in asynchronous download
capabilities of Emacs (`url-retrieve').  If set to `extern' the
external program wget is used, see `newsticker-wget-name'."
  :type '(choice :tag "Method"
                 (const :tag "Intern" intern)
                 (const :tag "Extern" extern))
  :group 'newsticker-retrieval)
247
(defcustom newsticker-wget-name "wget"
  "Name of the program which is called to retrieve news from the web.
The canonical choice is wget, but any other program will do as
long as it is able to write the contents of a news feed file to
stdout."
  :type 'string
  :group 'newsticker-retrieval)
255
(defcustom newsticker-wget-arguments '("-q" "-O" "-")
  "Arguments which are passed to wget.
There is probably no reason to change the default settings, unless
you are living behind a firewall."
  :type '(repeat (string :tag "Argument"))
  :group 'newsticker-retrieval)
263
(defcustom newsticker-retrieval-interval 3600
  "Time interval for retrieving new news items (seconds).
If this value is not positive (i.e. less than or equal to 0)
items are retrieved only once!
Please note that some feeds, e.g. Slashdot, will ban you if you
make it less than 1800 seconds (30 minutes)!"
  :type '(choice :tag "Interval"
                 (const   :tag "No automatic retrieval" 0)
                 (const   :tag "Hourly" 3600)
                 (const   :tag "Daily" 86400)
                 (const   :tag "Weekly" 604800)
                 (integer :tag "Interval"))
  :set 'newsticker--set-customvar-retrieval
  :group 'newsticker-retrieval)
279
(defcustom newsticker-desc-comp-max 100
  "Relevant length of headline descriptions.
This is the maximum number of characters which newsticker takes
into account when it compares two headline descriptions."
  :type 'integer
  :group 'newsticker-retrieval)
288
289 ;; ======================================================================
290 ;; headline processing
(defgroup newsticker-headline-processing nil
  "Settings for the automatic processing of headlines."
  :group 'newsticker)
294
(defcustom newsticker-automatically-mark-items-as-old t
  "Decides whether to automatically mark items as old.
If t, an item counts as new only after its first retrieval; as
soon as it is retrieved a second time it becomes old.  If not t,
all items stay new until you mark them as old, which is done in
the *newsticker* buffer."
  :type 'boolean
  :group 'newsticker-headline-processing)
304
(defcustom newsticker-automatically-mark-visited-items-as-old t
  "Decides whether to automatically mark visited items as old.
If t, an item is marked as old as soon as the associated link is
visited, i.e. after pressing RET or mouse2 on the headline of the
item."
  :type 'boolean
  :group 'newsticker-headline-processing)
314
(defcustom newsticker-keep-obsolete-items t
  "Decides whether to keep unread items which have been removed from feed.
If t, a new item which has been removed from the feed is kept in
the cache until it is marked as read."
  :type 'boolean
  :group 'newsticker-headline-processing)
322
(defcustom newsticker-obsolete-item-max-age (* 60 60 24)
  "Maximal age of obsolete items, in seconds.
Obsolete items older than this value are silently deleted at the
next retrieval.  The default corresponds to one day."
  :type 'integer
  :group 'newsticker-headline-processing)
330
(defcustom newsticker-auto-mark-filter-list nil
  "A list of filters for automatically marking headlines.

This is an alist of the form (FEED-NAME PATTERN-LIST).  I.e. each
element consists of a FEED-NAME and a PATTERN-LIST.  FEED-NAME is
a string.  Each element of the pattern-list has the form
\(AGE TITLE-OR-DESCRIPTION REGEXP).  AGE must be one of the symbols
`old' or `immortal'.  TITLE-OR-DESCRIPTION must be one of the
symbols `title', `description', or `all'.  REGEXP is a regular
expression, i.e. a string.

This filter is checked after a new headline has been retrieved.
If FEED-NAME matches the name of the corresponding news feed, the
pattern-list is checked: The new headline will be marked as AGE
if REGEXP matches the headline's TITLE-OR-DESCRIPTION.

If, for example, `newsticker-auto-mark-filter-list' looks like
 \((\"slashdot\" ((old title \"^Forget me!$\")
               (immortal title \"Read me\")
               (immortal all \"important\"))))

then all articles from slashdot are marked as old if they have
the title \"Forget me!\".  All articles with a title containing
the string \"Read me\" are marked as immortal.  All articles which
contain the string \"important\" in their title or their
description are marked as immortal."
  :type '(repeat (list :tag "Auto mark filter"
                       (string :tag "Feed name")
                       (repeat
                        (list :tag "Filter element"
                              (choice
                               :tag "Auto-assigned age"
                               (const :tag "Old" old)
                               (const :tag "Immortal" immortal))
                              (choice
                               :tag "Title/Description"
                               (const :tag "Title" title)
                               (const :tag "Description" description)
                               (const :tag "All" all))
                              (string :tag "Regexp")))))
  :group 'newsticker-headline-processing)
372
373 ;; ======================================================================
374 ;; hooks
(defgroup newsticker-hooks nil
  "Settings for the hooks run by newsticker."
  :group 'newsticker)
378
(defcustom newsticker-start-hook nil
  "Hook run when starting newsticker.
It is run at the very end of `newsticker-start'."
  :options '(newsticker-start-ticker)
  :type 'hook
  :group 'newsticker-hooks)
386
(defcustom newsticker-stop-hook nil
  "Hook run when stopping newsticker.
It is run at the very end of `newsticker-stop'."
  :options nil
  :type 'hook
  :group 'newsticker-hooks)
394
(defcustom newsticker-new-item-functions nil
  "List of functions run after a new headline has been retrieved.
Each function is called with the following three arguments:
FEED  the name of the corresponding news feed,
TITLE the title of the headline,
DESC  the decoded description of the headline.

See `newsticker-download-images', and
`newsticker-download-enclosures' for sample functions.

Please note that these functions are called only once for a
headline, namely after it has been retrieved for the first time."
  :type 'hook
  :options '(newsticker-download-images
             newsticker-download-enclosures)
  :group 'newsticker-hooks)
412
413 ;; ======================================================================
414 ;; miscellaneous
(defgroup newsticker-miscellaneous nil
  "Miscellaneous settings for newsticker."
  :group 'newsticker)
418
(defcustom newsticker-cache-filename "~/.newsticker-cache"
  "Name of the newsticker cache file.
This variable is obsolete, see `newsticker-dir'."
  :type 'string
  :group 'newsticker-miscellaneous)
;; `newsticker-cache-filename' is a variable, so it has to be declared
;; obsolete with `make-obsolete-variable'; `make-obsolete' would mark a
;; (non-existent) function of that name instead.
(make-obsolete-variable 'newsticker-cache-filename 'newsticker-dir "23.1")
425
(defcustom newsticker-dir (locate-user-emacs-file "newsticker/" ".newsticker/")
  "Directory in which newsticker saves its data."
  :type 'directory
  :group 'newsticker-miscellaneous)
431
432 ;; debugging
(defcustom newsticker-debug nil
  "Enables some features needed for debugging newsticker.el.

If set to t, newsticker.el prints lots of debugging messages and
the buffers *newsticker-wget-<feed>* are not closed."
  :type 'boolean
  :group 'newsticker-miscellaneous)
441
442 ;; ======================================================================
443 ;;; Compatibility section, XEmacs, Emacs
444 ;; ======================================================================
445
446 ;; FIXME It is bad practice to define compat functions with such generic names.
447
448 ;; This is not needed in Emacs >= 22.1.
(unless (fboundp 'time-add)
  (require 'time-date);;FIXME
  (defun time-add (t1 t2)
    "Return the sum of the time values T1 and T2.
Compatibility definition, only installed if `time-add' is missing."
    (with-no-warnings ; don't warn about obsolete time-to-seconds in 23.2
      (let ((sum (+ (time-to-seconds t1) (time-to-seconds t2))))
        (seconds-to-time sum)))))
454
;; Fall back to `match-string' where the property-free variant is missing.
(or (fboundp 'match-string-no-properties)
    (defalias 'match-string-no-properties 'match-string))
457
(when (and (featurep 'xemacs)
           (not (fboundp 'replace-regexp-in-string)))
  (defun replace-regexp-in-string (re rp st)
    "Replace matches of regexp RE in string ST with RP.
Compatibility definition for XEmacs, based on `replace-in-string'."
    (save-match-data ;; apparently XEmacs needs save-match-data
      (replace-in-string st re rp))))
463
464 ;; copied from subr.el
(unless (fboundp 'add-to-invisibility-spec)
  (defun add-to-invisibility-spec (arg)
    "Add elements to `buffer-invisibility-spec'.
See documentation for `buffer-invisibility-spec' for the kind of elements
that can be added."
    ;; A spec of t is turned into a list first so that ARG can be
    ;; consed onto it.
    (when (eq buffer-invisibility-spec t)
      (setq buffer-invisibility-spec (list t)))
    (setq buffer-invisibility-spec
          (cons arg buffer-invisibility-spec))))
474
475 ;; copied from subr.el
(unless (fboundp 'remove-from-invisibility-spec)
  (defun remove-from-invisibility-spec (arg)
    "Remove elements from `buffer-invisibility-spec'.
Nothing happens unless `buffer-invisibility-spec' is a cons."
    (when (consp buffer-invisibility-spec)
      (setq buffer-invisibility-spec
            (delete arg buffer-invisibility-spec)))))
482
483 ;; ======================================================================
484 ;;; Internal variables
485 ;; ======================================================================
(defvar newsticker--item-list nil
  "List of newsticker items.")

(defvar newsticker--item-position 0
  "Actual position in list of newsticker items.")

(defvar newsticker--prev-message "There was no previous message yet!"
  "Last message that the newsticker displayed.")

(defvar newsticker--scrollable-text ""
  "The text which is scrolled smoothly in the echo area.")

(defvar newsticker--buffer-uptodate-p nil
  "Tells whether the newsticker buffer is up to date.")

(defvar newsticker--latest-update-time (current-time)
  "The time at which the latest news arrived.
Initialized with the time at which this variable is defined.")

(defvar newsticker--process-ids nil
  "List of PIDs of active newsticker processes.")
500
(defvar newsticker--cache nil
  "Cached newsticker data.
This is a list of the form

 ((label1
   (title description link time age index preformatted-contents
    preformatted-title extra-elements)
   ...)
  (label2
   (title description link time age index preformatted-contents
    preformatted-title extra-elements)
   ...)
  ...)

where LABEL is a symbol.  TITLE, DESCRIPTION, and LINK are
strings.  TIME is a time value as returned by `current-time'.
AGE is a symbol: 'new, 'old, 'immortal, and 'obsolete denote
ordinary news items, whereas 'feed denotes an item which is not a
headline but describes the feed itself.  INDEX denotes the
original position of the item -- used for restoring the original
order.  PREFORMATTED-CONTENTS and PREFORMATTED-TITLE hold the
formatted contents of the item's description and title.  This
speeds things up if HTML rendering is used, which is rather
slow.  EXTRA-ELEMENTS is an alist containing additional elements.")
524
(defvar newsticker--auto-narrow-to-feed nil
  "Automatically narrow to current news feed.
Non-nil means that only the items of the current news feed are visible.")

(defvar newsticker--auto-narrow-to-item nil
  "Automatically narrow to current news item.
Non-nil means that only the current headline is visible.")
532
(defconst newsticker--error-headline "[COULD NOT DOWNLOAD HEADLINES!]"
  "Title of the error headline which is inserted if news retrieval fails.")
536
537 ;; ======================================================================
538 ;;; Shortcuts
539 ;; ======================================================================
;; Accessors for the elements of a cache item, i.e. a list of the form
;; (TITLE DESC LINK TIME AGE INDEX PREFORMATTED-CONTENTS
;;  PREFORMATTED-TITLE EXTRA-ELEMENTS).

(defsubst newsticker--title (item)
  "Return the title of ITEM, its first element."
  (car item))

(defsubst newsticker--desc (item)
  "Return the description of ITEM, its second element."
  (car (cdr item)))

(defsubst newsticker--link (item)
  "Return the link of ITEM, its third element."
  (car (nthcdr 2 item)))

(defsubst newsticker--time (item)
  "Return the time of ITEM, its fourth element."
  (car (nthcdr 3 item)))

(defsubst newsticker--age (item)
  "Return the age of ITEM, its fifth element."
  (car (nthcdr 4 item)))

(defsubst newsticker--pos (item)
  "Return the position/index of ITEM, its sixth element."
  (car (nthcdr 5 item)))

(defsubst newsticker--preformatted-contents (item)
  "Return the pre-formatted text of ITEM, its seventh element."
  (car (nthcdr 6 item)))

(defsubst newsticker--preformatted-title (item)
  "Return the pre-formatted title of ITEM, its eighth element."
  (car (nthcdr 7 item)))

(defsubst newsticker--extra (item)
  "Return the extra attributes of ITEM, its ninth element."
  (car (nthcdr 8 item)))
(defsubst newsticker--guid-to-string (guid)
  "Return string representation of GUID.
GUID is returned unchanged if it is a string.  Otherwise it is
treated as an XML node and its first child is returned."
  (cond ((stringp guid) guid)
        (t (car (xml-node-children guid)))))
(defsubst newsticker--guid (item)
  "Return the guid of ITEM.
The guid is looked up under the key `guid' in the extra elements
of ITEM and converted with `newsticker--guid-to-string'."
  (let ((guid-node (assoc 'guid (newsticker--extra item))))
    (newsticker--guid-to-string guid-node)))
(defsubst newsticker--enclosure (item)
  "Return enclosure element of ITEM in the form \(...FIXME...\) or nil.
The value consists of the XML attributes of the `enclosure' entry
in the extra elements of ITEM."
  (let ((node (assoc 'enclosure (newsticker--extra item))))
    (and node
         (xml-node-attributes node))))
(defun newsticker--real-feed-name (feed)
  "Return real name of FEED.
FEED is a symbol.  The real name is the title of the first cached
item of FEED whose age is `feed'.  If there is no such item the
symbol name of FEED is returned."
  (let ((items (cdr (newsticker--cache-get-feed feed)))
        (found nil)
        (title nil))
    (while (and items (not found))
      (when (eq (newsticker--age (car items)) 'feed)
        (setq title (newsticker--title (car items))
              found t))
      (setq items (cdr items)))
    (if found
        title
      (symbol-name feed))))
588
589
590 ;; ======================================================================
591 ;;; User fun
592 ;; ======================================================================
593
(defun newsticker--start-feed (feed &optional do-not-complain-if-running)
  "Start retrieval timer for FEED.
FEED is an element of `newsticker-url-list' or
`newsticker-url-list-defaults'.  If a timer for FEED exists
already a warning message is printed unless
DO-NOT-COMPLAIN-IF-RUNNING is not nil.  Otherwise a timer calling
`newsticker-get-news' is started.  If the retrieval is repeated,
the name/timer pair is added to
`newsticker--retrieval-timer-list'."
  (let* ((feed-name (car feed))
         (start-time (nth 2 feed))
         (interval (or (nth 3 feed)
                       newsticker-retrieval-interval))
         (existing (assoc feed-name newsticker--retrieval-timer-list)))
    (cond
     (existing
      (or do-not-complain-if-running
          (message "Timer for %s is running already!"
                   feed-name)))
     (t
      (newsticker--debug-msg "Starting timer for %s: %s, %d"
                             feed-name start-time interval)
      ;; do not repeat retrieval if interval not positive
      (when (<= interval 0)
        (setq interval nil))
      ;; Suddenly XEmacs doesn't like start-time 0
      (when (or (null start-time)
                (and (numberp start-time) (= start-time 0)))
        (setq start-time 1))
      (let ((new-timer (run-at-time start-time interval
                                    'newsticker-get-news feed-name)))
        ;; Only repeating timers are recorded.
        (when interval
          (add-to-list 'newsticker--retrieval-timer-list
                       (cons feed-name new-timer))))))))
624
;;;###autoload
(defun newsticker-start (&optional do-not-complain-if-running)
  "Start the newsticker.
Start the timers for display and retrieval.  If the newsticker, i.e. the
timers, are running already a warning message is printed unless
DO-NOT-COMPLAIN-IF-RUNNING is not nil.
Run `newsticker-start-hook' if newsticker was not running already."
  (interactive)
  (let ((running (newsticker-running-p)))
    ;; read old cache if it exists and newsticker is not running
    (unless running
      (newsticker--cache-read))
    ;; Start retrieval timers -- one timer for each feed.  The flag has
    ;; to be handed on, as the warning about running timers is printed
    ;; by `newsticker--start-feed'.
    (dolist (feed (append newsticker-url-list-defaults newsticker-url-list))
      (newsticker--start-feed feed do-not-complain-if-running))
    (unless running
      (run-hooks 'newsticker-start-hook)
      (message "Newsticker started!"))))
643
(defun newsticker--stop-feed (feed-name)
  "Stop retrieval for feed FEED-NAME.
Cancel the timer which is registered for FEED-NAME and delete the
name/timer pair from `newsticker--retrieval-timer-list'.  Do
nothing if there is no timer for FEED-NAME."
  (let ((entry (assoc feed-name newsticker--retrieval-timer-list)))
    (if entry
        (progn
          (cancel-timer (cdr entry))
          (setq newsticker--retrieval-timer-list
                (delete entry newsticker--retrieval-timer-list))))))
652
(defun newsticker-stop ()
  "Stop the newsticker and the newsticker-ticker.
Save the cache and cancel the timers for display and retrieval.
Run `newsticker-stop-hook' if newsticker has been running."
  (interactive)
  (newsticker--cache-save)
  (when (fboundp 'newsticker-stop-ticker) ; silence compiler warnings
    (newsticker-stop-ticker))
  (when (newsticker-running-p)
    ;; `newsticker--stop-feed' destructively deletes entries from
    ;; `newsticker--retrieval-timer-list', so walk over a copy instead
    ;; of the list which is being modified.
    (dolist (name-and-timer (copy-sequence newsticker--retrieval-timer-list))
      (newsticker--stop-feed (car name-and-timer)))
    (setq newsticker--retrieval-timer-list nil)
    (run-hooks 'newsticker-stop-hook)
    (message "Newsticker stopped!")))
668
(defun newsticker-get-all-news ()
  "Launch retrieval of news from all configured newsticker sites.
The sites are the entries of `newsticker-url-list-defaults' and
`newsticker-url-list'.  This does NOT start the retrieval timers."
  (interactive)
  (let ((feeds (append newsticker-url-list-defaults newsticker-url-list)))
    ;; launch retrieval of news
    (dolist (feed feeds)
      (newsticker-get-news (car feed)))
    feeds))
677
(defun newsticker-save-item (feed item)
  "Save FEED ITEM.
Prompt for a file name, offering a default built from FEED and
the title of ITEM with spaces replaced by underscores, and write
the description of ITEM to that file."
  ;; NOTE(review): the bare `interactive' spec supplies no arguments
  ;; although FEED and ITEM are required -- confirm how this command
  ;; is meant to be invoked interactively.
  (interactive)
  (let* ((title (replace-regexp-in-string " " "_" (newsticker--title item)))
         (default-name (concat feed ":_" title ".html"))
         (filename (read-string "Filename: " default-name)))
    (with-temp-buffer
      (insert (newsticker--desc item))
      (write-file filename t))))
689
(defun newsticker-add-url (url name)
  "Add given URL under given NAME to `newsticker-url-list'.
Afterwards open `newsticker-url-list' for customization.

When called interactively, prompt for URL and NAME.  The default
offered for URL is an http address found near the end of the
current line, if there is one."
  (interactive
   (list
    (read-string
     "URL: "
     (save-excursion
       (end-of-line)
       (and
        ;; Look at most 100 characters back for the start of a URL ...
        (re-search-backward "http://"
                            (max (point-min) (- (point) 100))
                            t)
        ;; ... and at most 200 characters ahead for its end.
        (re-search-forward "http://[-a-zA-Z0-9&/_.]*"
                           (min (point-max) (+ (point) 200))
                           t)
        (buffer-substring-no-properties (match-beginning 0)
                                        (match-end 0)))))
    (read-string "Name: ")))
  (add-to-list 'newsticker-url-list (list name url nil nil nil) t)
  (customize-variable 'newsticker-url-list))
716
(defun newsticker-customize ()
  "Open the customization group `newsticker'."
  (interactive)
  (customize-group "newsticker"))
721
722 ;; ======================================================================
723 ;;; Local stuff
724 ;; ======================================================================
(defun newsticker--get-news-by-funcall (feed-name function)
  "Get news for the site FEED-NAME by calling FUNCTION.
FUNCTION is called with FEED-NAME as its only argument.  The
string which it returns is inserted into the buffer
\" *newsticker-funcall-FEED-NAME*\", which is then handed to
`newsticker--sentinel-work'.
See `newsticker-get-news'."
  (with-current-buffer (get-buffer-create
                        (concat " *newsticker-funcall-" feed-name "*"))
    (erase-buffer)
    (insert (string-to-multibyte (funcall function feed-name)))
    (newsticker--sentinel-work nil t feed-name function
                               (current-buffer))))
734
(defun newsticker--get-news-by-url (feed-name url)
  "Get news for the site FEED-NAME from address URL using `url-retrieve'.
The retrieval is asynchronous, the result is processed by
`newsticker--get-news-by-url-callback'.  An error which is
signaled while starting the retrieval is reported as a message.
See `newsticker-get-news'."
  (condition-case err
      (let ((coding-system-for-read 'no-conversion))
        (url-retrieve url 'newsticker--get-news-by-url-callback
                      (list feed-name)))
    (error (message "Error retrieving news from %s: %s" feed-name
                    err)))
  (force-mode-line-update))
745
(defun newsticker--get-news-by-url-callback (status feed-name)
  "Callback function for `newsticker--get-news-by-url'.
STATUS is the return status as delivered by `url-retrieve', a
property list which may contain `:redirect' and `:error' entries.
FEED-NAME is the name of the feed that the news were retrieved
from.

The retrieved text is copied from the current buffer into the
buffer \" *newsticker-url-FEED-NAME*\", the header is removed and
the rest is handed to `newsticker--sentinel-work'.  If STATUS
contains an error, the retrieval is reported as failed and a
message is shown."
  (let ((buf (get-buffer-create (concat " *newsticker-url-" feed-name "*")))
        (result (string-to-multibyte (buffer-string)))
        ;; STATUS is a plist, so the error entry is not necessarily
        ;; its first element, e.g. after a redirect.
        (error-info (plist-get status :error)))
    (set-buffer buf)
    (erase-buffer)
    (insert result)
    ;; Remove MIME header.  Do not signal an error if the response
    ;; contains no header separator; nothing is removed in that case.
    (goto-char (point-min))
    (search-forward "\n\n" nil t)
    (delete-region (point-min) (point))
    ;; read the rss/atom contents
    (newsticker--sentinel-work nil (not error-info) feed-name
                               "url-retrieve" (current-buffer))
    ;; Redirects are of no interest, only errors are reported.
    (when error-info
      (message "%s: Error while retrieving news from %s: %s: \"%s\""
               (format-time-string "%A, %H:%M" (current-time))
               feed-name
               (car error-info) (cdr error-info)))))
773
(defun newsticker--get-news-by-wget (feed-name url wget-arguments)
  "Get news for the site FEED-NAME from address URL using wget.
WGET-ARGUMENTS is a list of arguments for wget.
The program `newsticker-wget-name' is started as a process named
FEED-NAME which writes to the buffer \" *newsticker-wget-FEED-NAME*\"
and has `newsticker--sentinel' as its sentinel.  An error is
signaled if a process named FEED-NAME exists already.
See `newsticker-get-news'."
  (let ((buffername (concat " *newsticker-wget-" feed-name "*")))
    (with-current-buffer (get-buffer-create buffername)
      (erase-buffer)
      ;; throw an error if there is an old wget-process around
      (when (get-process feed-name)
        (error "Another wget-process is running for %s" feed-name))
      ;; start wget
      (let ((proc (apply 'start-process feed-name buffername
                         newsticker-wget-name
                         (append wget-arguments (list url)))))
        (set-process-coding-system proc 'no-conversion 'no-conversion)
        (set-process-sentinel proc 'newsticker--sentinel)
        (setq newsticker--process-ids
              (cons (process-id proc) newsticker--process-ids))
        (force-mode-line-update)))))
793
(defun newsticker-get-news (feed-name)
  "Get news from the site FEED-NAME and load feed logo.
FEED-NAME must be a string which occurs as the label (i.e. the first element)
in an element of `newsticker-url-list' or `newsticker-url-list-defaults'.
An error is signaled if it occurs in neither of them.

If the URL of the feed is a function, that function delivers the
news.  Otherwise the news are retrieved as selected by
`newsticker-retrieval-method'."
  (newsticker--debug-msg "%s: Getting news for %s"
                         (format-time-string "%A, %H:%M" (current-time))
                         feed-name)
  (let* ((feed-spec (or (assoc feed-name newsticker-url-list)
                        (assoc feed-name newsticker-url-list-defaults)
                        (error
                         "Cannot get news for %s: Check newsticker-url-list"
                         feed-name)))
         (url (nth 1 feed-spec))
         ;; Feed specific wget arguments take precedence over the
         ;; global ones.
         (wget-arguments (or (nth 4 feed-spec)
                             newsticker-wget-arguments)))
    (cond ((functionp url)
           (newsticker--get-news-by-funcall feed-name url))
          ((eq newsticker-retrieval-method 'intern)
           (newsticker--get-news-by-url feed-name url))
          (t
           (newsticker--get-news-by-wget feed-name url wget-arguments)))))
814
815 ;; ======================================================================
816 ;; Parsing
817 ;; ======================================================================
818
(defun newsticker--sentinel (process event)
  "Sentinel for extracting news titles from an RDF buffer.
Argument PROCESS is the process which has just changed its state.
Argument EVENT tells what has happened to the process.
The work is done by `newsticker--sentinel-work'.  The retrieval
counts as successful if PROCESS has exited with exit status 0."
  (let ((succeeded (and (eq (process-status process) 'exit)
                        (= (process-exit-status process) 0))))
    (newsticker--sentinel-work event
                               succeeded
                               (process-name process)
                               (process-command process)
                               (process-buffer process))))
832
(defun newsticker--sentinel-work (event status-ok name command buffer)
  "Actually do the sentinel work.
Argument EVENT tells what has happened to the retrieval process.
Argument STATUS-OK is the final status of the retrieval process,
non-nil meaning retrieval was successful.
Argument NAME is the name of the retrieval process.
Argument COMMAND is the command of the retrieval process.
Argument BUFFER is the buffer of the retrieval process.

If STATUS-OK is nil an error headline is added to
`newsticker--cache' and nothing else is done with the feed.
Otherwise the contents of BUFFER are cleaned up, decoded, and
parsed as XML, the parser matching the feed type is called, items
which have vanished from the feed are removed from the cache or
kept as obsolete, and the feed is saved if something was added.
Finally `newsticker--sentinel-callback' is called, if non-nil."
  (let ((time (current-time))
        (name-symbol (intern name))
        (something-was-added nil))
    ;; Catch known errors (zombie processes, rubbish XML etc.).
    ;; If an error occurs the news feed is not updated!
    (catch 'oops
      (unless status-ok
        (setq newsticker--cache
              (newsticker--cache-add
               newsticker--cache
               name-symbol
               newsticker--error-headline
               (format
                (concat "%s: Newsticker could not retrieve news from %s.\n"
                        "Return status: `%s'\n"
                        "Command was `%s'")
                (format-time-string "%A, %H:%M" (current-time))
                name event command)
               ""
               (current-time)
               'new
               0 nil))
        (message "%s: Error while retrieving news from %s"
                 (format-time-string "%A, %H:%M" (current-time))
                 name)
        (throw 'oops nil))
      (let* ((coding-system 'utf-8)
             (node-list
              (save-current-buffer
                (set-buffer buffer)
                ;; A very dirty workaround to overcome the problems
                ;; with xml.el as of 20030621: remove all unnecessary
                ;; whitespace between tags.
                (goto-char (point-min))
                (while (re-search-forward ">[ \t\r\n]+<" nil t)
                  (replace-match "><" nil t))
                ;; Another workaround (20031105): the xml parser does
                ;; not like the colon in the doctype name "rdf:RDF".
                (goto-char (point-min))
                (if (re-search-forward "<!DOCTYPE[ \t\n]+rdf:RDF" nil t)
                    (replace-match "<!DOCTYPE rdfColonRDF" nil t))
                ;; Normalize CRLF line endings.
                (goto-char (point-min))
                (while (search-forward "\r\n" nil t)
                  (replace-match "\n" nil t))
                ;; Another workaround (20040309): the xml parser does
                ;; not like doctype rss.
                (goto-char (point-min))
                (if (re-search-forward "<!DOCTYPE[ \t\n]+rss[ \t\n]*>" nil t)
                    (replace-match "" nil t))
                ;; Another one (20050618, fixed in GNU Emacs
                ;; 22.0.50.18): remove comments to avoid the
                ;; xml-parsing bug "XML files can have only one
                ;; toplevel tag".
                (goto-char (point-min))
                (while (search-forward "<!--" nil t)
                  (let ((start (match-beginning 0)))
                    (unless (search-forward "-->" nil t)
                      (error "Can't find end of comment"))
                    (delete-region start (point))))
                ;; Another one (20050702): if the description is HTML
                ;; encoded and starts with `<img', wrap the whole
                ;; description in a CDATA expression.  This happened for
                ;; http://www.thefreedictionary.com/_/WoD/rss.aspx?type=quote
                (goto-char (point-min))
                (while (re-search-forward
                        "<description>\\(<img.*?\\)</description>" nil t)
                  (replace-match
                   "<description><![CDATA[ \\1 ]]></description>"))
                ;; Another one (20051123): the xml parser does not
                ;; like empty attributes as in
                ;; <yweather:location city="Frankfurt/Main"
                ;; region="" country="GM" />, so "fix" them.
                ;; This happened for
                ;; http://xml.weather.yahoo.com/forecastrss?p=GMXX0040&u=f
                (goto-char (point-min))
                (while (re-search-forward "\\(<[^>]*\\)=\"\"" nil t)
                  (replace-match "\\1=\" \""))
                ;;
                (set-buffer-modified-p nil)
                ;; Determine the coding system: use the declared
                ;; encoding if there is one, utf-8 otherwise.
                (goto-char (point-min))
                (when (re-search-forward "encoding=\"\\([^\"]+\\)\""
                                         nil t)
                  (setq coding-system (intern (downcase (match-string 1)))))
                ;; Validate the coding system in every case.  A feed
                ;; may declare an encoding Emacs does not know, and
                ;; decoding with it would signal an error.
                (setq coding-system
                      (condition-case nil
                          (check-coding-system coding-system)
                        (coding-system-error
                         (message
                          "newsticker.el: ignoring coding system %s for %s"
                          coding-system name)
                         nil)))
                ;; Decode if possible
                (when coding-system
                  (decode-coding-region (point-min) (point-max)
                                        coding-system))
                (condition-case errordata
                    ;; The xml parser might fail
                    ;; or the xml might be bugged
                    (xml-parse-region (point-min) (point-max))
                  (error (message "Could not parse %s: %s"
                                  (buffer-name) (cadr errordata))
                         (throw 'oops nil)))))
             (topnode (car node-list))
             (imageurl nil))
        ;; mark all items as obsolete
        (newsticker--cache-replace-age newsticker--cache
                                       name-symbol
                                       'new 'obsolete-new)
        (newsticker--cache-replace-age newsticker--cache
                                       name-symbol
                                       'old 'obsolete-old)
        (newsticker--cache-replace-age newsticker--cache
                                       name-symbol
                                       'feed 'obsolete-old)

        ;; check Atom/RSS version and call corresponding parser
        (condition-case error-data
            (if (cond
                 ;; RSS 0.91
                 ((and (eq 'rss (xml-node-name topnode))
                       (string= "0.91" (xml-get-attribute topnode 'version)))
                  (setq imageurl (newsticker--get-logo-url-rss-0.91 topnode))
                  (newsticker--parse-rss-0.91 name time topnode))
                 ;; RSS 0.92
                 ((and (eq 'rss (xml-node-name topnode))
                       (string= "0.92" (xml-get-attribute topnode 'version)))
                  (setq imageurl (newsticker--get-logo-url-rss-0.92 topnode))
                  (newsticker--parse-rss-0.92 name time topnode))
                 ;; RSS 1.0
                 ((eq 'rdf:RDF (xml-node-name topnode))
                  (setq imageurl (newsticker--get-logo-url-rss-1.0 topnode))
                  (newsticker--parse-rss-1.0 name time topnode))
                 ;; RSS 2.0
                 ((and (eq 'rss (xml-node-name topnode))
                       (string= "2.0" (xml-get-attribute topnode 'version)))
                  (setq imageurl (newsticker--get-logo-url-rss-2.0 topnode))
                  (newsticker--parse-rss-2.0 name time topnode))
                 ;; Atom 0.3
                 ((and (eq 'feed (xml-node-name topnode))
                       (string= "http://purl.org/atom/ns#"
                                (xml-get-attribute topnode 'xmlns)))
                  (setq imageurl (newsticker--get-logo-url-atom-0.3 topnode))
                  (newsticker--parse-atom-0.3 name time topnode))
                 ;; Atom 1.0
                 ((and (eq 'feed (xml-node-name topnode))
                       (string= "http://www.w3.org/2005/Atom"
                                (xml-get-attribute topnode 'xmlns)))
                  (setq imageurl (newsticker--get-logo-url-atom-1.0 topnode))
                  (newsticker--parse-atom-1.0 name time topnode))
                 ;; unknown feed type
                 (t
                  (newsticker--debug-msg "Feed type unknown: %s: %s"
                                         (xml-node-name topnode) name)
                  nil))
                (setq something-was-added t))
          (error (message "sentinelerror in %s: %s" name error-data)))

        ;; Remove those old items from cache which have been removed from
        ;; the feed
        (newsticker--cache-replace-age newsticker--cache
                                       name-symbol 'obsolete-old 'deleteme)
        (newsticker--cache-remove newsticker--cache name-symbol
                                  'deleteme)
        ;; Remove those new items from cache which have been removed from
        ;; the feed.  Or keep them as `obsolete'
        (if (not newsticker-keep-obsolete-items)
            (newsticker--cache-remove newsticker--cache
                                      name-symbol 'obsolete-new)
          (setq newsticker--cache
                (newsticker--cache-mark-expired
                 newsticker--cache name-symbol 'obsolete 'obsolete-expired
                 newsticker-obsolete-item-max-age))
          (newsticker--cache-remove newsticker--cache
                                    name-symbol 'obsolete-expired)
          (newsticker--cache-replace-age newsticker--cache
                                         name-symbol 'obsolete-new
                                         'obsolete))
        (newsticker--update-process-ids)
        ;; setup scrollable text
        (when (= 0 (length newsticker--process-ids))
          ;; The `fboundp' test silences compiler warnings.
          (when (fboundp 'newsticker--ticker-text-setup)
            (newsticker--ticker-text-setup)))
        (setq newsticker--latest-update-time (current-time))
        (when something-was-added
          ;; FIXME: should we care about removed items as well?
          (newsticker--cache-save-feed
           (newsticker--cache-get-feed name-symbol))
          ;; The `fboundp' test silences compiler warnings.
          (when (fboundp 'newsticker--buffer-set-uptodate)
            (newsticker--buffer-set-uptodate nil)))
        ;; kill the process buffer if wanted
        (unless newsticker-debug
          (kill-buffer buffer))
        ;; launch retrieval of image
        (when (and imageurl newsticker--download-logos)
          (newsticker--image-get name imageurl)))))
  (when newsticker--sentinel-callback
    (funcall newsticker--sentinel-callback)))
1045
(defun newsticker--get-logo-url-atom-1.0 (node)
  "Return logo URL from atom 1.0 data in NODE.
This is the first child of the first `logo' element of NODE, or
nil if there is none."
  (let ((logo (car (xml-get-children node 'logo))))
    (car (xml-node-children logo))))
1050
(defun newsticker--get-logo-url-atom-0.3 (node)
  "Return logo URL from atom 0.3 data in NODE.
The URL is taken from the `url' element inside the first `image'
element of NODE.  Return nil if there is no such element."
  (let* ((image (car (xml-get-children node 'image)))
         (url (car (xml-get-children image 'url))))
    (car (xml-node-children url))))
1055
(defun newsticker--get-logo-url-rss-2.0 (node)
  "Return logo URL from RSS 2.0 data in NODE.
The URL is taken from the `url' element of the first `image'
element inside the first `channel' element of NODE.  Return nil
if there is no such element."
  (let* ((channel (car (xml-get-children node 'channel)))
         (image (car (xml-get-children channel 'image)))
         (url (car (xml-get-children image 'url))))
    (car (xml-node-children url))))
1062
(defun newsticker--get-logo-url-rss-1.0 (node)
  "Return logo URL from RSS 1.0 data in NODE.
The URL is taken from the `url' element inside the first `image'
element of NODE.  Return nil if there is no such element."
  (let* ((image (car (xml-get-children node 'image)))
         (url (car (xml-get-children image 'url))))
    (car (xml-node-children url))))
1067
(defun newsticker--get-logo-url-rss-0.92 (node)
  "Return logo URL from RSS 0.92 data in NODE.
NODE is the top-level `rss' node.  In RSS 0.92 the `image'
element is a child of `channel', so it is looked up there first.
An `image' element directly below NODE is still accepted as a
fallback.  Return nil if no logo URL is found."
  (let* ((channel (car (xml-get-children node 'channel)))
         (image (or (car (xml-get-children channel 'image))
                    (car (xml-get-children node 'image)))))
    (car (xml-node-children
          (car (xml-get-children image 'url))))))
1072
(defun newsticker--get-logo-url-rss-0.91 (node)
  "Return logo URL from RSS 0.91 data in NODE.
NODE is the top-level `rss' node.  In RSS 0.91 the `image'
element is a child of `channel', so it is looked up there first.
An `image' element directly below NODE is still accepted as a
fallback.  Return nil if no logo URL is found."
  (let* ((channel (car (xml-get-children node 'channel)))
         (image (or (car (xml-get-children channel 'image))
                    (car (xml-get-children node 'image)))))
    (car (xml-node-children
          (car (xml-get-children image 'url))))))
1077
(defun newsticker--parse-atom-0.3 (name time topnode)
  "Parse Atom 0.3 data.
Argument NAME gives the name of a news feed.  TIME gives the
system time at which the data have been retrieved.  TOPNODE
contains the feed data as returned by the xml parser.

Return non-nil if the feed itself or at least one of its entries
was not yet contained in the cache."
  (newsticker--debug-msg "Parsing Atom 0.3 feed %s" name)
  (let (new-feed new-item)
    (setq new-feed (newsticker--parse-generic-feed
                    name time
                    ;; title
                    (car (xml-node-children
                          (car (xml-get-children topnode 'title))))
                    ;; desc
                    (car (xml-node-children
                          (car (xml-get-children topnode 'content))))
                    ;; link
                    (xml-get-attribute
                     (car (xml-get-children topnode 'link)) 'href)
                    ;; extra-elements
                    (xml-node-children topnode)))
    (setq new-item (newsticker--parse-generic-items
                    name time (xml-get-children topnode 'entry)
                    ;; title-fn
                    (lambda (node)
                      (car (xml-node-children
                            (car (xml-get-children node 'title)))))
                    ;; desc-fn
                    (lambda (node)
                      (or (car (xml-node-children
                                (car (xml-get-children node 'content))))
                          (car (xml-node-children
                                (car (xml-get-children node 'summary))))))
                    ;; link-fn
                    (lambda (node)
                      (xml-get-attribute
                       (car (xml-get-children node 'link)) 'href))
                    ;; time-fn
                    (lambda (node)
                      ;; Atom 0.3 dates are W3C/ISO 8601 date-times,
                      ;; so try that format first.  The RFC 822
                      ;; decoder is kept as a fallback for feeds
                      ;; which do not follow the specification.
                      (let ((stamp (car (xml-node-children
                                         (car (xml-get-children
                                               node 'modified))))))
                        (or (and (stringp stamp)
                                 (newsticker--decode-iso8601-date stamp))
                            (newsticker--decode-rfc822-date stamp))))
                    ;; guid-fn
                    (lambda (node)
                      (newsticker--guid-to-string
                       (assoc 'guid (xml-node-children node))))
                    ;; extra-fn
                    (lambda (node)
                      (xml-node-children node))))
    (or new-item new-feed)))
1126
(defun newsticker--parse-atom-1.0 (name time topnode)
  "Parse Atom 1.0 data.
Argument NAME gives the name of a news feed.  TIME gives the
system time at which the data have been retrieved.  TOPNODE
contains the feed data as returned by the xml parser.

Return non-nil if the feed itself or at least one of its entries
was not yet contained in the cache.

For the Atom 1.0 specification see
URL `http://www.atompub.org/2005/08/17/draft-ietf-atompub-format-11.html'"
  (newsticker--debug-msg "Parsing Atom 1.0 feed %s" name)
  (let (new-feed new-item)
    (setq new-feed (newsticker--parse-generic-feed
                    name time
                    ;; title
                    (car (xml-node-children
                          (car (xml-get-children topnode 'title))))
                    ;; desc
                    (car (xml-node-children
                          (car (xml-get-children topnode 'subtitle))))
                    ;; link -- this must be the href string itself;
                    ;; `newsticker--parse-generic-feed' expects a
                    ;; value here, not an extractor function.
                    (xml-get-attribute
                     (car (xml-get-children topnode 'link)) 'href)
                    ;; extra-elements
                    (xml-node-children topnode)))
    (setq new-item (newsticker--parse-generic-items
                    name time (xml-get-children topnode 'entry)
                    ;; title-fn
                    (lambda (node)
                      (car (xml-node-children
                            (car (xml-get-children node 'title)))))
                    ;; desc-fn
                    (lambda (node)
                      (or (car (xml-node-children
                                (car (xml-get-children node 'content))))
                          (car (xml-node-children
                                (car (xml-get-children node 'summary))))))
                    ;; link-fn
                    (lambda (node)
                      (xml-get-attribute
                       (car (xml-get-children node 'link)) 'href))
                    ;; time-fn
                    (lambda (node)
                      (newsticker--decode-iso8601-date
                       (or (car (xml-node-children
                                 (car (xml-get-children node 'updated))))
                           (car (xml-node-children
                                 (car (xml-get-children node 'published)))))))
                    ;; guid-fn
                    (lambda (node)
                      (car (xml-node-children
                            (car (xml-get-children node 'id)))))
                    ;; extra-fn
                    (lambda (node)
                      (xml-node-children node))))
    (or new-item new-feed)))
1182
(defun newsticker--parse-rss-0.91 (name time topnode)
  "Parse RSS 0.91 data.
Argument NAME gives the name of a news feed.  TIME gives the
system time at which the data have been retrieved.  TOPNODE
contains the feed data as returned by the xml parser.

Return non-nil if the feed itself or at least one of its items
was not yet contained in the cache.

For the RSS 0.91 specification see URL `http://backend.userland.com/rss091'
or URL `http://my.netscape.com/publish/formats/rss-spec-0.91.html'."
  (newsticker--debug-msg "Parsing RSS 0.91 feed %s" name)
  (let* ((channelnode (car (xml-get-children topnode 'channel)))
         is-new-feed has-new-items)
    (setq is-new-feed (newsticker--parse-generic-feed
                       name time
                       ;; title
                       (car (xml-node-children
                             (car (xml-get-children channelnode 'title))))
                       ;; desc
                       (car (xml-node-children
                             (car (xml-get-children channelnode
                                                    'description))))
                       ;; link
                       (car (xml-node-children
                             (car (xml-get-children channelnode 'link))))
                       ;; extra-elements
                       (xml-node-children channelnode)))
    (setq has-new-items (newsticker--parse-generic-items
                         name time (xml-get-children channelnode 'item)
                         ;; title-fn
                         (lambda (node)
                           (car (xml-node-children
                                 (car (xml-get-children node 'title)))))
                         ;; desc-fn
                         (lambda (node)
                           (car (xml-node-children
                                 (car (xml-get-children node 'description)))))
                         ;; link-fn
                         (lambda (node)
                           (car (xml-node-children
                                 (car (xml-get-children node 'link)))))
                         ;; time-fn
                         (lambda (node)
                           (newsticker--decode-rfc822-date
                            (car (xml-node-children
                                  (car (xml-get-children node 'pubDate))))))
                         ;; guid-fn -- no guid is extracted for this
                         ;; feed type
                         'ignore
                         ;; extra-fn
                         (lambda (node)
                           (xml-node-children node))))
    (or has-new-items is-new-feed)))
1236
(defun newsticker--parse-rss-0.92 (name time topnode)
  "Parse RSS 0.92 data.
Argument NAME gives the name of a news feed.  TIME gives the
system time at which the data have been retrieved.  TOPNODE
contains the feed data as returned by the xml parser.

Return non-nil if the feed itself or at least one of its items
was not yet contained in the cache.

For the RSS 0.92 specification see URL `http://backend.userland.com/rss092'."
  (newsticker--debug-msg "Parsing RSS 0.92 feed %s" name)
  (let* ((channelnode (car (xml-get-children topnode 'channel)))
         is-new-feed has-new-items)
    (setq is-new-feed (newsticker--parse-generic-feed
                       name time
                       ;; title
                       (car (xml-node-children
                             (car (xml-get-children channelnode 'title))))
                       ;; desc
                       (car (xml-node-children
                             (car (xml-get-children channelnode
                                                    'description))))
                       ;; link
                       (car (xml-node-children
                             (car (xml-get-children channelnode 'link))))
                       ;; extra-elements
                       (xml-node-children channelnode)))
    (setq has-new-items (newsticker--parse-generic-items
                         name time (xml-get-children channelnode 'item)
                         ;; title-fn
                         (lambda (node)
                           (car (xml-node-children
                                 (car (xml-get-children node 'title)))))
                         ;; desc-fn
                         (lambda (node)
                           (car (xml-node-children
                                 (car (xml-get-children node 'description)))))
                         ;; link-fn
                         (lambda (node)
                           (car (xml-node-children
                                 (car (xml-get-children node 'link)))))
                         ;; time-fn
                         (lambda (node)
                           (newsticker--decode-rfc822-date
                            (car (xml-node-children
                                  (car (xml-get-children node 'pubDate))))))
                         ;; guid-fn -- no guid is extracted for this
                         ;; feed type
                         'ignore
                         ;; extra-fn
                         (lambda (node)
                           (xml-node-children node))))
    (or has-new-items is-new-feed)))
1289
(defun newsticker--parse-rss-1.0 (name time topnode)
  "Parse RSS 1.0 data.
Argument NAME gives the name of a news feed.  TIME gives the
system time at which the data have been retrieved.  TOPNODE
contains the feed data as returned by the xml parser.

The feed's title, description, and link are read from the first
`channel' element, the items are the `item' children of TOPNODE.
Return non-nil if the feed itself or at least one of its items
was not yet contained in the cache.

For the RSS 1.0 specification see URL `http://web.resource.org/rss/1.0/spec'."
  (newsticker--debug-msg "Parsing RSS 1.0 feed %s" name)
  (let* ((channelnode (car (xml-get-children topnode 'channel)))
         ;; The feed itself is handled before its items.
         (feed-is-new
          (newsticker--parse-generic-feed
           name time
           ;; title
           (car (xml-node-children
                 (car (xml-get-children channelnode 'title))))
           ;; desc
           (car (xml-node-children
                 (car (xml-get-children channelnode 'description))))
           ;; link
           (car (xml-node-children
                 (car (xml-get-children channelnode 'link))))
           ;; extra-elements
           (xml-node-children channelnode)))
         (items-are-new
          (newsticker--parse-generic-items
           name time (xml-get-children topnode 'item)
           ;; title-fn
           (lambda (node)
             (car (xml-node-children
                   (car (xml-get-children node 'title)))))
           ;; desc-fn
           (lambda (node)
             (car (xml-node-children
                   (car (xml-get-children node 'description)))))
           ;; link-fn
           (lambda (node)
             (car (xml-node-children
                   (car (xml-get-children node 'link)))))
           ;; time-fn
           (lambda (node)
             (newsticker--decode-iso8601-date
              (car (xml-node-children
                    (car (xml-get-children node 'dc:date))))))
           ;; guid-fn -- always yields nil
           'ignore
           ;; extra-fn
           (lambda (node)
             (xml-node-children node)))))
    (or items-are-new feed-is-new)))
1340
(defun newsticker--parse-rss-2.0 (name time topnode)
  "Parse RSS 2.0 data.
Argument NAME gives the name of a news feed.  TIME gives the
system time at which the data have been retrieved.  TOPNODE
contains the feed data as returned by the xml parser.

Feed data and items are read from the first `channel' element of
TOPNODE.  For the description of an item `content:encoded' is
preferred over `description'.  Return non-nil if the feed itself
or at least one of its items was not yet contained in the cache.

For the RSS 2.0 specification see URL `http://blogs.law.harvard.edu/tech/rss'."
  (newsticker--debug-msg "Parsing RSS 2.0 feed %s" name)
  (let* ((channelnode (car (xml-get-children topnode 'channel)))
         ;; The feed itself is handled before its items.
         (feed-is-new
          (newsticker--parse-generic-feed
           name time
           ;; title
           (car (xml-node-children
                 (car (xml-get-children channelnode 'title))))
           ;; desc
           (car (xml-node-children
                 (car (xml-get-children channelnode 'description))))
           ;; link
           (car (xml-node-children
                 (car (xml-get-children channelnode 'link))))
           ;; extra-elements
           (xml-node-children channelnode)))
         (items-are-new
          (newsticker--parse-generic-items
           name time (xml-get-children channelnode 'item)
           ;; title-fn
           (lambda (node)
             (car (xml-node-children
                   (car (xml-get-children node 'title)))))
           ;; desc-fn
           (lambda (node)
             (or (car (xml-node-children
                       (car (xml-get-children node 'content:encoded))))
                 (car (xml-node-children
                       (car (xml-get-children node 'description))))))
           ;; link-fn
           (lambda (node)
             (car (xml-node-children
                   (car (xml-get-children node 'link)))))
           ;; time-fn
           (lambda (node)
             (newsticker--decode-rfc822-date
              (car (xml-node-children
                    (car (xml-get-children node 'pubDate))))))
           ;; guid-fn
           (lambda (node)
             (newsticker--guid-to-string
              (assoc 'guid (xml-node-children node))))
           ;; extra-fn
           (lambda (node)
             (xml-node-children node)))))
    (or items-are-new feed-is-new)))
1395
(defun newsticker--parse-generic-feed (name time title desc link
                                            extra-elements)
  "Parse generic news feed data.
Argument NAME gives the name of a news feed.  TIME gives the
system time at which the data have been retrieved.

The arguments TITLE, DESC, LINK, and EXTRA-ELEMENTS give the feed's title,
description, link, and extra elements resp.  A missing TITLE is
replaced by \"[untitled]\", a missing LINK by the empty string.

The feed is added to `newsticker--cache' with age `feed'.  Return
t if the cache did not contain the feed before, nil otherwise."
  (let* ((feed-symbol (intern name))
         ;; Decode numeric entities and strip whitespace.
         (clean-title (newsticker--remove-whitespace
                       (newsticker--decode-numeric-entities
                        (or title "[untitled]"))))
         (clean-desc (newsticker--remove-whitespace
                      (newsticker--decode-numeric-entities desc)))
         (clean-link (newsticker--remove-whitespace
                      (newsticker--decode-numeric-entities
                       (or link ""))))
         ;; This check must happen before the feed is added below.
         (feed-is-new (not (newsticker--cache-contains
                            newsticker--cache feed-symbol clean-title
                            clean-desc clean-link 'feed))))
    (setq newsticker--cache
          (newsticker--cache-add newsticker--cache feed-symbol
                                 clean-title clean-desc clean-link
                                 time 'feed 0
                                 extra-elements time 'feed))
    feed-is-new))
1428
(defun newsticker--parse-generic-items (name time itemlist
                                             title-fn desc-fn
                                             link-fn time-fn
                                             guid-fn extra-fn)
  "Parse generic news feed data.
Argument NAME gives the name of a news feed.  TIME gives the
system time at which the data have been retrieved.  ITEMLIST
contains the news items returned by the xml parser.

The arguments TITLE-FN, DESC-FN, LINK-FN, TIME-FN, GUID-FN, and
EXTRA-FN give functions for extracting title, description, link,
time, guid, and extra-elements resp.  They are called with one
argument, which is one of the items in ITEMLIST.

Each item gets the time returned by TIME-FN, or TIME if TIME-FN
returns nil.  An item which is already in the cache keeps the
time stored in the cache.  Items with empty title and empty
description are ignored.  For every item which was not in the
cache before, the auto-mark filter is run if
`newsticker-auto-mark-filter-list' is non-nil, and
`newsticker-new-item-functions' is run.

Return t if at least one item was not yet in the cache."
  (let ((feed-symbol (intern name))
        (position 0)
        (something-was-added nil))
    ;; gather all items for this feed
    (dolist (node itemlist)
      (setq position (1+ position))
      (let ((title (or (funcall title-fn node) "[untitled]"))
            (desc (funcall desc-fn node))
            (link (or (funcall link-fn node) ""))
            ;; The time is kept per item.  It must not overwrite
            ;; TIME, otherwise the date of one item would leak into
            ;; all following items which carry no date themselves.
            (item-time (or (funcall time-fn node) time))
            (old-item nil))
        ;; It happened that the title or description contained evil
        ;; HTML code that confused the xml parser.  Therefore:
        (unless (stringp title)
          (setq title (prin1-to-string title)))
        (unless (or (stringp desc) (not desc))
          (setq desc (prin1-to-string desc)))
        ;; ignore items with empty title AND empty desc
        (when (or (> (length title) 0)
                  (> (length desc) 0))
          ;; decode numeric entities
          (setq title (newsticker--decode-numeric-entities title))
          (when desc
            (setq desc (newsticker--decode-numeric-entities desc)))
          (setq link (newsticker--decode-numeric-entities link))
          ;; remove whitespace from title, desc, and link
          (setq title (newsticker--remove-whitespace title))
          (setq desc (newsticker--remove-whitespace desc))
          (setq link (newsticker--remove-whitespace link))
          ;; do we have this item already?
          (setq old-item
                (newsticker--cache-contains newsticker--cache
                                            feed-symbol title
                                            desc link nil
                                            (funcall guid-fn node)))
          ;; add this item, or mark it as old, or do nothing
          (let ((age1 'new)
                (age2 'old)
                (item-new-p nil))
            (if old-item
                (let ((prev-age (newsticker--age old-item)))
                  (unless newsticker-automatically-mark-items-as-old
                    ;; Some feeds deliver items multiply, the first
                    ;; time we find an 'obsolete-old one in the
                    ;; cache, the following times we find an 'old
                    ;; one
                    (if (memq prev-age '(obsolete-old old))
                        (setq age2 'old)
                      (setq age2 'new)))
                  (if (eq prev-age 'immortal)
                      (setq age2 'immortal))
                  (setq item-time (newsticker--time old-item)))
              ;; item was not there
              (setq item-new-p t)
              (setq something-was-added t))
            (setq newsticker--cache
                  (newsticker--cache-add
                   newsticker--cache feed-symbol title desc link
                   item-time age1 position (funcall extra-fn node)
                   item-time age2))
            (when item-new-p
              (let ((item (newsticker--cache-contains
                           newsticker--cache feed-symbol title
                           desc link nil)))
                (if newsticker-auto-mark-filter-list
                    (newsticker--run-auto-mark-filter name item))
                (run-hook-with-args
                 'newsticker-new-item-functions name item)))))))
    something-was-added))
1515
1516 ;; ======================================================================
1517 ;;; Misc
1518 ;; ======================================================================
(defun newsticker--decode-numeric-entities (string)
  "Decode SGML numeric entities by their respective utf characters.
This function replaces numeric entities in the input STRING and
returns the modified string.  Both decimal and hexadecimal
entities are handled, for example \"&#42;\" and \"&#x2A;\" both get
replaced by \"*\".  Entities which do not denote a valid character
are left untouched.

Return nil if STRING is not a string."
  (when (stringp string)
    (let ((start 0))
      (while (string-match
              "&#\\(?:\\([0-9]+\\)\\|[xX]\\([0-9a-fA-F]+\\)\\);"
              string start)
        (let* ((beg (match-beginning 0))
               (decimal (match-string 1 string))
               (code (if decimal
                         (string-to-number decimal)
                       (string-to-number (match-string 2 string) 16))))
          (condition-case nil
              ;; The replacement is inserted literally and with
              ;; fixed case: the decoded character may be a
              ;; backslash, and its case must not be adapted to
              ;; that of the matched entity.
              (setq string (replace-match (string code) t t string))
            ;; CODE is not a valid character -- keep the entity.
            (error nil))
          ;; Continue right after the start of this entity.
          (setq start (1+ beg))))
      string)))
1537
(defun newsticker--remove-whitespace (string)
  "Remove leading and trailing whitespace from STRING.
Whitespace means spaces, tabs, carriage returns, and newlines.
Return nil if STRING is not a string."
  ;; The regexps must use `+' rather than `*', otherwise XEmacs loops
  ;; endlessly.
  (if (stringp string)
      (let ((without-leading
             (replace-regexp-in-string "^[ \t\r\n]+" "" string)))
        (replace-regexp-in-string "[ \t\r\n]+$" "" without-leading))
    nil))
1546
(defun newsticker--do-forget-preformatted (item)
  "Forget pre-formatted data for ITEM.
The elements at index 7 and index 6 of ITEM are set to nil by
side effect, provided ITEM is long enough to have them."
  (let ((cell (nthcdr 7 item)))
    (when cell
      (setcar cell nil)))
  (let ((cell (nthcdr 6 item)))
    (when cell
      (setcar cell nil))))
1554
(defun newsticker--forget-preformatted ()
  "Forget all cached pre-formatted data.
Call `newsticker--do-forget-preformatted' on every item of every
feed in `newsticker--cache'.  Afterwards mark the newsticker
buffer as not up-to-date, if the function for doing so is
defined."
  (dolist (feed newsticker--cache)
    ;; The car of FEED is skipped, the rest are its items.
    (dolist (item (cdr feed))
      (newsticker--do-forget-preformatted item)))
  (when (fboundp 'newsticker--buffer-set-uptodate)
    (newsticker--buffer-set-uptodate nil)))
1564
(defun newsticker--debug-msg (string &rest args)
  "Print newsticker debug messages.
If `newsticker-debug' is non-nil, call `message' with the format
STRING and the arguments ARGS and return its value.  Otherwise do
nothing and return nil."
  (when newsticker-debug
    (apply 'message string args)))
1573
(defun newsticker--decode-iso8601-date (iso8601-string)
  "Convert ISO8601-STRING to a time value as returned by `encode-time'.
A time zone offset in ISO8601-STRING is applied, so that the
result denotes the corresponding universal time.  The offset may
be written with or without colon (\"+01:00\" or \"+0100\").

Return nil if ISO8601-STRING is not a string or cannot be decoded.

Examples:
2004-09-17T05:09:49.001+00:00
2004-09-17T05:09:49+00:00
2004-09-17T05:09+00:00
2004-09-17T05:09:49
2004-09-17T05:09
2004-09-17
2004-09
2004"
  (when (and (stringp iso8601-string)
             (string-match
              (concat
               "^ *\\([0-9]\\{4\\}\\)"   ;year
               "\\(-\\([0-9]\\{2\\}\\)"  ;month
               "\\(-\\([0-9]\\{2\\}\\)"  ;day
               "\\(T"
               "\\([0-9]\\{2\\}\\):\\([0-9]\\{2\\}\\)" ;hour:minute
               "\\(:\\([0-9]\\{2\\}\\)\\(\\.[0-9]+\\)?\\)?" ;second
               ;; timezone
               "\\(\\([-+Z]\\)\\(\\([0-9]\\{2\\}\\):?\\([0-9]\\{2\\}\\)\\)?\\)?"
               "\\)?\\)?\\)? *$")
              iso8601-string))
    ;; Missing month and day default to 1, all other missing parts
    ;; default to 0.
    (let ((year (string-to-number (match-string 1 iso8601-string)))
          (month (string-to-number (or (match-string 3 iso8601-string)
                                       "1")))
          (day (string-to-number (or (match-string 5 iso8601-string)
                                     "1")))
          (hour (string-to-number (or (match-string 7 iso8601-string)
                                      "0")))
          (minute (string-to-number (or (match-string 8 iso8601-string)
                                        "0")))
          (second (string-to-number (or (match-string 10 iso8601-string)
                                        "0")))
          (sign (match-string 13 iso8601-string))
          (offset-hour (string-to-number
                        (or (match-string 15 iso8601-string) "0")))
          (offset-minute (string-to-number
                          (or (match-string 16 iso8601-string) "0"))))
      ;; Convert to universal time: a positive offset means that the
      ;; given time is ahead of UTC, so the offset is subtracted.
      (cond ((string= sign "+")
             (setq hour (- hour offset-hour))
             (setq minute (- minute offset-minute)))
            ((string= sign "-")
             (setq hour (+ hour offset-hour))
             (setq minute (+ minute offset-minute))))
      (condition-case nil
          (encode-time second minute hour day month year t)
        (error
         (message "Cannot decode \"%s\"" iso8601-string)
         nil)))))
1630
(defun newsticker--decode-rfc822-date (rfc822-string)
  "Convert RFC822-STRING to a time value as returned by `encode-time'.
A time zone in RFC822-STRING is applied, so that the result
denotes the corresponding universal time.  Numeric zones like
\"+0100\" as well as the zone names UT, GMT, EST, EDT, CST, CDT,
MST, MDT, PST, and PDT are understood.  Years with less than four
digits are expanded as described in RFC 2822.

Return nil if RFC822-STRING is not a string or cannot be decoded.

Examples:
Sat, 07 September 2002 00:00:01 +0100
Sat, 07 September 2002 00:00:01 MET
Sat, 07 Sep 2002 00:00:01 GMT
07 Sep 2002 00:00:01 GMT
07 Sep 2002"
  (when (and (stringp rfc822-string)
             (string-match
              (concat
               "\\s-*"
               ;; week day
               "\\(\\(Mon\\|Tue\\|Wed\\|Thu\\|Fri\\|Sat\\|Sun\\)\\s-*,?\\)?\\s-*"
               ;; day
               "\\([0-9]\\{1,2\\}\\)\\s-+"
               ;; month
               "\\(Jan\\|Feb\\|Mar\\|Apr\\|May\\|Jun\\|"
               "Jul\\|Aug\\|Sep\\|Oct\\|Nov\\|Dec\\).*?\\s-+"
               ;; year
               "\\([0-9]\\{2,4\\}\\)"
               ;; time may be missing
               "\\(\\s-+"
               ;; hour
               "\\([0-9]\\{2\\}\\)"
               ;; minute
               ":\\([0-9]\\{2\\}\\)"
               ;; second
               "\\(:\\([0-9]\\{2\\}\\)\\)?"
               ;; zone
               "\\(\\s-+\\("
               "UT\\|GMT\\|EST\\|EDT\\|CST\\|CDT\\|MST\\|MDT\\|PST\\|PDT"
               "\\|\\([-+]\\)\\([0-9]\\{2\\}\\)\\([0-9]\\{2\\}\\)"
               "\\)\\)?"
               "\\)?")
              rfc822-string))
    (let* ((day (string-to-number (match-string 3 rfc822-string)))
           (month-name (match-string 4 rfc822-string))
           (year (string-to-number (match-string 5 rfc822-string)))
           (hour (string-to-number (or (match-string 7 rfc822-string) "0")))
           (minute (string-to-number (or (match-string 8 rfc822-string) "0")))
           (second (string-to-number (or (match-string 10 rfc822-string) "0")))
           (zone (match-string 12 rfc822-string))
           (sign (match-string 13 rfc822-string))
           (offset-hour (string-to-number
                         (or (match-string 14 rfc822-string) "0")))
           (offset-minute (string-to-number
                           (or (match-string 15 rfc822-string) "0")))
           ;; Offset in hours of a zone given by name, nil otherwise.
           (named-offset
            (and zone (not sign)
                 (cdr (assoc (upcase zone)
                             '(("UT" . 0) ("GMT" . 0)
                               ("EST" . -5) ("EDT" . -4)
                               ("CST" . -6) ("CDT" . -5)
                               ("MST" . -7) ("MDT" . -6)
                               ("PST" . -8) ("PDT" . -7))))))
           ;; The month is looked up ignoring case, because the match
           ;; above may have ignored case as well.  0 means unknown.
           (month-tail (member (downcase month-name)
                               '("jan" "feb" "mar" "apr" "may" "jun"
                                 "jul" "aug" "sep" "oct" "nov" "dec")))
           (month (if month-tail (- 13 (length month-tail)) 0)))
      ;; Expand abbreviated years (RFC 2822, obsolete date syntax).
      (cond ((< year 50) (setq year (+ year 2000)))
            ((< year 1000) (setq year (+ year 1900))))
      ;; Convert to universal time: a positive offset means that the
      ;; given time is ahead of UTC, so the offset is subtracted.
      (cond ((and sign (string= sign "+"))
             (setq hour (- hour offset-hour))
             (setq minute (- minute offset-minute)))
            ((and sign (string= sign "-"))
             (setq hour (+ hour offset-hour))
             (setq minute (+ minute offset-minute)))
            (named-offset
             (setq hour (- hour named-offset))))
      (condition-case error-data
          (encode-time second minute hour day month year t)
        (error
         (message "Cannot decode \"%s\": %s %s" rfc822-string
                  (car error-data) (cdr error-data))
         nil)))))
1704
(defun newsticker--lists-intersect-p (list1 list2)
  "Return t if LIST1 and LIST2 share elements.
Elements are compared with `eq'.  Return nil if there is no
common element."
  (let ((remaining list1)
        (shared nil))
    ;; Stop as soon as a common element has been found.
    (while (and remaining (not shared))
      (when (memq (car remaining) list2)
        (setq shared t))
      (setq remaining (cdr remaining)))
    shared))
1713
(defun newsticker--update-process-ids ()
  "Update list of ids of active newsticker processes.
Set `newsticker--process-ids' to those of its elements which are
the id of a process in `process-list', then update the mode
line."
  (let ((still-active nil))
    (dolist (proc (process-list))
      (let ((pid (process-id proc)))
        (when (memq pid newsticker--process-ids)
          (setq still-active (cons pid still-active)))))
    (setq newsticker--process-ids still-active))
  (force-mode-line-update))
1726
1727 ;; ======================================================================
1728 ;;; Images
1729 ;; ======================================================================
(defun newsticker--images-dir ()
  "Return directory where feed images are saved.
The result is the \"images\" directory below `newsticker-dir'.
It ends with a slash, because callers build the name of an image
file by appending the feed name directly to this value."
  (concat newsticker-dir "/images/"))
1733
(defun newsticker--image-get (feed-name url)
  "Get image of the news site FEED-NAME from URL.
If the image has been downloaded in the last 24h do nothing.

Otherwise start a wget process named FEED-NAME which fetches URL,
with `newsticker--image-sentinel' as its sentinel.  The wget
arguments are taken from the feed's entry in
`newsticker-url-list' or `newsticker-url-list-defaults', falling
back to `newsticker-wget-arguments'.  Signal an error if the feed
is unknown or if a process named FEED-NAME exists already."
  (let* ((image-name (concat (newsticker--images-dir) feed-name))
         ;; Non-nil if the image file exists and was modified less
         ;; than 86400 seconds ago.
         (up-to-date
          (and (file-exists-p image-name)
               (time-less-p (current-time)
                            (time-add (nth 5 (file-attributes image-name))
                                      (seconds-to-time 86400))))))
    (cond
     (up-to-date
      (newsticker--debug-msg "%s: Getting image for %s skipped"
                             (format-time-string "%A, %H:%M" (current-time))
                             feed-name))
     (t
      ;; download
      (newsticker--debug-msg "%s: Getting image for %s"
                             (format-time-string "%A, %H:%M" (current-time))
                             feed-name)
      (let* ((buffername (concat " *newsticker-wget-image-" feed-name "*"))
             (entry (or (assoc feed-name newsticker-url-list)
                        (assoc feed-name newsticker-url-list-defaults)
                        (error
                         "Cannot get news for %s: Check newsticker-url-list"
                         feed-name)))
             (wget-arguments (or (nth 4 entry)
                                 newsticker-wget-arguments)))
        (with-current-buffer (get-buffer-create buffername)
          (erase-buffer)
          ;; throw an error if there is an old wget-process around
          (when (get-process feed-name)
            (error "Another wget-process is running for image %s"
                   feed-name))
          ;; start wget
          (let ((proc (apply 'start-process feed-name buffername
                             newsticker-wget-name
                             (append wget-arguments (list url)))))
            (set-process-coding-system proc 'no-conversion 'no-conversion)
            (set-process-sentinel proc 'newsticker--image-sentinel))))))))
1769
(defun newsticker--image-sentinel (process event)
  "Sentinel for image-retrieving PROCESS caused by EVENT.
If PROCESS has exited with status 0, the contents of its buffer is
written without any conversion to the image file of the feed and
the buffer is killed.  The feed name is the name of PROCESS.
Otherwise a message is shown and nothing is written.
EVENT is not used."
  (let ((p-status (process-status process))
        (exit-status (process-exit-status process))
        (feed-name (process-name process)))
    (if (not (and (eq p-status 'exit)
                  (= exit-status 0)))
        (progn
          (message "%s: Error while retrieving image from %s"
                   (format-time-string "%A, %H:%M" (current-time))
                   feed-name)
          nil)
      (with-current-buffer (process-buffer process)
        (let ((image-name (concat (newsticker--images-dir) feed-name)))
          (set-buffer-file-coding-system 'no-conversion)
          ;; Make sure the cache dir exists.  Missing parent
          ;; directories are created as well, like the functions
          ;; saving the item cache do.
          (unless (file-directory-p (newsticker--images-dir))
            (make-directory (newsticker--images-dir) t))
          ;; Write the raw data and get rid of the buffer.
          (let ((require-final-newline nil)
                (backup-inhibited t)
                (coding-system-for-write 'no-conversion))
            (write-region nil nil image-name nil 'quiet))
          (set-buffer-modified-p nil)
          (kill-buffer (current-buffer)))))))
1798
(defun newsticker--insert-image (img string)
  "Insert the image IMG at point, using STRING as its text.
This is a thin wrapper around `insert-image'."
  (insert-image img string))
1802
1803 ;; ======================================================================
1804 ;;; HTML rendering
1805 ;; ======================================================================
(defun newsticker-htmlr-render (pos1 pos2)
  "Replacement for `htmlr-render'.
Renders the HTML code in the region POS1 to POS2 using htmlr.
The region is deleted and the rendered text, passed through
`newsticker--remove-whitespace', is inserted at point.  The htmlr
functions are called only if they are defined."
  (let ((html (buffer-substring-no-properties pos1 pos2))
        rendered)
    (delete-region pos1 pos2)
    (setq rendered
          (with-temp-buffer
            (insert html)
            (goto-char (point-min))
            ;; This part follows the original `htmlr-render' (with
            ;; something omitted).
            (if (fboundp 'htmlr-reset)
                (htmlr-reset))
            (if (fboundp 'htmlr-step)
                (while (< (point) (point-max))
                  (htmlr-step)))
            (newsticker--remove-whitespace (buffer-string))))
    (insert rendered)))
1823
1824 ;; ======================================================================
1825 ;;; Manipulation of cached data
1826 ;; ======================================================================
(defun newsticker--cache-set-preformatted-contents (item contents)
  "Set preformatted contents of ITEM to CONTENTS.
The preformatted contents is the seventh element of ITEM.  If ITEM
has six elements only, a new element holding CONTENTS is appended."
  (let ((cell (nthcdr 6 item)))
    (if cell
        (setcar cell contents)
      (setcdr (nthcdr 5 item) (list contents)))))
1832
(defun newsticker--cache-set-preformatted-title (item title)
  "Set preformatted title of ITEM to TITLE.
The preformatted title is the eighth element of ITEM.  If ITEM has
seven elements only, a new element holding TITLE is appended."
  (let ((cell (nthcdr 7 item)))
    (if cell
        (setcar cell title)
      ;; Append a proper list cell.  Storing TITLE itself as the cdr
      ;; would turn ITEM into a dotted list and break later updates.
      (setcdr (nthcdr 6 item) (list title)))))
1838
(defun newsticker--cache-replace-age (data feed old-age new-age)
  "Mark all items in DATA in FEED which carry age OLD-AGE with NEW-AGE.
If FEED is the symbol `any' all feeds are processed.  If OLD-AGE is
the symbol `any' every item gets NEW-AGE, whatever its age was.
For each changed item `newsticker--do-forget-preformatted' is
called.  Return DATA."
  (dolist (a-feed data)
    (when (or (eq feed 'any)
              (eq (car a-feed) feed))
      (dolist (item (cdr a-feed))
        (when (or (eq old-age 'any)
                  (eq (newsticker--age item) old-age))
          ;; The age is the fifth element of an item.
          (setcar (nthcdr 4 item) new-age)
          (newsticker--do-forget-preformatted item)))))
  data)
1855
(defun newsticker--cache-mark-expired (data feed old-age new-age time)
  "Mark all expired entries.
Walk over the items in DATA which belong to the feed FEED, or to
any feed if FEED is the symbol `any'.  An item whose age is OLD-AGE
gets the age NEW-AGE if its time plus TIME seconds lies before the
current time.  Return DATA."
  (dolist (a-feed data)
    (when (or (eq feed 'any)
              (eq (car a-feed) feed))
      (dolist (item (cdr a-feed))
        (when (eq (newsticker--age item) old-age)
          (let ((expiry (time-add (newsticker--time item)
                                  (seconds-to-time time))))
            (when (time-less-p expiry (current-time))
              (newsticker--debug-msg
               "Item `%s' from %s has expired on %s"
               (newsticker--title item)
               (format-time-string "%Y-%02m-%d, %H:%M"
                                   (newsticker--time item))
               (format-time-string "%Y-%02m-%d, %H:%M" expiry))
              (setcar (nthcdr 4 item) new-age)))))))
  data)
1882
(defun newsticker--cache-contains (data feed title desc link age
                                        &optional guid)
  "Check DATA whether FEED contains an item with the given properties.
This function returns the contained item or nil if it is not
contained.

If GUID is non-nil an item matches if its guid equals GUID; the
other properties are ignored then.

Otherwise an item matches if its title equals TITLE, its link
equals LINK (unless LINK is nil), and its description equals DESC
\(unless DESC is nil).  If `newsticker-desc-comp-max' is non-nil,
only the first `newsticker-desc-comp-max' characters of the
descriptions are compared.

AGE is currently not taken into account.  Any error which occurs
during the search is caught and makes this function return nil."
  (condition-case nil
      (catch 'found
        ;; Compare truncated descriptions only.
        (when (and desc newsticker-desc-comp-max
                   (> (length desc) newsticker-desc-comp-max))
          (setq desc (substring desc 0 newsticker-desc-comp-max)))
        (dolist (this-feed data)
          (when (eq (car this-feed) feed)
            (dolist (candidate (cdr this-feed))
              (when (if guid
                        ;; A global unique id is sufficient.
                        (string= guid (newsticker--guid candidate))
                      ;; Without guid compare title, link, and desc.
                      (and (string= (newsticker--title candidate) title)
                           (or (not link)
                               (string= (newsticker--link candidate) link))
                           (or (not desc)
                               (let ((cached-desc (newsticker--desc candidate)))
                                 (string= (if (and newsticker-desc-comp-max
                                                   (> (length cached-desc)
                                                      newsticker-desc-comp-max))
                                              (substring
                                               cached-desc 0
                                               newsticker-desc-comp-max)
                                            cached-desc)
                                          desc)))))
                (throw 'found candidate)))))
        nil)
    (error nil)))
1945
(defun newsticker--cache-add (data feed-name-symbol title desc link time age
                                   position extra-elements
                                   &optional updated-time updated-age
                                   preformatted-contents
                                   preformatted-title)
  "Add another item to cache data.
Add to DATA in the FEED-NAME-SYMBOL an item with TITLE, DESC,
LINK, TIME, AGE, POSITION, and EXTRA-ELEMENTS.  If this item is
contained already, its position is set to POSITION, its mark is
set to UPDATED-AGE, its time is set to UPDATED-TIME (unless that
is nil), and its pre-formatted contents and title are set to
PREFORMATTED-CONTENTS and PREFORMATTED-TITLE.

Return the resulting cache data.  The return value must be used:
if DATA does not contain FEED-NAME-SYMBOL yet, the new feed is
appended to a copy of the list, not to DATA itself."
  (let* ((guid (newsticker--guid-to-string (assoc 'guid extra-elements)))
         (item (newsticker--cache-contains data feed-name-symbol title desc link
                                           age guid)))
    (if item
        ;; Does exist already -- change age, update time and position.
        (progn
          (if (nthcdr 5 item)
              (setcar (nthcdr 5 item) position)
            (setcdr (nthcdr 4 item) (list position)))
          (setcar (nthcdr 4 item) updated-age)
          (if updated-time
              (setcar (nthcdr 3 item) updated-time))
          ;; Replace cached pre-formatted contents.
          (newsticker--cache-set-preformatted-contents
           item preformatted-contents)
          (newsticker--cache-set-preformatted-title
           item preformatted-title))
      ;; Did not exist -- create the item and attach it to its feed.
      (setq item (list title desc link time age position preformatted-contents
                       preformatted-title extra-elements))
      (let ((feed (assq feed-name-symbol data)))
        (if feed
            (setcdr feed (nconc (cdr feed) (list item)))
          ;; The feed is not contained.  `add-to-list' must not be
          ;; used here: it operates on the symbol `data', which only
          ;; works while DATA happens to be dynamically bound.
          (setq data (append data (list (list feed-name-symbol item)))))))
    data))
1994
(defun newsticker--cache-remove (data feed-symbol age)
  "Remove all entries from DATA in the feed FEED-SYMBOL with AGE.
FEED-SYMBOL may be `any'.  Entries from old feeds, which are no longer in
`newsticker-url-list' or `newsticker-url-list-defaults', are removed as
well.

DATA is modified destructively.  Return the resulting list; the
return value has to be used in order to notice the removal of the
first feed of DATA."
  (let* ((pos data)
         (feed (car pos))
         (last-pos nil))
    (while feed
      (let ((feed-name (symbol-name (car feed))))
        (if (or (assoc feed-name newsticker-url-list)
                (assoc feed-name newsticker-url-list-defaults))
            (progn
              ;; Feed is still valid=active: drop its items of age AGE.
              (when (or (eq feed-symbol 'any)
                        (eq feed-symbol (car feed)))
                ;; PREV-CELL is the cons whose cdr is ITEM-POS.  At the
                ;; beginning this is the feed itself, as the cdr of a
                ;; feed is its list of items.
                (let ((prev-cell feed)
                      (item-pos (cdr feed)))
                  (while (car item-pos)
                    (if (eq age (newsticker--age (car item-pos)))
                        (setcdr prev-cell (cdr item-pos))
                      (setq prev-cell item-pos))
                    (setq item-pos (cdr item-pos)))))
              ;; Only a feed which stays in the list may serve as
              ;; predecessor when a later feed is unlinked.  Advancing
              ;; onto an unlinked cell would leave the second of two
              ;; consecutive inactive feeds in the list.
              (setq last-pos pos))
          ;; Feed is not active anymore: unlink it.
          (if last-pos
              (setcdr last-pos (cdr pos))
            (setq data (cdr pos)))))
      (setq pos (cdr pos))
      (setq feed (car pos)))
    data))
2034
2035 ;; ======================================================================
2036 ;;; Sorting
2037 ;; ======================================================================
(defun newsticker--cache-item-compare-by-time (item1 item2)
  "Compare two news items ITEM1 and ITEM2 by comparing their time values.
If exactly one of the items has the age `obsolete', return nil if
that is ITEM1 and t if it is ITEM2.  Otherwise return t if the time
of ITEM1 is later than the time of ITEM2, nil if not.  The first
three elements of the time values are compared; a missing third
element counts as 0."
  (let ((age1 (newsticker--age item1))
        (age2 (newsticker--age item2)))
    (cond
     ((and (eq age1 'obsolete) (not (eq age2 'obsolete)))
      nil)
     ((and (eq age2 'obsolete) (not (eq age1 'obsolete)))
      t)
     (t
      (let ((time1 (newsticker--time item1))
            (time2 (newsticker--time item2)))
        ;; Lexicographic comparison, most significant part first.
        (or (> (nth 0 time1) (nth 0 time2))
            (and (= (nth 0 time1) (nth 0 time2))
                 (or (> (nth 1 time1) (nth 1 time2))
                     (and (= (nth 1 time1) (nth 1 time2))
                          (> (or (nth 2 time1) 0)
                             (or (nth 2 time2) 0)))))))))))
2064
(defun newsticker--cache-item-compare-by-title (item1 item2)
  "Compare ITEM1 and ITEM2 by comparing their titles.
If exactly one of the items has the age `obsolete', return nil if
that is ITEM1 and t if it is ITEM2.  Otherwise return the result
of `string<' applied to the titles of ITEM1 and ITEM2."
  (let ((age1 (newsticker--age item1))
        (age2 (newsticker--age item2)))
    (cond
     ((and (eq age1 'obsolete) (not (eq age2 'obsolete)))
      nil)
     ((and (eq age2 'obsolete) (not (eq age1 'obsolete)))
      t)
     (t
      (string< (newsticker--title item1) (newsticker--title item2))))))
2076
(defun newsticker--cache-item-compare-by-position (item1 item2)
  "Compare ITEM1 and ITEM2 by comparing their original positions.
If exactly one of the items has the age `obsolete', return nil if
that is ITEM1 and t if it is ITEM2.  Otherwise return t if the
position of ITEM1 is less than the position of ITEM2.  A missing
position counts as 0."
  (let ((age1 (newsticker--age item1))
        (age2 (newsticker--age item2)))
    (cond
     ((and (eq age1 'obsolete) (not (eq age2 'obsolete)))
      nil)
     ((and (eq age2 'obsolete) (not (eq age1 'obsolete)))
      t)
     (t
      (< (or (newsticker--pos item1) 0)
         (or (newsticker--pos item2) 0))))))
2088
(defun newsticker--cache-save-version1 ()
  "Update and save newsticker cache file.
This calls `newsticker--cache-update' with a non-nil argument, so
the cache file is written to disk."
  (interactive)
  (newsticker--cache-update t))
2093
(defun newsticker--cache-update (&optional save)
  "Update newsticker cache file.
The directory `newsticker-dir' is created if it does not exist.
The buffer visiting `newsticker-cache-filename' is emptied and
filled with a coding cookie and the printed representation of
`newsticker--cache'.
If optional argument SAVE is not nil the cache file is saved to disk."
  (save-excursion
    (or (file-directory-p newsticker-dir)
        (make-directory newsticker-dir t))
    (let ((coding-system-for-write 'utf-8)
          (buf (find-file-noselect newsticker-cache-filename)))
      (if buf
          (with-current-buffer buf
            ;; Do not record undo information for the cache buffer.
            (setq buffer-undo-list t)
            (erase-buffer)
            (insert ";; -*- coding: utf-8 -*-\n"
                    (prin1-to-string newsticker--cache))
            (if save
                (save-buffer)))))))
2110
(defun newsticker--cache-get-feed (feed)
  "Return the cached data for the feed FEED.
FEED is a symbol, not a string.  The value is the element of
`newsticker--cache' whose car is FEED, or nil if there is none."
  (assoc feed newsticker--cache))
2115
(defun newsticker--cache-dir ()
  "Return directory for saving cache data.
This is the directory \"feeds\" below `newsticker-dir'; the value
does not end with a slash."
  (concat newsticker-dir "/feeds"))
2119
(defun newsticker--cache-save ()
  "Save cache data for all feeds.
Create `newsticker-dir' if it does not exist, then write every
feed in `newsticker--cache' with `newsticker--cache-save-feed'.
Return nil."
  (or (file-directory-p newsticker-dir)
      (make-directory newsticker-dir t))
  (dolist (feed newsticker--cache)
    (newsticker--cache-save-feed feed))
  nil)
2126
(defun newsticker--cache-save-feed (feed)
  "Save cache data for FEED.
FEED is a cons of a feed symbol and the list of its items.  The
items are printed, preceded by a coding cookie, into the file
\"data\" in a directory named like the feed below the directory
returned by `newsticker--cache-dir'.  The directory is created if
it does not exist."
  (let* ((feed-dir (concat (newsticker--cache-dir) "/"
                           (symbol-name (car feed))))
         (data-file (concat feed-dir "/data"))
         (coding-system-for-write 'utf-8))
    (or (file-directory-p feed-dir)
        (make-directory feed-dir t))
    (with-temp-file data-file
      (insert ";; -*- coding: utf-8 -*-\n"
              (prin1-to-string (cdr feed))))))
2136
(defun newsticker--cache-read-version1 ()
  "Read version1 cache data.
If the file `newsticker-cache-filename' exists, the first Lisp
expression in it becomes the value of `newsticker--cache'.  If
reading that expression fails a message is shown and
`newsticker--cache' is set to nil."
  (when (file-exists-p newsticker-cache-filename)
    (let ((coding-system-for-read 'utf-8))
      (with-temp-buffer
        (insert-file-contents newsticker-cache-filename)
        (goto-char (point-min))
        (condition-case nil
            (setq newsticker--cache (read (current-buffer)))
          (error
           (message "Error while reading newsticker cache file!")
           (setq newsticker--cache nil)))))))
2149
(defun newsticker--cache-read ()
  "Read cache data.
`newsticker--cache' is reset first.  If the old cache file
`newsticker-cache-filename' exists, the user is asked whether it
shall be read and whether it shall be deleted; the per-feed cache
files are not read in this case.  Otherwise the cache file of
every feed in `newsticker-url-list-defaults' and
`newsticker-url-list' is read."
  (setq newsticker--cache nil)
  (cond
   ((file-exists-p newsticker-cache-filename)
    (if (y-or-n-p "Old newsticker cache file exists. Read it? ")
        (newsticker--cache-read-version1))
    (if (y-or-n-p "Delete old newsticker cache file? ")
        (delete-file newsticker-cache-filename)))
   (t
    (mapc (lambda (entry)
            ;; The car of a feed entry is the name of the feed.
            (newsticker--cache-read-feed (car entry)))
          (append newsticker-url-list-defaults newsticker-url-list)))))
2162
(defun newsticker--cache-read-feed (feed-name)
  "Read cache data for feed named FEED-NAME.
If the data file of the feed exists, the first Lisp expression in
it is added to `newsticker--cache' under the symbol named
FEED-NAME.  If that expression cannot be read a message is shown
and the feed is skipped; the cache data of other feeds is left
untouched."
  (let ((file-name (concat (newsticker--cache-dir) "/" feed-name "/data"))
        (coding-system-for-read 'utf-8))
    (when (file-exists-p file-name)
      (with-temp-buffer
        (insert-file-contents file-name)
        (goto-char (point-min))
        (condition-case nil
            (add-to-list 'newsticker--cache (cons (intern feed-name)
                                                  (read (current-buffer))))
          (error
           ;; Only this feed is affected.  Do not throw away what has
           ;; been read for the other feeds.
           (message "Error while reading newsticker cache file %s!"
                    file-name)
           nil))))))
2178
2179 ;; ======================================================================
2180 ;;; Statistics
2181 ;; ======================================================================
(defun newsticker--stat-num-items (feed &rest ages)
  "Return number of items in the given FEED which have one of the given AGES.
FEED is a feed symbol.  If AGES is nil, the items whose age is one
of `new', `old', `immortal', or `obsolete' are counted."
  (let ((wanted (or ages '(new old immortal obsolete)))
        (count 0))
    (dolist (item (cdr (newsticker--cache-get-feed feed)))
      (if (memq (newsticker--age item) wanted)
          (setq count (1+ count))))
    count))
2195
(defun newsticker--stat-num-items-total (&optional age)
  "Return total number of items in all feeds which have the given AGE.
The feeds in `newsticker-url-list-defaults' and
`newsticker-url-list' are considered.  The items of each feed are
counted by `newsticker--stat-num-items', which is called without
any age if AGE is nil."
  (let ((total 0))
    (dolist (feed (append newsticker-url-list-defaults newsticker-url-list))
      (setq total
            (+ total
               (apply 'newsticker--stat-num-items
                      (intern (car feed))
                      ;; Pass no age at all rather than a nil age.
                      (and age (list age))))))
    total))
2205
2206 ;; ======================================================================
2207 ;;; OPML
2208 ;; ======================================================================
(defun newsticker--opml-escape (string)
  "Return STRING with the characters &, <, >, and \" replaced by XML entities."
  (let ((result string))
    ;; The ampersand has to be replaced first.
    (dolist (pair '(("&" . "&amp;") ("<" . "&lt;")
                    (">" . "&gt;") ("\"" . "&quot;")))
      (setq result
            (replace-regexp-in-string (car pair) (cdr pair) result t t)))
    result))

(defun newsticker-opml-export ()
  "OPML subscription export.
Export subscriptions to a buffer in OPML Format.
The buffer \"*OPML Export*\" is emptied before the feeds in
`newsticker-url-list' and `newsticker-url-list-defaults' are
written to it, so repeated exports do not accumulate.  Feed names
and URLs are escaped for use as XML attribute values.  Finally the
buffer is displayed, in `sgml-mode' if that is available."
  (interactive)
  (with-current-buffer (get-buffer-create "*OPML Export*")
    (erase-buffer)
    (set-buffer-file-coding-system 'utf-8)
    (insert (concat
             "<?xml version=\"1.0\" encoding=\"utf-8\"?>\n"
             "<!-- OPML generated by Emacs newsticker.el -->\n"
             "<opml version=\"1.0\">\n"
             " <head>\n"
             " <title>mySubscriptions</title>\n"
             " <dateCreated>" (format-time-string "%a, %d %b %Y %T %z")
             "</dateCreated>\n"
             " <ownerEmail>" user-mail-address "</ownerEmail>\n"
             " <ownerName>" (user-full-name) "</ownerName>\n"
             " </head>\n"
             " <body>\n"))
    (dolist (sub (append newsticker-url-list newsticker-url-list-defaults))
      ;; The first element of a feed entry is its name, the second
      ;; one its URL.
      (insert " <outline text=\"")
      (insert (newsticker--opml-escape (car sub)))
      (insert "\" xmlUrl=\"")
      ;; `format' leaves strings alone.  NOTE(review): presumably the
      ;; URL may also be a retrieval function symbol -- confirm
      ;; against the documentation of `newsticker-url-list'.
      (insert (newsticker--opml-escape (format "%s" (cadr sub))))
      (insert "\"/>\n"))
    (insert " </body>\n</opml>\n"))
  (pop-to-buffer "*OPML Export*")
  (when (fboundp 'sgml-mode)
    (sgml-mode)))
2238
(defun newsticker--opml-import-outlines (outlines)
  "Recursively import OUTLINES from OPML data.
Every outline which has a non-empty xmlUrl attribute is appended
to `newsticker-url-list', using its text attribute as feed name.
Note that nested outlines are currently flattened -- i.e. grouping is
removed.  Return OUTLINES."
  (dolist (outline outlines)
    (let ((name (xml-get-attribute outline 'text))
          (url (xml-get-attribute outline 'xmlUrl))
          (children (xml-get-children outline 'outline)))
      (or (string= "" url)
          (add-to-list 'newsticker-url-list
                       (list name url nil nil nil) t))
      (when children
        (newsticker--opml-import-outlines children))))
  outlines)
2253
(defun newsticker-opml-import (filename)
  "Import OPML data from FILENAME.
The file is visited and parsed as XML.  The outlines found in the
body element of the first top-level node are passed to
`newsticker--opml-import-outlines'.  Afterwards a customization
buffer for `newsticker-url-list' is opened."
  (interactive "fOPML file: ")
  (set-buffer (find-file-noselect filename))
  (goto-char (point-min))
  (let* ((root (car (xml-parse-region (point-min) (point-max))))
         (body (car (xml-get-children root 'body))))
    (newsticker--opml-import-outlines (xml-get-children body 'outline)))
  (customize-variable 'newsticker-url-list))
2264
2265 ;; ======================================================================
2266 ;;; Auto marking
2267 ;; ======================================================================
(defun newsticker--run-auto-mark-filter (feed item)
  "Automatically mark an item as old or immortal.
This function checks the variable `newsticker-auto-mark-filter-list'
for an entry that matches FEED and ITEM.  The first element of
each entry is a regexp which is matched against FEED, ignoring
case.  If it matches, the second element is applied to ITEM by
`newsticker--do-run-auto-mark-filter'."
  (let ((case-fold-search t))
    (dolist (filter newsticker-auto-mark-filter-list)
      (if (string-match (car filter) feed)
          (newsticker--do-run-auto-mark-filter item (cadr filter))))
    newsticker-auto-mark-filter-list))
2279
(defun newsticker--do-run-auto-mark-filter (item list)
  "Actually compare ITEM against the pattern-LIST.
LIST is the list of patterns of an element of
`newsticker-auto-mark-filter-list'.  Each pattern has the form
\(AGE PLACE REGEXP).  If PLACE is `title' or `all' and REGEXP
matches the title of ITEM, the age of ITEM is set to AGE.  The
same is done for the description of ITEM if PLACE is `description'
or `all'.  Return LIST."
  (dolist (pattern list)
    (let* ((age (nth 0 pattern))
           (place (nth 1 pattern))
           (regexp (nth 2 pattern))
           (title (newsticker--title item))
           (desc (newsticker--desc item))
           (check-title (memq place '(title all)))
           (check-desc (memq place '(description all))))
      (when (and check-title title (string-match regexp title))
        (newsticker--debug-msg "Auto-marking as %s: `%s'" age title)
        (setcar (nthcdr 4 item) age))
      (when (and check-desc desc (string-match regexp desc))
        (newsticker--debug-msg "Auto-marking as %s: `%s'" age title)
        (setcar (nthcdr 4 item) age))))
  list)
2300
2301
2302 ;; ======================================================================
2303 ;;; Hook samples
2304 ;; ======================================================================
(defun newsticker-new-item-functions-sample (feed item)
  "Demonstrate the use of the `newsticker-new-item-functions' hook.
This function merely shows a message which contains FEED and the
title of ITEM."
  (let ((title (newsticker--title item)))
    (message "newsticker-new-item-functions-sample: feed=`%s', title=`%s'"
             feed title)))
2311
(defun newsticker-download-images (feed item)
  "Download the first image.
If FEED equals \"imagefeed\" download the first image URL found
in the description=contents of ITEM to the directory
\"~/tmp/newsticker/FEED/TITLE\" where TITLE is the title of the item.
The directory is created if it does not exist.  Items without a
description are ignored."
  (when (string= feed "imagefeed")
    (let ((title (newsticker--title item))
          (desc (newsticker--desc item)))
      (when (and desc
                 (string-match "<img src=\"\\(http://[^ \"]+\\)\"" desc))
        (let ((url (match-string 1 desc))
              (temp-dir (concat "~/tmp/newsticker/" feed "/" title)))
          (unless (file-directory-p temp-dir)
            (make-directory temp-dir t))
          (message "Getting image %s" url)
          ;; Start the download program with TEMP-DIR as its working
          ;; directory.  `default-directory' is bound rather than
          ;; changed with `cd', so it is restored even if starting
          ;; the process fails.
          (let ((default-directory
                  (file-name-as-directory (expand-file-name temp-dir))))
            (start-process "wget-image"
                           " *newsticker-wget-download-images*"
                           newsticker-wget-name
                           url)))))))
2333
(defun newsticker-download-enclosures (feed item)
  "In all FEEDs download the enclosed object of the news ITEM.
The object is saved to the directory \"~/tmp/newsticker/FEED/TITLE\", which
is created if it does not exist.  TITLE is the title of the news
item.  Items which have no enclosure, or whose enclosure has no
URL, are ignored.
This function is suited for adding it to `newsticker-new-item-functions'."
  (let* ((title (newsticker--title item))
         (enclosure (newsticker--enclosure item))
         (url (and enclosure (cdr (assoc 'url enclosure)))))
    (when url
      (let ((temp-dir (concat "~/tmp/newsticker/" feed "/" title)))
        (unless (file-directory-p temp-dir)
          (make-directory temp-dir t))
        (message "Getting enclosure %s" url)
        ;; Start the download program with TEMP-DIR as its working
        ;; directory.  `default-directory' is bound rather than
        ;; changed with `cd', so it is restored even if starting the
        ;; process fails.
        (let ((default-directory
                (file-name-as-directory (expand-file-name temp-dir))))
          (start-process "wget-enclosure"
                         " *newsticker-wget-download-enclosures*"
                         newsticker-wget-name
                         url))))))
2355
2356 ;; ======================================================================
2357 ;;; Retrieve samples
2358 ;; ======================================================================
(defun newsticker-retrieve-random-message (feed-name)
  "Return an artificial RSS string under the name FEED-NAME.
The RSS document contains a single item whose title and
description each show a random number below 10000.  FEED-NAME is
not used."
  (let* ((title (format "Your lucky number is %d" (random 10000)))
         (description (format "Or maybe it is %d" (random 10000))))
    (concat "<?xml version=\"1.0\" encoding=\"iso-8859-1\" ?><rss version=\"0.91\">"
            "<channel>"
            "<title>newsticker-retrieve-random-message</title>"
            "<description>Sample retrieval function</description>"
            "<pubDate>FIXME Sat, 07 Sep 2005 00:00:01 GMT</pubDate>"
            "<item><title>" title
            "</title><description>" description
            "</description></item></channel></rss>")))
2369
2370 (provide 'newsticker-backend)
2371
2372 ;; arch-tag: 0e37b658-56e9-49ab-90f9-f2df57e1a659
2373 ;;; newst-backend.el ends here