1 ;;; shr.el --- Simple HTML Renderer
3 ;; Copyright (C) 2010 Free Software Foundation, Inc.
5 ;; Author: Lars Magne Ingebrigtsen <larsi@gnus.org>
8 ;; This file is part of GNU Emacs.
10 ;; GNU Emacs is free software: you can redistribute it and/or modify
11 ;; it under the terms of the GNU General Public License as published by
12 ;; the Free Software Foundation, either version 3 of the License, or
13 ;; (at your option) any later version.
15 ;; GNU Emacs is distributed in the hope that it will be useful,
16 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
17 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 ;; GNU General Public License for more details.
20 ;; You should have received a copy of the GNU General Public License
21 ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
;; This package takes an HTML parse tree (as provided by
;; libxml-parse-html-region) and renders it in the current buffer.  It
;; does not do CSS, JavaScript or anything advanced: it's geared
;; towards rendering typical short snippets of HTML, like what you'd
;; find in HTML email and the like.
34 "Simple HTML Renderer"
37 (defcustom shr-max-image-proportion 0.9
38 "How big pictures displayed are in relation to the window they're in.
39 A value of 0.7 means that they are allowed to take up 70% of the
40 width and height of the window. If they are larger than this,
41 and Emacs supports it, then the images will be rescaled down to
47 (defcustom shr-blocked-images nil
48 "Images that have URLs matching this regexp will be blocked."
(defvar shr-folding-mode nil
  "Folding mode consulted by `shr-insert'.
`shr-insert' tests it against the symbol `none', and `shr-tag-pre'
rebinds it around the content it renders.")

(defvar shr-state nil
  "State left behind by the most recently rendered element.
`shr-tag-img' sets it to the symbol `image'; `shr-insert' checks for
that value and resets the variable to nil.")

(defvar shr-start nil
  "Buffer position where the most recently inserted text starts.
This is a special variable used to pass that position upwards:
`shr-insert' sets it to point, and `shr-fontize-cont' and `shr-tag-a'
use it as the start of the region they decorate.")

(defvar shr-indentation 0
  "Number of spaces `shr-insert' uses to indent text.
`shr-tag-blockquote' rebinds it to four more than its current value.")
60 (defun shr-transform-dom (dom)
61 (let ((result (list (pop dom))))
62 (dolist (arg (pop dom))
63 (push (cons (intern (concat ":" (symbol-name (car arg))) obarray)
68 (push (cons :text sub) result)
69 (push (shr-transform-dom sub) result)))
73 (defun shr-insert-document (dom)
76 (shr-descend (shr-transform-dom dom))))
(defun shr-descend (dom)
  "Render the element DOM.
DOM is a cons whose car is the tag symbol and whose cdr is the
element's content.  If a function named `shr-tag-TAG' is defined,
call it with the content; otherwise hand the content to
`shr-generic'."
  ;; Look the handler up with `intern-soft' rather than `intern': the
  ;; tag name comes straight from the document, and there is no need
  ;; to create a new symbol in the obarray for every tag that has no
  ;; handler.  `fboundp' returns nil for nil, so unknown tags still
  ;; fall through to `shr-generic'.
  (let ((handler (intern-soft (concat "shr-tag-" (symbol-name (car dom)))
                              obarray)))
    (if (fboundp handler)
        (funcall handler (cdr dom))
      (shr-generic (cdr dom)))))
84 (defun shr-generic (cont)
88 (shr-insert (cdr sub)))
92 (defun shr-tag-p (cont)
93 (shr-ensure-paragraph)
95 (shr-ensure-paragraph))
97 (defun shr-ensure-paragraph ()
100 (unless (eql (char-after (- (point) 2)) ?\n)
(defun shr-tag-b (cont)
  "Render CONT, the content of a <b> element, in the `bold' face."
  (shr-fontize-cont cont (quote bold)))
(defun shr-tag-i (cont)
  "Render CONT, the content of an <i> element, in the `italic' face."
  (shr-fontize-cont cont (quote italic)))
(defun shr-tag-u (cont)
  "Render CONT, the content of a <u> element, in the `underline' face."
  (shr-fontize-cont cont (quote underline)))
(defun shr-tag-s (cont)
  "Render CONT, the content of an <s> element, struck through."
  ;; There is no standard face named `strikethru', so using that
  ;; symbol as a face produces an invalid face reference.  An
  ;; anonymous face with the `:strike-through' attribute is a valid
  ;; `face' property value and needs no face definition.
  (shr-fontize-cont cont '(:strike-through t)))
120 (defun shr-fontize-cont (cont &rest types)
124 (shr-add-font (or shr-start (point)) (point) type))))
(defun shr-add-font (start end type)
  "Give the text between START and END the face TYPE.
The face is applied through a newly created overlay covering that
region."
  (overlay-put (make-overlay start end) 'face type))
130 (defun shr-tag-a (cont)
131 (let ((url (cdr (assq :href cont)))
134 (widget-convert-button
135 'link shr-start (point)
136 :action 'shr-browse-url
138 :keymap widget-keymap
(defun shr-browse-url (widget &rest stuff)
  "Open the URL stored in WIDGET's `:url' property with `browse-url'.
Any further arguments, collected in STUFF, are ignored."
  (let ((target (widget-get widget :url)))
    (browse-url target)))
144 (defun shr-tag-img (cont)
145 (when (and (> (current-column) 0)
146 (not (eq shr-state 'image)))
148 (let ((start (point-marker)))
149 (let ((alt (cdr (assq :alt cont)))
150 (url (cdr (assq :src cont))))
151 (when (zerop (length alt))
154 ((and shr-blocked-images
155 (string-match shr-blocked-images url))
157 ((url-is-cached (browse-url-url-encode-chars url "[&)$ ]"))
158 (shr-put-image (shr-get-image-data url) (point) alt))
161 (url-retrieve url 'shr-image-fetched
162 (list (current-buffer) start (point-marker))
165 (setq shr-state 'image))))
(defun shr-image-fetched (status buffer start end)
  "Insert a freshly retrieved image into BUFFER.
This runs as a `url-retrieve' callback, so the response buffer is
current when it is called.  STATUS is the status plist passed by
`url-retrieve'.  START and END delimit the placeholder text in
BUFFER; that text is deleted and reused as the alt text of the
image, which is placed at START with `shr-put-image'.

Nothing is inserted if BUFFER has been killed, if STATUS contains
an `:error' entry, or if the end of the response headers cannot be
found.  The response buffer is killed in every case."
  (let ((response (current-buffer)))
    (unwind-protect
        (when (and (buffer-name buffer)
                   (not (plist-get status :error)))
          (url-store-in-cache response)
          ;; Point is not guaranteed to be at the start of the
          ;; response, so look for the end of the headers from the
          ;; top of the buffer.
          (goto-char (point-min))
          ;; Match the first blank line, whether the headers end in
          ;; LF or CRLF.  Searching for "\n\n" first and "\r\n\r\n"
          ;; second could skip CRLF-terminated headers and stop at a
          ;; blank line inside the image data instead.
          (when (re-search-forward "\r?\n\r?\n" nil t)
            (let ((data (buffer-substring (point) (point-max))))
              (with-current-buffer buffer
                (let ((alt (buffer-substring start end))
                      (inhibit-read-only t))
                  (delete-region start end)
                  (shr-put-image data start alt))))))
      ;; Clean up the response buffer even when inserting the image
      ;; signalled an error.
      (when (buffer-live-p response)
        (kill-buffer response)))))
181 (defun shr-put-image (data point alt)
182 (if (not (display-graphic-p))
184 (let ((image (ignore-errors
185 (shr-rescale-image data))))
187 (put-image image point alt)))))
189 (defun shr-rescale-image (data)
190 (if (or (not (fboundp 'imagemagick-types))
191 (not (get-buffer-window (current-buffer))))
192 (create-image data nil t)
193 (let* ((image (create-image data nil t))
194 (size (image-size image t))
197 (edges (window-inside-pixel-edges
198 (get-buffer-window (current-buffer))))
199 (window-width (truncate (* shr-max-image-proportion
200 (- (nth 2 edges) (nth 0 edges)))))
201 (window-height (truncate (* shr-max-image-proportion
202 (- (nth 3 edges) (nth 1 edges)))))
204 (when (> height window-height)
205 (setq image (or (create-image data 'imagemagick t
206 :height window-height)
208 (setq size (image-size image t)))
209 (when (> (car size) window-width)
211 (create-image data 'imagemagick t
216 (defun shr-tag-pre (cont)
217 (let ((shr-folding-mode nil))
220 (shr-ensure-newline)))
222 (defun shr-tag-blockquote (cont)
223 (let ((shr-indentation (+ shr-indentation 4)))
226 (defun shr-ensure-newline ()
227 (unless (zerop (current-column))
230 (defun shr-insert (text)
231 (when (eq shr-state 'image)
233 (setq shr-state nil))
235 ((eq shr-folding-mode 'none)
240 (when (and (string-match "^[ \t\n]" text)
243 (dolist (elem (split-string text))
244 (setq column (current-column))
247 ((> (+ column (length elem) 1) shr-width)
253 (> shr-indentation 0))
254 (insert (make-string shr-indentation ? )))
255 ;; The shr-start is a special variable that is used to pass
256 ;; upwards the first point in the buffer where the text really
259 (setq shr-start (point)))
261 (when (and (string-match "[ \t\n]$" text)
265 (defun shr-get-image-data (url)
266 "Get image data for URL.
267 Return a string with image data."
269 (mm-disable-multibyte)
270 (url-cache-extract (url-cache-create-filename url))
271 (when (or (search-forward "\n\n" nil t)
272 (search-forward "\r\n\r\n" nil t))
273 (buffer-substring (point) (point-max)))))
(defvar shr-list-mode nil
  "Kind of list currently being rendered.
`shr-tag-ul' binds it to the symbol `ul' and `shr-tag-ol' binds it
to 1.  When the value is a number, `shr-tag-li' inserts it as the
item label and then increments it.")
277 (defun shr-tag-ul (cont)
278 (shr-ensure-paragraph)
279 (let ((shr-list-mode 'ul))
282 (defun shr-tag-ol (cont)
283 (let ((shr-list-mode 1))
286 (defun shr-tag-li (cont)
288 (if (numberp shr-list-mode)
290 (insert (format "%d " shr-list-mode))
291 (setq shr-list-mode (1+ shr-list-mode)))
295 (defun shr-tag-br (cont)
(defun shr-tag-h1 (cont)
  "Render CONT, the content of an <h1> element, as a heading.
The heading uses the `bold' and `underline' faces."
  (shr-heading cont (quote bold) (quote underline)))
(defun shr-tag-h2 (cont)
  "Render CONT, the content of an <h2> element, as a heading.
The heading uses the `bold' face."
  (shr-heading cont (quote bold)))
(defun shr-tag-h3 (cont)
  "Render CONT, the content of an <h3> element, as a heading.
The heading uses the `italic' face."
  (shr-heading cont (quote italic)))
308 (defun shr-tag-h4 (cont)
311 (defun shr-tag-h5 (cont)
314 (defun shr-tag-h6 (cont)
(defun shr-heading (cont &rest types)
  "Render CONT as a heading in a paragraph of its own.
TYPES are the faces handed on to `shr-fontize-cont' together with
CONT.  `shr-ensure-paragraph' is called both before and after the
content is rendered."
  ;; Paragraph break in front of the heading.
  (shr-ensure-paragraph)
  ;; The heading text itself, with every face in TYPES applied.
  (apply (function shr-fontize-cont) cont types)
  ;; Paragraph break after the heading.
  (shr-ensure-paragraph))