ol-w3m.el 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221
  1. ;;; ol-w3m.el --- Copy and Paste From W3M -*- lexical-binding: t; -*-
  2. ;; Copyright (C) 2008-2022 Free Software Foundation, Inc.
  3. ;; Author: Andy Stewart <lazycat dot manatee at gmail dot com>
  4. ;; Keywords: outlines, hypermedia, calendar, wp
  5. ;; Homepage: https://orgmode.org
  6. ;;
  7. ;; This file is part of GNU Emacs.
  8. ;; GNU Emacs is free software: you can redistribute it and/or modify
  9. ;; it under the terms of the GNU General Public License as published by
  10. ;; the Free Software Foundation, either version 3 of the License, or
  11. ;; (at your option) any later version.
  12. ;; GNU Emacs is distributed in the hope that it will be useful,
  13. ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. ;; GNU General Public License for more details.
  16. ;; You should have received a copy of the GNU General Public License
  17. ;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
  18. ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
  19. ;;
  20. ;;; Commentary:
  21. ;; This file implements copying HTML content from a w3m buffer and
  22. ;; transforming the text on the fly so that it can be pasted into an
  23. ;; Org buffer with hot links. It will also work for regions in gnus
  24. ;; buffers that have been washed with w3m.
  25. ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
  26. ;;
  27. ;;; Acknowledgments:
  28. ;; Richard Riley <rileyrgdev at googlemail dot com>
  29. ;;
  30. ;; The idea of transforming the HTML content with Org syntax is
  31. ;; proposed by Richard, I'm just coding it.
  32. ;;
  33. ;;; Code:
  34. (require 'ol)
  ;; Declared without a value: this file only reads these variables (see
  ;; `org-w3m-store-link'); they are expected to be defined elsewhere,
  ;; presumably by the w3m package.
  (defvar w3m-current-title)
  (defvar w3m-current-url)

  ;; Register the "w3m" link type, with `org-w3m-store-link' as the
  ;; function used to store links of that type.
  (org-link-set-parameters "w3m" :store (function org-w3m-store-link))
  (defun org-w3m-store-link ()
    "Store a link to the page shown in the current w3m buffer.
Return nil without storing anything unless the major mode of the
current buffer is `w3m-mode'.  The description of the stored link is
`w3m-current-title', falling back to `w3m-current-url'."
    (if (not (eq major-mode 'w3m-mode))
        nil
      (org-link-store-props
       :type "w3m"
       :link w3m-current-url
       :url (url-view-url t)
       :description (or w3m-current-title w3m-current-url))))
  (defun org-w3m-copy-for-org-mode ()
    "Copy current buffer content or active region with Org style links.
This will encode `link-title' and `link-location' with
`org-link-make-string', and insert the transformed text into the kill ring,
so that it can be yanked into an Org buffer with links working correctly.

Text carrying a `w3m-href-anchor' or `w3m-image' property is turned
into an Org link whose target is the value of that property; all
other text is copied verbatim.  A link that starts inside the copied
area is copied completely, even if it ends after the area.  When
there is nothing to copy, an empty string is put on the kill ring."
    (interactive)
    (let* ((regionp (org-region-active-p))
           (transform-start (if regionp (region-beginning) (point-min)))
           (transform-end (if regionp (region-end) (point-max)))
           ;; Pieces of the result, most recent first.
           parts
           link-location link-title link-start end-function
           temp-position out-bound)
      ;; Deactivate the mark if the region was active.
      (when regionp
        (deactivate-mark))
      (message "Transforming links...")
      (save-excursion
        (goto-char transform-start)
        (while (and (not out-bound)                 ; still inside area to copy
                    (not (org-w3m-no-next-link-p))) ; a link is still ahead
          ;; Remember where the plain text before the next link starts.
          (setq temp-position (point))
          ;; Move to the next link or image, unless point is already on
          ;; one.  The image check matters for an image that directly
          ;; follows a link or sits at the start of the area: jumping
          ;; ahead would copy it as plain text.
          (or (get-text-property (point) 'w3m-href-anchor)
              (get-text-property (point) 'w3m-image)
              (org-w3m-get-next-link-start))
          (cond
           ((<= (point) transform-end)  ; point is inside transform bound
            ;; Plain text between the previous link and this one.
            (when (> (point) temp-position)
              (push (buffer-substring temp-position (point)) parts))
            ;; Find out what is at point; this also fetches the link
            ;; location.  An anchor takes precedence over an image.
            (setq end-function
                  (cond
                   ((setq link-location
                          (get-text-property (point) 'w3m-href-anchor))
                    #'org-w3m-get-anchor-end)
                   ((setq link-location
                          (get-text-property (point) 'w3m-image))
                    #'org-w3m-get-image-end)))
            ;; `end-function' is nil when point is on neither a link nor
            ;; an image, i.e. the search ran into the end of the buffer.
            (when end-function
              (setq link-start (point))
              (funcall end-function)
              ;; Always make progress: if the end could not be found
              ;; because the property runs to the end of the accessible
              ;; buffer, the link ends there.  Without this the loop
              ;; would process the same link forever.
              (when (= (point) link-start)
                (goto-char (point-max)))
              (setq link-title (buffer-substring link-start (point)))
              (push (if (org-string-nw-p link-location)
                        (org-link-make-string link-location link-title)
                      link-title)
                    parts)))
           (t                           ; point is NOT inside transform bound
            (goto-char temp-position)   ; go back to before the jump
            (setq out-bound t))))       ; and leave the `while' loop
        ;; Add the rest until the end of the area to be copied.
        (when (< (point) transform-end)
          (push (buffer-substring (point) transform-end) parts))
        ;; Joining an empty list yields "", so `org-kill-new' always
        ;; receives a string, never nil.
        (org-kill-new (mapconcat #'identity (nreverse parts) ""))
        (message "Transforming links...done, use C-y to insert text into Org file")
        (message "Copy with link transformation complete."))))
  (defun org-w3m-get-anchor-start ()
    "Move cursor to the start of current anchor.  Return point.
The start is the closest position before point where the
`w3m-anchor-sequence' text property changes.  Point is left alone
when there is no such position."
    ;; NOTE: Nothing in this file calls this function.
    (let ((start (previous-single-property-change
                  (point) 'w3m-anchor-sequence)))
      (when start
        (goto-char start))
      (point)))
  (defun org-w3m-get-anchor-end ()
    "Move cursor to the end of current anchor.  Return point.
The end is the next position where the `w3m-anchor-sequence' text
property changes.  When point is on an anchor that extends to the
end of the accessible buffer, move to `point-max'.  When point is not
on an anchor and the property does not change after point, leave
point alone."
    (goto-char
     (or (next-single-property-change (point) 'w3m-anchor-sequence)
         ;; nil means the property stays the same up to the end of the
         ;; buffer; if point is on an anchor, that is where it ends.
         (and (get-text-property (point) 'w3m-anchor-sequence)
              (point-max))
         (point))))
  (defun org-w3m-get-image-end ()
    "Move cursor to the end of current image.  Return point.
The end is the next position where the `w3m-image' text property
changes.  When point is on an image that extends to the end of the
accessible buffer, move to `point-max'.  When point is not on an
image and the property does not change after point, leave point
alone."
    ;; NOTE: There is no matching `org-w3m-get-image-start' in this file.
    (goto-char
     (or (next-single-property-change (point) 'w3m-image)
         ;; nil means the property stays the same up to the end of the
         ;; buffer; if point is on an image, that is where it ends.
         (and (get-text-property (point) 'w3m-image)
              (point-max))
         (point))))
  (defun org-w3m-get-next-link-start ()
    "Move cursor to the start of next link or image.  Return point.
Links are looked up through changes of the `w3m-anchor-sequence'
property at positions carrying `w3m-href-anchor'; images through
changes of the `w3m-image' property.  The closer of the two wins.
Move to `point-max' when neither is found after point."
    (let* ((origin (point))
           ;; Return the first position after ORIGIN where CHANGE-PROP
           ;; changes and TEST-PROP is non-nil, or nil if there is none.
           (search
            (lambda (change-prop test-prop)
              (let ((pos origin)
                    found)
                (while (and (not found)
                            (setq pos (next-single-property-change
                                       pos change-prop)))
                  (when (get-text-property pos test-prop)
                    (setq found pos)))
                found)))
           (anchor-pos (funcall search 'w3m-anchor-sequence 'w3m-href-anchor))
           (image-pos (funcall search 'w3m-image 'w3m-image))
           (limit (point-max)))
      (goto-char (min (or anchor-pos limit)
                      (or image-pos limit)))))
  (defun org-w3m-get-prev-link-start ()
    "Move cursor to the start of previous link.  Return point.
Walk backwards over the positions where `w3m-anchor-sequence'
changes and stop at the first one carrying `w3m-href-anchor'.  Leave
point alone when no such position exists."
    ;; NOTE: Within this file, the only caller is `org-w3m-no-prev-link-p'.
    ;;
    ;; WARNING: Unlike `org-w3m-get-next-link-start', this function does
    ;; not look at the `w3m-image' property.
    (let ((pos (point))
          found)
      (while (and (not found)
                  (setq pos (previous-single-property-change
                             pos 'w3m-anchor-sequence)))
        (when (get-text-property pos 'w3m-href-anchor)
          ;; A valid link starts here: jump to it and stop searching.
          (goto-char pos)
          (setq found t))))
    (point))
  (defun org-w3m-no-next-link-p ()
    "Whether there is no next link after the cursor.
Return t if `org-w3m-get-next-link-start' would leave point where it
is; otherwise, return nil.  Point itself is not moved."
    (let ((origin (point)))
      (save-excursion
        (equal origin (org-w3m-get-next-link-start)))))
  (defun org-w3m-no-prev-link-p ()
    "Whether there is no previous link before the cursor.
Return t if `org-w3m-get-prev-link-start' would leave point where it
is; otherwise, return nil.  Point itself is not moved."
    ;; NOTE: Nothing in this file calls this function.
    (let ((origin (point)))
      (save-excursion
        (equal origin (org-w3m-get-prev-link-start)))))
  ;; Install keys into the w3m keymaps.
  (defvar w3m-mode-map)
  (defvar w3m-minor-mode-map)

  ;; Bind the copy command right away in every keymap that already
  ;; exists when this file is loaded.
  (dolist (map-symbol '(w3m-mode-map w3m-minor-mode-map))
    (when (and (boundp map-symbol)
               (keymapp (symbol-value map-symbol)))
      (dolist (key '("\C-c\C-x\M-w" "\C-c\C-x\C-w"))
        (define-key (symbol-value map-symbol) key
                    'org-w3m-copy-for-org-mode))))

  ;; Bind it again whenever one of the modes runs its hook, which also
  ;; covers keymaps that did not exist yet when this file was loaded.
  (add-hook
   'w3m-mode-hook
   (lambda ()
     (dolist (key '("\C-c\C-x\M-w" "\C-c\C-x\C-w"))
       (define-key w3m-mode-map key 'org-w3m-copy-for-org-mode))))
  (add-hook
   'w3m-minor-mode-hook
   (lambda ()
     (dolist (key '("\C-c\C-x\M-w" "\C-c\C-x\C-w"))
       (define-key w3m-minor-mode-map key 'org-w3m-copy-for-org-mode))))
  197. (provide 'ol-w3m)
  198. ;;; ol-w3m.el ends here