1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
|
;;; jao-doc-view.el --- extensions for doc-view  -*- lexical-binding: t; -*-
;; Copyright (c) 2013, 2015, 2017, 2018, 2019, 2021, 2022 Jose Antonio Ortega Ruiz
;; This file is free software; you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation; either version 3 of the License, or
;; (at your option) any later version.
;; This file is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.
;; You should have received a copy of the GNU General Public License
;; along with this program. If not, see <http://www.gnu.org/licenses/>.
;; Author: Jose Antonio Ortega Ruiz <jao@gnu.org>
;; Start date: Fri Feb 15, 2013 01:21
(require 'doc-view)
(require 'jao-pdf)
;;; Utilities
(defmacro jao-doc-view--funcall (a b &rest args)
  "Expand to a call of A or B on ARGS, chosen by the current major mode.
A is called when the current mode derives from `pdf-view-mode', B
when it derives from `doc-view-mode'.  In any other mode the
expansion evaluates to nil and ARGS are not evaluated."
  (let ((pdf-call (cons a args))
        (doc-call (cons b args)))
    `(if (derived-mode-p 'pdf-view-mode)
         ,pdf-call
       (when (derived-mode-p 'doc-view-mode)
         ,doc-call))))
(defun jao-doc-view-current-page ()
  "Return the page currently shown in this document buffer.
Uses `pdf-view-current-page' in buffers derived from `pdf-view-mode'
and `doc-view-current-page' in buffers derived from `doc-view-mode';
returns nil in any other mode."
  ;; Same dispatch that `jao-doc-view--funcall' expands to, written out.
  (cond ((derived-mode-p 'pdf-view-mode) (pdf-view-current-page))
        ((derived-mode-p 'doc-view-mode) (doc-view-current-page))))
(defun jao-doc-view-goto-page (page &optional height)
  "Go to PAGE in the current document buffer, then scroll to HEIGHT.
PAGE is handed to `pdf-view-goto-page' or `doc-view-goto-page'
depending on the major mode; when PAGE is nil no page change is made.
HEIGHT, when non-nil, is only honoured in buffers derived from
`pdf-view-mode': it is multiplied by the cdr of `pdf-view-image-size',
divided by the frame's character height, rounded, and passed to
`image-set-window-vscroll'."
  (if page
      (jao-doc-view--funcall pdf-view-goto-page doc-view-goto-page page))
  (if (and height (derived-mode-p 'pdf-view-mode))
      ;; presumably HEIGHT is a fraction of the page and the cdr of the
      ;; image size is its height in pixels -- TODO confirm.
      ;; NOTE(review): if `image-set-window-vscroll' scrolls by pixels
      ;; in the running Emacs, dividing by the character height would
      ;; under-scroll; confirm against how pdf-tools computes this.
      (let* ((offset (* height (cdr (pdf-view-image-size))))
             (vscroll (round (/ offset (frame-char-height)))))
        (image-set-window-vscroll vscroll))))
;;; imenu
(defun jao-doc-view-enable-imenu (file-name goto-page)
  "Set up imenu in the current buffer for the document FILE-NAME.
`doc-view-imenu-setup' is run with `doc-view-imenu-enabled' bound to
t, and then `imenu-create-index-function' is set buffer-locally to a
function that calls `doc-view-imenu-index' with FILE-NAME and
GOTO-PAGE."
  ;; Force the setup regardless of the user's global imenu setting.
  (let ((doc-view-imenu-enabled t))
    (doc-view-imenu-setup))
  ;; Installed after the setup so that it is our index function that
  ;; remains in place.
  (setq-local imenu-create-index-function
              (lambda ()
                (doc-view-imenu-index file-name goto-page))))
;;; Page trailing
(defvar-local jao-doc-view--trail-back ()
  "Pages visited before the current one, most recent first.")

(defvar-local jao-doc-view--trail-fwd ()
  "Pages left behind by `jao-doc-view-back', most recent first.")

(defvar jao-doc-view--inhibit-trail nil
  "When non-nil, `jao-doc-view--trail-push' records nothing.
Bound to t by `jao-doc-view-back' and `jao-doc-view-forward' while
they jump, so that moving through the history does not itself add
new entries to it.")

(defun jao-doc-view--trail-push (_dest-page)
  "Record the current page in `jao-doc-view--trail-back'.
Meant to run as `:before' advice on `doc-view-goto-page'; the
destination page it receives is ignored.  Nothing is recorded when
`jao-doc-view--inhibit-trail' is non-nil, when there is no current
page, or when the current page is already on top of the trail."
  (unless jao-doc-view--inhibit-trail
    (when-let* ((page (jao-doc-view-current-page)))
      (unless (eq (car jao-doc-view--trail-back) page)
        (push page jao-doc-view--trail-back)))))

(defun jao-doc-view-back ()
  "Jump to the most recent page in the back trail.
The page being left is pushed onto the forward trail.  Shows a
message when the back trail is empty."
  (interactive nil doc-view-mode)
  (if-let* ((p (pop jao-doc-view--trail-back)))
      ;; Without the inhibit flag the advice on `doc-view-goto-page'
      ;; would push the page we are leaving back onto the back trail,
      ;; and the next call would just return to it.
      (let ((jao-doc-view--inhibit-trail t))
        (push (jao-doc-view-current-page) jao-doc-view--trail-fwd)
        (jao-doc-view-goto-page p))
    (message "No more back marks.")))

(defun jao-doc-view-forward ()
  "Jump to the most recent page in the forward trail.
The page being left is pushed onto the back trail.  Shows a message
when the forward trail is empty."
  (interactive nil doc-view-mode)
  (if-let* ((p (pop jao-doc-view--trail-fwd)))
      ;; The back trail is updated explicitly here, so keep the advice
      ;; from touching it during the jump.
      (let ((jao-doc-view--inhibit-trail t))
        (push (jao-doc-view-current-page) jao-doc-view--trail-back)
        (jao-doc-view-goto-page p))
    (message "No more forward marks.")))

(advice-add 'doc-view-goto-page :before #'jao-doc-view--trail-push)
;;; Extract text
(defun jao-doc-view-page-text (&optional re-render no-select)
  "Extract the text of the current page with mutool and visit it.
The text is written to pN.txt, N being the current page number,
inside the document's doc-view cache directory (or /tmp when there
is none), and an existing file is reused.  With RE-RENDER non-nil
\(interactively, a prefix argument) an existing text file is deleted
and extracted anew.  When NO-SELECT is non-nil, return the name of
the text file instead of visiting it; otherwise the file is visited
and `view-mode' is enabled.

Signal a `user-error' if text must be extracted and the buffer is
not visiting a file."
  (interactive "P")
  (let* ((pno (doc-view-current-page))
         (in buffer-file-name)
         (cdir (or (doc-view--current-cache-dir) "/tmp"))
         ;; `expand-file-name' copes with CDIR ending in a slash or not.
         (out (expand-file-name (format "p%s.txt" pno) cdir)))
    (when (and re-render (file-exists-p out))
      (delete-file out))
    (unless (file-exists-p out)
      (unless in
        (user-error "This buffer is not visiting a file"))
      ;; The command goes through a shell: quote both file names so
      ;; that spaces and shell metacharacters in them are taken
      ;; literally.
      (shell-command-to-string
       (format "mutool convert -o %s %s %s"
               (shell-quote-argument out)
               (shell-quote-argument (expand-file-name in))
               pno)))
    (if no-select
        out
      (find-file out)
      (view-mode))))
;; Pressing "t" in a doc-view buffer extracts the text of the current page.
(define-key doc-view-mode-map (kbd "t") #'jao-doc-view-page-text)
;;; Find URLs
(defun jao-doc-view--full-txt ()
  "Return the name of the doc.txt file in the current doc-view cache directory."
  (let ((cache-dir (doc-view--current-cache-dir)))
    (expand-file-name "doc.txt" cache-dir)))
(defun jao-doc-view--collect-urls (file)
  "Return the list of http and https URLs found in the text FILE.
URLs are listed in the order they first appear, without duplicates.
Return nil when FILE cannot be read or contains no URL.  FILE is
read into a temporary buffer, so no buffer visiting it is created."
  (when (file-readable-p file)
    (with-temp-buffer
      (insert-file-contents file)
      (goto-char (point-min))
      (let ((urls nil))
        (while (re-search-forward "https?://" nil t)
          ;; `thing-at-point' is autoloaded, so this works even when
          ;; thingatpt has not been loaded yet.  It can return nil for
          ;; text that merely looks like the start of a URL; skip those.
          (let ((url (thing-at-point 'url t)))
            (when url
              (push url urls))))
        (delete-dups (nreverse urls))))))
(defun jao-doc-view--page-urls (&optional all)
  "Return the URLs of the current page or, with ALL non-nil, the document.
Page URLs are collected from the file returned by
`jao-doc-view-page-text'.  Document URLs are collected from the file
named by `jao-doc-view--full-txt'; when that file does not exist
yet, its extraction is started with `doc-view-doc->txt' and the
symbol `wait' is returned instead of a list."
  (let ((full-text (jao-doc-view--full-txt)))
    (if (not all)
        (jao-doc-view--collect-urls (jao-doc-view-page-text nil t))
      (if (file-exists-p full-text)
          (jao-doc-view--collect-urls full-text)
        (message "Full text not extracted yet: doing so!")
        (doc-view-doc->txt full-text
                           (lambda () (message "Text extracted")))
        'wait))))
(defun jao-doc-view-visit-url (all)
  "Prompt for a URL found in the current page and browse it.
With ALL non-nil (interactively, a prefix argument), offer the URLs
of the whole document instead.  When there is a single candidate it
is pre-filled in the minibuffer.  Nothing is visited when no URL is
found, when the document text is still being extracted, or when the
prompt is answered with empty input."
  (interactive "P")
  (let ((urls (jao-doc-view--page-urls all)))
    (cond ((eq 'wait urls)
           (message "Extracting text, please wait and retry."))
          ((null urls)
           (message "No URLs in this %s" (if all "document" "page")))
          (t
           (let ((url (completing-read "URL: " urls nil nil
                                       (when (null (cdr urls)) (car urls)))))
             ;; `completing-read' returns "" rather than nil on empty
             ;; input, so test for that explicitly before browsing.
             (unless (string= url "")
               (browse-url url)))))))
;;; .
(provide 'jao-doc-view)
;;; jao-doc-view.el ends here
|