-
-
Notifications
You must be signed in to change notification settings - Fork 244
/
org-ref-refproc.el
481 lines (414 loc) · 17.4 KB
/
org-ref-refproc.el
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
;;; org-ref-refproc.el --- refproc - for exporting ref links in non-LaTeX backends -*- lexical-binding: t; -*-
;; For autoref and cref* links, a clever prefix is added at export.
;; Prefixes are found in `org-ref-refproc-clever-prefixes'
;; Use a keyword like this to set the style of clever prefixes. You can use a full or abbreviated prefix
;;
;; #+refproc: :abbreviate t :capitalize t
;;; Commentary:
;;
;;; Code:
(require 'org-ref-ref-links)
(defcustom org-ref-refproc-clever-prefixes
'((section :full "section" :abbrv "sec." :org-element headline)
(figure :full "figure" :abbrv "fig." :org-element link)
(table :full "table" :abbrv "tab." :org-element table)
(equation :full "equation" :abbrv "eq." :org-element latex-environment)
(proof :full "proof" :abbrv "pf." :org-element latex-environment)
(listing :full "listing" :abbrv "lst." :org-element src-block)
(lemma :full "lemma" :abbrv "lem." :org-element special-block)
(theorem :full "theorem" :abbrv "thm." :org-element special-block)
(corollary :full "corollary" :abbrv "cor." :org-element special-block))
"Prefixes for cleveref links.
plist with :full and :abbrv forms for each type.
:org-element is the element these are defined in."
:type 'sexp
:group 'org-ref)
;; * refproc
;;
(defun org-ref-refproc-get-options ()
"Return a plist of options from a #+refproc keyword.
Supported options are:
:abbreviate (nil or non-nil)
:capitalize (nil or non-nil)
These options only affect the cref* links."
(read (format "(%s)" (cadr (assoc "REFPROC"
(org-collect-keywords
'("REFPROC")))))))
(defun org-ref-get-ref-links ()
"Return a list of ref links in the buffer."
(org-element-map (org-element-parse-buffer) 'link
(lambda (lnk)
(when (assoc (org-element-property :type lnk) org-ref-ref-types)
lnk))))
(defun org-ref-refproc-referenceables ()
"Return a list of referenceable items, grouped by type.
This will be a list of (type label1 label2 ...).
Not all styles of target are currently supported. This supports
named tables, figures and src-blocks, headlines with a custom_id,
and latex_environments with a latex label or name (these are all
considered equations, which might be wrong for other
environments)."
(let* ((parse-data (org-element-parse-buffer))
type el
;; for each type, we specify what org-element to get the labels from.
(referencables (cl-loop for entry in org-ref-refproc-clever-prefixes
do
(setq type (car entry)
el (plist-get (cdr entry) :org-element))
collect
(cons type
(org-element-map parse-data el
(lambda (e)
(pcase el
;; Headlines
('headline
(cond
;; There is a custom_id, we use it.
((org-element-property :CUSTOM_ID e)
(org-element-property :CUSTOM_ID e))
;; See if there is a target in the heading
((string-match org-target-regexp
(org-element-property :raw-value e))
(match-string 1 (org-element-property :raw-value e)))
;; Check for a label link
((string-match (concat "label:" org-ref-label-re)
(org-element-property :raw-value e))
(match-string 1 (org-element-property :raw-value e)))))
;; Figures
('link
(cond
;; file link with a name property
((and (org-file-image-p (org-element-property :path e))
(org-element-property
:name (org-element-property :parent e)))
(org-element-property
:name (org-element-property :parent e)))
;; a label link in the caption
((and (org-file-image-p (org-element-property :path e))
(org-element-property
:caption (org-element-property :parent e))
(string-match (concat "label:" org-ref-label-re)
(org-element-interpret-data
(org-element-property
:caption
(org-element-property :parent e)))))
(match-string 1 (org-element-interpret-data
(org-element-property
:caption
(org-element-property :parent e)))))))
;; Tables
('table
(cond
;; A name keyword is preferred
((org-element-property :name e)
(org-element-property :name e))
;; a label link in a caption also works
((string-match (concat "label:" org-ref-label-re)
(or (org-element-interpret-data
(org-element-property :caption e))
""))
(match-string 1 (org-element-interpret-data
(org-element-property :caption e))))))
;; equations, proofs, and other latex environments
('latex-environment
(when (or (and (eq type 'equation)
(string-match "\\\\begin{equation}"
(org-element-property :value e)))
(and (eq type 'equation)
(string-match "\\\\begin{align}"
(org-element-property :value e)))
(and (eq type 'proof) (string-match "\\\\begin{proof}"
(org-element-property :value e))))
(cond
;; Name keyword
((org-element-property :name e)
(org-element-property :name e))
;; latex label in the value
((string-match "\\\\label{\\(.*\\)}" (org-element-property :value e))
(save-match-data
(let ((pos 1)
matches)
(while (string-match "\\\\label{\\(.*\\)}" (org-element-property :value e) pos)
(push (match-string 1 (org-element-property :value e)) matches)
(setq pos (match-end 0)))
matches))))))
;; special blocks
('special-block
(cond
((and (eq type 'lemma)
(org-element-property :name e)
(string= "lemma" (org-element-property :type e)))
(org-element-property :name e))
((and (eq type 'corollary)
(org-element-property :name e)
(string= "corollary" (org-element-property :type e)))
(org-element-property :name e))
((and (eq type 'theorem)
(org-element-property :name e)
(string= "theorem" (org-element-property :type e)))
(org-element-property :name e))))
;; Listings of code blocks
('src-block
(when-let (name (org-element-property :name e))
name)))))))))
;; the align equation environment needs to be flattened
(cl-loop for type in referencables
collect (cons (car type) (-flatten (cdr type))))))
(defun org-ref-refproc-get-type (label referenceables)
"Get the type of reference LABEL refers to.
REFERENCEABLES comes from `org-ref-refproc-referenceables'.
Returns a plist (:type type :label label :index index)"
(cl-loop for type in referenceables
if (member label type)
return (list :type (car type) :label label :index (seq-position (cdr type) label 'equal))))
(defun org-ref-refproc-group-sort-labels (lbls referenceables)
"Group and sort the labels in LBLS.
REFERENCEABLES comes from `org-ref-refproc-referenceables'.
Returns a list of (list (type l1 i1) (type l2, i2)...) where l1
is label1, i1 is index1, etc.
This data structure has all the references from a single link
grouped by type. For some links there will only be one type, and
one label, because that is all that is allowed, e.g. for ref,
eqref, pageref, nameref and autoref.
For the cref* links though you can have many labels, even to
different kinds of things, and these are why we do the fancy
grouping and sorting here."
(cl-loop for entry in
(seq-group-by (lambda (el)
(plist-get el :type))
(cl-loop for label in lbls collect
(org-ref-refproc-get-type label referenceables)))
collect
(sort (cdr entry) (lambda (a b)
(< (plist-get a :index) (plist-get b :index))))))
;; * Refproc - a reference processor for org-mode
;;
;; The strategy is to compute string replacements that are just org-syntax, then
;; replace each link with the replacement.
(defun org-ref-refproc-replacement (ref-link referenceables backend)
"Compute a replacement for REF-LINK (an org-element).
REFERENCEABLES comes from `org-ref-refproc-referenceables'.
BACKEND is the export backend."
(let* ((ref-type (org-element-property :type ref-link))
(labels (split-string (org-element-property :path ref-link) ","))
(post-blanks (org-element-property :post-blank ref-link))
(data (cl-loop for label in labels collect (org-ref-refproc-get-type label referenceables))))
(pcase ref-type
;; These types only allow one label in the reference
("ref"
(when (> (length data) 1)
(error "A ref link can only have one label in it"))
(setq data (cl-first data))
(format "[[%s%s]]%s"
(if (eq 'section (plist-get data :type))
"#"
"")
(plist-get data :label)
;; add back post blank spaces.
(make-string post-blanks ? )))
("eqref"
(when (> (length data) 1)
(error "An eqref link can only have one label in it"))
(setq data (cl-first data))
(format (if (eq backend 'html)
"[[%s]]%s"
"([[%s]])%s")
(plist-get data :label)
;; add back post blank spaces.
(make-string post-blanks ? )))
;; This one doesn't make much sense in unpaginated exports, and I don't
;; have a way to get a page number anyway, so we make this a regular ref.
("pageref"
(when (> (length data) 1)
(error "A pageref link can only have one label in it"))
(setq data (cl-first data))
(format "[[%s%s]]%s"
(if (eq 'section (plist-get data :type))
"#"
"")
(plist-get data :label)
;; add back post blank spaces.
(make-string post-blanks ? )))
;; this will use the heading name, or caption of the ref
("nameref"
(when (> (length data) 1)
(error "A nameref link can only have one label in it"))
(setq data (cl-first data))
;; Basically I follow the link, and depending on the ref type get a
;; "name" for it. Right now there is no error if there is not a heading
;; or caption, you would just get an empty string.
(save-excursion
(goto-char (org-element-property :begin ref-link))
(search-forward ":")
(org-ref-ref-jump-to (org-element-property :path ref-link))
(pcase (plist-get data :type)
('section
(org-previous-visible-heading 1)
(format "[[#%s][%s]]%s"
(plist-get data :label)
(cl-fifth (org-heading-components))
(make-string post-blanks ? )))
('table
(format "[[%s][%s]]%s"
(plist-get data :label)
(org-element-interpret-data (org-element-property :caption (org-element-context)))
(make-string post-blanks ? )))
('figure
(format "[[%s][%s]]%s"
(plist-get data :label)
(org-element-interpret-data (org-element-property :caption (org-element-context)))
(make-string post-blanks ? )))
('listing
(format "[[%s][%s]]%s"
(plist-get data :label)
(org-element-interpret-data (org-element-property :caption (org-element-context)))
(make-string post-blanks ? )))
;; does equation even make sense? is there ever a caption?
(_
(error "The nameref link is not implemented for %S" data)))))
;; autoref is the first place we have to be clever.
("autoref"
(when (> (length data) 1)
(error "A pageref link can only have one label in it"))
(setq data (cl-first data))
(let* ((prefix-data (cdr (assoc (plist-get data :type) org-ref-refproc-clever-prefixes)))
(options (org-ref-refproc-get-options))
(prefix (plist-get prefix-data (if (plist-get options :abbreviate)
:abbrv
:full))))
(when (plist-get options :capitalize) (setq prefix (capitalize prefix)))
(format "%s [[%s%s]]%s"
prefix
(if (eq 'section (plist-get data :type))
"#"
"")
(plist-get data :label)
(make-string post-blanks ? ))))
;; Now we get to the cref* links. These are complicated, so I will pass
;; this out to dedicated functions. At this point, I have the ref-link,
("cref"
(org-ref-refproc-cref-replacement ref-link referenceables nil))
("Cref"
(org-ref-refproc-cref-replacement ref-link referenceables t))
(_
(error "%s links are not supported yet" ref-type)))))
(defun org-ref-refproc-cref-replacement (ref-link referenceables capitalize)
"Calculate a replacement for a REF-LINK.
REFERENCEABLES comes from `org-ref-refproc-referenceables'.
If CAPITALIZE is non-nil, capitalize the first entry (this is for
Cref) and is different than the capitalize option in #+refproc:
which capitalizes each prefix."
(let* ((options (org-ref-refproc-get-options))
(labels (split-string (org-element-property :path ref-link) ","))
(post-blanks (org-element-property :post-blank ref-link))
(data (cl-loop for label in labels collect (org-ref-refproc-get-type label referenceables)))
(groups (seq-group-by (lambda (entry)
(plist-get entry :type))
data))
;; this will be a list of sorted entries.
(sorted-groups (cl-loop for group in groups collect
(sort (cdr group) (lambda (a b)
(< (plist-get a :index) (plist-get b :index))))))
;; temp vars
prefix
prefix-data
;; Now we have to be clever on each sorted group. One day I should add compression to the groups, e.g. 1,2,3 - > 1 to 3
;; For each group we need a prefix, and it may have to be a plural prefix.
;; If there are two members of a group, they are joined by and
;; if there are more than two members of a group, they are separated by commas with and at the end.
(replacements (cl-loop for collection in sorted-groups collect
(pcase (length collection)
;; One thing in the list
(1
(setq collection (cl-first collection)
prefix-data (cdr (assoc (plist-get collection :type) org-ref-refproc-clever-prefixes))
prefix (plist-get prefix-data (if (plist-get options :abbreviate)
:abbrv
:full)))
(when (plist-get options :capitalize)
(setq prefix (capitalize prefix)))
(format "%s %s"
;; prefix
prefix
(concat
(cond
((eq 'section (plist-get collection :type))
(format "[[#%s]]" (plist-get collection :label)))
((eq 'equation (plist-get collection :type))
(format "\\ref{%s}" (plist-get collection :label)))
(t
(format "[[%s]]" (plist-get collection :label)))))))
(2
;; the prefix can be found from the first label, but we have to make it plural.
(setq prefix-data (cdr (assoc (plist-get (cl-first collection) :type)
org-ref-refproc-clever-prefixes))
prefix (plist-get prefix-data (if (plist-get options :abbreviate)
:abbrv
:full)))
(when (plist-get options :capitalize)
(setq prefix (capitalize prefix)))
;; Make it plural (substring "fig." -1)
(setq prefix (if (string= "." (substring prefix -1))
(concat (substring prefix 0 -1) "s.")
(concat prefix "s")))
(format "%s [[%s]] and [[%s]]"
prefix
(concat
(if (eq 'section (plist-get (cl-first collection) :type)) "#" "")
(plist-get (cl-first collection) :label))
(concat
(if (eq 'section (plist-get (cl-second collection) :type)) "#" "")
(plist-get (cl-second collection) :label))))
(_
;; the prefix can be found from the first label, but we have to make it plural.
(setq prefix-data (cdr (assoc (plist-get (cl-first collection) :type)
org-ref-refproc-clever-prefixes))
prefix (plist-get prefix-data (if (plist-get options :abbreviate)
:abbrv
:full)))
(when (plist-get options :capitalize)
(setq prefix (capitalize prefix)))
;; Make it plural. If the prefix ends in .
;; (i.e. it is abbreviated) we remove it and
;; add s.
(setq prefix (if (string= "." (substring prefix -1))
(concat (substring prefix 0 -1) "s.")
(concat prefix "s")))
;; now get
(format "%s %s and [[%s]]"
prefix
(string-join
(cl-loop for entry in (butlast collection) collect
(format "[[%s]]"
(concat
(if (eq 'section (plist-get entry :type)) "#" "")
(plist-get entry :label))))
", ")
;; the last one
(concat
(if (eq 'section (plist-get (car (last collection)) :type)) "#" "")
(plist-get (car (last collection)) :label))))))))
(when capitalize (setf (car replacements) (concat (capitalize (substring (car replacements) 0 1)) (substring (car replacements) 1))))
;; Finally, join them together with commas, and add post-blank spaces.
(concat
(pcase (length replacements)
(1
(cl-first replacements))
(2
(concat (cl-first replacements) " and " (cl-second replacements)))
(_
(concat (string-join (butlast replacements) ", ") " and " (car (last replacements)))))
(make-string post-blanks ? ))))
(defun org-ref-refproc (&optional backend)
"Process the buffer replacing all ref links with org syntax.
BACKEND is the
Meant to be used in an `org-export-before-parsing-hook' on a copy
of the buffer."
(let ((ref-links (org-ref-get-ref-links))
(referenceables (org-ref-refproc-referenceables)))
(cl-loop for ref in (reverse ref-links) do
(cl--set-buffer-substring (org-element-property :begin ref)
(org-element-property :end ref)
(org-ref-refproc-replacement ref referenceables backend)))))
(provide 'org-ref-refproc)
;;; org-ref-refproc.el ends here