-
Notifications
You must be signed in to change notification settings - Fork 9
/
Copy pathciteproc.el
323 lines (298 loc) · 13.8 KB
/
citeproc.el
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
;;; citeproc.el --- A CSL 1.0.2 Citation Processor -*- lexical-binding: t; -*-
;; Copyright (C) 2017-2024 András Simonyi
;; Author: András Simonyi <andras.simonyi@gmail.com>
;; Maintainer: András Simonyi <andras.simonyi@gmail.com>
;; URL: https://github.com/andras-simonyi/citeproc-el
;; Keywords: bib
;; Package-Requires: ((emacs "26") (dash "2.13.0") (s "1.12.0") (f "0.18.0") (queue "0.2") (string-inflection "1.0") (org "9") (parsebib "2.4")(compat "28.1"))
;; Version: 0.9.3
;; This program is free software; you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation, either version 3 of the License, or
;; (at your option) any later version.
;; This program is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.
;; You should have received a copy of the GNU General Public License
;; along with this program. If not, see <http://www.gnu.org/licenses/>.
;; This file is not part of GNU Emacs.
;;; Commentary:
;; citeproc-el is a library for rendering citations and bibliographies in styles
;; described in the Citation Style Language (CSL).
;;; Code:
(require 'dash)
(require 'queue)
(require 'citeproc-rt)
(require 'citeproc-locale)
(require 'citeproc-style)
(require 'citeproc-choose)
(require 'citeproc-generic-elements)
(require 'citeproc-context)
(require 'citeproc-itemdata)
(require 'citeproc-proc)
(require 'citeproc-cite)
(require 'citeproc-sort)
(require 'citeproc-formatters)
(require 'citeproc-itemgetters)
(require 'citeproc-subbibs)
;;; Public API
(defun citeproc-create (style it-getter loc-getter &optional loc force-loc)
"Return a CSL processor for a given STYLE, IT-GETTER and LOC-GETTER.
STYLE is either a path to a CSL style file or a CSL style as a
string.
IT-GETTER is an item-getter function that takes a list of itemid
strings as its sole argument and returns an alist in which the
given itemids are the keys and the values are the parsed csl
json descriptions of the corresponding bibliography items (keys
are symbols, arrays and hashes should be represented as lists
and alists, respecively).
LOC-GETTER is a function that takes a locale string (e.g.
\"en-GB\") as an argument and returns a corresponding parsed
CSL locale (as parsed by Emacs's `libxml-parse-xml-region').
Optional LOC is the locale to use if the style doesn't specify a
default one. Defaults to \"en-US\".
If optional FORCE-LOC is non-nil then use locale LOC even if
STYLE specifies a different one as default. Defaults to nil."
(let ((style (citeproc-create-style style loc-getter loc force-loc))
(names (make-hash-table :test 'equal))
(itemdata (make-hash-table :test 'equal))
(citations (make-queue)))
(citeproc-proc--create :style style :getter it-getter :names names
:itemdata itemdata :citations citations :finalized t)))
(defun citeproc-append-citations (citations proc)
"Append CITATIONS to the list of citations in PROC.
CITATIONS is a list of `citeproc-citation' structures."
(let ((itemdata (citeproc-proc-itemdata proc))
ids)
;; Collect new itemids
(dolist (citation citations)
(dolist (cite (citeproc-citation-cites citation))
(push (alist-get 'id cite) ids)))
(let* ((uniq-ids (delete-dups (nreverse ids))) ; reverse pushed ids
(new-ids (--remove (gethash it itemdata) uniq-ids)))
;; Add all new items in one pass
(citeproc-proc-put-items-by-id proc new-ids)
;; Internalize the cites dealing with locator-extra if present, add itemdata to
;; the cite structs and add them to the cite queue.
(dolist (citation citations)
(setf (citeproc-citation-cites citation)
(--map (cons (cons 'itd (gethash (alist-get 'id it) itemdata))
(citeproc-cite--internalize-locator it))
(citeproc-citation-cites citation)))
(queue-append (citeproc-proc-citations proc) citation))
(setf (citeproc-proc-finalized proc) nil))))
(defun citeproc-add-uncited (itemids proc)
"Add uncited bib items with ITEMIDS to PROC.
As an extension, an itemid can be the string \"*\" which has the
effect of adding all items available in the itemgetter."
;; We simply store the added ids here, real processing is performed when the
;; processor is finalized.
(push itemids (citeproc-proc-uncited proc))
(setf (citeproc-proc-finalized proc) nil))
(defun citeproc-add-subbib-filters (filters proc)
"Add sub-bibliography FILTERS to PROC.
FILTERS should be a list of alists containing symbol keys and
string values, each pair describing an atomic condition to be
satisified by the printed entries. The following keys are
supported:
- `type': print only entries of the given type. Type is the
bib(la)tex entry type if available, otherwise the CSL type is
used as fallback;
- `nottype': print only entries not of the given type. Type is
the bib(la)tex entry type if available, otherwise the CSL type
is used as fallback;
- `csltype', `notcsltype': same as `type' and `nottype' but uses
the entries' CSL type even if the bib(la)tex type is also
available;
- `keyword': print only entries with the given keyword;
- `notkeyword': print only entries without the given keyword;
- `filter': print only entries for which the function named by
the key returns a non-nil value."
(setf (citeproc-proc-bib-filters proc) filters
(citeproc-proc-finalized proc) nil))
(defun citeproc-render-citations (proc format &optional internal-links)
"Render all citations in PROC in the given FORMAT.
Return a list of formatted citations.
If the optional INTERNAL-LINKS is `bib-links' then link cites
to the bibliography regardless of the style type, if `no-links'
then don't add internal links, if nil or `auto' then add internal
links based on the style type (cite-cite links for note styles
and cite-bib links else). For legacy reasons, any other value is
treated as `no-links'."
(citeproc-proc-finalize proc)
(--map (citeproc-citation--render-formatted-citation it proc format internal-links)
(queue-head (citeproc-proc-citations proc))))
(defun citeproc-render-bib (proc format &optional internal-links
no-external-links bib-formatter-fun)
"Render a bibliography of items in PROC in FORMAT.
For the optional INTERNAL-LINKS argument see
`citeproc-render-citations'. If the optional NO-EXTERNAL-LINKS is
non-nil then don't generate external links. If the optional
BIB-FORMATTER-FUN is given then it will be used to join the
bibliography items instead of the content of the chosen
formatter's `bib' slot (see `citeproc-formatter' for details).
Returns an error message string if the style of PROC doesn't
contain a bibliography section. Otherwise it returns
a (FORMATTED-BIBLIOGRAPHY . FORMATTING-PARAMETERS) cons cell,
where FORMATTED-BIBLIOGRAPHY is either a single bibliography or a
list of sub-bibliograhies if filters were added to the processor,
and FORMATTING-PARAMETERS is an alist containing the following
formatting parameters keyed to the parameter names as symbols:
- `max-offset' (integer): The width of the widest first field in
the bibliography, measured in characters.
- `line-spacing' (integer): Vertical line distance specified as a
multiple of standard line height.
- `entry-spacing' (integer): Vertical distance between
bibliographic entries, specified as a multiple of standard line
height.
- `second-field-align' (`flush'or `margin'): The position of
second-field alignment.
- `hanging-indent' (boolean): Whether the bibliography items should
be rendered with hanging-indents."
(if (null (citeproc-style-bib-layout (citeproc-proc-style proc)))
"[NO BIBLIOGRAPHY LAYOUT IN CSL STYLE]"
(citeproc-proc-finalize proc)
(let* ((formatter (citeproc-formatter-for-format format))
(rt-formatter (citeproc-formatter-rt formatter))
(bib-formatter (or bib-formatter-fun
(citeproc-formatter-bib formatter)))
(bibitem-formatter (citeproc-formatter-bib-item formatter))
(formatter-no-external-links (citeproc-formatter-no-external-links
formatter))
(style (citeproc-proc-style proc))
(bib-opts (citeproc-style-bib-opts style))
(punct-in-quote (string= (alist-get 'punctuation-in-quote
(citeproc-style-locale-opts style))
"true"))
(itemdata (citeproc-proc-itemdata proc))
(filters (citeproc-proc-bib-filters proc)))
;; Render raw bibitems for each itemdata struct and store them in the
;; `rawbibitem' slot.
(maphash (lambda (_ itd)
(setf (citeproc-itemdata-rawbibitem itd)
(citeproc-rt-finalize
(citeproc-render-varlist-in-rt
(citeproc-itemdata-varvals itd)
style 'bib 'display internal-links
(or formatter-no-external-links no-external-links))
punct-in-quote)))
itemdata)
(let* ((raw-bib
(if (citeproc-proc-filtered-bib-p proc)
;; There are filters, we need to select and sort the subbibs.
(let* ((nr-of-filters (length filters))
(result (make-list nr-of-filters nil))
;; We store boolean to-be-sorted flags for each sub-bib
(to-be-sorted (make-bool-vector nr-of-filters nil))
(bib-sort (citeproc-style-bib-sort (citeproc-proc-style proc))))
;; Put the itds into subbib lists.
(maphash
(lambda (_ itd)
(let ((subbib-nos (citeproc-itemdata-subbib-nos itd)))
;; Set to-be-sorted for later subbibs if itemdata
;; occcurs in more than one.
(when-let ((later-subbib-nos (cdr subbib-nos)))
(dolist (subbib-no later-subbib-nos)
(setf (elt to-be-sorted subbib-no) t)))
;; Push the item in all corresponding subbibs.
(dolist (subbib-no subbib-nos)
(push itd (elt result subbib-no)))))
itemdata)
;; Sort the itds in each individual list
(setq result
(--map-indexed
(if (and bib-sort (elt to-be-sorted it-index))
;; Subbib contains earlier item, needs to sorted.
(citeproc-sort-itds it (citeproc-style-bib-sort-orders
(citeproc-proc-style proc)))
;; No earlier item, sorting on citation-number.
(citeproc-sort-itds-on-citnum it))
result))
;; Generate the raw bibs.
(--map (mapcar #'citeproc-itemdata-rawbibitem it) result))
;; No filters, so raw-bib is a list containing a single raw bibliograhy.
(list (mapcar #'citeproc-itemdata-rawbibitem
(citeproc-sort-itds-on-citnum (hash-table-values itemdata))))))
;; Perform author-substitution.
(substituted
(-if-let (subs-auth-subst
(alist-get 'subsequent-author-substitute bib-opts))
(--map (citeproc-rt-subsequent-author-substitute it subs-auth-subst)
raw-bib)
raw-bib))
;; Calculate formatting params.
;; NOTE: This is the only place where we check whether there are
;; bibliography items in the processor, even though the empty case
;; could be handled way more efficiently.
(max-offset (if (and (alist-get 'second-field-align bib-opts)
(not (hash-table-empty-p itemdata)))
(citeproc-proc-max-offset itemdata)
0))
(format-params (cons (cons 'max-offset max-offset)
(citeproc-style-bib-opts-to-formatting-params bib-opts)))
(formatted-bib
(--map (funcall bib-formatter
(mapcar
(lambda (x)
(funcall
bibitem-formatter
(funcall
rt-formatter (citeproc-rt-cull-spaces-puncts x))
format-params))
it)
format-params)
substituted)))
;; Generate final return value.
(cons (if filters formatted-bib (car formatted-bib))
format-params)))))
(defun citeproc-clear (proc)
"Remove all bibliographic and citation data from PROC."
(clrhash (citeproc-proc-itemdata proc))
(clrhash (citeproc-proc-names proc))
(queue-clear (citeproc-proc-citations proc))
(setf (citeproc-proc-finalized proc) t))
;; For one-off renderings
(defun citeproc-create-style (style locale-getter &optional locale force-locale)
"Compile style in STYLE into a citeproc-style struct.
STYLE is either a path to a CSL style file, or a style as a
string. LOCALE-GETTER is a getter function for locales, the
optional LOCALE is a locale to prefer. If FORCE-LOCALE is non-nil
then use LOCALE even if the style's default locale is different."
(-let* (((year-suffix . parsed-style) (citeproc-style-parse style))
(default-locale (alist-get 'default-locale (cadr parsed-style)))
(preferred-locale (if force-locale locale (or default-locale
locale
"en-US")))
(act-parsed-locale (funcall locale-getter preferred-locale))
(act-locale (alist-get 'lang (cadr act-parsed-locale)))
(style (citeproc-create-style-from-locale
parsed-style
(not (not year-suffix)) act-locale)))
(citeproc-style--update-locale style act-parsed-locale)
(citeproc-style--set-opt-defaults style)
(setf (citeproc-style-locale style) (or locale act-locale))
style))
;; REVIEW: this should be rethought -- should we apply the specific wrappers as
;; well?
(defun citeproc-render-item (item-data style mode format
&optional no-external-links)
"Render a bibliography item described by ITEM-DATA with STYLE.
ITEM-DATA is the parsed form of a bibliography item description
in CSL-JSON format,
STYLE is a `citeproc-style' structure,
MODE is one of the symbols `bib' or `cite',
FORMAT is a symbol representing a supported output format.
If the optional NO-EXTERNAL-LINKS is non-nil then don't generate
external links in the item."
(let ((internal-varlist (--map-when (memq (car it) citeproc--date-vars)
(cons (car it)
(citeproc-date-parse (cdr it)))
item-data)))
(funcall (citeproc-formatter-rt (citeproc-formatter-for-format format))
(citeproc-rt-cull-spaces-puncts
(citeproc-rt-finalize
(citeproc-render-varlist-in-rt
internal-varlist style mode 'display 'no-links no-external-links))))))
(provide 'citeproc)
;;; citeproc.el ends here