-
Notifications
You must be signed in to change notification settings - Fork 2
/
extmap.el
655 lines (577 loc) · 30.8 KB
/
extmap.el
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
;;; extmap.el --- Externally-stored constant mapping for Elisp -*- lexical-binding: t -*-
;; Copyright (C) 2018-2023 Paul Pogonyshev
;; Author: Paul Pogonyshev <pogonyshev@gmail.com>
;; Maintainer: Paul Pogonyshev <pogonyshev@gmail.com>
;; Version: 1.3.1snapshot
;; Keywords: lisp
;; Homepage: https://github.com/doublep/extmap
;; Package-Requires: ((emacs "24.4"))
;; This program is free software; you can redistribute it and/or
;; modify it under the terms of the GNU General Public License as
;; published by the Free Software Foundation, either version 3 of
;; the License, or (at your option) any later version.
;; This program is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.
;;
;; You should have received a copy of the GNU General Public License
;; along with this program. If not, see http://www.gnu.org/licenses.
;;; Commentary:
;; Mapping of symbols to constants that is stored externally as a
;; single binary file and loaded on-demand. Can be used for huge
;; databases to avoid loading everything to memory. This package
;; doesn't use any external programs, making it a suitable dependency
;; for smaller libraries.
;;
;; Typical usage of the library consists of two separate stages:
;;
;; 1) Package maintainer/developer creates a map file, which is
;; then distributed along with its `*.el' etc. files.
;;
;; 2) For end-user, Elisp code retrieves values from the
;; pre-created map file.
;;
;; Creating a map file doesn't require any external tools. See
;; function `extmap-from-alist' for details. If you use Emacs 25 or
;; later and your map is so huge that you don't want to load it fully
;; even when creating, see `extmap-from-iterator'.
;;
;; The main functions for using an existing map file are `extmap-init'
;; to open it and `extmap-get' to retrieve value associated with given
;; key. See function documentation for details. Other functions that
;; work with a prepared file:
;;
;; - extmap-contains-key
;; - extmap-value-loaded
;; - extmap-keys
;; - extmap-mapc
;; - extmap-mapcar
;; - extmap-statistics
;;; Code:
(require 'bindat)
(defconst extmap--header-bindat-spec '((magic u16)
(version u16)
(num-items u32)
(offset u32)))
;; TYPE can be:
;; 0 -- inlined string (short specification is used);
;; 1 -- inlined Lisp object (short specification is used);
;; 2 -- string;
;; 3 -- Lisp object;
;; 4 -- shared value (short specification is used).
(defconst extmap--item-short-bindat-spec '((type u8)
(length u24)))
(defconst extmap--item-bindat-spec '((type u8)
(length u24)
(offset u32)))
(defun extmap-init (filename &rest options)
"Load metadata of a previously created map from FILENAME.
Loaded metadata can be further passed to `extmap-get' and other
functions. It must be treated as an opaque object: you must not
alter it or make any assumptions about its contents.
OPTIONS can be a list of the following keyword arguments:
:weak-data
If non-nil, loaded values are stored in a weak hashmap and
can be garbage-collected by Emacs if no longer used. This
allows to potentially reduce memory usage at the cost of more
disk operations.
:auto-reload
If the backing file is changed, automatically reset the map.
By default, backing file is supposed to remain constant and
if it changes, that results in undefined map behavior.
Reloading doesn't affect any already retrieved values.
Backing file is considered changed only if its modification
time is different compared to the previous check, actual
contents is not checked.
Using this option slows a map down a little, since it has to
check file modification time often. It exists mainly for
developing, when you'd often re-generate disk files, though
nothing precludes using it in end-code either.
:preload-metadata
Immediately parse the header of the extmap file. Otherwise
this is done lazily, on first access. For consistency, it is
still an error if FILENAME points to an unreadable file.
The file must remain accessible in case `extmap-get' needs to
load a value later. There is no need to somehow close a map:
just stop using it."
(let ((extmap (list (cons filename (if (plist-get options :auto-reload) :auto-reload :not-initialized))
nil (when (plist-get options :weak-data) (make-hash-table :test #'eq :weakness 'value)))))
(if (plist-get options :preload-metadata)
(extmap--do-reload-if-needed extmap)
;; Still check that `filename' exists and is readable.
(unless (file-regular-p filename)
(signal 'file-error (list "Not a regular file" filename))))
extmap))
;; After a call to this, any value in `extmap' other than the filename
;; might change.
(defsubst extmap--reload-if-needed (extmap)
(let ((modtime (cdr (nth 0 extmap))))
(when modtime
(extmap--do-reload-if-needed extmap))))
(defun extmap--do-reload-if-needed (extmap)
(let* ((filename (car (nth 0 extmap)))
(modtime-then (cdr (nth 0 extmap)))
;; Fifth element of `file-attributes' result is the modification date.
;; `file-attribute-modification-time' doesn't exist in Emacs 25.
(modtime-now (nth 5 (file-attributes filename))))
(cond ((keywordp modtime-then)
;; Means the map has not been initialized yet.
(progn (extmap--do-initialize extmap)
(setf (cdr (nth 0 extmap)) (when (eq modtime-then :auto-reload) modtime-now))))
((not (equal modtime-now modtime-then))
(let ((reloaded-extmap (extmap-init filename :auto-reload t :weak-data (nth 2 extmap) :preload-metadata t)))
(setf (car extmap) (car reloaded-extmap))
(setf (cdr extmap) (cdr reloaded-extmap)))))))
(defun extmap--do-initialize (extmap)
(with-temp-buffer
(let* ((filename (car (nth 0 extmap)))
(header-length (bindat-length extmap--header-bindat-spec nil))
(item-short-header-length (bindat-length extmap--item-short-bindat-spec nil))
(item-header-length (bindat-length extmap--item-bindat-spec nil))
(read-as (insert-file-contents-literally filename nil 0 header-length))
(filename (car read-as))
(header (when (equal (cadr read-as) header-length) (bindat-unpack extmap--header-bindat-spec (encode-coding-string (buffer-string) 'no-conversion))))
items)
(erase-buffer)
(unless (= (bindat-get-field header 'magic) #x91f7)
(error "Wrong or corrupted extmap in file `%s'" filename))
(unless (<= (bindat-get-field header 'version) 1)
(error "Future version of extmap in file `%s', upgrade your `extmap' package" filename))
(setq items (make-hash-table :test #'eq :size (bindat-get-field header 'num-items)))
(insert-file-contents-literally filename nil (bindat-get-field header 'offset))
(dotimes (_ (bindat-get-field header 'num-items))
(let* ((key (intern (decode-coding-string (buffer-substring-no-properties (point) (1- (re-search-forward (rx 0)))) 'utf-8 t)))
(item-header (bindat-unpack extmap--item-short-bindat-spec (encode-coding-string (buffer-substring-no-properties (point) (+ (point) item-short-header-length)) 'no-conversion)))
(type (bindat-get-field item-header 'type))
(length (bindat-get-field item-header 'length)))
(if (or (= type 2) (= type 3))
;; Non-inlined item.
(let ((item-header (bindat-unpack extmap--item-bindat-spec (encode-coding-string (buffer-substring-no-properties (point) (+ (point) item-header-length)) 'no-conversion))))
(goto-char (+ (point) item-header-length))
(puthash key (cons nil (cons type (cons (bindat-get-field item-header 'offset) length))) items))
(let ((value (decode-coding-string (buffer-substring-no-properties (+ (point) item-short-header-length) (+ (point) item-short-header-length length)) 'utf-8 t)))
(goto-char (+ (point) item-short-header-length length))
(if (= type 4)
;; Shared-value item.
(puthash key (cons nil (cons type (intern value))) items)
;; Inlined item.
(if (= type 1)
(setq value (car (read-from-string value)))
(unless (= type 0)
(error "Corrupted extmap file")))
(puthash key (cons t value) items))))))
(setf (nth 1 extmap) items))))
(defun extmap-get (extmap key &optional no-error)
"Get value associated with KEY from the map.
EXTMAP must be a result of a previous call to `extmap-init'. KEY
should be a symbol present in the map. If it is not, function
signals an error, unless NO-ERROR is specified, in which case it
returns nil."
(extmap--reload-if-needed extmap)
(let* ((items (nth 1 extmap))
(weak-data (nth 2 extmap))
;; A key cannot be mapped to `items' table itself, we use
;; that as a marker for "no mapping" situation.
(value items))
(when weak-data
(setq value (gethash key weak-data items)))
(if (eq value items)
(progn (setq value (gethash key items))
(if value
(if (car value)
;; Already loaded.
(cdr value)
(let (new-value)
(if (= (cadr value) 4)
;; Value is shared with a different key.
(setq new-value (extmap-get extmap (cddr value)))
;; Load now.
(let ((coding-system-for-read 'utf-8)
(offset (cadr (cdr value))))
(with-temp-buffer
(insert-file-contents (car (nth 0 extmap)) nil offset (+ offset (cddr (cdr value))))
(setq new-value (if (= (cadr value) 2) (buffer-string) (read (current-buffer)))))))
(if weak-data
(puthash key new-value weak-data)
(prog1 (setcdr value new-value)
(setcar value t)))))
(unless no-error
(error "No value for key `%s'" key))))
value)))
(defun extmap-contains-key (extmap key)
"Determine if there is a mapping for given KEY in EXTMAP."
(extmap--reload-if-needed extmap)
(consp (gethash key (nth 1 extmap))))
(defun extmap-value-loaded (extmap key)
"Determine if value for given KEY is loaded in EXTMAP.
If there is no mapping for KEY, this function always returns
nil.
In case the map has been initialized with `:weak-data' option, it
may happen that this function returns t, but value for the KEY
has to be loaded again in the future."
(extmap--reload-if-needed extmap)
(let* ((items (nth 1 extmap))
(value (gethash key items)))
(or (car value)
(when value
(let ((synonym-of (when (= (cadr value) 4) (cddr value))))
(or (and synonym-of (car (gethash synonym-of items)))
(let ((weak-data (nth 2 extmap)))
(when weak-data
(or (not (eq (gethash key weak-data weak-data) weak-data))
(and synonym-of (not (eq (gethash synonym-of weak-data weak-data) weak-data))))))))))))
(defun extmap-keys (extmap)
"Return a list of all the keys in the map.
The list is in no particular order.
EXTMAP must be a result of a previous call to `extmap-init'."
(extmap--reload-if-needed extmap)
(let (keys)
(maphash (lambda (key _value) (push key keys)) (nth 1 extmap))
keys))
(defun extmap-mapc (extmap callback)
"Invoke CALLBACK on each key-value pairing in the map.
EXTMAP must be a result of a previous call to `extmap-init'.
CALLBACK is called with two arguments: KEY and VALUE. Its return
value is ignored. Values in the map are enumerated in no
particular order.
Note that unless CALLBACK exits non-locally (with `throw' or by
signalling an error), this will result in loading all values into
memory. If you just need to enumerate the keys, use
`extmap-keys' instead."
(extmap--reload-if-needed extmap)
(maphash (lambda (key _value) (funcall callback key (extmap-get extmap key))) (nth 1 extmap)))
(defun extmap-mapcar (extmap callback)
"Invoke CALLBACK on each key-value pairing in the map.
Return its results as a list.
Returned list corresponds to the order in which keys have been
passed to CALLBACK. However, that order can be arbitrary.
See `extmap-mapc' for more information."
(extmap--reload-if-needed extmap)
(let (result)
(maphash (lambda (key _value) (push (funcall callback key (extmap-get extmap key)) result)) (nth 1 extmap))
(nreverse result)))
(defun extmap-statistics (extmap)
"Collect and return some statistics about EXTMAP.
Returned value is an alist (in no particular order) with at least
the following items:
`filename': absolute path of the file that contains the map;
`num-items': number of key-value mappings in the map;
`num-loaded': number of loaded values;
`weak-data' and `auto-reload': t if `extmap-init' has been
called with corresponding option.
In some cases maps can report loaded values right after
initialization. This is because of value inlining and typically
happens for small values. In case the map has been initialized
with `:weak-data' option, `num-loaded' should be seen as an upper
limit only, as (some) loaded values can be garbage-collected at
any time."
(extmap--reload-if-needed extmap)
(let ((items (nth 1 extmap))
(weak-data (nth 2 extmap))
(num-loaded 0))
(maphash (lambda (_key value) (when (car value) (setq num-loaded (1+ num-loaded)))) items)
`((filename . ,(car (nth 0 extmap)))
(num-items . ,(hash-table-count items))
(num-loaded . ,(+ num-loaded (if weak-data (hash-table-count weak-data) 0)))
(weak-data . ,(not (null weak-data)))
(auto-reload . ,(not (null (cdr (nth 0 extmap))))))))
(defun extmap-from-alist (filename data &rest options)
"Create an externally-stored map from given DATA.
Created map is stored to file specified by FILENAME. Later this
filename should be passed to `extmap-init' to read the map.
DATA must be an alist with symbols used as keys. All symbols
must be interned in the default obarray. Values must be
serializable with `print'/`read' (e.g. no buffers or non-interned
symbols), but are otherwise not restricted.
OPTIONS can be a list of the following keyword arguments:
:overwrite
By default, this function will signal an error if the output
file already exists. However, you can order it to
overwrite (not merge!) the file.
:share-values
When values for different keys are equal, store only one copy
in the database. This can decrease database size, but you
must be prepared that `extmap-get' can return `eq' values for
different keys (for this reason, this is not the default).
:compress-values
Replace equal parts within values with the same object. This
can decrease database size, but you must be prepared that
values returned `extmap-get' can contain `eq' elements (in
lists, vectors, etc.). It also makes map creation noticeably
slower. For these reason, this is not the default.
:max-inline-bytes
Inline values for which `print' results in this many bytes.
Inlined values are loaded by `extmap-init' immediately and
don't require additional disk access later. Default value is
currently 16, but can be changed in a future package version.
If this setting is important for you for some reason, always
specify it explicitly."
(extmap--do-create filename (lambda () (if data (pop data) (throw 'end-of-data nil))) options))
(defun extmap-from-iterator (filename iterator &rest options)
"Create an externally-stored map from data provided by ITERATOR.
Iterator must return cons cells with car being a symbol (key),
cdr -- the value. See standard Emacs form `iter-defun' for how
to declare iterator functions.
See `extmap-from-alist' for more information. This function is
basically the same, but is provided for the cases your values are
so huge you'd rather provide them one-by-one with an iterator
instead of keeping them all in memory.
Only available on Emacs 25, as this requires `generator' package."
(require 'generator)
(extmap--do-create filename (lambda ()
(condition-case _
(with-no-warnings (iter-yield iterator))
(iter-end-of-sequence (throw 'end-of-data nil))))
options))
(defun extmap--do-create (filename data options)
(with-temp-buffer
(let ((print-level nil)
(print-length nil)
(shared-values (when (plist-get options :share-values) (make-hash-table :test #'extmap--equal-including-properties)))
(canonical-subvalues (when (plist-get options :compress-values) (make-hash-table :test #'extmap--equal-including-properties)))
(max-inline-bytes (or (plist-get options :max-inline-bytes) 16))
(offset (bindat-length extmap--header-bindat-spec nil))
(buffer (current-buffer))
(coding-system-for-write 'no-conversion)
(write-region-inhibit-fsync t)
(used-keys (make-hash-table :test #'eq)))
;; Will be replaced at the end.
(insert (bindat-pack extmap--header-bindat-spec nil))
(write-region nil nil filename nil 'no-message nil (if (plist-get options :overwrite) nil 'excl))
(erase-buffer)
(catch 'end-of-data
(while t
(let* ((item (funcall data))
(key (car item))
(value (cdr item)))
(unless (and (symbolp key) (not (string-match (rx 0) (symbol-name key))) (eq (intern (symbol-name key)) key))
(error "Wrong key `%S': expected an interned symbol without null character" key))
(when (gethash key used-keys)
(error "Duplicate key `%s'" key))
(puthash key t used-keys)
(insert (encode-coding-string (symbol-name key) 'utf-8 t))
(insert 0)
(let ((serialized (if (extmap--plain-string-p value)
value
(let ((print-circle t)
(print-continuous-numbering nil))
(when canonical-subvalues
(clrhash canonical-subvalues)
(setq value (extmap--compress-value value canonical-subvalues)))
;; Workaround for Emacs (27?) not using the print circle for
;; strings on the first level. At this point I no longer care to
;; report bugs in Emacs. Fuck it, it's faster and easier to just
;; add workarounds
(if (stringp value)
(prin1-to-string value)
(substring (prin1-to-string (list value)) 1 -1))))))
(unless (or (extmap--plain-string-p value) (condition-case _ (equal (read serialized) value) (error nil)))
(error "Value for key `%s' cannot be saved in database: it cannot be read back or is different after reading" key))
;; The whole point of this buffer is to be used for
;; `write-region' below (in the most common case).
(with-temp-buffer
(let* ((serialized-in (current-buffer))
(num-bytes (encode-coding-string serialized 'utf-8 t serialized-in))
canonical-key)
(cond ((<= num-bytes max-inline-bytes)
(with-current-buffer buffer
(insert (bindat-pack extmap--item-short-bindat-spec `((type . ,(if (extmap--plain-string-p value) 0 1)) (length . ,num-bytes))))
(insert-buffer-substring serialized-in)))
((and shared-values (setq canonical-key (gethash value shared-values)))
(with-current-buffer buffer
(let ((encoded (encode-coding-string (symbol-name canonical-key) 'utf-8 t)))
(insert (bindat-pack extmap--item-short-bindat-spec `((type . 4) (length . ,(length encoded))))
encoded))))
(t
(write-region nil nil filename t 'no-message)
(with-current-buffer buffer
(insert (bindat-pack extmap--item-bindat-spec `((type . ,(if (extmap--plain-string-p value) 2 3)) (length . ,num-bytes) (offset . ,offset))))
(setq offset (+ offset num-bytes))
(when shared-values
(puthash value key shared-values)))))))))))
(write-region nil nil filename t 'no-message)
;; Update the header.
(erase-buffer)
(insert (bindat-pack extmap--header-bindat-spec `((magic . #x91f7)
(version . 1)
(num-items . ,(hash-table-count used-keys))
(offset . ,offset))))
(write-region nil nil filename 0 'no-message))))
(defun extmap--plain-string-p (object)
(and (stringp object)
(null (text-properties-at 0 object))
(null (next-property-change 0 object))))
(defun extmap--compress-value (value canonical-subvalues)
(cond ((stringp value)
(if (and (<= (length value) 4) (extmap--plain-string-p value))
;; Don't try to compress very short strings without text properties.
value
(or (gethash value canonical-subvalues)
(puthash value value canonical-subvalues))))
((consp value)
(let ((original-value value)
canonical-head
canonical-tail)
(while (unless (setq canonical-tail (gethash value canonical-subvalues))
(push (extmap--compress-value (car value) canonical-subvalues) canonical-head)
(consp (setq value (cdr value)))))
(setq canonical-head (nreverse canonical-head))
(puthash original-value
(if canonical-tail
(nconc canonical-head canonical-tail)
(when value
(setcdr (last canonical-head) (extmap--compress-value value canonical-subvalues)))
canonical-head)
canonical-subvalues)))
((or (vectorp value) (with-no-warnings (when (fboundp #'recordp) (recordp value))))
(or (gethash value canonical-subvalues)
(let* ((length (length value))
(result (if (vectorp value) (make-vector length nil) (with-no-warnings (make-record nil (1- length) nil)))))
(dotimes (k length)
(aset result k (extmap--compress-value (aref value k) canonical-subvalues)))
(puthash value result canonical-subvalues))))
(t
value)))
;; This is like built-in `equal-including-properties', except that
;; property values are compared with the same function, not with `eq'.
;; Slow, but is used only during extmap creation, testing and diffing,
;; all of which are not performance-critical.
(defun extmap--equal-including-properties (a b)
(cond ((stringp a)
(and (stringp b)
(string= a b)
(let ((at 0)
(equal t))
(while (and at equal)
(let ((next (next-property-change at a)))
(setq equal (and (equal next (next-property-change at b))
(let ((a-properties (text-properties-at at a))
(b-properties (text-properties-at at b)))
;; Speedup, especially for plain strings: don't create
;; hash-tables if there are no properties at all.
(or (and (null a-properties) (null b-properties))
(and a-properties b-properties
;; Property keys are compared by `eq' everywhere.
(let ((a-property-hash (make-hash-table :test #'eq))
(b-property-hash (make-hash-table :test #'eq)))
(while a-properties
(puthash (pop a-properties) (pop a-properties) a-property-hash))
(while b-properties
(puthash (pop b-properties) (pop b-properties) b-property-hash))
(extmap--equal-including-properties a-property-hash b-property-hash))))))
at next)))
equal)))
((consp a)
(let ((equal t))
(while (if (and (consp b) (extmap--equal-including-properties (car a) (car b)))
(consp (setq b (cdr b)
a (cdr a)))
(setq equal nil)))
(and equal (extmap--equal-including-properties a b))))
((or (vectorp a) (with-no-warnings (when (fboundp #'recordp) (recordp a))))
(and (if (vectorp a) (vectorp b) (with-no-warnings (recordp b)))
(let ((length (length a)))
(and (= length (length b))
(let ((equal t)
(k 0))
(while (< k length)
(if (extmap--equal-including-properties (aref a k) (aref b k))
(setq k (1+ k))
(setq k length
equal nil)))
equal)))))
((hash-table-p a)
(and (hash-table-p b)
(= (hash-table-count a) (hash-table-count b))
(catch 'equal
(maphash (lambda (key value)
(unless (extmap--equal-including-properties value (gethash key b (not value)))
(throw 'equal nil)))
a)
t)))
;; Works for all the primitive types, as well as for bool vectors.
(t
(equal a b))))
;; No special hashing function: `sxhash' ignores text properties, but
;; it is not required that hashes of different values are different.
(define-hash-table-test 'extmap--equal-including-properties #'extmap--equal-including-properties #'sxhash)
(defun extmap-equal-p (extmap1 extmap2 &optional keys-to-ignore describe)
"Compare two maps.
Don't count any differences in KEYS-TO-IGNORE (must be a list).
Return non-nil if the two maps are equal for all other keys.
When optional argument DESCRIBE is set, also print information
about differences to a new buffer and present it, if there are
any. Non-interactively, print this to stdout. The information
is in free form meant only for humans. Presentation can thus be
improved or otherwise changed in future versions."
(when (stringp extmap1)
(setq extmap1 (extmap-init extmap1)))
(when (stringp extmap2)
(setq extmap2 (extmap-init extmap2)))
(setq keys-to-ignore (let ((lookup (make-hash-table :test #'eq)))
(dolist (key keys-to-ignore)
(puthash key t lookup))
(remhash nil lookup)
lookup))
(catch 'done
(with-temp-buffer
(let* ((keys1 (sort (extmap-keys extmap1) #'string<))
(keys2 (sort (extmap-keys extmap2) #'string<))
(scan1 keys1)
(scan2 keys2)
(only-in-1-lookup (make-hash-table :test #'eq))
only-in-1
only-in-2)
(while (or scan1 scan2)
(let ((key1 (car scan1))
(key2 (car scan2)))
(if (eq key1 key2)
(setq scan1 (cdr scan1)
scan2 (cdr scan2))
(cond ((gethash key1 keys-to-ignore)
(setq scan1 (cdr scan1)))
((gethash key2 keys-to-ignore)
(setq scan2 (cdr scan2)))
(t
(unless describe
(throw 'done nil))
(if (and key1 (or (null key2) (string< key1 key2)))
(progn (setq only-in-1 (cons key1 only-in-1)
scan1 (cdr scan1))
(puthash key1 t only-in-1-lookup))
(setq only-in-2 (cons key2 only-in-2)
scan2 (cdr scan2))))))))
(when only-in-1
(insert "Only in the first extmap:\n")
(dolist (key (nreverse only-in-1))
(insert " " (symbol-name key) "\n")))
(when only-in-2
(insert "Only in the second extmap:\n")
(dolist (key (nreverse only-in-2))
(insert " " (symbol-name key) "\n")))
(dolist (key keys1)
(unless (or (gethash key keys-to-ignore) (gethash key only-in-1-lookup))
(let ((value1 (extmap-get extmap1 key))
(value2 (extmap-get extmap2 key)))
(unless (extmap--equal-including-properties value1 value2)
(unless describe
(throw 'done nil))
(insert (symbol-name key) ":\n" (prin1-to-string value1) "\n" (prin1-to-string value2) "\n"))))))
(if describe
(if (= (point) 1)
(progn (message "There are no differences")
t)
(let ((differences (buffer-string)))
(if noninteractive
(princ differences)
(let ((buffer (get-buffer-create " *Extmap differences*")))
(set-buffer buffer)
(erase-buffer)
(insert differences)
(goto-char (point-min))
(display-buffer buffer))))
nil)
t))))
(provide 'extmap)
;;; extmap.el ends here