1 /*
2 * libkmod - interface to kernel module operations
3 *
4 * Copyright (C) 2011-2013 ProFUSION embedded systems
5 *
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2.1 of the License, or (at your option) any later version.
10 *
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
18 */
19
20 #include <arpa/inet.h>
21 #include <assert.h>
22 #include <errno.h>
23 #include <fnmatch.h>
24 #include <inttypes.h>
25 #include <stdio.h>
26 #include <stdlib.h>
27 #include <string.h>
28
29 #include <shared/macro.h>
30 #include <shared/strbuf.h>
31 #include <shared/util.h>
32
33 #include "libkmod-internal.h"
34 #include "libkmod-index.h"
35
36 /* libkmod-index.c: module index file implementation
37 *
38 * Integers are stored as 32 bit unsigned in "network" order, i.e. MSB first.
39 * All files start with a magic number.
40 *
41 * Magic spells "BOOTFAST". Second one used on newer versioned binary files.
42 * #define INDEX_MAGIC_OLD 0xB007FA57
43 *
44 * We use a version string to keep track of changes to the binary format
45 * This is stored in the form: INDEX_MAJOR (hi) INDEX_MINOR (lo) just in
46 * case we ever decide to have minor changes that are not incompatible.
47 */
48 #define INDEX_MAGIC 0xB007F457
49 #define INDEX_VERSION_MAJOR 0x0002
50 #define INDEX_VERSION_MINOR 0x0001
51 #define INDEX_VERSION ((INDEX_VERSION_MAJOR<<16)|INDEX_VERSION_MINOR)
52
53 /* The index file maps keys to values. Both keys and values are ASCII strings.
54 * Each key can have multiple values. Values are sorted by an integer priority.
55 *
56 * The reader also implements a wildcard search (including range expressions)
57 * where the keys in the index are treated as patterns.
58 * This feature is required for module aliases.
59 */
60 #define INDEX_CHILDMAX 128
61
62 /* Disk format:
63 *
64 * uint32_t magic = INDEX_MAGIC;
65 * uint32_t version = INDEX_VERSION;
66 * uint32_t root_offset;
67 *
68 * (node_offset & INDEX_NODE_MASK) specifies the file offset of nodes:
69 *
70 * char[] prefix; // nul terminated
71 *
72 * char first;
73 * char last;
74 * uint32_t children[last - first + 1];
75 *
76 * uint32_t value_count;
77 * struct {
78 * uint32_t priority;
79 * char[] value; // nul terminated
80 * } values[value_count];
81 *
82 * (node_offset & INDEX_NODE_FLAGS) indicates which fields are present.
83 * Empty prefixes are omitted, leaf nodes omit the three child-related fields.
84 *
85 * This could be optimised further by adding a sparse child format
86 * (indicated using a new flag).
87 *
88 *
89 * Implementation is based on a radix tree, or "trie".
90 * Each arc from parent to child is labelled with a character.
91 * Each path from the root represents a string.
92 *
93 * == Example strings ==
94 *
95 * ask
96 * ate
97 * on
98 * once
99 * one
100 *
101 * == Key ==
102 * + Normal node
 *  * Marked node, representing a key and its values.
104 *
105 * +
106 * |-a-+-s-+-k-*
107 * | |
108 * | `-t-+-e-*
109 * |
110 * `-o-+-n-*-c-+-e-*
111 * |
112 * `-e-*
113 *
114 * Naive implementations tend to be very space inefficient; child pointers
115 * are stored in arrays indexed by character, but most child pointers are null.
116 *
 * Our implementation uses a scheme described by Wikipedia as a Patricia trie,
118 *
119 * "easiest to understand as a space-optimized trie where
120 * each node with only one child is merged with its child"
121 *
122 * +
123 * |-a-+-sk-*
124 * | |
125 * | `-te-*
126 * |
127 * `-on-*-ce-*
128 * |
129 * `-e-*
130 *
131 * We still use arrays of child pointers indexed by a single character;
132 * the remaining characters of the label are stored as a "prefix" in the child.
133 *
 * The paper describing the original Patricia trie works on individual bits -
135 * each node has a maximum of two children, which increases space efficiency.
136 * However for this application it is simpler to use the ASCII character set.
137 * Since the index file is read-only, it can be compressed by omitting null
138 * child pointers at the start and end of arrays.
139 */
140
141 /* Format of node offsets within index file */
/*
 * Layout of a 32-bit node offset as stored in the index file: the low
 * 28 bits locate the node, the high nibble says which optional fields
 * the node carries.
 */
enum node_offset {
	/* Offset value: file position of the node */
	INDEX_NODE_MASK   = 0x0FFFFFFF,

	/* Flags in high nibble */
	INDEX_NODE_FLAGS  = 0xF0000000,
	INDEX_NODE_CHILDS = 0x20000000,	/* first/last/children[] present */
	INDEX_NODE_VALUES = 0x40000000,	/* value_count/values[] present */
	INDEX_NODE_PREFIX = 0x80000000,	/* nul terminated prefix present */
};
150
index_values_free(struct index_value * values)151 void index_values_free(struct index_value *values)
152 {
153 while (values) {
154 struct index_value *value = values;
155
156 values = value->next;
157 free(value);
158 }
159 }
160
add_value(struct index_value ** values,const char * value,unsigned len,unsigned int priority)161 static int add_value(struct index_value **values,
162 const char *value, unsigned len, unsigned int priority)
163 {
164 struct index_value *v;
165
166 /* find position to insert value */
167 while (*values && (*values)->priority < priority)
168 values = &(*values)->next;
169
170 v = malloc(sizeof(struct index_value) + len + 1);
171 if (!v)
172 return -1;
173 v->next = *values;
174 v->priority = priority;
175 v->len = len;
176 memcpy(v->value, value, len);
177 v->value[len] = '\0';
178 *values = v;
179
180 return 0;
181 }
182
/*
 * Report a failed read of the index file through fatal(). The reason is
 * strerror(errno) when errno is set and "EOF" otherwise.
 */
static void read_error(void)
{
	const char *reason = "EOF";

	if (errno)
		reason = strerror(errno);

	fatal("Module index: unexpected error: %s\n"
			"Try re-running depmod\n", reason);
}
188
/*
 * Read one byte from the index file.
 *
 * Returns the byte, or EOF after calling read_error() when nothing could
 * be read. errno is cleared first so read_error() can tell a plain end of
 * file from an I/O error.
 */
static int read_char(FILE *in)
{
	int ch;

	errno = 0;
	ch = getc_unlocked(in);
	if (ch != EOF)
		return ch;

	read_error();
	return ch;
}
199
/*
 * Read one 32-bit integer, stored in network byte order, from the index
 * file and return it in host byte order.
 *
 * read_error() is called when the integer cannot be read completely.
 */
static uint32_t read_long(FILE *in)
{
	uint32_t l;

	errno = 0;
	/* fread() returns the number of items read, not the number of bytes */
	if (fread(&l, sizeof(uint32_t), 1, in) != 1)
		read_error();
	return ntohl(l);
}
209
/*
 * Append the nul terminated string found at the current file position to
 * buf. The terminator itself is consumed but not stored.
 *
 * Reading stops at the terminator, when read_char() hands back EOF, or
 * when strbuf_pushchar() reports failure.
 *
 * Returns the number of characters appended.
 */
static unsigned buf_freadchars(struct strbuf *buf, FILE *in)
{
	unsigned i = 0;
	int ch;

	/*
	 * read_char() returns EOF after reporting the error; without the
	 * explicit check a truncated file would keep feeding EOF into buf.
	 */
	while ((ch = read_char(in)) != '\0' && ch != EOF) {
		if (!strbuf_pushchar(buf, ch))
			break;
		i++;
	}

	return i;
}
223
224 /*
225 * Index file searching
226 */
/*
 * In-memory copy of one trie node read through stdio (see index_read()).
 * The node is allocated together with its trailing children[] array.
 */
struct index_node_f {
	FILE *file;			/* stream the node was read from */
	char *prefix;			/* path compression */
	struct index_value *values;	/* values of this node, NULL if none */
	unsigned char first;		/* range of child nodes */
	unsigned char last;
	uint32_t children[];		/* node offsets for first..last */
};
235
index_read(FILE * in,uint32_t offset)236 static struct index_node_f *index_read(FILE *in, uint32_t offset)
237 {
238 struct index_node_f *node;
239 char *prefix;
240 int i, child_count = 0;
241
242 if ((offset & INDEX_NODE_MASK) == 0)
243 return NULL;
244
245 if (fseek(in, offset & INDEX_NODE_MASK, SEEK_SET) < 0)
246 return NULL;
247
248 if (offset & INDEX_NODE_PREFIX) {
249 struct strbuf buf;
250 strbuf_init(&buf);
251 buf_freadchars(&buf, in);
252 prefix = strbuf_steal(&buf);
253 } else
254 prefix = NOFAIL(strdup(""));
255
256 if (offset & INDEX_NODE_CHILDS) {
257 char first = read_char(in);
258 char last = read_char(in);
259 child_count = last - first + 1;
260
261 node = NOFAIL(malloc(sizeof(struct index_node_f) +
262 sizeof(uint32_t) * child_count));
263
264 node->first = first;
265 node->last = last;
266
267 for (i = 0; i < child_count; i++)
268 node->children[i] = read_long(in);
269 } else {
270 node = NOFAIL(malloc(sizeof(struct index_node_f)));
271 node->first = INDEX_CHILDMAX;
272 node->last = 0;
273 }
274
275 node->values = NULL;
276 if (offset & INDEX_NODE_VALUES) {
277 int value_count;
278 struct strbuf buf;
279 const char *value;
280 unsigned int priority;
281
282 value_count = read_long(in);
283
284 strbuf_init(&buf);
285 while (value_count--) {
286 priority = read_long(in);
287 buf_freadchars(&buf, in);
288 value = strbuf_str(&buf);
289 add_value(&node->values, value, buf.used, priority);
290 strbuf_clear(&buf);
291 }
292 strbuf_release(&buf);
293 }
294
295 node->prefix = prefix;
296 node->file = in;
297 return node;
298 }
299
index_close(struct index_node_f * node)300 static void index_close(struct index_node_f *node)
301 {
302 free(node->prefix);
303 index_values_free(node->values);
304 free(node);
305 }
306
/* Handle for an index file accessed through stdio. */
struct index_file {
	FILE *file;		/* open stream, closed by index_file_close() */
	uint32_t root_offset;	/* offset of the root node, read from the header */
};
311
index_file_open(const char * filename)312 struct index_file *index_file_open(const char *filename)
313 {
314 FILE *file;
315 uint32_t magic, version;
316 struct index_file *new;
317
318 file = fopen(filename, "re");
319 if (!file)
320 return NULL;
321 errno = EINVAL;
322
323 magic = read_long(file);
324 if (magic != INDEX_MAGIC) {
325 fclose(file);
326 return NULL;
327 }
328
329 version = read_long(file);
330 if (version >> 16 != INDEX_VERSION_MAJOR) {
331 fclose(file);
332 return NULL;
333 }
334
335 new = NOFAIL(malloc(sizeof(struct index_file)));
336 new->file = file;
337 new->root_offset = read_long(new->file);
338
339 errno = 0;
340 return new;
341 }
342
index_file_close(struct index_file * idx)343 void index_file_close(struct index_file *idx)
344 {
345 fclose(idx->file);
346 free(idx);
347 }
348
index_readroot(struct index_file * in)349 static struct index_node_f *index_readroot(struct index_file *in)
350 {
351 return index_read(in->file, in->root_offset);
352 }
353
index_readchild(const struct index_node_f * parent,int ch)354 static struct index_node_f *index_readchild(const struct index_node_f *parent,
355 int ch)
356 {
357 if (parent->first <= ch && ch <= parent->last) {
358 return index_read(parent->file,
359 parent->children[ch - parent->first]);
360 }
361
362 return NULL;
363 }
364
index_dump_node(struct index_node_f * node,struct strbuf * buf,int fd)365 static void index_dump_node(struct index_node_f *node, struct strbuf *buf,
366 int fd)
367 {
368 struct index_value *v;
369 int ch, pushed;
370
371 pushed = strbuf_pushchars(buf, node->prefix);
372
373 for (v = node->values; v != NULL; v = v->next) {
374 write_str_safe(fd, buf->bytes, buf->used);
375 write_str_safe(fd, " ", 1);
376 write_str_safe(fd, v->value, strlen(v->value));
377 write_str_safe(fd, "\n", 1);
378 }
379
380 for (ch = node->first; ch <= node->last; ch++) {
381 struct index_node_f *child = index_readchild(node, ch);
382
383 if (!child)
384 continue;
385
386 strbuf_pushchar(buf, ch);
387 index_dump_node(child, buf, fd);
388 strbuf_popchar(buf);
389 }
390
391 strbuf_popchars(buf, pushed);
392 index_close(node);
393 }
394
index_dump(struct index_file * in,int fd,const char * prefix)395 void index_dump(struct index_file *in, int fd, const char *prefix)
396 {
397 struct index_node_f *root;
398 struct strbuf buf;
399
400 root = index_readroot(in);
401 if (root == NULL)
402 return;
403
404 strbuf_init(&buf);
405 strbuf_pushchars(&buf, prefix);
406 index_dump_node(root, &buf, fd);
407 strbuf_release(&buf);
408 }
409
index_search__node(struct index_node_f * node,const char * key,int i)410 static char *index_search__node(struct index_node_f *node, const char *key, int i)
411 {
412 char *value;
413 struct index_node_f *child;
414 int ch;
415 int j;
416
417 while(node) {
418 for (j = 0; node->prefix[j]; j++) {
419 ch = node->prefix[j];
420
421 if (ch != key[i+j]) {
422 index_close(node);
423 return NULL;
424 }
425 }
426
427 i += j;
428
429 if (key[i] == '\0') {
430 value = node->values != NULL
431 ? strdup(node->values[0].value)
432 : NULL;
433
434 index_close(node);
435 return value;
436 }
437
438 child = index_readchild(node, key[i]);
439 index_close(node);
440 node = child;
441 i++;
442 }
443
444 return NULL;
445 }
446
447 /*
448 * Search the index for a key
449 *
450 * Returns the value of the first match
451 *
452 * The recursive functions free their node argument (using index_close).
453 */
char *index_search(struct index_file *in, const char *key)
{
	// FIXME: return value by reference instead of strdup
	struct index_node_f *root = index_readroot(in);

	/* the search releases root; a NULL root simply yields NULL */
	return index_search__node(root, key, 0);
}
465
466
467
468 /* Level 4: add all the values from a matching node */
index_searchwild__allvalues(struct index_node_f * node,struct index_value ** out)469 static void index_searchwild__allvalues(struct index_node_f *node,
470 struct index_value **out)
471 {
472 struct index_value *v;
473
474 for (v = node->values; v != NULL; v = v->next)
475 add_value(out, v->value, v->len, v->priority);
476
477 index_close(node);
478 }
479
480 /*
481 * Level 3: traverse a sub-keyspace which starts with a wildcard,
482 * looking for matches.
483 */
index_searchwild__all(struct index_node_f * node,int j,struct strbuf * buf,const char * subkey,struct index_value ** out)484 static void index_searchwild__all(struct index_node_f *node, int j,
485 struct strbuf *buf,
486 const char *subkey,
487 struct index_value **out)
488 {
489 int pushed = 0;
490 int ch;
491
492 while (node->prefix[j]) {
493 ch = node->prefix[j];
494
495 strbuf_pushchar(buf, ch);
496 pushed++;
497 j++;
498 }
499
500 for (ch = node->first; ch <= node->last; ch++) {
501 struct index_node_f *child = index_readchild(node, ch);
502
503 if (!child)
504 continue;
505
506 strbuf_pushchar(buf, ch);
507 index_searchwild__all(child, 0, buf, subkey, out);
508 strbuf_popchar(buf);
509 }
510
511 if (node->values) {
512 if (fnmatch(strbuf_str(buf), subkey, 0) == 0)
513 index_searchwild__allvalues(node, out);
514 else
515 index_close(node);
516 } else {
517 index_close(node);
518 }
519
520 strbuf_popchars(buf, pushed);
521 }
522
523 /* Level 2: descend the tree (until we hit a wildcard) */
index_searchwild__node(struct index_node_f * node,struct strbuf * buf,const char * key,int i,struct index_value ** out)524 static void index_searchwild__node(struct index_node_f *node,
525 struct strbuf *buf,
526 const char *key, int i,
527 struct index_value **out)
528 {
529 struct index_node_f *child;
530 int j;
531 int ch;
532
533 while(node) {
534 for (j = 0; node->prefix[j]; j++) {
535 ch = node->prefix[j];
536
537 if (ch == '*' || ch == '?' || ch == '[') {
538 index_searchwild__all(node, j, buf,
539 &key[i+j], out);
540 return;
541 }
542
543 if (ch != key[i+j]) {
544 index_close(node);
545 return;
546 }
547 }
548
549 i += j;
550
551 child = index_readchild(node, '*');
552 if (child) {
553 strbuf_pushchar(buf, '*');
554 index_searchwild__all(child, 0, buf, &key[i], out);
555 strbuf_popchar(buf);
556 }
557
558 child = index_readchild(node, '?');
559 if (child) {
560 strbuf_pushchar(buf, '?');
561 index_searchwild__all(child, 0, buf, &key[i], out);
562 strbuf_popchar(buf);
563 }
564
565 child = index_readchild(node, '[');
566 if (child) {
567 strbuf_pushchar(buf, '[');
568 index_searchwild__all(child, 0, buf, &key[i], out);
569 strbuf_popchar(buf);
570 }
571
572 if (key[i] == '\0') {
573 index_searchwild__allvalues(node, out);
574
575 return;
576 }
577
578 child = index_readchild(node, key[i]);
579 index_close(node);
580 node = child;
581 i++;
582 }
583 }
584
585 /*
586 * Search the index for a key. The index may contain wildcards.
587 *
588 * Returns a list of all the values of matching keys.
589 */
index_searchwild(struct index_file * in,const char * key)590 struct index_value *index_searchwild(struct index_file *in, const char *key)
591 {
592 struct index_node_f *root = index_readroot(in);
593 struct strbuf buf;
594 struct index_value *out = NULL;
595
596 strbuf_init(&buf);
597 index_searchwild__node(root, &buf, key, 0, &out);
598 strbuf_release(&buf);
599 return out;
600 }
601
602 /**************************************************************************/
603 /*
604 * Alternative implementation, using mmap to map all the file to memory when
605 * starting
606 */
607 #include <sys/mman.h>
608 #include <sys/stat.h>
609 #include <unistd.h>
610
/* Prefix shared by all mmap nodes that are stored without a prefix. */
static const char _idx_empty_str[] = "";
612
/* Handle for an index file that is mapped into memory as a whole. */
struct index_mm {
	struct kmod_ctx *ctx;	/* context passed to index_mm_open() */
	void *mm;		/* start of the mapping */
	uint32_t root_offset;	/* offset of the root node, from the header */
	size_t size;		/* length of the mapping, needed for munmap() */
};
619
/* One value of a node; the string itself stays inside the mapping. */
struct index_mm_value {
	unsigned int priority;
	unsigned int len;	/* strlen() of value */
	const char *value;	/* nul terminated, points into the mapping */
};
625
/* Values of a node, in the order they are stored in the file. */
struct index_mm_value_array {
	struct index_mm_value *values;	/* NULL when len is 0 */
	unsigned int len;		/* number of elements in values */
};
630
/*
 * Decoded trie node of a memory mapped index. index_mm_read_node()
 * allocates the node, its children[] and its value array as one chunk.
 */
struct index_mm_node {
	struct index_mm *idx;	/* index the node belongs to */
	const char *prefix; /* mmap'ed value */
	struct index_mm_value_array values;
	unsigned char first;	/* range of child nodes */
	unsigned char last;
	uint32_t children[];	/* node offsets for first..last */
};
639
/*
 * Fetch the 32-bit integer stored in network byte order at *p, advance
 * *p past it and return the integer in host byte order.
 */
static inline uint32_t read_long_mm(void **p)
{
	uint8_t *cursor = *(uint8_t **)p;
	/* cursor may be unaligned for uint32_t */
	uint32_t raw = get_unaligned((uint32_t *) cursor);

	*p = cursor + sizeof(raw);
	return ntohl(raw);
}
651
/* Return the byte at *p and advance *p by one. */
static inline uint8_t read_char_mm(void **p)
{
	uint8_t *cursor = *p;

	*p = cursor + 1;
	return *cursor;
}
659
/*
 * Return the nul terminated string at *p without copying it, store its
 * length in *rlen and advance *p past the terminator.
 */
static inline char *read_chars_mm(void **p, unsigned *rlen)
{
	char *str = *p;
	unsigned n = strlen(str);

	*rlen = n;
	*p = str + (size_t)n + 1;
	return str;
}
667
index_mm_read_node(struct index_mm * idx,uint32_t offset)668 static struct index_mm_node *index_mm_read_node(struct index_mm *idx,
669 uint32_t offset) {
670 void *p = idx->mm;
671 struct index_mm_node *node;
672 const char *prefix;
673 int i, child_count, value_count, children_padding;
674 uint32_t children[INDEX_CHILDMAX];
675 char first, last;
676
677 if ((offset & INDEX_NODE_MASK) == 0)
678 return NULL;
679
680 p = (char *)p + (offset & INDEX_NODE_MASK);
681
682 if (offset & INDEX_NODE_PREFIX) {
683 unsigned len;
684 prefix = read_chars_mm(&p, &len);
685 } else
686 prefix = _idx_empty_str;
687
688 if (offset & INDEX_NODE_CHILDS) {
689 first = read_char_mm(&p);
690 last = read_char_mm(&p);
691 child_count = last - first + 1;
692 for (i = 0; i < child_count; i++)
693 children[i] = read_long_mm(&p);
694 } else {
695 first = (char)INDEX_CHILDMAX;
696 last = 0;
697 child_count = 0;
698 }
699
700 children_padding = (sizeof(struct index_mm_node) +
701 (sizeof(uint32_t) * child_count)) % sizeof(void *);
702
703 if (offset & INDEX_NODE_VALUES)
704 value_count = read_long_mm(&p);
705 else
706 value_count = 0;
707
708 node = malloc(sizeof(struct index_mm_node)
709 + sizeof(uint32_t) * child_count + children_padding
710 + sizeof(struct index_mm_value) * value_count);
711 if (node == NULL)
712 return NULL;
713
714 node->idx = idx;
715 node->prefix = prefix;
716 if (value_count == 0)
717 node->values.values = NULL;
718 else {
719 node->values.values = (struct index_mm_value *)
720 ((char *)node + sizeof(struct index_mm_node) +
721 sizeof(uint32_t) * child_count + children_padding);
722 }
723 node->values.len = value_count;
724 node->first = first;
725 node->last = last;
726 memcpy(node->children, children, sizeof(uint32_t) * child_count);
727
728 for (i = 0; i < value_count; i++) {
729 struct index_mm_value *v = node->values.values + i;
730 v->priority = read_long_mm(&p);
731 v->value = read_chars_mm(&p, &v->len);
732 }
733
734 return node;
735 }
736
/*
 * Release a node returned by index_mm_read_node(). The node, its child
 * offsets and its value array live in one allocation, so a single free()
 * is enough.
 */
static void index_mm_free_node(struct index_mm_node *node)
{
	free(node);
}
741
index_mm_open(struct kmod_ctx * ctx,const char * filename,unsigned long long * stamp)742 struct index_mm *index_mm_open(struct kmod_ctx *ctx, const char *filename,
743 unsigned long long *stamp)
744 {
745 int fd;
746 struct stat st;
747 struct index_mm *idx;
748 struct {
749 uint32_t magic;
750 uint32_t version;
751 uint32_t root_offset;
752 } hdr;
753 void *p;
754
755 DBG(ctx, "file=%s\n", filename);
756
757 idx = malloc(sizeof(*idx));
758 if (idx == NULL) {
759 ERR(ctx, "malloc: %m\n");
760 return NULL;
761 }
762
763 if ((fd = open(filename, O_RDONLY|O_CLOEXEC)) < 0) {
764 DBG(ctx, "open(%s, O_RDONLY|O_CLOEXEC): %m\n", filename);
765 goto fail_open;
766 }
767
768 if (fstat(fd, &st) < 0)
769 goto fail_nommap;
770 if ((size_t) st.st_size < sizeof(hdr))
771 goto fail_nommap;
772
773 if ((idx->mm = mmap(NULL, st.st_size, PROT_READ, MAP_PRIVATE, fd, 0))
774 == MAP_FAILED) {
775 ERR(ctx, "mmap(NULL, %"PRIu64", PROT_READ, %d, MAP_PRIVATE, 0): %m\n",
776 st.st_size, fd);
777 goto fail_nommap;
778 }
779
780 p = idx->mm;
781 hdr.magic = read_long_mm(&p);
782 hdr.version = read_long_mm(&p);
783 hdr.root_offset = read_long_mm(&p);
784
785 if (hdr.magic != INDEX_MAGIC) {
786 ERR(ctx, "magic check fail: %x instead of %x\n", hdr.magic,
787 INDEX_MAGIC);
788 goto fail;
789 }
790
791 if (hdr.version >> 16 != INDEX_VERSION_MAJOR) {
792 ERR(ctx, "major version check fail: %u instead of %u\n",
793 hdr.version >> 16, INDEX_VERSION_MAJOR);
794 goto fail;
795 }
796
797 idx->root_offset = hdr.root_offset;
798 idx->size = st.st_size;
799 idx->ctx = ctx;
800 close(fd);
801
802 *stamp = stat_mstamp(&st);
803
804 return idx;
805
806 fail:
807 munmap(idx->mm, st.st_size);
808 fail_nommap:
809 close(fd);
810 fail_open:
811 free(idx);
812 return NULL;
813 }
814
index_mm_close(struct index_mm * idx)815 void index_mm_close(struct index_mm *idx)
816 {
817 munmap(idx->mm, idx->size);
818 free(idx);
819 }
820
index_mm_readroot(struct index_mm * idx)821 static struct index_mm_node *index_mm_readroot(struct index_mm *idx)
822 {
823 return index_mm_read_node(idx, idx->root_offset);
824 }
825
index_mm_readchild(const struct index_mm_node * parent,int ch)826 static struct index_mm_node *index_mm_readchild(const struct index_mm_node *parent,
827 int ch)
828 {
829 if (parent->first <= ch && ch <= parent->last) {
830 return index_mm_read_node(parent->idx,
831 parent->children[ch - parent->first]);
832 }
833
834 return NULL;
835 }
836
index_mm_dump_node(struct index_mm_node * node,struct strbuf * buf,int fd)837 static void index_mm_dump_node(struct index_mm_node *node, struct strbuf *buf,
838 int fd)
839 {
840 struct index_mm_value *itr, *itr_end;
841 int ch, pushed;
842
843 pushed = strbuf_pushchars(buf, node->prefix);
844
845 itr = node->values.values;
846 itr_end = itr + node->values.len;
847 for (; itr < itr_end; itr++) {
848 write_str_safe(fd, buf->bytes, buf->used);
849 write_str_safe(fd, " ", 1);
850 write_str_safe(fd, itr->value, itr->len);
851 write_str_safe(fd, "\n", 1);
852 }
853
854 for (ch = node->first; ch <= node->last; ch++) {
855 struct index_mm_node *child = index_mm_readchild(node, ch);
856
857 if (child == NULL)
858 continue;
859
860 strbuf_pushchar(buf, ch);
861 index_mm_dump_node(child, buf, fd);
862 strbuf_popchar(buf);
863 }
864
865 strbuf_popchars(buf, pushed);
866 index_mm_free_node(node);
867 }
868
index_mm_dump(struct index_mm * idx,int fd,const char * prefix)869 void index_mm_dump(struct index_mm *idx, int fd, const char *prefix)
870 {
871 struct index_mm_node *root;
872 struct strbuf buf;
873
874 root = index_mm_readroot(idx);
875 if (root == NULL)
876 return;
877
878 strbuf_init(&buf);
879 strbuf_pushchars(&buf, prefix);
880 index_mm_dump_node(root, &buf, fd);
881 strbuf_release(&buf);
882 }
883
index_mm_search_node(struct index_mm_node * node,const char * key,int i)884 static char *index_mm_search_node(struct index_mm_node *node, const char *key,
885 int i)
886 {
887 char *value;
888 struct index_mm_node *child;
889 int ch;
890 int j;
891
892 while(node) {
893 for (j = 0; node->prefix[j]; j++) {
894 ch = node->prefix[j];
895
896 if (ch != key[i+j]) {
897 index_mm_free_node(node);
898 return NULL;
899 }
900 }
901
902 i += j;
903
904 if (key[i] == '\0') {
905 value = node->values.len > 0
906 ? strdup(node->values.values[0].value)
907 : NULL;
908
909 index_mm_free_node(node);
910 return value;
911 }
912
913 child = index_mm_readchild(node, key[i]);
914 index_mm_free_node(node);
915 node = child;
916 i++;
917 }
918
919 return NULL;
920 }
921
922 /*
923 * Search the index for a key
924 *
925 * Returns the value of the first match
926 *
 * The recursive functions free their node argument (using index_mm_free_node).
928 */
char *index_mm_search(struct index_mm *idx, const char *key)
{
	// FIXME: return value by reference instead of strdup
	struct index_mm_node *root = index_mm_readroot(idx);

	/* the search releases root; a NULL root simply yields NULL */
	return index_mm_search_node(root, key, 0);
}
940
941 /* Level 4: add all the values from a matching node */
index_mm_searchwild_allvalues(struct index_mm_node * node,struct index_value ** out)942 static void index_mm_searchwild_allvalues(struct index_mm_node *node,
943 struct index_value **out)
944 {
945 struct index_mm_value *itr, *itr_end;
946
947 itr = node->values.values;
948 itr_end = itr + node->values.len;
949 for (; itr < itr_end; itr++)
950 add_value(out, itr->value, itr->len, itr->priority);
951
952 index_mm_free_node(node);
953 }
954
955 /*
956 * Level 3: traverse a sub-keyspace which starts with a wildcard,
957 * looking for matches.
958 */
index_mm_searchwild_all(struct index_mm_node * node,int j,struct strbuf * buf,const char * subkey,struct index_value ** out)959 static void index_mm_searchwild_all(struct index_mm_node *node, int j,
960 struct strbuf *buf,
961 const char *subkey,
962 struct index_value **out)
963 {
964 int pushed = 0;
965 int ch;
966
967 while (node->prefix[j]) {
968 ch = node->prefix[j];
969
970 strbuf_pushchar(buf, ch);
971 pushed++;
972 j++;
973 }
974
975 for (ch = node->first; ch <= node->last; ch++) {
976 struct index_mm_node *child = index_mm_readchild(node, ch);
977
978 if (!child)
979 continue;
980
981 strbuf_pushchar(buf, ch);
982 index_mm_searchwild_all(child, 0, buf, subkey, out);
983 strbuf_popchar(buf);
984 }
985
986 if (node->values.len > 0) {
987 if (fnmatch(strbuf_str(buf), subkey, 0) == 0)
988 index_mm_searchwild_allvalues(node, out);
989 else
990 index_mm_free_node(node);
991 } else {
992 index_mm_free_node(node);
993 }
994
995 strbuf_popchars(buf, pushed);
996 }
997
998 /* Level 2: descend the tree (until we hit a wildcard) */
index_mm_searchwild_node(struct index_mm_node * node,struct strbuf * buf,const char * key,int i,struct index_value ** out)999 static void index_mm_searchwild_node(struct index_mm_node *node,
1000 struct strbuf *buf,
1001 const char *key, int i,
1002 struct index_value **out)
1003 {
1004 struct index_mm_node *child;
1005 int j;
1006 int ch;
1007
1008 while(node) {
1009 for (j = 0; node->prefix[j]; j++) {
1010 ch = node->prefix[j];
1011
1012 if (ch == '*' || ch == '?' || ch == '[') {
1013 index_mm_searchwild_all(node, j, buf,
1014 &key[i+j], out);
1015 return;
1016 }
1017
1018 if (ch != key[i+j]) {
1019 index_mm_free_node(node);
1020 return;
1021 }
1022 }
1023
1024 i += j;
1025
1026 child = index_mm_readchild(node, '*');
1027 if (child) {
1028 strbuf_pushchar(buf, '*');
1029 index_mm_searchwild_all(child, 0, buf, &key[i], out);
1030 strbuf_popchar(buf);
1031 }
1032
1033 child = index_mm_readchild(node, '?');
1034 if (child) {
1035 strbuf_pushchar(buf, '?');
1036 index_mm_searchwild_all(child, 0, buf, &key[i], out);
1037 strbuf_popchar(buf);
1038 }
1039
1040 child = index_mm_readchild(node, '[');
1041 if (child) {
1042 strbuf_pushchar(buf, '[');
1043 index_mm_searchwild_all(child, 0, buf, &key[i], out);
1044 strbuf_popchar(buf);
1045 }
1046
1047 if (key[i] == '\0') {
1048 index_mm_searchwild_allvalues(node, out);
1049
1050 return;
1051 }
1052
1053 child = index_mm_readchild(node, key[i]);
1054 index_mm_free_node(node);
1055 node = child;
1056 i++;
1057 }
1058 }
1059
1060 /*
1061 * Search the index for a key. The index may contain wildcards.
1062 *
1063 * Returns a list of all the values of matching keys.
1064 */
index_mm_searchwild(struct index_mm * idx,const char * key)1065 struct index_value *index_mm_searchwild(struct index_mm *idx, const char *key)
1066 {
1067 struct index_mm_node *root = index_mm_readroot(idx);
1068 struct strbuf buf;
1069 struct index_value *out = NULL;
1070
1071 strbuf_init(&buf);
1072 index_mm_searchwild_node(root, &buf, key, 0, &out);
1073 strbuf_release(&buf);
1074 return out;
1075 }
1076