xref: /illumos-gate/usr/src/cmd/mandoc/mansearch.c (revision e153cda9f9660e385e8f468253f80e59f5d454d7)
1 /*	$Id: mansearch.c,v 1.77 2017/08/22 17:50:11 schwarze Exp $ */
2 /*
3  * Copyright (c) 2012 Kristaps Dzonsons <kristaps@bsd.lv>
4  * Copyright (c) 2013-2017 Ingo Schwarze <schwarze@openbsd.org>
5  *
6  * Permission to use, copy, modify, and distribute this software for any
7  * purpose with or without fee is hereby granted, provided that the above
8  * copyright notice and this permission notice appear in all copies.
9  *
10  * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHORS DISCLAIM ALL WARRANTIES
11  * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
12  * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
13  * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
14  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
15  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
16  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
17  */
18 #include "config.h"
19 
20 #include <sys/mman.h>
21 #include <sys/types.h>
22 
23 #include <assert.h>
24 #if HAVE_ERR
25 #include <err.h>
26 #endif
27 #include <errno.h>
28 #include <fcntl.h>
29 #include <glob.h>
30 #include <limits.h>
31 #include <regex.h>
32 #include <stdio.h>
33 #include <stdint.h>
34 #include <stddef.h>
35 #include <stdlib.h>
36 #include <string.h>
37 #include <unistd.h>
38 
39 #include "mandoc.h"
40 #include "mandoc_aux.h"
41 #include "mandoc_ohash.h"
42 #include "manconf.h"
43 #include "mansearch.h"
44 #include "dbm.h"
45 
46 struct	expr {
47 	/* Used for terms: */
48 	struct dbm_match match;   /* Match type and expression. */
49 	uint64_t	 bits;    /* Type mask. */
50 	/* Used for OR and AND groups: */
51 	struct expr	*next;    /* Next child in the parent group. */
52 	struct expr	*child;   /* First child in this group. */
53 	enum { EXPR_TERM, EXPR_OR, EXPR_AND } type;
54 };
55 
56 const char *const mansearch_keynames[KEY_MAX] = {
57 	"arch",	"sec",	"Xr",	"Ar",	"Fa",	"Fl",	"Dv",	"Fn",
58 	"Ic",	"Pa",	"Cm",	"Li",	"Em",	"Cd",	"Va",	"Ft",
59 	"Tn",	"Er",	"Ev",	"Sy",	"Sh",	"In",	"Ss",	"Ox",
60 	"An",	"Mt",	"St",	"Bx",	"At",	"Nx",	"Fx",	"Lk",
61 	"Ms",	"Bsx",	"Dx",	"Rs",	"Vt",	"Lb",	"Nm",	"Nd"
62 };
63 
64 
/* Evaluating a compiled expression against the open database. */
static	struct ohash	*manmerge(struct expr *e, struct ohash *htab);
static	struct ohash	*manmerge_term(struct expr *e, struct ohash *htab);
static	struct ohash	*manmerge_or(struct expr *e, struct ohash *htab);
static	struct ohash	*manmerge_and(struct expr *e, struct ohash *htab);

/* Formatting and filtering of result entries. */
static	char		*buildnames(const struct dbm_page *page);
static	char		*buildoutput(size_t im, struct dbm_page *page);
static	size_t		 lstlen(const char *cp, size_t sep);
static	void		 lstcat(char *buf, size_t *i, const char *cp,
				const char *sep);
static	int		 lstmatch(const char *want, const char *have);
static	int		 manpage_compare(const void *vp1, const void *vp2);

/* Compiling and releasing search expressions. */
static	struct expr	*exprcomp(const struct mansearch *search,
				int argc, char *argv[], int *argi);
static	struct expr	*expr_and(const struct mansearch *search,
				int argc, char *argv[], int *argi);
static	struct expr	*exprterm(const struct mansearch *search,
				int argc, char *argv[], int *argi);
static	void		 exprfree(struct expr *e);
82 
83 
84 int
85 mansearch(const struct mansearch *search,
86 		const struct manpaths *paths,
87 		int argc, char *argv[],
88 		struct manpage **res, size_t *sz)
89 {
90 	char		 buf[PATH_MAX];
91 	struct dbm_res	*rp;
92 	struct expr	*e;
93 	struct dbm_page	*page;
94 	struct manpage	*mpage;
95 	struct ohash	*htab;
96 	size_t		 cur, i, maxres, outkey;
97 	unsigned int	 slot;
98 	int		 argi, chdir_status, getcwd_status, im;
99 
100 	argi = 0;
101 	if ((e = exprcomp(search, argc, argv, &argi)) == NULL) {
102 		*sz = 0;
103 		return 0;
104 	}
105 
106 	cur = maxres = 0;
107 	if (res != NULL)
108 		*res = NULL;
109 
110 	outkey = KEY_Nd;
111 	if (search->outkey != NULL)
112 		for (im = 0; im < KEY_MAX; im++)
113 			if (0 == strcasecmp(search->outkey,
114 			    mansearch_keynames[im])) {
115 				outkey = im;
116 				break;
117 			}
118 
119 	/*
120 	 * Remember the original working directory, if possible.
121 	 * This will be needed if the second or a later directory
122 	 * is given as a relative path.
123 	 * Do not error out if the current directory is not
124 	 * searchable: Maybe it won't be needed after all.
125 	 */
126 
127 	if (getcwd(buf, PATH_MAX) == NULL) {
128 		getcwd_status = 0;
129 		(void)strlcpy(buf, strerror(errno), sizeof(buf));
130 	} else
131 		getcwd_status = 1;
132 
133 	/*
134 	 * Loop over the directories (containing databases) for us to
135 	 * search.
136 	 * Don't let missing/bad databases/directories phase us.
137 	 * In each, try to open the resident database and, if it opens,
138 	 * scan it for our match expression.
139 	 */
140 
141 	chdir_status = 0;
142 	for (i = 0; i < paths->sz; i++) {
143 		if (chdir_status && paths->paths[i][0] != '/') {
144 			if ( ! getcwd_status) {
145 				warnx("%s: getcwd: %s", paths->paths[i], buf);
146 				continue;
147 			} else if (chdir(buf) == -1) {
148 				warn("%s", buf);
149 				continue;
150 			}
151 		}
152 		if (chdir(paths->paths[i]) == -1) {
153 			warn("%s", paths->paths[i]);
154 			continue;
155 		}
156 		chdir_status = 1;
157 
158 		if (dbm_open(MANDOC_DB) == -1) {
159 			if (errno != ENOENT)
160 				warn("%s/%s", paths->paths[i], MANDOC_DB);
161 			continue;
162 		}
163 
164 		if ((htab = manmerge(e, NULL)) == NULL) {
165 			dbm_close();
166 			continue;
167 		}
168 
169 		for (rp = ohash_first(htab, &slot); rp != NULL;
170 		    rp = ohash_next(htab, &slot)) {
171 			page = dbm_page_get(rp->page);
172 
173 			if (lstmatch(search->sec, page->sect) == 0 ||
174 			    lstmatch(search->arch, page->arch) == 0 ||
175 			    (search->argmode == ARG_NAME &&
176 			     rp->bits <= (int32_t)(NAME_SYN & NAME_MASK)))
177 				continue;
178 
179 			if (res == NULL) {
180 				cur = 1;
181 				break;
182 			}
183 			if (cur + 1 > maxres) {
184 				maxres += 1024;
185 				*res = mandoc_reallocarray(*res,
186 				    maxres, sizeof(**res));
187 			}
188 			mpage = *res + cur;
189 			mandoc_asprintf(&mpage->file, "%s/%s",
190 			    paths->paths[i], page->file + 1);
191 			if (access(chdir_status ? page->file + 1 :
192 			    mpage->file, R_OK) == -1) {
193 				warn("%s", mpage->file);
194 				warnx("outdated mandoc.db contains "
195 				    "bogus %s entry, run makewhatis %s",
196 				    page->file + 1, paths->paths[i]);
197 				free(mpage->file);
198 				free(rp);
199 				continue;
200 			}
201 			mpage->names = buildnames(page);
202 			mpage->output = buildoutput(outkey, page);
203 			mpage->ipath = i;
204 			mpage->bits = rp->bits;
205 			mpage->sec = *page->sect - '0';
206 			if (mpage->sec < 0 || mpage->sec > 9)
207 				mpage->sec = 10;
208 			mpage->form = *page->file;
209 			free(rp);
210 			cur++;
211 		}
212 		ohash_delete(htab);
213 		free(htab);
214 		dbm_close();
215 
216 		/*
217 		 * In man(1) mode, prefer matches in earlier trees
218 		 * over matches in later trees.
219 		 */
220 
221 		if (cur && search->firstmatch)
222 			break;
223 	}
224 	if (res != NULL)
225 		qsort(*res, cur, sizeof(struct manpage), manpage_compare);
226 	if (chdir_status && getcwd_status && chdir(buf) == -1)
227 		warn("%s", buf);
228 	exprfree(e);
229 	*sz = cur;
230 	return res != NULL || cur;
231 }
232 
233 /*
234  * Merge the results for the expression tree rooted at e
235  * into the the result list htab.
236  */
237 static struct ohash *
238 manmerge(struct expr *e, struct ohash *htab)
239 {
240 	switch (e->type) {
241 	case EXPR_TERM:
242 		return manmerge_term(e, htab);
243 	case EXPR_OR:
244 		return manmerge_or(e->child, htab);
245 	case EXPR_AND:
246 		return manmerge_and(e->child, htab);
247 	default:
248 		abort();
249 	}
250 }
251 
252 static struct ohash *
253 manmerge_term(struct expr *e, struct ohash *htab)
254 {
255 	struct dbm_res	 res, *rp;
256 	uint64_t	 ib;
257 	unsigned int	 slot;
258 	int		 im;
259 
260 	if (htab == NULL) {
261 		htab = mandoc_malloc(sizeof(*htab));
262 		mandoc_ohash_init(htab, 4, offsetof(struct dbm_res, page));
263 	}
264 
265 	for (im = 0, ib = 1; im < KEY_MAX; im++, ib <<= 1) {
266 		if ((e->bits & ib) == 0)
267 			continue;
268 
269 		switch (ib) {
270 		case TYPE_arch:
271 			dbm_page_byarch(&e->match);
272 			break;
273 		case TYPE_sec:
274 			dbm_page_bysect(&e->match);
275 			break;
276 		case TYPE_Nm:
277 			dbm_page_byname(&e->match);
278 			break;
279 		case TYPE_Nd:
280 			dbm_page_bydesc(&e->match);
281 			break;
282 		default:
283 			dbm_page_bymacro(im - 2, &e->match);
284 			break;
285 		}
286 
287 		/*
288 		 * When hashing for deduplication, use the unique
289 		 * page ID itself instead of a hash function;
290 		 * that is quite efficient.
291 		 */
292 
293 		for (;;) {
294 			res = dbm_page_next();
295 			if (res.page == -1)
296 				break;
297 			slot = ohash_lookup_memory(htab,
298 			    (char *)&res, sizeof(res.page), res.page);
299 			if ((rp = ohash_find(htab, slot)) != NULL) {
300 				rp->bits |= res.bits;
301 				continue;
302 			}
303 			rp = mandoc_malloc(sizeof(*rp));
304 			*rp = res;
305 			ohash_insert(htab, slot, rp);
306 		}
307 	}
308 	return htab;
309 }
310 
311 static struct ohash *
312 manmerge_or(struct expr *e, struct ohash *htab)
313 {
314 	while (e != NULL) {
315 		htab = manmerge(e, htab);
316 		e = e->next;
317 	}
318 	return htab;
319 }
320 
321 static struct ohash *
322 manmerge_and(struct expr *e, struct ohash *htab)
323 {
324 	struct ohash	*hand, *h1, *h2;
325 	struct dbm_res	*res;
326 	unsigned int	 slot1, slot2;
327 
328 	/* Evaluate the first term of the AND clause. */
329 
330 	hand = manmerge(e, NULL);
331 
332 	while ((e = e->next) != NULL) {
333 
334 		/* Evaluate the next term and prepare for ANDing. */
335 
336 		h2 = manmerge(e, NULL);
337 		if (ohash_entries(h2) < ohash_entries(hand)) {
338 			h1 = h2;
339 			h2 = hand;
340 		} else
341 			h1 = hand;
342 		hand = mandoc_malloc(sizeof(*hand));
343 		mandoc_ohash_init(hand, 4, offsetof(struct dbm_res, page));
344 
345 		/* Keep all pages that are in both result sets. */
346 
347 		for (res = ohash_first(h1, &slot1); res != NULL;
348 		    res = ohash_next(h1, &slot1)) {
349 			if (ohash_find(h2, ohash_lookup_memory(h2,
350 			    (char *)res, sizeof(res->page),
351 			    res->page)) == NULL)
352 				free(res);
353 			else
354 				ohash_insert(hand, ohash_lookup_memory(hand,
355 				    (char *)res, sizeof(res->page),
356 				    res->page), res);
357 		}
358 
359 		/* Discard the merged results. */
360 
361 		for (res = ohash_first(h2, &slot2); res != NULL;
362 		    res = ohash_next(h2, &slot2))
363 			free(res);
364 		ohash_delete(h2);
365 		free(h2);
366 		ohash_delete(h1);
367 		free(h1);
368 	}
369 
370 	/* Merge the result of the AND into htab. */
371 
372 	if (htab == NULL)
373 		return hand;
374 
375 	for (res = ohash_first(hand, &slot1); res != NULL;
376 	    res = ohash_next(hand, &slot1)) {
377 		slot2 = ohash_lookup_memory(htab,
378 		    (char *)res, sizeof(res->page), res->page);
379 		if (ohash_find(htab, slot2) == NULL)
380 			ohash_insert(htab, slot2, res);
381 		else
382 			free(res);
383 	}
384 
385 	/* Discard the merged result. */
386 
387 	ohash_delete(hand);
388 	free(hand);
389 	return htab;
390 }
391 
392 void
393 mansearch_free(struct manpage *res, size_t sz)
394 {
395 	size_t	 i;
396 
397 	for (i = 0; i < sz; i++) {
398 		free(res[i].file);
399 		free(res[i].names);
400 		free(res[i].output);
401 	}
402 	free(res);
403 }
404 
405 static int
406 manpage_compare(const void *vp1, const void *vp2)
407 {
408 	const struct manpage	*mp1, *mp2;
409 	const char		*cp1, *cp2;
410 	size_t			 sz1, sz2;
411 	int			 diff;
412 
413 	mp1 = vp1;
414 	mp2 = vp2;
415 	if ((diff = mp2->bits - mp1->bits) ||
416 	    (diff = mp1->sec - mp2->sec))
417 		return diff;
418 
419 	/* Fall back to alphabetic ordering of names. */
420 	sz1 = strcspn(mp1->names, "(");
421 	sz2 = strcspn(mp2->names, "(");
422 	if (sz1 < sz2)
423 		sz1 = sz2;
424 	if ((diff = strncasecmp(mp1->names, mp2->names, sz1)))
425 		return diff;
426 
427 	/* For identical names and sections, prefer arch-dependent. */
428 	cp1 = strchr(mp1->names + sz1, '/');
429 	cp2 = strchr(mp2->names + sz2, '/');
430 	return cp1 != NULL && cp2 != NULL ? strcasecmp(cp1, cp2) :
431 	    cp1 != NULL ? -1 : cp2 != NULL ? 1 : 0;
432 }
433 
434 static char *
435 buildnames(const struct dbm_page *page)
436 {
437 	char	*buf;
438 	size_t	 i, sz;
439 
440 	sz = lstlen(page->name, 2) + 1 + lstlen(page->sect, 2) +
441 	    (page->arch == NULL ? 0 : 1 + lstlen(page->arch, 2)) + 2;
442 	buf = mandoc_malloc(sz);
443 	i = 0;
444 	lstcat(buf, &i, page->name, ", ");
445 	buf[i++] = '(';
446 	lstcat(buf, &i, page->sect, ", ");
447 	if (page->arch != NULL) {
448 		buf[i++] = '/';
449 		lstcat(buf, &i, page->arch, ", ");
450 	}
451 	buf[i++] = ')';
452 	buf[i++] = '\0';
453 	assert(i == sz);
454 	return buf;
455 }
456 
457 /*
458  * Count the buffer space needed to print the NUL-terminated
459  * list of NUL-terminated strings, when printing sep separator
460  * characters between strings.
461  */
462 static size_t
463 lstlen(const char *cp, size_t sep)
464 {
465 	size_t	 sz;
466 
467 	for (sz = 0; *cp != '\0'; cp++) {
468 
469 		/* Skip names appearing only in the SYNOPSIS. */
470 		if (*cp <= (char)(NAME_SYN & NAME_MASK)) {
471 			while (*cp != '\0')
472 				cp++;
473 			continue;
474 		}
475 
476 		/* Skip name class markers. */
477 		if (*cp < ' ')
478 			cp++;
479 
480 		/* Print a separator before each but the first string. */
481 		if (sz)
482 			sz += sep;
483 
484 		/* Copy one string. */
485 		while (*cp != '\0') {
486 			sz++;
487 			cp++;
488 		}
489 	}
490 	return sz;
491 }
492 
493 /*
494  * Print the NUL-terminated list of NUL-terminated strings
495  * into the buffer, seperating strings with sep.
496  */
497 static void
498 lstcat(char *buf, size_t *i, const char *cp, const char *sep)
499 {
500 	const char	*s;
501 	size_t		 i_start;
502 
503 	for (i_start = *i; *cp != '\0'; cp++) {
504 
505 		/* Skip names appearing only in the SYNOPSIS. */
506 		if (*cp <= (char)(NAME_SYN & NAME_MASK)) {
507 			while (*cp != '\0')
508 				cp++;
509 			continue;
510 		}
511 
512 		/* Skip name class markers. */
513 		if (*cp < ' ')
514 			cp++;
515 
516 		/* Print a separator before each but the first string. */
517 		if (*i > i_start) {
518 			s = sep;
519 			while (*s != '\0')
520 				buf[(*i)++] = *s++;
521 		}
522 
523 		/* Copy one string. */
524 		while (*cp != '\0')
525 			buf[(*i)++] = *cp++;
526 	}
527 
528 }
529 
/*
 * Check whether the string want occurs, ignoring case, as a
 * substring of any of the strings in the NUL-terminated list
 * of NUL-terminated strings have.
 * Returns 1 on a match and 0 otherwise.
 * If want or have is NULL or if have is empty, no filtering
 * is desired and 1 is returned.
 */
static int
lstmatch(const char *want, const char *have)
{
	const char	*item;

	if (want == NULL || have == NULL || *have == '\0')
		return 1;
	for (item = have; *item != '\0'; item += strlen(item) + 1)
		if (strcasestr(item, want) != NULL)
			return 1;
	return 0;
}
548 
549 /*
550  * Build a list of values taken by the macro im in the manual page.
551  */
552 static char *
553 buildoutput(size_t im, struct dbm_page *page)
554 {
555 	const char	*oldoutput, *sep, *input;
556 	char		*output, *newoutput, *value;
557 	size_t		 sz, i;
558 
559 	switch (im) {
560 	case KEY_Nd:
561 		return mandoc_strdup(page->desc);
562 	case KEY_Nm:
563 		input = page->name;
564 		break;
565 	case KEY_sec:
566 		input = page->sect;
567 		break;
568 	case KEY_arch:
569 		input = page->arch;
570 		if (input == NULL)
571 			input = "all\0";
572 		break;
573 	default:
574 		input = NULL;
575 		break;
576 	}
577 
578 	if (input != NULL) {
579 		sz = lstlen(input, 3) + 1;
580 		output = mandoc_malloc(sz);
581 		i = 0;
582 		lstcat(output, &i, input, " # ");
583 		output[i++] = '\0';
584 		assert(i == sz);
585 		return output;
586 	}
587 
588 	output = NULL;
589 	dbm_macro_bypage(im - 2, page->addr);
590 	while ((value = dbm_macro_next()) != NULL) {
591 		if (output == NULL) {
592 			oldoutput = "";
593 			sep = "";
594 		} else {
595 			oldoutput = output;
596 			sep = " # ";
597 		}
598 		mandoc_asprintf(&newoutput, "%s%s%s", oldoutput, sep, value);
599 		free(output);
600 		output = newoutput;
601 	}
602 	return output;
603 }
604 
605 /*
606  * Compile a set of string tokens into an expression.
607  * Tokens in "argv" are assumed to be individual expression atoms (e.g.,
608  * "(", "foo=bar", etc.).
609  */
610 static struct expr *
611 exprcomp(const struct mansearch *search, int argc, char *argv[], int *argi)
612 {
613 	struct expr	*parent, *child;
614 	int		 needterm, nested;
615 
616 	if ((nested = *argi) == argc)
617 		return NULL;
618 	needterm = 1;
619 	parent = child = NULL;
620 	while (*argi < argc) {
621 		if (strcmp(")", argv[*argi]) == 0) {
622 			if (needterm)
623 				warnx("missing term "
624 				    "before closing parenthesis");
625 			needterm = 0;
626 			if (nested)
627 				break;
628 			warnx("ignoring unmatched right parenthesis");
629 			++*argi;
630 			continue;
631 		}
632 		if (strcmp("-o", argv[*argi]) == 0) {
633 			if (needterm) {
634 				if (*argi > 0)
635 					warnx("ignoring -o after %s",
636 					    argv[*argi - 1]);
637 				else
638 					warnx("ignoring initial -o");
639 			}
640 			needterm = 1;
641 			++*argi;
642 			continue;
643 		}
644 		needterm = 0;
645 		if (child == NULL) {
646 			child = expr_and(search, argc, argv, argi);
647 			continue;
648 		}
649 		if (parent == NULL) {
650 			parent = mandoc_calloc(1, sizeof(*parent));
651 			parent->type = EXPR_OR;
652 			parent->next = NULL;
653 			parent->child = child;
654 		}
655 		child->next = expr_and(search, argc, argv, argi);
656 		child = child->next;
657 	}
658 	if (needterm && *argi)
659 		warnx("ignoring trailing %s", argv[*argi - 1]);
660 	return parent == NULL ? child : parent;
661 }
662 
663 static struct expr *
664 expr_and(const struct mansearch *search, int argc, char *argv[], int *argi)
665 {
666 	struct expr	*parent, *child;
667 	int		 needterm;
668 
669 	needterm = 1;
670 	parent = child = NULL;
671 	while (*argi < argc) {
672 		if (strcmp(")", argv[*argi]) == 0) {
673 			if (needterm)
674 				warnx("missing term "
675 				    "before closing parenthesis");
676 			needterm = 0;
677 			break;
678 		}
679 		if (strcmp("-o", argv[*argi]) == 0)
680 			break;
681 		if (strcmp("-a", argv[*argi]) == 0) {
682 			if (needterm) {
683 				if (*argi > 0)
684 					warnx("ignoring -a after %s",
685 					    argv[*argi - 1]);
686 				else
687 					warnx("ignoring initial -a");
688 			}
689 			needterm = 1;
690 			++*argi;
691 			continue;
692 		}
693 		if (needterm == 0)
694 			break;
695 		if (child == NULL) {
696 			child = exprterm(search, argc, argv, argi);
697 			if (child != NULL)
698 				needterm = 0;
699 			continue;
700 		}
701 		needterm = 0;
702 		if (parent == NULL) {
703 			parent = mandoc_calloc(1, sizeof(*parent));
704 			parent->type = EXPR_AND;
705 			parent->next = NULL;
706 			parent->child = child;
707 		}
708 		child->next = exprterm(search, argc, argv, argi);
709 		if (child->next != NULL) {
710 			child = child->next;
711 			needterm = 0;
712 		}
713 	}
714 	if (needterm && *argi)
715 		warnx("ignoring trailing %s", argv[*argi - 1]);
716 	return parent == NULL ? child : parent;
717 }
718 
719 static struct expr *
720 exprterm(const struct mansearch *search, int argc, char *argv[], int *argi)
721 {
722 	char		 errbuf[BUFSIZ];
723 	struct expr	*e;
724 	char		*key, *val;
725 	uint64_t	 iterbit;
726 	int		 cs, i, irc;
727 
728 	if (strcmp("(", argv[*argi]) == 0) {
729 		++*argi;
730 		e = exprcomp(search, argc, argv, argi);
731 		if (*argi < argc) {
732 			assert(strcmp(")", argv[*argi]) == 0);
733 			++*argi;
734 		} else
735 			warnx("unclosed parenthesis");
736 		return e;
737 	}
738 
739 	if (strcmp("-i", argv[*argi]) == 0 && *argi + 1 < argc) {
740 		cs = 0;
741 		++*argi;
742 	} else
743 		cs = 1;
744 
745 	e = mandoc_calloc(1, sizeof(*e));
746 	e->type = EXPR_TERM;
747 	e->bits = 0;
748 	e->next = NULL;
749 	e->child = NULL;
750 
751 	if (search->argmode == ARG_NAME) {
752 		e->bits = TYPE_Nm;
753 		e->match.type = DBM_EXACT;
754 		e->match.str = argv[(*argi)++];
755 		return e;
756 	}
757 
758 	/*
759 	 * Separate macro keys from search string.
760 	 * If needed, request regular expression handling.
761 	 */
762 
763 	if (search->argmode == ARG_WORD) {
764 		e->bits = TYPE_Nm;
765 		e->match.type = DBM_REGEX;
766 #if HAVE_REWB_BSD
767 		mandoc_asprintf(&val, "[[:<:]]%s[[:>:]]", argv[*argi]);
768 #elif HAVE_REWB_SYSV
769 		mandoc_asprintf(&val, "\\<%s\\>", argv[*argi]);
770 #else
771 		mandoc_asprintf(&val,
772 		    "(^|[^a-zA-Z01-9_])%s([^a-zA-Z01-9_]|$)", argv[*argi]);
773 #endif
774 		cs = 0;
775 	} else if ((val = strpbrk(argv[*argi], "=~")) == NULL) {
776 		e->bits = TYPE_Nm | TYPE_Nd;
777 		e->match.type = DBM_SUB;
778 		e->match.str = argv[*argi];
779 	} else {
780 		if (val == argv[*argi])
781 			e->bits = TYPE_Nm | TYPE_Nd;
782 		if (*val == '=') {
783 			e->match.type = DBM_SUB;
784 			e->match.str = val + 1;
785 		} else
786 			e->match.type = DBM_REGEX;
787 		*val++ = '\0';
788 		if (strstr(argv[*argi], "arch") != NULL)
789 			cs = 0;
790 	}
791 
792 	/* Compile regular expressions. */
793 
794 	if (e->match.type == DBM_REGEX) {
795 		e->match.re = mandoc_malloc(sizeof(*e->match.re));
796 		irc = regcomp(e->match.re, val,
797 		    REG_EXTENDED | REG_NOSUB | (cs ? 0 : REG_ICASE));
798 		if (irc) {
799 			regerror(irc, e->match.re, errbuf, sizeof(errbuf));
800 			warnx("regcomp /%s/: %s", val, errbuf);
801 		}
802 		if (search->argmode == ARG_WORD)
803 			free(val);
804 		if (irc) {
805 			free(e->match.re);
806 			free(e);
807 			++*argi;
808 			return NULL;
809 		}
810 	}
811 
812 	if (e->bits) {
813 		++*argi;
814 		return e;
815 	}
816 
817 	/*
818 	 * Parse out all possible fields.
819 	 * If the field doesn't resolve, bail.
820 	 */
821 
822 	while (NULL != (key = strsep(&argv[*argi], ","))) {
823 		if ('\0' == *key)
824 			continue;
825 		for (i = 0, iterbit = 1; i < KEY_MAX; i++, iterbit <<= 1) {
826 			if (0 == strcasecmp(key, mansearch_keynames[i])) {
827 				e->bits |= iterbit;
828 				break;
829 			}
830 		}
831 		if (i == KEY_MAX) {
832 			if (strcasecmp(key, "any"))
833 				warnx("treating unknown key "
834 				    "\"%s\" as \"any\"", key);
835 			e->bits |= ~0ULL;
836 		}
837 	}
838 
839 	++*argi;
840 	return e;
841 }
842 
843 static void
844 exprfree(struct expr *e)
845 {
846 	if (e->next != NULL)
847 		exprfree(e->next);
848 	if (e->child != NULL)
849 		exprfree(e->child);
850 	free(e);
851 }
852