1 |
|
|
/* $OpenBSD: dbm_map.c,v 1.6 2017/02/09 18:26:17 schwarze Exp $ */ |
2 |
|
|
/* |
3 |
|
|
* Copyright (c) 2016 Ingo Schwarze <schwarze@openbsd.org> |
4 |
|
|
* |
5 |
|
|
* Permission to use, copy, modify, and distribute this software for any |
6 |
|
|
* purpose with or without fee is hereby granted, provided that the above |
7 |
|
|
* copyright notice and this permission notice appear in all copies. |
8 |
|
|
* |
9 |
|
|
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES |
10 |
|
|
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF |
11 |
|
|
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR |
12 |
|
|
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES |
13 |
|
|
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN |
14 |
|
|
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
15 |
|
|
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
16 |
|
|
* |
17 |
|
|
* Low-level routines for the map-based version |
18 |
|
|
* of the mandoc database, for read-only access. |
19 |
|
|
* The interface is defined in "dbm_map.h". |
20 |
|
|
*/ |
21 |
|
|
#include <sys/mman.h> |
22 |
|
|
#include <sys/stat.h> |
23 |
|
|
#include <sys/types.h> |
24 |
|
|
|
25 |
|
|
#include <endian.h> |
26 |
|
|
#include <err.h> |
27 |
|
|
#include <errno.h> |
28 |
|
|
#include <fcntl.h> |
29 |
|
|
#include <regex.h> |
30 |
|
|
#include <stdint.h> |
31 |
|
|
#include <stdlib.h> |
32 |
|
|
#include <string.h> |
33 |
|
|
#include <unistd.h> |
34 |
|
|
|
35 |
|
|
#include "mansearch.h" |
36 |
|
|
#include "dbm_map.h" |
37 |
|
|
#include "dbm.h" |
38 |
|
|
|
39 |
|
|
/* Result of fstat(2) on the database file; st_size is the mapping length. */
static struct stat	 st;
/* Start of the mapped database; dbm_unmap() resets it to (char *)-1. */
static char		*dbm_base;
/* Descriptor returned by open(2) for the database file. */
static int		 ifd;
/* Set by dbm_map(); dbm_get() rejects offsets at or beyond this value. */
static int32_t		 max_offset;
43 |
|
|
|
44 |
|
|
/* |
45 |
|
|
* Open a disk-based database for read-only access. |
46 |
|
|
* Validate the file format as far as it is not mandoc-specific. |
47 |
|
|
* Return 0 on success. Return -1 and set errno on failure. |
48 |
|
|
*/ |
49 |
|
|
int |
50 |
|
|
dbm_map(const char *fname) |
51 |
|
|
{ |
52 |
|
|
int save_errno; |
53 |
|
|
const int32_t *magic; |
54 |
|
|
|
55 |
✓✓ |
408 |
if ((ifd = open(fname, O_RDONLY)) == -1) |
56 |
|
13 |
return -1; |
57 |
✓✗ |
191 |
if (fstat(ifd, &st) == -1) |
58 |
|
|
goto fail; |
59 |
✓✓ |
191 |
if (st.st_size < 5) { |
60 |
|
2 |
warnx("dbm_map(%s): File too short", fname); |
61 |
|
2 |
errno = EFTYPE; |
62 |
|
2 |
goto fail; |
63 |
|
|
} |
64 |
✗✓ |
189 |
if (st.st_size > INT32_MAX) { |
65 |
|
|
errno = EFBIG; |
66 |
|
|
goto fail; |
67 |
|
|
} |
68 |
✓✗ |
378 |
if ((dbm_base = mmap(NULL, st.st_size, PROT_READ, MAP_SHARED, |
69 |
|
378 |
ifd, 0)) == MAP_FAILED) |
70 |
|
|
goto fail; |
71 |
|
189 |
magic = dbm_getint(0); |
72 |
✓✓ |
189 |
if (be32toh(*magic) != MANDOCDB_MAGIC) { |
73 |
✓✗ |
2 |
if (strncmp(dbm_base, "SQLite format 3", 15)) |
74 |
|
2 |
warnx("dbm_map(%s): " |
75 |
|
|
"Bad initial magic %x (expected %x)", |
76 |
|
2 |
fname, be32toh(*magic), MANDOCDB_MAGIC); |
77 |
|
|
else |
78 |
|
|
warnx("dbm_map(%s): " |
79 |
|
|
"Obsolete format based on SQLite 3", |
80 |
|
|
fname); |
81 |
|
2 |
errno = EFTYPE; |
82 |
|
2 |
goto fail; |
83 |
|
|
} |
84 |
|
187 |
magic = dbm_getint(1); |
85 |
✓✓ |
187 |
if (be32toh(*magic) != MANDOCDB_VERSION) { |
86 |
|
2 |
warnx("dbm_map(%s): Bad version number %d (expected %d)", |
87 |
|
|
fname, be32toh(*magic), MANDOCDB_VERSION); |
88 |
|
2 |
errno = EFTYPE; |
89 |
|
2 |
goto fail; |
90 |
|
|
} |
91 |
|
185 |
max_offset = be32toh(*dbm_getint(3)) + sizeof(int32_t); |
92 |
✓✓ |
185 |
if (st.st_size != max_offset) { |
93 |
|
2 |
warnx("dbm_map(%s): Inconsistent file size %lld (expected %d)", |
94 |
|
|
fname, (long long)st.st_size, max_offset); |
95 |
|
2 |
errno = EFTYPE; |
96 |
|
2 |
goto fail; |
97 |
|
|
} |
98 |
✗✓ |
183 |
if ((magic = dbm_get(*dbm_getint(3))) == NULL) { |
99 |
|
|
errno = EFTYPE; |
100 |
|
|
goto fail; |
101 |
|
|
} |
102 |
✓✓ |
183 |
if (be32toh(*magic) != MANDOCDB_MAGIC) { |
103 |
|
2 |
warnx("dbm_map(%s): Bad final magic %x (expected %x)", |
104 |
|
|
fname, be32toh(*magic), MANDOCDB_MAGIC); |
105 |
|
2 |
errno = EFTYPE; |
106 |
|
2 |
goto fail; |
107 |
|
|
} |
108 |
|
181 |
return 0; |
109 |
|
|
|
110 |
|
|
fail: |
111 |
|
10 |
save_errno = errno; |
112 |
|
10 |
close(ifd); |
113 |
|
10 |
errno = save_errno; |
114 |
|
10 |
return -1; |
115 |
|
204 |
} |
116 |
|
|
|
117 |
|
|
void |
118 |
|
|
dbm_unmap(void) |
119 |
|
|
{ |
120 |
✗✓ |
362 |
if (munmap(dbm_base, st.st_size) == -1) |
121 |
|
|
warn("dbm_unmap: munmap"); |
122 |
✗✓ |
181 |
if (close(ifd) == -1) |
123 |
|
|
warn("dbm_unmap: close"); |
124 |
|
181 |
dbm_base = (char *)-1; |
125 |
|
181 |
} |
126 |
|
|
|
127 |
|
|
/* |
128 |
|
|
* Take a raw integer as it was read from the database. |
129 |
|
|
* Interpret it as an offset into the database file |
130 |
|
|
* and return a pointer to that place in the file. |
131 |
|
|
*/ |
132 |
|
|
void * |
133 |
|
|
dbm_get(int32_t offset) |
134 |
|
|
{ |
135 |
|
22614 |
offset = be32toh(offset); |
136 |
✓✓ |
11307 |
if (offset < 0) { |
137 |
|
52 |
warnx("dbm_get: Database corrupt: offset %d", offset); |
138 |
|
52 |
return NULL; |
139 |
|
|
} |
140 |
✓✓ |
11255 |
if (offset >= max_offset) { |
141 |
|
4 |
warnx("dbm_get: Database corrupt: offset %d > %d", |
142 |
|
|
offset, max_offset); |
143 |
|
4 |
return NULL; |
144 |
|
|
} |
145 |
|
11251 |
return dbm_base + offset; |
146 |
|
11307 |
} |
147 |
|
|
|
148 |
|
|
/* |
149 |
|
|
* Assume the database starts with some integers. |
150 |
|
|
* Assume they are numbered starting from 0, increasing. |
151 |
|
|
* Get a pointer to one with the number "offset". |
152 |
|
|
*/ |
153 |
|
|
int32_t * |
154 |
|
|
dbm_getint(int32_t offset) |
155 |
|
|
{ |
156 |
|
2714 |
return (int32_t *)dbm_base + offset; |
157 |
|
|
} |
158 |
|
|
|
159 |
|
|
/* |
160 |
|
|
* The reverse of dbm_get(). |
161 |
|
|
* Take pointer into the database file |
162 |
|
|
* and convert it to the raw integer |
163 |
|
|
* that would be used to refer to that place in the file. |
164 |
|
|
*/ |
165 |
|
|
int32_t |
166 |
|
|
dbm_addr(const void *p) |
167 |
|
|
{ |
168 |
|
514 |
return htobe32((const char *)p - dbm_base); |
169 |
|
|
} |
170 |
|
|
|
171 |
|
|
int |
172 |
|
|
dbm_match(const struct dbm_match *match, const char *str) |
173 |
|
|
{ |
174 |
✓✓✓✗
|
124844 |
switch (match->type) { |
175 |
|
|
case DBM_EXACT: |
176 |
|
62274 |
return strcmp(str, match->str) == 0; |
177 |
|
|
case DBM_SUB: |
178 |
|
138 |
return strcasestr(str, match->str) != NULL; |
179 |
|
|
case DBM_REGEX: |
180 |
|
10 |
return regexec(match->re, str, 0, NULL, 0) == 0; |
181 |
|
|
default: |
182 |
|
|
abort(); |
183 |
|
|
} |
184 |
|
62422 |
} |