1 | /*- |
2 | * Copyright (c) 1990, 1993, 1994 |
3 | * The Regents of the University of California. All rights reserved. |
4 | * |
5 | * This code is derived from software contributed to Berkeley by |
6 | * Mike Olson. |
7 | * |
8 | * Redistribution and use in source and binary forms, with or without |
9 | * modification, are permitted provided that the following conditions |
10 | * are met: |
11 | * 1. Redistributions of source code must retain the above copyright |
12 | * notice, this list of conditions and the following disclaimer. |
13 | * 2. Redistributions in binary form must reproduce the above copyright |
14 | * notice, this list of conditions and the following disclaimer in the |
15 | * documentation and/or other materials provided with the distribution. |
16 | * 3. All advertising materials mentioning features or use of this software |
17 | * must display the following acknowledgement: |
18 | * This product includes software developed by the University of |
19 | * California, Berkeley and its contributors. |
20 | * 4. Neither the name of the University nor the names of its contributors |
21 | * may be used to endorse or promote products derived from this software |
22 | * without specific prior written permission. |
23 | * |
24 | * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND |
25 | * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
26 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
27 | * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE |
28 | * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL |
29 | * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS |
30 | * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) |
31 | * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT |
32 | * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY |
33 | * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF |
34 | * SUCH DAMAGE. |
35 | */ |
36 | |
37 | #if defined(LIBC_SCCS) && !defined(lint) |
38 | static char sccsid[] = "@(#)bt_put.c 8.8 (Berkeley) 7/26/94" ; |
39 | #endif /* LIBC_SCCS and not lint */ |
40 | |
41 | #include <sys/types.h> |
42 | |
43 | #include <errno.h> |
44 | #include <stdio.h> |
45 | #include <stdlib.h> |
46 | #include <string.h> |
47 | |
48 | #include <db.h> |
49 | #include "btree.h" |
50 | |
51 | static EPG *bt_fast __P((BTREE *, const DBT *, const DBT *, int *)); |
52 | |
53 | /* |
54 | * __BT_PUT -- Add a btree item to the tree. |
55 | * |
56 | * Parameters: |
57 | * dbp: pointer to access method |
58 | * key: key |
59 | * data: data |
60 | * flag: R_NOOVERWRITE |
61 | * |
62 | * Returns: |
63 | * RET_ERROR, RET_SUCCESS and RET_SPECIAL if the key is already in the |
64 | * tree and R_NOOVERWRITE specified. |
65 | */ |
66 | int |
67 | __bt_put(dbp, key, data, flags) |
68 | const DB *dbp; |
69 | DBT *key; |
70 | const DBT *data; |
71 | u_int flags; |
72 | { |
73 | BTREE *t; |
74 | DBT tkey, tdata; |
75 | EPG *e = NULL; |
76 | PAGE *h; |
77 | indx_t index, nxtindex; |
78 | pgno_t pg; |
79 | u_int32_t nbytes; |
80 | int dflags, exact, status; |
81 | char *dest, db[NOVFLSIZE], kb[NOVFLSIZE]; |
82 | |
83 | t = dbp->internal; |
84 | |
85 | /* Toss any page pinned across calls. */ |
86 | if (t->bt_pinned != NULL) { |
87 | mpool_put(t->bt_mp, t->bt_pinned, 0); |
88 | t->bt_pinned = NULL; |
89 | } |
90 | |
91 | /* Check for change to a read-only tree. */ |
92 | if (F_ISSET(t, B_RDONLY)) { |
93 | errno = EPERM; |
94 | return (RET_ERROR); |
95 | } |
96 | |
97 | switch (flags) { |
98 | case 0: |
99 | case R_NOOVERWRITE: |
100 | break; |
101 | case R_CURSOR: |
102 | /* |
103 | * If flags is R_CURSOR, put the cursor. Must already |
104 | * have started a scan and not have already deleted it. |
105 | */ |
106 | if (F_ISSET(&t->bt_cursor, CURS_INIT) && |
107 | !F_ISSET(&t->bt_cursor, |
108 | CURS_ACQUIRE | CURS_AFTER | CURS_BEFORE)) |
109 | break; |
110 | /* FALLTHROUGH */ |
111 | default: |
112 | errno = EINVAL; |
113 | return (RET_ERROR); |
114 | } |
115 | |
116 | /* |
117 | * If the key/data pair won't fit on a page, store it on overflow |
118 | * pages. Only put the key on the overflow page if the pair are |
119 | * still too big after moving the data to an overflow page. |
120 | * |
121 | * XXX |
122 | * If the insert fails later on, the overflow pages aren't recovered. |
123 | */ |
124 | dflags = 0; |
125 | if (key->size + data->size > t->bt_ovflsize) { |
126 | if (key->size > t->bt_ovflsize) { |
127 | storekey: if (__ovfl_put(t, key, &pg) == RET_ERROR) |
128 | return (RET_ERROR); |
129 | tkey.data = kb; |
130 | tkey.size = NOVFLSIZE; |
131 | memmove(kb, &pg, sizeof(pgno_t)); |
132 | memmove(kb + sizeof(pgno_t), |
133 | &key->size, sizeof(u_int32_t)); |
134 | dflags |= P_BIGKEY; |
135 | key = &tkey; |
136 | } |
137 | if (key->size + data->size > t->bt_ovflsize) { |
138 | if (__ovfl_put(t, data, &pg) == RET_ERROR) |
139 | return (RET_ERROR); |
140 | tdata.data = db; |
141 | tdata.size = NOVFLSIZE; |
142 | memmove(db, &pg, sizeof(pgno_t)); |
143 | memmove(db + sizeof(pgno_t), |
144 | &data->size, sizeof(u_int32_t)); |
145 | dflags |= P_BIGDATA; |
146 | data = &tdata; |
147 | } |
148 | if (key->size + data->size > t->bt_ovflsize) |
149 | goto storekey; |
150 | } |
151 | |
152 | /* Replace the cursor. */ |
153 | if (flags == R_CURSOR) { |
154 | if ((h = mpool_get(t->bt_mp, t->bt_cursor.pg.pgno, 0)) == NULL) |
155 | return (RET_ERROR); |
156 | index = t->bt_cursor.pg.index; |
157 | goto delete; |
158 | } |
159 | |
160 | /* |
161 | * Find the key to delete, or, the location at which to insert. |
162 | * Bt_fast and __bt_search both pin the returned page. |
163 | */ |
164 | if (t->bt_order == NOT || (e = bt_fast(t, key, data, &exact)) == NULL) |
165 | if ((e = __bt_search(t, key, &exact)) == NULL) |
166 | return (RET_ERROR); |
167 | h = e->page; |
168 | index = e->index; |
169 | |
170 | /* |
171 | * Add the key/data pair to the tree. If an identical key is already |
172 | * in the tree, and R_NOOVERWRITE is set, an error is returned. If |
173 | * R_NOOVERWRITE is not set, the key is either added (if duplicates are |
174 | * permitted) or an error is returned. |
175 | */ |
176 | switch (flags) { |
177 | case R_NOOVERWRITE: |
178 | if (!exact) |
179 | break; |
180 | mpool_put(t->bt_mp, h, 0); |
181 | return (RET_SPECIAL); |
182 | default: |
183 | if (!exact || !F_ISSET(t, B_NODUPS)) |
184 | break; |
185 | /* |
186 | * !!! |
187 | * Note, the delete may empty the page, so we need to put a |
188 | * new entry into the page immediately. |
189 | */ |
190 | delete: if (__bt_dleaf(t, key, h, index) == RET_ERROR) { |
191 | mpool_put(t->bt_mp, h, 0); |
192 | return (RET_ERROR); |
193 | } |
194 | break; |
195 | } |
196 | |
197 | /* |
198 | * If not enough room, or the user has put a ceiling on the number of |
199 | * keys permitted in the page, split the page. The split code will |
200 | * insert the key and data and unpin the current page. If inserting |
201 | * into the offset array, shift the pointers up. |
202 | */ |
203 | nbytes = NBLEAFDBT(key->size, data->size); |
204 | if (h->upper - h->lower < nbytes + sizeof(indx_t)) { |
205 | if ((status = __bt_split(t, h, key, |
206 | data, dflags, nbytes, index)) != RET_SUCCESS) |
207 | return (status); |
208 | goto success; |
209 | } |
210 | |
211 | if (index < (nxtindex = NEXTINDEX(h))) |
212 | memmove(h->linp + index + 1, h->linp + index, |
213 | (nxtindex - index) * sizeof(indx_t)); |
214 | h->lower += sizeof(indx_t); |
215 | |
216 | h->linp[index] = h->upper -= nbytes; |
217 | dest = (char *)h + h->upper; |
218 | WR_BLEAF(dest, key, data, dflags); |
219 | |
220 | /* If the cursor is on this page, adjust it as necessary. */ |
221 | if (F_ISSET(&t->bt_cursor, CURS_INIT) && |
222 | !F_ISSET(&t->bt_cursor, CURS_ACQUIRE) && |
223 | t->bt_cursor.pg.pgno == h->pgno && t->bt_cursor.pg.index >= index) |
224 | ++t->bt_cursor.pg.index; |
225 | |
226 | if (t->bt_order == NOT) { |
227 | if (h->nextpg == P_INVALID) { |
228 | if (index == NEXTINDEX(h) - 1) { |
229 | t->bt_order = FORWARD; |
230 | t->bt_last.index = index; |
231 | t->bt_last.pgno = h->pgno; |
232 | } |
233 | } else if (h->prevpg == P_INVALID) { |
234 | if (index == 0) { |
235 | t->bt_order = BACK; |
236 | t->bt_last.index = 0; |
237 | t->bt_last.pgno = h->pgno; |
238 | } |
239 | } |
240 | } |
241 | |
242 | mpool_put(t->bt_mp, h, MPOOL_DIRTY); |
243 | |
244 | success: |
245 | if (flags == R_SETCURSOR) |
246 | __bt_setcur(t, e->page->pgno, e->index); |
247 | |
248 | F_SET(t, B_MODIFIED); |
249 | return (RET_SUCCESS); |
250 | } |
251 | |
252 | #ifdef STATISTICS |
253 | u_long bt_cache_hit, bt_cache_miss; |
254 | #endif |
255 | |
256 | /* |
257 | * BT_FAST -- Do a quick check for sorted data. |
258 | * |
259 | * Parameters: |
260 | * t: tree |
261 | * key: key to insert |
262 | * |
263 | * Returns: |
264 | * EPG for new record or NULL if not found. |
265 | */ |
266 | static EPG * |
267 | bt_fast(t, key, data, exactp) |
268 | BTREE *t; |
269 | const DBT *key, *data; |
270 | int *exactp; |
271 | { |
272 | PAGE *h; |
273 | u_int32_t nbytes; |
274 | int cmp; |
275 | |
276 | if ((h = mpool_get(t->bt_mp, t->bt_last.pgno, 0)) == NULL) { |
277 | t->bt_order = NOT; |
278 | return (NULL); |
279 | } |
280 | t->bt_cur.page = h; |
281 | t->bt_cur.index = t->bt_last.index; |
282 | |
283 | /* |
284 | * If won't fit in this page or have too many keys in this page, |
285 | * have to search to get split stack. |
286 | */ |
287 | nbytes = NBLEAFDBT(key->size, data->size); |
288 | if (h->upper - h->lower < nbytes + sizeof(indx_t)) |
289 | goto miss; |
290 | |
291 | if (t->bt_order == FORWARD) { |
292 | if (t->bt_cur.page->nextpg != P_INVALID) |
293 | goto miss; |
294 | if (t->bt_cur.index != NEXTINDEX(h) - 1) |
295 | goto miss; |
296 | if ((cmp = __bt_cmp(t, key, &t->bt_cur)) < 0) |
297 | goto miss; |
298 | t->bt_last.index = cmp ? ++t->bt_cur.index : t->bt_cur.index; |
299 | } else { |
300 | if (t->bt_cur.page->prevpg != P_INVALID) |
301 | goto miss; |
302 | if (t->bt_cur.index != 0) |
303 | goto miss; |
304 | if ((cmp = __bt_cmp(t, key, &t->bt_cur)) > 0) |
305 | goto miss; |
306 | t->bt_last.index = 0; |
307 | } |
308 | *exactp = cmp == 0; |
309 | #ifdef STATISTICS |
310 | ++bt_cache_hit; |
311 | #endif |
312 | return (&t->bt_cur); |
313 | |
314 | miss: |
315 | #ifdef STATISTICS |
316 | ++bt_cache_miss; |
317 | #endif |
318 | t->bt_order = NOT; |
319 | mpool_put(t->bt_mp, h, 0); |
320 | return (NULL); |
321 | } |
322 | |