IB/mthca: Query port fix
[linux-2.6/verdex.git] / fs / hfs / brec.c
blob5c87cf4801fcb00f05311d2883c9977dbfa5ef2f
1 /*
2 * linux/fs/hfs/brec.c
4 * Copyright (C) 2001
5 * Brad Boyer (flar@allandria.com)
6 * (C) 2003 Ardis Technologies <roman@ardistech.com>
8 * Handle individual btree records
9 */
11 #include "btree.h"
13 static struct hfs_bnode *hfs_bnode_split(struct hfs_find_data *fd);
14 static int hfs_brec_update_parent(struct hfs_find_data *fd);
15 static int hfs_btree_inc_height(struct hfs_btree *tree);
17 /* Get the length and offset of the given record in the given node */
18 u16 hfs_brec_lenoff(struct hfs_bnode *node, u16 rec, u16 *off)
20 __be16 retval[2];
21 u16 dataoff;
23 dataoff = node->tree->node_size - (rec + 2) * 2;
24 hfs_bnode_read(node, retval, dataoff, 4);
25 *off = be16_to_cpu(retval[1]);
26 return be16_to_cpu(retval[0]) - *off;
29 /* Get the length of the key from a keyed record */
30 u16 hfs_brec_keylen(struct hfs_bnode *node, u16 rec)
32 u16 retval, recoff;
34 if (node->type != HFS_NODE_INDEX && node->type != HFS_NODE_LEAF)
35 return 0;
37 if ((node->type == HFS_NODE_INDEX) &&
38 !(node->tree->attributes & HFS_TREE_VARIDXKEYS)) {
39 if (node->tree->attributes & HFS_TREE_BIGKEYS)
40 retval = node->tree->max_key_len + 2;
41 else
42 retval = node->tree->max_key_len + 1;
43 } else {
44 recoff = hfs_bnode_read_u16(node, node->tree->node_size - (rec + 1) * 2);
45 if (!recoff)
46 return 0;
47 if (node->tree->attributes & HFS_TREE_BIGKEYS)
48 retval = hfs_bnode_read_u16(node, recoff) + 2;
49 else
50 retval = (hfs_bnode_read_u8(node, recoff) | 1) + 1;
52 return retval;
55 int hfs_brec_insert(struct hfs_find_data *fd, void *entry, int entry_len)
57 struct hfs_btree *tree;
58 struct hfs_bnode *node, *new_node;
59 int size, key_len, rec;
60 int data_off, end_off;
61 int idx_rec_off, data_rec_off, end_rec_off;
62 __be32 cnid;
64 tree = fd->tree;
65 if (!fd->bnode) {
66 if (!tree->root)
67 hfs_btree_inc_height(tree);
68 fd->bnode = hfs_bnode_find(tree, tree->leaf_head);
69 if (IS_ERR(fd->bnode))
70 return PTR_ERR(fd->bnode);
71 fd->record = -1;
73 new_node = NULL;
74 key_len = (fd->search_key->key_len | 1) + 1;
75 again:
76 /* new record idx and complete record size */
77 rec = fd->record + 1;
78 size = key_len + entry_len;
80 node = fd->bnode;
81 hfs_bnode_dump(node);
82 /* get last offset */
83 end_rec_off = tree->node_size - (node->num_recs + 1) * 2;
84 end_off = hfs_bnode_read_u16(node, end_rec_off);
85 end_rec_off -= 2;
86 dprint(DBG_BNODE_MOD, "insert_rec: %d, %d, %d, %d\n", rec, size, end_off, end_rec_off);
87 if (size > end_rec_off - end_off) {
88 if (new_node)
89 panic("not enough room!\n");
90 new_node = hfs_bnode_split(fd);
91 if (IS_ERR(new_node))
92 return PTR_ERR(new_node);
93 goto again;
95 if (node->type == HFS_NODE_LEAF) {
96 tree->leaf_count++;
97 mark_inode_dirty(tree->inode);
99 node->num_recs++;
100 /* write new last offset */
101 hfs_bnode_write_u16(node, offsetof(struct hfs_bnode_desc, num_recs), node->num_recs);
102 hfs_bnode_write_u16(node, end_rec_off, end_off + size);
103 data_off = end_off;
104 data_rec_off = end_rec_off + 2;
105 idx_rec_off = tree->node_size - (rec + 1) * 2;
106 if (idx_rec_off == data_rec_off)
107 goto skip;
108 /* move all following entries */
109 do {
110 data_off = hfs_bnode_read_u16(node, data_rec_off + 2);
111 hfs_bnode_write_u16(node, data_rec_off, data_off + size);
112 data_rec_off += 2;
113 } while (data_rec_off < idx_rec_off);
115 /* move data away */
116 hfs_bnode_move(node, data_off + size, data_off,
117 end_off - data_off);
119 skip:
120 hfs_bnode_write(node, fd->search_key, data_off, key_len);
121 hfs_bnode_write(node, entry, data_off + key_len, entry_len);
122 hfs_bnode_dump(node);
124 if (new_node) {
125 /* update parent key if we inserted a key
126 * at the start of the first node
128 if (!rec && new_node != node)
129 hfs_brec_update_parent(fd);
131 hfs_bnode_put(fd->bnode);
132 if (!new_node->parent) {
133 hfs_btree_inc_height(tree);
134 new_node->parent = tree->root;
136 fd->bnode = hfs_bnode_find(tree, new_node->parent);
138 /* create index data entry */
139 cnid = cpu_to_be32(new_node->this);
140 entry = &cnid;
141 entry_len = sizeof(cnid);
143 /* get index key */
144 hfs_bnode_read_key(new_node, fd->search_key, 14);
145 __hfs_brec_find(fd->bnode, fd);
147 hfs_bnode_put(new_node);
148 new_node = NULL;
150 if (tree->attributes & HFS_TREE_VARIDXKEYS)
151 key_len = fd->search_key->key_len + 1;
152 else {
153 fd->search_key->key_len = tree->max_key_len;
154 key_len = tree->max_key_len + 1;
156 goto again;
159 if (!rec)
160 hfs_brec_update_parent(fd);
162 return 0;
165 int hfs_brec_remove(struct hfs_find_data *fd)
167 struct hfs_btree *tree;
168 struct hfs_bnode *node, *parent;
169 int end_off, rec_off, data_off, size;
171 tree = fd->tree;
172 node = fd->bnode;
173 again:
174 rec_off = tree->node_size - (fd->record + 2) * 2;
175 end_off = tree->node_size - (node->num_recs + 1) * 2;
177 if (node->type == HFS_NODE_LEAF) {
178 tree->leaf_count--;
179 mark_inode_dirty(tree->inode);
181 hfs_bnode_dump(node);
182 dprint(DBG_BNODE_MOD, "remove_rec: %d, %d\n", fd->record, fd->keylength + fd->entrylength);
183 if (!--node->num_recs) {
184 hfs_bnode_unlink(node);
185 if (!node->parent)
186 return 0;
187 parent = hfs_bnode_find(tree, node->parent);
188 if (IS_ERR(parent))
189 return PTR_ERR(parent);
190 hfs_bnode_put(node);
191 node = fd->bnode = parent;
193 __hfs_brec_find(node, fd);
194 goto again;
196 hfs_bnode_write_u16(node, offsetof(struct hfs_bnode_desc, num_recs), node->num_recs);
198 if (rec_off == end_off)
199 goto skip;
200 size = fd->keylength + fd->entrylength;
202 do {
203 data_off = hfs_bnode_read_u16(node, rec_off);
204 hfs_bnode_write_u16(node, rec_off + 2, data_off - size);
205 rec_off -= 2;
206 } while (rec_off >= end_off);
208 /* fill hole */
209 hfs_bnode_move(node, fd->keyoffset, fd->keyoffset + size,
210 data_off - fd->keyoffset - size);
211 skip:
212 hfs_bnode_dump(node);
213 if (!fd->record)
214 hfs_brec_update_parent(fd);
215 return 0;
218 static struct hfs_bnode *hfs_bnode_split(struct hfs_find_data *fd)
220 struct hfs_btree *tree;
221 struct hfs_bnode *node, *new_node;
222 struct hfs_bnode_desc node_desc;
223 int num_recs, new_rec_off, new_off, old_rec_off;
224 int data_start, data_end, size;
226 tree = fd->tree;
227 node = fd->bnode;
228 new_node = hfs_bmap_alloc(tree);
229 if (IS_ERR(new_node))
230 return new_node;
231 hfs_bnode_get(node);
232 dprint(DBG_BNODE_MOD, "split_nodes: %d - %d - %d\n",
233 node->this, new_node->this, node->next);
234 new_node->next = node->next;
235 new_node->prev = node->this;
236 new_node->parent = node->parent;
237 new_node->type = node->type;
238 new_node->height = node->height;
240 size = tree->node_size / 2 - node->num_recs * 2 - 14;
241 old_rec_off = tree->node_size - 4;
242 num_recs = 1;
243 for (;;) {
244 data_start = hfs_bnode_read_u16(node, old_rec_off);
245 if (data_start > size)
246 break;
247 old_rec_off -= 2;
248 if (++num_recs < node->num_recs)
249 continue;
250 /* panic? */
251 hfs_bnode_put(node);
252 hfs_bnode_put(new_node);
253 return ERR_PTR(-ENOSPC);
256 if (fd->record + 1 < num_recs) {
257 /* new record is in the lower half,
258 * so leave some more space there
260 old_rec_off += 2;
261 num_recs--;
262 data_start = hfs_bnode_read_u16(node, old_rec_off);
263 } else {
264 hfs_bnode_put(node);
265 hfs_bnode_get(new_node);
266 fd->bnode = new_node;
267 fd->record -= num_recs;
268 fd->keyoffset -= data_start - 14;
269 fd->entryoffset -= data_start - 14;
271 new_node->num_recs = node->num_recs - num_recs;
272 node->num_recs = num_recs;
274 new_rec_off = tree->node_size - 2;
275 new_off = 14;
276 size = data_start - new_off;
277 num_recs = new_node->num_recs;
278 data_end = data_start;
279 while (num_recs) {
280 hfs_bnode_write_u16(new_node, new_rec_off, new_off);
281 old_rec_off -= 2;
282 new_rec_off -= 2;
283 data_end = hfs_bnode_read_u16(node, old_rec_off);
284 new_off = data_end - size;
285 num_recs--;
287 hfs_bnode_write_u16(new_node, new_rec_off, new_off);
288 hfs_bnode_copy(new_node, 14, node, data_start, data_end - data_start);
290 /* update new bnode header */
291 node_desc.next = cpu_to_be32(new_node->next);
292 node_desc.prev = cpu_to_be32(new_node->prev);
293 node_desc.type = new_node->type;
294 node_desc.height = new_node->height;
295 node_desc.num_recs = cpu_to_be16(new_node->num_recs);
296 node_desc.reserved = 0;
297 hfs_bnode_write(new_node, &node_desc, 0, sizeof(node_desc));
299 /* update previous bnode header */
300 node->next = new_node->this;
301 hfs_bnode_read(node, &node_desc, 0, sizeof(node_desc));
302 node_desc.next = cpu_to_be32(node->next);
303 node_desc.num_recs = cpu_to_be16(node->num_recs);
304 hfs_bnode_write(node, &node_desc, 0, sizeof(node_desc));
306 /* update next bnode header */
307 if (new_node->next) {
308 struct hfs_bnode *next_node = hfs_bnode_find(tree, new_node->next);
309 next_node->prev = new_node->this;
310 hfs_bnode_read(next_node, &node_desc, 0, sizeof(node_desc));
311 node_desc.prev = cpu_to_be32(next_node->prev);
312 hfs_bnode_write(next_node, &node_desc, 0, sizeof(node_desc));
313 hfs_bnode_put(next_node);
314 } else if (node->this == tree->leaf_tail) {
315 /* if there is no next node, this might be the new tail */
316 tree->leaf_tail = new_node->this;
317 mark_inode_dirty(tree->inode);
320 hfs_bnode_dump(node);
321 hfs_bnode_dump(new_node);
322 hfs_bnode_put(node);
324 return new_node;
327 static int hfs_brec_update_parent(struct hfs_find_data *fd)
329 struct hfs_btree *tree;
330 struct hfs_bnode *node, *new_node, *parent;
331 int newkeylen, diff;
332 int rec, rec_off, end_rec_off;
333 int start_off, end_off;
335 tree = fd->tree;
336 node = fd->bnode;
337 new_node = NULL;
338 if (!node->parent)
339 return 0;
341 again:
342 parent = hfs_bnode_find(tree, node->parent);
343 if (IS_ERR(parent))
344 return PTR_ERR(parent);
345 __hfs_brec_find(parent, fd);
346 hfs_bnode_dump(parent);
347 rec = fd->record;
349 /* size difference between old and new key */
350 if (tree->attributes & HFS_TREE_VARIDXKEYS)
351 newkeylen = (hfs_bnode_read_u8(node, 14) | 1) + 1;
352 else
353 fd->keylength = newkeylen = tree->max_key_len + 1;
354 dprint(DBG_BNODE_MOD, "update_rec: %d, %d, %d\n", rec, fd->keylength, newkeylen);
356 rec_off = tree->node_size - (rec + 2) * 2;
357 end_rec_off = tree->node_size - (parent->num_recs + 1) * 2;
358 diff = newkeylen - fd->keylength;
359 if (!diff)
360 goto skip;
361 if (diff > 0) {
362 end_off = hfs_bnode_read_u16(parent, end_rec_off);
363 if (end_rec_off - end_off < diff) {
365 printk(KERN_DEBUG "hfs: splitting index node...\n");
366 fd->bnode = parent;
367 new_node = hfs_bnode_split(fd);
368 if (IS_ERR(new_node))
369 return PTR_ERR(new_node);
370 parent = fd->bnode;
371 rec = fd->record;
372 rec_off = tree->node_size - (rec + 2) * 2;
373 end_rec_off = tree->node_size - (parent->num_recs + 1) * 2;
377 end_off = start_off = hfs_bnode_read_u16(parent, rec_off);
378 hfs_bnode_write_u16(parent, rec_off, start_off + diff);
379 start_off -= 4; /* move previous cnid too */
381 while (rec_off > end_rec_off) {
382 rec_off -= 2;
383 end_off = hfs_bnode_read_u16(parent, rec_off);
384 hfs_bnode_write_u16(parent, rec_off, end_off + diff);
386 hfs_bnode_move(parent, start_off + diff, start_off,
387 end_off - start_off);
388 skip:
389 hfs_bnode_copy(parent, fd->keyoffset, node, 14, newkeylen);
390 if (!(tree->attributes & HFS_TREE_VARIDXKEYS))
391 hfs_bnode_write_u8(parent, fd->keyoffset, newkeylen - 1);
392 hfs_bnode_dump(parent);
394 hfs_bnode_put(node);
395 node = parent;
397 if (new_node) {
398 __be32 cnid;
400 fd->bnode = hfs_bnode_find(tree, new_node->parent);
401 /* create index key and entry */
402 hfs_bnode_read_key(new_node, fd->search_key, 14);
403 cnid = cpu_to_be32(new_node->this);
405 __hfs_brec_find(fd->bnode, fd);
406 hfs_brec_insert(fd, &cnid, sizeof(cnid));
407 hfs_bnode_put(fd->bnode);
408 hfs_bnode_put(new_node);
410 if (!rec) {
411 if (new_node == node)
412 goto out;
413 /* restore search_key */
414 hfs_bnode_read_key(node, fd->search_key, 14);
418 if (!rec && node->parent)
419 goto again;
420 out:
421 fd->bnode = node;
422 return 0;
425 static int hfs_btree_inc_height(struct hfs_btree *tree)
427 struct hfs_bnode *node, *new_node;
428 struct hfs_bnode_desc node_desc;
429 int key_size, rec;
430 __be32 cnid;
432 node = NULL;
433 if (tree->root) {
434 node = hfs_bnode_find(tree, tree->root);
435 if (IS_ERR(node))
436 return PTR_ERR(node);
438 new_node = hfs_bmap_alloc(tree);
439 if (IS_ERR(new_node)) {
440 hfs_bnode_put(node);
441 return PTR_ERR(new_node);
444 tree->root = new_node->this;
445 if (!tree->depth) {
446 tree->leaf_head = tree->leaf_tail = new_node->this;
447 new_node->type = HFS_NODE_LEAF;
448 new_node->num_recs = 0;
449 } else {
450 new_node->type = HFS_NODE_INDEX;
451 new_node->num_recs = 1;
453 new_node->parent = 0;
454 new_node->next = 0;
455 new_node->prev = 0;
456 new_node->height = ++tree->depth;
458 node_desc.next = cpu_to_be32(new_node->next);
459 node_desc.prev = cpu_to_be32(new_node->prev);
460 node_desc.type = new_node->type;
461 node_desc.height = new_node->height;
462 node_desc.num_recs = cpu_to_be16(new_node->num_recs);
463 node_desc.reserved = 0;
464 hfs_bnode_write(new_node, &node_desc, 0, sizeof(node_desc));
466 rec = tree->node_size - 2;
467 hfs_bnode_write_u16(new_node, rec, 14);
469 if (node) {
470 /* insert old root idx into new root */
471 node->parent = tree->root;
472 if (node->type == HFS_NODE_LEAF ||
473 tree->attributes & HFS_TREE_VARIDXKEYS)
474 key_size = hfs_bnode_read_u8(node, 14) + 1;
475 else
476 key_size = tree->max_key_len + 1;
477 hfs_bnode_copy(new_node, 14, node, 14, key_size);
479 if (!(tree->attributes & HFS_TREE_VARIDXKEYS)) {
480 key_size = tree->max_key_len + 1;
481 hfs_bnode_write_u8(new_node, 14, tree->max_key_len);
483 key_size = (key_size + 1) & -2;
484 cnid = cpu_to_be32(node->this);
485 hfs_bnode_write(new_node, &cnid, 14 + key_size, 4);
487 rec -= 2;
488 hfs_bnode_write_u16(new_node, rec, 14 + key_size + 4);
490 hfs_bnode_put(node);
492 hfs_bnode_put(new_node);
493 mark_inode_dirty(tree->inode);
495 return 0;