xfs: connect up write verifiers to new buffers
fs/xfs/xfs_attr_leaf.c
/*
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 */
1da177e4 18#include "xfs.h"
a844f451 19#include "xfs_fs.h"
1da177e4 20#include "xfs_types.h"
a844f451 21#include "xfs_bit.h"
1da177e4
LT
22#include "xfs_log.h"
23#include "xfs_trans.h"
24#include "xfs_sb.h"
25#include "xfs_ag.h"
1da177e4 26#include "xfs_mount.h"
a844f451 27#include "xfs_da_btree.h"
1da177e4 28#include "xfs_bmap_btree.h"
a844f451 29#include "xfs_alloc_btree.h"
1da177e4
LT
30#include "xfs_ialloc_btree.h"
31#include "xfs_alloc.h"
32#include "xfs_btree.h"
a844f451 33#include "xfs_attr_sf.h"
1da177e4 34#include "xfs_dinode.h"
1da177e4 35#include "xfs_inode.h"
a844f451 36#include "xfs_inode_item.h"
1da177e4 37#include "xfs_bmap.h"
1da177e4
LT
38#include "xfs_attr.h"
39#include "xfs_attr_leaf.h"
40#include "xfs_error.h"
0b1b213f 41#include "xfs_trace.h"
1da177e4
LT
42
/*
 * xfs_attr_leaf.c
 *
 * Routines to implement leaf blocks of attributes as Btrees of hashed names.
 */

/*========================================================================
 * Function prototypes for the kernel.
 *========================================================================*/

/*
 * Routines used for growing the Btree.
 */
STATIC int xfs_attr_leaf_create(xfs_da_args_t *args, xfs_dablk_t which_block,
                                struct xfs_buf **bpp);
STATIC int xfs_attr_leaf_add_work(struct xfs_buf *leaf_buffer,
                                  xfs_da_args_t *args, int freemap_index);
STATIC void xfs_attr_leaf_compact(struct xfs_da_args *args,
                                  struct xfs_buf *leaf_buffer);
STATIC void xfs_attr_leaf_rebalance(xfs_da_state_t *state,
                                    xfs_da_state_blk_t *blk1,
                                    xfs_da_state_blk_t *blk2);
STATIC int xfs_attr_leaf_figure_balance(xfs_da_state_t *state,
                                        xfs_da_state_blk_t *leaf_blk_1,
                                        xfs_da_state_blk_t *leaf_blk_2,
                                        int *number_entries_in_blk1,
                                        int *number_usedbytes_in_blk1);

/*
 * Routines used for shrinking the Btree.
 */
STATIC int xfs_attr_node_inactive(xfs_trans_t **trans, xfs_inode_t *dp,
                                  struct xfs_buf *bp, int level);
STATIC int xfs_attr_leaf_inactive(xfs_trans_t **trans, xfs_inode_t *dp,
                                  struct xfs_buf *bp);
STATIC int xfs_attr_leaf_freextent(xfs_trans_t **trans, xfs_inode_t *dp,
                                   xfs_dablk_t blkno, int blkcnt);

/*
 * Utility routines.
 */
STATIC void xfs_attr_leaf_moveents(xfs_attr_leafblock_t *src_leaf,
                                   int src_start,
                                   xfs_attr_leafblock_t *dst_leaf,
                                   int dst_start, int move_count,
                                   xfs_mount_t *mp);
STATIC int xfs_attr_leaf_entsize(xfs_attr_leafblock_t *leaf, int index);

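/*
 * Verify the contents of an attr leaf block. Only the leaf magic number is
 * checked here; on a mismatch a corruption error is reported and the buffer
 * is marked EFSCORRUPTED.
 */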
static void
xfs_attr_leaf_verify(
        struct xfs_buf          *bp)
{
        struct xfs_mount        *mp = bp->b_target->bt_mount;
        struct xfs_attr_leaf_hdr *hdr = bp->b_addr;
        int                     block_ok = 0;

        block_ok = hdr->info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC);
        if (!block_ok) {
                XFS_CORRUPTION_ERROR(__func__, XFS_ERRLEVEL_LOW, mp, hdr);
                xfs_buf_ioerror(bp, EFSCORRUPTED);
        }
}

static void
xfs_attr_leaf_write_verify(
        struct xfs_buf  *bp)
{
        xfs_attr_leaf_verify(bp);
}

void
xfs_attr_leaf_read_verify(
        struct xfs_buf  *bp)
{
        xfs_attr_leaf_verify(bp);
        bp->b_pre_io = xfs_attr_leaf_write_verify;
        bp->b_iodone = NULL;
        xfs_buf_ioend(bp, 0);
}

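/*
 * Read an attr leaf block through the da btree mapping code, attaching the
 * leaf read verifier so the block contents are checked when the read
 * completes.
 */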
int
xfs_attr_leaf_read(
        struct xfs_trans        *tp,
        struct xfs_inode        *dp,
        xfs_dablk_t             bno,
        xfs_daddr_t             mappedbno,
        struct xfs_buf          **bpp)
{
        return xfs_da_read_buf(tp, dp, bno, mappedbno, bpp,
                                XFS_ATTR_FORK, xfs_attr_leaf_read_verify);
}

/*========================================================================
 * Namespace helper routines
 *========================================================================*/

/*
 * If namespace bits don't match return 0.
 * If all match then return 1.
 */
STATIC int
xfs_attr_namesp_match(int arg_flags, int ondisk_flags)
{
        return XFS_ATTR_NSP_ONDISK(ondisk_flags) == XFS_ATTR_NSP_ARGS_TO_ONDISK(arg_flags);
}

/*========================================================================
 * External routines when attribute fork size < XFS_LITINO(mp).
 *========================================================================*/

/*
 * Query whether the requested number of additional bytes of extended
 * attribute space will be able to fit inline.
 *
 * Returns zero if not, else the di_forkoff fork offset to be used in the
 * literal area for attribute data once the new bytes have been added.
 *
 * di_forkoff must be 8 byte aligned, hence is stored as a >>3 value;
 * special case for dev/uuid inodes, they have fixed size data forks.
 */
int
xfs_attr_shortform_bytesfit(xfs_inode_t *dp, int bytes)
{
        int offset;
        int minforkoff; /* lower limit on valid forkoff locations */
        int maxforkoff; /* upper limit on valid forkoff locations */
        int dsize;
        xfs_mount_t *mp = dp->i_mount;

        offset = (XFS_LITINO(mp) - bytes) >> 3; /* rounded down */

        switch (dp->i_d.di_format) {
        case XFS_DINODE_FMT_DEV:
                minforkoff = roundup(sizeof(xfs_dev_t), 8) >> 3;
                return (offset >= minforkoff) ? minforkoff : 0;
        case XFS_DINODE_FMT_UUID:
                minforkoff = roundup(sizeof(uuid_t), 8) >> 3;
                return (offset >= minforkoff) ? minforkoff : 0;
        }

        /*
         * If the requested number of bytes is smaller than or equal to the
         * current attribute fork size we can always proceed.
         *
         * Note that if_bytes in the data fork might actually be larger than
         * the current data fork size due to delalloc extents. In that
         * case either the extent count will go down when they are converted
         * to real extents, or the delalloc conversion will take care of the
         * literal area rebalancing.
         */
        if (bytes <= XFS_IFORK_ASIZE(dp))
                return dp->i_d.di_forkoff;

        /*
         * For attr2 we can try to move the forkoff if there is space in the
         * literal area, but for the old format we are done if there is no
         * space in the fixed attribute fork.
         */
        if (!(mp->m_flags & XFS_MOUNT_ATTR2))
                return 0;

        dsize = dp->i_df.if_bytes;

        switch (dp->i_d.di_format) {
        case XFS_DINODE_FMT_EXTENTS:
                /*
                 * If there is no attr fork and the data fork is extents,
                 * determine if creating the default attr fork will result
                 * in the extents form migrating to btree. If so, the
                 * minimum offset only needs to be the space required for
                 * the btree root.
                 */
                if (!dp->i_d.di_forkoff && dp->i_df.if_bytes >
                    xfs_default_attroffset(dp))
                        dsize = XFS_BMDR_SPACE_CALC(MINDBTPTRS);
                break;
        case XFS_DINODE_FMT_BTREE:
                /*
                 * If we have a data btree then keep forkoff if we have one,
                 * otherwise we are adding a new attr, so then we set
                 * minforkoff to where the btree root can finish so we have
                 * plenty of room for attrs
                 */
                if (dp->i_d.di_forkoff) {
                        if (offset < dp->i_d.di_forkoff)
                                return 0;
                        return dp->i_d.di_forkoff;
                }
                dsize = XFS_BMAP_BROOT_SPACE(dp->i_df.if_broot);
                break;
        }

        /*
         * A data fork btree root must have space for at least
         * MINDBTPTRS key/ptr pairs if the data fork is small or empty.
         */
        minforkoff = MAX(dsize, XFS_BMDR_SPACE_CALC(MINDBTPTRS));
        minforkoff = roundup(minforkoff, 8) >> 3;

        /* attr fork btree root can have at least this many key/ptr pairs */
        maxforkoff = XFS_LITINO(mp) - XFS_BMDR_SPACE_CALC(MINABTPTRS);
        maxforkoff = maxforkoff >> 3;   /* rounded down */

        if (offset >= maxforkoff)
                return maxforkoff;
        if (offset >= minforkoff)
                return offset;
        return 0;
}

/*
 * Switch on the ATTR2 superblock bit (implies also FEATURES2)
 */
STATIC void
xfs_sbversion_add_attr2(xfs_mount_t *mp, xfs_trans_t *tp)
{
        if ((mp->m_flags & XFS_MOUNT_ATTR2) &&
            !(xfs_sb_version_hasattr2(&mp->m_sb))) {
                spin_lock(&mp->m_sb_lock);
                if (!xfs_sb_version_hasattr2(&mp->m_sb)) {
                        xfs_sb_version_addattr2(&mp->m_sb);
                        spin_unlock(&mp->m_sb_lock);
                        xfs_mod_sb(tp, XFS_SB_VERSIONNUM | XFS_SB_FEATURES2);
                } else
                        spin_unlock(&mp->m_sb_lock);
        }
}

/*
 * Create the initial contents of a shortform attribute list.
 */
void
xfs_attr_shortform_create(xfs_da_args_t *args)
{
        xfs_attr_sf_hdr_t *hdr;
        xfs_inode_t *dp;
        xfs_ifork_t *ifp;

        trace_xfs_attr_sf_create(args);

        dp = args->dp;
        ASSERT(dp != NULL);
        ifp = dp->i_afp;
        ASSERT(ifp != NULL);
        ASSERT(ifp->if_bytes == 0);
        if (dp->i_d.di_aformat == XFS_DINODE_FMT_EXTENTS) {
                ifp->if_flags &= ~XFS_IFEXTENTS;        /* just in case */
                dp->i_d.di_aformat = XFS_DINODE_FMT_LOCAL;
                ifp->if_flags |= XFS_IFINLINE;
        } else {
                ASSERT(ifp->if_flags & XFS_IFINLINE);
        }
        xfs_idata_realloc(dp, sizeof(*hdr), XFS_ATTR_FORK);
        hdr = (xfs_attr_sf_hdr_t *)ifp->if_u1.if_data;
        hdr->count = 0;
        hdr->totsize = cpu_to_be16(sizeof(*hdr));
        xfs_trans_log_inode(args->trans, dp, XFS_ILOG_CORE | XFS_ILOG_ADATA);
}

/*
 * Add a name/value pair to the shortform attribute list.
 * Overflow from the inode has already been checked for.
 */
void
xfs_attr_shortform_add(xfs_da_args_t *args, int forkoff)
{
        xfs_attr_shortform_t *sf;
        xfs_attr_sf_entry_t *sfe;
        int i, offset, size;
        xfs_mount_t *mp;
        xfs_inode_t *dp;
        xfs_ifork_t *ifp;

        trace_xfs_attr_sf_add(args);

        dp = args->dp;
        mp = dp->i_mount;
        dp->i_d.di_forkoff = forkoff;

        ifp = dp->i_afp;
        ASSERT(ifp->if_flags & XFS_IFINLINE);
        sf = (xfs_attr_shortform_t *)ifp->if_u1.if_data;
        sfe = &sf->list[0];
        for (i = 0; i < sf->hdr.count; sfe = XFS_ATTR_SF_NEXTENTRY(sfe), i++) {
#ifdef DEBUG
                if (sfe->namelen != args->namelen)
                        continue;
                if (memcmp(args->name, sfe->nameval, args->namelen) != 0)
                        continue;
                if (!xfs_attr_namesp_match(args->flags, sfe->flags))
                        continue;
                ASSERT(0);
#endif
        }

        offset = (char *)sfe - (char *)sf;
        size = XFS_ATTR_SF_ENTSIZE_BYNAME(args->namelen, args->valuelen);
        xfs_idata_realloc(dp, size, XFS_ATTR_FORK);
        sf = (xfs_attr_shortform_t *)ifp->if_u1.if_data;
        sfe = (xfs_attr_sf_entry_t *)((char *)sf + offset);

        sfe->namelen = args->namelen;
        sfe->valuelen = args->valuelen;
        sfe->flags = XFS_ATTR_NSP_ARGS_TO_ONDISK(args->flags);
        memcpy(sfe->nameval, args->name, args->namelen);
        memcpy(&sfe->nameval[args->namelen], args->value, args->valuelen);
        sf->hdr.count++;
        be16_add_cpu(&sf->hdr.totsize, size);
        xfs_trans_log_inode(args->trans, dp, XFS_ILOG_CORE | XFS_ILOG_ADATA);

        xfs_sbversion_add_attr2(mp, args->trans);
}

/*
 * After the last attribute is removed revert to original inode format,
 * making all literal area available to the data fork once more.
 */
STATIC void
xfs_attr_fork_reset(
        struct xfs_inode        *ip,
        struct xfs_trans        *tp)
{
        xfs_idestroy_fork(ip, XFS_ATTR_FORK);
        ip->i_d.di_forkoff = 0;
        ip->i_d.di_aformat = XFS_DINODE_FMT_EXTENTS;

        ASSERT(ip->i_d.di_anextents == 0);
        ASSERT(ip->i_afp == NULL);

        xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
}

/*
 * Remove an attribute from the shortform attribute list structure.
 */
int
xfs_attr_shortform_remove(xfs_da_args_t *args)
{
        xfs_attr_shortform_t *sf;
        xfs_attr_sf_entry_t *sfe;
        int base, size = 0, end, totsize, i;
        xfs_mount_t *mp;
        xfs_inode_t *dp;

        trace_xfs_attr_sf_remove(args);

        dp = args->dp;
        mp = dp->i_mount;
        base = sizeof(xfs_attr_sf_hdr_t);
        sf = (xfs_attr_shortform_t *)dp->i_afp->if_u1.if_data;
        sfe = &sf->list[0];
        end = sf->hdr.count;
        for (i = 0; i < end; sfe = XFS_ATTR_SF_NEXTENTRY(sfe),
                                        base += size, i++) {
                size = XFS_ATTR_SF_ENTSIZE(sfe);
                if (sfe->namelen != args->namelen)
                        continue;
                if (memcmp(sfe->nameval, args->name, args->namelen) != 0)
                        continue;
                if (!xfs_attr_namesp_match(args->flags, sfe->flags))
                        continue;
                break;
        }
        if (i == end)
                return(XFS_ERROR(ENOATTR));

        /*
         * Fix up the attribute fork data, covering the hole
         */
        end = base + size;
        totsize = be16_to_cpu(sf->hdr.totsize);
        if (end != totsize)
                memmove(&((char *)sf)[base], &((char *)sf)[end], totsize - end);
        sf->hdr.count--;
        be16_add_cpu(&sf->hdr.totsize, -size);

        /*
         * Fix up the start offset of the attribute fork
         */
        totsize -= size;
        if (totsize == sizeof(xfs_attr_sf_hdr_t) &&
            (mp->m_flags & XFS_MOUNT_ATTR2) &&
            (dp->i_d.di_format != XFS_DINODE_FMT_BTREE) &&
            !(args->op_flags & XFS_DA_OP_ADDNAME)) {
                xfs_attr_fork_reset(dp, args->trans);
        } else {
                xfs_idata_realloc(dp, -size, XFS_ATTR_FORK);
                dp->i_d.di_forkoff = xfs_attr_shortform_bytesfit(dp, totsize);
                ASSERT(dp->i_d.di_forkoff);
                ASSERT(totsize > sizeof(xfs_attr_sf_hdr_t) ||
                                (args->op_flags & XFS_DA_OP_ADDNAME) ||
                                !(mp->m_flags & XFS_MOUNT_ATTR2) ||
                                dp->i_d.di_format == XFS_DINODE_FMT_BTREE);
                xfs_trans_log_inode(args->trans, dp,
                                        XFS_ILOG_CORE | XFS_ILOG_ADATA);
        }

        xfs_sbversion_add_attr2(mp, args->trans);

        return(0);
}

/*
 * Look up a name in a shortform attribute list structure.
 */
/*ARGSUSED*/
int
xfs_attr_shortform_lookup(xfs_da_args_t *args)
{
        xfs_attr_shortform_t *sf;
        xfs_attr_sf_entry_t *sfe;
        int i;
        xfs_ifork_t *ifp;

        trace_xfs_attr_sf_lookup(args);

        ifp = args->dp->i_afp;
        ASSERT(ifp->if_flags & XFS_IFINLINE);
        sf = (xfs_attr_shortform_t *)ifp->if_u1.if_data;
        sfe = &sf->list[0];
        for (i = 0; i < sf->hdr.count;
                                sfe = XFS_ATTR_SF_NEXTENTRY(sfe), i++) {
                if (sfe->namelen != args->namelen)
                        continue;
                if (memcmp(args->name, sfe->nameval, args->namelen) != 0)
                        continue;
                if (!xfs_attr_namesp_match(args->flags, sfe->flags))
                        continue;
                return(XFS_ERROR(EEXIST));
        }
        return(XFS_ERROR(ENOATTR));
}

/*
 * Look up a name in a shortform attribute list structure and copy out
 * its value.
 */
/*ARGSUSED*/
int
xfs_attr_shortform_getvalue(xfs_da_args_t *args)
{
        xfs_attr_shortform_t *sf;
        xfs_attr_sf_entry_t *sfe;
        int i;

        ASSERT(args->dp->i_d.di_aformat == XFS_IFINLINE);
        sf = (xfs_attr_shortform_t *)args->dp->i_afp->if_u1.if_data;
        sfe = &sf->list[0];
        for (i = 0; i < sf->hdr.count;
                                sfe = XFS_ATTR_SF_NEXTENTRY(sfe), i++) {
                if (sfe->namelen != args->namelen)
                        continue;
                if (memcmp(args->name, sfe->nameval, args->namelen) != 0)
                        continue;
                if (!xfs_attr_namesp_match(args->flags, sfe->flags))
                        continue;
                if (args->flags & ATTR_KERNOVAL) {
                        args->valuelen = sfe->valuelen;
                        return(XFS_ERROR(EEXIST));
                }
                if (args->valuelen < sfe->valuelen) {
                        args->valuelen = sfe->valuelen;
                        return(XFS_ERROR(ERANGE));
                }
                args->valuelen = sfe->valuelen;
                memcpy(args->value, &sfe->nameval[args->namelen],
                                                    args->valuelen);
                return(XFS_ERROR(EEXIST));
        }
        return(XFS_ERROR(ENOATTR));
}

/*
 * Convert from using the shortform to the leaf.
 */
int
xfs_attr_shortform_to_leaf(xfs_da_args_t *args)
{
        xfs_inode_t *dp;
        xfs_attr_shortform_t *sf;
        xfs_attr_sf_entry_t *sfe;
        xfs_da_args_t nargs;
        char *tmpbuffer;
        int error, i, size;
        xfs_dablk_t blkno;
        struct xfs_buf *bp;
        xfs_ifork_t *ifp;

        trace_xfs_attr_sf_to_leaf(args);

        dp = args->dp;
        ifp = dp->i_afp;
        sf = (xfs_attr_shortform_t *)ifp->if_u1.if_data;
        size = be16_to_cpu(sf->hdr.totsize);
        tmpbuffer = kmem_alloc(size, KM_SLEEP);
        ASSERT(tmpbuffer != NULL);
        memcpy(tmpbuffer, ifp->if_u1.if_data, size);
        sf = (xfs_attr_shortform_t *)tmpbuffer;

        xfs_idata_realloc(dp, -size, XFS_ATTR_FORK);
        bp = NULL;
        error = xfs_da_grow_inode(args, &blkno);
        if (error) {
                /*
                 * If we hit an IO error in the middle of the transaction
                 * inside grow_inode(), we may have inconsistent data.
                 * Bail out.
                 */
                if (error == EIO)
                        goto out;
                xfs_idata_realloc(dp, size, XFS_ATTR_FORK);     /* try to put */
                memcpy(ifp->if_u1.if_data, tmpbuffer, size);    /* it back */
                goto out;
        }

        ASSERT(blkno == 0);
        error = xfs_attr_leaf_create(args, blkno, &bp);
        if (error) {
                error = xfs_da_shrink_inode(args, 0, bp);
                bp = NULL;
                if (error)
                        goto out;
                xfs_idata_realloc(dp, size, XFS_ATTR_FORK);     /* try to put */
                memcpy(ifp->if_u1.if_data, tmpbuffer, size);    /* it back */
                goto out;
        }

        memset((char *)&nargs, 0, sizeof(nargs));
        nargs.dp = dp;
        nargs.firstblock = args->firstblock;
        nargs.flist = args->flist;
        nargs.total = args->total;
        nargs.whichfork = XFS_ATTR_FORK;
        nargs.trans = args->trans;
        nargs.op_flags = XFS_DA_OP_OKNOENT;

        sfe = &sf->list[0];
        for (i = 0; i < sf->hdr.count; i++) {
                nargs.name = sfe->nameval;
                nargs.namelen = sfe->namelen;
                nargs.value = &sfe->nameval[nargs.namelen];
                nargs.valuelen = sfe->valuelen;
                nargs.hashval = xfs_da_hashname(sfe->nameval,
                                                sfe->namelen);
                nargs.flags = XFS_ATTR_NSP_ONDISK_TO_ARGS(sfe->flags);
                error = xfs_attr_leaf_lookup_int(bp, &nargs); /* set a->index */
                ASSERT(error == ENOATTR);
                error = xfs_attr_leaf_add(bp, &nargs);
                ASSERT(error != ENOSPC);
                if (error)
                        goto out;
                sfe = XFS_ATTR_SF_NEXTENTRY(sfe);
        }
        error = 0;

out:
        kmem_free(tmpbuffer);
        return(error);
}

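/*
 * Comparison routine for sorting shortform attribute entries: order by hash
 * value, then by original entry number so the sort is stable.
 */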
STATIC int
xfs_attr_shortform_compare(const void *a, const void *b)
{
        xfs_attr_sf_sort_t *sa, *sb;

        sa = (xfs_attr_sf_sort_t *)a;
        sb = (xfs_attr_sf_sort_t *)b;
        if (sa->hash < sb->hash) {
                return(-1);
        } else if (sa->hash > sb->hash) {
                return(1);
        } else {
                return(sa->entno - sb->entno);
        }
}

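/*
 * A cursor is considered "reset" when it has never been initialised and all
 * of its position fields are still zero.
 */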
#define XFS_ISRESET_CURSOR(cursor) \
        (!((cursor)->initted) && !((cursor)->hashval) && \
         !((cursor)->blkno) && !((cursor)->offset))
/*
 * Copy out entries of shortform attribute lists for attr_list().
 * Shortform attribute lists are not stored in hashval sorted order.
 * If the output buffer is not large enough to hold them all, then we
 * have to calculate each entry's hashvalue and sort them before we
 * can begin returning them to the user.
 */
/*ARGSUSED*/
int
xfs_attr_shortform_list(xfs_attr_list_context_t *context)
{
        attrlist_cursor_kern_t *cursor;
        xfs_attr_sf_sort_t *sbuf, *sbp;
        xfs_attr_shortform_t *sf;
        xfs_attr_sf_entry_t *sfe;
        xfs_inode_t *dp;
        int sbsize, nsbuf, count, i;
        int error;

        ASSERT(context != NULL);
        dp = context->dp;
        ASSERT(dp != NULL);
        ASSERT(dp->i_afp != NULL);
        sf = (xfs_attr_shortform_t *)dp->i_afp->if_u1.if_data;
        ASSERT(sf != NULL);
        if (!sf->hdr.count)
                return(0);
        cursor = context->cursor;
        ASSERT(cursor != NULL);

        trace_xfs_attr_list_sf(context);

        /*
         * If the buffer is large enough and the cursor is at the start,
         * do not bother with sorting since we will return everything in
         * one buffer and another call using the cursor won't need to be
         * made.
         * Note the generous fudge factor of 16 overhead bytes per entry.
         * If bufsize is zero then put_listent must be a search function
         * and can just scan through what we have.
         */
        if (context->bufsize == 0 ||
            (XFS_ISRESET_CURSOR(cursor) &&
             (dp->i_afp->if_bytes + sf->hdr.count * 16) < context->bufsize)) {
                for (i = 0, sfe = &sf->list[0]; i < sf->hdr.count; i++) {
                        error = context->put_listent(context,
                                           sfe->flags,
                                           sfe->nameval,
                                           (int)sfe->namelen,
                                           (int)sfe->valuelen,
                                           &sfe->nameval[sfe->namelen]);

                        /*
                         * Either search callback finished early or
                         * didn't fit it all in the buffer after all.
                         */
                        if (context->seen_enough)
                                break;

                        if (error)
                                return error;
                        sfe = XFS_ATTR_SF_NEXTENTRY(sfe);
                }
                trace_xfs_attr_list_sf_all(context);
                return(0);
        }

        /* do no more for a search callback */
        if (context->bufsize == 0)
                return 0;

        /*
         * It didn't all fit, so we have to sort everything on hashval.
         */
        sbsize = sf->hdr.count * sizeof(*sbuf);
        sbp = sbuf = kmem_alloc(sbsize, KM_SLEEP | KM_NOFS);

        /*
         * Scan the attribute list for the rest of the entries, storing
         * the relevant info from only those that match into a buffer.
         */
        nsbuf = 0;
        for (i = 0, sfe = &sf->list[0]; i < sf->hdr.count; i++) {
                if (unlikely(
                    ((char *)sfe < (char *)sf) ||
                    ((char *)sfe >= ((char *)sf + dp->i_afp->if_bytes)))) {
                        XFS_CORRUPTION_ERROR("xfs_attr_shortform_list",
                                             XFS_ERRLEVEL_LOW,
                                             context->dp->i_mount, sfe);
                        kmem_free(sbuf);
                        return XFS_ERROR(EFSCORRUPTED);
                }

                sbp->entno = i;
                sbp->hash = xfs_da_hashname(sfe->nameval, sfe->namelen);
                sbp->name = sfe->nameval;
                sbp->namelen = sfe->namelen;
                /* These are bytes, and both on-disk, don't endian-flip */
                sbp->valuelen = sfe->valuelen;
                sbp->flags = sfe->flags;
                sfe = XFS_ATTR_SF_NEXTENTRY(sfe);
                sbp++;
                nsbuf++;
        }

        /*
         * Sort the entries on hash then entno.
         */
        xfs_sort(sbuf, nsbuf, sizeof(*sbuf), xfs_attr_shortform_compare);

        /*
         * Re-find our place IN THE SORTED LIST.
         */
        count = 0;
        cursor->initted = 1;
        cursor->blkno = 0;
        for (sbp = sbuf, i = 0; i < nsbuf; i++, sbp++) {
                if (sbp->hash == cursor->hashval) {
                        if (cursor->offset == count) {
                                break;
                        }
                        count++;
                } else if (sbp->hash > cursor->hashval) {
                        break;
                }
        }
        if (i == nsbuf) {
                kmem_free(sbuf);
                return(0);
        }

        /*
         * Loop putting entries into the user buffer.
         */
        for ( ; i < nsbuf; i++, sbp++) {
                if (cursor->hashval != sbp->hash) {
                        cursor->hashval = sbp->hash;
                        cursor->offset = 0;
                }
                error = context->put_listent(context,
                                        sbp->flags,
                                        sbp->name,
                                        sbp->namelen,
                                        sbp->valuelen,
                                        &sbp->name[sbp->namelen]);
                if (error)
                        return error;
                if (context->seen_enough)
                        break;
                cursor->offset++;
        }

        kmem_free(sbuf);
        return(0);
}

/*
 * Check a leaf attribute block to see if all the entries would fit into
 * a shortform attribute list.
 */
int
xfs_attr_shortform_allfit(
        struct xfs_buf  *bp,
        struct xfs_inode *dp)
{
        xfs_attr_leafblock_t *leaf;
        xfs_attr_leaf_entry_t *entry;
        xfs_attr_leaf_name_local_t *name_loc;
        int bytes, i;

        leaf = bp->b_addr;
        ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));

        entry = &leaf->entries[0];
        bytes = sizeof(struct xfs_attr_sf_hdr);
        for (i = 0; i < be16_to_cpu(leaf->hdr.count); entry++, i++) {
                if (entry->flags & XFS_ATTR_INCOMPLETE)
                        continue;               /* don't copy partial entries */
                if (!(entry->flags & XFS_ATTR_LOCAL))
                        return(0);
                name_loc = xfs_attr_leaf_name_local(leaf, i);
                if (name_loc->namelen >= XFS_ATTR_SF_ENTSIZE_MAX)
                        return(0);
                if (be16_to_cpu(name_loc->valuelen) >= XFS_ATTR_SF_ENTSIZE_MAX)
                        return(0);
                bytes += sizeof(struct xfs_attr_sf_entry) - 1
                                + name_loc->namelen
                                + be16_to_cpu(name_loc->valuelen);
        }
        if ((dp->i_mount->m_flags & XFS_MOUNT_ATTR2) &&
            (dp->i_d.di_format != XFS_DINODE_FMT_BTREE) &&
            (bytes == sizeof(struct xfs_attr_sf_hdr)))
                return(-1);
        return(xfs_attr_shortform_bytesfit(dp, bytes));
}

/*
 * Convert a leaf attribute list to shortform attribute list
 */
int
xfs_attr_leaf_to_shortform(
        struct xfs_buf  *bp,
        xfs_da_args_t   *args,
        int             forkoff)
{
        xfs_attr_leafblock_t *leaf;
        xfs_attr_leaf_entry_t *entry;
        xfs_attr_leaf_name_local_t *name_loc;
        xfs_da_args_t nargs;
        xfs_inode_t *dp;
        char *tmpbuffer;
        int error, i;

        trace_xfs_attr_leaf_to_sf(args);

        dp = args->dp;
        tmpbuffer = kmem_alloc(XFS_LBSIZE(dp->i_mount), KM_SLEEP);
        ASSERT(tmpbuffer != NULL);

        ASSERT(bp != NULL);
        memcpy(tmpbuffer, bp->b_addr, XFS_LBSIZE(dp->i_mount));
        leaf = (xfs_attr_leafblock_t *)tmpbuffer;
        ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
        memset(bp->b_addr, 0, XFS_LBSIZE(dp->i_mount));

        /*
         * Clean out the prior contents of the attribute list.
         */
        error = xfs_da_shrink_inode(args, 0, bp);
        if (error)
                goto out;

        if (forkoff == -1) {
                ASSERT(dp->i_mount->m_flags & XFS_MOUNT_ATTR2);
                ASSERT(dp->i_d.di_format != XFS_DINODE_FMT_BTREE);
                xfs_attr_fork_reset(dp, args->trans);
                goto out;
        }

        xfs_attr_shortform_create(args);

        /*
         * Copy the attributes
         */
        memset((char *)&nargs, 0, sizeof(nargs));
        nargs.dp = dp;
        nargs.firstblock = args->firstblock;
        nargs.flist = args->flist;
        nargs.total = args->total;
        nargs.whichfork = XFS_ATTR_FORK;
        nargs.trans = args->trans;
        nargs.op_flags = XFS_DA_OP_OKNOENT;
        entry = &leaf->entries[0];
        for (i = 0; i < be16_to_cpu(leaf->hdr.count); entry++, i++) {
                if (entry->flags & XFS_ATTR_INCOMPLETE)
                        continue;       /* don't copy partial entries */
                if (!entry->nameidx)
                        continue;
                ASSERT(entry->flags & XFS_ATTR_LOCAL);
                name_loc = xfs_attr_leaf_name_local(leaf, i);
                nargs.name = name_loc->nameval;
                nargs.namelen = name_loc->namelen;
                nargs.value = &name_loc->nameval[nargs.namelen];
                nargs.valuelen = be16_to_cpu(name_loc->valuelen);
                nargs.hashval = be32_to_cpu(entry->hashval);
                nargs.flags = XFS_ATTR_NSP_ONDISK_TO_ARGS(entry->flags);
                xfs_attr_shortform_add(&nargs, forkoff);
        }
        error = 0;

out:
        kmem_free(tmpbuffer);
        return(error);
}

/*
 * Convert from using a single leaf to a root node and a leaf.
 */
int
xfs_attr_leaf_to_node(xfs_da_args_t *args)
{
        xfs_attr_leafblock_t *leaf;
        xfs_da_intnode_t *node;
        xfs_inode_t *dp;
        struct xfs_buf *bp1, *bp2;
        xfs_dablk_t blkno;
        int error;

        trace_xfs_attr_leaf_to_node(args);

        dp = args->dp;
        bp1 = bp2 = NULL;
        error = xfs_da_grow_inode(args, &blkno);
        if (error)
                goto out;
        error = xfs_attr_leaf_read(args->trans, args->dp, 0, -1, &bp1);
        if (error)
                goto out;

        bp2 = NULL;
        error = xfs_da_get_buf(args->trans, args->dp, blkno, -1, &bp2,
                               XFS_ATTR_FORK);
        if (error)
                goto out;
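        /*
         * Copy the verifier from the original leaf buffer to the new buffer
         * so the copied leaf block is also verified before it is written.
         */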
        bp2->b_pre_io = bp1->b_pre_io;
        memcpy(bp2->b_addr, bp1->b_addr, XFS_LBSIZE(dp->i_mount));
        bp1 = NULL;
        xfs_trans_log_buf(args->trans, bp2, 0, XFS_LBSIZE(dp->i_mount) - 1);

        /*
         * Set up the new root node.
         */
        error = xfs_da_node_create(args, 0, 1, &bp1, XFS_ATTR_FORK);
        if (error)
                goto out;
        node = bp1->b_addr;
        leaf = bp2->b_addr;
        ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
        /* both on-disk, don't endian-flip twice */
        node->btree[0].hashval =
                leaf->entries[be16_to_cpu(leaf->hdr.count)-1].hashval;
        node->btree[0].before = cpu_to_be32(blkno);
        node->hdr.count = cpu_to_be16(1);
        xfs_trans_log_buf(args->trans, bp1, 0, XFS_LBSIZE(dp->i_mount) - 1);
        error = 0;
out:
        return(error);
}

/*========================================================================
 * Routines used for growing the Btree.
 *========================================================================*/

/*
 * Create the initial contents of a leaf attribute list
 * or a leaf in a node attribute list.
 */
STATIC int
xfs_attr_leaf_create(
        xfs_da_args_t   *args,
        xfs_dablk_t     blkno,
        struct xfs_buf  **bpp)
{
        xfs_attr_leafblock_t *leaf;
        xfs_attr_leaf_hdr_t *hdr;
        xfs_inode_t *dp;
        struct xfs_buf *bp;
        int error;

        trace_xfs_attr_leaf_create(args);

        dp = args->dp;
        ASSERT(dp != NULL);
        error = xfs_da_get_buf(args->trans, args->dp, blkno, -1, &bp,
                                            XFS_ATTR_FORK);
        if (error)
                return(error);
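        /*
         * Attach the write verifier to the newly allocated buffer so the
         * leaf contents are checked before they go to disk.
         */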
        bp->b_pre_io = xfs_attr_leaf_write_verify;
        leaf = bp->b_addr;
        memset((char *)leaf, 0, XFS_LBSIZE(dp->i_mount));
        hdr = &leaf->hdr;
        hdr->info.magic = cpu_to_be16(XFS_ATTR_LEAF_MAGIC);
        hdr->firstused = cpu_to_be16(XFS_LBSIZE(dp->i_mount));
        if (!hdr->firstused) {
                hdr->firstused = cpu_to_be16(
                        XFS_LBSIZE(dp->i_mount) - XFS_ATTR_LEAF_NAME_ALIGN);
        }

        hdr->freemap[0].base = cpu_to_be16(sizeof(xfs_attr_leaf_hdr_t));
        hdr->freemap[0].size = cpu_to_be16(be16_to_cpu(hdr->firstused) -
                                           sizeof(xfs_attr_leaf_hdr_t));

        xfs_trans_log_buf(args->trans, bp, 0, XFS_LBSIZE(dp->i_mount) - 1);

        *bpp = bp;
        return(0);
}

/*
 * Split the leaf node, rebalance, then add the new entry.
 */
int
xfs_attr_leaf_split(xfs_da_state_t *state, xfs_da_state_blk_t *oldblk,
                                   xfs_da_state_blk_t *newblk)
{
        xfs_dablk_t blkno;
        int error;

        trace_xfs_attr_leaf_split(state->args);

        /*
         * Allocate space for a new leaf node.
         */
        ASSERT(oldblk->magic == XFS_ATTR_LEAF_MAGIC);
        error = xfs_da_grow_inode(state->args, &blkno);
        if (error)
                return(error);
        error = xfs_attr_leaf_create(state->args, blkno, &newblk->bp);
        if (error)
                return(error);
        newblk->blkno = blkno;
        newblk->magic = XFS_ATTR_LEAF_MAGIC;

        /*
         * Rebalance the entries across the two leaves.
         * NOTE: rebalance() currently depends on the 2nd block being empty.
         */
        xfs_attr_leaf_rebalance(state, oldblk, newblk);
        error = xfs_da_blk_link(state, oldblk, newblk);
        if (error)
                return(error);

        /*
         * Save info on "old" attribute for "atomic rename" ops, leaf_add()
         * modifies the index/blkno/rmtblk/rmtblkcnt fields to show the
         * "new" attrs info.  Will need the "old" info to remove it later.
         *
         * Insert the "new" entry in the correct block.
         */
        if (state->inleaf) {
                trace_xfs_attr_leaf_add_old(state->args);
                error = xfs_attr_leaf_add(oldblk->bp, state->args);
        } else {
                trace_xfs_attr_leaf_add_new(state->args);
                error = xfs_attr_leaf_add(newblk->bp, state->args);
        }

        /*
         * Update last hashval in each block since we added the name.
         */
        oldblk->hashval = xfs_attr_leaf_lasthash(oldblk->bp, NULL);
        newblk->hashval = xfs_attr_leaf_lasthash(newblk->bp, NULL);
        return(error);
}

/*
 * Add a name to the leaf attribute list structure.
 */
int
xfs_attr_leaf_add(
        struct xfs_buf          *bp,
        struct xfs_da_args      *args)
{
        xfs_attr_leafblock_t *leaf;
        xfs_attr_leaf_hdr_t *hdr;
        xfs_attr_leaf_map_t *map;
        int tablesize, entsize, sum, tmp, i;

        trace_xfs_attr_leaf_add(args);

        leaf = bp->b_addr;
        ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
        ASSERT((args->index >= 0)
                && (args->index <= be16_to_cpu(leaf->hdr.count)));
        hdr = &leaf->hdr;
        entsize = xfs_attr_leaf_newentsize(args->namelen, args->valuelen,
                           args->trans->t_mountp->m_sb.sb_blocksize, NULL);

        /*
         * Search through freemap for first-fit on new name length.
         * (may need to figure in size of entry struct too)
         */
        tablesize = (be16_to_cpu(hdr->count) + 1)
                                        * sizeof(xfs_attr_leaf_entry_t)
                                        + sizeof(xfs_attr_leaf_hdr_t);
        map = &hdr->freemap[XFS_ATTR_LEAF_MAPSIZE-1];
        for (sum = 0, i = XFS_ATTR_LEAF_MAPSIZE-1; i >= 0; map--, i--) {
                if (tablesize > be16_to_cpu(hdr->firstused)) {
                        sum += be16_to_cpu(map->size);
                        continue;
                }
                if (!map->size)
                        continue;       /* no space in this map */
                tmp = entsize;
                if (be16_to_cpu(map->base) < be16_to_cpu(hdr->firstused))
                        tmp += sizeof(xfs_attr_leaf_entry_t);
                if (be16_to_cpu(map->size) >= tmp) {
                        tmp = xfs_attr_leaf_add_work(bp, args, i);
                        return(tmp);
                }
                sum += be16_to_cpu(map->size);
        }

        /*
         * If there are no holes in the address space of the block,
         * and we don't have enough freespace, then compaction will do us
         * no good and we should just give up.
         */
        if (!hdr->holes && (sum < entsize))
                return(XFS_ERROR(ENOSPC));

        /*
         * Compact the entries to coalesce free space.
         * This may change the hdr->count via dropping INCOMPLETE entries.
         */
        xfs_attr_leaf_compact(args, bp);

        /*
         * After compaction, the block is guaranteed to have only one
         * free region, in freemap[0].  If it is not big enough, give up.
         */
        if (be16_to_cpu(hdr->freemap[0].size)
                                < (entsize + sizeof(xfs_attr_leaf_entry_t)))
                return(XFS_ERROR(ENOSPC));

        return(xfs_attr_leaf_add_work(bp, args, 0));
}

/*
 * Add a name to a leaf attribute list structure.
 */
STATIC int
xfs_attr_leaf_add_work(
        struct xfs_buf  *bp,
        xfs_da_args_t   *args,
        int             mapindex)
{
        xfs_attr_leafblock_t *leaf;
        xfs_attr_leaf_hdr_t *hdr;
        xfs_attr_leaf_entry_t *entry;
        xfs_attr_leaf_name_local_t *name_loc;
        xfs_attr_leaf_name_remote_t *name_rmt;
        xfs_attr_leaf_map_t *map;
        xfs_mount_t *mp;
        int tmp, i;

        trace_xfs_attr_leaf_add_work(args);

        leaf = bp->b_addr;
        ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
        hdr = &leaf->hdr;
        ASSERT((mapindex >= 0) && (mapindex < XFS_ATTR_LEAF_MAPSIZE));
        ASSERT((args->index >= 0) && (args->index <= be16_to_cpu(hdr->count)));

        /*
         * Force open some space in the entry array and fill it in.
         */
        entry = &leaf->entries[args->index];
        if (args->index < be16_to_cpu(hdr->count)) {
                tmp  = be16_to_cpu(hdr->count) - args->index;
                tmp *= sizeof(xfs_attr_leaf_entry_t);
                memmove((char *)(entry+1), (char *)entry, tmp);
                xfs_trans_log_buf(args->trans, bp,
                    XFS_DA_LOGRANGE(leaf, entry, tmp + sizeof(*entry)));
        }
        be16_add_cpu(&hdr->count, 1);

        /*
         * Allocate space for the new string (at the end of the run).
         */
        map = &hdr->freemap[mapindex];
        mp = args->trans->t_mountp;
        ASSERT(be16_to_cpu(map->base) < XFS_LBSIZE(mp));
        ASSERT((be16_to_cpu(map->base) & 0x3) == 0);
        ASSERT(be16_to_cpu(map->size) >=
                xfs_attr_leaf_newentsize(args->namelen, args->valuelen,
                                         mp->m_sb.sb_blocksize, NULL));
        ASSERT(be16_to_cpu(map->size) < XFS_LBSIZE(mp));
        ASSERT((be16_to_cpu(map->size) & 0x3) == 0);
        be16_add_cpu(&map->size,
                -xfs_attr_leaf_newentsize(args->namelen, args->valuelen,
                                          mp->m_sb.sb_blocksize, &tmp));
        entry->nameidx = cpu_to_be16(be16_to_cpu(map->base) +
                                     be16_to_cpu(map->size));
        entry->hashval = cpu_to_be32(args->hashval);
        entry->flags = tmp ? XFS_ATTR_LOCAL : 0;
        entry->flags |= XFS_ATTR_NSP_ARGS_TO_ONDISK(args->flags);
        if (args->op_flags & XFS_DA_OP_RENAME) {
                entry->flags |= XFS_ATTR_INCOMPLETE;
                if ((args->blkno2 == args->blkno) &&
                    (args->index2 <= args->index)) {
                        args->index2++;
                }
        }
        xfs_trans_log_buf(args->trans, bp,
                          XFS_DA_LOGRANGE(leaf, entry, sizeof(*entry)));
        ASSERT((args->index == 0) ||
               (be32_to_cpu(entry->hashval) >= be32_to_cpu((entry-1)->hashval)));
        ASSERT((args->index == be16_to_cpu(hdr->count)-1) ||
               (be32_to_cpu(entry->hashval) <= be32_to_cpu((entry+1)->hashval)));

        /*
         * For "remote" attribute values, simply note that we need to
         * allocate space for the "remote" value.  We can't actually
         * allocate the extents in this transaction, and we can't decide
         * which blocks they should be as we might allocate more blocks
         * as part of this transaction (a split operation for example).
         */
        if (entry->flags & XFS_ATTR_LOCAL) {
                name_loc = xfs_attr_leaf_name_local(leaf, args->index);
                name_loc->namelen = args->namelen;
                name_loc->valuelen = cpu_to_be16(args->valuelen);
                memcpy((char *)name_loc->nameval, args->name, args->namelen);
                memcpy((char *)&name_loc->nameval[args->namelen], args->value,
                                   be16_to_cpu(name_loc->valuelen));
        } else {
                name_rmt = xfs_attr_leaf_name_remote(leaf, args->index);
                name_rmt->namelen = args->namelen;
                memcpy((char *)name_rmt->name, args->name, args->namelen);
                entry->flags |= XFS_ATTR_INCOMPLETE;
                /* just in case */
                name_rmt->valuelen = 0;
                name_rmt->valueblk = 0;
                args->rmtblkno = 1;
                args->rmtblkcnt = XFS_B_TO_FSB(mp, args->valuelen);
        }
        xfs_trans_log_buf(args->trans, bp,
             XFS_DA_LOGRANGE(leaf, xfs_attr_leaf_name(leaf, args->index),
                                   xfs_attr_leaf_entsize(leaf, args->index)));

        /*
         * Update the control info for this leaf node
         */
        if (be16_to_cpu(entry->nameidx) < be16_to_cpu(hdr->firstused)) {
                /* both on-disk, don't endian-flip twice */
                hdr->firstused = entry->nameidx;
        }
        ASSERT(be16_to_cpu(hdr->firstused) >=
               ((be16_to_cpu(hdr->count) * sizeof(*entry)) + sizeof(*hdr)));
        tmp = (be16_to_cpu(hdr->count)-1) * sizeof(xfs_attr_leaf_entry_t)
                                        + sizeof(xfs_attr_leaf_hdr_t);
        map = &hdr->freemap[0];
        for (i = 0; i < XFS_ATTR_LEAF_MAPSIZE; map++, i++) {
                if (be16_to_cpu(map->base) == tmp) {
                        be16_add_cpu(&map->base, sizeof(xfs_attr_leaf_entry_t));
                        be16_add_cpu(&map->size,
                                 -((int)sizeof(xfs_attr_leaf_entry_t)));
                }
        }
        be16_add_cpu(&hdr->usedbytes, xfs_attr_leaf_entsize(leaf, args->index));
        xfs_trans_log_buf(args->trans, bp,
                XFS_DA_LOGRANGE(leaf, hdr, sizeof(*hdr)));
        return(0);
}

/*
 * Garbage collect a leaf attribute list block by copying it to a new buffer.
 */
STATIC void
xfs_attr_leaf_compact(
        struct xfs_da_args      *args,
        struct xfs_buf          *bp)
{
        xfs_attr_leafblock_t    *leaf_s, *leaf_d;
        xfs_attr_leaf_hdr_t     *hdr_s, *hdr_d;
        struct xfs_trans        *trans = args->trans;
        struct xfs_mount        *mp = trans->t_mountp;
        char                    *tmpbuffer;

        trace_xfs_attr_leaf_compact(args);

        tmpbuffer = kmem_alloc(XFS_LBSIZE(mp), KM_SLEEP);
        ASSERT(tmpbuffer != NULL);
        memcpy(tmpbuffer, bp->b_addr, XFS_LBSIZE(mp));
        memset(bp->b_addr, 0, XFS_LBSIZE(mp));

        /*
         * Copy basic information
         */
        leaf_s = (xfs_attr_leafblock_t *)tmpbuffer;
        leaf_d = bp->b_addr;
        hdr_s = &leaf_s->hdr;
        hdr_d = &leaf_d->hdr;
        hdr_d->info = hdr_s->info;      /* struct copy */
        hdr_d->firstused = cpu_to_be16(XFS_LBSIZE(mp));
        /* handle truncation gracefully */
        if (!hdr_d->firstused) {
                hdr_d->firstused = cpu_to_be16(
                                XFS_LBSIZE(mp) - XFS_ATTR_LEAF_NAME_ALIGN);
        }
        hdr_d->usedbytes = 0;
        hdr_d->count = 0;
        hdr_d->holes = 0;
        hdr_d->freemap[0].base = cpu_to_be16(sizeof(xfs_attr_leaf_hdr_t));
        hdr_d->freemap[0].size = cpu_to_be16(be16_to_cpu(hdr_d->firstused) -
                                             sizeof(xfs_attr_leaf_hdr_t));

        /*
         * Copy all entries in the same (sorted) order,
         * but allocate name/value pairs packed and in sequence.
         */
        xfs_attr_leaf_moveents(leaf_s, 0, leaf_d, 0,
                                be16_to_cpu(hdr_s->count), mp);
        xfs_trans_log_buf(trans, bp, 0, XFS_LBSIZE(mp) - 1);

        kmem_free(tmpbuffer);
}

/*
 * Redistribute the attribute list entries between two leaf nodes,
 * taking into account the size of the new entry.
 *
 * NOTE: if new block is empty, then it will get the upper half of the
 * old block.  At present, all (one) callers pass in an empty second block.
 *
 * This code adjusts the args->index/blkno and args->index2/blkno2 fields
 * to match what it is doing in splitting the attribute leaf block.  Those
 * values are used in "atomic rename" operations on attributes.  Note that
 * the "new" and "old" values can end up in different blocks.
 */
STATIC void
xfs_attr_leaf_rebalance(xfs_da_state_t *state, xfs_da_state_blk_t *blk1,
                                       xfs_da_state_blk_t *blk2)
{
        xfs_da_args_t *args;
        xfs_da_state_blk_t *tmp_blk;
        xfs_attr_leafblock_t *leaf1, *leaf2;
        xfs_attr_leaf_hdr_t *hdr1, *hdr2;
        int count, totallen, max, space, swap;

        /*
         * Set up environment.
         */
        ASSERT(blk1->magic == XFS_ATTR_LEAF_MAGIC);
        ASSERT(blk2->magic == XFS_ATTR_LEAF_MAGIC);
        leaf1 = blk1->bp->b_addr;
        leaf2 = blk2->bp->b_addr;
        ASSERT(leaf1->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
        ASSERT(leaf2->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
        ASSERT(leaf2->hdr.count == 0);
        args = state->args;

        trace_xfs_attr_leaf_rebalance(args);

        /*
         * Check ordering of blocks, reverse if it makes things simpler.
         *
         * NOTE: Given that all (current) callers pass in an empty
         * second block, this code should never set "swap".
         */
        swap = 0;
        if (xfs_attr_leaf_order(blk1->bp, blk2->bp)) {
                tmp_blk = blk1;
                blk1 = blk2;
                blk2 = tmp_blk;
                leaf1 = blk1->bp->b_addr;
                leaf2 = blk2->bp->b_addr;
                swap = 1;
        }
        hdr1 = &leaf1->hdr;
        hdr2 = &leaf2->hdr;

        /*
         * Examine entries until we reduce the absolute difference in
         * byte usage between the two blocks to a minimum.  Then get
         * the direction to copy and the number of elements to move.
         *
         * "inleaf" is true if the new entry should be inserted into blk1.
         * If "swap" is also true, then reverse the sense of "inleaf".
         */
        state->inleaf = xfs_attr_leaf_figure_balance(state, blk1, blk2,
                                                            &count, &totallen);
        if (swap)
                state->inleaf = !state->inleaf;

        /*
         * Move any entries required from leaf to leaf:
         */
        if (count < be16_to_cpu(hdr1->count)) {
                /*
                 * Figure the total bytes to be added to the destination leaf.
                 */
                /* number entries being moved */
                count = be16_to_cpu(hdr1->count) - count;
                space  = be16_to_cpu(hdr1->usedbytes) - totallen;
                space += count * sizeof(xfs_attr_leaf_entry_t);

                /*
                 * leaf2 is the destination, compact it if it looks tight.
                 */
                max  = be16_to_cpu(hdr2->firstused)
                                                - sizeof(xfs_attr_leaf_hdr_t);
                max -= be16_to_cpu(hdr2->count) * sizeof(xfs_attr_leaf_entry_t);
                if (space > max)
                        xfs_attr_leaf_compact(args, blk2->bp);

                /*
                 * Move high entries from leaf1 to low end of leaf2.
                 */
                xfs_attr_leaf_moveents(leaf1, be16_to_cpu(hdr1->count) - count,
                                leaf2, 0, count, state->mp);

                xfs_trans_log_buf(args->trans, blk1->bp, 0, state->blocksize-1);
                xfs_trans_log_buf(args->trans, blk2->bp, 0, state->blocksize-1);
        } else if (count > be16_to_cpu(hdr1->count)) {
                /*
                 * I assert that since all callers pass in an empty
                 * second buffer, this code should never execute.
                 */
                ASSERT(0);

                /*
                 * Figure the total bytes to be added to the destination leaf.
                 */
                /* number entries being moved */
                count -= be16_to_cpu(hdr1->count);
                space  = totallen - be16_to_cpu(hdr1->usedbytes);
                space += count * sizeof(xfs_attr_leaf_entry_t);

                /*
                 * leaf1 is the destination, compact it if it looks tight.
                 */
                max  = be16_to_cpu(hdr1->firstused)
                                                - sizeof(xfs_attr_leaf_hdr_t);
                max -= be16_to_cpu(hdr1->count) * sizeof(xfs_attr_leaf_entry_t);
                if (space > max)
                        xfs_attr_leaf_compact(args, blk1->bp);

                /*
                 * Move low entries from leaf2 to high end of leaf1.
                 */
                xfs_attr_leaf_moveents(leaf2, 0, leaf1,
                                be16_to_cpu(hdr1->count), count, state->mp);

                xfs_trans_log_buf(args->trans, blk1->bp, 0, state->blocksize-1);
                xfs_trans_log_buf(args->trans, blk2->bp, 0, state->blocksize-1);
        }

        /*
         * Copy out last hashval in each block for B-tree code.
         */
        blk1->hashval = be32_to_cpu(
                leaf1->entries[be16_to_cpu(leaf1->hdr.count)-1].hashval);
        blk2->hashval = be32_to_cpu(
                leaf2->entries[be16_to_cpu(leaf2->hdr.count)-1].hashval);

        /*
         * Adjust the expected index for insertion.
         * NOTE: this code depends on the (current) situation that the
         * second block was originally empty.
         *
         * If the insertion point moved to the 2nd block, we must adjust
         * the index.  We must also track the entry just following the
         * new entry for use in an "atomic rename" operation, that entry
         * is always the "old" entry and the "new" entry is what we are
         * inserting.  The index/blkno fields refer to the "old" entry,
         * while the index2/blkno2 fields refer to the "new" entry.
         */
        if (blk1->index > be16_to_cpu(leaf1->hdr.count)) {
                ASSERT(state->inleaf == 0);
                blk2->index = blk1->index - be16_to_cpu(leaf1->hdr.count);
                args->index = args->index2 = blk2->index;
                args->blkno = args->blkno2 = blk2->blkno;
        } else if (blk1->index == be16_to_cpu(leaf1->hdr.count)) {
                if (state->inleaf) {
                        args->index = blk1->index;
                        args->blkno = blk1->blkno;
                        args->index2 = 0;
                        args->blkno2 = blk2->blkno;
                } else {
                        /*
                         * On a double leaf split, the original attr location
                         * is already stored in blkno2/index2, so don't
                         * overwrite it, otherwise we corrupt the tree.
                         */
                        blk2->index = blk1->index
                                        - be16_to_cpu(leaf1->hdr.count);
                        args->index = blk2->index;
                        args->blkno = blk2->blkno;
                        if (!state->extravalid) {
                                /*
                                 * set the new attr location to match the old
                                 * one and let the higher level split code
                                 * decide where in the leaf to place it.
                                 */
                                args->index2 = blk2->index;
                                args->blkno2 = blk2->blkno;
                        }
                }
        } else {
                ASSERT(state->inleaf == 1);
                args->index = args->index2 = blk1->index;
                args->blkno = args->blkno2 = blk1->blkno;
        }
}

/*
 * Examine entries until we reduce the absolute difference in
 * byte usage between the two blocks to a minimum.
 * GROT: Is this really necessary?  With other than a 512 byte blocksize,
 * GROT: there will always be enough room in either block for a new entry.
 * GROT: Do a double-split for this case?
 */
STATIC int
xfs_attr_leaf_figure_balance(xfs_da_state_t *state,
                                    xfs_da_state_blk_t *blk1,
                                    xfs_da_state_blk_t *blk2,
                                    int *countarg, int *usedbytesarg)
{
        xfs_attr_leafblock_t *leaf1, *leaf2;
        xfs_attr_leaf_hdr_t *hdr1, *hdr2;
        xfs_attr_leaf_entry_t *entry;
        int count, max, index, totallen, half;
        int lastdelta, foundit, tmp;

        /*
         * Set up environment.
         */
        leaf1 = blk1->bp->b_addr;
        leaf2 = blk2->bp->b_addr;
        hdr1 = &leaf1->hdr;
        hdr2 = &leaf2->hdr;
        foundit = 0;
        totallen = 0;

        /*
         * Examine entries until we reduce the absolute difference in
         * byte usage between the two blocks to a minimum.
         */
        max = be16_to_cpu(hdr1->count) + be16_to_cpu(hdr2->count);
        half  = (max+1) * sizeof(*entry);
        half += be16_to_cpu(hdr1->usedbytes) +
                be16_to_cpu(hdr2->usedbytes) +
                xfs_attr_leaf_newentsize(
                                state->args->namelen,
                                state->args->valuelen,
                                state->blocksize, NULL);
        half /= 2;
        lastdelta = state->blocksize;
        entry = &leaf1->entries[0];
        for (count = index = 0; count < max; entry++, index++, count++) {

#define XFS_ATTR_ABS(A) (((A) < 0) ? -(A) : (A))
                /*
                 * The new entry is in the first block, account for it.
                 */
                if (count == blk1->index) {
                        tmp = totallen + sizeof(*entry) +
                                xfs_attr_leaf_newentsize(
                                                state->args->namelen,
                                                state->args->valuelen,
                                                state->blocksize, NULL);
                        if (XFS_ATTR_ABS(half - tmp) > lastdelta)
                                break;
                        lastdelta = XFS_ATTR_ABS(half - tmp);
                        totallen = tmp;
                        foundit = 1;
                }

                /*
                 * Wrap around into the second block if necessary.
                 */
                if (count == be16_to_cpu(hdr1->count)) {
                        leaf1 = leaf2;
                        entry = &leaf1->entries[0];
                        index = 0;
                }

                /*
                 * Figure out if next leaf entry would be too much.
                 */
                tmp = totallen + sizeof(*entry) + xfs_attr_leaf_entsize(leaf1,
                                                                        index);
                if (XFS_ATTR_ABS(half - tmp) > lastdelta)
                        break;
                lastdelta = XFS_ATTR_ABS(half - tmp);
                totallen = tmp;
#undef XFS_ATTR_ABS
        }

        /*
         * Calculate the number of usedbytes that will end up in lower block.
         * If new entry not in lower block, fix up the count.
         */
        totallen -= count * sizeof(*entry);
        if (foundit) {
                totallen -= sizeof(*entry) +
                                xfs_attr_leaf_newentsize(
                                                state->args->namelen,
                                                state->args->valuelen,
                                                state->blocksize, NULL);
        }

        *countarg = count;
        *usedbytesarg = totallen;
        return(foundit);
}

1602/*========================================================================
1603 * Routines used for shrinking the Btree.
1604 *========================================================================*/
1605
1606/*
1607 * Check a leaf block and its neighbors to see if the block should be
1608 * collapsed into one or the other neighbor. Always keep the block
1609 * with the smaller block number.
1610 * If the current block is over 50% full, don't try to join it, return 0.
1611 * If the block is empty, fill in the state structure and return 2.
1612 * If it can be collapsed, fill in the state structure and return 1.
1613 * If nothing can be done, return 0.
1614 *
1615 * GROT: allow for INCOMPLETE entries in calculation.
1616 */
1617int
1618xfs_attr_leaf_toosmall(xfs_da_state_t *state, int *action)
1619{
1620 xfs_attr_leafblock_t *leaf;
1621 xfs_da_state_blk_t *blk;
1622 xfs_da_blkinfo_t *info;
1623 int count, bytes, forward, error, retval, i;
1624 xfs_dablk_t blkno;
1d9025e5 1625 struct xfs_buf *bp;
1da177e4 1626
ee73259b
DC
1627 trace_xfs_attr_leaf_toosmall(state->args);
1628
1da177e4
LT
1629 /*
1630 * Check for the degenerate case of the block being over 50% full.
1631 * If so, it's not worth even looking to see if we might be able
1632 * to coalesce with a sibling.
1633 */
1634 blk = &state->path.blk[ state->path.active-1 ];
1d9025e5 1635 info = blk->bp->b_addr;
69ef921b 1636 ASSERT(info->magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
1da177e4 1637 leaf = (xfs_attr_leafblock_t *)info;
918ae424 1638 count = be16_to_cpu(leaf->hdr.count);
1da177e4
LT
1639 bytes = sizeof(xfs_attr_leaf_hdr_t) +
1640 count * sizeof(xfs_attr_leaf_entry_t) +
918ae424 1641 be16_to_cpu(leaf->hdr.usedbytes);
1da177e4
LT
1642 if (bytes > (state->blocksize >> 1)) {
1643 *action = 0; /* blk over 50%, don't try to join */
1644 return(0);
1645 }
1646
1647 /*
1648 * Check for the degenerate case of the block being empty.
1649 * If the block is empty, we'll simply delete it, no need to
1650	 * coalesce it with a sibling block.  We choose (arbitrarily)
1651	 * to merge with the forward block unless it is NULL.
1652	 */
1653	if (count == 0) {
1654		/*
1655		 * Make altpath point to the block we want to keep and
1656		 * path point to the block we want to drop (this one).
1657		 */
1658		forward = (info->forw != 0);
1659 memcpy(&state->altpath, &state->path, sizeof(state->path));
1660 error = xfs_da_path_shift(state, &state->altpath, forward,
1661 0, &retval);
1662 if (error)
1663 return(error);
1664 if (retval) {
1665 *action = 0;
1666 } else {
1667 *action = 2;
1668 }
1669 return(0);
1670 }
1671
1672 /*
1673 * Examine each sibling block to see if we can coalesce with
1674 * at least 25% free space to spare. We need to figure out
1675 * whether to merge with the forward or the backward block.
1676 * We prefer coalescing with the lower numbered sibling so as
1677 * to shrink an attribute list over time.
1678 */
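	/*
	 * Illustrative arithmetic for the check below (e.g. with a
	 * 4096-byte block): the budget is 4096 - 1024 = 3072 bytes, i.e.
	 * 75% of the block.  Both leaves' usedbytes, the combined entry
	 * table and one header must fit in that budget, which is what
	 * leaves "at least 25% to spare" after the join.
	 */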
1679 /* start with smaller blk num */
1680	forward = (be32_to_cpu(info->forw) < be32_to_cpu(info->back));
1681	for (i = 0; i < 2; forward = !forward, i++) {
1682		if (forward)
1683			blkno = be32_to_cpu(info->forw);
1684		else
1685			blkno = be32_to_cpu(info->back);
1686		if (blkno == 0)
1687			continue;
1688		error = xfs_attr_leaf_read(state->args->trans, state->args->dp,
1689					blkno, -1, &bp);
1690		if (error)
1691			return(error);
1692
1693		leaf = (xfs_attr_leafblock_t *)info;
1694		count  = be16_to_cpu(leaf->hdr.count);
1695		bytes  = state->blocksize - (state->blocksize>>2);
1696		bytes -= be16_to_cpu(leaf->hdr.usedbytes);
1697		leaf = bp->b_addr;
1698		count += be16_to_cpu(leaf->hdr.count);
1699		bytes -= be16_to_cpu(leaf->hdr.usedbytes);
1700		bytes -= count * sizeof(xfs_attr_leaf_entry_t);
1701		bytes -= sizeof(xfs_attr_leaf_hdr_t);
1702		xfs_trans_brelse(state->args->trans, bp);
1703 if (bytes >= 0)
1704 break; /* fits with at least 25% to spare */
1705 }
1706 if (i >= 2) {
1707 *action = 0;
1708 return(0);
1709 }
1710
1711 /*
1712 * Make altpath point to the block we want to keep (the lower
1713 * numbered block) and path point to the block we want to drop.
1714 */
1715 memcpy(&state->altpath, &state->path, sizeof(state->path));
1716 if (blkno < blk->blkno) {
1717 error = xfs_da_path_shift(state, &state->altpath, forward,
1718 0, &retval);
1719 } else {
1720 error = xfs_da_path_shift(state, &state->path, forward,
1721 0, &retval);
1722 }
1723 if (error)
1724 return(error);
1725 if (retval) {
1726 *action = 0;
1727 } else {
1728 *action = 1;
1729 }
1730 return(0);
1731}
1732
1733/*
1734 * Remove a name from the leaf attribute list structure.
1735 *
1736 * Return 1 if leaf is less than 37% full, 0 if >= 37% full.
1737 * If two leaves are 37% full, when combined they will leave 25% free.
1738 */
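/*
 * Worked example of the threshold (assuming a 4096-byte block): 37% of
 * 4096 is roughly 1515 bytes, so two leaves each at or below that level
 * sum to about 74% of one block and can be joined while still leaving
 * the ~25% slack that xfs_attr_leaf_toosmall() looks for.
 */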
1739int
1740xfs_attr_leaf_remove(
1741	struct xfs_buf	*bp,
1742	xfs_da_args_t	*args)
1743{
1744	xfs_attr_leafblock_t *leaf;
1745	xfs_attr_leaf_hdr_t *hdr;
1746	xfs_attr_leaf_map_t *map;
1747	xfs_attr_leaf_entry_t *entry;
1748	int before, after, smallest, entsize;
1749	int tablesize, tmp, i;
1750	xfs_mount_t *mp;
1751
1752	trace_xfs_attr_leaf_remove(args);
1753
1754	leaf = bp->b_addr;
1755	ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
1756	hdr = &leaf->hdr;
1757	mp = args->trans->t_mountp;
1758	ASSERT((be16_to_cpu(hdr->count) > 0)
1759		&& (be16_to_cpu(hdr->count) < (XFS_LBSIZE(mp)/8)));
1760	ASSERT((args->index >= 0)
1761		&& (args->index < be16_to_cpu(hdr->count)));
1762	ASSERT(be16_to_cpu(hdr->firstused) >=
1763	       ((be16_to_cpu(hdr->count) * sizeof(*entry)) + sizeof(*hdr)));
1764	entry = &leaf->entries[args->index];
1765	ASSERT(be16_to_cpu(entry->nameidx) >= be16_to_cpu(hdr->firstused));
1766	ASSERT(be16_to_cpu(entry->nameidx) < XFS_LBSIZE(mp));
1767
1768 /*
1769 * Scan through free region table:
1770 * check for adjacency of free'd entry with an existing one,
1771 * find smallest free region in case we need to replace it,
1772 * adjust any map that borders the entry table,
1773 */
1774	tablesize = be16_to_cpu(hdr->count) * sizeof(xfs_attr_leaf_entry_t)
1775					+ sizeof(xfs_attr_leaf_hdr_t);
1776	map = &hdr->freemap[0];
1777	tmp = be16_to_cpu(map->size);
1778	before = after = -1;
1779	smallest = XFS_ATTR_LEAF_MAPSIZE - 1;
1780	entsize = xfs_attr_leaf_entsize(leaf, args->index);
1781	for (i = 0; i < XFS_ATTR_LEAF_MAPSIZE; map++, i++) {
1782		ASSERT(be16_to_cpu(map->base) < XFS_LBSIZE(mp));
1783		ASSERT(be16_to_cpu(map->size) < XFS_LBSIZE(mp));
1784		if (be16_to_cpu(map->base) == tablesize) {
1785			be16_add_cpu(&map->base,
1786					-((int)sizeof(xfs_attr_leaf_entry_t)));
1787			be16_add_cpu(&map->size, sizeof(xfs_attr_leaf_entry_t));
1788		}
1789
1790		if ((be16_to_cpu(map->base) + be16_to_cpu(map->size))
1791				== be16_to_cpu(entry->nameidx)) {
1792			before = i;
1793		} else if (be16_to_cpu(map->base)
1794			== (be16_to_cpu(entry->nameidx) + entsize)) {
1795			after = i;
1796		} else if (be16_to_cpu(map->size) < tmp) {
1797			tmp = be16_to_cpu(map->size);
1798 smallest = i;
1799 }
1800 }
1801
1802 /*
1803 * Coalesce adjacent freemap regions,
1804 * or replace the smallest region.
1805 */
1806 if ((before >= 0) || (after >= 0)) {
1807 if ((before >= 0) && (after >= 0)) {
1808 map = &hdr->freemap[before];
1809			be16_add_cpu(&map->size, entsize);
1810			be16_add_cpu(&map->size,
1811				 be16_to_cpu(hdr->freemap[after].size));
1812			hdr->freemap[after].base = 0;
1813			hdr->freemap[after].size = 0;
1814		} else if (before >= 0) {
1815			map = &hdr->freemap[before];
1816			be16_add_cpu(&map->size, entsize);
1817		} else {
1818			map = &hdr->freemap[after];
1819			/* both on-disk, don't endian flip twice */
1820			map->base = entry->nameidx;
1821			be16_add_cpu(&map->size, entsize);
1822		}
1823	} else {
1824		/*
1825		 * Replace smallest region (if it is smaller than free'd entry)
1826		 */
1827		map = &hdr->freemap[smallest];
1828		if (be16_to_cpu(map->size) < entsize) {
1829			map->base = cpu_to_be16(be16_to_cpu(entry->nameidx));
1830			map->size = cpu_to_be16(entsize);
1831 }
1832 }
1833
1834 /*
1835 * Did we remove the first entry?
1836 */
1837	if (be16_to_cpu(entry->nameidx) == be16_to_cpu(hdr->firstused))
1838		smallest = 1;
1839	else
1840		smallest = 0;
1841
1842	/*
1843	 * Compress the remaining entries and zero out the removed stuff.
1844	 */
1845	memset(xfs_attr_leaf_name(leaf, args->index), 0, entsize);
1846	be16_add_cpu(&hdr->usedbytes, -entsize);
1847	xfs_trans_log_buf(args->trans, bp,
1848	     XFS_DA_LOGRANGE(leaf, xfs_attr_leaf_name(leaf, args->index),
1849				   entsize));
1850
1851	tmp = (be16_to_cpu(hdr->count) - args->index)
1852					* sizeof(xfs_attr_leaf_entry_t);
1853	memmove((char *)entry, (char *)(entry+1), tmp);
1854	be16_add_cpu(&hdr->count, -1);
1855	xfs_trans_log_buf(args->trans, bp,
1856	    XFS_DA_LOGRANGE(leaf, entry, tmp + sizeof(*entry)));
1857	entry = &leaf->entries[be16_to_cpu(hdr->count)];
1858 memset((char *)entry, 0, sizeof(xfs_attr_leaf_entry_t));
1859
1860 /*
1861 * If we removed the first entry, re-find the first used byte
1862 * in the name area. Note that if the entry was the "firstused",
1863 * then we don't have a "hole" in our block resulting from
1864 * removing the name.
1865 */
1866 if (smallest) {
1867 tmp = XFS_LBSIZE(mp);
1868 entry = &leaf->entries[0];
1869		for (i = be16_to_cpu(hdr->count)-1; i >= 0; entry++, i--) {
1870			ASSERT(be16_to_cpu(entry->nameidx) >=
1871			       be16_to_cpu(hdr->firstused));
1872			ASSERT(be16_to_cpu(entry->nameidx) < XFS_LBSIZE(mp));
1873
1874			if (be16_to_cpu(entry->nameidx) < tmp)
1875				tmp = be16_to_cpu(entry->nameidx);
1876		}
1877		hdr->firstused = cpu_to_be16(tmp);
1878		if (!hdr->firstused) {
1879			hdr->firstused = cpu_to_be16(
1880					tmp - XFS_ATTR_LEAF_NAME_ALIGN);
1881		}
1882	} else {
1883		hdr->holes = 1;		/* mark as needing compaction */
1884	}
1885	xfs_trans_log_buf(args->trans, bp,
1886 XFS_DA_LOGRANGE(leaf, hdr, sizeof(*hdr)));
1887
1888 /*
1889	 * Check if the leaf is below the 37% "magic" threshold
1890	 * (mp->m_attr_magicpct); if so, the caller may want to "join" it with a sibling.
1891 */
1892 tmp = sizeof(xfs_attr_leaf_hdr_t);
1893 tmp += be16_to_cpu(leaf->hdr.count) * sizeof(xfs_attr_leaf_entry_t);
1894 tmp += be16_to_cpu(leaf->hdr.usedbytes);
1895 return(tmp < mp->m_attr_magicpct); /* leaf is < 37% full */
1896}
1897
1898/*
1899 * Move all the attribute list entries from drop_leaf into save_leaf.
1900 */
1901void
1902xfs_attr_leaf_unbalance(xfs_da_state_t *state, xfs_da_state_blk_t *drop_blk,
1903 xfs_da_state_blk_t *save_blk)
1904{
1905 xfs_attr_leafblock_t *drop_leaf, *save_leaf, *tmp_leaf;
1906 xfs_attr_leaf_hdr_t *drop_hdr, *save_hdr, *tmp_hdr;
1907 xfs_mount_t *mp;
1908 char *tmpbuffer;
1909
1910 trace_xfs_attr_leaf_unbalance(state->args);
1911
1912 /*
1913 * Set up environment.
1914 */
1915 mp = state->mp;
1916 ASSERT(drop_blk->magic == XFS_ATTR_LEAF_MAGIC);
1917 ASSERT(save_blk->magic == XFS_ATTR_LEAF_MAGIC);
1918 drop_leaf = drop_blk->bp->b_addr;
1919 save_leaf = save_blk->bp->b_addr;
1920 ASSERT(drop_leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
1921 ASSERT(save_leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
1922 drop_hdr = &drop_leaf->hdr;
1923 save_hdr = &save_leaf->hdr;
1924
1925 /*
1926 * Save last hashval from dying block for later Btree fixup.
1927 */
1928 drop_blk->hashval = be32_to_cpu(
1929 drop_leaf->entries[be16_to_cpu(drop_leaf->hdr.count)-1].hashval);
1930
1931 /*
1932 * Check if we need a temp buffer, or can we do it in place.
1933 * Note that we don't check "leaf" for holes because we will
1934 * always be dropping it, toosmall() decided that for us already.
1935 */
1936 if (save_hdr->holes == 0) {
1937 /*
1938 * dest leaf has no holes, so we add there. May need
1939 * to make some room in the entry array.
1940 */
1941 if (xfs_attr_leaf_order(save_blk->bp, drop_blk->bp)) {
1942 xfs_attr_leaf_moveents(drop_leaf, 0, save_leaf, 0,
1943				be16_to_cpu(drop_hdr->count), mp);
1944		} else {
1945			xfs_attr_leaf_moveents(drop_leaf, 0, save_leaf,
1946				  be16_to_cpu(save_hdr->count),
1947				  be16_to_cpu(drop_hdr->count), mp);
1948 }
1949 } else {
1950 /*
1951 * Destination has holes, so we make a temporary copy
1952 * of the leaf and add them both to that.
1953 */
1954 tmpbuffer = kmem_alloc(state->blocksize, KM_SLEEP);
1955 ASSERT(tmpbuffer != NULL);
1956 memset(tmpbuffer, 0, state->blocksize);
1957 tmp_leaf = (xfs_attr_leafblock_t *)tmpbuffer;
1958 tmp_hdr = &tmp_leaf->hdr;
1959 tmp_hdr->info = save_hdr->info; /* struct copy */
1960 tmp_hdr->count = 0;
1961		tmp_hdr->firstused = cpu_to_be16(state->blocksize);
1962		if (!tmp_hdr->firstused) {
1963			tmp_hdr->firstused = cpu_to_be16(
1964				state->blocksize - XFS_ATTR_LEAF_NAME_ALIGN);
1965		}
1966		tmp_hdr->usedbytes = 0;
1967		if (xfs_attr_leaf_order(save_blk->bp, drop_blk->bp)) {
1968			xfs_attr_leaf_moveents(drop_leaf, 0, tmp_leaf, 0,
1969				be16_to_cpu(drop_hdr->count), mp);
1970			xfs_attr_leaf_moveents(save_leaf, 0, tmp_leaf,
1971				  be16_to_cpu(tmp_leaf->hdr.count),
1972				  be16_to_cpu(save_hdr->count), mp);
1973		} else {
1974			xfs_attr_leaf_moveents(save_leaf, 0, tmp_leaf, 0,
1975				be16_to_cpu(save_hdr->count), mp);
1976			xfs_attr_leaf_moveents(drop_leaf, 0, tmp_leaf,
1977				  be16_to_cpu(tmp_leaf->hdr.count),
1978				  be16_to_cpu(drop_hdr->count), mp);
1979 }
1980 memcpy((char *)save_leaf, (char *)tmp_leaf, state->blocksize);
1981		kmem_free(tmpbuffer);
1982	}
1983
1984	xfs_trans_log_buf(state->args->trans, save_blk->bp, 0,
1985 state->blocksize - 1);
1986
1987 /*
1988 * Copy out last hashval in each block for B-tree code.
1989 */
1990 save_blk->hashval = be32_to_cpu(
1991 save_leaf->entries[be16_to_cpu(save_leaf->hdr.count)-1].hashval);
1992}
1993
1994/*========================================================================
1995 * Routines used for finding things in the Btree.
1996 *========================================================================*/
1997
1998/*
1999 * Look up a name in a leaf attribute list structure.
2000 * This is the internal routine, it uses the caller's buffer.
2001 *
2002 * Note that duplicate keys are allowed, but only check within the
2003 * current leaf node. The Btree code must check in adjacent leaf nodes.
2004 *
2005 * Return in args->index the index into the entry[] array of either
2006 * the found entry, or where the entry should have been (insert before
2007 * that entry).
2008 *
2009 * Don't change the args->value unless we find the attribute.
2010 */
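/*
 * Illustrative caller sketch (hypothetical variable names) showing how
 * the two return codes are typically consumed:
 *
 *	error = xfs_attr_leaf_lookup_int(bp, args);
 *	if (error == EEXIST) {
 *		// found: args->index identifies the entry, and for a
 *		// remote value args->rmtblkno/rmtblkcnt are filled in
 *	} else if (error == ENOATTR) {
 *		// not found: args->index is where it would be inserted
 *	}
 */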
2011int
2012xfs_attr_leaf_lookup_int(
2013 struct xfs_buf *bp,
2014 xfs_da_args_t *args)
2015{
2016 xfs_attr_leafblock_t *leaf;
2017 xfs_attr_leaf_entry_t *entry;
2018 xfs_attr_leaf_name_local_t *name_loc;
2019 xfs_attr_leaf_name_remote_t *name_rmt;
2020 int probe, span;
2021 xfs_dahash_t hashval;
2022
2023 trace_xfs_attr_leaf_lookup(args);
2024
2025	leaf = bp->b_addr;
2026	ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
2027	ASSERT(be16_to_cpu(leaf->hdr.count)
2028 < (XFS_LBSIZE(args->dp->i_mount)/8));
2029
2030 /*
2031 * Binary search. (note: small blocks will skip this loop)
2032 */
2033 hashval = args->hashval;
2034	probe = span = be16_to_cpu(leaf->hdr.count) / 2;
2035	for (entry = &leaf->entries[probe]; span > 4;
2036		   entry = &leaf->entries[probe]) {
2037		span /= 2;
2038		if (be32_to_cpu(entry->hashval) < hashval)
2039			probe += span;
2040		else if (be32_to_cpu(entry->hashval) > hashval)
2041 probe -= span;
2042 else
2043 break;
2044 }
2045	ASSERT((probe >= 0) &&
2046	       (!leaf->hdr.count
2047	       || (probe < be16_to_cpu(leaf->hdr.count))));
2048	ASSERT((span <= 4) || (be32_to_cpu(entry->hashval) == hashval));
2049
2050 /*
2051 * Since we may have duplicate hashval's, find the first matching
2052 * hashval in the leaf.
2053 */
2054	while ((probe > 0) && (be32_to_cpu(entry->hashval) >= hashval)) {
2055 entry--;
2056 probe--;
2057 }
2058 while ((probe < be16_to_cpu(leaf->hdr.count)) &&
2059 (be32_to_cpu(entry->hashval) < hashval)) {
2060 entry++;
2061 probe++;
2062 }
2063 if ((probe == be16_to_cpu(leaf->hdr.count)) ||
2064 (be32_to_cpu(entry->hashval) != hashval)) {
2065 args->index = probe;
2066 return(XFS_ERROR(ENOATTR));
2067 }
2068
2069 /*
2070 * Duplicate keys may be present, so search all of them for a match.
2071 */
2072 for ( ; (probe < be16_to_cpu(leaf->hdr.count)) &&
2073 (be32_to_cpu(entry->hashval) == hashval);
2074 entry++, probe++) {
2075/*
2076 * GROT: Add code to remove incomplete entries.
2077 */
2078 /*
2079 * If we are looking for INCOMPLETE entries, show only those.
2080 * If we are looking for complete entries, show only those.
2081 */
2082 if ((args->flags & XFS_ATTR_INCOMPLETE) !=
2083 (entry->flags & XFS_ATTR_INCOMPLETE)) {
2084 continue;
2085 }
2086 if (entry->flags & XFS_ATTR_LOCAL) {
2087			name_loc = xfs_attr_leaf_name_local(leaf, probe);
2088 if (name_loc->namelen != args->namelen)
2089 continue;
2090			if (memcmp(args->name, (char *)name_loc->nameval, args->namelen) != 0)
2091				continue;
2092			if (!xfs_attr_namesp_match(args->flags, entry->flags))
2093 continue;
2094 args->index = probe;
2095 return(XFS_ERROR(EEXIST));
2096 } else {
2097			name_rmt = xfs_attr_leaf_name_remote(leaf, probe);
2098 if (name_rmt->namelen != args->namelen)
2099 continue;
2100 if (memcmp(args->name, (char *)name_rmt->name,
2101 args->namelen) != 0)
2102 continue;
726801ba 2103 if (!xfs_attr_namesp_match(args->flags, entry->flags))
1da177e4
LT
2104 continue;
2105 args->index = probe;
2106			args->rmtblkno = be32_to_cpu(name_rmt->valueblk);
2107			args->rmtblkcnt = XFS_B_TO_FSB(args->dp->i_mount,
2108						   be32_to_cpu(name_rmt->valuelen));
2109 return(XFS_ERROR(EEXIST));
2110 }
2111 }
2112 args->index = probe;
2113 return(XFS_ERROR(ENOATTR));
2114}
2115
2116/*
2117 * Get the value associated with an attribute name from a leaf attribute
2118 * list structure.
2119 */
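/*
 * Callers can probe for the size first by passing ATTR_KERNOVAL, in
 * which case only args->valuelen is filled in; if a buffer is supplied
 * but is too small, ERANGE is returned and args->valuelen again reports
 * the length that is actually required.
 */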
2120int
2121xfs_attr_leaf_getvalue(
2122 struct xfs_buf *bp,
2123 xfs_da_args_t *args)
2124{
2125 int valuelen;
2126 xfs_attr_leafblock_t *leaf;
2127 xfs_attr_leaf_entry_t *entry;
2128 xfs_attr_leaf_name_local_t *name_loc;
2129 xfs_attr_leaf_name_remote_t *name_rmt;
2130
2131	leaf = bp->b_addr;
2132	ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
2133	ASSERT(be16_to_cpu(leaf->hdr.count)
2134					< (XFS_LBSIZE(args->dp->i_mount)/8));
2135	ASSERT(args->index < be16_to_cpu(leaf->hdr.count));
2136
2137 entry = &leaf->entries[args->index];
2138 if (entry->flags & XFS_ATTR_LOCAL) {
2139		name_loc = xfs_attr_leaf_name_local(leaf, args->index);
2140 ASSERT(name_loc->namelen == args->namelen);
2141 ASSERT(memcmp(args->name, name_loc->nameval, args->namelen) == 0);
2142		valuelen = be16_to_cpu(name_loc->valuelen);
2143 if (args->flags & ATTR_KERNOVAL) {
2144 args->valuelen = valuelen;
2145 return(0);
2146 }
2147 if (args->valuelen < valuelen) {
2148 args->valuelen = valuelen;
2149 return(XFS_ERROR(ERANGE));
2150 }
2151 args->valuelen = valuelen;
2152 memcpy(args->value, &name_loc->nameval[args->namelen], valuelen);
2153 } else {
2154		name_rmt = xfs_attr_leaf_name_remote(leaf, args->index);
2155 ASSERT(name_rmt->namelen == args->namelen);
2156 ASSERT(memcmp(args->name, name_rmt->name, args->namelen) == 0);
2157 valuelen = be32_to_cpu(name_rmt->valuelen);
2158 args->rmtblkno = be32_to_cpu(name_rmt->valueblk);
2159 args->rmtblkcnt = XFS_B_TO_FSB(args->dp->i_mount, valuelen);
2160 if (args->flags & ATTR_KERNOVAL) {
2161 args->valuelen = valuelen;
2162 return(0);
2163 }
2164 if (args->valuelen < valuelen) {
2165 args->valuelen = valuelen;
2166 return(XFS_ERROR(ERANGE));
2167 }
2168 args->valuelen = valuelen;
2169 }
2170 return(0);
2171}
2172
2173/*========================================================================
2174 * Utility routines.
2175 *========================================================================*/
2176
2177/*
2178 * Move the indicated entries from one leaf to another.
2179 * NOTE: this routine modifies both source and destination leaves.
2180 */
2181/*ARGSUSED*/
2182STATIC void
2183xfs_attr_leaf_moveents(xfs_attr_leafblock_t *leaf_s, int start_s,
2184 xfs_attr_leafblock_t *leaf_d, int start_d,
2185 int count, xfs_mount_t *mp)
2186{
2187 xfs_attr_leaf_hdr_t *hdr_s, *hdr_d;
2188 xfs_attr_leaf_entry_t *entry_s, *entry_d;
2189 int desti, tmp, i;
2190
2191 /*
2192 * Check for nothing to do.
2193 */
2194 if (count == 0)
2195 return;
2196
2197 /*
2198 * Set up environment.
2199 */
2200 ASSERT(leaf_s->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
2201 ASSERT(leaf_d->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
2202 hdr_s = &leaf_s->hdr;
2203 hdr_d = &leaf_d->hdr;
2204 ASSERT((be16_to_cpu(hdr_s->count) > 0) &&
2205 (be16_to_cpu(hdr_s->count) < (XFS_LBSIZE(mp)/8)));
2206 ASSERT(be16_to_cpu(hdr_s->firstused) >=
2207 ((be16_to_cpu(hdr_s->count)
2208					* sizeof(*entry_s))+sizeof(*hdr_s)));
2209 ASSERT(be16_to_cpu(hdr_d->count) < (XFS_LBSIZE(mp)/8));
2210 ASSERT(be16_to_cpu(hdr_d->firstused) >=
2211 ((be16_to_cpu(hdr_d->count)
1da177e4
LT
2212 * sizeof(*entry_d))+sizeof(*hdr_d)));
2213
918ae424
NS
2214 ASSERT(start_s < be16_to_cpu(hdr_s->count));
2215 ASSERT(start_d <= be16_to_cpu(hdr_d->count));
2216 ASSERT(count <= be16_to_cpu(hdr_s->count));
1da177e4
LT
2217
2218 /*
2219 * Move the entries in the destination leaf up to make a hole?
2220 */
2221 if (start_d < be16_to_cpu(hdr_d->count)) {
2222 tmp = be16_to_cpu(hdr_d->count) - start_d;
2223 tmp *= sizeof(xfs_attr_leaf_entry_t);
2224 entry_s = &leaf_d->entries[start_d];
2225 entry_d = &leaf_d->entries[start_d + count];
2226 memmove((char *)entry_d, (char *)entry_s, tmp);
2227 }
2228
2229 /*
2230 * Copy all entry's in the same (sorted) order,
2231 * but allocate attribute info packed and in sequence.
2232 */
2233 entry_s = &leaf_s->entries[start_s];
2234 entry_d = &leaf_d->entries[start_d];
2235 desti = start_d;
2236 for (i = 0; i < count; entry_s++, entry_d++, desti++, i++) {
2237		ASSERT(be16_to_cpu(entry_s->nameidx)
2238				>= be16_to_cpu(hdr_s->firstused));
2239 tmp = xfs_attr_leaf_entsize(leaf_s, start_s + i);
2240#ifdef GROT
2241 /*
2242 * Code to drop INCOMPLETE entries. Difficult to use as we
2243 * may also need to change the insertion index. Code turned
2244 * off for 6.2, should be revisited later.
2245 */
2246 if (entry_s->flags & XFS_ATTR_INCOMPLETE) { /* skip partials? */
2247			memset(xfs_attr_leaf_name(leaf_s, start_s + i), 0, tmp);
2248			be16_add_cpu(&hdr_s->usedbytes, -tmp);
2249			be16_add_cpu(&hdr_s->count, -1);
2250 entry_d--; /* to compensate for ++ in loop hdr */
2251 desti--;
2252 if ((start_s + i) < offset)
2253 result++; /* insertion index adjustment */
2254 } else {
2255#endif /* GROT */
2256		be16_add_cpu(&hdr_d->firstused, -tmp);
2257 /* both on-disk, don't endian flip twice */
2258 entry_d->hashval = entry_s->hashval;
2259 /* both on-disk, don't endian flip twice */
2260 entry_d->nameidx = hdr_d->firstused;
2261 entry_d->flags = entry_s->flags;
2262		ASSERT(be16_to_cpu(entry_d->nameidx) + tmp
2263							<= XFS_LBSIZE(mp));
2264		memmove(xfs_attr_leaf_name(leaf_d, desti),
2265			xfs_attr_leaf_name(leaf_s, start_s + i), tmp);
2266		ASSERT(be16_to_cpu(entry_s->nameidx) + tmp
2267							<= XFS_LBSIZE(mp));
2268		memset(xfs_attr_leaf_name(leaf_s, start_s + i), 0, tmp);
2269 be16_add_cpu(&hdr_s->usedbytes, -tmp);
2270 be16_add_cpu(&hdr_d->usedbytes, tmp);
2271 be16_add_cpu(&hdr_s->count, -1);
2272 be16_add_cpu(&hdr_d->count, 1);
2273		tmp = be16_to_cpu(hdr_d->count)
2274 * sizeof(xfs_attr_leaf_entry_t)
2275 + sizeof(xfs_attr_leaf_hdr_t);
2276		ASSERT(be16_to_cpu(hdr_d->firstused) >= tmp);
2277#ifdef GROT
2278 }
2279#endif /* GROT */
2280 }
2281
2282 /*
2283 * Zero out the entries we just copied.
2284 */
2285	if (start_s == be16_to_cpu(hdr_s->count)) {
2286 tmp = count * sizeof(xfs_attr_leaf_entry_t);
2287 entry_s = &leaf_s->entries[start_s];
2288 ASSERT(((char *)entry_s + tmp) <=
2289 ((char *)leaf_s + XFS_LBSIZE(mp)));
2290 memset((char *)entry_s, 0, tmp);
2291 } else {
2292 /*
2293 * Move the remaining entries down to fill the hole,
2294 * then zero the entries at the top.
2295 */
2296		tmp = be16_to_cpu(hdr_s->count) - count;
2297 tmp *= sizeof(xfs_attr_leaf_entry_t);
2298 entry_s = &leaf_s->entries[start_s + count];
2299 entry_d = &leaf_s->entries[start_s];
2300 memmove((char *)entry_d, (char *)entry_s, tmp);
2301
2302 tmp = count * sizeof(xfs_attr_leaf_entry_t);
2303		entry_s = &leaf_s->entries[be16_to_cpu(hdr_s->count)];
2304 ASSERT(((char *)entry_s + tmp) <=
2305 ((char *)leaf_s + XFS_LBSIZE(mp)));
2306 memset((char *)entry_s, 0, tmp);
2307 }
2308
2309 /*
2310 * Fill in the freemap information
2311 */
2312	hdr_d->freemap[0].base = cpu_to_be16(sizeof(xfs_attr_leaf_hdr_t));
2313	be16_add_cpu(&hdr_d->freemap[0].base, be16_to_cpu(hdr_d->count) *
2314			sizeof(xfs_attr_leaf_entry_t));
2315	hdr_d->freemap[0].size = cpu_to_be16(be16_to_cpu(hdr_d->firstused)
2316			      - be16_to_cpu(hdr_d->freemap[0].base));
2317 hdr_d->freemap[1].base = 0;
2318 hdr_d->freemap[2].base = 0;
2319 hdr_d->freemap[1].size = 0;
2320 hdr_d->freemap[2].size = 0;
2321 hdr_s->holes = 1; /* leaf may not be compact */
2322}
2323
2324/*
2325 * Compare two leaf blocks "order".
2326 * Return 0 unless leaf2 should go before leaf1.
2327 */
2328int
2329xfs_attr_leaf_order(
2330 struct xfs_buf *leaf1_bp,
2331 struct xfs_buf *leaf2_bp)
2332{
2333 xfs_attr_leafblock_t *leaf1, *leaf2;
2334
2335 leaf1 = leaf1_bp->b_addr;
2336 leaf2 = leaf2_bp->b_addr;
2337 ASSERT((leaf1->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC)) &&
2338 (leaf2->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC)));
2339 if ((be16_to_cpu(leaf1->hdr.count) > 0) &&
2340 (be16_to_cpu(leaf2->hdr.count) > 0) &&
2341 ((be32_to_cpu(leaf2->entries[0].hashval) <
2342 be32_to_cpu(leaf1->entries[0].hashval)) ||
2343 (be32_to_cpu(leaf2->entries[
2344 be16_to_cpu(leaf2->hdr.count)-1].hashval) <
2345 be32_to_cpu(leaf1->entries[
2346 be16_to_cpu(leaf1->hdr.count)-1].hashval)))) {
2347 return(1);
2348 }
2349 return(0);
2350}
2351
2352/*
2353 * Pick up the last hashvalue from a leaf block.
2354 */
2355xfs_dahash_t
2356xfs_attr_leaf_lasthash(
2357 struct xfs_buf *bp,
2358 int *count)
2359{
2360 xfs_attr_leafblock_t *leaf;
2361
2362	leaf = bp->b_addr;
2363	ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
2364	if (count)
2365		*count = be16_to_cpu(leaf->hdr.count);
2366 if (!leaf->hdr.count)
2367 return(0);
2368	return be32_to_cpu(leaf->entries[be16_to_cpu(leaf->hdr.count)-1].hashval);
2369}
2370
2371/*
2372 * Calculate the number of bytes used to store the indicated attribute
2373 * (whether local or remote only calculate bytes in this block).
2374 */
2375STATIC int
2376xfs_attr_leaf_entsize(xfs_attr_leafblock_t *leaf, int index)
2377{
2378 xfs_attr_leaf_name_local_t *name_loc;
2379 xfs_attr_leaf_name_remote_t *name_rmt;
2380 int size;
2381
2382	ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
2383	if (leaf->entries[index].flags & XFS_ATTR_LOCAL) {
2384 name_loc = xfs_attr_leaf_name_local(leaf, index);
2385 size = xfs_attr_leaf_entsize_local(name_loc->namelen,
2386						   be16_to_cpu(name_loc->valuelen));
2387	} else {
2388 name_rmt = xfs_attr_leaf_name_remote(leaf, index);
2389 size = xfs_attr_leaf_entsize_remote(name_rmt->namelen);
1da177e4
LT
2390 }
2391 return(size);
2392}
2393
2394/*
2395 * Calculate the number of bytes that would be required to store the new
2396 * attribute (whether local or remote only calculate bytes in this block).
2397 * This routine decides as a side effect whether the attribute will be
2398 * a "local" or a "remote" attribute.
2399 */
2400int
2401xfs_attr_leaf_newentsize(int namelen, int valuelen, int blocksize, int *local)
2402{
2403 int size;
2404
2405 size = xfs_attr_leaf_entsize_local(namelen, valuelen);
2406 if (size < xfs_attr_leaf_entsize_local_max(blocksize)) {
2407 if (local) {
2408 *local = 1;
2409 }
2410 } else {
2411		size = xfs_attr_leaf_entsize_remote(namelen);
2412 if (local) {
2413 *local = 0;
2414 }
2415 }
2416 return(size);
2417}
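/*
 * Illustrative use (a sketch, not taken verbatim from a caller): pass a
 * non-NULL "local" pointer when the caller needs to know whether the
 * value will be stored inline in the leaf block.
 *
 *	int local;
 *	size = xfs_attr_leaf_newentsize(args->namelen, args->valuelen,
 *					state->blocksize, &local);
 *	if (local) {
 *		// name and value both live in this leaf block
 *	} else {
 *		// value goes to remote blocks; "size" only covers the
 *		// name plus the remote-value header kept in this block
 *	}
 */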
2418
2419/*
2420 * Copy out attribute list entries for attr_list(), for leaf attribute lists.
2421 */
2422int
2423xfs_attr_leaf_list_int(
2424 struct xfs_buf *bp,
2425 xfs_attr_list_context_t *context)
2426{
2427 attrlist_cursor_kern_t *cursor;
2428 xfs_attr_leafblock_t *leaf;
2429 xfs_attr_leaf_entry_t *entry;
2430 int retval, i;
2431
2432 ASSERT(bp != NULL);
2433	leaf = bp->b_addr;
2434 cursor = context->cursor;
2435 cursor->initted = 1;
2436
2437	trace_xfs_attr_list_leaf(context);
2438
2439 /*
2440 * Re-find our place in the leaf block if this is a new syscall.
2441 */
2442 if (context->resynch) {
2443 entry = &leaf->entries[0];
2444		for (i = 0; i < be16_to_cpu(leaf->hdr.count); entry++, i++) {
2445			if (be32_to_cpu(entry->hashval) == cursor->hashval) {
2446 if (cursor->offset == context->dupcnt) {
2447 context->dupcnt = 0;
2448 break;
2449 }
2450 context->dupcnt++;
2451 } else if (be32_to_cpu(entry->hashval) >
2452 cursor->hashval) {
2453 context->dupcnt = 0;
2454 break;
2455 }
2456 }
2457		if (i == be16_to_cpu(leaf->hdr.count)) {
2458			trace_xfs_attr_list_notfound(context);
2459 return(0);
2460 }
2461 } else {
2462 entry = &leaf->entries[0];
2463 i = 0;
2464 }
2465 context->resynch = 0;
2466
2467 /*
2468 * We have found our place, start copying out the new attributes.
2469 */
2470 retval = 0;
2471	for ( ; (i < be16_to_cpu(leaf->hdr.count)); entry++, i++) {
2472		if (be32_to_cpu(entry->hashval) != cursor->hashval) {
2473			cursor->hashval = be32_to_cpu(entry->hashval);
2474 cursor->offset = 0;
2475 }
2476
2477 if (entry->flags & XFS_ATTR_INCOMPLETE)
2478 continue; /* skip incomplete entries */
2479
2480 if (entry->flags & XFS_ATTR_LOCAL) {
2481			xfs_attr_leaf_name_local_t *name_loc =
2482				xfs_attr_leaf_name_local(leaf, i);
2483
2484			retval = context->put_listent(context,
2485						entry->flags,
2486						name_loc->nameval,
2487						(int)name_loc->namelen,
2488						be16_to_cpu(name_loc->valuelen),
2489						&name_loc->nameval[name_loc->namelen]);
2490			if (retval)
2491				return retval;
2492		} else {
2493			xfs_attr_leaf_name_remote_t *name_rmt =
2494				xfs_attr_leaf_name_remote(leaf, i);
2495
2496 int valuelen = be32_to_cpu(name_rmt->valuelen);
2497
2498 if (context->put_value) {
2499 xfs_da_args_t args;
2500
2501 memset((char *)&args, 0, sizeof(args));
2502 args.dp = context->dp;
2503 args.whichfork = XFS_ATTR_FORK;
2504 args.valuelen = valuelen;
2505				args.value = kmem_alloc(valuelen, KM_SLEEP | KM_NOFS);
2506 args.rmtblkno = be32_to_cpu(name_rmt->valueblk);
2507 args.rmtblkcnt = XFS_B_TO_FSB(args.dp->i_mount, valuelen);
2508 retval = xfs_attr_rmtval_get(&args);
2509 if (retval)
2510 return retval;
2511 retval = context->put_listent(context,
ad9b463a 2512 entry->flags,
a9273ca5 2513 name_rmt->name,
726801ba
TS
2514 (int)name_rmt->namelen,
2515 valuelen,
2516							args.value);
2517				kmem_free(args.value);
2518			} else {
2519				retval = context->put_listent(context,
2520							entry->flags,
2521							name_rmt->name,
2522 (int)name_rmt->namelen,
2523 valuelen,
2524 NULL);
2525 }
2526 if (retval)
2527 return retval;
2528		}
2529 if (context->seen_enough)
2530 break;
2531 cursor->offset++;
2532	}
2533	trace_xfs_attr_list_leaf_end(context);
2534 return(retval);
2535}
2536
2537
2538/*========================================================================
2539 * Manage the INCOMPLETE flag in a leaf entry
2540 *========================================================================*/
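/*
 * Background: an entry carries XFS_ATTR_INCOMPLETE while a
 * multi-transaction operation is still in flight (e.g. while a remote
 * value is being written out, or while a rename briefly keeps both the
 * old and the new entry), and lookups only return entries whose
 * INCOMPLETE state matches what the caller asked for.  The helpers
 * below clear or set that flag once an operation is known to have
 * completed, or atomically exchange it between two entries.
 */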
2541
2542/*
2543 * Clear the INCOMPLETE flag on an entry in a leaf block.
2544 */
2545int
2546xfs_attr_leaf_clearflag(xfs_da_args_t *args)
2547{
2548 xfs_attr_leafblock_t *leaf;
2549 xfs_attr_leaf_entry_t *entry;
2550 xfs_attr_leaf_name_remote_t *name_rmt;
2551	struct xfs_buf *bp;
2552 int error;
2553#ifdef DEBUG
2554 xfs_attr_leaf_name_local_t *name_loc;
2555 int namelen;
2556 char *name;
2557#endif /* DEBUG */
2558
2559	trace_xfs_attr_leaf_clearflag(args);
2560 /*
2561 * Set up the operation.
2562 */
2563	error = xfs_attr_leaf_read(args->trans, args->dp, args->blkno, -1, &bp);
2564	if (error)
2565		return(error);
2566
2567	leaf = bp->b_addr;
2568	ASSERT(args->index < be16_to_cpu(leaf->hdr.count));
2569 ASSERT(args->index >= 0);
2570 entry = &leaf->entries[ args->index ];
2571 ASSERT(entry->flags & XFS_ATTR_INCOMPLETE);
2572
2573#ifdef DEBUG
2574 if (entry->flags & XFS_ATTR_LOCAL) {
2575		name_loc = xfs_attr_leaf_name_local(leaf, args->index);
2576 namelen = name_loc->namelen;
2577 name = (char *)name_loc->nameval;
2578 } else {
2579		name_rmt = xfs_attr_leaf_name_remote(leaf, args->index);
2580 namelen = name_rmt->namelen;
2581 name = (char *)name_rmt->name;
2582 }
2583	ASSERT(be32_to_cpu(entry->hashval) == args->hashval);
2584 ASSERT(namelen == args->namelen);
2585 ASSERT(memcmp(name, args->name, namelen) == 0);
2586#endif /* DEBUG */
2587
2588 entry->flags &= ~XFS_ATTR_INCOMPLETE;
2589	xfs_trans_log_buf(args->trans, bp,
2590 XFS_DA_LOGRANGE(leaf, entry, sizeof(*entry)));
2591
2592 if (args->rmtblkno) {
2593 ASSERT((entry->flags & XFS_ATTR_LOCAL) == 0);
2594		name_rmt = xfs_attr_leaf_name_remote(leaf, args->index);
2595		name_rmt->valueblk = cpu_to_be32(args->rmtblkno);
2596		name_rmt->valuelen = cpu_to_be32(args->valuelen);
2597		xfs_trans_log_buf(args->trans, bp,
2598 XFS_DA_LOGRANGE(leaf, name_rmt, sizeof(*name_rmt)));
2599 }
2600
2601 /*
2602 * Commit the flag value change and start the next trans in series.
2603 */
2604	return xfs_trans_roll(&args->trans, args->dp);
2605}
2606
2607/*
2608 * Set the INCOMPLETE flag on an entry in a leaf block.
2609 */
2610int
2611xfs_attr_leaf_setflag(xfs_da_args_t *args)
2612{
2613 xfs_attr_leafblock_t *leaf;
2614 xfs_attr_leaf_entry_t *entry;
2615 xfs_attr_leaf_name_remote_t *name_rmt;
2616	struct xfs_buf *bp;
2617 int error;
2618
2619 trace_xfs_attr_leaf_setflag(args);
2620
2621 /*
2622 * Set up the operation.
2623 */
2624	error = xfs_attr_leaf_read(args->trans, args->dp, args->blkno, -1, &bp);
2625	if (error)
2626		return(error);
2627
2628	leaf = bp->b_addr;
2629	ASSERT(args->index < be16_to_cpu(leaf->hdr.count));
2630 ASSERT(args->index >= 0);
2631 entry = &leaf->entries[ args->index ];
2632
2633 ASSERT((entry->flags & XFS_ATTR_INCOMPLETE) == 0);
2634 entry->flags |= XFS_ATTR_INCOMPLETE;
2635	xfs_trans_log_buf(args->trans, bp,
2636 XFS_DA_LOGRANGE(leaf, entry, sizeof(*entry)));
2637 if ((entry->flags & XFS_ATTR_LOCAL) == 0) {
2638		name_rmt = xfs_attr_leaf_name_remote(leaf, args->index);
2639 name_rmt->valueblk = 0;
2640 name_rmt->valuelen = 0;
2641		xfs_trans_log_buf(args->trans, bp,
2642 XFS_DA_LOGRANGE(leaf, name_rmt, sizeof(*name_rmt)));
2643 }
2644
2645 /*
2646 * Commit the flag value change and start the next trans in series.
2647 */
2648	return xfs_trans_roll(&args->trans, args->dp);
2649}
2650
2651/*
2652 * In a single transaction, clear the INCOMPLETE flag on the leaf entry
2653 * given by args->blkno/index and set the INCOMPLETE flag on the leaf
2654 * entry given by args->blkno2/index2.
2655 *
2656 * Note that they could be in different blocks, or in the same block.
2657 */
2658int
2659xfs_attr_leaf_flipflags(xfs_da_args_t *args)
2660{
2661 xfs_attr_leafblock_t *leaf1, *leaf2;
2662 xfs_attr_leaf_entry_t *entry1, *entry2;
2663 xfs_attr_leaf_name_remote_t *name_rmt;
2664	struct xfs_buf *bp1, *bp2;
2665 int error;
2666#ifdef DEBUG
2667 xfs_attr_leaf_name_local_t *name_loc;
2668 int namelen1, namelen2;
2669 char *name1, *name2;
2670#endif /* DEBUG */
2671
5a5881cd
DC
2672 trace_xfs_attr_leaf_flipflags(args);
2673
1da177e4
LT
2674 /*
2675 * Read the block containing the "old" attr
2676 */
2677 error = xfs_attr_leaf_read(args->trans, args->dp, args->blkno, -1, &bp1);
2678 if (error)
2679 return error;
2680
2681 /*
2682 * Read the block containing the "new" attr, if it is different
2683 */
2684 if (args->blkno2 != args->blkno) {
2685 error = xfs_attr_leaf_read(args->trans, args->dp, args->blkno2,
2686 -1, &bp2);
2687 if (error)
2688 return error;
2689 } else {
2690 bp2 = bp1;
2691 }
2692
2693	leaf1 = bp1->b_addr;
2694	ASSERT(args->index < be16_to_cpu(leaf1->hdr.count));
2695 ASSERT(args->index >= 0);
2696 entry1 = &leaf1->entries[ args->index ];
2697
2698	leaf2 = bp2->b_addr;
2699	ASSERT(args->index2 < be16_to_cpu(leaf2->hdr.count));
2700 ASSERT(args->index2 >= 0);
2701 entry2 = &leaf2->entries[ args->index2 ];
2702
2703#ifdef DEBUG
2704 if (entry1->flags & XFS_ATTR_LOCAL) {
2705		name_loc = xfs_attr_leaf_name_local(leaf1, args->index);
2706 namelen1 = name_loc->namelen;
2707 name1 = (char *)name_loc->nameval;
2708 } else {
2709		name_rmt = xfs_attr_leaf_name_remote(leaf1, args->index);
2710 namelen1 = name_rmt->namelen;
2711 name1 = (char *)name_rmt->name;
2712 }
2713 if (entry2->flags & XFS_ATTR_LOCAL) {
2714		name_loc = xfs_attr_leaf_name_local(leaf2, args->index2);
2715 namelen2 = name_loc->namelen;
2716 name2 = (char *)name_loc->nameval;
2717 } else {
2718		name_rmt = xfs_attr_leaf_name_remote(leaf2, args->index2);
2719 namelen2 = name_rmt->namelen;
2720 name2 = (char *)name_rmt->name;
2721 }
2722	ASSERT(be32_to_cpu(entry1->hashval) == be32_to_cpu(entry2->hashval));
2723 ASSERT(namelen1 == namelen2);
2724 ASSERT(memcmp(name1, name2, namelen1) == 0);
2725#endif /* DEBUG */
2726
2727 ASSERT(entry1->flags & XFS_ATTR_INCOMPLETE);
2728 ASSERT((entry2->flags & XFS_ATTR_INCOMPLETE) == 0);
2729
2730 entry1->flags &= ~XFS_ATTR_INCOMPLETE;
2731	xfs_trans_log_buf(args->trans, bp1,
2732 XFS_DA_LOGRANGE(leaf1, entry1, sizeof(*entry1)));
2733 if (args->rmtblkno) {
2734 ASSERT((entry1->flags & XFS_ATTR_LOCAL) == 0);
2735		name_rmt = xfs_attr_leaf_name_remote(leaf1, args->index);
2736		name_rmt->valueblk = cpu_to_be32(args->rmtblkno);
2737		name_rmt->valuelen = cpu_to_be32(args->valuelen);
2738		xfs_trans_log_buf(args->trans, bp1,
2739 XFS_DA_LOGRANGE(leaf1, name_rmt, sizeof(*name_rmt)));
2740 }
2741
2742 entry2->flags |= XFS_ATTR_INCOMPLETE;
2743	xfs_trans_log_buf(args->trans, bp2,
2744 XFS_DA_LOGRANGE(leaf2, entry2, sizeof(*entry2)));
2745 if ((entry2->flags & XFS_ATTR_LOCAL) == 0) {
2746		name_rmt = xfs_attr_leaf_name_remote(leaf2, args->index2);
2747 name_rmt->valueblk = 0;
2748 name_rmt->valuelen = 0;
1d9025e5 2749 xfs_trans_log_buf(args->trans, bp2,
1da177e4
LT
2750 XFS_DA_LOGRANGE(leaf2, name_rmt, sizeof(*name_rmt)));
2751 }
1da177e4
LT
2752
2753 /*
2754 * Commit the flag value change and start the next trans in series.
2755 */
2756	error = xfs_trans_roll(&args->trans, args->dp);
2757
2758 return(error);
2759}
2760
2761/*========================================================================
2762 * Indiscriminately delete the entire attribute fork
2763 *========================================================================*/
2764
2765/*
2766 * Recurse (gasp!) through the attribute nodes until we find leaves.
2767 * We're doing a depth-first traversal in order to invalidate everything.
2768 */
2769int
2770xfs_attr_root_inactive(xfs_trans_t **trans, xfs_inode_t *dp)
2771{
2772 xfs_da_blkinfo_t *info;
2773 xfs_daddr_t blkno;
2774	struct xfs_buf *bp;
2775 int error;
2776
2777 /*
2778 * Read block 0 to see what we have to work with.
2779 * We only get here if we have extents, since we remove
2780 * the extents in reverse order the extent containing
2781 * block 0 must still be there.
2782 */
2783	error = xfs_da_node_read(*trans, dp, 0, -1, &bp, XFS_ATTR_FORK);
2784 if (error)
2785 return(error);
2786	blkno = XFS_BUF_ADDR(bp);
2787
2788 /*
2789 * Invalidate the tree, even if the "tree" is only a single leaf block.
2790 * This is a depth-first traversal!
2791 */
2792	info = bp->b_addr;
2793	if (info->magic == cpu_to_be16(XFS_DA_NODE_MAGIC)) {
2794		error = xfs_attr_node_inactive(trans, dp, bp, 1);
2795	} else if (info->magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC)) {
2796 error = xfs_attr_leaf_inactive(trans, dp, bp);
2797 } else {
2798 error = XFS_ERROR(EIO);
2799		xfs_trans_brelse(*trans, bp);
2800 }
2801 if (error)
2802 return(error);
2803
2804 /*
2805 * Invalidate the incore copy of the root block.
2806 */
2807 error = xfs_da_get_buf(*trans, dp, 0, blkno, &bp, XFS_ATTR_FORK);
2808 if (error)
2809 return(error);
2810	xfs_trans_binval(*trans, bp);	/* remove from cache */
2811 /*
2812 * Commit the invalidate and start the next transaction.
2813 */
2814	error = xfs_trans_roll(trans, dp);
2815
2816 return (error);
2817}
2818
2819/*
2820 * Recurse (gasp!) through the attribute nodes until we find leaves.
2821 * We're doing a depth-first traversal in order to invalidate everything.
2822 */
2823STATIC int
2824xfs_attr_node_inactive(
2825 struct xfs_trans **trans,
2826 struct xfs_inode *dp,
2827 struct xfs_buf *bp,
2828 int level)
1da177e4
LT
2829{
2830 xfs_da_blkinfo_t *info;
2831 xfs_da_intnode_t *node;
2832 xfs_dablk_t child_fsb;
2833 xfs_daddr_t parent_blkno, child_blkno;
2834 int error, count, i;
2835	struct xfs_buf *child_bp;
2836
2837 /*
2838 * Since this code is recursive (gasp!) we must protect ourselves.
2839 */
2840 if (level > XFS_DA_NODE_MAXDEPTH) {
2841		xfs_trans_brelse(*trans, bp);	/* no locks for later trans */
2842 return(XFS_ERROR(EIO));
2843 }
2844
2845	node = bp->b_addr;
2846	ASSERT(node->hdr.info.magic == cpu_to_be16(XFS_DA_NODE_MAGIC));
2847	parent_blkno = XFS_BUF_ADDR(bp);	/* save for re-read later */
2848	count = be16_to_cpu(node->hdr.count);
2849	if (!count) {
2850		xfs_trans_brelse(*trans, bp);
2851		return(0);
2852	}
2853	child_fsb = be32_to_cpu(node->btree[0].before);
2854	xfs_trans_brelse(*trans, bp);	/* no locks for later trans */
2855
2856 /*
2857 * If this is the node level just above the leaves, simply loop
2858 * over the leaves removing all of them. If this is higher up
2859 * in the tree, recurse downward.
2860 */
2861 for (i = 0; i < count; i++) {
2862 /*
2863 * Read the subsidiary block to see what we have to work with.
2864 * Don't do this in a transaction. This is a depth-first
2865 * traversal of the tree so we may deal with many blocks
2866 * before we come back to this one.
2867 */
2868 error = xfs_da_node_read(*trans, dp, child_fsb, -2, &child_bp,
2869 XFS_ATTR_FORK);
2870 if (error)
2871 return(error);
2872 if (child_bp) {
2873 /* save for re-read later */
2874			child_blkno = XFS_BUF_ADDR(child_bp);
2875
2876 /*
2877 * Invalidate the subtree, however we have to.
2878 */
2879			info = child_bp->b_addr;
2880			if (info->magic == cpu_to_be16(XFS_DA_NODE_MAGIC)) {
2881 error = xfs_attr_node_inactive(trans, dp,
2882 child_bp, level+1);
2883			} else if (info->magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC)) {
2884 error = xfs_attr_leaf_inactive(trans, dp,
2885 child_bp);
2886 } else {
2887 error = XFS_ERROR(EIO);
2888				xfs_trans_brelse(*trans, child_bp);
2889 }
2890 if (error)
2891 return(error);
2892
2893 /*
2894 * Remove the subsidiary block from the cache
2895 * and from the log.
2896 */
2897 error = xfs_da_get_buf(*trans, dp, 0, child_blkno,
2898 &child_bp, XFS_ATTR_FORK);
2899 if (error)
2900 return(error);
2901			xfs_trans_binval(*trans, child_bp);
2902 }
2903
2904 /*
2905 * If we're not done, re-read the parent to get the next
2906 * child block number.
2907 */
2908 if ((i+1) < count) {
2909 error = xfs_da_node_read(*trans, dp, 0, parent_blkno,
2910 &bp, XFS_ATTR_FORK);
2911 if (error)
2912 return(error);
2913			child_fsb = be32_to_cpu(node->btree[i+1].before);
2914			xfs_trans_brelse(*trans, bp);
2915 }
2916 /*
2917 * Atomically commit the whole invalidate stuff.
2918 */
2919 error = xfs_trans_roll(trans, dp);
2920 if (error)
2921 return (error);
2922 }
2923
2924 return(0);
2925}
2926
2927/*
2928 * Invalidate all of the "remote" value regions pointed to by a particular
2929 * leaf block.
2930 * Note that we must release the lock on the buffer so that we are not
2931 * caught holding something that the logging code wants to flush to disk.
2932 */
2933STATIC int
2934xfs_attr_leaf_inactive(
2935 struct xfs_trans **trans,
2936 struct xfs_inode *dp,
2937 struct xfs_buf *bp)
2938{
2939 xfs_attr_leafblock_t *leaf;
2940 xfs_attr_leaf_entry_t *entry;
2941 xfs_attr_leaf_name_remote_t *name_rmt;
2942 xfs_attr_inactive_list_t *list, *lp;
2943 int error, count, size, tmp, i;
2944
2945	leaf = bp->b_addr;
2946	ASSERT(leaf->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC));
2947
2948 /*
2949 * Count the number of "remote" value extents.
2950 */
2951 count = 0;
2952 entry = &leaf->entries[0];
2953	for (i = 0; i < be16_to_cpu(leaf->hdr.count); entry++, i++) {
2954 if (be16_to_cpu(entry->nameidx) &&
2955 ((entry->flags & XFS_ATTR_LOCAL) == 0)) {
2956			name_rmt = xfs_attr_leaf_name_remote(leaf, i);
2957 if (name_rmt->valueblk)
2958 count++;
2959 }
2960 }
2961
2962 /*
2963 * If there are no "remote" values, we're done.
2964 */
2965 if (count == 0) {
2966		xfs_trans_brelse(*trans, bp);
2967 return(0);
2968 }
2969
2970 /*
2971 * Allocate storage for a list of all the "remote" value extents.
2972 */
2973 size = count * sizeof(xfs_attr_inactive_list_t);
2974 list = (xfs_attr_inactive_list_t *)kmem_alloc(size, KM_SLEEP);
2975
2976 /*
2977 * Identify each of the "remote" value extents.
2978 */
2979 lp = list;
2980 entry = &leaf->entries[0];
2981	for (i = 0; i < be16_to_cpu(leaf->hdr.count); entry++, i++) {
2982 if (be16_to_cpu(entry->nameidx) &&
2983 ((entry->flags & XFS_ATTR_LOCAL) == 0)) {
2984			name_rmt = xfs_attr_leaf_name_remote(leaf, i);
2985			if (name_rmt->valueblk) {
2986				lp->valueblk = be32_to_cpu(name_rmt->valueblk);
2987				lp->valuelen = XFS_B_TO_FSB(dp->i_mount,
2988						    be32_to_cpu(name_rmt->valuelen));
2989 lp++;
2990 }
2991 }
2992 }
2993	xfs_trans_brelse(*trans, bp);	/* unlock for trans. in freextent() */
2994
2995 /*
2996 * Invalidate each of the "remote" value extents.
2997 */
2998 error = 0;
2999 for (lp = list, i = 0; i < count; i++, lp++) {
3000 tmp = xfs_attr_leaf_freextent(trans, dp,
3001 lp->valueblk, lp->valuelen);
3002
3003 if (error == 0)
3004 error = tmp; /* save only the 1st errno */
3005 }
3006
3007	kmem_free((xfs_caddr_t)list);
3008 return(error);
3009}
3010
3011/*
3012 * Look at all the extents for this logical region,
3013 * invalidate any buffers that are incore/in transactions.
3014 */
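/*
 * The point of the invalidation: these blocks are about to be freed, so
 * any copies still sitting in the buffer cache (or held in a
 * transaction) must be invalidated here; otherwise a later flush could
 * write stale attribute data over blocks that have since been reused.
 */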
3015STATIC int
3016xfs_attr_leaf_freextent(xfs_trans_t **trans, xfs_inode_t *dp,
3017 xfs_dablk_t blkno, int blkcnt)
3018{
3019 xfs_bmbt_irec_t map;
3020 xfs_dablk_t tblkno;
3021 int tblkcnt, dblkcnt, nmap, error;
3022 xfs_daddr_t dblkno;
3023 xfs_buf_t *bp;
3024
3025 /*
3026 * Roll through the "value", invalidating the attribute value's
3027 * blocks.
3028 */
3029 tblkno = blkno;
3030 tblkcnt = blkcnt;
3031 while (tblkcnt > 0) {
3032 /*
3033 * Try to remember where we decided to put the value.
3034 */
3035 nmap = 1;
3036 error = xfs_bmapi_read(dp, (xfs_fileoff_t)tblkno, tblkcnt,
3037 &map, &nmap, XFS_BMAPI_ATTRFORK);
3038 if (error) {
3039 return(error);
3040 }
3041 ASSERT(nmap == 1);
3042 ASSERT(map.br_startblock != DELAYSTARTBLOCK);
3043
3044 /*
3045 * If it's a hole, these are already unmapped
3046 * so there's nothing to invalidate.
3047 */
3048 if (map.br_startblock != HOLESTARTBLOCK) {
3049
3050 dblkno = XFS_FSB_TO_DADDR(dp->i_mount,
3051 map.br_startblock);
3052 dblkcnt = XFS_FSB_TO_BB(dp->i_mount,
3053 map.br_blockcount);
3054 bp = xfs_trans_get_buf(*trans,
3055 dp->i_mount->m_ddev_targp,
3056					dblkno, dblkcnt, 0);
3057			if (!bp)
3058				return ENOMEM;
3059 xfs_trans_binval(*trans, bp);
3060 /*
3061 * Roll to next transaction.
3062 */
3063 error = xfs_trans_roll(trans, dp);
3064 if (error)
3065 return (error);
3066 }
3067
3068 tblkno += map.br_blockcount;
3069 tblkcnt -= map.br_blockcount;
3070 }
3071
3072 return(0);
3073}