~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

TOMOYO Linux Cross Reference
Linux/fs/xfs/libxfs/xfs_da_format.h

Version: ~ [ linux-6.11.5 ] ~ [ linux-6.10.14 ] ~ [ linux-6.9.12 ] ~ [ linux-6.8.12 ] ~ [ linux-6.7.12 ] ~ [ linux-6.6.58 ] ~ [ linux-6.5.13 ] ~ [ linux-6.4.16 ] ~ [ linux-6.3.13 ] ~ [ linux-6.2.16 ] ~ [ linux-6.1.114 ] ~ [ linux-6.0.19 ] ~ [ linux-5.19.17 ] ~ [ linux-5.18.19 ] ~ [ linux-5.17.15 ] ~ [ linux-5.16.20 ] ~ [ linux-5.15.169 ] ~ [ linux-5.14.21 ] ~ [ linux-5.13.19 ] ~ [ linux-5.12.19 ] ~ [ linux-5.11.22 ] ~ [ linux-5.10.228 ] ~ [ linux-5.9.16 ] ~ [ linux-5.8.18 ] ~ [ linux-5.7.19 ] ~ [ linux-5.6.19 ] ~ [ linux-5.5.19 ] ~ [ linux-5.4.284 ] ~ [ linux-5.3.18 ] ~ [ linux-5.2.21 ] ~ [ linux-5.1.21 ] ~ [ linux-5.0.21 ] ~ [ linux-4.20.17 ] ~ [ linux-4.19.322 ] ~ [ linux-4.18.20 ] ~ [ linux-4.17.19 ] ~ [ linux-4.16.18 ] ~ [ linux-4.15.18 ] ~ [ linux-4.14.336 ] ~ [ linux-4.13.16 ] ~ [ linux-4.12.14 ] ~ [ linux-4.11.12 ] ~ [ linux-4.10.17 ] ~ [ linux-4.9.337 ] ~ [ linux-4.4.302 ] ~ [ linux-3.10.108 ] ~ [ linux-2.6.32.71 ] ~ [ linux-2.6.0 ] ~ [ linux-2.4.37.11 ] ~ [ unix-v6-master ] ~ [ ccs-tools-1.8.9 ] ~ [ policy-sample ] ~
Architecture: ~ [ i386 ] ~ [ alpha ] ~ [ m68k ] ~ [ mips ] ~ [ ppc ] ~ [ sparc ] ~ [ sparc64 ] ~

  1 /* SPDX-License-Identifier: GPL-2.0 */
  2 /*
  3  * Copyright (c) 2000-2001,2005 Silicon Graphics, Inc.
  4  * Copyright (c) 2013 Red Hat, Inc.
  5  * All Rights Reserved.
  6  */
  7 #ifndef __XFS_DA_FORMAT_H__
  8 #define __XFS_DA_FORMAT_H__
  9 
 10 /*
 11  * This structure is common to both leaf nodes and non-leaf nodes in the Btree.
 12  *
 13  * It is used to manage a doubly linked list of all blocks at the same
 14  * level in the Btree, and to identify which type of block this is.
 15  */
 16 #define XFS_DA_NODE_MAGIC       0xfebe  /* magic number: non-leaf blocks */
 17 #define XFS_ATTR_LEAF_MAGIC     0xfbee  /* magic number: attribute leaf blks */
 18 #define XFS_DIR2_LEAF1_MAGIC    0xd2f1  /* magic number: v2 dirlf single blks */
 19 #define XFS_DIR2_LEAFN_MAGIC    0xd2ff  /* magic number: v2 dirlf multi blks */
 20 
 21 typedef struct xfs_da_blkinfo {
 22         __be32          forw;                   /* previous block in list */
 23         __be32          back;                   /* following block in list */
 24         __be16          magic;                  /* validity check on block */
 25         __be16          pad;                    /* unused */
 26 } xfs_da_blkinfo_t;
 27 
 28 /*
 29  * CRC enabled directory structure types
 30  *
 31  * The headers change size for the additional verification information, but
 32  * otherwise the tree layouts and contents are unchanged. Hence the da btree
 33  * code can use the struct xfs_da_blkinfo for manipulating the tree links and
 34  * magic numbers without modification for both v2 and v3 nodes.
 35  */
 36 #define XFS_DA3_NODE_MAGIC      0x3ebe  /* magic number: non-leaf blocks */
 37 #define XFS_ATTR3_LEAF_MAGIC    0x3bee  /* magic number: attribute leaf blks */
 38 #define XFS_DIR3_LEAF1_MAGIC    0x3df1  /* magic number: v3 dirlf single blks */
 39 #define XFS_DIR3_LEAFN_MAGIC    0x3dff  /* magic number: v3 dirlf multi blks */
 40 
 41 struct xfs_da3_blkinfo {
 42         /*
 43          * the node link manipulation code relies on the fact that the first
 44          * element of this structure is the struct xfs_da_blkinfo so it can
 45          * ignore the differences in the rest of the structures.
 46          */
 47         struct xfs_da_blkinfo   hdr;
 48         __be32                  crc;    /* CRC of block */
 49         __be64                  blkno;  /* first block of the buffer */
 50         __be64                  lsn;    /* sequence number of last write */
 51         uuid_t                  uuid;   /* filesystem we belong to */
 52         __be64                  owner;  /* inode that owns the block */
 53 };
 54 
 55 /*
 56  * This is the structure of the root and intermediate nodes in the Btree.
 57  * The leaf nodes are defined above.
 58  *
 59  * Entries are not packed.
 60  *
 61  * Since we have duplicate keys, use a binary search but always follow
 62  * all match in the block, not just the first match found.
 63  */
 64 #define XFS_DA_NODE_MAXDEPTH    5       /* max depth of Btree */
 65 
 66 typedef struct xfs_da_node_hdr {
 67         struct xfs_da_blkinfo   info;   /* block type, links, etc. */
 68         __be16                  __count; /* count of active entries */
 69         __be16                  __level; /* level above leaves (leaf == 0) */
 70 } xfs_da_node_hdr_t;
 71 
 72 struct xfs_da3_node_hdr {
 73         struct xfs_da3_blkinfo  info;   /* block type, links, etc. */
 74         __be16                  __count; /* count of active entries */
 75         __be16                  __level; /* level above leaves (leaf == 0) */
 76         __be32                  __pad32;
 77 };
 78 
 79 #define XFS_DA3_NODE_CRC_OFF    (offsetof(struct xfs_da3_node_hdr, info.crc))
 80 
 81 typedef struct xfs_da_node_entry {
 82         __be32  hashval;        /* hash value for this descendant */
 83         __be32  before;         /* Btree block before this key */
 84 } xfs_da_node_entry_t;
 85 
 86 typedef struct xfs_da_intnode {
 87         struct xfs_da_node_hdr  hdr;
 88         struct xfs_da_node_entry __btree[];
 89 } xfs_da_intnode_t;
 90 
 91 struct xfs_da3_intnode {
 92         struct xfs_da3_node_hdr hdr;
 93         struct xfs_da_node_entry __btree[];
 94 };
 95 
 96 /*
 97  * Directory version 2.
 98  *
 99  * There are 4 possible formats:
100  *  - shortform - embedded into the inode
101  *  - single block - data with embedded leaf at the end
102  *  - multiple data blocks, single leaf+freeindex block
103  *  - data blocks, node and leaf blocks (btree), freeindex blocks
104  *
105  * Note: many node blocks structures and constants are shared with the attr
106  * code and defined in xfs_da_btree.h.
107  */
108 
109 #define XFS_DIR2_BLOCK_MAGIC    0x58443242      /* XD2B: single block dirs */
110 #define XFS_DIR2_DATA_MAGIC     0x58443244      /* XD2D: multiblock dirs */
111 #define XFS_DIR2_FREE_MAGIC     0x58443246      /* XD2F: free index blocks */
112 
113 /*
114  * Directory Version 3 With CRCs.
115  *
116  * The tree formats are the same as for version 2 directories.  The difference
117  * is in the block header and dirent formats. In many cases the v3 structures
118  * use v2 definitions as they are no different and this makes code sharing much
119  * easier.
120  *
121  * Also, the xfs_dir3_*() functions handle both v2 and v3 formats - if the
122  * format is v2 then they switch to the existing v2 code, or the format is v3
123  * they implement the v3 functionality. This means the existing dir2 is a mix of
124  * xfs_dir2/xfs_dir3 calls and functions. The xfs_dir3 functions are called
125  * where there is a difference in the formats, otherwise the code is unchanged.
126  *
127  * Where it is possible, the code decides what to do based on the magic numbers
128  * in the blocks rather than feature bits in the superblock. This means the code
129  * is as independent of the external XFS code as possible as doesn't require
130  * passing struct xfs_mount pointers into places where it isn't really
131  * necessary.
132  *
133  * Version 3 includes:
134  *
135  *      - a larger block header for CRC and identification purposes and so the
136  *      offsets of all the structures inside the blocks are different.
137  *
138  *      - new magic numbers to be able to detect the v2/v3 types on the fly.
139  */
140 
141 #define XFS_DIR3_BLOCK_MAGIC    0x58444233      /* XDB3: single block dirs */
142 #define XFS_DIR3_DATA_MAGIC     0x58444433      /* XDD3: multiblock dirs */
143 #define XFS_DIR3_FREE_MAGIC     0x58444633      /* XDF3: free index blocks */
144 
145 /*
146  * Dirents in version 3 directories have a file type field. Additions to this
147  * list are an on-disk format change, requiring feature bits. Valid values
148  * are as follows:
149  */
150 #define XFS_DIR3_FT_UNKNOWN             0
151 #define XFS_DIR3_FT_REG_FILE            1
152 #define XFS_DIR3_FT_DIR                 2
153 #define XFS_DIR3_FT_CHRDEV              3
154 #define XFS_DIR3_FT_BLKDEV              4
155 #define XFS_DIR3_FT_FIFO                5
156 #define XFS_DIR3_FT_SOCK                6
157 #define XFS_DIR3_FT_SYMLINK             7
158 #define XFS_DIR3_FT_WHT                 8
159 
160 #define XFS_DIR3_FT_MAX                 9
161 
162 #define XFS_DIR3_FTYPE_STR \
163         { XFS_DIR3_FT_UNKNOWN,  "unknown" }, \
164         { XFS_DIR3_FT_REG_FILE, "file" }, \
165         { XFS_DIR3_FT_DIR,      "directory" }, \
166         { XFS_DIR3_FT_CHRDEV,   "char" }, \
167         { XFS_DIR3_FT_BLKDEV,   "block" }, \
168         { XFS_DIR3_FT_FIFO,     "fifo" }, \
169         { XFS_DIR3_FT_SOCK,     "sock" }, \
170         { XFS_DIR3_FT_SYMLINK,  "symlink" }, \
171         { XFS_DIR3_FT_WHT,      "whiteout" }
172 
173 /*
174  * Byte offset in data block and shortform entry.
175  */
176 typedef uint16_t        xfs_dir2_data_off_t;
177 #define NULLDATAOFF     0xffffU
178 typedef uint            xfs_dir2_data_aoff_t;   /* argument form */
179 
180 /*
181  * Offset in data space of a data entry.
182  */
183 typedef uint32_t        xfs_dir2_dataptr_t;
184 #define XFS_DIR2_MAX_DATAPTR    ((xfs_dir2_dataptr_t)0xffffffff)
185 #define XFS_DIR2_NULL_DATAPTR   ((xfs_dir2_dataptr_t)0)
186 
187 /*
188  * Byte offset in a directory.
189  */
190 typedef xfs_off_t       xfs_dir2_off_t;
191 
192 /*
193  * Directory block number (logical dirblk in file)
194  */
195 typedef uint32_t        xfs_dir2_db_t;
196 
197 #define XFS_INO32_SIZE  4
198 #define XFS_INO64_SIZE  8
199 #define XFS_INO64_DIFF  (XFS_INO64_SIZE - XFS_INO32_SIZE)
200 
201 #define XFS_DIR2_MAX_SHORT_INUM ((xfs_ino_t)0xffffffffULL)
202 
203 /*
204  * Directory layout when stored internal to an inode.
205  *
206  * Small directories are packed as tightly as possible so as to fit into the
207  * literal area of the inode.  These "shortform" directories consist of a
208  * single xfs_dir2_sf_hdr header followed by zero or more xfs_dir2_sf_entry
209  * structures.  Due the different inode number storage size and the variable
210  * length name field in the xfs_dir2_sf_entry all these structure are
211  * variable length, and the accessors in this file should be used to iterate
212  * over them.
213  */
214 typedef struct xfs_dir2_sf_hdr {
215         uint8_t                 count;          /* count of entries */
216         uint8_t                 i8count;        /* count of 8-byte inode #s */
217         uint8_t                 parent[8];      /* parent dir inode number */
218 } __packed xfs_dir2_sf_hdr_t;
219 
220 typedef struct xfs_dir2_sf_entry {
221         __u8                    namelen;        /* actual name length */
222         __u8                    offset[2];      /* saved offset */
223         __u8                    name[];         /* name, variable size */
224         /*
225          * A single byte containing the file type field follows the inode
226          * number for version 3 directory entries.
227          *
228          * A 64-bit or 32-bit inode number follows here, at a variable offset
229          * after the name.
230          */
231 } __packed xfs_dir2_sf_entry_t;
232 
233 static inline int xfs_dir2_sf_hdr_size(int i8count)
234 {
235         return sizeof(struct xfs_dir2_sf_hdr) -
236                 (i8count == 0) * XFS_INO64_DIFF;
237 }
238 
239 static inline xfs_dir2_data_aoff_t
240 xfs_dir2_sf_get_offset(xfs_dir2_sf_entry_t *sfep)
241 {
242         return get_unaligned_be16(sfep->offset);
243 }
244 
245 static inline void
246 xfs_dir2_sf_put_offset(xfs_dir2_sf_entry_t *sfep, xfs_dir2_data_aoff_t off)
247 {
248         put_unaligned_be16(off, sfep->offset);
249 }
250 
251 static inline struct xfs_dir2_sf_entry *
252 xfs_dir2_sf_firstentry(struct xfs_dir2_sf_hdr *hdr)
253 {
254         return (struct xfs_dir2_sf_entry *)
255                 ((char *)hdr + xfs_dir2_sf_hdr_size(hdr->i8count));
256 }
257 
258 /*
259  * Data block structures.
260  *
261  * A pure data block looks like the following drawing on disk:
262  *
263  *    +-------------------------------------------------+
264  *    | xfs_dir2_data_hdr_t                             |
265  *    +-------------------------------------------------+
266  *    | xfs_dir2_data_entry_t OR xfs_dir2_data_unused_t |
267  *    | xfs_dir2_data_entry_t OR xfs_dir2_data_unused_t |
268  *    | xfs_dir2_data_entry_t OR xfs_dir2_data_unused_t |
269  *    | ...                                             |
270  *    +-------------------------------------------------+
271  *    | unused space                                    |
272  *    +-------------------------------------------------+
273  *
274  * As all the entries are variable size structures the accessors below should
275  * be used to iterate over them.
276  *
277  * In addition to the pure data blocks for the data and node formats,
278  * most structures are also used for the combined data/freespace "block"
279  * format below.
280  */
281 
282 #define XFS_DIR2_DATA_ALIGN_LOG 3               /* i.e., 8 bytes */
283 #define XFS_DIR2_DATA_ALIGN     (1 << XFS_DIR2_DATA_ALIGN_LOG)
284 #define XFS_DIR2_DATA_FREE_TAG  0xffff
285 #define XFS_DIR2_DATA_FD_COUNT  3
286 
287 /*
288  * Directory address space divided into sections,
289  * spaces separated by 32GB.
290  */
291 #define XFS_DIR2_MAX_SPACES     3
292 #define XFS_DIR2_SPACE_SIZE     (1ULL << (32 + XFS_DIR2_DATA_ALIGN_LOG))
293 #define XFS_DIR2_DATA_SPACE     0
294 #define XFS_DIR2_DATA_OFFSET    (XFS_DIR2_DATA_SPACE * XFS_DIR2_SPACE_SIZE)
295 
296 /*
297  * Describe a free area in the data block.
298  *
299  * The freespace will be formatted as a xfs_dir2_data_unused_t.
300  */
301 typedef struct xfs_dir2_data_free {
302         __be16                  offset;         /* start of freespace */
303         __be16                  length;         /* length of freespace */
304 } xfs_dir2_data_free_t;
305 
306 /*
307  * Header for the data blocks.
308  *
309  * The code knows that XFS_DIR2_DATA_FD_COUNT is 3.
310  */
311 typedef struct xfs_dir2_data_hdr {
312         __be32                  magic;          /* XFS_DIR2_DATA_MAGIC or */
313                                                 /* XFS_DIR2_BLOCK_MAGIC */
314         xfs_dir2_data_free_t    bestfree[XFS_DIR2_DATA_FD_COUNT];
315 } xfs_dir2_data_hdr_t;
316 
317 /*
318  * define a structure for all the verification fields we are adding to the
319  * directory block structures. This will be used in several structures.
320  * The magic number must be the first entry to align with all the dir2
321  * structures so we determine how to decode them just by the magic number.
322  */
323 struct xfs_dir3_blk_hdr {
324         __be32                  magic;  /* magic number */
325         __be32                  crc;    /* CRC of block */
326         __be64                  blkno;  /* first block of the buffer */
327         __be64                  lsn;    /* sequence number of last write */
328         uuid_t                  uuid;   /* filesystem we belong to */
329         __be64                  owner;  /* inode that owns the block */
330 };
331 
332 struct xfs_dir3_data_hdr {
333         struct xfs_dir3_blk_hdr hdr;
334         xfs_dir2_data_free_t    best_free[XFS_DIR2_DATA_FD_COUNT];
335         __be32                  pad;    /* 64 bit alignment */
336 };
337 
338 #define XFS_DIR3_DATA_CRC_OFF  offsetof(struct xfs_dir3_data_hdr, hdr.crc)
339 
340 /*
341  * Active entry in a data block.
342  *
343  * Aligned to 8 bytes.  After the variable length name field there is a
344  * 2 byte tag field, which can be accessed using xfs_dir3_data_entry_tag_p.
345  *
346  * For dir3 structures, there is file type field between the name and the tag.
347  * This can only be manipulated by helper functions. It is packed hard against
348  * the end of the name so any padding for rounding is between the file type and
349  * the tag.
350  */
351 typedef struct xfs_dir2_data_entry {
352         __be64                  inumber;        /* inode number */
353         __u8                    namelen;        /* name length */
354         __u8                    name[];         /* name bytes, no null */
355      /* __u8                    filetype; */    /* type of inode we point to */
356      /* __be16                  tag; */         /* starting offset of us */
357 } xfs_dir2_data_entry_t;
358 
359 /*
360  * Unused entry in a data block.
361  *
362  * Aligned to 8 bytes.  Tag appears as the last 2 bytes and must be accessed
363  * using xfs_dir2_data_unused_tag_p.
364  */
365 typedef struct xfs_dir2_data_unused {
366         __be16                  freetag;        /* XFS_DIR2_DATA_FREE_TAG */
367         __be16                  length;         /* total free length */
368                                                 /* variable offset */
369         __be16                  tag;            /* starting offset of us */
370 } xfs_dir2_data_unused_t;
371 
372 /*
373  * Pointer to a freespace's tag word.
374  */
375 static inline __be16 *
376 xfs_dir2_data_unused_tag_p(struct xfs_dir2_data_unused *dup)
377 {
378         return (__be16 *)((char *)dup +
379                         be16_to_cpu(dup->length) - sizeof(__be16));
380 }
381 
382 /*
383  * Leaf block structures.
384  *
385  * A pure leaf block looks like the following drawing on disk:
386  *
387  *    +---------------------------+
388  *    | xfs_dir2_leaf_hdr_t       |
389  *    +---------------------------+
390  *    | xfs_dir2_leaf_entry_t     |
391  *    | xfs_dir2_leaf_entry_t     |
392  *    | xfs_dir2_leaf_entry_t     |
393  *    | xfs_dir2_leaf_entry_t     |
394  *    | ...                       |
395  *    +---------------------------+
396  *    | xfs_dir2_data_off_t       |
397  *    | xfs_dir2_data_off_t       |
398  *    | xfs_dir2_data_off_t       |
399  *    | ...                       |
400  *    +---------------------------+
401  *    | xfs_dir2_leaf_tail_t      |
402  *    +---------------------------+
403  *
404  * The xfs_dir2_data_off_t members (bests) and tail are at the end of the block
405  * for single-leaf (magic = XFS_DIR2_LEAF1_MAGIC) blocks only, but not present
406  * for directories with separate leaf nodes and free space blocks
407  * (magic = XFS_DIR2_LEAFN_MAGIC).
408  *
409  * As all the entries are variable size structures the accessors below should
410  * be used to iterate over them.
411  */
412 
413 /*
414  * Offset of the leaf/node space.  First block in this space
415  * is the btree root.
416  */
417 #define XFS_DIR2_LEAF_SPACE     1
418 #define XFS_DIR2_LEAF_OFFSET    (XFS_DIR2_LEAF_SPACE * XFS_DIR2_SPACE_SIZE)
419 
420 /*
421  * Leaf block header.
422  */
423 typedef struct xfs_dir2_leaf_hdr {
424         xfs_da_blkinfo_t        info;           /* header for da routines */
425         __be16                  count;          /* count of entries */
426         __be16                  stale;          /* count of stale entries */
427 } xfs_dir2_leaf_hdr_t;
428 
429 struct xfs_dir3_leaf_hdr {
430         struct xfs_da3_blkinfo  info;           /* header for da routines */
431         __be16                  count;          /* count of entries */
432         __be16                  stale;          /* count of stale entries */
433         __be32                  pad;            /* 64 bit alignment */
434 };
435 
436 /*
437  * Leaf block entry.
438  */
439 typedef struct xfs_dir2_leaf_entry {
440         __be32                  hashval;        /* hash value of name */
441         __be32                  address;        /* address of data entry */
442 } xfs_dir2_leaf_entry_t;
443 
444 /*
445  * Leaf block tail.
446  */
447 typedef struct xfs_dir2_leaf_tail {
448         __be32                  bestcount;
449 } xfs_dir2_leaf_tail_t;
450 
451 /*
452  * Leaf block.
453  */
454 typedef struct xfs_dir2_leaf {
455         xfs_dir2_leaf_hdr_t     hdr;                    /* leaf header */
456         xfs_dir2_leaf_entry_t   __ents[];               /* entries */
457 } xfs_dir2_leaf_t;
458 
459 struct xfs_dir3_leaf {
460         struct xfs_dir3_leaf_hdr        hdr;            /* leaf header */
461         struct xfs_dir2_leaf_entry      __ents[];       /* entries */
462 };
463 
464 #define XFS_DIR3_LEAF_CRC_OFF  offsetof(struct xfs_dir3_leaf_hdr, info.crc)
465 
466 /*
467  * Get address of the bests array in the single-leaf block.
468  */
469 static inline __be16 *
470 xfs_dir2_leaf_bests_p(struct xfs_dir2_leaf_tail *ltp)
471 {
472         return (__be16 *)ltp - be32_to_cpu(ltp->bestcount);
473 }
474 
475 /*
476  * Free space block definitions for the node format.
477  */
478 
479 /*
480  * Offset of the freespace index.
481  */
482 #define XFS_DIR2_FREE_SPACE     2
483 #define XFS_DIR2_FREE_OFFSET    (XFS_DIR2_FREE_SPACE * XFS_DIR2_SPACE_SIZE)
484 
485 typedef struct xfs_dir2_free_hdr {
486         __be32                  magic;          /* XFS_DIR2_FREE_MAGIC */
487         __be32                  firstdb;        /* db of first entry */
488         __be32                  nvalid;         /* count of valid entries */
489         __be32                  nused;          /* count of used entries */
490 } xfs_dir2_free_hdr_t;
491 
492 typedef struct xfs_dir2_free {
493         xfs_dir2_free_hdr_t     hdr;            /* block header */
494         __be16                  bests[];        /* best free counts */
495                                                 /* unused entries are -1 */
496 } xfs_dir2_free_t;
497 
498 struct xfs_dir3_free_hdr {
499         struct xfs_dir3_blk_hdr hdr;
500         __be32                  firstdb;        /* db of first entry */
501         __be32                  nvalid;         /* count of valid entries */
502         __be32                  nused;          /* count of used entries */
503         __be32                  pad;            /* 64 bit alignment */
504 };
505 
506 struct xfs_dir3_free {
507         struct xfs_dir3_free_hdr hdr;
508         __be16                  bests[];        /* best free counts */
509                                                 /* unused entries are -1 */
510 };
511 
512 #define XFS_DIR3_FREE_CRC_OFF  offsetof(struct xfs_dir3_free, hdr.hdr.crc)
513 
514 /*
515  * Single block format.
516  *
517  * The single block format looks like the following drawing on disk:
518  *
519  *    +-------------------------------------------------+
520  *    | xfs_dir2_data_hdr_t                             |
521  *    +-------------------------------------------------+
522  *    | xfs_dir2_data_entry_t OR xfs_dir2_data_unused_t |
523  *    | xfs_dir2_data_entry_t OR xfs_dir2_data_unused_t |
524  *    | xfs_dir2_data_entry_t OR xfs_dir2_data_unused_t :
525  *    | ...                                             |
526  *    +-------------------------------------------------+
527  *    | unused space                                    |
528  *    +-------------------------------------------------+
529  *    | ...                                             |
530  *    | xfs_dir2_leaf_entry_t                           |
531  *    | xfs_dir2_leaf_entry_t                           |
532  *    +-------------------------------------------------+
533  *    | xfs_dir2_block_tail_t                           |
534  *    +-------------------------------------------------+
535  *
536  * As all the entries are variable size structures the accessors below should
537  * be used to iterate over them.
538  */
539 
540 typedef struct xfs_dir2_block_tail {
541         __be32          count;                  /* count of leaf entries */
542         __be32          stale;                  /* count of stale lf entries */
543 } xfs_dir2_block_tail_t;
544 
545 /*
546  * Pointer to the leaf entries embedded in a data block (1-block format)
547  */
548 static inline struct xfs_dir2_leaf_entry *
549 xfs_dir2_block_leaf_p(struct xfs_dir2_block_tail *btp)
550 {
551         return ((struct xfs_dir2_leaf_entry *)btp) - be32_to_cpu(btp->count);
552 }
553 
554 
555 /*
556  * Attribute storage layout
557  *
558  * Attribute lists are structured around Btrees where all the data
559  * elements are in the leaf nodes.  Attribute names are hashed into an int,
560  * then that int is used as the index into the Btree.  Since the hashval
561  * of an attribute name may not be unique, we may have duplicate keys.  The
562  * internal links in the Btree are logical block offsets into the file.
563  *
564  * Struct leaf_entry's are packed from the top.  Name/values grow from the
565  * bottom but are not packed.  The freemap contains run-length-encoded entries
566  * for the free bytes after the leaf_entry's, but only the N largest such,
567  * smaller runs are dropped.  When the freemap doesn't show enough space
568  * for an allocation, we compact the name/value area and try again.  If we
569  * still don't have enough space, then we have to split the block.  The
570  * name/value structs (both local and remote versions) must be 32bit aligned.
571  *
572  * Since we have duplicate hash keys, for each key that matches, compare
573  * the actual name string.  The root and intermediate node search always
574  * takes the first-in-the-block key match found, so we should only have
575  * to work "forw"ard.  If none matches, continue with the "forw"ard leaf
576  * nodes until the hash key changes or the attribute name is found.
577  *
578  * We store the fact that an attribute is a ROOT/USER/SECURE attribute in
579  * the leaf_entry.  The namespaces are independent only because we also look
580  * at the namespace bit when we are looking for a matching attribute name.
581  *
582  * We also store an "incomplete" bit in the leaf_entry.  It shows that an
583  * attribute is in the middle of being created and should not be shown to
584  * the user if we crash during the time that the bit is set.  We clear the
585  * bit when we have finished setting up the attribute.  We do this because
586  * we cannot create some large attributes inside a single transaction, and we
587  * need some indication that we weren't finished if we crash in the middle.
588  */
589 #define XFS_ATTR_LEAF_MAPSIZE   3       /* how many freespace slots */
590 
591 /*
592  * Attribute storage when stored inside the inode.
593  *
594  * Small attribute lists are packed as tightly as possible so as to fit into the
595  * literal area of the inode.
596  *
597  * These "shortform" attribute forks consist of a single xfs_attr_sf_hdr header
598  * followed by zero or more xfs_attr_sf_entry structures.
599  */
600 struct xfs_attr_sf_hdr {        /* constant-structure header block */
601         __be16  totsize;        /* total bytes in shortform list */
602         __u8    count;          /* count of active entries */
603         __u8    padding;
604 };
605 
606 struct xfs_attr_sf_entry {
607         __u8    namelen;        /* actual length of name (no NULL) */
608         __u8    valuelen;       /* actual length of value (no NULL) */
609         __u8    flags;          /* flags bits (XFS_ATTR_*) */
610         __u8    nameval[];      /* name & value bytes concatenated */
611 };
612 
613 typedef struct xfs_attr_leaf_map {      /* RLE map of free bytes */
614         __be16  base;                     /* base of free region */
615         __be16  size;                     /* length of free region */
616 } xfs_attr_leaf_map_t;
617 
618 typedef struct xfs_attr_leaf_hdr {      /* constant-structure header block */
619         xfs_da_blkinfo_t info;          /* block type, links, etc. */
620         __be16  count;                  /* count of active leaf_entry's */
621         __be16  usedbytes;              /* num bytes of names/values stored */
622         __be16  firstused;              /* first used byte in name area */
623         __u8    holes;                  /* != 0 if blk needs compaction */
624         __u8    pad1;
625         xfs_attr_leaf_map_t freemap[XFS_ATTR_LEAF_MAPSIZE];
626                                         /* N largest free regions */
627 } xfs_attr_leaf_hdr_t;
628 
629 typedef struct xfs_attr_leaf_entry {    /* sorted on key, not name */
630         __be32  hashval;                /* hash value of name */
631         __be16  nameidx;                /* index into buffer of name/value */
632         __u8    flags;                  /* LOCAL/ROOT/SECURE/INCOMPLETE flag */
633         __u8    pad2;                   /* unused pad byte */
634 } xfs_attr_leaf_entry_t;
635 
636 typedef struct xfs_attr_leaf_name_local {
637         __be16  valuelen;               /* number of bytes in value */
638         __u8    namelen;                /* length of name bytes */
639         /*
640          * In Linux 6.5 this flex array was converted from nameval[1] to
641          * nameval[].  Be very careful here about extra padding at the end;
642          * see xfs_attr_leaf_entsize_local() for details.
643          */
644         __u8    nameval[];              /* name/value bytes */
645 } xfs_attr_leaf_name_local_t;
646 
647 typedef struct xfs_attr_leaf_name_remote {
648         __be32  valueblk;               /* block number of value bytes */
649         __be32  valuelen;               /* number of bytes in value */
650         __u8    namelen;                /* length of name bytes */
651         /*
652          * In Linux 6.5 this flex array was converted from name[1] to name[].
653          * Be very careful here about extra padding at the end; see
654          * xfs_attr_leaf_entsize_remote() for details.
655          */
656         __u8    name[];                 /* name bytes */
657 } xfs_attr_leaf_name_remote_t;
658 
659 typedef struct xfs_attr_leafblock {
660         xfs_attr_leaf_hdr_t     hdr;    /* constant-structure header block */
661         xfs_attr_leaf_entry_t   entries[];      /* sorted on key, not name */
662         /*
663          * The rest of the block contains the following structures after the
664          * leaf entries, growing from the bottom up. The variables are never
665          * referenced and definining them can actually make gcc optimize away
666          * accesses to the 'entries' array above index 0 so don't do that.
667          *
668          * xfs_attr_leaf_name_local_t namelist;
669          * xfs_attr_leaf_name_remote_t valuelist;
670          */
671 } xfs_attr_leafblock_t;
672 
673 /*
674  * CRC enabled leaf structures. Called "version 3" structures to match the
675  * version number of the directory and dablk structures for this feature, and
676  * attr2 is already taken by the variable inode attribute fork size feature.
677  */
678 struct xfs_attr3_leaf_hdr {
679         struct xfs_da3_blkinfo  info;
680         __be16                  count;
681         __be16                  usedbytes;
682         __be16                  firstused;
683         __u8                    holes;
684         __u8                    pad1;
685         struct xfs_attr_leaf_map freemap[XFS_ATTR_LEAF_MAPSIZE];
686         __be32                  pad2;           /* 64 bit alignment */
687 };
688 
689 #define XFS_ATTR3_LEAF_CRC_OFF  (offsetof(struct xfs_attr3_leaf_hdr, info.crc))
690 
691 struct xfs_attr3_leafblock {
692         struct xfs_attr3_leaf_hdr       hdr;
693         struct xfs_attr_leaf_entry      entries[];
694 
695         /*
696          * The rest of the block contains the following structures after the
697          * leaf entries, growing from the bottom up. The variables are never
698          * referenced, the locations accessed purely from helper functions.
699          *
700          * struct xfs_attr_leaf_name_local
701          * struct xfs_attr_leaf_name_remote
702          */
703 };
704 
705 /*
706  * Special value to represent fs block size in the leaf header firstused field.
707  * Only used when block size overflows the 2-bytes available on disk.
708  */
709 #define XFS_ATTR3_LEAF_NULLOFF  0
710 
711 /*
712  * Flags used in the leaf_entry[i].flags field.
713  */
714 #define XFS_ATTR_LOCAL_BIT      0       /* attr is stored locally */
715 #define XFS_ATTR_ROOT_BIT       1       /* limit access to trusted attrs */
716 #define XFS_ATTR_SECURE_BIT     2       /* limit access to secure attrs */
717 #define XFS_ATTR_PARENT_BIT     3       /* parent pointer attrs */
718 #define XFS_ATTR_INCOMPLETE_BIT 7       /* attr in middle of create/delete */
719 #define XFS_ATTR_LOCAL          (1u << XFS_ATTR_LOCAL_BIT)
720 #define XFS_ATTR_ROOT           (1u << XFS_ATTR_ROOT_BIT)
721 #define XFS_ATTR_SECURE         (1u << XFS_ATTR_SECURE_BIT)
722 #define XFS_ATTR_PARENT         (1u << XFS_ATTR_PARENT_BIT)
723 #define XFS_ATTR_INCOMPLETE     (1u << XFS_ATTR_INCOMPLETE_BIT)
724 
725 #define XFS_ATTR_NSP_ONDISK_MASK        (XFS_ATTR_ROOT | \
726                                          XFS_ATTR_SECURE | \
727                                          XFS_ATTR_PARENT)
728 
729 /* Private attr namespaces not exposed to userspace */
730 #define XFS_ATTR_PRIVATE_NSP_MASK       (XFS_ATTR_PARENT)
731 
732 #define XFS_ATTR_ONDISK_MASK    (XFS_ATTR_NSP_ONDISK_MASK | \
733                                  XFS_ATTR_LOCAL | \
734                                  XFS_ATTR_INCOMPLETE)
735 
736 #define XFS_ATTR_NAMESPACE_STR \
737         { XFS_ATTR_LOCAL,       "local" }, \
738         { XFS_ATTR_ROOT,        "root" }, \
739         { XFS_ATTR_SECURE,      "secure" }, \
740         { XFS_ATTR_PARENT,      "parent" }
741 
742 /*
743  * Alignment for namelist and valuelist entries (since they are mixed
744  * there can be only one alignment value)
745  */
746 #define XFS_ATTR_LEAF_NAME_ALIGN        ((uint)sizeof(xfs_dablk_t))
747 
748 static inline int
749 xfs_attr3_leaf_hdr_size(struct xfs_attr_leafblock *leafp)
750 {
751         if (leafp->hdr.info.magic == cpu_to_be16(XFS_ATTR3_LEAF_MAGIC))
752                 return sizeof(struct xfs_attr3_leaf_hdr);
753         return sizeof(struct xfs_attr_leaf_hdr);
754 }
755 
756 static inline struct xfs_attr_leaf_entry *
757 xfs_attr3_leaf_entryp(xfs_attr_leafblock_t *leafp)
758 {
759         if (leafp->hdr.info.magic == cpu_to_be16(XFS_ATTR3_LEAF_MAGIC))
760                 return &((struct xfs_attr3_leafblock *)leafp)->entries[0];
761         return &leafp->entries[0];
762 }
763 
764 /*
765  * Cast typed pointers for "local" and "remote" name/value structs.
766  */
767 static inline char *
768 xfs_attr3_leaf_name(xfs_attr_leafblock_t *leafp, int idx)
769 {
770         struct xfs_attr_leaf_entry *entries = xfs_attr3_leaf_entryp(leafp);
771 
772         return &((char *)leafp)[be16_to_cpu(entries[idx].nameidx)];
773 }
774 
775 static inline xfs_attr_leaf_name_remote_t *
776 xfs_attr3_leaf_name_remote(xfs_attr_leafblock_t *leafp, int idx)
777 {
778         return (xfs_attr_leaf_name_remote_t *)xfs_attr3_leaf_name(leafp, idx);
779 }
780 
781 static inline xfs_attr_leaf_name_local_t *
782 xfs_attr3_leaf_name_local(xfs_attr_leafblock_t *leafp, int idx)
783 {
784         return (xfs_attr_leaf_name_local_t *)xfs_attr3_leaf_name(leafp, idx);
785 }
786 
787 /*
788  * Calculate total bytes used (including trailing pad for alignment) for
789  * a "local" name/value structure, a "remote" name/value structure, and
790  * a pointer which might be either.
791  */
792 static inline int xfs_attr_leaf_entsize_remote(int nlen)
793 {
794         /*
795          * Prior to Linux 6.5, struct xfs_attr_leaf_name_remote ended with
796          * name[1], which was used as a flexarray.  The layout of this struct
797          * is 9 bytes of fixed-length fields followed by a __u8 flex array at
798          * offset 9.
799          *
800          * On most architectures, struct xfs_attr_leaf_name_remote had two
801          * bytes of implicit padding at the end of the struct to make the
802          * struct length 12.  After converting name[1] to name[], there are
803          * three implicit padding bytes and the struct size remains 12.
804          * However, there are compiler configurations that do not add implicit
805          * padding at all (m68k) and have been broken for years.
806          *
807          * This entsize computation historically added (the xattr name length)
808          * to (the padded struct length - 1) and rounded that sum up to the
809          * nearest multiple of 4 (NAME_ALIGN).  IOWs, round_up(11 + nlen, 4).
810          * This is encoded in the ondisk format, so we cannot change this.
811          *
812          * Compute the entsize from offsetof of the flexarray and manually
813          * adding bytes for the implicit padding.
814          */
815         const size_t remotesize =
816                         offsetof(struct xfs_attr_leaf_name_remote, name) + 2;
817 
818         return round_up(remotesize + nlen, XFS_ATTR_LEAF_NAME_ALIGN);
819 }
820 
821 static inline int xfs_attr_leaf_entsize_local(int nlen, int vlen)
822 {
823         /*
824          * Prior to Linux 6.5, struct xfs_attr_leaf_name_local ended with
825          * nameval[1], which was used as a flexarray.  The layout of this
826          * struct is 3 bytes of fixed-length fields followed by a __u8 flex
827          * array at offset 3.
828          *
829          * struct xfs_attr_leaf_name_local had zero bytes of implicit padding
830          * at the end of the struct to make the struct length 4.  On most
831          * architectures, after converting nameval[1] to nameval[], there is
832          * one implicit padding byte and the struct size remains 4.  However,
833          * there are compiler configurations that do not add implicit padding
834          * at all (m68k) and would break.
835          *
836          * This entsize computation historically added (the xattr name and
837          * value length) to (the padded struct length - 1) and rounded that sum
838          * up to the nearest multiple of 4 (NAME_ALIGN).  IOWs, the formula is
839          * round_up(3 + nlen + vlen, 4).  This is encoded in the ondisk format,
840          * so we cannot change this.
841          *
842          * Compute the entsize from offsetof of the flexarray and manually
843          * adding bytes for the implicit padding.
844          */
845         const size_t localsize =
846                         offsetof(struct xfs_attr_leaf_name_local, nameval);
847 
848         return round_up(localsize + nlen + vlen, XFS_ATTR_LEAF_NAME_ALIGN);
849 }
850 
851 static inline int xfs_attr_leaf_entsize_local_max(int bsize)
852 {
853         return (((bsize) >> 1) + ((bsize) >> 2));
854 }
855 
856 
857 
858 /*
859  * Remote attribute block format definition
860  *
861  * There is one of these headers per filesystem block in a remote attribute.
862  * This is done to ensure there is a 1:1 mapping between the attribute value
863  * length and the number of blocks needed to store the attribute. This makes the
864  * verification of a buffer a little more complex, but greatly simplifies the
865  * allocation, reading and writing of these attributes as we don't have to guess
866  * the number of blocks needed to store the attribute data.
867  */
868 #define XFS_ATTR3_RMT_MAGIC     0x5841524d      /* XARM */
869 
870 struct xfs_attr3_rmt_hdr {
871         __be32  rm_magic;
872         __be32  rm_offset;
873         __be32  rm_bytes;
874         __be32  rm_crc;
875         uuid_t  rm_uuid;
876         __be64  rm_owner;
877         __be64  rm_blkno;
878         __be64  rm_lsn;
879 };
880 
881 #define XFS_ATTR3_RMT_CRC_OFF   offsetof(struct xfs_attr3_rmt_hdr, rm_crc)
882 
883 unsigned int xfs_attr3_rmt_buf_space(struct xfs_mount *mp);
884 
885 /* Number of bytes in a directory block. */
886 static inline unsigned int xfs_dir2_dirblock_bytes(struct xfs_sb *sbp)
887 {
888         return 1 << (sbp->sb_blocklog + sbp->sb_dirblklog);
889 }
890 
891 xfs_failaddr_t xfs_da3_blkinfo_verify(struct xfs_buf *bp,
892                                       struct xfs_da3_blkinfo *hdr3);
893 
894 /*
895  * Parent pointer attribute format definition
896  *
897  * The xattr name contains the dirent name.
898  * The xattr value encodes the parent inode number and generation to ease
899  * opening parents by handle.
900  * The xattr hashval is xfs_dir2_namehash() ^ p_ino
901  */
902 struct xfs_parent_rec {
903         __be64  p_ino;
904         __be32  p_gen;
905 } __packed;
906 
907 #endif /* __XFS_DA_FORMAT_H__ */
908 

~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

kernel.org | git.kernel.org | LWN.net | Project Home | SVN repository | Mail admin

Linux® is a registered trademark of Linus Torvalds in the United States and other countries.
TOMOYO® is a registered trademark of NTT DATA CORPORATION.

sflogo.php