dirhash.h revision 262779
1/*-
2 * Copyright (c) 2001 Ian Dowse.  All rights reserved.
3 *
4 * Redistribution and use in source and binary forms, with or without
5 * modification, are permitted provided that the following conditions
6 * are met:
7 * 1. Redistributions of source code must retain the above copyright
8 *    notice, this list of conditions and the following disclaimer.
9 * 2. Redistributions in binary form must reproduce the above copyright
10 *    notice, this list of conditions and the following disclaimer in the
11 *    documentation and/or other materials provided with the distribution.
12 *
13 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
14 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
15 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
16 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
17 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
18 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
19 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
20 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
21 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
22 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
23 * SUCH DAMAGE.
24 *
25 * $FreeBSD: stable/10/sys/ufs/ufs/dirhash.h 262779 2014-03-05 04:23:19Z pfg $
26 */
27
28#ifndef _UFS_UFS_DIRHASH_H_
29#define	_UFS_UFS_DIRHASH_H_
30
31#include <sys/_lock.h>
32#include <sys/_sx.h>
33
34/*
35 * For fast operations on large directories, we maintain a hash
36 * that maps the file name to the offset of the directory entry within
37 * the directory file.
38 *
39 * The hashing uses a dumb spillover to the next free slot on
40 * collisions, so we must keep the utilisation low to avoid
41 * long linear searches. Deleted entries that are not the last
42 * in a chain must be marked DIRHASH_DEL.
43 *
44 * We also maintain information about free space in each block
45 * to speed up creations.
46 */
47#define	DIRHASH_EMPTY	(-1)	/* hash entry unused */
48#define	DIRHASH_DEL	(-2)	/* deleted entry; may be part of chain */
49
50#define	DIRALIGN	4	/* word size used as the free-space unit (presumably bytes) */
51#define	DH_NFSTATS	(DIRECTSIZ(MAXNAMLEN + 1) / DIRALIGN)
52				 /*
				  * max DIRALIGN words in a directory entry; also
				  * sizes dh_firstfree[] in struct dirhash.
				  * DIRECTSIZ and MAXNAMLEN are not defined in this
				  * header and must come from the includer.
				  */
53
54/*
55 * Dirhash uses a score mechanism to achieve a hybrid between a
56 * least-recently-used and a least-often-used algorithm for entry
57 * recycling. The score is incremented when a directory is used, and
58 * decremented when the directory is a candidate for recycling. When
59 * the score reaches zero, the hash is recycled. Hashes are linked
60 * together on a TAILQ list, and hashes with higher scores filter
61 * towards the tail (most recently used) end of the list.
62 *
63 * New hash entries are given an initial score of DH_SCOREINIT and are
64 * placed at the most-recently-used end of the list. This helps a lot
65 * in the worst-case scenario where every directory access is
66 * to a directory that is not hashed (i.e. the working set of hash
67 * candidates is much larger than the configured memory limit). In this
68 * case it limits the number of hash builds to 1/DH_SCOREINIT of the
69 * number of accesses.
70 */
71#define	DH_SCOREINIT	8	/* initial dh_score when dirhash built; 1/8 is the worst-case build ratio described above */
72#define	DH_SCOREMAX	64	/* max dh_score value */
73
74/*
75 * The main hash table has 2 levels. It is an array of pointers to
76 * blocks of DH_NBLKOFF offsets.
77 */
78#define	DH_BLKOFFSHIFT	8	/* log2 of the number of offsets per block */
79#define	DH_NBLKOFF	(1 << DH_BLKOFFSHIFT)	/* offsets per block (256) */
80#define	DH_BLKOFFMASK	(DH_NBLKOFF - 1)	/* low-bit mask: index within a block (0xff) */
81
/*
 * DH_ENTRY(dh, slot) names the hash element for `slot': the bits above
 * DH_BLKOFFSHIFT pick the block pointer in dh->dh_hash, and the low
 * DH_BLKOFFSHIFT bits pick the offset inside that block.
 *
 * The expansion is a plain subscript expression, so it can be both read
 * and assigned to.  `slot' is evaluated twice, so do not pass an
 * expression with side effects.  No bounds check is made here against
 * dh_hlen or dh_narrays.
 */
82#define	DH_ENTRY(dh, slot) \
83    ((dh)->dh_hash[(slot) >> DH_BLKOFFSHIFT][(slot) & DH_BLKOFFMASK])
84
/*
 * Per-directory hash state: the 2-level table of entry offsets, the
 * per-block free-space summary, and the bookkeeping used to recycle
 * hashes (score, list membership, last-use time).
 */
85struct dirhash {
86	struct sx dh_lock;	/* protects all fields except list & score */
87	int	dh_refcount;	/* reference count; NOTE(review): who holds references is not visible in this header */
88
89	doff_t	**dh_hash;	/* the hash array (2-level): pointers to blocks of DH_NBLKOFF offsets; index via DH_ENTRY() */
90	int	dh_narrays;	/* number of entries in dh_hash */
91	int	dh_hlen;	/* total slots in the 2-level hash array */
92	int	dh_hused;	/* entries in use */
93	int	dh_memreq;	/* Memory used. */
94
95	/*
	 * Free space statistics. XXX assumes DIRBLKSIZ is 512.
	 * Each dh_blkfree element is a u_int8_t, so a block's count of
	 * free DIRALIGN words has to fit in 8 bits; with DIRALIGN 4 and
	 * a 512-byte block the count is at most 128.
	 */
96	u_int8_t *dh_blkfree;	/* free DIRALIGN words in each dir block */
97	int	dh_nblk;	/* size of dh_blkfree array */
98	int	dh_dirblks;	/* number of DIRBLKSIZ blocks in dir */
99	int	dh_firstfree[DH_NFSTATS + 1]; /* first blk with N words free; N ranges over 0..DH_NFSTATS */
100
101	doff_t	dh_seqoff;	/* sequential access optimisation offset */
102
103	int	dh_score;	/* recycling score: raised on use, lowered when a recycle candidate */
104
105	int	dh_onlist;	/* true if on the ufsdirhash_list chain */
106
107	time_t	dh_lastused;	/* time the dirhash was last read or written */
108
109	/* Protected by ufsdirhash_mtx. */
110	TAILQ_ENTRY(dirhash) dh_list;	/* chain of all dirhashes */
111};
112
113
114/*
115 * Dirhash functions.
 *
 * Only the prototypes live in this header.  ufsdirhash_init() and
 * ufsdirhash_uninit() take no arguments; every other function takes a
 * struct inode * as its first parameter (presumably the directory's
 * inode -- confirm against the implementation).
 *
 * This header includes only <sys/_lock.h> and <sys/_sx.h>, so
 * struct inode, struct direct, struct buf and doff_t should already be
 * declared before it is included.
116 */
117void	ufsdirhash_init(void);
118void	ufsdirhash_uninit(void);
119int	ufsdirhash_build(struct inode *);
120doff_t	ufsdirhash_findfree(struct inode *, int, int *);
121doff_t	ufsdirhash_enduseful(struct inode *);
122int	ufsdirhash_lookup(struct inode *, char *, int, doff_t *, struct buf **,
123	    doff_t *);
124void	ufsdirhash_newblk(struct inode *, doff_t);
125void	ufsdirhash_add(struct inode *, struct direct *, doff_t);
126void	ufsdirhash_remove(struct inode *, struct direct *, doff_t);
127void	ufsdirhash_move(struct inode *, struct direct *, doff_t, doff_t);
128void	ufsdirhash_dirtrunc(struct inode *, doff_t);
129void	ufsdirhash_free(struct inode *);
130
131void	ufsdirhash_checkblock(struct inode *, char *, doff_t);
132
133#endif /* !_UFS_UFS_DIRHASH_H_ */
134