super.h 13 KB
Newer Older
J. R. Okajima's avatar
J. R. Okajima committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
/* SPDX-License-Identifier: GPL-2.0 */
/*
 * Copyright (C) 2005-2019 Junjiro R. Okajima
 */

/*
 * super_block operations
 */

#ifndef __AUFS_SUPER_H__
#define __AUFS_SUPER_H__

#ifdef __KERNEL__

J. R. Okajima's avatar
J. R. Okajima committed
15
16
#include <linux/fs.h>
#include <linux/kobject.h>
J. R. Okajima's avatar
J. R. Okajima committed
17
#include "hbl.h"
18
#include "lcnt.h"
J. R. Okajima's avatar
J. R. Okajima committed
19
#include "rwsem.h"
J. R. Okajima's avatar
J. R. Okajima committed
20
#include "wkq.h"
J. R. Okajima's avatar
J. R. Okajima committed
21

22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
/* policies to select one among multiple writable branches */
/*
 * Operations table for a copy-up policy. au_sbinfo::si_wbr_copyup_ops points
 * at one of these and AuWbrCopyup() calls through it.
 */
struct au_wbr_copyup_operations {
	/* policy hook; the return-value convention is not visible in this header */
	int (*copyup)(struct dentry *dentry);
};

/*
 * AuWbr_* flag bits.
 * NOTE(review): presumably the 'flags' argument of
 * au_wbr_create_operations::create() -- confirm against the callers.
 */
#define AuWbr_DIR	1		/* target is a dir */
#define AuWbr_PARENT	(1 << 1)	/* always require a parent */

/*
 * Test/set/clear a single AuWbr_<name> bit in the lvalue 'flags'.
 * The set/clear forms are wrapped in do { } while (0) so that each expands to
 * exactly one statement and stays correct inside an unbraced if/else, the
 * same way au_fset_lock()/au_fclr_lock() in this header are written.
 */
#define au_ftest_wbr(flags, name)	((flags) & AuWbr_##name)
#define au_fset_wbr(flags, name) \
	do { (flags) |= AuWbr_##name; } while (0)
#define au_fclr_wbr(flags, name) \
	do { (flags) &= ~AuWbr_##name; } while (0)

/*
 * Operations table for a create policy. au_sbinfo::si_wbr_create_ops points
 * at one of these; ->create() is called through AuWbrCreate().
 */
struct au_wbr_create_operations {
	/* policy hook; 'flags' presumably carries AuWbr_* bits -- TODO confirm */
	int (*create)(struct dentry *dentry, unsigned int flags);
	/*
	 * per-superblock hooks.
	 * NOTE(review): the names suggest setup/teardown of the policy; the
	 * callers are not visible in this header.
	 */
	int (*init)(struct super_block *sb);
	int (*fin)(struct super_block *sb);
};

40
41
42
43
44
45
46
47
48
49
/*
 * State of the "most free space" policy; embedded in au_sbinfo as
 * si_wbr_mfs.
 */
struct au_wbr_mfs {
	struct mutex	mfs_lock; /* protect this structure */
	/* NOTE(review): presumably a jiffies timestamp and its lifetime -- confirm */
	unsigned long	mfs_jiffy;
	unsigned long	mfs_expire;
	/* a branch index; presumably the branch currently selected -- confirm */
	aufs_bindex_t	mfs_bindex;

	/* NOTE(review): byte counters of the "mfsrr" variant; meaning not shown here */
	unsigned long long	mfsrr_bytes;
	unsigned long long	mfsrr_watermark;
};

50
51
52
53
54
55
/* number of buckets in au_sbinfo::si_plink[] */
#define AuPlink_NHASH 100

/* Map an inode number to its si_plink[] bucket, 0 .. AuPlink_NHASH - 1. */
static inline int au_plink_hash(ino_t ino)
{
	int bucket = ino % AuPlink_NHASH;

	return bucket;
}

J. R. Okajima's avatar
J. R. Okajima committed
56
57
struct au_branch;
struct au_sbinfo {
J. R. Okajima's avatar
J. R. Okajima committed
58
59
60
	/* nowait tasks in the system-wide workqueue */
	struct au_nowait_tasks	si_nowait;

J. R. Okajima's avatar
J. R. Okajima committed
61
62
63
64
65
66
	/*
	 * tried sb->s_umount, but failed due to the dependency between i_mutex.
	 * rwsem for au_sbinfo is necessary.
	 */
	struct au_rwsem		si_rwsem;

67
	/*
68
	 * dirty approach to protect sb->sb_inodes and ->s_files (gone) from
69
70
	 * remount.
	 */
71
	au_lcnt_t		si_ninodes, si_nfiles;
72

J. R. Okajima's avatar
J. R. Okajima committed
73
	/* branch management */
J. R. Okajima's avatar
J. R. Okajima committed
74
75
	unsigned int		si_generation;

76
77
78
	/* see AuSi_ flags */
	unsigned char		au_si_status;

J. R. Okajima's avatar
J. R. Okajima committed
79
	aufs_bindex_t		si_bbot;
80
81
82
83

	/* dirty trick to keep br_id plus */
	unsigned int		si_last_br_id :
				sizeof(aufs_bindex_t) * BITS_PER_BYTE - 1;
J. R. Okajima's avatar
J. R. Okajima committed
84
85
	struct au_branch	**si_branch;

86
87
88
89
90
91
	/* policy to select a writable branch */
	unsigned char		si_wbr_copyup;
	unsigned char		si_wbr_create;
	struct au_wbr_copyup_operations *si_wbr_copyup_ops;
	struct au_wbr_create_operations *si_wbr_create_ops;

92
93
94
95
96
97
	/* round robin */
	atomic_t		si_wbr_rr_next;

	/* most free space */
	struct au_wbr_mfs	si_wbr_mfs;

98
99
100
101
	/* mount flags */
	/* include/asm-ia64/siginfo.h defines a macro named si_flags */
	unsigned int		si_mntflags;

J. R. Okajima's avatar
J. R. Okajima committed
102
103
104
105
106
107
108
109
110
111
112
	/* external inode number (bitmap and translation table) */
	vfs_readf_t		si_xread;
	vfs_writef_t		si_xwrite;
	loff_t			si_ximaxent;	/* max entries in a xino */

	struct file		*si_xib;
	struct mutex		si_xib_mtx; /* protect xib members */
	unsigned long		*si_xib_buf;
	unsigned long		si_xib_last_pindex;
	int			si_xib_next_bit;

J. R. Okajima's avatar
J. R. Okajima committed
113
114
	unsigned long		si_xino_jiffy;
	unsigned long		si_xino_expire;
J. R. Okajima's avatar
J. R. Okajima committed
115
116
117
	/* reserved for future use */
	/* unsigned long long	si_xib_limit; */	/* Max xib file size */

J. R. Okajima's avatar
J. R. Okajima committed
118
119
120
121
122
123
124
#ifdef CONFIG_AUFS_EXPORT
	/* i_generation */
	/* todo: make xigen file an array to support many inode numbers */
	struct file		*si_xigen;
	atomic_t		si_xigen_next;
#endif

125
126
127
	/* dirty trick to support atomic_open */
	struct hlist_bl_head	si_aopen;

128
129
130
131
132
	/* vdir parameters */
	unsigned long		si_rdcache;	/* max cache time in jiffies */
	unsigned int		si_rdblk;	/* deblk size */
	unsigned int		si_rdhash;	/* hash size */

J. R. Okajima's avatar
J. R. Okajima committed
133
134
135
136
137
138
139
140
	/*
	 * If the number of whiteouts are larger than si_dirwh, leave all of
	 * them after au_whtmp_ren to reduce the cost of rmdir(2).
	 * future fsck.aufs or kernel thread will remove them later.
	 * Otherwise, remove all whiteouts and the dir in rmdir(2).
	 */
	unsigned int		si_dirwh;

141
142
143
144
145
146
	/* pseudo_link list */
	struct hlist_bl_head	si_plink[AuPlink_NHASH];
	wait_queue_head_t	si_plink_wq;
	spinlock_t		si_plink_maint_lock;
	pid_t			si_plink_maint_pid;

147
148
149
	/* file list */
	struct hlist_bl_head	si_files;

150
151
152
	/* with/without getattr, brother of sb->s_d_op */
	struct inode_operations *si_iop_array;

J. R. Okajima's avatar
J. R. Okajima committed
153
154
155
156
157
158
159
	/*
	 * sysfs and lifetime management.
	 * this is not a small structure and it may be a waste of memory in case
	 * of sysfs is disabled, particularly when many aufs-es are mounted.
	 * but using sysfs is majority.
	 */
	struct kobject		si_kobj;
J. R. Okajima's avatar
J. R. Okajima committed
160

J. R. Okajima's avatar
J. R. Okajima committed
161
162
163
164
#ifdef CONFIG_AUFS_SBILIST
	struct hlist_bl_node	si_list;
#endif

J. R. Okajima's avatar
J. R. Okajima committed
165
166
	/* dirty, necessary for unmounting, sysfs and sysrq */
	struct super_block	*si_sb;
J. R. Okajima's avatar
J. R. Okajima committed
167
168
};

169
170
171
172
173
174
175
/* sbinfo status flags, kept in au_sbinfo::au_si_status */
/*
 * set true when refresh_dirs() failed at remount time.
 * then try refreshing dirs at access time again.
 * if it is false, refreshing dirs at access time is unnecessary
 */
#define AuSi_FAILED_REFRESH_DIR	1
/* add later */
#define AuSi_NO_DREVAL		(1 << 2)	/* disable all d_revalidate */
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194

/*
 * Return the bits of sbi->au_si_status selected by 'flag' (non-zero when any
 * of them is set). AuRwMustAnyLock() is applied to si_rwsem first.
 */
static inline unsigned char au_do_ftest_si(struct au_sbinfo *sbi,
					   unsigned int flag)
{
	unsigned char masked;

	AuRwMustAnyLock(&sbi->si_rwsem);
	masked = sbi->au_si_status & flag;
	return masked;
}

/* test AuSi_<name>; goes through au_do_ftest_si() */
#define au_ftest_si(sbinfo, name) \
	au_do_ftest_si(sbinfo, AuSi_##name)

/* set AuSi_<name>; AuRwMustWriteLock() is applied to si_rwsem first */
#define au_fset_si(sbinfo, name) do { \
	AuRwMustWriteLock(&(sbinfo)->si_rwsem); \
	(sbinfo)->au_si_status |= AuSi_##name; \
} while (0)

/* clear AuSi_<name>; AuRwMustWriteLock() is applied to si_rwsem first */
#define au_fclr_si(sbinfo, name) do { \
	AuRwMustWriteLock(&(sbinfo)->si_rwsem); \
	(sbinfo)->au_si_status &= ~AuSi_##name; \
} while (0)

J. R. Okajima's avatar
J. R. Okajima committed
195
196
/* ---------------------------------------------------------------------- */

197
198
199
200
201
202
/* policy to select one among writable branches */
/*
 * Call the copy-up / create hook of the policy currently installed in
 * 'sbinfo'. The variadic arguments are forwarded unchanged to
 * si_wbr_copyup_ops->copyup() or si_wbr_create_ops->create(), and the
 * expression evaluates to the hook's int return value.
 */
#define AuWbrCopyup(sbinfo, ...) \
	((sbinfo)->si_wbr_copyup_ops->copyup(__VA_ARGS__))
#define AuWbrCreate(sbinfo, ...) \
	((sbinfo)->si_wbr_create_ops->create(__VA_ARGS__))

J. R. Okajima's avatar
J. R. Okajima committed
203
/* flags for si_read_lock()/aufs_read_lock()/di_read_lock() */
#define AuLock_DW		1		/* write-lock dentry */
#define AuLock_IR		(1 << 1)	/* read-lock inode */
#define AuLock_IW		(1 << 2)	/* write-lock inode */
#define AuLock_FLUSH		(1 << 3)	/* wait for 'nowait' tasks */
#define AuLock_DIRS		(1 << 4)	/* target is a pair of dirs */
						/* except RENAME_EXCHANGE */
#define AuLock_NOPLM		(1 << 5)	/* return err in plm mode */
#define AuLock_NOPLMW		(1 << 6)	/* wait for plm mode ends */
#define AuLock_GEN		(1 << 7)	/* test digen/iigen */
J. R. Okajima's avatar
J. R. Okajima committed
213
214
215
216
217
218
219
220
/*
 * Test/set/clear a single AuLock_<name> bit in the lvalue 'flags'.
 * au_ftest_lock() is an expression; the set/clear forms are single
 * statements (do { } while (0)).
 */
#define au_ftest_lock(flags, name)	((flags) & AuLock_##name)
#define au_fset_lock(flags, name) \
	do { (flags) |= AuLock_##name; } while (0)
#define au_fclr_lock(flags, name) \
	do { (flags) &= ~AuLock_##name; } while (0)

/* ---------------------------------------------------------------------- */

J. R. Okajima's avatar
J. R. Okajima committed
221
/* super.c */
extern struct file_system_type aufs_fs_type;
struct inode *au_iget_locked(struct super_block *sb, ino_t ino);
/*
 * callback type taken by au_array_alloc().
 * NOTE(review): presumably fills 'array' with up to 'max' entries and returns
 * the count -- confirm against super.c.
 */
typedef unsigned long long (*au_arraycb_t)(struct super_block *sb, void *array,
					   unsigned long long max, void *arg);
void *au_array_alloc(unsigned long long *hint, au_arraycb_t cb,
		     struct super_block *sb, void *arg);
struct inode **au_iarray_alloc(struct super_block *sb, unsigned long long *max);
void au_iarray_free(struct inode **a, unsigned long long max);
J. R. Okajima's avatar
J. R. Okajima committed
230

J. R. Okajima's avatar
J. R. Okajima committed
231
232
233
/* sbinfo.c */
void au_si_free(struct kobject *kobj);
int au_si_alloc(struct super_block *sb);
234
int au_sbr_realloc(struct au_sbinfo *sbinfo, int nbr, int may_shrink);
J. R. Okajima's avatar
J. R. Okajima committed
235

J. R. Okajima's avatar
J. R. Okajima committed
236
unsigned int au_sigen_inc(struct super_block *sb);
237
aufs_bindex_t au_new_br_id(struct super_block *sb);
J. R. Okajima's avatar
J. R. Okajima committed
238

J. R. Okajima's avatar
J. R. Okajima committed
239
240
int si_read_lock(struct super_block *sb, int flags);
int si_write_lock(struct super_block *sb, int flags);
J. R. Okajima's avatar
J. R. Okajima committed
241
242
243
244
int aufs_read_lock(struct dentry *dentry, int flags);
void aufs_read_unlock(struct dentry *dentry, int flags);
void aufs_write_lock(struct dentry *dentry);
void aufs_write_unlock(struct dentry *dentry);
245
246
int aufs_read_and_write_lock2(struct dentry *d1, struct dentry *d2, int flags);
void aufs_read_and_write_unlock2(struct dentry *d1, struct dentry *d2);
J. R. Okajima's avatar
J. R. Okajima committed
247

248
249
250
251
252
253
254
/* wbr_policy.c */
/*
 * policy tables.
 * NOTE(review): presumably indexed by au_sbinfo::si_wbr_copyup and
 * ::si_wbr_create respectively -- confirm against wbr_policy.c.
 */
extern struct au_wbr_copyup_operations au_wbr_copyup_ops[];
extern struct au_wbr_create_operations au_wbr_create_ops[];
int au_cpdown_dirs(struct dentry *dentry, aufs_bindex_t bdst);
int au_wbr_nonopq(struct dentry *dentry, aufs_bindex_t bindex);
int au_wbr_do_copyup_bu(struct dentry *dentry, aufs_bindex_t btop);

J. R. Okajima's avatar
J. R. Okajima committed
255
256
257
258
259
260
261
262
263
/* ---------------------------------------------------------------------- */

/* Return the aufs private info stored in sb->s_fs_info. */
static inline struct au_sbinfo *au_sbi(struct super_block *sb)
{
	struct au_sbinfo *sbinfo = sb->s_fs_info;

	return sbinfo;
}

/* ---------------------------------------------------------------------- */

J. R. Okajima's avatar
J. R. Okajima committed
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
#ifdef CONFIG_AUFS_EXPORT
/* export support is enabled: the implementations live outside this header */
int au_test_nfsd(void);
void au_export_init(struct super_block *sb);
void au_xigen_inc(struct inode *inode);
int au_xigen_new(struct inode *inode);
int au_xigen_set(struct super_block *sb, struct path *path);
void au_xigen_clr(struct super_block *sb);

/* -ESTALE when au_test_nfsd() returns non-zero, -EBUSY otherwise */
static inline int au_busy_or_stale(void)
{
	return au_test_nfsd() ? -ESTALE : -EBUSY;
}
#else
/* export support is disabled: the same names become AuStub*() stubs */
AuStubInt0(au_test_nfsd, void)
AuStubVoid(au_export_init, struct super_block *sb)
AuStubVoid(au_xigen_inc, struct inode *inode)
AuStubInt0(au_xigen_new, struct inode *inode)
AuStubInt0(au_xigen_set, struct super_block *sb, struct path *path)
AuStubVoid(au_xigen_clr, struct super_block *sb)
AuStub(int, au_busy_or_stale, return -EBUSY, void)
#endif /* CONFIG_AUFS_EXPORT */

/* ---------------------------------------------------------------------- */

J. R. Okajima's avatar
J. R. Okajima committed
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
#ifdef CONFIG_AUFS_SBILIST
/* module.c */
extern struct hlist_bl_head au_sbilist;

/* initialize the au_sbilist head */
static inline void au_sbilist_init(void)
{
	INIT_HLIST_BL_HEAD(&au_sbilist);
}

/* link the sbinfo of 'sb' into au_sbilist through its si_list node */
static inline void au_sbilist_add(struct super_block *sb)
{
	struct au_sbinfo *sbinfo = au_sbi(sb);

	au_hbl_add(&sbinfo->si_list, &au_sbilist);
}

/* unlink the sbinfo of 'sb' from au_sbilist */
static inline void au_sbilist_del(struct super_block *sb)
{
	struct au_sbinfo *sbinfo = au_sbi(sb);

	au_hbl_del(&sbinfo->si_list, &au_sbilist);
}

#define AuGFP_SBILIST	GFP_NOFS
#else
/* no sbinfo list: the helpers become AuStubVoid() stubs */
AuStubVoid(au_sbilist_init, void)
AuStubVoid(au_sbilist_add, struct super_block *sb)
AuStubVoid(au_sbilist_del, struct super_block *sb)
#define AuGFP_SBILIST	GFP_NOFS
#endif

/* ---------------------------------------------------------------------- */

319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
/* current->atomic_flags */
/* this value should never corrupt the ones defined in linux/sched.h */
#define PFA_AUFS	7

/*
 * Instantiate the per-task flag helpers for the AUFS bit; the name of the
 * function each line generates is noted at its end.
 */
TASK_PFA_TEST(AUFS, test_aufs)	/* task_test_aufs */
TASK_PFA_SET(AUFS, aufs)	/* task_set_aufs */
TASK_PFA_CLEAR(AUFS, aufs)	/* task_clear_aufs */

/*
 * The three helpers below track the aufs flag of the current task.
 * 'sb' is accepted but not used by any of them.
 */

/* 1 when the aufs flag of the current task is set, 0 otherwise */
static inline int si_pid_test(struct super_block *sb)
{
	return task_test_aufs(current) ? 1 : 0;
}

/* clear the flag; AuDebugOn() fires when it was not set */
static inline void si_pid_clr(struct super_block *sb)
{
	AuDebugOn(!task_test_aufs(current));

	task_clear_aufs(current);
}

/* set the flag; AuDebugOn() fires when it was already set */
static inline void si_pid_set(struct super_block *sb)
{
	AuDebugOn(task_test_aufs(current));

	task_set_aufs(current);
}

/* ---------------------------------------------------------------------- */

J. R. Okajima's avatar
J. R. Okajima committed
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
/* lock superblock. mainly for entry point functions */
/*
 * Raw wrappers: each one applies the named au_rw_*() operation to the
 * si_rwsem of the sbinfo of 'sb'. They do not touch the per-task aufs flag;
 * the si_noflush_*() and si_*_unlock() inlines in this header add that.
 */
#define __si_read_lock(sb)	au_rw_read_lock(&au_sbi(sb)->si_rwsem)
#define __si_write_lock(sb)	au_rw_write_lock(&au_sbi(sb)->si_rwsem)
#define __si_read_trylock(sb)	au_rw_read_trylock(&au_sbi(sb)->si_rwsem)
#define __si_write_trylock(sb)	au_rw_write_trylock(&au_sbi(sb)->si_rwsem)
/*
#define __si_read_trylock_nested(sb) \
	au_rw_read_trylock_nested(&au_sbi(sb)->si_rwsem)
#define __si_write_trylock_nested(sb) \
	au_rw_write_trylock_nested(&au_sbi(sb)->si_rwsem)
*/

#define __si_read_unlock(sb)	au_rw_read_unlock(&au_sbi(sb)->si_rwsem)
#define __si_write_unlock(sb)	au_rw_write_unlock(&au_sbi(sb)->si_rwsem)
#define __si_downgrade_lock(sb)	au_rw_dgrade_lock(&au_sbi(sb)->si_rwsem)

/* AuRwMust*() checks applied to si_rwsem of 'sb' */
#define SiMustNoWaiters(sb)	AuRwMustNoWaiters(&au_sbi(sb)->si_rwsem)
#define SiMustAnyLock(sb)	AuRwMustAnyLock(&au_sbi(sb)->si_rwsem)
#define SiMustWriteLock(sb)	AuRwMustWriteLock(&au_sbi(sb)->si_rwsem)

J. R. Okajima's avatar
J. R. Okajima committed
366
367
368
/*
 * Read-lock si_rwsem of 'sb', then set the aufs flag of the current task.
 * No au_nwt_flush() is performed here.
 */
static inline void si_noflush_read_lock(struct super_block *sb)
{
	__si_read_lock(sb);
	si_pid_set(sb);
}

/*
 * Try to read-lock si_rwsem of 'sb' without flushing.
 * Returns the result of __si_read_trylock(); the aufs flag of the current
 * task is set only when that result is non-zero.
 */
static inline int si_noflush_read_trylock(struct super_block *sb)
{
	int locked;

	locked = __si_read_trylock(sb);
	if (locked)
		si_pid_set(sb);
	return locked;
}

/*
 * Write-lock si_rwsem of 'sb', then set the aufs flag of the current task.
 * No au_nwt_flush() is performed here.
 */
static inline void si_noflush_write_lock(struct super_block *sb)
{
	__si_write_lock(sb);
	si_pid_set(sb);
}

/*
 * Try to write-lock si_rwsem of 'sb' without flushing.
 * Returns the result of __si_write_trylock(); the aufs flag of the current
 * task is set only when that result is non-zero.
 */
static inline int si_noflush_write_trylock(struct super_block *sb)
{
	int locked;

	locked = __si_write_trylock(sb);
	if (locked)
		si_pid_set(sb);
	return locked;
}

/*
 * Compiled out. Flushing variant of si_noflush_read_trylock(): calls
 * au_nwt_flush() on si_nowait first when AuLock_FLUSH is set in 'flags'.
 */
#if 0 /* reserved */
static inline int si_read_trylock(struct super_block *sb, int flags)
{
	if (au_ftest_lock(flags, FLUSH))
		au_nwt_flush(&au_sbi(sb)->si_nowait);
	return si_noflush_read_trylock(sb);
}
#endif

/*
 * Release a read lock on si_rwsem of 'sb'. The aufs flag of the current
 * task is cleared first, while the lock is still held.
 */
static inline void si_read_unlock(struct super_block *sb)
{
	si_pid_clr(sb);
	__si_read_unlock(sb);
}

/*
 * Compiled out. Flushing variant of si_noflush_write_trylock(): calls
 * au_nwt_flush() on si_nowait first when AuLock_FLUSH is set in 'flags'.
 */
#if 0 /* reserved */
static inline int si_write_trylock(struct super_block *sb, int flags)
{
	if (au_ftest_lock(flags, FLUSH))
		au_nwt_flush(&au_sbi(sb)->si_nowait);
	return si_noflush_write_trylock(sb);
}
#endif

/*
 * Release a write lock on si_rwsem of 'sb'. The aufs flag of the current
 * task is cleared first, while the lock is still held.
 */
static inline void si_write_unlock(struct super_block *sb)
{
	si_pid_clr(sb);
	__si_write_unlock(sb);
}

/* Compiled out. Thin wrapper around __si_downgrade_lock(). */
#if 0 /* reserved */
static inline void si_downgrade_lock(struct super_block *sb)
{
	__si_downgrade_lock(sb);
}
#endif

J. R. Okajima's avatar
J. R. Okajima committed
435
436
437
438
439
440
441
442
/* ---------------------------------------------------------------------- */

static inline aufs_bindex_t au_sbbot(struct super_block *sb)
{
	SiMustAnyLock(sb);
	return au_sbi(sb)->si_bbot;
}

443
444
445
446
447
448
static inline unsigned int au_mntflags(struct super_block *sb)
{
	SiMustAnyLock(sb);
	return au_sbi(sb)->si_mntflags;
}

J. R. Okajima's avatar
J. R. Okajima committed
449
450
451
452
453
454
static inline unsigned int au_sigen(struct super_block *sb)
{
	SiMustAnyLock(sb);
	return au_sbi(sb)->si_generation;
}

455
456
457
458
459
460
461
/*
 * Return the si_branch[] entry of 'sb' at 'bindex'; SiMustAnyLock() is
 * applied first. 'bindex' is not range-checked here.
 */
static inline struct au_branch *au_sbr(struct super_block *sb,
				       aufs_bindex_t bindex)
{
	struct au_branch **branches;

	SiMustAnyLock(sb);
	branches = au_sbi(sb)->si_branch;
	return branches[bindex];
}

J. R. Okajima's avatar
J. R. Okajima committed
462
463
464
465
466
467
static inline loff_t au_xi_maxent(struct super_block *sb)
{
	SiMustAnyLock(sb);
	return au_sbi(sb)->si_ximaxent;
}

J. R. Okajima's avatar
J. R. Okajima committed
468
469
#endif /* __KERNEL__ */
#endif /* __AUFS_SUPER_H__ */