Bug Summary

File: ufs/ffs/ffs_softdep.c
Warning: line 4531, column 18
Although the value stored to 'flushparent' is used in the enclosing expression, the value is never actually read from 'flushparent'
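A minimal sketch of the pattern this checker (deadcode.DeadStores) flags — this is illustrative only, not the code at line 4531; the names and the flag test are invented for the example:

        int flushparent, flags = compute_flags();       /* hypothetical helper */

        /*
         * Dead store: the assignment's value drives the branch, but
         * 'flushparent' itself is never read again afterwards.
         */
        if ((flushparent = (flags & 0x1)) != 0)
                flush();

Testing the expression directly, without the intermediate store, avoids the warning when the variable is otherwise unused.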

Annotated Source Code


clang -cc1 -cc1 -triple amd64-unknown-openbsd7.4 -analyze -disable-free -clear-ast-before-backend -disable-llvm-verifier -discard-value-names -main-file-name ffs_softdep.c -analyzer-checker=core -analyzer-checker=apiModeling -analyzer-checker=unix -analyzer-checker=deadcode -analyzer-checker=security.insecureAPI.UncheckedReturn -analyzer-checker=security.insecureAPI.getpw -analyzer-checker=security.insecureAPI.gets -analyzer-checker=security.insecureAPI.mktemp -analyzer-checker=security.insecureAPI.mkstemp -analyzer-checker=security.insecureAPI.vfork -analyzer-checker=nullability.NullPassedToNonnull -analyzer-checker=nullability.NullReturnedFromNonnull -analyzer-output plist -w -setup-static-analyzer -mrelocation-model static -mframe-pointer=all -relaxed-aliasing -ffp-contract=on -fno-rounding-math -mconstructor-aliases -ffreestanding -mcmodel=kernel -target-cpu x86-64 -target-feature +retpoline-indirect-calls -target-feature +retpoline-indirect-branches -target-feature -sse2 -target-feature -sse -target-feature -3dnow -target-feature -mmx -target-feature +save-args -target-feature +retpoline-external-thunk -disable-red-zone -no-implicit-float -tune-cpu generic -debugger-tuning=gdb -fcoverage-compilation-dir=/usr/src/sys/arch/amd64/compile/GENERIC.MP/obj -nostdsysteminc -nobuiltininc -resource-dir /usr/local/llvm16/lib/clang/16 -I /usr/src/sys -I /usr/src/sys/arch/amd64/compile/GENERIC.MP/obj -I /usr/src/sys/arch -I /usr/src/sys/dev/pci/drm/include -I /usr/src/sys/dev/pci/drm/include/uapi -I /usr/src/sys/dev/pci/drm/amd/include/asic_reg -I /usr/src/sys/dev/pci/drm/amd/include -I /usr/src/sys/dev/pci/drm/amd/amdgpu -I /usr/src/sys/dev/pci/drm/amd/display -I /usr/src/sys/dev/pci/drm/amd/display/include -I /usr/src/sys/dev/pci/drm/amd/display/dc -I /usr/src/sys/dev/pci/drm/amd/display/amdgpu_dm -I /usr/src/sys/dev/pci/drm/amd/pm/inc -I /usr/src/sys/dev/pci/drm/amd/pm/legacy-dpm -I /usr/src/sys/dev/pci/drm/amd/pm/swsmu -I /usr/src/sys/dev/pci/drm/amd/pm/swsmu/inc -I /usr/src/sys/dev/pci/drm/amd/pm/swsmu/smu11 -I /usr/src/sys/dev/pci/drm/amd/pm/swsmu/smu12 -I /usr/src/sys/dev/pci/drm/amd/pm/swsmu/smu13 -I /usr/src/sys/dev/pci/drm/amd/pm/powerplay/inc -I /usr/src/sys/dev/pci/drm/amd/pm/powerplay/hwmgr -I /usr/src/sys/dev/pci/drm/amd/pm/powerplay/smumgr -I /usr/src/sys/dev/pci/drm/amd/pm/swsmu/inc -I /usr/src/sys/dev/pci/drm/amd/pm/swsmu/inc/pmfw_if -I /usr/src/sys/dev/pci/drm/amd/display/dc/inc -I /usr/src/sys/dev/pci/drm/amd/display/dc/inc/hw -I /usr/src/sys/dev/pci/drm/amd/display/dc/clk_mgr -I /usr/src/sys/dev/pci/drm/amd/display/modules/inc -I /usr/src/sys/dev/pci/drm/amd/display/modules/hdcp -I /usr/src/sys/dev/pci/drm/amd/display/dmub/inc -I /usr/src/sys/dev/pci/drm/i915 -D DDB -D DIAGNOSTIC -D KTRACE -D ACCOUNTING -D KMEMSTATS -D PTRACE -D POOL_DEBUG -D CRYPTO -D SYSVMSG -D SYSVSEM -D SYSVSHM -D UVM_SWAP_ENCRYPT -D FFS -D FFS2 -D FFS_SOFTUPDATES -D UFS_DIRHASH -D QUOTA -D EXT2FS -D MFS -D NFSCLIENT -D NFSSERVER -D CD9660 -D UDF -D MSDOSFS -D FIFO -D FUSE -D SOCKET_SPLICE -D TCP_ECN -D TCP_SIGNATURE -D INET6 -D IPSEC -D PPP_BSDCOMP -D PPP_DEFLATE -D PIPEX -D MROUTING -D MPLS -D BOOT_CONFIG -D USER_PCICONF -D APERTURE -D MTRR -D NTFS -D SUSPEND -D HIBERNATE -D PCIVERBOSE -D USBVERBOSE -D WSDISPLAY_COMPAT_USL -D WSDISPLAY_COMPAT_RAWKBD -D WSDISPLAY_DEFAULTSCREENS=6 -D X86EMU -D ONEWIREVERBOSE -D MULTIPROCESSOR -D MAXUSERS=80 -D _KERNEL -O2 -Wno-pointer-sign -Wno-address-of-packed-member -Wno-constant-conversion -Wno-unused-but-set-variable -Wno-gnu-folding-constant 
-fdebug-compilation-dir=/usr/src/sys/arch/amd64/compile/GENERIC.MP/obj -ferror-limit 19 -fwrapv -D_RET_PROTECTOR -ret-protector -fcf-protection=branch -fgnuc-version=4.2.1 -vectorize-loops -vectorize-slp -fno-builtin-malloc -fno-builtin-calloc -fno-builtin-realloc -fno-builtin-valloc -fno-builtin-free -fno-builtin-strdup -fno-builtin-strndup -analyzer-output=html -faddrsig -o /home/ben/Projects/scan/2024-01-11-110808-61670-1 -x c /usr/src/sys/ufs/ffs/ffs_softdep.c
/*	$OpenBSD: ffs_softdep.c,v 1.152 2023/07/05 15:13:28 beck Exp $	*/

/*
 * Copyright 1998, 2000 Marshall Kirk McKusick. All Rights Reserved.
 *
 * The soft updates code is derived from the appendix of a University
 * of Michigan technical report (Gregory R. Ganger and Yale N. Patt,
 * "Soft Updates: A Solution to the Metadata Update Problem in File
 * Systems", CSE-TR-254-95, August 1995).
 *
 * Further information about soft updates can be obtained from:
 *
 *	Marshall Kirk McKusick		http://www.mckusick.com/softdep/
 *	1614 Oxford Street		mckusick@mckusick.com
 *	Berkeley, CA 94709-1608		+1-510-843-9542
 *	USA
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY MARSHALL KIRK MCKUSICK ``AS IS'' AND ANY
 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL MARSHALL KIRK MCKUSICK BE LIABLE FOR
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	from: @(#)ffs_softdep.c	9.59 (McKusick) 6/21/00
 *	$FreeBSD: src/sys/ufs/ffs/ffs_softdep.c,v 1.86 2001/02/04 16:08:18 phk Exp $
 */

#include <sys/param.h>
#include <sys/buf.h>
#include <sys/kernel.h>
#include <sys/malloc.h>
#include <sys/mount.h>
#include <sys/proc.h>
#include <sys/pool.h>
#include <sys/syslog.h>
#include <sys/systm.h>
#include <sys/vnode.h>
#include <sys/specdev.h>
#include <crypto/siphash.h>
#include <ufs/ufs/dir.h>
#include <ufs/ufs/quota.h>
#include <ufs/ufs/inode.h>
#include <ufs/ufs/ufsmount.h>
#include <ufs/ffs/fs.h>
#include <ufs/ffs/softdep.h>
#include <ufs/ffs/ffs_extern.h>
#include <ufs/ufs/ufs_extern.h>

#define STATIC

/*
 * Mapping of dependency structure types to malloc types.
 */
#define D_PAGEDEP	0
#define D_INODEDEP	1
#define D_NEWBLK	2
#define D_BMSAFEMAP	3
#define D_ALLOCDIRECT	4
#define D_INDIRDEP	5
#define D_ALLOCINDIR	6
#define D_FREEFRAG	7
#define D_FREEBLKS	8
#define D_FREEFILE	9
#define D_DIRADD	10
#define D_MKDIR		11
#define D_DIRREM	12
#define D_NEWDIRBLK	13
#define D_LAST		13
/*
 * Names of softdep types.
 */
const char *softdep_typenames[] = {
	"pagedep",
	"inodedep",
	"newblk",
	"bmsafemap",
	"allocdirect",
	"indirdep",
	"allocindir",
	"freefrag",
	"freeblks",
	"freefile",
	"diradd",
	"mkdir",
	"dirrem",
	"newdirblk",
};
#define TYPENAME(type) \
	((unsigned)(type) <= D_LAST ? softdep_typenames[type] : "???")
/*
 * Finding the current process.
 */
#define CURPROC curproc
/*
 * End system adaptation definitions.
 */

/*
 * Internal function prototypes.
 */
STATIC	void softdep_error(char *, int);
STATIC	void drain_output(struct vnode *, int);
STATIC	int getdirtybuf(struct buf *, int);
STATIC	void clear_remove(struct proc *);
STATIC	void clear_inodedeps(struct proc *);
STATIC	int flush_pagedep_deps(struct vnode *, struct mount *,
	    struct diraddhd *);
STATIC	int flush_inodedep_deps(struct fs *, ufsino_t);
STATIC	int handle_written_filepage(struct pagedep *, struct buf *);
STATIC	void diradd_inode_written(struct diradd *, struct inodedep *);
STATIC	int handle_written_inodeblock(struct inodedep *, struct buf *);
STATIC	void handle_allocdirect_partdone(struct allocdirect *);
STATIC	void handle_allocindir_partdone(struct allocindir *);
STATIC	void initiate_write_filepage(struct pagedep *, struct buf *);
STATIC	void handle_written_mkdir(struct mkdir *, int);
STATIC	void initiate_write_inodeblock_ufs1(struct inodedep *, struct buf *);
#ifdef FFS2
STATIC	void initiate_write_inodeblock_ufs2(struct inodedep *, struct buf *);
#endif
STATIC	void handle_workitem_freefile(struct freefile *);
STATIC	void handle_workitem_remove(struct dirrem *);
STATIC	struct dirrem *newdirrem(struct buf *, struct inode *,
	    struct inode *, int, struct dirrem **);
STATIC	void free_diradd(struct diradd *);
STATIC	void free_allocindir(struct allocindir *, struct inodedep *);
STATIC	void free_newdirblk(struct newdirblk *);
STATIC	int indir_trunc(struct inode *, daddr_t, int, daddr_t, long *);
STATIC	void deallocate_dependencies(struct buf *, struct inodedep *);
STATIC	void free_allocdirect(struct allocdirectlst *,
	    struct allocdirect *, int);
STATIC	int check_inode_unwritten(struct inodedep *);
STATIC	int free_inodedep(struct inodedep *);
STATIC	void handle_workitem_freeblocks(struct freeblks *);
STATIC	void merge_inode_lists(struct inodedep *);
STATIC	void setup_allocindir_phase2(struct buf *, struct inode *,
	    struct allocindir *);
STATIC	struct allocindir *newallocindir(struct inode *, int, daddr_t,
	    daddr_t);
STATIC	void handle_workitem_freefrag(struct freefrag *);
STATIC	struct freefrag *newfreefrag(struct inode *, daddr_t, long);
STATIC	void allocdirect_merge(struct allocdirectlst *,
	    struct allocdirect *, struct allocdirect *);
STATIC	struct bmsafemap *bmsafemap_lookup(struct buf *);
STATIC	int newblk_lookup(struct fs *, daddr_t, int,
	    struct newblk **);
STATIC	int inodedep_lookup(struct fs *, ufsino_t, int, struct inodedep **);
STATIC	int pagedep_lookup(struct inode *, daddr_t, int, struct pagedep **);
STATIC	void pause_timer(void *);
STATIC	int request_cleanup(int, int);
STATIC	int process_worklist_item(struct mount *, int *, int);
STATIC	void add_to_worklist(struct worklist *);

/*
 * Exported softdep operations.
 */
void softdep_disk_io_initiation(struct buf *);
void softdep_disk_write_complete(struct buf *);
void softdep_deallocate_dependencies(struct buf *);
void softdep_move_dependencies(struct buf *, struct buf *);
int softdep_count_dependencies(struct buf *bp, int, int);

/*
 * Locking primitives.
 *
 * For a uniprocessor, all we need to do is protect against disk
 * interrupts. For a multiprocessor, this lock would have to be
 * a mutex. A single mutex is used throughout this file, though
 * finer grain locking could be used if contention warranted it.
 *
 * For a multiprocessor, the sleep call would accept a lock and
 * release it after the sleep processing was complete. In a uniprocessor
 * implementation there is no such interlock, so we simply mark
 * the places where it needs to be done with the `interlocked' form
 * of the lock calls. Since the uniprocessor sleep already interlocks
 * the spl, there is nothing that really needs to be done.
 */
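/*
 * Illustrative sketch only (not in the original file): how the
 * `interlocked' forms are meant to be paired around a sleep.  The spl
 * saved by FREE_LOCK_INTERLOCKED() is handed back when the lock is
 * retaken; sema_get() below uses exactly this pattern.  'example_wait'
 * and the buffer flag test are hypothetical.
 */
#if 0
STATIC void
example_wait(struct buf *bp)
{
	int s;

	ACQUIRE_LOCK(&lk);
	while (bp->b_flags & B_BUSY) {
		s = FREE_LOCK_INTERLOCKED(&lk);	/* drop lock, keep spl */
		tsleep_nsec(bp, PRIBIO, "sdwait", INFSLP);
		ACQUIRE_LOCK_INTERLOCKED(&lk, s); /* retake with saved spl */
	}
	FREE_LOCK(&lk);
}
#endif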
#ifndef /* NOT */ DEBUG
STATIC struct lockit {
	int	lkt_spl;
} lk = { 0 };
#define ACQUIRE_LOCK(lk)		(lk)->lkt_spl = splbio()
#define FREE_LOCK(lk)			splx((lk)->lkt_spl)
#define ACQUIRE_LOCK_INTERLOCKED(lk,s)	(lk)->lkt_spl = (s)
#define FREE_LOCK_INTERLOCKED(lk)	((lk)->lkt_spl)

#else /* DEBUG */
STATIC struct lockit {
	int	lkt_spl;
	pid_t	lkt_held;
	int	lkt_line;
} lk = { 0, -1 };
STATIC int lockcnt;

STATIC	void acquire_lock(struct lockit *, int);
STATIC	void free_lock(struct lockit *, int);
STATIC	void acquire_lock_interlocked(struct lockit *, int, int);
STATIC	int free_lock_interlocked(struct lockit *, int);

#define ACQUIRE_LOCK(lk)		acquire_lock(lk, __LINE__)
#define FREE_LOCK(lk)			free_lock(lk, __LINE__)
#define ACQUIRE_LOCK_INTERLOCKED(lk,s)	acquire_lock_interlocked(lk, (s), __LINE__)
#define FREE_LOCK_INTERLOCKED(lk)	free_lock_interlocked(lk, __LINE__)

STATIC void
acquire_lock(struct lockit *lk, int line)
{
	pid_t holder;
	int original_line;

	if (lk->lkt_held != -1) {
		holder = lk->lkt_held;
		original_line = lk->lkt_line;
		FREE_LOCK(lk);
		if (holder == CURPROC->p_tid)
			panic("softdep_lock: locking against myself, "
			    "acquired at line %d, relocked at line %d",
			    original_line, line);
		else
			panic("softdep_lock: lock held by %d, "
			    "acquired at line %d, relocked at line %d",
			    holder, original_line, line);
	}
	lk->lkt_spl = splbio();
	lk->lkt_held = CURPROC->p_tid;
	lk->lkt_line = line;
	lockcnt++;
}

STATIC void
free_lock(struct lockit *lk, int line)
{

	if (lk->lkt_held == -1)
		panic("softdep_unlock: lock not held at line %d", line);
	lk->lkt_held = -1;
	splx(lk->lkt_spl);
}

STATIC void
acquire_lock_interlocked(struct lockit *lk, int s, int line)
{
	pid_t holder;
	int original_line;

	if (lk->lkt_held != -1) {
		holder = lk->lkt_held;
		original_line = lk->lkt_line;
		FREE_LOCK_INTERLOCKED(lk);
		if (holder == CURPROC->p_tid)
			panic("softdep_lock: locking against myself, "
			    "acquired at line %d, relocked at line %d",
			    original_line, line);
		else
			panic("softdep_lock: lock held by %d, "
			    "acquired at line %d, relocked at line %d",
			    holder, original_line, line);
	}
	lk->lkt_held = CURPROC->p_tid;
	lk->lkt_line = line;
	lk->lkt_spl = s;
	lockcnt++;
}

STATIC int
free_lock_interlocked(struct lockit *lk, int line)
{

	if (lk->lkt_held == -1)
		panic("softdep_unlock_interlocked: lock not held at line %d",
		    line);
	lk->lkt_held = -1;

	return (lk->lkt_spl);
}
#endif /* DEBUG */

/*
 * Place holder for real semaphores.
 */
struct sema {
	int	value;
	pid_t	holder;
	char	*name;
	int	prio;
};
STATIC	void sema_init(struct sema *, char *, int);
STATIC	int sema_get(struct sema *, struct lockit *);
STATIC	void sema_release(struct sema *);

STATIC void
sema_init(struct sema *semap, char *name, int prio)
{

	semap->holder = -1;
	semap->value = 0;
	semap->name = name;
	semap->prio = prio;
}

STATIC int
sema_get(struct sema *semap, struct lockit *interlock)
{
	int s;

	if (semap->value++ > 0) {
		if (interlock != NULL)
			s = FREE_LOCK_INTERLOCKED(interlock);
		tsleep_nsec(semap, semap->prio, semap->name, INFSLP);
		if (interlock != NULL) {
			ACQUIRE_LOCK_INTERLOCKED(interlock, s);
			FREE_LOCK(interlock);
		}
		return (0);
	}
	semap->holder = CURPROC->p_tid;
	if (interlock != NULL)
		FREE_LOCK(interlock);
	return (1);
}

STATIC void
sema_release(struct sema *semap)
{

	if (semap->value <= 0 || semap->holder != CURPROC->p_tid) {
#ifdef DEBUG
		if (lk.lkt_held != -1)
			FREE_LOCK(&lk);
#endif
		panic("sema_release: not held");
	}
	if (--semap->value > 0) {
		semap->value = 0;
		wakeup(semap);
	}
	semap->holder = -1;
}

/*
 * Memory management.
 */
STATIC struct pool pagedep_pool;
STATIC struct pool inodedep_pool;
STATIC struct pool newblk_pool;
STATIC struct pool bmsafemap_pool;
STATIC struct pool allocdirect_pool;
STATIC struct pool indirdep_pool;
STATIC struct pool allocindir_pool;
STATIC struct pool freefrag_pool;
STATIC struct pool freeblks_pool;
STATIC struct pool freefile_pool;
STATIC struct pool diradd_pool;
STATIC struct pool mkdir_pool;
STATIC struct pool dirrem_pool;
STATIC struct pool newdirblk_pool;

static __inline void
softdep_free(struct worklist *item, int type)
{

	switch (type) {
	case D_PAGEDEP:
		pool_put(&pagedep_pool, item);
		break;

	case D_INODEDEP:
		pool_put(&inodedep_pool, item);
		break;

	case D_BMSAFEMAP:
		pool_put(&bmsafemap_pool, item);
		break;

	case D_ALLOCDIRECT:
		pool_put(&allocdirect_pool, item);
		break;

	case D_INDIRDEP:
		pool_put(&indirdep_pool, item);
		break;

	case D_ALLOCINDIR:
		pool_put(&allocindir_pool, item);
		break;

	case D_FREEFRAG:
		pool_put(&freefrag_pool, item);
		break;

	case D_FREEBLKS:
		pool_put(&freeblks_pool, item);
		break;

	case D_FREEFILE:
		pool_put(&freefile_pool, item);
		break;

	case D_DIRADD:
		pool_put(&diradd_pool, item);
		break;

	case D_MKDIR:
		pool_put(&mkdir_pool, item);
		break;

	case D_DIRREM:
		pool_put(&dirrem_pool, item);
		break;

	case D_NEWDIRBLK:
		pool_put(&newdirblk_pool, item);
		break;

	default:
#ifdef DEBUG
		if (lk.lkt_held != -1)
			FREE_LOCK(&lk);
#endif
		panic("softdep_free: unknown type %d", type);
	}
}

struct workhead softdep_freequeue;

static __inline void
softdep_freequeue_add(struct worklist *item)
{
	int s;

	s = splbio();
	LIST_INSERT_HEAD(&softdep_freequeue, item, wk_list);
	splx(s);
}

static __inline void
softdep_freequeue_process(void)
{
	struct worklist *wk;

	splassert(IPL_BIO);

	while ((wk = LIST_FIRST(&softdep_freequeue)) != NULL) {
		LIST_REMOVE(wk, wk_list);
		FREE_LOCK(&lk);
		softdep_free(wk, wk->wk_type);
		ACQUIRE_LOCK(&lk);
	}
}

/*
 * Worklist queue management.
 * These routines require that the lock be held.
 */
#ifndef /* NOT */ DEBUG
#define WORKLIST_INSERT(head, item) do {	\
	(item)->wk_state |= ONWORKLIST;		\
	LIST_INSERT_HEAD(head, item, wk_list);	\
} while (0)
#define WORKLIST_REMOVE(item) do {		\
	(item)->wk_state &= ~ONWORKLIST;	\
	LIST_REMOVE(item, wk_list);		\
} while (0)
#define WORKITEM_FREE(item, type) softdep_freequeue_add((struct worklist *)item)

#else /* DEBUG */
STATIC	void worklist_insert(struct workhead *, struct worklist *);
STATIC	void worklist_remove(struct worklist *);
STATIC	void workitem_free(struct worklist *);

#define WORKLIST_INSERT(head, item) worklist_insert(head, item)
#define WORKLIST_REMOVE(item) worklist_remove(item)
#define WORKITEM_FREE(item, type) workitem_free((struct worklist *)item)

STATIC void
worklist_insert(struct workhead *head, struct worklist *item)
{

	if (lk.lkt_held == -1)
		panic("worklist_insert: lock not held");
	if (item->wk_state & ONWORKLIST) {
		FREE_LOCK(&lk);
		panic("worklist_insert: already on list");
	}
	item->wk_state |= ONWORKLIST;
	LIST_INSERT_HEAD(head, item, wk_list);
}

STATIC void
worklist_remove(struct worklist *item)
{

	if (lk.lkt_held == -1)
		panic("worklist_remove: lock not held");
	if ((item->wk_state & ONWORKLIST) == 0) {
		FREE_LOCK(&lk);
		panic("worklist_remove: not on list");
	}
	item->wk_state &= ~ONWORKLIST;
	LIST_REMOVE(item, wk_list);
}

STATIC void
workitem_free(struct worklist *item)
{

	if (item->wk_state & ONWORKLIST) {
		if (lk.lkt_held != -1)
			FREE_LOCK(&lk);
		panic("workitem_free: still on list");
	}
	softdep_freequeue_add(item);
}
#endif /* DEBUG */

/*
 * Workitem queue management
 */
STATIC struct workhead softdep_workitem_pending;
STATIC struct worklist *worklist_tail;
STATIC int num_on_worklist;	/* number of worklist items to be processed */
STATIC int softdep_worklist_busy; /* 1 => trying to do unmount */
STATIC int softdep_worklist_req; /* serialized waiters */
STATIC int max_softdeps;	/* maximum number of structs before slowdown */
STATIC int tickdelay = 2;	/* number of ticks to pause during slowdown */
STATIC int proc_waiting;	/* tracks whether we have a timeout posted */
STATIC int *stat_countp;	/* statistic to count in proc_waiting timeout */
STATIC struct timeout proc_waiting_timeout;
STATIC struct proc *filesys_syncer; /* proc of filesystem syncer process */
STATIC int req_clear_inodedeps;	/* syncer process flush some inodedeps */
#define FLUSH_INODES	1
STATIC int req_clear_remove;	/* syncer process flush some freeblks */
#define FLUSH_REMOVE	2
/*
 * runtime statistics
 */
STATIC int stat_worklist_push;	/* number of worklist cleanups */
STATIC int stat_blk_limit_push;	/* number of times block limit neared */
STATIC int stat_ino_limit_push;	/* number of times inode limit neared */
STATIC int stat_blk_limit_hit;	/* number of times block slowdown imposed */
STATIC int stat_ino_limit_hit;	/* number of times inode slowdown imposed */
STATIC int stat_sync_limit_hit;	/* number of synchronous slowdowns imposed */
STATIC int stat_indir_blk_ptrs;	/* bufs redirtied as indir ptrs not written */
STATIC int stat_inode_bitmap;	/* bufs redirtied as inode bitmap not written */
STATIC int stat_direct_blk_ptrs;/* bufs redirtied as direct ptrs not written */
STATIC int stat_dir_entry;	/* bufs redirtied as dir entry cannot write */

/*
 * Add an item to the end of the work queue.
 * This routine requires that the lock be held.
 * This is the only routine that adds items to the list.
 * The following routine is the only one that removes items
 * and does so in order from first to last.
 */
STATIC void
add_to_worklist(struct worklist *wk)
{

	if (wk->wk_state & ONWORKLIST) {
#ifdef DEBUG
		if (lk.lkt_held != -1)
			FREE_LOCK(&lk);
#endif
		panic("add_to_worklist: already on list");
	}
	wk->wk_state |= ONWORKLIST;
	if (LIST_FIRST(&softdep_workitem_pending) == NULL)
		LIST_INSERT_HEAD(&softdep_workitem_pending, wk, wk_list);
	else
		LIST_INSERT_AFTER(worklist_tail, wk, wk_list);
	worklist_tail = wk;
	num_on_worklist += 1;
}

/*
 * Process that runs once per second to handle items in the background queue.
 *
 * Note that we ensure that everything is done in the order in which they
 * appear in the queue. The code below depends on this property to ensure
 * that blocks of a file are freed before the inode itself is freed. This
 * ordering ensures that no new <vfsid, inum, lbn> triples will be generated
 * until all the old ones have been purged from the dependency lists.
 */
int
softdep_process_worklist(struct mount *matchmnt)
{
	struct proc *p = CURPROC;
	int matchcnt, loopcount;
	struct timeval starttime;

	/*
	 * First process any items on the delayed-free queue.
	 */
	ACQUIRE_LOCK(&lk);
	softdep_freequeue_process();
	FREE_LOCK(&lk);

	/*
	 * Record the process identifier of our caller so that we can give
	 * this process preferential treatment in request_cleanup below.
	 * We can't do this in softdep_initialize, because the syncer doesn't
	 * have to run then.
	 * NOTE! This function _could_ be called with a curproc != syncerproc.
	 */
	filesys_syncer = syncerproc;
	matchcnt = 0;

	/*
	 * There is no danger of having multiple processes run this
	 * code, but we have to single-thread it when softdep_flushfiles()
	 * is in operation to get an accurate count of the number of items
	 * related to its mount point that are in the list.
	 */
	if (matchmnt == NULL) {
		if (softdep_worklist_busy < 0)
			return(-1);
		softdep_worklist_busy += 1;
	}

	/*
	 * If requested, try removing inode or removal dependencies.
	 */
	if (req_clear_inodedeps) {
		clear_inodedeps(p);
		req_clear_inodedeps -= 1;
		wakeup_one(&proc_waiting);
	}
	if (req_clear_remove) {
		clear_remove(p);
		req_clear_remove -= 1;
		wakeup_one(&proc_waiting);
	}
	loopcount = 1;
	getmicrouptime(&starttime);
	while (num_on_worklist > 0) {
		if (process_worklist_item(matchmnt, &matchcnt, LK_NOWAIT) == 0)
			break;

		/*
		 * If a umount operation wants to run the worklist
		 * accurately, abort.
		 */
		if (softdep_worklist_req && matchmnt == NULL) {
			matchcnt = -1;
			break;
		}

		/*
		 * If requested, try removing inode or removal dependencies.
		 */
		if (req_clear_inodedeps) {
			clear_inodedeps(p);
			req_clear_inodedeps -= 1;
			wakeup_one(&proc_waiting);
		}
		if (req_clear_remove) {
			clear_remove(p);
			req_clear_remove -= 1;
			wakeup_one(&proc_waiting);
		}
		/*
		 * We do not generally want to stop for buffer space, but if
		 * we are really being a buffer hog, we will stop and wait.
		 */
#if 0
		if (loopcount++ % 128 == 0)
			bwillwrite();
#endif
		/*
		 * Never allow processing to run for more than one
		 * second. Otherwise the other syncer tasks may get
		 * excessively backlogged.
		 */
		{
			struct timeval diff;
			struct timeval tv;

			getmicrouptime(&tv);
			timersub(&tv, &starttime, &diff);
			if (diff.tv_sec != 0 && matchmnt == NULL) {
				matchcnt = -1;
				break;
			}
		}

		/*
		 * Process any new items on the delayed-free queue.
		 */
		ACQUIRE_LOCK(&lk);
		softdep_freequeue_process();
		FREE_LOCK(&lk);
	}
	if (matchmnt == NULL) {
		softdep_worklist_busy -= 1;
		if (softdep_worklist_req && softdep_worklist_busy == 0)
			wakeup(&softdep_worklist_req);
	}
	return (matchcnt);
}

/*
 * Process one item on the worklist.
 */
STATIC int
process_worklist_item(struct mount *matchmnt, int *matchcnt, int flags)
{
	struct worklist *wk, *wkend;
	struct dirrem *dirrem;
	struct mount *mp;
	struct vnode *vp;

	ACQUIRE_LOCK(&lk);
	/*
	 * Normally we just process each item on the worklist in order.
	 * However, if we are in a situation where we cannot lock any
	 * inodes, we have to skip over any dirrem requests whose
	 * vnodes are resident and locked.
	 */
	LIST_FOREACH(wk, &softdep_workitem_pending, wk_list) {
		if ((flags & LK_NOWAIT) == 0 || wk->wk_type != D_DIRREM)
			break;
		dirrem = WK_DIRREM(wk);
		vp = ufs_ihashlookup(VFSTOUFS(dirrem->dm_mnt)->um_dev,
		    dirrem->dm_oldinum);
		if (vp == NULL || !VOP_ISLOCKED(vp))
			break;
	}
	if (wk == NULL) {
		FREE_LOCK(&lk);
		return (0);
	}
	/*
	 * Remove the item to be processed. If we are removing the last
	 * item on the list, we need to recalculate the tail pointer.
	 * As this happens rarely and usually when the list is short,
	 * we just run down the list to find it rather than tracking it
	 * in the above loop.
	 */
	WORKLIST_REMOVE(wk);
	if (wk == worklist_tail) {
		LIST_FOREACH(wkend, &softdep_workitem_pending, wk_list)
			if (LIST_NEXT(wkend, wk_list) == NULL)
				break;
		worklist_tail = wkend;
	}
	num_on_worklist -= 1;
	FREE_LOCK(&lk);
	switch (wk->wk_type) {

	case D_DIRREM:
		/* removal of a directory entry */
		mp = WK_DIRREM(wk)->dm_mnt;
#if 0
		if (vn_write_suspend_wait(NULL, mp, V_NOWAIT))
			panic("%s: dirrem on suspended filesystem",
			    "process_worklist_item");
#endif
		if (matchmnt != NULL && mp == matchmnt)
			*matchcnt += 1;
		handle_workitem_remove(WK_DIRREM(wk));
		break;

	case D_FREEBLKS:
		/* releasing blocks and/or fragments from a file */
		mp = WK_FREEBLKS(wk)->fb_mnt;
#if 0
		if (vn_write_suspend_wait(NULL, mp, V_NOWAIT))
			panic("%s: freeblks on suspended filesystem",
			    "process_worklist_item");
#endif
		if (matchmnt != NULL && mp == matchmnt)
			*matchcnt += 1;
		handle_workitem_freeblocks(WK_FREEBLKS(wk));
		break;

	case D_FREEFRAG:
		/* releasing a fragment when replaced as a file grows */
		mp = WK_FREEFRAG(wk)->ff_mnt;
#if 0
		if (vn_write_suspend_wait(NULL, mp, V_NOWAIT))
			panic("%s: freefrag on suspended filesystem",
			    "process_worklist_item");
#endif
		if (matchmnt != NULL && mp == matchmnt)
			*matchcnt += 1;
		handle_workitem_freefrag(WK_FREEFRAG(wk));
		break;

	case D_FREEFILE:
		/* releasing an inode when its link count drops to 0 */
		mp = WK_FREEFILE(wk)->fx_mnt;
#if 0
		if (vn_write_suspend_wait(NULL, mp, V_NOWAIT))
			panic("%s: freefile on suspended filesystem",
			    "process_worklist_item");
#endif
		if (matchmnt != NULL && mp == matchmnt)
			*matchcnt += 1;
		handle_workitem_freefile(WK_FREEFILE(wk));
		break;

	default:
		panic("%s_process_worklist: Unknown type %s",
		    "softdep", TYPENAME(wk->wk_type));
		/* NOTREACHED */
	}
	return (1);
}

/*
 * Move dependencies from one buffer to another.
 */
void
softdep_move_dependencies(struct buf *oldbp, struct buf *newbp)
{
	struct worklist *wk, *wktail;

	if (LIST_FIRST(&newbp->b_dep) != NULL)
		panic("softdep_move_dependencies: need merge code");
	wktail = NULL;
	ACQUIRE_LOCK(&lk);
	while ((wk = LIST_FIRST(&oldbp->b_dep)) != NULL) {
		LIST_REMOVE(wk, wk_list);
		if (wktail == NULL)
			LIST_INSERT_HEAD(&newbp->b_dep, wk, wk_list);
		else
			LIST_INSERT_AFTER(wktail, wk, wk_list);
		wktail = wk;
	}
	FREE_LOCK(&lk);
}

/*
 * Purge the work list of all items associated with a particular mount point.
 */
int
softdep_flushworklist(struct mount *oldmnt, int *countp, struct proc *p)
{
	struct vnode *devvp;
	int count, error = 0;

	/*
	 * Await our turn to clear out the queue, then serialize access.
	 */
	while (softdep_worklist_busy) {
		softdep_worklist_req += 1;
		tsleep_nsec(&softdep_worklist_req, PRIBIO, "softflush", INFSLP);
		softdep_worklist_req -= 1;
	}
	softdep_worklist_busy = -1;
	/*
	 * Alternately flush the block device associated with the mount
	 * point and process any dependencies that the flushing
	 * creates. We continue until no more worklist dependencies
	 * are found.
	 */
	*countp = 0;
	devvp = VFSTOUFS(oldmnt)->um_devvp;
	while ((count = softdep_process_worklist(oldmnt)) > 0) {
		*countp += count;
		vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY);
		error = VOP_FSYNC(devvp, p->p_ucred, MNT_WAIT, p);
		VOP_UNLOCK(devvp);
		if (error)
			break;
	}
	softdep_worklist_busy = 0;
	if (softdep_worklist_req)
		wakeup(&softdep_worklist_req);
	return (error);
}

/*
 * Flush all vnodes and worklist items associated with a specified mount point.
 */
int
softdep_flushfiles(struct mount *oldmnt, int flags, struct proc *p)
{
	int error, count, loopcnt;

	/*
	 * Alternately flush the vnodes associated with the mount
	 * point and process any dependencies that the flushing
	 * creates. In theory, this loop can happen at most twice,
	 * but we give it a few extra just to be sure.
	 */
	for (loopcnt = 10; loopcnt > 0; loopcnt--) {
		/*
		 * Do another flush in case any vnodes were brought in
		 * as part of the cleanup operations.
		 */
		if ((error = ffs_flushfiles(oldmnt, flags, p)) != 0)
			break;
		if ((error = softdep_flushworklist(oldmnt, &count, p)) != 0 ||
		    count == 0)
			break;
	}
	/*
	 * If the reboot process sleeps during the loop, the update
	 * process may call softdep_process_worklist() and create
	 * new dirty vnodes at the mount point. Call ffs_flushfiles()
	 * again after the loop has flushed all soft dependencies.
	 */
	if (error == 0)
		error = ffs_flushfiles(oldmnt, flags, p);
	/*
	 * If we are unmounting then it is an error to fail. If we
	 * are simply trying to downgrade to read-only, then filesystem
	 * activity can keep us busy forever, so we just fail with EBUSY.
	 */
	if (loopcnt == 0) {
		error = EBUSY;
	}
	return (error);
}

/*
 * Structure hashing.
 *
 * There are three types of structures that can be looked up:
 *	1) pagedep structures identified by mount point, inode number,
 *	   and logical block.
 *	2) inodedep structures identified by mount point and inode number.
 *	3) newblk structures identified by mount point and
 *	   physical block number.
 *
 * The "pagedep" and "inodedep" dependency structures are hashed
 * separately from the file blocks and inodes to which they correspond.
 * This separation helps when the in-memory copy of an inode or
 * file block must be replaced. It also obviates the need to access
 * an inode or file page when simply updating (or de-allocating)
 * dependency structures. Lookup of newblk structures is needed to
 * find newly allocated blocks when trying to associate them with
 * their allocdirect or allocindir structure.
 *
 * The lookup routines optionally create and hash a new instance when
 * an existing entry is not found.
 */
#define DEPALLOC	0x0001	/* allocate structure if lookup fails */
#define NODELAY		0x0002	/* cannot do background work */
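/*
 * Illustrative usage sketch (not part of the original file): the lookup
 * routines below share one convention.  With DEPALLOC set, a missing
 * entry is allocated, so the caller may rely on the returned pointer;
 * the return value only reports whether the entry already existed.
 */
#if 0
	struct inodedep *inodedep;

	ACQUIRE_LOCK(&lk);		/* splbio interlock required */
	if (inodedep_lookup(fs, inum, DEPALLOC, &inodedep) == 0) {
		/* freshly allocated entry: initialize its dependencies */
	}
	FREE_LOCK(&lk);
#endif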

SIPHASH_KEY softdep_hashkey;

/*
 * Structures and routines associated with pagedep caching.
 */
LIST_HEAD(pagedep_hashhead, pagedep) *pagedep_hashtbl;
u_long	pagedep_hash;		/* size of hash table - 1 */
STATIC struct sema pagedep_in_progress;

/*
 * Look up a pagedep. Return 1 if found, 0 if not found or found
 * when asked to allocate but not associated with any buffer.
 * If not found, allocate if DEPALLOC flag is passed.
 * Found or allocated entry is returned in pagedeppp.
 * This routine must be called with splbio interrupts blocked.
 */
STATIC int
pagedep_lookup(struct inode *ip, daddr_t lbn, int flags,
    struct pagedep **pagedeppp)
{
	SIPHASH_CTX ctx;
	struct pagedep *pagedep;
	struct pagedep_hashhead *pagedephd;
	struct mount *mp;
	int i;

	splassert(IPL_BIO);

#ifdef DEBUG
	if (lk.lkt_held == -1)
		panic("pagedep_lookup: lock not held");
#endif
	mp = ITOV(ip)->v_mount;

	SipHash24_Init(&ctx, &softdep_hashkey);
	SipHash24_Update(&ctx, &mp, sizeof(mp));
	SipHash24_Update(&ctx, &ip->i_number, sizeof(ip->i_number));
	SipHash24_Update(&ctx, &lbn, sizeof(lbn));
	pagedephd = &pagedep_hashtbl[SipHash24_End(&ctx) & pagedep_hash];
top:
	LIST_FOREACH(pagedep, pagedephd, pd_hash)
		if (ip->i_number == pagedep->pd_ino &&
		    lbn == pagedep->pd_lbn &&
		    mp == pagedep->pd_mnt)
			break;
	if (pagedep) {
		*pagedeppp = pagedep;
		if ((flags & DEPALLOC) != 0 &&
		    (pagedep->pd_state & ONWORKLIST) == 0)
			return (0);
		return (1);
	}
	if ((flags & DEPALLOC) == 0) {
		*pagedeppp = NULL;
		return (0);
	}
	if (sema_get(&pagedep_in_progress, &lk) == 0) {
		ACQUIRE_LOCK(&lk);
		goto top;
	}
	pagedep = pool_get(&pagedep_pool, PR_WAITOK | PR_ZERO);
	pagedep->pd_list.wk_type = D_PAGEDEP;
	pagedep->pd_mnt = mp;
	pagedep->pd_ino = ip->i_number;
	pagedep->pd_lbn = lbn;
	LIST_INIT(&pagedep->pd_dirremhd);
	LIST_INIT(&pagedep->pd_pendinghd);
	for (i = 0; i < DAHASHSZ; i++)
		LIST_INIT(&pagedep->pd_diraddhd[i]);
	ACQUIRE_LOCK(&lk);
	LIST_INSERT_HEAD(pagedephd, pagedep, pd_hash);
	sema_release(&pagedep_in_progress);
	*pagedeppp = pagedep;
	return (0);
}

/*
 * Structures and routines associated with inodedep caching.
 */
LIST_HEAD(inodedep_hashhead, inodedep) *inodedep_hashtbl;
STATIC u_long	inodedep_hash;	/* size of hash table - 1 */
STATIC long	num_inodedep;	/* number of inodedep allocated */
STATIC struct sema inodedep_in_progress;

/*
 * Look up an inodedep. Return 1 if found, 0 if not found.
 * If not found, allocate if DEPALLOC flag is passed.
 * Found or allocated entry is returned in inodedeppp.
 * This routine must be called with splbio interrupts blocked.
 */
STATIC int
inodedep_lookup(struct fs *fs, ufsino_t inum, int flags,
    struct inodedep **inodedeppp)
{
	SIPHASH_CTX ctx;
	struct inodedep *inodedep;
	struct inodedep_hashhead *inodedephd;
	int firsttry;

	splassert(IPL_BIO);

#ifdef DEBUG
	if (lk.lkt_held == -1)
		panic("inodedep_lookup: lock not held");
#endif
	firsttry = 1;
	SipHash24_Init(&ctx, &softdep_hashkey);
	SipHash24_Update(&ctx, &fs, sizeof(fs));
	SipHash24_Update(&ctx, &inum, sizeof(inum));
	inodedephd = &inodedep_hashtbl[SipHash24_End(&ctx) & inodedep_hash];
top:
	LIST_FOREACH(inodedep, inodedephd, id_hash)
		if (inum == inodedep->id_ino && fs == inodedep->id_fs)
			break;
	if (inodedep) {
		*inodedeppp = inodedep;
		return (1);
	}
	if ((flags & DEPALLOC) == 0) {
		*inodedeppp = NULL;
		return (0);
	}
	/*
	 * If we are over our limit, try to improve the situation.
	 */
	if (num_inodedep > max_softdeps && firsttry && (flags & NODELAY) == 0 &&
	    request_cleanup(FLUSH_INODES, 1)) {
		firsttry = 0;
		goto top;
	}
	if (sema_get(&inodedep_in_progress, &lk) == 0) {
		ACQUIRE_LOCK(&lk);
		goto top;
	}
	num_inodedep += 1;
	inodedep = pool_get(&inodedep_pool, PR_WAITOK);
	inodedep->id_list.wk_type = D_INODEDEP;
	inodedep->id_fs = fs;
	inodedep->id_ino = inum;
	inodedep->id_state = ALLCOMPLETE;
	inodedep->id_nlinkdelta = 0;
	inodedep->id_savedino1 = NULL;
	inodedep->id_savedsize = -1;
	inodedep->id_buf = NULL;
	LIST_INIT(&inodedep->id_pendinghd);
	LIST_INIT(&inodedep->id_inowait);
	LIST_INIT(&inodedep->id_bufwait);
	TAILQ_INIT(&inodedep->id_inoupdt);
	TAILQ_INIT(&inodedep->id_newinoupdt);
	ACQUIRE_LOCK(&lk);
	LIST_INSERT_HEAD(inodedephd, inodedep, id_hash);
	sema_release(&inodedep_in_progress);
	*inodedeppp = inodedep;
	return (0);
}

/*
 * Structures and routines associated with newblk caching.
 */
LIST_HEAD(newblk_hashhead, newblk) *newblk_hashtbl;
u_long	newblk_hash;		/* size of hash table - 1 */
STATIC struct sema newblk_in_progress;

/*
 * Look up a newblk. Return 1 if found, 0 if not found.
 * If not found, allocate if DEPALLOC flag is passed.
 * Found or allocated entry is returned in newblkpp.
 */
STATIC int
newblk_lookup(struct fs *fs, daddr_t newblkno, int flags,
    struct newblk **newblkpp)
{
	SIPHASH_CTX ctx;
	struct newblk *newblk;
	struct newblk_hashhead *newblkhd;

	SipHash24_Init(&ctx, &softdep_hashkey);
	SipHash24_Update(&ctx, &fs, sizeof(fs));
	SipHash24_Update(&ctx, &newblkno, sizeof(newblkno));
	newblkhd = &newblk_hashtbl[SipHash24_End(&ctx) & newblk_hash];
top:
	LIST_FOREACH(newblk, newblkhd, nb_hash)
		if (newblkno == newblk->nb_newblkno && fs == newblk->nb_fs)
			break;
	if (newblk) {
		*newblkpp = newblk;
		return (1);
	}
	if ((flags & DEPALLOC) == 0) {
		*newblkpp = NULL;
		return (0);
	}
	if (sema_get(&newblk_in_progress, NULL) == 0)
		goto top;
	newblk = pool_get(&newblk_pool, PR_WAITOK);
	newblk->nb_state = 0;
	newblk->nb_fs = fs;
	newblk->nb_newblkno = newblkno;
	LIST_INSERT_HEAD(newblkhd, newblk, nb_hash);
	sema_release(&newblk_in_progress);
	*newblkpp = newblk;
	return (0);
}

/*
 * Executed during filesystem system initialization before
 * mounting any file systems.
 */
void
softdep_initialize(void)
{

	bioops.io_start = softdep_disk_io_initiation;
	bioops.io_complete = softdep_disk_write_complete;
	bioops.io_deallocate = softdep_deallocate_dependencies;
	bioops.io_movedeps = softdep_move_dependencies;
	bioops.io_countdeps = softdep_count_dependencies;

	LIST_INIT(&mkdirlisthd);
	LIST_INIT(&softdep_workitem_pending);
#ifdef KMEMSTATS
	max_softdeps = min(initialvnodes * 8,
	    kmemstats[M_INODEDEP].ks_limit / (2 * sizeof(struct inodedep)));
#else
	max_softdeps = initialvnodes * 4;
#endif
	arc4random_buf(&softdep_hashkey, sizeof(softdep_hashkey));
	pagedep_hashtbl = hashinit(initialvnodes / 5, M_PAGEDEP, M_WAITOK,
	    &pagedep_hash);
	sema_init(&pagedep_in_progress, "pagedep", PRIBIO);
	inodedep_hashtbl = hashinit(initialvnodes, M_INODEDEP, M_WAITOK,
	    &inodedep_hash);
	sema_init(&inodedep_in_progress, "inodedep", PRIBIO);
	newblk_hashtbl = hashinit(64, M_NEWBLK, M_WAITOK, &newblk_hash);
	sema_init(&newblk_in_progress, "newblk", PRIBIO);
	timeout_set(&proc_waiting_timeout, pause_timer, NULL);
	pool_init(&pagedep_pool, sizeof(struct pagedep), 0, IPL_NONE,
	    PR_WAITOK, "pagedep", NULL);
	pool_init(&inodedep_pool, sizeof(struct inodedep), 0, IPL_NONE,
	    PR_WAITOK, "inodedep", NULL);
	pool_init(&newblk_pool, sizeof(struct newblk), 0, IPL_NONE,
	    PR_WAITOK, "newblk", NULL);
	pool_init(&bmsafemap_pool, sizeof(struct bmsafemap), 0, IPL_NONE,
	    PR_WAITOK, "bmsafemap", NULL);
	pool_init(&allocdirect_pool, sizeof(struct allocdirect), 0, IPL_NONE,
	    PR_WAITOK, "allocdir", NULL);
	pool_init(&indirdep_pool, sizeof(struct indirdep), 0, IPL_NONE,
	    PR_WAITOK, "indirdep", NULL);
	pool_init(&allocindir_pool, sizeof(struct allocindir), 0, IPL_NONE,
	    PR_WAITOK, "allocindir", NULL);
	pool_init(&freefrag_pool, sizeof(struct freefrag), 0, IPL_NONE,
	    PR_WAITOK, "freefrag", NULL);
	pool_init(&freeblks_pool, sizeof(struct freeblks), 0, IPL_NONE,
	    PR_WAITOK, "freeblks", NULL);
	pool_init(&freefile_pool, sizeof(struct freefile), 0, IPL_NONE,
	    PR_WAITOK, "freefile", NULL);
	pool_init(&diradd_pool, sizeof(struct diradd), 0, IPL_NONE,
	    PR_WAITOK, "diradd", NULL);
	pool_init(&mkdir_pool, sizeof(struct mkdir), 0, IPL_NONE,
	    PR_WAITOK, "mkdir", NULL);
	pool_init(&dirrem_pool, sizeof(struct dirrem), 0, IPL_NONE,
	    PR_WAITOK, "dirrem", NULL);
	pool_init(&newdirblk_pool, sizeof(struct newdirblk), 0, IPL_NONE,
	    PR_WAITOK, "newdirblk", NULL);
}

/*
 * Called at mount time to notify the dependency code that a
 * filesystem wishes to use it.
 */
int
softdep_mount(struct vnode *devvp, struct mount *mp, struct fs *fs,
    struct ucred *cred)
{
	struct csum_total cstotal;
	struct cg *cgp;
	struct buf *bp;
	int error, cyl;

	KASSERTMSG(1, "softdep_mount should not have been called");

	/*
	 * When doing soft updates, the counters in the
	 * superblock may have gotten out of sync, so we have
	 * to scan the cylinder groups and recalculate them.
	 */
	if ((fs->fs_flags & FS_UNCLEAN) == 0)
		return (0);
	memset(&cstotal, 0, sizeof(cstotal));
	for (cyl = 0; cyl < fs->fs_ncg; cyl++) {
		if ((error = bread(devvp, fsbtodb(fs, cgtod(fs, cyl)),
		    fs->fs_cgsize, &bp)) != 0) {
			brelse(bp);
			return (error);
		}
		cgp = (struct cg *)bp->b_data;
		cstotal.cs_nffree += cgp->cg_cs.cs_nffree;
		cstotal.cs_nbfree += cgp->cg_cs.cs_nbfree;
		cstotal.cs_nifree += cgp->cg_cs.cs_nifree;
		cstotal.cs_ndir += cgp->cg_cs.cs_ndir;
		fs->fs_cs(fs, cyl) = cgp->cg_cs;
		brelse(bp);
	}
#ifdef DEBUG
	if (memcmp(&cstotal, &fs->fs_cstotal, sizeof(cstotal)))
		printf("ffs_mountfs: superblock updated for soft updates\n");
#endif
	memcpy(&fs->fs_cstotal, &cstotal, sizeof(cstotal));
	return (0);
}

1259/*
1260 * Protecting the freemaps (or bitmaps).
1261 *
1262 * To eliminate the need to execute fsck before mounting a file system
1263 * after a power failure, one must (conservatively) guarantee that the
1264 * on-disk copy of the bitmaps never indicate that a live inode or block is
1265 * free. So, when a block or inode is allocated, the bitmap should be
1266 * updated (on disk) before any new pointers. When a block or inode is
1267 * freed, the bitmap should not be updated until all pointers have been
1268 * reset. The latter dependency is handled by the delayed de-allocation
1269 * approach described below for block and inode de-allocation. The former
1270 * dependency is handled by calling the following procedure when a block or
1271 * inode is allocated. When an inode is allocated an "inodedep" is created
1272 * with its DEPCOMPLETE flag cleared until its bitmap is written to disk.
1273 * Each "inodedep" is also inserted into the hash indexing structure so
1274 * that any additional link additions can be made dependent on the inode
1275 * allocation.
1276 *
1277 * The ufs file system maintains a number of free block counts (e.g., per
1278 * cylinder group, per cylinder and per <cylinder, rotational position> pair)
1279 * in addition to the bitmaps. These counts are used to improve efficiency
1280 * during allocation and therefore must be consistent with the bitmaps.
1281 * There is no convenient way to guarantee post-crash consistency of these
1282 * counts with simple update ordering, for two main reasons: (1) The counts
1283 * and bitmaps for a single cylinder group block are not in the same disk
1284 * sector. If a disk write is interrupted (e.g., by power failure), one may
1285 * be written and the other not. (2) Some of the counts are located in the
1286 * superblock rather than the cylinder group block. So, we focus our soft
1287 * updates implementation on protecting the bitmaps. When mounting a
1288 * filesystem, we recompute the auxiliary counts from the bitmaps.
1289 */
1290
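The mount-time recount performed by softdep_mount() above can be sketched in
isolation. The following is a minimal userspace illustration, not kernel code:
because the ordering rules protect the bitmaps the per-cylinder-group summaries
are derived from, the aggregate totals can simply be re-summed from them.
"struct cg_sum" and its fields are stand-ins for the kernel's fs/cg structures.

#include <stddef.h>

struct cg_sum { long nffree, nbfree, nifree, ndir; };

/* Rebuild the aggregate totals from the trusted per-group summaries. */
static struct cg_sum
recount(const struct cg_sum *cgs, size_t ncg)
{
	struct cg_sum total = { 0, 0, 0, 0 };
	size_t i;

	for (i = 0; i < ncg; i++) {
		total.nffree += cgs[i].nffree;	/* free fragments */
		total.nbfree += cgs[i].nbfree;	/* free full blocks */
		total.nifree += cgs[i].nifree;	/* free inodes */
		total.ndir += cgs[i].ndir;	/* allocated directories */
	}
	return (total);
}
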
1291/*
1292 * Called just after updating the cylinder group block to allocate an inode.
1293 */
1294/* buffer for cylgroup block with inode map */
1295/* inode related to allocation */
1296/* new inode number being allocated */
1297void
1298softdep_setup_inomapdep(struct buf *bp, struct inode *ip, ufsino_t newinum)
1299{
1300 struct inodedep *inodedep;
1301 struct bmsafemap *bmsafemap;
1302
1303 /*
1304 * Create a dependency for the newly allocated inode.
1305 * Panic if it already exists, as something is seriously wrong.
1306 * Otherwise add it to the dependency list for the buffer holding
1307 * the cylinder group map from which it was allocated.
1308 */
1309 ACQUIRE_LOCK(&lk);
1310 if (inodedep_lookup(ip->i_fs, newinum, DEPALLOC | NODELAY, &inodedep)
1311 != 0) {
1312 FREE_LOCK(&lk);
1313 panic("softdep_setup_inomapdep: found inode");
1314 }
1315 inodedep->id_buf = bp;
1316 inodedep->id_state &= ~DEPCOMPLETE;
1317 bmsafemap = bmsafemap_lookup(bp);
1318 LIST_INSERT_HEAD(&bmsafemap->sm_inodedephd, inodedep, id_deps);
1319 FREE_LOCK(&lk);
1320}
1321
1322/*
1323 * Called just after updating the cylinder group block to
1324 * allocate block or fragment.
1325 */
1326/* buffer for cylgroup block with block map */
1327/* filesystem doing allocation */
1328/* number of newly allocated block */
1329void
1330softdep_setup_blkmapdep(struct buf *bp, struct fs *fs, daddr_t newblkno)
1331{
1332 struct newblk *newblk;
1333 struct bmsafemap *bmsafemap;
1334
1335 /*
1336 * Create a dependency for the newly allocated block.
1337 * Add it to the dependency list for the buffer holding
1338 * the cylinder group map from which it was allocated.
1339 */
1340 if (newblk_lookup(fs, newblkno, DEPALLOC, &newblk) != 0)
1341 panic("softdep_setup_blkmapdep: found block");
1342 ACQUIRE_LOCK(&lk);
1343 newblk->nb_bmsafemap = bmsafemap = bmsafemap_lookup(bp);
1344 LIST_INSERT_HEAD(&bmsafemap->sm_newblkhd, newblk, nb_deps);
1345 FREE_LOCK(&lk);
1346}
1347
1348/*
1349 * Find the bmsafemap associated with a cylinder group buffer.
1350 * If none exists, create one. The buffer must be locked when
1351 * this routine is called and this routine must be called with
1352 * splbio interrupts blocked.
1353 */
1354STATIC struct bmsafemap *
1355bmsafemap_lookup(struct buf *bp)
1356{
1357 struct bmsafemap *bmsafemap;
1358 struct worklist *wk;
1359
1360 splassert(IPL_BIO);
1361
1362#ifdef DEBUG
1363 if (lk.lkt_held == -1)
1364 panic("bmsafemap_lookup: lock not held");
1365#endif
1366 LIST_FOREACH(wk, &bp->b_dep, wk_list)
1367 if (wk->wk_type == D_BMSAFEMAP)
1368 return (WK_BMSAFEMAP(wk));
1369 FREE_LOCK(&lk);
1370 bmsafemap = pool_get(&bmsafemap_pool, PR_WAITOK);
1371 bmsafemap->sm_list.wk_type = D_BMSAFEMAP;
1372 bmsafemap->sm_list.wk_state = 0;
1373 bmsafemap->sm_buf = bp;
1374 LIST_INIT(&bmsafemap->sm_allocdirecthd);
1375 LIST_INIT(&bmsafemap->sm_allocindirhd);
1376 LIST_INIT(&bmsafemap->sm_inodedephd);
1377 LIST_INIT(&bmsafemap->sm_newblkhd);
1378 ACQUIRE_LOCK(&lk);
1379 WORKLIST_INSERT(&bp->b_dep, &bmsafemap->sm_list);
1380 return (bmsafemap);
1381}
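
bmsafemap_lookup() above is a find-or-create on an intrusive list: scan under
the lock, and if nothing is found, drop the lock around the sleeping pool
allocation, then retake it to link the new entry. A minimal userspace sketch
of the same shape follows, with a pthread mutex standing in for the splbio
interrupt lock and malloc(3) for pool_get(); all names here are hypothetical.
Note that, as in the kernel routine, the list is not re-scanned after the lock
is retaken -- in the kernel, the caller's locked buffer is what makes that safe.

#include <sys/queue.h>
#include <pthread.h>
#include <stdlib.h>

struct dep {
	int key;
	LIST_ENTRY(dep) entries;
};
LIST_HEAD(dephead, dep);

static pthread_mutex_t lk = PTHREAD_MUTEX_INITIALIZER;

/* Find the entry with the given key, creating it if absent.
 * Called with lk held; returns with lk held. */
static struct dep *
dep_lookup(struct dephead *head, int key)
{
	struct dep *d;

	LIST_FOREACH(d, head, entries)
		if (d->key == key)
			return (d);
	pthread_mutex_unlock(&lk);	/* drop lock across allocation */
	if ((d = malloc(sizeof(*d))) == NULL)
		abort();		/* sketch: no error path */
	d->key = key;
	pthread_mutex_lock(&lk);	/* retake before linking */
	LIST_INSERT_HEAD(head, d, entries);
	return (d);
}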
1382
1383/*
1384 * Direct block allocation dependencies.
1385 *
1386 * When a new block is allocated, the corresponding disk locations must be
1387 * initialized (with zeros or new data) before the on-disk inode points to
1388 * them. Also, the freemap from which the block was allocated must be
1389 * updated (on disk) before the inode's pointer. These two dependencies are
1390 * independent of each other and are needed for all file blocks and indirect
1391 * blocks that are pointed to directly by the inode. Just before the
1392 * "in-core" version of the inode is updated with a newly allocated block
1393 * number, a procedure (below) is called to set up allocation dependency
1394 * structures. These structures are removed when the corresponding
1395 * dependencies are satisfied or when the block allocation becomes obsolete
1396 * (i.e., the file is deleted, the block is de-allocated, or the block is a
1397 * fragment that gets upgraded). All of these cases are handled in
1398 * procedures described later.
1399 *
1400 * When a file extension causes a fragment to be upgraded, either to a larger
1401 * fragment or to a full block, the on-disk location may change (if the
1402 * previous fragment could not simply be extended). In this case, the old
1403 * fragment must be de-allocated, but not until after the inode's pointer has
1404 * been updated. In most cases, this is handled by later procedures, which
1405 * will construct a "freefrag" structure to be added to the workitem queue
1406 * when the inode update is complete (or obsolete). The main exception to
1407 * this is when an allocation occurs while a pending allocation dependency
1408 * (for the same block pointer) remains. This case is handled in the main
1409 * allocation dependency setup procedure by immediately freeing the
1410 * unreferenced fragments.
1411 */
1412/* inode to which block is being added */
1413/* block pointer within inode */
1414/* disk block number being added */
1415/* previous block number, 0 unless frag */
1416/* size of new block */
1417 /* size of old block */
1418/* bp for allocated block */
1419void
1420softdep_setup_allocdirect(struct inode *ip, daddr_t lbn, daddr_t newblkno,
1421 daddr_t oldblkno, long newsize, long oldsize, struct buf *bp)
1422{
1423 struct allocdirect *adp, *oldadp;
1424 struct allocdirectlst *adphead;
1425 struct bmsafemap *bmsafemap;
1426 struct inodedep *inodedep;
1427 struct pagedep *pagedep;
1428 struct newblk *newblk;
1429
1430 adp = pool_get(&allocdirect_pool, PR_WAITOK | PR_ZERO);
1431 adp->ad_list.wk_type = D_ALLOCDIRECT;
1432 adp->ad_lbn = lbn;
1433 adp->ad_newblkno = newblkno;
1434 adp->ad_oldblkno = oldblkno;
1435 adp->ad_newsize = newsize;
1436 adp->ad_oldsize = oldsize;
1437 adp->ad_state = ATTACHED;
1438 LIST_INIT(&adp->ad_newdirblk);
1439 if (newblkno == oldblkno)
1440 adp->ad_freefrag = NULL;
1441 else
1442 adp->ad_freefrag = newfreefrag(ip, oldblkno, oldsize);
1443
1444 if (newblk_lookup(ip->i_fs, newblkno, 0, &newblk) == 0)
1445 panic("softdep_setup_allocdirect: lost block");
1446
1447 ACQUIRE_LOCK(&lk);
1448 inodedep_lookup(ip->i_fs, ip->i_number, DEPALLOC | NODELAY, &inodedep);
1449 adp->ad_inodedep = inodedep;
1450
1451 if (newblk->nb_state == DEPCOMPLETE) {
1452 adp->ad_state |= DEPCOMPLETE;
1453 adp->ad_buf = NULL;
1454 } else {
1455 bmsafemap = newblk->nb_bmsafemap;
1456 adp->ad_buf = bmsafemap->sm_buf;
1457 LIST_REMOVE(newblk, nb_deps);
1458 LIST_INSERT_HEAD(&bmsafemap->sm_allocdirecthd, adp, ad_deps);
1459 }
1460 LIST_REMOVE(newblk, nb_hash);
1461 pool_put(&newblk_pool, newblk);
1462
1463 if (bp == NULL) {
1464 /*
1465 * XXXUBC - Yes, I know how to fix this, but not right now.
1466 */
1467 panic("softdep_setup_allocdirect: Bonk art in the head");
1468 }
1469 WORKLIST_INSERT(&bp->b_dep, &adp->ad_list);
1470 if (lbn >= NDADDR) {
1471 /* allocating an indirect block */
1472 if (oldblkno != 0) {
1473 FREE_LOCK(&lk);
1474 panic("softdep_setup_allocdirect: non-zero indir");
1475 }
1476 } else {
1477 /*
1478 * Allocating a direct block.
1479 *
1480 * If we are allocating a directory block, then we must
1481 * allocate an associated pagedep to track additions and
1482 * deletions.
1483 */
1484 if ((DIP(ip, mode) & IFMT) == IFDIR &&
1485 pagedep_lookup(ip, lbn, DEPALLOC, &pagedep) == 0)
1486 WORKLIST_INSERT(&bp->b_dep, &pagedep->pd_list);
1487 }
1488 /*
1489 * The list of allocdirects must be kept in sorted and ascending
1490 * order so that the rollback routines can quickly determine the
1491 * first uncommitted block (the size of the file stored on disk
1492 * ends at the end of the lowest committed fragment, or if there
1493 * are no fragments, at the end of the highest committed block).
1494 * Since files generally grow, the typical case is that the new
1495 * block is to be added at the end of the list. We speed this
1496 * special case by checking against the last allocdirect in the
1497 * list before laboriously traversing the list looking for the
1498 * insertion point.
1499 */
1500 adphead = &inodedep->id_newinoupdt;
1501 oldadp = TAILQ_LAST(adphead, allocdirectlst);
1502 if (oldadp == NULL || oldadp->ad_lbn <= lbn) {
1503 /* insert at end of list */
1504 TAILQ_INSERT_TAIL(adphead, adp, ad_next);
1505 if (oldadp != NULL && oldadp->ad_lbn == lbn)
1506 allocdirect_merge(adphead, adp, oldadp);
1507 FREE_LOCK(&lk);
1508 return;
1509 }
1510 TAILQ_FOREACH(oldadp, adphead, ad_next) {
1511 if (oldadp->ad_lbn >= lbn)
1512 break;
1513 }
1514 if (oldadp == NULL) {
1515 FREE_LOCK(&lk);
1516 panic("softdep_setup_allocdirect: lost entry");
1517 }
1518 /* insert in middle of list */
1519 TAILQ_INSERT_BEFORE(oldadp, adp, ad_next);
1520 if (oldadp->ad_lbn == lbn)
1521 allocdirect_merge(adphead, adp, oldadp);
1522 FREE_LOCK(&lk);
1523}
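
The sorted insert described in the comment above (check the tail first, walk
the list only on the slow path) is a generally useful pattern. Here is a
hedged userspace sketch using <sys/queue.h>, where "struct node" and "key"
are stand-ins for struct allocdirect and ad_lbn:

#include <sys/queue.h>

struct node {
	long key;			/* stands in for ad_lbn */
	TAILQ_ENTRY(node) entries;
};
TAILQ_HEAD(nodelist, node);

static void
sorted_insert(struct nodelist *head, struct node *np)
{
	struct node *it = TAILQ_LAST(head, nodelist);

	/* Fast path: files usually grow, so the tail usually wins. */
	if (it == NULL || it->key <= np->key) {
		TAILQ_INSERT_TAIL(head, np, entries);
		return;
	}
	/* Slow path: find the first entry whose key is >= ours. */
	TAILQ_FOREACH(it, head, entries)
		if (it->key >= np->key)
			break;
	TAILQ_INSERT_BEFORE(it, np, entries);
}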
1524
1525/*
1526 * Replace an old allocdirect dependency with a newer one.
1527 * This routine must be called with splbio interrupts blocked.
1528 */
1529/* head of list holding allocdirects */
1530/* allocdirect being added */
1531/* existing allocdirect being checked */
1532STATIC void
1533allocdirect_merge(struct allocdirectlst *adphead, struct allocdirect *newadp,
1534 struct allocdirect *oldadp)
1535{
1536 struct worklist *wk;
1537 struct freefrag *freefrag;
1538 struct newdirblk *newdirblk;
1539
1540 splassert(IPL_BIO);
1541
1542#ifdef DEBUG
1543 if (lk.lkt_held == -1)
1544 panic("allocdirect_merge: lock not held");
1545#endif
1546 if (newadp->ad_oldblkno != oldadp->ad_newblkno ||
1547 newadp->ad_oldsize != oldadp->ad_newsize ||
1548 newadp->ad_lbn >= NDADDR) {
1549 FREE_LOCK(&lk);
1550 panic("allocdirect_merge: old %lld != new %lld || lbn %lld >= "
1551 "%d", (long long)newadp->ad_oldblkno,
1552 (long long)oldadp->ad_newblkno, (long long)newadp->ad_lbn,
1553 NDADDR);
1554 }
1555 newadp->ad_oldblkno = oldadp->ad_oldblkno;
1556 newadp->ad_oldsize = oldadp->ad_oldsize;
1557 /*
1558 * If the old dependency had a fragment to free or had never
1559 * previously had a block allocated, then the new dependency
1560 * can immediately post its freefrag and adopt the old freefrag.
1561 * This action is done by swapping the freefrag dependencies.
1562 * The new dependency gains the old one's freefrag, and the
1563 * old one gets the new one and then immediately puts it on
1564 * the worklist when it is freed by free_allocdirect. It is
1565 * not possible to do this swap when the old dependency had a
1566 * non-zero size but no previous fragment to free. This condition
1567 * arises when the new block is an extension of the old block.
1568 * Here, the first part of the fragment allocated to the new
1569 * dependency is part of the block currently claimed on disk by
1570 * the old dependency, so cannot legitimately be freed until the
1571 * conditions for the new dependency are fulfilled.
1572 */
1573 if (oldadp->ad_freefrag != NULL || oldadp->ad_oldblkno == 0) {
1574 freefrag = newadp->ad_freefrag;
1575 newadp->ad_freefrag = oldadp->ad_freefrag;
1576 oldadp->ad_freefrag = freefrag;
1577 }
1578 /*
1579 * If we are tracking a new directory-block allocation,
1580 * move it from the old allocdirect to the new allocdirect.
1581 */
1582 if ((wk = LIST_FIRST(&oldadp->ad_newdirblk)) != NULL) {
1583 newdirblk = WK_NEWDIRBLK(wk);
1584 WORKLIST_REMOVE(&newdirblk->db_list);
1585 if (LIST_FIRST(&oldadp->ad_newdirblk) != NULL)
1586 panic("allocdirect_merge: extra newdirblk");
1587 WORKLIST_INSERT(&newadp->ad_newdirblk, &newdirblk->db_list);
1588 }
1589 free_allocdirect(adphead, oldadp, 0);
1590}
1591
1592/*
1593 * Allocate a new freefrag structure if needed.
1594 */
1595STATIC struct freefrag *
1596newfreefrag(struct inode *ip, daddr_t blkno, long size)
1597{
1598 struct freefrag *freefrag;
1599 struct fs *fs;
1600
1601 if (blkno == 0)
1602 return (NULL);
1603 fs = ip->i_fs;
1604 if (fragnum(fs, blkno) + numfrags(fs, size) > fs->fs_frag)
1605 panic("newfreefrag: frag size");
1606 freefrag = pool_get(&freefrag_pool, PR_WAITOK);
1607 freefrag->ff_list.wk_type = D_FREEFRAG;
1608 freefrag->ff_state = DIP(ip, uid) & ~ONWORKLIST; /* used below */
1609 freefrag->ff_inum = ip->i_number;
1610 freefrag->ff_mnt = ITOV(ip)->v_mount;
1611 freefrag->ff_devvp = ip->i_devvp;
1612 freefrag->ff_blkno = blkno;
1613 freefrag->ff_fragsize = size;
1614 return (freefrag);
1615}
1616
1617/*
1618 * This workitem de-allocates fragments that were replaced during
1619 * file block allocation.
1620 */
1621STATIC void
1622handle_workitem_freefrag(struct freefrag *freefrag)
1623{
1624 struct inode tip;
1625 struct ufs1_dinode dtip1;
1626
1627 tip.i_vnode = NULL;
1628 tip.i_din1 = &dtip1;
1629 tip.i_fs = VFSTOUFS(freefrag->ff_mnt)->um_fs;
1630 tip.i_ump = VFSTOUFS(freefrag->ff_mnt);
1631 tip.i_dev = freefrag->ff_devvp->v_rdev;
1632 tip.i_number = freefrag->ff_inum;
1633 tip.i_ffs1_uid = freefrag->ff_state & ~ONWORKLIST; /* set above */
1634 ffs_blkfree(&tip, freefrag->ff_blkno, freefrag->ff_fragsize);
1635 pool_put(&freefrag_pool, freefrag);
1636}
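
The paired "used below" / "set above" comments mark a small trick worth
spelling out: newfreefrag() stashes the file's uid in the work item's state
word while the freefrag waits on the queue, masking off ONWORKLIST so the one
flag bit the queue code needs stays usable. A minimal sketch of the idea
follows, with hypothetical names, and with the caveat that it only works
while the stored value never collides with the flag bits:

#define ONWORKLIST	0x8000

struct workitem {
	unsigned int state;		/* flag bit + smuggled value */
};

static void
stash_uid(struct workitem *wi, unsigned int uid)
{
	wi->state = uid & ~ONWORKLIST;		/* "used below" */
}

static unsigned int
fetch_uid(const struct workitem *wi)
{
	return (wi->state & ~ONWORKLIST);	/* "set above" */
}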
1637
1638/*
1639 * Indirect block allocation dependencies.
1640 *
1641 * The same dependencies that exist for a direct block also exist when
1642 * a new block is allocated and pointed to by an entry in a block of
1643 * indirect pointers. The undo/redo states described above are also
1644 * used here. Because an indirect block contains many pointers that
1645 * may have dependencies, a second copy of the entire in-memory indirect
1646 * block is kept. The buffer cache copy is always completely up-to-date.
1647 * The second copy, which is used only as a source for disk writes,
1648 * contains only the safe pointers (i.e., those that have no remaining
1649 * update dependencies). The second copy is freed when all pointers
1650 * are safe. The cache is not allowed to replace indirect blocks with
1651 * pending update dependencies. If a buffer containing an indirect
1652 * block with dependencies is written, these routines will mark it
1653 * dirty again. It can only be successfully written once all the
1654 * dependencies are removed. The ffs_fsync routine, in conjunction with
1655 * softdep_sync_metadata, works to get all the dependencies
1656 * removed so that a file can be successfully written to disk. Three
1657 * procedures are used when setting up indirect block pointer
1658 * dependencies. The division is necessary because of the organization
1659 * of the "balloc" routine and because of the distinction between file
1660 * pages and file metadata blocks.
1661 */
1662
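The two-copy scheme described above can be reduced to a few lines. Below is
an illustrative userspace sketch, not the kernel code: the live copy is what
the buffer cache sees, while the safe copy -- the one that would be handed to
the disk driver -- keeps the old pointer for any slot with an unsatisfied
dependency. All names are stand-ins.

#define NPTR	128

struct shadowed_indir {
	long live[NPTR];	/* buffer cache copy, always current */
	long safe[NPTR];	/* disk copy, only dependency-free pointers */
};

/* A slot gains a new pointer that still has an outstanding dependency:
 * the in-core copy advances, the disk copy keeps the old, safe value. */
static void
set_pending(struct shadowed_indir *si, int slot, long newp, long oldp)
{
	si->live[slot] = newp;
	si->safe[slot] = oldp;
}

/* The dependency is satisfied: the new pointer is now safe to write. */
static void
set_complete(struct shadowed_indir *si, int slot)
{
	si->safe[slot] = si->live[slot];
}
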
1663/*
1664 * Allocate a new allocindir structure.
1665 */
1666/* inode for file being extended */
1667/* offset of pointer in indirect block */
1668/* disk block number being added */
1669/* previous block number, 0 if none */
1670STATIC struct allocindir *
1671newallocindir(struct inode *ip, int ptrno, daddr_t newblkno,
1672 daddr_t oldblkno)
1673{
1674 struct allocindir *aip;
1675
1676 aip = pool_get(&allocindir_pool, PR_WAITOK | PR_ZERO);
1677 aip->ai_list.wk_type = D_ALLOCINDIR;
1678 aip->ai_state = ATTACHED;
1679 aip->ai_offset = ptrno;
1680 aip->ai_newblkno = newblkno;
1681 aip->ai_oldblkno = oldblkno;
1682 aip->ai_freefrag = newfreefrag(ip, oldblkno, ip->i_fs->fs_bsize);
1683 return (aip);
1684}
1685
1686/*
1687 * Called just before setting an indirect block pointer
1688 * to a newly allocated file page.
1689 */
1690/* inode for file being extended */
1691/* allocated block number within file */
1692/* buffer with indirect blk referencing page */
1693/* offset of pointer in indirect block */
1694/* disk block number being added */
1695/* previous block number, 0 if none */
1696/* buffer holding allocated page */
1697void
1698softdep_setup_allocindir_page(struct inode *ip, daddr_t lbn, struct buf *bp,
1699 int ptrno, daddr_t newblkno, daddr_t oldblkno, struct buf *nbp)
1700{
1701 struct allocindir *aip;
1702 struct pagedep *pagedep;
1703
1704 aip = newallocindir(ip, ptrno, newblkno, oldblkno);
1705 ACQUIRE_LOCK(&lk);
1706 /*
1707 * If we are allocating a directory page, then we must
1708 * allocate an associated pagedep to track additions and
1709 * deletions.
1710 */
1711 if ((DIP(ip, mode) & IFMT) == IFDIR &&
1712 pagedep_lookup(ip, lbn, DEPALLOC, &pagedep) == 0)
1713 WORKLIST_INSERT(&nbp->b_dep, &pagedep->pd_list);
1714 if (nbp == NULL) {
1715 /*
1716 * XXXUBC - Yes, I know how to fix this, but not right now.
1717 */
1718 panic("softdep_setup_allocindir_page: Bonk art in the head");
1719 }
1720 WORKLIST_INSERT(&nbp->b_dep, &aip->ai_list);
1721 FREE_LOCK(&lk);
1722 setup_allocindir_phase2(bp, ip, aip);
1723}
1724
1725/*
1726 * Called just before setting an indirect block pointer to a
1727 * newly allocated indirect block.
1728 */
1729/* newly allocated indirect block */
1730/* inode for file being extended */
1731/* indirect block referencing allocated block */
1732/* offset of pointer in indirect block */
1733/* disk block number being added */
1734void
1735softdep_setup_allocindir_meta(struct buf *nbp, struct inode *ip,
1736 struct buf *bp, int ptrno, daddr_t newblkno)
1737{
1738 struct allocindir *aip;
1739
1740 aip = newallocindir(ip, ptrno, newblkno, 0);
1741 ACQUIRE_LOCK(&lk);
1742 WORKLIST_INSERT(&nbp->b_dep, &aip->ai_list);
1743 FREE_LOCK(&lk);
1744 setup_allocindir_phase2(bp, ip, aip);
1745}
1746
1747/*
1748 * Called to finish the allocation of the "aip" allocated
1749 * by one of the two routines above.
1750 */
1751/* in-memory copy of the indirect block */
1752/* inode for file being extended */
1753/* allocindir allocated by the above routines */
1754STATIC void
1755setup_allocindir_phase2(struct buf *bp, struct inode *ip,
1756 struct allocindir *aip)
1757{
1758 struct worklist *wk;
1759 struct indirdep *indirdep, *newindirdep;
1760 struct bmsafemap *bmsafemap;
1761 struct allocindir *oldaip;
1762 struct freefrag *freefrag;
1763 struct newblk *newblk;
1764
1765 if (bp->b_lblkno >= 0)
1766 panic("setup_allocindir_phase2: not indir blk");
1767 for (indirdep = NULL, newindirdep = NULL; ; ) {
1768 ACQUIRE_LOCK(&lk);
1769 LIST_FOREACH(wk, &bp->b_dep, wk_list) {
1770 if (wk->wk_type != D_INDIRDEP)
1771 continue;
1772 indirdep = WK_INDIRDEP(wk);
1773 break;
1774 }
1775 if (indirdep == NULL && newindirdep) {
1776 indirdep = newindirdep;
1777 WORKLIST_INSERT(&bp->b_dep, &indirdep->ir_list);
1778 newindirdep = NULL;
1779 }
1780 FREE_LOCK(&lk);
1781 if (indirdep) {
1782 if (newblk_lookup(ip->i_fs, aip->ai_newblkno, 0,
1783 &newblk) == 0)
1784 panic("setup_allocindir: lost block");
1785 ACQUIRE_LOCK(&lk);
1786 if (newblk->nb_state == DEPCOMPLETE) {
1787 aip->ai_state |= DEPCOMPLETE;
1788 aip->ai_buf = NULL;
1789 } else {
1790 bmsafemap = newblk->nb_bmsafemap;
1791 aip->ai_buf = bmsafemap->sm_buf;
1792 LIST_REMOVE(newblk, nb_deps);
1793 LIST_INSERT_HEAD(&bmsafemap->sm_allocindirhd,
1794 aip, ai_deps);
1795 }
1796 LIST_REMOVE(newblk, nb_hash);
1797 pool_put(&newblk_pool, newblk);
1798 aip->ai_indirdep = indirdep;
1799 /*
1800 * Check to see if there is an existing dependency
1801 * for this block. If there is, merge the old
1802 * dependency into the new one.
1803 */
1804 if (aip->ai_oldblkno == 0)
1805 oldaip = NULL;
1806 else
1807
1808 LIST_FOREACH(oldaip, &indirdep->ir_deplisthd, ai_next)
1809 if (oldaip->ai_offset == aip->ai_offset)
1810 break;
1811 freefrag = NULL;
1812 if (oldaip != NULL) {
1813 if (oldaip->ai_newblkno != aip->ai_oldblkno) {
1814 FREE_LOCK(&lk);
1815 panic("setup_allocindir_phase2: blkno");
1816 }
1817 aip->ai_oldblkno = oldaip->ai_oldblkno;
1818 freefrag = aip->ai_freefrag;
1819 aip->ai_freefrag = oldaip->ai_freefrag;
1820 oldaip->ai_freefrag = NULL;
1821 free_allocindir(oldaip, NULL);
1822 }
1823 LIST_INSERT_HEAD(&indirdep->ir_deplisthd, aip, ai_next);
1824 if (ip->i_ump->um_fstype == UM_UFS1)
1825 ((int32_t *)indirdep->ir_savebp->b_data)
1826 [aip->ai_offset] = aip->ai_oldblkno;
1827 else
1828 ((int64_t *)indirdep->ir_savebp->b_data)
1829 [aip->ai_offset] = aip->ai_oldblkno;
1830 FREE_LOCK(&lk);
1831 if (freefrag != NULL)
1832 handle_workitem_freefrag(freefrag);
1833 }
1834 if (newindirdep) {
1835 if (indirdep->ir_savebp != NULL)
1836 brelse(newindirdep->ir_savebp);
1837 WORKITEM_FREE(newindirdep, D_INDIRDEP);
1838 }
1839 if (indirdep)
1840 break;
1841 newindirdep = pool_get(&indirdep_pool, PR_WAITOK);
1842 newindirdep->ir_list.wk_type = D_INDIRDEP;
1843 newindirdep->ir_state = ATTACHED;
1844 if (ip->i_ump->um_fstype == UM_UFS1)
1845 newindirdep->ir_state |= UFS1FMT;
1846 LIST_INIT(&newindirdep->ir_deplisthd);
1847 LIST_INIT(&newindirdep->ir_donehd);
1848 if (bp->b_blkno == bp->b_lblkno) {
1849 VOP_BMAP(bp->b_vp, bp->b_lblkno, NULL, &bp->b_blkno,
1850 NULL);
1851 }
1852 newindirdep->ir_savebp =
1853 getblk(ip->i_devvp, bp->b_blkno, bp->b_bcount, 0, INFSLP);
1854#if 0
1855 BUF_KERNPROC(newindirdep->ir_savebp);
1856#endif
1857 memcpy(newindirdep->ir_savebp->b_data, bp->b_data, bp->b_bcount);
1858 }
1859}
1860
1861/*
1862 * Block de-allocation dependencies.
1863 *
1864 * When blocks are de-allocated, the on-disk pointers must be nullified before
1865 * the blocks are made available for use by other files. (The true
1866 * requirement is that old pointers must be nullified before new on-disk
1867 * pointers are set. We chose this slightly more stringent requirement to
1868 * reduce complexity.) Our implementation handles this dependency by updating
1869 * the inode (or indirect block) appropriately but delaying the actual block
1870 * de-allocation (i.e., freemap and free space count manipulation) until
1871 * after the updated versions reach stable storage. After the disk is
1872 * updated, the blocks can be safely de-allocated whenever it is convenient.
1873 * This implementation handles only the common case of reducing a file's
1874 * length to zero. Other cases are handled by the conventional synchronous
1875 * write approach.
1876 *
1877 * The ffs implementation with which we worked double-checks
1878 * the state of the block pointers and file size as it reduces
1879 * a file's length. Some of this code is replicated here in our
1880 * soft updates implementation. The freeblks->fb_chkcnt field is
1881 * used to transfer a part of this information to the procedure
1882 * that eventually de-allocates the blocks.
1883 *
1884 * This routine should be called from the routine that shortens
1885 * a file's length, before the inode's size or block pointers
1886 * are modified. It will save the block pointer information for
1887 * later release and zero the inode so that the calling routine
1888 * can release it.
1889 */
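
The delayed de-allocation protocol above has two distinct steps that must not
be reordered. A hedged userspace sketch follows, with toy types standing in
for the inode and the freeblks work item:

#define NPTRS	12

struct toy_inode { long db[NPTRS]; };
struct toy_freework { long saved[NPTRS]; };

/* Step 1: capture the block pointers and nullify them in the inode.
 * This runs before the inode is written. */
static void
capture_and_zero(struct toy_inode *ip, struct toy_freework *fw)
{
	int i;

	for (i = 0; i < NPTRS; i++) {
		fw->saved[i] = ip->db[i];
		ip->db[i] = 0;
	}
}

/* Step 2: release the captured blocks.  This must run only after the
 * zeroed inode is known to be on stable storage. */
static void
release_blocks(struct toy_freework *fw, void (*blkfree)(long))
{
	int i;

	for (i = 0; i < NPTRS; i++)
		if (fw->saved[i] != 0)
			blkfree(fw->saved[i]);
}
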
1890/* The inode whose length is to be reduced */
1891/* The new length for the file */
1892void
1893softdep_setup_freeblocks(struct inode *ip, off_t length)
1894{
1895 struct freeblks *freeblks;
1896 struct inodedep *inodedep;
1897 struct allocdirect *adp;
1898 struct vnode *vp;
1899 struct buf *bp;
1900 struct fs *fs;
1901 int i, delay, error;
1902
1903 fs = ip->i_fs;
1904 if (length != 0)
1905 panic("softdep_setup_freeblocks: non-zero length");
1906 freeblks = pool_get(&freeblks_pool, PR_WAITOK | PR_ZERO);
1907 freeblks->fb_list.wk_type = D_FREEBLKS;
1908 freeblks->fb_state = ATTACHED;
1909 freeblks->fb_uid = DIP(ip, uid);
1910 freeblks->fb_previousinum = ip->i_number;
1911 freeblks->fb_devvp = ip->i_devvp;
1912 freeblks->fb_mnt = ITOV(ip)->v_mount;
1913 freeblks->fb_oldsize = DIP(ip, size);
1914 freeblks->fb_newsize = length;
1915 freeblks->fb_chkcnt = DIP(ip, blocks);
1916
1917 for (i = 0; i < NDADDR; i++) {
1918 freeblks->fb_dblks[i] = DIP(ip, db[i]);
1919 DIP_ASSIGN(ip, db[i], 0);
1920 }
1921
1922 for (i = 0; i < NIADDR; i++) {
1923 freeblks->fb_iblks[i] = DIP(ip, ib[i]);
1924 DIP_ASSIGN(ip, ib[i], 0);
1925 }
1926
1927 DIP_ASSIGN(ip, blocks, 0);
1928 DIP_ASSIGN(ip, size, 0);
1929
1930 /*
1931 * Push the zero'ed inode to its disk buffer so that we are free
1932 * to delete its dependencies below. Once the dependencies are gone
1933 * the buffer can be safely released.
1934 */
1935 if ((error = bread(ip->i_devvp,
1936 fsbtodb(fs, ino_to_fsba(fs, ip->i_number)),
1937 (int)fs->fs_bsize, &bp)) != 0)
1938 softdep_error("softdep_setup_freeblocks", error);
1939
1940 if (ip->i_ump->um_fstype == UM_UFS1)
1941 *((struct ufs1_dinode *) bp->b_data +
1942 ino_to_fsbo(fs, ip->i_number)) = *ip->i_din1;
1943 else
1944 *((struct ufs2_dinode *) bp->b_data +
1945 ino_to_fsbo(fs, ip->i_number)) = *ip->i_din2;
1946
1947 /*
1948 * Find and eliminate any inode dependencies.
1949 */
1950 ACQUIRE_LOCK(&lk);
1951 (void) inodedep_lookup(fs, ip->i_number, DEPALLOC, &inodedep);
1952 if ((inodedep->id_state & IOSTARTED) != 0) {
1953 FREE_LOCK(&lk);
1954 panic("softdep_setup_freeblocks: inode busy");
1955 }
1956 /*
1957 * Add the freeblks structure to the list of operations that
1958 * must await the zero'ed inode being written to disk. If we
1959 * still have a bitmap dependency (delay == 0), then the inode
1960 * has never been written to disk, so we can process the
1961 * freeblks below once we have deleted the dependencies.
1962 */
1963 delay = (inodedep->id_state & DEPCOMPLETE);
1964 if (delay)
1965 WORKLIST_INSERT(&inodedep->id_bufwait, &freeblks->fb_list);
1966 /*
1967 * Because the file length has been truncated to zero, any
1968 * pending block allocation dependency structures associated
1969 * with this inode are obsolete and can simply be de-allocated.
1970 * We must first merge the two dependency lists to get rid of
1971 * any duplicate freefrag structures, then purge the merged list.
1972 * If we still have a bitmap dependency, then the inode has never
1973 * been written to disk, so we can free any fragments without delay.
1974 */
1975 merge_inode_lists(inodedep);
1976 while ((adp = TAILQ_FIRST(&inodedep->id_inoupdt)) != NULL)
1977 free_allocdirect(&inodedep->id_inoupdt, adp, delay);
1978 FREE_LOCK(&lk);
1979 bdwrite(bp);
1980 /*
1981 * We must wait for any I/O in progress to finish so that
1982 * all potential buffers on the dirty list will be visible.
1983 * Once they are all there, walk the list and get rid of
1984 * any dependencies.
1985 */
1986 vp = ITOV(ip);
1987 ACQUIRE_LOCK(&lk);
1988 drain_output(vp, 1);
1989 while ((bp = LIST_FIRST(&vp->v_dirtyblkhd))) {
1990 if (getdirtybuf(bp, MNT_WAIT) <= 0)
1991 break;
1992 (void) inodedep_lookup(fs, ip->i_number, 0, &inodedep);
1993 deallocate_dependencies(bp, inodedep);
1994 bp->b_flags |= B_INVAL | B_NOCACHE;
1995 FREE_LOCK(&lk);
1996 brelse(bp);
1997 ACQUIRE_LOCK(&lk);
1998 }
1999 if (inodedep_lookup(fs, ip->i_number, 0, &inodedep) != 0)
2000 (void) free_inodedep(inodedep);
2001
2002 if (delay) {
2003 freeblks->fb_state |= DEPCOMPLETE;
2004 /*
2005 * If the inode with zeroed block pointers is now on disk we
2006 * can start freeing blocks. Add freeblks to the worklist
2007 * instead of calling handle_workitem_freeblocks() directly as
2008 * it is more likely that additional IO is needed to complete
2009 * the request than in the !delay case.
2010 */
2011 if ((freeblks->fb_state & ALLCOMPLETE) == ALLCOMPLETE)
2012 add_to_worklist(&freeblks->fb_list);
2013 }
2014
2015 FREE_LOCK(&lk);
2016 /*
2017 * If the inode has never been written to disk (delay == 0),
2018 * then we can process the freeblks now that we have deleted
2019 * the dependencies.
2020 */
2021 if (!delay)
2022 handle_workitem_freeblocks(freeblks);
2023}
2024
2025/*
2026 * Reclaim any dependency structures from a buffer that is about to
2027 * be reallocated to a new vnode. The buffer must be locked, thus,
2028 * no I/O completion operations can occur while we are manipulating
2029 * its associated dependencies. The mutex is held so that other I/O's
2030 * associated with related dependencies do not occur.
2031 */
2032STATIC void
2033deallocate_dependencies(struct buf *bp, struct inodedep *inodedep)
2034{
2035 struct worklist *wk;
2036 struct indirdep *indirdep;
2037 struct allocindir *aip;
2038 struct pagedep *pagedep;
2039 struct dirrem *dirrem;
2040 struct diradd *dap;
2041 int i;
2042
2043 while ((wk = LIST_FIRST(&bp->b_dep)) != NULL) {
2044 switch (wk->wk_type) {
2045
2046 case D_INDIRDEP:
2047 indirdep = WK_INDIRDEP(wk);
2048 /*
2049 * None of the indirect pointers will ever be visible,
2050 * so they can simply be tossed. GOINGAWAY ensures
2051 * that allocated pointers will be saved in the buffer
2052 * cache until they are freed. Note that they will
2053 * only be able to be found by their physical address
2054 * since the inode mapping the logical address will
2055 * be gone. The save buffer used for the safe copy
2056 * was allocated in setup_allocindir_phase2 using
2057 * the physical address so it could be used for this
2058 * purpose. Hence we swap the safe copy with the real
2059 * copy, allowing the safe copy to be freed and holding
2060 * on to the real copy for later use in indir_trunc.
2061 */
2062 if (indirdep->ir_state & GOINGAWAY) {
2063 FREE_LOCK(&lk);
2064 panic("deallocate_dependencies: already gone");
2065 }
2066 indirdep->ir_state |= GOINGAWAY;
2067 while ((aip = LIST_FIRST(&indirdep->ir_deplisthd)))
2068 free_allocindir(aip, inodedep);
2069 if (bp->b_lblkno >= 0 ||
2070 bp->b_blkno != indirdep->ir_savebp->b_lblkno) {
2071 FREE_LOCK(&lk);
2072 panic("deallocate_dependencies: not indir");
2073 }
2074 memcpy(indirdep->ir_savebp->b_data, bp->b_data,
2075 bp->b_bcount);
2076 WORKLIST_REMOVE(wk);
2077 WORKLIST_INSERT(&indirdep->ir_savebp->b_dep, wk);
2078 continue;
2079
2080 case D_PAGEDEP:
2081 pagedep = WK_PAGEDEP(wk);
2082 /*
2083 * None of the directory additions will ever be
2084 * visible, so they can simply be tossed.
2085 */
2086 for (i = 0; i < DAHASHSZ; i++)
2087 while ((dap =
2088 LIST_FIRST(&pagedep->pd_diraddhd[i])))
2089 free_diradd(dap);
2090 while ((dap = LIST_FIRST(&pagedep->pd_pendinghd)))
2091 free_diradd(dap);
2092 /*
2093 * Copy any directory remove dependencies to the list
2094 * to be processed after the zero'ed inode is written.
2095 * If the inode has already been written, then they
2096 * can be dumped directly onto the work list.
2097 */
2098 while ((dirrem = LIST_FIRST(&pagedep->pd_dirremhd))) {
2099 LIST_REMOVE(dirrem, dm_next);
2100 dirrem->dm_dirinum = pagedep->pd_ino;
2101 if (inodedep == NULL ||
2102 (inodedep->id_state & ALLCOMPLETE) ==
2103 ALLCOMPLETE)
2104 add_to_worklist(&dirrem->dm_list);
2105 else
2106 WORKLIST_INSERT(&inodedep->id_bufwait,
2107 &dirrem->dm_list);
2108 }
2109 if ((pagedep->pd_state & NEWBLOCK) != 0) {
2110 LIST_FOREACH(wk, &inodedep->id_bufwait, wk_list)
2111 if (wk->wk_type == D_NEWDIRBLK &&
2112 WK_NEWDIRBLK(wk)->db_pagedep ==
2113 pagedep)
2114 break;
2115 if (wk != NULL) {
2116 WORKLIST_REMOVE(wk);
2117 free_newdirblk(WK_NEWDIRBLK(wk));
2118 } else {
2119 FREE_LOCK(&lk);
2120 panic("deallocate_dependencies: "
2121 "lost pagedep");
2122 }
2123 }
2124 WORKLIST_REMOVE(&pagedep->pd_list);
2125 LIST_REMOVE(pagedep, pd_hash);
2126 WORKITEM_FREE(pagedep, D_PAGEDEP);
2127 continue;
2128
2129 case D_ALLOCINDIR:
2130 free_allocindir(WK_ALLOCINDIR(wk), inodedep);
2131 continue;
2132
2133 case D_ALLOCDIRECT:
2134 case D_INODEDEP:
2135 FREE_LOCK(&lk);
2136 panic("deallocate_dependencies: Unexpected type %s",
2137 TYPENAME(wk->wk_type));
2138 /* NOTREACHED */
2139
2140 default:
2141 FREE_LOCK(&lk);
2142 panic("deallocate_dependencies: Unknown type %s",
2143 TYPENAME(wk->wk_type));
2144 /* NOTREACHED */
2145 }
2146 }
2147}
2148
2149/*
2150 * Free an allocdirect. Generate a new freefrag work request if appropriate.
2151 * This routine must be called with splbio interrupts blocked.
2152 */
2153STATIC void
2154free_allocdirect(struct allocdirectlst *adphead, struct allocdirect *adp,
2155 int delay)
2156{
2157 struct newdirblk *newdirblk;
2158 struct worklist *wk;
2159
2160 splassert(IPL_BIO);
2161
2162#ifdef DEBUG
2163 if (lk.lkt_held == -1)
2164 panic("free_allocdirect: lock not held");
2165#endif
2166 if ((adp->ad_state & DEPCOMPLETE) == 0)
2167 LIST_REMOVE(adp, ad_deps);
2168 TAILQ_REMOVE(adphead, adp, ad_next);
2169 if ((adp->ad_state & COMPLETE) == 0)
2170 WORKLIST_REMOVE(&adp->ad_list);
2171 if (adp->ad_freefrag != NULL) {
2172 if (delay)
2173 WORKLIST_INSERT(&adp->ad_inodedep->id_bufwait,
2174 &adp->ad_freefrag->ff_list);
2175 else
2176 add_to_worklist(&adp->ad_freefrag->ff_list);
2177 }
2178 if ((wk = LIST_FIRST(&adp->ad_newdirblk)) != NULL) {
2179 newdirblk = WK_NEWDIRBLK(wk);
2180 WORKLIST_REMOVE(&newdirblk->db_list);
2181 if (LIST_FIRST(&adp->ad_newdirblk) != NULL)
2182 panic("free_allocdirect: extra newdirblk");
2183 if (delay)
2184 WORKLIST_INSERT(&adp->ad_inodedep->id_bufwait,
2185 &newdirblk->db_list);
2186 else
2187 free_newdirblk(newdirblk);
2188 }
2189 WORKITEM_FREE(adp, D_ALLOCDIRECT);
2190}
2191
2192/*
2193 * Free a newdirblk. Clear the NEWBLOCK flag on its associated pagedep.
2194 * This routine must be called with splbio interrupts blocked.
2195 */
2196void
2197free_newdirblk(struct newdirblk *newdirblk)
2198{
2199 struct pagedep *pagedep;
2200 struct diradd *dap;
2201 int i;
2202
2203 splassert(IPL_BIO);
2204
2205#ifdef DEBUG
2206 if (lk.lkt_held == -1)
2207 panic("free_newdirblk: lock not held");
2208#endif
2209 /*
2210 * If the pagedep is still linked onto the directory buffer
2211 * dependency chain, then some of the entries on the
2212 * pd_pendinghd list may not be committed to disk yet. In
2213 * this case, we will simply clear the NEWBLOCK flag and
2214 * let the pd_pendinghd list be processed when the pagedep
2215 * is next written. If the pagedep is no longer on the buffer
2216 * dependency chain, then all the entries on the pd_pending
2217 * list are committed to disk and we can free them here.
2218 */
2219 pagedep = newdirblk->db_pagedep;
2220 pagedep->pd_state &= ~NEWBLOCK;
2221 if ((pagedep->pd_state & ONWORKLIST) == 0)
2222 while ((dap = LIST_FIRST(&pagedep->pd_pendinghd)) != NULL)
2223 free_diradd(dap);
2224 /*
2225 * If no dependencies remain, the pagedep will be freed.
2226 */
2227 for (i = 0; i < DAHASHSZ; i++)
2228 if (LIST_FIRST(&pagedep->pd_diraddhd[i]) != NULL)
2229 break;
2230 if (i == DAHASHSZ && (pagedep->pd_state & ONWORKLIST) == 0) {
2231 LIST_REMOVE(pagedep, pd_hash);
2232 WORKITEM_FREE(pagedep, D_PAGEDEP);
2233 }
2234 WORKITEM_FREE(newdirblk, D_NEWDIRBLK);
2235}
2236
2237/*
2238 * Prepare an inode to be freed. The actual free operation is not
2239 * done until the zero'ed inode has been written to disk.
2240 */
2241void
2242softdep_freefile(struct vnode *pvp, ufsino_t ino, mode_t mode)
2243{
2244 struct inode *ip = VTOI(pvp);
2245 struct inodedep *inodedep;
2246 struct freefile *freefile;
2247
2248 /*
2249 * This sets up the inode de-allocation dependency.
2250 */
2251 freefile = pool_get(&freefile_pool, PR_WAITOK);
2252 freefile->fx_list.wk_type = D_FREEFILE;
2253 freefile->fx_list.wk_state = 0;
2254 freefile->fx_mode = mode;
2255 freefile->fx_oldinum = ino;
2256 freefile->fx_devvp = ip->i_devvp;
2257 freefile->fx_mnt = ITOV(ip)->v_mount;
2258
2259 /*
2260 * If the inodedep does not exist, then the zero'ed inode has
2261 * been written to disk. If the allocated inode has never been
2262 * written to disk, then the on-disk inode is zero'ed. In either
2263 * case we can free the file immediately.
2264 */
2265 ACQUIRE_LOCK(&lk);
2266 if (inodedep_lookup(ip->i_fs, ino, 0, &inodedep) == 0 ||
2267 check_inode_unwritten(inodedep)) {
2268 FREE_LOCK(&lk);
2269 handle_workitem_freefile(freefile);
2270 return;
2271 }
2272 WORKLIST_INSERT(&inodedep->id_inowait, &freefile->fx_list);
2273 FREE_LOCK(&lk);
2274}
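/*
 * [Editor's note, not part of the source] Callers such as ffs_vfree()
 * are expected to route inode frees through softdep_freefile() when
 * soft updates are enabled, rather than calling ffs_freefile()
 * directly; the real free happens in handle_workitem_freefile()
 * below once the zero'ed inode is known to be on disk.
 */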
2275
2276 /*
2277  * Check to see if an inode has never been written to disk. If
2278  * so, free the inodedep and return success; otherwise return failure.
2279  * This routine must be called with splbio interrupts blocked.
2280  *
2281  * If we still have a bitmap dependency, then the inode has never
2282  * been written to disk. Drop the dependency as it is no longer
2283  * necessary since the inode is being deallocated. We set the
2284  * ALLCOMPLETE flags since the bitmap now properly shows that the
2285  * inode is not allocated. Even if the inode is actively being
2286  * written, it has been rolled back to its zero'ed state, so we
2287  * are ensured that a zero inode is what is on the disk. For short
2288  * lived files, this change will usually result in removing all the
2289  * dependencies from the inode so that it can be freed immediately.
2290  */
2291 STATIC int
2292 check_inode_unwritten(struct inodedep *inodedep)
2293 {
2294 	splassert(IPL_BIO);
2295 
2296 	if ((inodedep->id_state & DEPCOMPLETE) != 0 ||
2297 	    LIST_FIRST(&inodedep->id_pendinghd) != NULL ||
2298 	    LIST_FIRST(&inodedep->id_bufwait) != NULL ||
2299 	    LIST_FIRST(&inodedep->id_inowait) != NULL ||
2300 	    TAILQ_FIRST(&inodedep->id_inoupdt) != NULL ||
2301 	    TAILQ_FIRST(&inodedep->id_newinoupdt) != NULL ||
2302 	    inodedep->id_nlinkdelta != 0)
2303 		return (0);
2304 	inodedep->id_state |= ALLCOMPLETE;
2305 	LIST_REMOVE(inodedep, id_deps);
2306 	inodedep->id_buf = NULL;
2307 	if (inodedep->id_state & ONWORKLIST)
2308 		WORKLIST_REMOVE(&inodedep->id_list);
2309 	if (inodedep->id_savedino1 != NULL) {
2310 		free(inodedep->id_savedino1, M_INODEDEP, inodedep->id_unsize);
2311 		inodedep->id_savedino1 = NULL;
2312 	}
2313 	if (free_inodedep(inodedep) == 0) {
2314 		FREE_LOCK(&lk);
2315 		panic("check_inode_unwritten: busy inode");
2316 	}
2317 	return (1);
2318 }
2319
2320 /*
2321  * Try to free an inodedep structure. Return 1 if it could be freed.
2322  */
2323 STATIC int
2324 free_inodedep(struct inodedep *inodedep)
2325 {
2326 
2327 	if ((inodedep->id_state & ONWORKLIST) != 0 ||
2328 	    (inodedep->id_state & ALLCOMPLETE) != ALLCOMPLETE ||
2329 	    LIST_FIRST(&inodedep->id_pendinghd) != NULL ||
2330 	    LIST_FIRST(&inodedep->id_bufwait) != NULL ||
2331 	    LIST_FIRST(&inodedep->id_inowait) != NULL ||
2332 	    TAILQ_FIRST(&inodedep->id_inoupdt) != NULL ||
2333 	    TAILQ_FIRST(&inodedep->id_newinoupdt) != NULL ||
2334 	    inodedep->id_nlinkdelta != 0 || inodedep->id_savedino1 != NULL)
2335 		return (0);
2336 	LIST_REMOVE(inodedep, id_hash);
2337 	WORKITEM_FREE(inodedep, D_INODEDEP);
2338 	num_inodedep -= 1;
2339 	return (1);
2340 }
2341
2342 /*
2343  * This workitem routine performs the block de-allocation.
2344  * The workitem is added to the pending list after the updated
2345  * inode block has been written to disk. As mentioned above,
2346  * checks regarding the number of blocks de-allocated (compared
2347  * to the number of blocks allocated for the file) are also
2348  * performed in this function.
2349  */
2350 STATIC void
2351 handle_workitem_freeblocks(struct freeblks *freeblks)
2352 {
2353 	struct inode tip;
2354 	daddr_t bn;
2355 	union {
2356 		struct ufs1_dinode di1;
2357 		struct ufs2_dinode di2;
2358 	} di;
2359 	struct fs *fs;
2360 	int i, level, bsize;
2361 	long nblocks, blocksreleased = 0;
2362 	int error, allerror = 0;
2363 	daddr_t baselbns[NIADDR], tmpval;
2364 
2365 	if (VFSTOUFS(freeblks->fb_mnt)->um_fstype == UM_UFS1)
2366 		tip.i_din1 = &di.di1;
2367 	else
2368 		tip.i_din2 = &di.di2;
2369 
2370 	tip.i_fs = fs = VFSTOUFS(freeblks->fb_mnt)->um_fs;
2371 	tip.i_number = freeblks->fb_previousinum;
2372 	tip.i_ump = VFSTOUFS(freeblks->fb_mnt);
2373 	tip.i_dev = freeblks->fb_devvp->v_rdev;
2374 	DIP_ASSIGN(&tip, size, freeblks->fb_oldsize);
2375 	DIP_ASSIGN(&tip, uid, freeblks->fb_uid);
2376 	tip.i_vnode = NULL;
2377 	tmpval = 1;
2378 	baselbns[0] = NDADDR;
2379 	for (i = 1; i < NIADDR; i++) {
2380 		tmpval *= NINDIR(fs);
2381 		baselbns[i] = baselbns[i - 1] + tmpval;
2382 	}
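	/*
	 * [Editor's example, not part of the source] baselbns[] holds the
	 * first logical block number covered by each level of indirection.
	 * For instance, with NINDIR(fs) == 2048 pointers per indirect
	 * block, the loop above yields baselbns[0] = 12 (NDADDR),
	 * baselbns[1] = 12 + 2048, and baselbns[2] = 12 + 2048 + 2048*2048.
	 */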
2383 	nblocks = btodb(fs->fs_bsize);
2384 	blocksreleased = 0;
2385 	/*
2386 	 * Indirect blocks first.
2387 	 */
2388 	for (level = (NIADDR - 1); level >= 0; level--) {
2389 		if ((bn = freeblks->fb_iblks[level]) == 0)
2390 			continue;
2391 		if ((error = indir_trunc(&tip, fsbtodb(fs, bn), level,
2392 		    baselbns[level], &blocksreleased)) != 0)
2393 			allerror = error;
2394 		ffs_blkfree(&tip, bn, fs->fs_bsize);
2395 		blocksreleased += nblocks;
2396 	}
2397 	/*
2398 	 * All direct blocks or frags.
2399 	 */
2400 	for (i = (NDADDR - 1); i >= 0; i--) {
2401 		if ((bn = freeblks->fb_dblks[i]) == 0)
2402 			continue;
2403 		bsize = blksize(fs, &tip, i);
2404 		ffs_blkfree(&tip, bn, bsize);
2405 		blocksreleased += btodb(bsize);
2406 	}
2407 
2408 #ifdef DIAGNOSTIC
2409 	if (freeblks->fb_chkcnt != blocksreleased)
2410 		printf("handle_workitem_freeblocks: block count\n");
2411 	if (allerror)
2412 		softdep_error("handle_workitem_freeblks", allerror);
2413 #endif /* DIAGNOSTIC */
2414 	WORKITEM_FREE(freeblks, D_FREEBLKS);
2415 }
2416
2417 /*
2418  * Release blocks associated with the inode ip and stored in the indirect
2419  * block dbn. If level is greater than SINGLE, the block is an indirect block
2420  * and recursive calls to indir_trunc must be used to cleanse other indirect
2421  * blocks.
2422  */
2423 STATIC int
2424 indir_trunc(struct inode *ip, daddr_t dbn, int level, daddr_t lbn,
2425     long *countp)
2426 {
2427 	struct buf *bp;
2428 	int32_t *bap1 = NULL;
2429 	int64_t nb, *bap2 = NULL;
2430 	struct fs *fs;
2431 	struct worklist *wk;
2432 	struct indirdep *indirdep;
2433 	int i, lbnadd, nblocks, ufs1fmt;
2434 	int error, allerror = 0;
2435 
2436 	fs = ip->i_fs;
2437 	lbnadd = 1;
2438 	for (i = level; i > 0; i--)
2439 		lbnadd *= NINDIR(fs);
2440 	/*
2441 	 * Get buffer of block pointers to be freed. This routine is not
2442 	 * called until the zero'ed inode has been written, so it is safe
2443 	 * to free blocks as they are encountered. Because the inode has
2444 	 * been zero'ed, calls to bmap on these blocks will fail. So, we
2445 	 * have to use the on-disk address and the block device for the
2446 	 * filesystem to look them up. If the file was deleted before its
2447 	 * indirect blocks were all written to disk, the routine that set
2448 	 * us up (deallocate_dependencies) will have arranged to leave
2449 	 * a complete copy of the indirect block in memory for our use.
2450 	 * Otherwise we have to read the blocks in from the disk.
2451 	 */
2452 	ACQUIRE_LOCK(&lk);
2453 	if ((bp = incore(ip->i_devvp, dbn)) != NULL &&
2454 	    (wk = LIST_FIRST(&bp->b_dep)) != NULL) {
2455 		if (wk->wk_type != D_INDIRDEP ||
2456 		    (indirdep = WK_INDIRDEP(wk))->ir_savebp != bp ||
2457 		    (indirdep->ir_state & GOINGAWAY) == 0) {
2458 			FREE_LOCK(&lk);
2459 			panic("indir_trunc: lost indirdep");
2460 		}
2461 		WORKLIST_REMOVE(wk);
2462 		WORKITEM_FREE(indirdep, D_INDIRDEP);
2463 		if (LIST_FIRST(&bp->b_dep) != NULL) {
2464 			FREE_LOCK(&lk);
2465 			panic("indir_trunc: dangling dep");
2466 		}
2467 		FREE_LOCK(&lk);
2468 	} else {
2469 		FREE_LOCK(&lk);
2470 		error = bread(ip->i_devvp, dbn, (int)fs->fs_bsize, &bp);
2471 		if (error)
2472 			return (error);
2473 	}
2474 	/*
2475 	 * Recursively free indirect blocks.
2476 	 */
2477 	if (ip->i_ump->um_fstype == UM_UFS1) {
2478 		ufs1fmt = 1;
2479 		bap1 = (int32_t *)bp->b_data;
2480 	} else {
2481 		ufs1fmt = 0;
2482 		bap2 = (int64_t *)bp->b_data;
2483 	}
2484 	nblocks = btodb(fs->fs_bsize);
2485 	for (i = NINDIR(fs) - 1; i >= 0; i--) {
2486 		if (ufs1fmt)
2487 			nb = bap1[i];
2488 		else
2489 			nb = bap2[i];
2490 		if (nb == 0)
2491 			continue;
2492 		if (level != 0) {
2493 			if ((error = indir_trunc(ip, fsbtodb(fs, nb),
2494 			    level - 1, lbn + (i * lbnadd), countp)) != 0)
2495 				allerror = error;
2496 		}
2497 		ffs_blkfree(ip, nb, fs->fs_bsize);
2498 		*countp += nblocks;
2499 	}
2500 	bp->b_flags |= B_INVAL | B_NOCACHE;
2501 	brelse(bp);
2502 	return (allerror);
2503 }
2504
2505 /*
2506  * Free an allocindir.
2507  * This routine must be called with splbio interrupts blocked.
2508  */
2509 STATIC void
2510 free_allocindir(struct allocindir *aip, struct inodedep *inodedep)
2511 {
2512 	struct freefrag *freefrag;
2513 
2514 	splassert(IPL_BIO);
2515 
2516 #ifdef DEBUG
2517 	if (lk.lkt_held == -1)
2518 		panic("free_allocindir: lock not held");
2519 #endif
2520 	if ((aip->ai_state & DEPCOMPLETE) == 0)
2521 		LIST_REMOVE(aip, ai_deps);
2522 	if (aip->ai_state & ONWORKLIST)
2523 		WORKLIST_REMOVE(&aip->ai_list);
2524 	LIST_REMOVE(aip, ai_next);
2525 	if ((freefrag = aip->ai_freefrag) != NULL) {
2526 		if (inodedep == NULL)
2527 			add_to_worklist(&freefrag->ff_list);
2528 		else
2529 			WORKLIST_INSERT(&inodedep->id_bufwait,
2530 			    &freefrag->ff_list);
2531 	}
2532 	WORKITEM_FREE(aip, D_ALLOCINDIR);
2533 }
2534
2535 /*
2536 * Directory entry addition dependencies.
2537 *
2538 * When adding a new directory entry, the inode (with its incremented link
2539 * count) must be written to disk before the directory entry's pointer to it.
2540 * Also, if the inode is newly allocated, the corresponding freemap must be
2541 * updated (on disk) before the directory entry's pointer. These requirements
2542 * are met via undo/redo on the directory entry's pointer, which consists
2543 * simply of the inode number.
2544 *
2545 * As directory entries are added and deleted, the free space within a
2546 * directory block can become fragmented. The ufs file system will compact
2547 * a fragmented directory block to make space for a new entry. When this
2548 * occurs, the offsets of previously added entries change. Any "diradd"
2549 * dependency structures corresponding to these entries must be updated with
2550 * the new offsets.
2551 */
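/*
 * [Editor's sketch, not part of the source] With "ep" pointing at the
 * new entry in the directory buffer, the undo/redo amounts to:
 *
 *	ep->d_ino = 0;			undo before the block is written
 *	... directory block reaches disk ...
 *	... inode (and freemap) reach disk ...
 *	ep->d_ino = dap->da_newinum;	redo once the pointer is safe
 *
 * The undo half is initiate_write_filepage() below; the redo half is
 * performed in the write-completion path.
 */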
2552
2553 /*
2554 * This routine is called after the in-memory inode's link
2555 * count has been incremented, but before the directory entry's
2556 * pointer to the inode has been set.
2557 */
2558 /* buffer containing directory block */
2559 /* inode for directory */
2560 /* offset of new entry in directory */
2561 /* inode referenced by new directory entry */
2562 /* non-NULL => contents of new mkdir */
2563 /* entry is in a newly allocated block */
2564 int
2565 softdep_setup_directory_add(struct buf *bp, struct inode *dp, off_t diroffset,
2566     long newinum, struct buf *newdirbp, int isnewblk)
2567 {
2568 	int offset;		/* offset of new entry within directory block */
2569 	daddr_t lbn;		/* block in directory containing new entry */
2570 	struct fs *fs;
2571 	struct diradd *dap;
2572 	struct allocdirect *adp;
2573 	struct pagedep *pagedep;
2574 	struct inodedep *inodedep;
2575 	struct newdirblk *newdirblk = NULL;
2576 	struct mkdir *mkdir1, *mkdir2;
2577 
2578 
2579 	fs = dp->i_fs;
2580 	lbn = lblkno(fs, diroffset);
2581 	offset = blkoff(fs, diroffset);
2582 	dap = pool_get(&diradd_pool, PR_WAITOK | PR_ZERO);
2583 	dap->da_list.wk_type = D_DIRADD;
2584 	dap->da_offset = offset;
2585 	dap->da_newinum = newinum;
2586 	dap->da_state = ATTACHED;
2587 	if (isnewblk && lbn < NDADDR && fragoff(fs, diroffset) == 0) {
2588 		newdirblk = pool_get(&newdirblk_pool, PR_WAITOK);
2589 		newdirblk->db_list.wk_type = D_NEWDIRBLK;
2590 		newdirblk->db_state = 0;
2591 	}
2592 	if (newdirbp == NULL) {
2593 		dap->da_state |= DEPCOMPLETE;
2594 		ACQUIRE_LOCK(&lk);
2595 	} else {
2596 		dap->da_state |= MKDIR_BODY | MKDIR_PARENT;
2597 		mkdir1 = pool_get(&mkdir_pool, PR_WAITOK);
2598 		mkdir1->md_list.wk_type = D_MKDIR;
2599 		mkdir1->md_state = MKDIR_BODY;
2600 		mkdir1->md_diradd = dap;
2601 		mkdir2 = pool_get(&mkdir_pool, PR_WAITOK);
2602 		mkdir2->md_list.wk_type = D_MKDIR;
2603 		mkdir2->md_state = MKDIR_PARENT;
2604 		mkdir2->md_diradd = dap;
2605 		/*
2606 		 * Dependency on "." and ".." being written to disk.
2607 		 */
2608 		mkdir1->md_buf = newdirbp;
2609 		ACQUIRE_LOCK(&lk);
2610 		LIST_INSERT_HEAD(&mkdirlisthd, mkdir1, md_mkdirs);
2611 		WORKLIST_INSERT(&newdirbp->b_dep, &mkdir1->md_list);
2612 		FREE_LOCK(&lk);
2613 		bdwrite(newdirbp);
2614 		/*
2615 		 * Dependency on link count increase for parent directory
2616 		 */
2617 		ACQUIRE_LOCK(&lk);
2618 		if (inodedep_lookup(fs, dp->i_number, 0, &inodedep) == 0
2619 		    || (inodedep->id_state & ALLCOMPLETE) == ALLCOMPLETE) {
2620 			dap->da_state &= ~MKDIR_PARENT;
2621 			WORKITEM_FREE(mkdir2, D_MKDIR);
2622 		} else {
2623 			LIST_INSERT_HEAD(&mkdirlisthd, mkdir2, md_mkdirs);
2624 			WORKLIST_INSERT(&inodedep->id_bufwait, &mkdir2->md_list);
2625 		}
2626 	}
2627 	/*
2628 	 * Link into parent directory pagedep to await its being written.
2629 	 */
2630 	if (pagedep_lookup(dp, lbn, DEPALLOC, &pagedep) == 0)
2631 		WORKLIST_INSERT(&bp->b_dep, &pagedep->pd_list);
2632 	dap->da_pagedep = pagedep;
2633 	LIST_INSERT_HEAD(&pagedep->pd_diraddhd[DIRADDHASH(offset)], dap,
2634 	    da_pdlist);
2635 	/*
2636 	 * Link into its inodedep. Put it on the id_bufwait list if the inode
2637 	 * is not yet written. If it is written, do the post-inode write
2638 	 * processing to put it on the id_pendinghd list.
2639 	 */
2640 	(void) inodedep_lookup(fs, newinum, DEPALLOC, &inodedep);
2641 	if ((inodedep->id_state & ALLCOMPLETE) == ALLCOMPLETE)
2642 		diradd_inode_written(dap, inodedep);
2643 	else
2644 		WORKLIST_INSERT(&inodedep->id_bufwait, &dap->da_list);
2645 	if (isnewblk) {
2646 		/*
2647 		 * Directories growing into indirect blocks are rare
2648 		 * enough, and new block allocation in those cases
2649 		 * rarer still, that we choose not to bother tracking
2650 		 * them. Rather we simply force the new directory
2651 		 * entry to disk.
2652 		 */
2653 		if (lbn >= NDADDR) {
2654 			FREE_LOCK(&lk);
2655 			/*
2656 			 * We only have a new allocation when at the
2657 			 * beginning of a new block, not when we are
2658 			 * expanding into an existing block.
2659 			 */
2660 			if (blkoff(fs, diroffset) == 0)
2661 				return (1);
2662 			return (0);
2663 		}
2664 		/*
2665 		 * We only have a new allocation when at the beginning
2666 		 * of a new fragment, not when we are expanding into an
2667 		 * existing fragment. Also, there is nothing to do if we
2668 		 * are already tracking this block.
2669 		 */
2670 		if (fragoff(fs, diroffset) != 0) {
2671 			FREE_LOCK(&lk);
2672 			return (0);
2673 		}
2674 
2675 		if ((pagedep->pd_state & NEWBLOCK) != 0) {
2676 			WORKITEM_FREE(newdirblk, D_NEWDIRBLK);
2677 			FREE_LOCK(&lk);
2678 			return (0);
2679 		}
2680 		/*
2681 		 * Find our associated allocdirect and have it track us.
2682 		 */
2683 		if (inodedep_lookup(fs, dp->i_number, 0, &inodedep) == 0)
2684 			panic("softdep_setup_directory_add: lost inodedep");
2685 		adp = TAILQ_LAST(&inodedep->id_newinoupdt, allocdirectlst);
2686 		if (adp == NULL || adp->ad_lbn != lbn) {
2687 			FREE_LOCK(&lk);
2688 			panic("softdep_setup_directory_add: lost entry");
2689 		}
2690 		pagedep->pd_state |= NEWBLOCK;
2691 		newdirblk->db_pagedep = pagedep;
2692 		WORKLIST_INSERT(&adp->ad_newdirblk, &newdirblk->db_list);
2693 	}
2694 	FREE_LOCK(&lk);
2695 	return (0);
2696 }
2697
2698 /*
2699  * This procedure is called to change the offset of a directory
2700  * entry when compacting a directory block which must be owned
2701  * exclusively by the caller. Note that the actual entry movement
2702  * must be done in this procedure to ensure that no I/O completions
2703  * occur while the move is in progress.
2704  */
2705 /* inode for directory */
2706 /* address of dp->i_offset */
2707 /* address of old directory location */
2708 /* address of new directory location */
2709 /* size of directory entry */
2710 void
2711 softdep_change_directoryentry_offset(struct inode *dp, caddr_t base,
2712     caddr_t oldloc, caddr_t newloc, int entrysize)
2713 {
2714 	int offset, oldoffset, newoffset;
2715 	struct pagedep *pagedep;
2716 	struct diradd *dap;
2717 	daddr_t lbn;
2718 
2719 	ACQUIRE_LOCK(&lk);
2720 	lbn = lblkno(dp->i_fs, dp->i_offset);
2721 	offset = blkoff(dp->i_fs, dp->i_offset);
2722 	if (pagedep_lookup(dp, lbn, 0, &pagedep) == 0)
2723 		goto done;
2724 	oldoffset = offset + (oldloc - base);
2725 	newoffset = offset + (newloc - base);
2726 
2727 	LIST_FOREACH(dap, &pagedep->pd_diraddhd[DIRADDHASH(oldoffset)], da_pdlist) {
2728 		if (dap->da_offset != oldoffset)
2729 			continue;
2730 		dap->da_offset = newoffset;
2731 		if (DIRADDHASH(newoffset) == DIRADDHASH(oldoffset))
2732 			break;
2733 		LIST_REMOVE(dap, da_pdlist);
2734 		LIST_INSERT_HEAD(&pagedep->pd_diraddhd[DIRADDHASH(newoffset)],
2735 		    dap, da_pdlist);
2736 		break;
2737 	}
2738 	if (dap == NULL) {
2739 
2740 		LIST_FOREACH(dap, &pagedep->pd_pendinghd, da_pdlist) {
2741 			if (dap->da_offset == oldoffset) {
2742 				dap->da_offset = newoffset;
2743 				break;
2744 			}
2745 		}
2746 	}
2747 done:
2748 	memmove(newloc, oldloc, entrysize);
2749 	FREE_LOCK(&lk);
2750 }
2751
2752 /*
2753  * Free a diradd dependency structure. This routine must be called
2754  * with splbio interrupts blocked.
2755  */
2756 STATIC void
2757 free_diradd(struct diradd *dap)
2758 {
2759 	struct dirrem *dirrem;
2760 	struct pagedep *pagedep;
2761 	struct inodedep *inodedep;
2762 	struct mkdir *mkdir, *nextmd;
2763 
2764 	splassert(IPL_BIO);
2765 
2766 #ifdef DEBUG
2767 	if (lk.lkt_held == -1)
2768 		panic("free_diradd: lock not held");
2769 #endif
2770 	WORKLIST_REMOVE(&dap->da_list);
2771 	LIST_REMOVE(dap, da_pdlist);
2772 	if ((dap->da_state & DIRCHG) == 0) {
2773 		pagedep = dap->da_pagedep;
2774 	} else {
2775 		dirrem = dap->da_previous;
2776 		pagedep = dirrem->dm_pagedep;
2777 		dirrem->dm_dirinum = pagedep->pd_ino;
2778 		add_to_worklist(&dirrem->dm_list);
2779 	}
2780 	if (inodedep_lookup(VFSTOUFS(pagedep->pd_mnt)->um_fs, dap->da_newinum,
2781 	    0, &inodedep) != 0)
2782 		(void) free_inodedep(inodedep);
2783 	if ((dap->da_state & (MKDIR_PARENT | MKDIR_BODY)) != 0) {
2784 		for (mkdir = LIST_FIRST(&mkdirlisthd); mkdir; mkdir = nextmd) {
2785 			nextmd = LIST_NEXT(mkdir, md_mkdirs);
2786 			if (mkdir->md_diradd != dap)
2787 				continue;
2788 			dap->da_state &= ~mkdir->md_state;
2789 			WORKLIST_REMOVE(&mkdir->md_list);
2790 			LIST_REMOVE(mkdir, md_mkdirs);
2791 			WORKITEM_FREE(mkdir, D_MKDIR);
2792 		}
2793 		if ((dap->da_state & (MKDIR_PARENT | MKDIR_BODY)) != 0) {
2794 			FREE_LOCK(&lk);
2795 			panic("free_diradd: unfound ref");
2796 		}
2797 	}
2798 	WORKITEM_FREE(dap, D_DIRADD);
2799 }
2800
2801 /*
2802 * Directory entry removal dependencies.
2803 *
2804 * When removing a directory entry, the entry's inode pointer must be
2805 * zero'ed on disk before the corresponding inode's link count is decremented
2806 * (possibly freeing the inode for re-use). This dependency is handled by
2807 * updating the directory entry but delaying the inode count reduction until
2808 * after the directory block has been written to disk. After this point, the
2809 * inode count can be decremented whenever it is convenient.
2810 */
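/*
 * [Editor's sketch, not part of the source] For a removal the enforced
 * ordering is roughly:
 *
 *	ep->d_ino = 0;  ... directory block written ...
 *	DIP_ADD(ip, nlink, -1);  ... inode written ...
 *	ffs_blkfree()/ffs_freefile() once the zero'ed inode is on disk
 *
 * so a crash can at worst leak an inode or blocks, but never leave a
 * directory entry pointing at a freed (or reused) inode.
 */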
2811
2812 /*
2813  * This routine should be called immediately after removing
2814  * a directory entry. The inode's link count should not be
2815  * decremented by the calling procedure -- the soft updates
2816  * code will do this task when it is safe.
2817  */
2818 /* buffer containing directory block */
2819 /* inode for the directory being modified */
2820 /* inode for directory entry being removed */
2821 /* indicates if doing RMDIR */
2822 void
2823 softdep_setup_remove(struct buf *bp, struct inode *dp, struct inode *ip,
2824     int isrmdir)
2825 {
2826 	struct dirrem *dirrem, *prevdirrem;
2827 
2828 	/*
2829 	 * Allocate a new dirrem if appropriate and ACQUIRE_LOCK.
2830 	 */
2831 	dirrem = newdirrem(bp, dp, ip, isrmdir, &prevdirrem);
2832 
2833 	/*
2834 	 * If the COMPLETE flag is clear, then there were no active
2835 	 * entries and we want to roll back to a zeroed entry until
2836 	 * the new inode is committed to disk. If the COMPLETE flag is
2837 	 * set then we have deleted an entry that never made it to
2838 	 * disk. If the entry we deleted resulted from a name change,
2839 	 * then the old name still resides on disk. We cannot delete
2840 	 * its inode (returned to us in prevdirrem) until the zeroed
2841 	 * directory entry gets to disk. The new inode has never been
2842 	 * referenced on the disk, so can be deleted immediately.
2843 	 */
2844 	if ((dirrem->dm_state & COMPLETE) == 0) {
2845 		LIST_INSERT_HEAD(&dirrem->dm_pagedep->pd_dirremhd, dirrem,
2846 		    dm_next);
2847 		FREE_LOCK(&lk);
2848 	} else {
2849 		if (prevdirrem != NULL)
2850 			LIST_INSERT_HEAD(&dirrem->dm_pagedep->pd_dirremhd,
2851 			    prevdirrem, dm_next);
2852 		dirrem->dm_dirinum = dirrem->dm_pagedep->pd_ino;
2853 		FREE_LOCK(&lk);
2854 		handle_workitem_remove(dirrem);
2855 	}
2856 }
2857
2858 STATIC long num_dirrem;		/* number of dirrem allocated */
2859 /*
2860  * Allocate a new dirrem if appropriate and return it along with
2861  * its associated pagedep. Called without a lock, returns with lock.
2862  */
2863 /* buffer containing directory block */
2864 /* inode for the directory being modified */
2865 /* inode for directory entry being removed */
2866 /* indicates if doing RMDIR */
2867 /* previously referenced inode, if any */
2868 STATIC struct dirrem *
2869 newdirrem(struct buf *bp, struct inode *dp, struct inode *ip, int isrmdir,
2870     struct dirrem **prevdirremp)
2871 {
2872 	int offset;
2873 	daddr_t lbn;
2874 	struct diradd *dap;
2875 	struct dirrem *dirrem;
2876 	struct pagedep *pagedep;
2877 
2878 	/*
2879 	 * Whiteouts have no deletion dependencies.
2880 	 */
2881 	if (ip == NULL)
2882 		panic("newdirrem: whiteout");
2883 	/*
2884 	 * If we are over our limit, try to improve the situation.
2885 	 * Limiting the number of dirrem structures will also limit
2886 	 * the number of freefile and freeblks structures.
2887 	 */
2888 	if (num_dirrem > max_softdeps / 2)
2889 		(void) request_cleanup(FLUSH_REMOVE, 0);
2890 	num_dirrem += 1;
2891 	dirrem = pool_get(&dirrem_pool, PR_WAITOK | PR_ZERO);
2892 	dirrem->dm_list.wk_type = D_DIRREM;
2893 	dirrem->dm_state = isrmdir ? RMDIR : 0;
2894 	dirrem->dm_mnt = ITOV(ip)->v_mount;
2895 	dirrem->dm_oldinum = ip->i_number;
2896 	*prevdirremp = NULL;
2897 
2898 	ACQUIRE_LOCK(&lk);
2899 	lbn = lblkno(dp->i_fs, dp->i_offset);
2900 	offset = blkoff(dp->i_fs, dp->i_offset);
2901 	if (pagedep_lookup(dp, lbn, DEPALLOC, &pagedep) == 0)
2902 		WORKLIST_INSERT(&bp->b_dep, &pagedep->pd_list);
2903 	dirrem->dm_pagedep = pagedep;
2904 	/*
2905 	 * Check for a diradd dependency for the same directory entry.
2906 	 * If present, then both dependencies become obsolete and can
2907 	 * be de-allocated. Check for an entry on both the pd_diraddhd
2908 	 * list and the pd_pendinghd list.
2909 	 */
2910 
2911 	LIST_FOREACH(dap, &pagedep->pd_diraddhd[DIRADDHASH(offset)], da_pdlist)
2912 		if (dap->da_offset == offset)
2913 			break;
2914 	if (dap == NULL) {
2915 
2916 		LIST_FOREACH(dap, &pagedep->pd_pendinghd, da_pdlist)
2917 			if (dap->da_offset == offset)
2918 				break;
2919 		if (dap == NULL)
2920 			return (dirrem);
2921 	}
2922 	/*
2923 	 * Must be ATTACHED at this point.
2924 	 */
2925 	if ((dap->da_state & ATTACHED) == 0) {
2926 		FREE_LOCK(&lk);
2927 		panic("newdirrem: not ATTACHED");
2928 	}
2929 	if (dap->da_newinum != ip->i_number) {
2930 		FREE_LOCK(&lk);
2931 		panic("newdirrem: inum %u should be %u",
2932 		    ip->i_number, dap->da_newinum);
2933 	}
2934 	/*
2935 	 * If we are deleting a changed name that never made it to disk,
2936 	 * then return the dirrem describing the previous inode (which
2937 	 * represents the inode currently referenced from this entry on disk).
2938 	 */
2939 	if ((dap->da_state & DIRCHG) != 0) {
2940 		*prevdirremp = dap->da_previous;
2941 		dap->da_state &= ~DIRCHG;
2942 		dap->da_pagedep = pagedep;
2943 	}
2944 	/*
2945 	 * We are deleting an entry that never made it to disk.
2946 	 * Mark it COMPLETE so we can delete its inode immediately.
2947 	 */
2948 	dirrem->dm_state |= COMPLETE;
2949 	free_diradd(dap);
2950 	return (dirrem);
2951 }
2952
2953 /*
2954 * Directory entry change dependencies.
2955 *
2956 * Changing an existing directory entry requires that an add operation
2957 * be completed first followed by a deletion. The semantics for the addition
2958 * are identical to the description of adding a new entry above except
2959 * that the rollback is to the old inode number rather than zero. Once
2960 * the addition dependency is completed, the removal is done as described
2961 * in the removal routine above.
2962 */
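/*
 * [Editor's sketch, not part of the source] For a changed entry the
 * rollback target is the old inode number rather than zero, i.e.
 * initiate_write_filepage() below performs
 *
 *	ep->d_ino = dap->da_previous->dm_oldinum;
 *
 * for DIRCHG entries, so the on-disk directory always references an
 * inode whose on-disk link count still accounts for it.
 */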
2963
2964 /*
2965  * This routine should be called immediately after changing
2966  * a directory entry. The inode's link count should not be
2967  * decremented by the calling procedure -- the soft updates
2968  * code will perform this task when it is safe.
2969  */
2970 /* buffer containing directory block */
2971 /* inode for the directory being modified */
2972 /* inode for directory entry being removed */
2973 /* new inode number for changed entry */
2974 /* indicates if doing RMDIR */
2975 void
2976 softdep_setup_directory_change(struct buf *bp, struct inode *dp,
2977     struct inode *ip, long newinum, int isrmdir)
2978 {
2979 	int offset;
2980 	struct diradd *dap;
2981 	struct dirrem *dirrem, *prevdirrem;
2982 	struct pagedep *pagedep;
2983 	struct inodedep *inodedep;
2984 
2985 	offset = blkoff(dp->i_fs, dp->i_offset);
2986 	dap = pool_get(&diradd_pool, PR_WAITOK | PR_ZERO);
2987 	dap->da_list.wk_type = D_DIRADD;
2988 	dap->da_state = DIRCHG | ATTACHED | DEPCOMPLETE;
2989 	dap->da_offset = offset;
2990 	dap->da_newinum = newinum;
2991 
2992 	/*
2993 	 * Allocate a new dirrem and ACQUIRE_LOCK.
2994 	 */
2995 	dirrem = newdirrem(bp, dp, ip, isrmdir, &prevdirrem);
2996 	pagedep = dirrem->dm_pagedep;
2997 	/*
2998 	 * The possible values for isrmdir:
2999 	 *	0 - non-directory file rename
3000 	 *	1 - directory rename within same directory
3001 	 *	inum - directory rename to new directory of given inode number
3002 	 * When renaming to a new directory, we are both deleting and
3003 	 * creating a new directory entry, so the link count on the new
3004 	 * directory should not change. Thus we do not need the followup
3005 	 * dirrem which is usually done in handle_workitem_remove. We set
3006 	 * the DIRCHG flag to tell handle_workitem_remove to skip the
3007 	 * followup dirrem.
3008 	 */
3009 	if (isrmdir > 1)
3010 		dirrem->dm_state |= DIRCHG;
3011 
3012 	/*
3013 	 * If the COMPLETE flag is clear, then there were no active
3014 	 * entries and we want to roll back to the previous inode until
3015 	 * the new inode is committed to disk. If the COMPLETE flag is
3016 	 * set, then we have deleted an entry that never made it to disk.
3017 	 * If the entry we deleted resulted from a name change, then the old
3018 	 * inode reference still resides on disk. Any rollback that we do
3019 	 * needs to be to that old inode (returned to us in prevdirrem). If
3020 	 * the entry we deleted resulted from a create, then there is
3021 	 * no entry on the disk, so we want to roll back to zero rather
3022 	 * than the uncommitted inode. In either of the COMPLETE cases we
3023 	 * want to immediately free the unwritten and unreferenced inode.
3024 	 */
3025 	if ((dirrem->dm_state & COMPLETE) == 0) {
3026 		dap->da_previous = dirrem;
3027 	} else {
3028 		if (prevdirrem != NULL) {
3029 			dap->da_previous = prevdirrem;
3030 		} else {
3031 			dap->da_state &= ~DIRCHG;
3032 			dap->da_pagedep = pagedep;
3033 		}
3034 		dirrem->dm_dirinum = pagedep->pd_ino;
3035 		add_to_worklist(&dirrem->dm_list);
3036 	}
3037 	/*
3038 	 * Link into its inodedep. Put it on the id_bufwait list if the inode
3039 	 * is not yet written. If it is written, do the post-inode write
3040 	 * processing to put it on the id_pendinghd list.
3041 	 */
3042 	if (inodedep_lookup(dp->i_fs, newinum, DEPALLOC, &inodedep) == 0 ||
3043 	    (inodedep->id_state & ALLCOMPLETE) == ALLCOMPLETE) {
3044 		dap->da_state |= COMPLETE;
3045 		LIST_INSERT_HEAD(&pagedep->pd_pendinghd, dap, da_pdlist);
3046 		WORKLIST_INSERT(&inodedep->id_pendinghd, &dap->da_list);
3047 	} else {
3048 		LIST_INSERT_HEAD(&pagedep->pd_diraddhd[DIRADDHASH(offset)],
3049 		    dap, da_pdlist);
3050 		WORKLIST_INSERT(&inodedep->id_bufwait, &dap->da_list);
3051 	}
3052 	FREE_LOCK(&lk);
3053 }
3054
3055 /*
3056  * Called whenever the link count on an inode is changed.
3057  * It creates an inode dependency so that the new reference(s)
3058  * to the inode cannot be committed to disk until the updated
3059  * inode has been written.
3060  */
3061 /* the inode with the increased link count */
3062 /* do background work or not */
3063 void
3064 softdep_change_linkcnt(struct inode *ip, int nodelay)
3065 {
3066 	struct inodedep *inodedep;
3067 	int flags;
3068 
3069 	/*
3070 	 * If requested, do not allow background work to happen.
3071 	 */
3072 	flags = DEPALLOC;
3073 	if (nodelay)
3074 		flags |= NODELAY;
3075 
3076 	ACQUIRE_LOCK(&lk);
3077 
3078 	(void) inodedep_lookup(ip->i_fs, ip->i_number, flags, &inodedep);
3079 	if (DIP(ip, nlink) < ip->i_effnlink) {
3080 		FREE_LOCK(&lk);
3081 		panic("softdep_change_linkcnt: bad delta");
3082 	}
3083 
3084 	inodedep->id_nlinkdelta = DIP(ip, nlink) - ip->i_effnlink;
3085 
3086 	FREE_LOCK(&lk);
3087 }
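/*
 * [Editor's example, not part of the source] id_nlinkdelta records how
 * far the on-disk link count runs ahead of the effective one. E.g.
 * after unlinking one name of a file with two links, DIP(ip, nlink)
 * is still 2 while ip->i_effnlink is 1, so id_nlinkdelta = 1 until
 * the updated inode block reaches disk.
 */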
3088
3089 /*
3090  * This workitem decrements the inode's link count.
3091  * If the link count reaches zero, the file is removed.
3092  */
3093 STATIC void
3094 handle_workitem_remove(struct dirrem *dirrem)
3095 {
3096 	struct proc *p = CURPROC;	/* XXX */
3097 	struct inodedep *inodedep;
3098 	struct vnode *vp;
3099 	struct inode *ip;
3100 	ufsino_t oldinum;
3101 	int error;
3102 
3103 	if ((error = VFS_VGET(dirrem->dm_mnt, dirrem->dm_oldinum, &vp)) != 0) {
3104 		softdep_error("handle_workitem_remove: vget", error);
3105 		return;
3106 	}
3107 	ip = VTOI(vp);
3108 	ACQUIRE_LOCK(&lk);
3109 	if ((inodedep_lookup(ip->i_fs, dirrem->dm_oldinum, 0, &inodedep))
3110 	    == 0) {
3111 		FREE_LOCK(&lk);
3112 		panic("handle_workitem_remove: lost inodedep");
3113 	}
3114 	/*
3115 	 * Normal file deletion.
3116 	 */
3117 	if ((dirrem->dm_state & RMDIR) == 0) {
3118 		DIP_ADD(ip, nlink, -1);
3119 		ip->i_flag |= IN_CHANGE;
3120 		if (DIP(ip, nlink) < ip->i_effnlink) {
3121 			FREE_LOCK(&lk);
3122 			panic("handle_workitem_remove: bad file delta");
3123 		}
3124 		inodedep->id_nlinkdelta = DIP(ip, nlink) - ip->i_effnlink;
3125 		FREE_LOCK(&lk);
3126 		vput(vp);
3127 		num_dirrem -= 1;
3128 		WORKITEM_FREE(dirrem, D_DIRREM);
3129 		return;
3130 	}
3131 	/*
3132 	 * Directory deletion. Decrement reference count for both the
3133 	 * just deleted parent directory entry and the reference for ".".
3134 	 * Next truncate the directory to length zero. When the
3135 	 * truncation completes, arrange to have the reference count on
3136 	 * the parent decremented to account for the loss of "..".
3137 	 */
3138 	DIP_ADD(ip, nlink, -2);
3139 	ip->i_flag |= IN_CHANGE;
3140 	if (DIP(ip, nlink) < ip->i_effnlink)
3141 		panic("handle_workitem_remove: bad dir delta");
3142 	inodedep->id_nlinkdelta = DIP(ip, nlink) - ip->i_effnlink;
3143 	FREE_LOCK(&lk);
3144 	if ((error = UFS_TRUNCATE(ip, (off_t)0, 0, p->p_ucred)) != 0)
3145 		softdep_error("handle_workitem_remove: truncate", error);
3146 	/*
3147 	 * Rename a directory to a new parent. Since we are both deleting
3148 	 * and creating a new directory entry, the link count on the new
3149 	 * directory should not change. Thus we skip the followup dirrem.
3150 	 */
3151 	if (dirrem->dm_state & DIRCHG) {
3152 		vput(vp);
3153 		num_dirrem -= 1;
3154 		WORKITEM_FREE(dirrem, D_DIRREM);
3155 		return;
3156 	}
3157 	/*
3158 	 * If the inodedep does not exist, then the zero'ed inode has
3159 	 * been written to disk. If the allocated inode has never been
3160 	 * written to disk, then the on-disk inode is zero'ed. In either
3161 	 * case we can remove the file immediately.
3162 	 */
3163 	ACQUIRE_LOCK(&lk);
3164 	dirrem->dm_state = 0;
3165 	oldinum = dirrem->dm_oldinum;
3166 	dirrem->dm_oldinum = dirrem->dm_dirinum;
3167 	if (inodedep_lookup(ip->i_fs, oldinum, 0, &inodedep) == 0 ||
3168 	    check_inode_unwritten(inodedep)) {
3169 		FREE_LOCK(&lk);
3170 		vput(vp);
3171 		handle_workitem_remove(dirrem);
3172 		return;
3173 	}
3174 	WORKLIST_INSERT(&inodedep->id_inowait, &dirrem->dm_list);
3175 	FREE_LOCK(&lk);
3176 	ip->i_flag |= IN_CHANGE;
3177 	UFS_UPDATE(VTOI(vp), 0);
3178 	vput(vp);
3179 }
3180
3181 /*
3182  * Inode de-allocation dependencies.
3183  *
3184  * When an inode's link count is reduced to zero, it can be de-allocated. We
3185  * found it convenient to postpone de-allocation until after the inode is
3186  * written to disk with its new link count (zero). At this point, all of the
3187  * on-disk inode's block pointers are nullified and, with careful dependency
3188  * list ordering, all dependencies related to the inode will be satisfied and
3189  * the corresponding dependency structures de-allocated. So, if/when the
3190  * inode is reused, there will be no mixing of old dependencies with new
3191  * ones. This artificial dependency is set up by the block de-allocation
3192  * procedure above (softdep_setup_freeblocks) and completed by the
3193  * following procedure.
3194  */
3195 STATIC void
3196 handle_workitem_freefile(struct freefile *freefile)
3197 {
3198 	struct fs *fs;
3199 	struct vnode vp;
3200 	struct inode tip;
3201 #ifdef DEBUG
3202 	struct inodedep *idp;
3203 #endif
3204 	int error;
3205 
3206 	fs = VFSTOUFS(freefile->fx_mnt)->um_fs;
3207 #ifdef DEBUG
3208 	ACQUIRE_LOCK(&lk);
3209 	error = inodedep_lookup(fs, freefile->fx_oldinum, 0, &idp);
3210 	FREE_LOCK(&lk);
3211 	if (error)
3212 		panic("handle_workitem_freefile: inodedep survived");
3213 #endif
3214 	tip.i_ump = VFSTOUFS(freefile->fx_mnt);
3215 	tip.i_dev = freefile->fx_devvp->v_rdev;
3216 	tip.i_fs = fs;
3217 	tip.i_vnode = &vp;
3218 	vp.v_data = &tip;
3219 
3220 	if ((error = ffs_freefile(&tip, freefile->fx_oldinum,
3221 	    freefile->fx_mode)) != 0) {
3222 		softdep_error("handle_workitem_freefile", error);
3223 	}
3224 	WORKITEM_FREE(freefile, D_FREEFILE);
3225 }
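/*
 * [Editor's sketch, not part of the source] Putting the pieces
 * together, the deferred de-allocation runs roughly as:
 *
 *	softdep_setup_freeblocks()/softdep_freefile() record the work;
 *	the inode block is written with a zero'ed dinode;
 *	handle_workitem_freeblocks() returns the blocks;
 *	handle_workitem_freefile() (above) returns the inode itself;
 *
 * so ffs_freefile() never runs while any on-disk structure could
 * still reference the inode.
 */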
3226
3227/*
3228 * Disk writes.
3229 *
3230 * The dependency structures constructed above are most actively used when file
3231 * system blocks are written to disk. No constraints are placed on when a
3232 * block can be written, but unsatisfied update dependencies are made safe by
3233 * modifying (or replacing) the source memory for the duration of the disk
3234 * write. When the disk write completes, the memory block is again brought
3235 * up-to-date.
3236 *
3237 * In-core inode structure reclamation.
3238 *
3239 * Because there are a finite number of "in-core" inode structures, they are
3240 * reused regularly. By transferring all inode-related dependencies to the
3241 * in-memory inode block and indexing them separately (via "inodedep"s), we
3242 * can allow "in-core" inode structures to be reused at any time and avoid
3243 * any increase in contention.
3244 *
3245 * Called just before entering the device driver to initiate a new disk I/O.
3246 * The buffer must be locked, thus, no I/O completion operations can occur
3247 * while we are manipulating its associated dependencies.
3248 */
3249/* structure describing disk write to occur */
3250void
3251softdep_disk_io_initiation(struct buf *bp)
3252{
3253 struct worklist *wk, *nextwk;
3254 struct indirdep *indirdep;
3255 struct inodedep *inodedep;
3256 struct buf *sbp;
3257
3258 /*
3259 * We only care about write operations. There should never
3260 * be dependencies for reads.
3261 */
3262 if (bp->b_flags & B_READ0x00008000)
3263 panic("softdep_disk_io_initiation: read");
3264
3265 ACQUIRE_LOCK(&lk)(&lk)->lkt_spl = splraise(0x3);
3266
3267 /*
3268 * Do any necessary pre-I/O processing.
3269 */
3270 for (wk = LIST_FIRST(&bp->b_dep)((&bp->b_dep)->lh_first); wk; wk = nextwk) {
3271 nextwk = LIST_NEXT(wk, wk_list)((wk)->wk_list.le_next);
3272 switch (wk->wk_type) {
3273
3274 case D_PAGEDEP0:
3275 initiate_write_filepage(WK_PAGEDEP(wk)((struct pagedep *)(wk)), bp);
3276 continue;
3277
3278 case D_INODEDEP1:
3279 inodedep = WK_INODEDEP(wk)((struct inodedep *)(wk));
3280 if (inodedep->id_fs->fs_magic == FS_UFS1_MAGIC0x011954)
3281 initiate_write_inodeblock_ufs1(inodedep, bp);
3282#ifdef FFS21
3283 else
3284 initiate_write_inodeblock_ufs2(inodedep, bp);
3285#endif
3286 continue;
3287
3288 case D_INDIRDEP5:
3289 indirdep = WK_INDIRDEP(wk)((struct indirdep *)(wk));
3290 if (indirdep->ir_stateir_list.wk_state & GOINGAWAY0x0100)
3291 panic("disk_io_initiation: indirdep gone");
3292 /*
3293 * If there are no remaining dependencies, this
3294 * will be writing the real pointers, so the
3295 * dependency can be freed.
3296 */
3297 if (LIST_FIRST(&indirdep->ir_deplisthd)((&indirdep->ir_deplisthd)->lh_first) == NULL((void *)0)) {
3298 sbp = indirdep->ir_savebp;
3299 sbp->b_flags |= B_INVAL0x00000800 | B_NOCACHE0x00001000;
3300 /* inline expand WORKLIST_REMOVE(wk); */
3301 wk->wk_state &= ~ONWORKLIST0x8000;
3302 LIST_REMOVE(wk, wk_list);
3303 WORKITEM_FREE(indirdep, D_INDIRDEP)softdep_freequeue_add((struct worklist *)indirdep);
3304 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3305 brelse(sbp);
3306 ACQUIRE_LOCK(&lk)(&lk)->lkt_spl = splraise(0x3);
3307 continue;
3308 }
3309 /*
3310 * Replace up-to-date version with safe version.
3311 */
3312 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3313 indirdep->ir_saveddata = malloc(bp->b_bcount,
3314 M_INDIRDEP83, M_WAITOK0x0001);
3315 ACQUIRE_LOCK(&lk)(&lk)->lkt_spl = splraise(0x3);
3316 indirdep->ir_stateir_list.wk_state &= ~ATTACHED0x0001;
3317 indirdep->ir_stateir_list.wk_state |= UNDONE0x0002;
3318 memcpy(indirdep->ir_saveddata, bp->b_data, bp->b_bcount);
3319 memcpy(bp->b_data, indirdep->ir_savebp->b_data,
3320     bp->b_bcount);
3321 continue;
3322
3323 case D_MKDIR11:
3324 case D_BMSAFEMAP3:
3325 case D_ALLOCDIRECT4:
3326 case D_ALLOCINDIR6:
3327 continue;
3328
3329 default:
3330 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3331 panic("handle_disk_io_initiation: Unexpected type %s",
3332     TYPENAME(wk->wk_type));
3333 /* NOTREACHED */
3334 }
3335 }
3336
3337 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3338}
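
[Editor's note] The indirdep handling above preserves the up-to-date block contents in ir_saveddata and writes the older, dependency-free copy from ir_savebp instead. A minimal userland sketch of that save-and-substitute step; buf, safe, and savedp are illustrative stand-ins for bp->b_data, ir_savebp->b_data, and ir_saveddata:

#include <stdlib.h>
#include <string.h>

int
swap_in_safe_copy(char *buf, const char *safe, char **savedp, size_t len)
{
	*savedp = malloc(len);		/* the kernel uses M_WAITOK and cannot fail */
	if (*savedp == NULL)
		return (-1);
	memcpy(*savedp, buf, len);	/* remember the up-to-date contents */
	memcpy(buf, safe, len);		/* substitute the dependency-free copy */
	return (0);
}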
3339
3340/*
3341 * Called from within the procedure above to deal with unsatisfied
3342 * allocation dependencies in a directory. The buffer must be locked,
3343 * thus, no I/O completion operations can occur while we are
3344 * manipulating its associated dependencies.
3345 */
3346STATIC void
3347initiate_write_filepage(struct pagedep *pagedep, struct buf *bp)
3348{
3349 struct diradd *dap;
3350 struct direct *ep;
3351 int i;
3352
3353 if (pagedep->pd_statepd_list.wk_state & IOSTARTED0x0200) {
3354 /*
3355 * This can only happen if there is a driver that does not
3356 * understand chaining. Here biodone will reissue the call
3357 * to strategy for the incomplete buffers.
3358 */
3359 printf("initiate_write_filepage: already started\n");
3360 return;
3361 }
3362 pagedep->pd_statepd_list.wk_state |= IOSTARTED0x0200;
3363 for (i = 0; i < DAHASHSZ6; i++) {
3364 LIST_FOREACH(dap, &pagedep->pd_diraddhd[i], da_pdlist) {
3365 ep = (struct direct *)
3366 ((char *)bp->b_data + dap->da_offset);
3367 if (ep->d_ino != dap->da_newinum) {
3368 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3369 panic("%s: dir inum %u != new %u",
3370 "initiate_write_filepage",
3371 ep->d_ino, dap->da_newinum);
3372 }
3373 if (dap->da_stateda_list.wk_state & DIRCHG0x0080)
3374 ep->d_ino = dap->da_previousda_un.dau_previous->dm_oldinum;
3375 else
3376 ep->d_ino = 0;
3377 dap->da_stateda_list.wk_state &= ~ATTACHED0x0001;
3378 dap->da_stateda_list.wk_state |= UNDONE0x0002;
3379 }
3380 }
3381}
3382
3383/*
3384 * Called from within the procedure above to deal with unsatisfied
3385 * allocation dependencies in an inodeblock. The buffer must be
3386 * locked, thus, no I/O completion operations can occur while we
3387 * are manipulating its associated dependencies.
3388 */
3389/* The inode block */
3390STATIC void
3391initiate_write_inodeblock_ufs1(struct inodedep *inodedep, struct buf *bp)
3392{
3393 struct allocdirect *adp, *lastadp;
3394 struct ufs1_dinode *dp;
3395 struct fs *fs;
3396#ifdef DIAGNOSTIC1
3397 daddr_t prevlbn = 0;
3398 int32_t d1, d2;
3399#endif
3400 int i, deplist;
3401
3402 if (inodedep->id_stateid_list.wk_state & IOSTARTED0x0200) {
3403 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3404 panic("initiate_write_inodeblock: already started");
3405 }
3406 inodedep->id_stateid_list.wk_state |= IOSTARTED0x0200;
3407 fs = inodedep->id_fs;
3408 dp = (struct ufs1_dinode *)bp->b_data +
3409 ino_to_fsbo(fs, inodedep->id_ino)((inodedep->id_ino) % ((fs)->fs_inopb));
3410 /*
3411 * If the bitmap is not yet written, then the allocated
3412 * inode cannot be written to disk.
3413 */
3414 if ((inodedep->id_stateid_list.wk_state & DEPCOMPLETE0x0008) == 0) {
3415 if (inodedep->id_savedino1id_un.idu_savedino1 != NULL((void *)0)) {
3416 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3417 panic("initiate_write_inodeblock: already doing I/O");
3418 }
3419 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3420 inodedep->id_savedino1id_un.idu_savedino1 = malloc(sizeof(struct ufs1_dinode),
3421 M_INODEDEP79, M_WAITOK0x0001);
3422 inodedep->id_unsize = sizeof(struct ufs1_dinode);
3423 ACQUIRE_LOCK(&lk)(&lk)->lkt_spl = splraise(0x3);
3424 *inodedep->id_savedino1id_un.idu_savedino1 = *dp;
3425 memset(dp, 0, sizeof(struct ufs1_dinode))__builtin_memset((dp), (0), (sizeof(struct ufs1_dinode)));
3426 return;
3427 }
3428 /*
3429 * If no dependencies, then there is nothing to roll back.
3430 */
3431 inodedep->id_savedsize = dp->di_size;
3432 if (TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first) == NULL((void *)0))
3433 return;
3434 /*
3435 * Set the dependencies to busy.
3436 */
3437 for (deplist = 0, adp = TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first); adp;
3438 adp = TAILQ_NEXT(adp, ad_next)((adp)->ad_next.tqe_next)) {
3439#ifdef DIAGNOSTIC1
3440 if (deplist != 0 && prevlbn >= adp->ad_lbn) {
3441 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3442 panic("softdep_write_inodeblock: lbn order");
3443 }
3444 prevlbn = adp->ad_lbn;
3445 if (adp->ad_lbn < NDADDR12 &&
3446 (d1 = dp->di_db[adp->ad_lbn]) != (d2 = adp->ad_newblkno)) {
3447 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3448 panic("%s: direct pointer #%lld mismatch %d != %d",
3449 "softdep_write_inodeblock", (long long)adp->ad_lbn,
3450 d1, d2);
3451 }
3452 if (adp->ad_lbn >= NDADDR12 &&
3453 (d1 = dp->di_ib[adp->ad_lbn - NDADDR12]) !=
3454 (d2 = adp->ad_newblkno)) {
3455 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3456 panic("%s: indirect pointer #%lld mismatch %d != %d",
3457 "softdep_write_inodeblock", (long long)(adp->ad_lbn -
3458 NDADDR12), d1, d2);
3459 }
3460 deplist |= 1 << adp->ad_lbn;
3461 if ((adp->ad_statead_list.wk_state & ATTACHED0x0001) == 0) {
3462 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3463 panic("softdep_write_inodeblock: Unknown state 0x%x",
3464 adp->ad_statead_list.wk_state);
3465 }
3466#endif /* DIAGNOSTIC */
3467 adp->ad_statead_list.wk_state &= ~ATTACHED0x0001;
3468 adp->ad_statead_list.wk_state |= UNDONE0x0002;
3469 }
3470 /*
3471 * The on-disk inode cannot claim to be any larger than the last
3472 * fragment that has been written. Otherwise, the on-disk inode
3473 * might have fragments that were not the last block in the file
3474 * which would corrupt the filesystem.
3475 */
3476 for (lastadp = NULL((void *)0), adp = TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first); adp;
3477 lastadp = adp, adp = TAILQ_NEXT(adp, ad_next)((adp)->ad_next.tqe_next)) {
3478 if (adp->ad_lbn >= NDADDR12)
3479 break;
3480 dp->di_db[adp->ad_lbn] = adp->ad_oldblkno;
3481 /* keep going until hitting a rollback to a frag */
3482 if (adp->ad_oldsize == 0 || adp->ad_oldsize == fs->fs_bsize)
3483 continue;
3484 dp->di_size = fs->fs_bsize * adp->ad_lbn + adp->ad_oldsize;
3485 for (i = adp->ad_lbn + 1; i < NDADDR12; i++) {
3486#ifdef DIAGNOSTIC1
3487 if (dp->di_db[i] != 0 && (deplist & (1 << i)) == 0) {
3488 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3489 panic("softdep_write_inodeblock: lost dep1");
3490 }
3491#endif /* DIAGNOSTIC */
3492 dp->di_db[i] = 0;
3493 }
3494 for (i = 0; i < NIADDR3; i++) {
3495#ifdef DIAGNOSTIC1
3496 if (dp->di_ib[i] != 0 &&
3497 (deplist & ((1 << NDADDR12) << i)) == 0) {
3498 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3499 panic("softdep_write_inodeblock: lost dep2");
3500 }
3501#endif /* DIAGNOSTIC */
3502 dp->di_ib[i] = 0;
3503 }
3504 return;
3505 }
3506 /*
3507 * If we have zero'ed out the last allocated block of the file,
3508 * roll back the size to the last currently allocated block.
3509 * We know that this last allocated block is full-sized, as
3510 * we already checked for fragments in the loop above.
3511 */
3512 if (lastadp != NULL((void *)0) &&
3513 dp->di_size <= (lastadp->ad_lbn + 1) * fs->fs_bsize) {
3514 for (i = lastadp->ad_lbn; i >= 0; i--)
3515 if (dp->di_db[i] != 0)
3516 break;
3517 dp->di_size = (i + 1) * fs->fs_bsize;
3518 }
3519 /*
3520 * The only dependencies are for indirect blocks.
3521 *
3522 * The file size for indirect block additions is not guaranteed.
3523 * Such a guarantee would be non-trivial to achieve. The conventional
3524 * synchronous write implementation also does not make this guarantee.
3525 * Fsck should catch and fix discrepancies. Arguably, the file size
3526 * can be over-estimated without destroying integrity when the file
3527 * moves into the indirect blocks (i.e., is large). If we want to
3528 * postpone fsck, we are stuck with this argument.
3529 */
3530 for (; adp; adp = TAILQ_NEXT(adp, ad_next)((adp)->ad_next.tqe_next))
3531 dp->di_ib[adp->ad_lbn - NDADDR12] = 0;
3532}
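
[Editor's note] The DIAGNOSTIC checks above track which lbns carry dependencies in the deplist bitmask: a direct block at lbn n occupies bit n, and indirect block i (whose ad_lbn is NDADDR + i) occupies bit NDADDR + i, hence the (1 << NDADDR) << i test. A standalone sketch with illustrative values:

#include <stdio.h>

#define NDADDR	12	/* direct pointers per dinode, as in the listing */

int
main(void)
{
	int deplist = 0;

	deplist |= 1 << 3;		/* direct block at lbn 3 -> bit 3 */
	deplist |= 1 << (NDADDR + 1);	/* second indirect -> bit 13 */

	/* the test used above for indirect block i == 1 */
	printf("indirect 1 tracked: %d\n",
	    (deplist & ((1 << NDADDR) << 1)) != 0);
	return (0);
}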
3533
3534#ifdef FFS21
3535/*
3536 * Version of initiate_write_inodeblock that handles FFS2 dinodes.
3537 */
3538/* The inode block */
3539STATIC void
3540initiate_write_inodeblock_ufs2(struct inodedep *inodedep, struct buf *bp)
3541{
3542 struct allocdirect *adp, *lastadp;
3543 struct ufs2_dinode *dp;
3544 struct fs *fs = inodedep->id_fs;
3545#ifdef DIAGNOSTIC1
3546 daddr_t prevlbn = -1, d1, d2;
3547#endif
3548 int deplist, i;
3549
3550 if (inodedep->id_stateid_list.wk_state & IOSTARTED0x0200)
3551 panic("initiate_write_inodeblock_ufs2: already started");
3552 inodedep->id_stateid_list.wk_state |= IOSTARTED0x0200;
3553 fs = inodedep->id_fs;
3554 dp = (struct ufs2_dinode *)bp->b_data +
3555 ino_to_fsbo(fs, inodedep->id_ino)((inodedep->id_ino) % ((fs)->fs_inopb));
3556 /*
3557 * If the bitmap is not yet written, then the allocated
3558 * inode cannot be written to disk.
3559 */
3560 if ((inodedep->id_stateid_list.wk_state & DEPCOMPLETE0x0008) == 0) {
3561 if (inodedep->id_savedino2id_un.idu_savedino2 != NULL((void *)0))
3562 panic("initiate_write_inodeblock_ufs2: I/O underway");
3563 inodedep->id_savedino2id_un.idu_savedino2 = malloc(sizeof(struct ufs2_dinode),
3564 M_INODEDEP79, M_WAITOK0x0001);
3565 inodedep->id_unsize = sizeof(struct ufs2_dinode);
3566 *inodedep->id_savedino2id_un.idu_savedino2 = *dp;
3567 memset(dp, 0, sizeof(struct ufs2_dinode))__builtin_memset((dp), (0), (sizeof(struct ufs2_dinode)));
3568 return;
3569 }
3570 /*
3571 * If no dependencies, then there is nothing to roll back.
3572 */
3573 inodedep->id_savedsize = dp->di_size;
3574 if (TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first) == NULL((void *)0))
3575 return;
3576
3577#ifdef notyet
3578 inodedep->id_savedextsize = dp->di_extsize;
3579 if (TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first) == NULL((void *)0) &&
3580 TAILQ_FIRST(&inodedep->id_extupdt)((&inodedep->id_extupdt)->tqh_first) == NULL((void *)0))
3581 return;
3582 /*
3583 * Set the ext data dependencies to busy.
3584 */
3585 for (deplist = 0, adp = TAILQ_FIRST(&inodedep->id_extupdt)((&inodedep->id_extupdt)->tqh_first); adp;
3586 adp = TAILQ_NEXT(adp, ad_next)((adp)->ad_next.tqe_next)) {
3587#ifdef DIAGNOSTIC1
3588 if (deplist != 0 && prevlbn >= adp->ad_lbn) {
3589 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3590 panic("softdep_write_inodeblock: lbn order");
3591 }
3592 prevlbn = adp->ad_lbn;
3593 if ((d1 = dp->di_extb[adp->ad_lbn]) !=
3594 (d2 = adp->ad_newblkno)) {
3595 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3596 panic("%s: direct pointer #%lld mismatch %lld != %lld",
3597 "softdep_write_inodeblock", (long long)adp->ad_lbn,
3598 d1, d2);
3599 }
3600 deplist |= 1 << adp->ad_lbn;
3601 if ((adp->ad_statead_list.wk_state & ATTACHED0x0001) == 0) {
3602 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3603 panic("softdep_write_inodeblock: Unknown state 0x%x",
3604 adp->ad_statead_list.wk_state);
3605 }
3606#endif /* DIAGNOSTIC */
3607 adp->ad_statead_list.wk_state &= ~ATTACHED0x0001;
3608 adp->ad_statead_list.wk_state |= UNDONE0x0002;
3609 }
3610 /*
3611 * The on-disk inode cannot claim to be any larger than the last
3612 * fragment that has been written. Otherwise, the on-disk inode
3613 * might have fragments that were not the last block in the ext
3614 * data which would corrupt the filesystem.
3615 */
3616 for (lastadp = NULL((void *)0), adp = TAILQ_FIRST(&inodedep->id_extupdt)((&inodedep->id_extupdt)->tqh_first); adp;
3617 lastadp = adp, adp = TAILQ_NEXT(adp, ad_next)((adp)->ad_next.tqe_next)) {
3618 dp->di_extb[adp->ad_lbn] = adp->ad_oldblkno;
3619 /* keep going until hitting a rollback to a frag */
3620 if (adp->ad_oldsize == 0 || adp->ad_oldsize == fs->fs_bsize)
3621 continue;
3622 dp->di_extsize = fs->fs_bsize * adp->ad_lbn + adp->ad_oldsize;
3623 for (i = adp->ad_lbn + 1; i < NXADDR2; i++) {
3624#ifdef DIAGNOSTIC1
3625 if (dp->di_extb[i] != 0 && (deplist & (1 << i)) == 0) {
3626 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3627 panic("softdep_write_inodeblock: lost dep1");
3628 }
3629#endif /* DIAGNOSTIC */
3630 dp->di_extb[i] = 0;
3631 }
3632 lastadp = NULL((void *)0);
3633 break;
3634 }
3635 /*
3636 * If we have zero'ed out the last allocated block of the ext
3637 * data, roll back the size to the last currently allocated block.
3638 * We know that this last allocated block is full-sized, as
3639 * we already checked for fragments in the loop above.
3640 */
3641 if (lastadp != NULL((void *)0) &&
3642 dp->di_extsize <= (lastadp->ad_lbn + 1) * fs->fs_bsize) {
3643 for (i = lastadp->ad_lbn; i >= 0; i--)
3644 if (dp->di_extb[i] != 0)
3645 break;
3646 dp->di_extsize = (i + 1) * fs->fs_bsize;
3647 }
3648#endif /* notyet */
3649
3650 /*
3651 * Set the file data dependencies to busy.
3652 */
3653 for (deplist = 0, adp = TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first); adp;
3654 adp = TAILQ_NEXT(adp, ad_next)((adp)->ad_next.tqe_next)) {
3655#ifdef DIAGNOSTIC1
3656 if (deplist != 0 && prevlbn >= adp->ad_lbn) {
3657 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3658 panic("softdep_write_inodeblock: lbn order");
3659 }
3660 prevlbn = adp->ad_lbn;
3661 if (adp->ad_lbn < NDADDR12 &&
3662 (d1 = dp->di_db[adp->ad_lbn]) != (d2 = adp->ad_newblkno)) {
3663 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3664 panic("%s: direct pointer #%lld mismatch %lld != %lld",
3665 "softdep_write_inodeblock", (long long)adp->ad_lbn,
3666 d1, d2);
3667 }
3668 if (adp->ad_lbn >= NDADDR12 &&
3669 (d1 = dp->di_ib[adp->ad_lbn - NDADDR12]) !=
3670 (d2 = adp->ad_newblkno)) {
3671 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3672 panic("%s: indirect pointer #%lld mismatch %lld != %lld",
3673 "softdep_write_inodeblock", (long long)(adp->ad_lbn -
3674 NDADDR12), d1, d2);
3675 }
3676 deplist |= 1 << adp->ad_lbn;
3677 if ((adp->ad_statead_list.wk_state & ATTACHED0x0001) == 0) {
3678 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3679 panic("softdep_write_inodeblock: Unknown state 0x%x",
3680 adp->ad_statead_list.wk_state);
3681 }
3682#endif /* DIAGNOSTIC */
3683 adp->ad_statead_list.wk_state &= ~ATTACHED0x0001;
3684 adp->ad_statead_list.wk_state |= UNDONE0x0002;
3685 }
3686 /*
3687 * The on-disk inode cannot claim to be any larger than the last
3688 * fragment that has been written. Otherwise, the on-disk inode
3689 * might have fragments that were not the last block in the file
3690 * which would corrupt the filesystem.
3691 */
3692 for (lastadp = NULL((void *)0), adp = TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first); adp;
3693 lastadp = adp, adp = TAILQ_NEXT(adp, ad_next)((adp)->ad_next.tqe_next)) {
3694 if (adp->ad_lbn >= NDADDR12)
3695 break;
3696 dp->di_db[adp->ad_lbn] = adp->ad_oldblkno;
3697 /* keep going until hitting a rollback to a frag */
3698 if (adp->ad_oldsize == 0 || adp->ad_oldsize == fs->fs_bsize)
3699 continue;
3700 dp->di_size = fs->fs_bsize * adp->ad_lbn + adp->ad_oldsize;
3701 for (i = adp->ad_lbn + 1; i < NDADDR12; i++) {
3702#ifdef DIAGNOSTIC1
3703 if (dp->di_db[i] != 0 && (deplist & (1 << i)) == 0) {
3704 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3705 panic("softdep_write_inodeblock: lost dep2");
3706 }
3707#endif /* DIAGNOSTIC */
3708 dp->di_db[i] = 0;
3709 }
3710 for (i = 0; i < NIADDR3; i++) {
3711#ifdef DIAGNOSTIC1
3712 if (dp->di_ib[i] != 0 &&
3713 (deplist & ((1 << NDADDR12) << i)) == 0) {
3714 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
3715 panic("softdep_write_inodeblock: lost dep3");
3716 }
3717#endif /* DIAGNOSTIC */
3718 dp->di_ib[i] = 0;
3719 }
3720 return;
3721 }
3722 /*
3723 * If we have zero'ed out the last allocated block of the file,
3724 * roll back the size to the last currently allocated block.
3725 * We know that this last allocated block is full-sized, as
3726 * we already checked for fragments in the loop above.
3727 */
3728 if (lastadp != NULL((void *)0) &&
3729 dp->di_size <= (lastadp->ad_lbn + 1) * fs->fs_bsize) {
3730 for (i = lastadp->ad_lbn; i >= 0; i--)
3731 if (dp->di_db[i] != 0)
3732 break;
3733 dp->di_size = (i + 1) * fs->fs_bsize;
3734 }
3735 /*
3736 * The only dependencies are for indirect blocks.
3737 *
3738 * The file size for indirect block additions is not guaranteed.
3739 * Such a guarantee would be non-trivial to achieve. The conventional
3740 * synchronous write implementation also does not make this guarantee.
3741 * Fsck should catch and fix discrepancies. Arguably, the file size
3742 * can be over-estimated without destroying integrity when the file
3743 * moves into the indirect blocks (i.e., is large). If we want to
3744 * postpone fsck, we are stuck with this argument.
3745 */
3746 for (; adp; adp = TAILQ_NEXT(adp, ad_next)((adp)->ad_next.tqe_next))
3747 dp->di_ib[adp->ad_lbn - NDADDR12] = 0;
3748}
3749#endif /* FFS2 */
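
[Editor's note] Both writers roll the on-disk size back with the same arithmetic: full blocks up to the rolled-back lbn, plus the old fragment at that lbn. A worked instance as a standalone program; the block size and offsets here are made up for illustration:

#include <stdio.h>

int
main(void)
{
	long fs_bsize = 16384;	/* assumed filesystem block size */
	long ad_lbn = 3;	/* block whose old fragment is restored */
	long ad_oldsize = 2048;	/* size of that old fragment */

	/* full blocks 0..ad_lbn-1, plus the old fragment at ad_lbn */
	long di_size = fs_bsize * ad_lbn + ad_oldsize;

	printf("rolled-back di_size = %ld\n", di_size);	/* 51200 */
	return (0);
}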
3750
3751/*
3752 * This routine is called during the completion interrupt
3753 * service routine for a disk write (from the procedure called
3754 * by the device driver to inform the file system caches of
3755 * a request completion). It should be called early in this
3756 * procedure, before the block is made available to other
3757 * processes or other routines are called.
3758 */
3759/* describes the completed disk write */
3760void
3761softdep_disk_write_complete(struct buf *bp)
3762{
3763 struct worklist *wk;
3764 struct workhead reattach;
3765 struct newblk *newblk;
3766 struct allocindir *aip;
3767 struct allocdirect *adp;
3768 struct indirdep *indirdep;
3769 struct inodedep *inodedep;
3770 struct bmsafemap *bmsafemap;
3771
3772 /*
3773 * If an error occurred while doing the write, then the data
3774 * has not hit the disk and the dependencies cannot be unrolled.
3775 */
3776 if ((bp->b_flags & B_ERROR0x00000400) && !(bp->b_flags & B_INVAL0x00000800))
3777 return;
3778
3779#ifdef DEBUG
3780 if (lk.lkt_held != -1)
3781 panic("softdep_disk_write_complete: lock is held");
3782 lk.lkt_held = -2;
3783#endif
3784 LIST_INIT(&reattach);
3785 while ((wk = LIST_FIRST(&bp->b_dep)((&bp->b_dep)->lh_first)) != NULL((void *)0)) {
3786 WORKLIST_REMOVE(wk);
3787 switch (wk->wk_type) {
3788
3789 case D_PAGEDEP0:
3790 if (handle_written_filepage(WK_PAGEDEP(wk)((struct pagedep *)(wk)), bp))
3791 WORKLIST_INSERT(&reattach, wk);
3792 continue;
3793
3794 case D_INODEDEP1:
3795 if (handle_written_inodeblock(WK_INODEDEP(wk)((struct inodedep *)(wk)), bp))
3796 WORKLIST_INSERT(&reattach, wk);
3797 continue;
3798
3799 case D_BMSAFEMAP3:
3800 bmsafemap = WK_BMSAFEMAP(wk)((struct bmsafemap *)(wk));
3801 while ((newblk = LIST_FIRST(&bmsafemap->sm_newblkhd)((&bmsafemap->sm_newblkhd)->lh_first))) {
3802 newblk->nb_state |= DEPCOMPLETE0x0008;
3803 newblk->nb_bmsafemap = NULL((void *)0);
3804 LIST_REMOVE(newblk, nb_deps);
3805 }
3806 while ((adp =
3807 LIST_FIRST(&bmsafemap->sm_allocdirecthd)((&bmsafemap->sm_allocdirecthd)->lh_first))) {
3808 adp->ad_statead_list.wk_state |= DEPCOMPLETE0x0008;
3809 adp->ad_buf = NULL((void *)0);
3810 LIST_REMOVE(adp, ad_deps);
3811 handle_allocdirect_partdone(adp);
3812 }
3813 while ((aip =
3814 LIST_FIRST(&bmsafemap->sm_allocindirhd)((&bmsafemap->sm_allocindirhd)->lh_first))) {
3815 aip->ai_stateai_list.wk_state |= DEPCOMPLETE0x0008;
3816 aip->ai_buf = NULL((void *)0);
3817 LIST_REMOVE(aip, ai_deps);
3818 handle_allocindir_partdone(aip);
3819 }
3820 while ((inodedep =
3821 LIST_FIRST(&bmsafemap->sm_inodedephd)((&bmsafemap->sm_inodedephd)->lh_first)) != NULL((void *)0)) {
3822 inodedep->id_stateid_list.wk_state |= DEPCOMPLETE0x0008;
3823 LIST_REMOVE(inodedep, id_deps);
3824 inodedep->id_buf = NULL((void *)0);
3825 }
3826 WORKITEM_FREE(bmsafemap, D_BMSAFEMAP)softdep_freequeue_add((struct worklist *)bmsafemap);
3827 continue;
3828
3829 case D_MKDIR11:
3830 handle_written_mkdir(WK_MKDIR(wk)((struct mkdir *)(wk)), MKDIR_BODY0x0020);
3831 continue;
3832
3833 case D_ALLOCDIRECT4:
3834 adp = WK_ALLOCDIRECT(wk)((struct allocdirect *)(wk));
3835 adp->ad_statead_list.wk_state |= COMPLETE0x0004;
3836 handle_allocdirect_partdone(adp);
3837 continue;
3838
3839 case D_ALLOCINDIR6:
3840 aip = WK_ALLOCINDIR(wk)((struct allocindir *)(wk));
3841 aip->ai_stateai_list.wk_state |= COMPLETE0x0004;
3842 handle_allocindir_partdone(aip);
3843 continue;
3844
3845 case D_INDIRDEP5:
3846 indirdep = WK_INDIRDEP(wk)((struct indirdep *)(wk));
3847 if (indirdep->ir_stateir_list.wk_state & GOINGAWAY0x0100)
3848 panic("disk_write_complete: indirdep gone");
3849 memcpy(bp->b_data, indirdep->ir_saveddata, bp->b_bcount);
3850 free(indirdep->ir_saveddata, M_INDIRDEP83, bp->b_bcount);
3851 indirdep->ir_saveddata = NULL((void *)0);
3852 indirdep->ir_stateir_list.wk_state &= ~UNDONE0x0002;
3853 indirdep->ir_stateir_list.wk_state |= ATTACHED0x0001;
3854 while ((aip = LIST_FIRST(&indirdep->ir_donehd)((&indirdep->ir_donehd)->lh_first))) {
3855 handle_allocindir_partdone(aip);
3856 if (aip == LIST_FIRST(&indirdep->ir_donehd)((&indirdep->ir_donehd)->lh_first))
3857 panic("disk_write_complete: not gone");
3858 }
3859 WORKLIST_INSERT(&reattach, wk);
3860 if ((bp->b_flags & B_DELWRI0x00000080) == 0)
3861 stat_indir_blk_ptrs++;
3862 buf_dirty(bp);
3863 continue;
3864
3865 default:
3866 panic("handle_disk_write_complete: Unknown type %s",
3867     TYPENAME(wk->wk_type));
3868 /* NOTREACHED */
3869 }
3870 }
3871 /*
3872 * Reattach any requests that must be redone.
3873 */
3874 while ((wk = LIST_FIRST(&reattach)((&reattach)->lh_first)) != NULL((void *)0)) {
3875 WORKLIST_REMOVE(wk);
3876 WORKLIST_INSERT(&bp->b_dep, wk);
3877 }
3878#ifdef DEBUG
3879 if (lk.lkt_held != -2)
3880 panic("softdep_disk_write_complete: lock lost");
3881 lk.lkt_held = -1;
3882#endif
3883}
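
[Editor's note] The routine above drains b_dep completely and rebuilds it from the reattach list, so each handler can decide per item whether the dependency must ride along on a future write of the same buffer. A self-contained sketch of that pattern using <sys/queue.h>; struct item and its redo field are hypothetical stand-ins for a worklist entry and a handler's return value:

#include <sys/queue.h>
#include <stddef.h>

struct item {
	LIST_ENTRY(item) entries;
	int redo;
};
LIST_HEAD(itemhead, item);

void
drain_and_reattach(struct itemhead *deps)
{
	struct itemhead reattach;
	struct item *it;

	LIST_INIT(&reattach);
	/* detach every dependency; collect the ones to be redone */
	while ((it = LIST_FIRST(deps)) != NULL) {
		LIST_REMOVE(it, entries);
		if (it->redo)
			LIST_INSERT_HEAD(&reattach, it, entries);
	}
	/* put the survivors back on the buffer's list */
	while ((it = LIST_FIRST(&reattach)) != NULL) {
		LIST_REMOVE(it, entries);
		LIST_INSERT_HEAD(deps, it, entries);
	}
}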
3884
3885/*
3886 * Called from within softdep_disk_write_complete above. Note that
3887 * this routine is always called from interrupt level with further
3888 * splbio interrupts blocked.
3889 */
3890/* the completed allocdirect */
3891STATIC void
3892handle_allocdirect_partdone(struct allocdirect *adp)
3893{
3894 struct allocdirect *listadp;
3895 struct inodedep *inodedep;
3896 long bsize, delay;
3897
3898 splassert(IPL_BIO);
3899
3900 if ((adp->ad_statead_list.wk_state & ALLCOMPLETE(0x0001 | 0x0004 | 0x0008)) != ALLCOMPLETE(0x0001 | 0x0004 | 0x0008))
3901 return;
3902 if (adp->ad_buf != NULL((void *)0))
3903 panic("handle_allocdirect_partdone: dangling dep");
3904
3905 /*
3906 * The on-disk inode cannot claim to be any larger than the last
3907 * fragment that has been written. Otherwise, the on-disk inode
3908 * might have fragments that were not the last block in the file
3909 * which would corrupt the filesystem. Thus, we cannot free any
3910 * allocdirects after one whose ad_oldblkno claims a fragment as
3911 * these blocks must be rolled back to zero before writing the inode.
3912 * We check the currently active set of allocdirects in id_inoupdt.
3913 */
3914 inodedep = adp->ad_inodedep;
3915 bsize = inodedep->id_fs->fs_bsize;
3916 TAILQ_FOREACH(listadp, &inodedep->id_inoupdt, ad_next) {
3917 /* found our block */
3918 if (listadp == adp)
3919 break;
3920 /* continue if ad_oldlbn is not a fragment */
3921 if (listadp->ad_oldsize == 0 ||
3922 listadp->ad_oldsize == bsize)
3923 continue;
3924 /* hit a fragment */
3925 return;
3926 }
3927 /*
3928 * If we have reached the end of the current list without
3929 * finding the just finished dependency, then it must be
3930 * on the future dependency list. Future dependencies cannot
3931 * be freed until they are moved to the current list.
3932 */
3933 if (listadp == NULL((void *)0)) {
3934#ifdef DEBUG
3935 TAILQ_FOREACH(listadp, &inodedep->id_newinoupdt, ad_next)
3936 /* found our block */
3937 if (listadp == adp)
3938 break;
3939 if (listadp == NULL((void *)0))
3940 panic("handle_allocdirect_partdone: lost dep");
3941#endif /* DEBUG */
3942 return;
3943 }
3944 /*
3945 * If we have found the just finished dependency, then free
3946 * it along with anything that follows it that is complete.
3947 * If the inode still has a bitmap dependency, then it has
3948 * never been written to disk, hence the on-disk inode cannot
3949 * reference the old fragment so we can free it without delay.
3950 */
3951 delay = (inodedep->id_stateid_list.wk_state & DEPCOMPLETE0x0008);
3952 for (; adp; adp = listadp) {
3953 listadp = TAILQ_NEXT(adp, ad_next)((adp)->ad_next.tqe_next);
3954 if ((adp->ad_statead_list.wk_state & ALLCOMPLETE(0x0001 | 0x0004 | 0x0008)) != ALLCOMPLETE(0x0001 | 0x0004 | 0x0008))
3955 return;
3956 free_allocdirect(&inodedep->id_inoupdt, adp, delay);
3957 }
3958}
3959
3960/*
3961 * Called from within softdep_disk_write_complete above. Note that
3962 * this routine is always called from interrupt level with further
3963 * splbio interrupts blocked.
3964 */
3965/* the completed allocindir */
3966STATIC void
3967handle_allocindir_partdone(struct allocindir *aip)
3968{
3969 struct indirdep *indirdep;
3970
3971 splassert(IPL_BIO);
3972
3973 if ((aip->ai_stateai_list.wk_state & ALLCOMPLETE(0x0001 | 0x0004 | 0x0008)) != ALLCOMPLETE(0x0001 | 0x0004 | 0x0008))
3974 return;
3975 if (aip->ai_buf != NULL((void *)0))
3976 panic("handle_allocindir_partdone: dangling dependency");
3977 indirdep = aip->ai_indirdep;
3978 if (indirdep->ir_stateir_list.wk_state & UNDONE0x0002) {
3979 LIST_REMOVE(aip, ai_next);
3980 LIST_INSERT_HEAD(&indirdep->ir_donehd, aip, ai_next);
3981 return;
3982 }
3983 if (indirdep->ir_stateir_list.wk_state & UFS1FMT0x2000)
3984 ((int32_t *)indirdep->ir_savebp->b_data)[aip->ai_offset] =
3985 aip->ai_newblkno;
3986 else
3987 ((int64_t *)indirdep->ir_savebp->b_data)[aip->ai_offset] =
3988 aip->ai_newblkno;
3989 LIST_REMOVE(aip, ai_next);
3990 if (aip->ai_freefrag != NULL((void *)0))
3991 add_to_worklist(&aip->ai_freefrag->ff_list);
3992 WORKITEM_FREE(aip, D_ALLOCINDIR)softdep_freequeue_add((struct worklist *)aip);
3993}
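
[Editor's note] The committed pointer is stored at the width the on-disk format dictates, 32-bit for UFS1 indirect blocks and 64-bit for UFS2, which is what the UFS1FMT test above selects. A reduced sketch of that store:

#include <stdint.h>

void
commit_indir_ptr(void *blk, int offset, int64_t newblkno, int ufs1fmt)
{
	if (ufs1fmt)
		((int32_t *)blk)[offset] = (int32_t)newblkno;
	else
		((int64_t *)blk)[offset] = newblkno;
}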
3994
3995/*
3996 * Called from within softdep_disk_write_complete above to restore
3997 * in-memory inode block contents to their most up-to-date state. Note
3998 * that this routine is always called from interrupt level with further
3999 * splbio interrupts blocked.
4000 */
4001/* buffer containing the inode block */
4002STATIC int
4003handle_written_inodeblock(struct inodedep *inodedep, struct buf *bp)
4004{
4005 struct worklist *wk, *filefree;
4006 struct allocdirect *adp, *nextadp;
4007 struct ufs1_dinode *dp1 = NULL((void *)0);
4008 struct ufs2_dinode *dp2 = NULL((void *)0);
4009 int hadchanges, fstype;
4010
4011 splassert(IPL_BIO);
4012
4013 if ((inodedep->id_stateid_list.wk_state & IOSTARTED0x0200) == 0)
4014 panic("handle_written_inodeblock: not started");
4015 inodedep->id_stateid_list.wk_state &= ~IOSTARTED0x0200;
4016
4017 if (inodedep->id_fs->fs_magic == FS_UFS1_MAGIC0x011954) {
4018 fstype = UM_UFS11;
4019 dp1 = (struct ufs1_dinode *) bp->b_data +
4020 ino_to_fsbo(inodedep->id_fs, inodedep->id_ino)((inodedep->id_ino) % ((inodedep->id_fs)->fs_inopb));
4021 } else {
4022 fstype = UM_UFS22;
4023 dp2 = (struct ufs2_dinode *) bp->b_data +
4024 ino_to_fsbo(inodedep->id_fs, inodedep->id_ino)((inodedep->id_ino) % ((inodedep->id_fs)->fs_inopb));
4025 }
4026
4027 /*
4028 * If we had to rollback the inode allocation because of
4029 * bitmaps being incomplete, then simply restore it.
4030 * Keep the block dirty so that it will not be reclaimed until
4031 * all associated dependencies have been cleared and the
4032 * corresponding updates written to disk.
4033 */
4034 if (inodedep->id_savedino1id_un.idu_savedino1 != NULL((void *)0)) {
4035 if (fstype == UM_UFS11)
4036 *dp1 = *inodedep->id_savedino1id_un.idu_savedino1;
4037 else
4038 *dp2 = *inodedep->id_savedino2id_un.idu_savedino2;
4039 free(inodedep->id_savedino1id_un.idu_savedino1, M_INODEDEP79, inodedep->id_unsize);
4040 inodedep->id_savedino1id_un.idu_savedino1 = NULL((void *)0);
4041 if ((bp->b_flags & B_DELWRI0x00000080) == 0)
4042 stat_inode_bitmap++;
4043 buf_dirty(bp);
4044 return (1);
4045 }
4046 inodedep->id_stateid_list.wk_state |= COMPLETE0x0004;
4047 /*
4048 * Roll forward anything that had to be rolled back before
4049 * the inode could be updated.
4050 */
4051 hadchanges = 0;
4052 for (adp = TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first); adp; adp = nextadp) {
4053 nextadp = TAILQ_NEXT(adp, ad_next)((adp)->ad_next.tqe_next);
4054 if (adp->ad_statead_list.wk_state & ATTACHED0x0001)
4055 panic("handle_written_inodeblock: new entry");
4056 if (fstype == UM_UFS11) {
4057 if (adp->ad_lbn < NDADDR12) {
4058 if (dp1->di_db[adp->ad_lbn] != adp->ad_oldblkno)
4059 panic("%s: %s #%lld mismatch %d != "
4060 "%lld",
4061 "handle_written_inodeblock",
4062 "direct pointer",
4063 (long long)adp->ad_lbn,
4064 dp1->di_db[adp->ad_lbn],
4065 (long long)adp->ad_oldblkno);
4066 dp1->di_db[adp->ad_lbn] = adp->ad_newblkno;
4067 } else {
4068 if (dp1->di_ib[adp->ad_lbn - NDADDR12] != 0)
4069 panic("%s: %s #%lld allocated as %d",
4070 "handle_written_inodeblock",
4071 "indirect pointer",
4072 (long long)(adp->ad_lbn - NDADDR12),
4073 dp1->di_ib[adp->ad_lbn - NDADDR12]);
4074 dp1->di_ib[adp->ad_lbn - NDADDR12] =
4075 adp->ad_newblkno;
4076 }
4077 } else {
4078 if (adp->ad_lbn < NDADDR12) {
4079 if (dp2->di_db[adp->ad_lbn] != adp->ad_oldblkno)
4080 panic("%s: %s #%lld mismatch %lld != "
4081 "%lld", "handle_written_inodeblock",
4082 "direct pointer",
4083 (long long)adp->ad_lbn,
4084 dp2->di_db[adp->ad_lbn],
4085 (long long)adp->ad_oldblkno);
4086 dp2->di_db[adp->ad_lbn] = adp->ad_newblkno;
4087 } else {
4088 if (dp2->di_ib[adp->ad_lbn - NDADDR12] != 0)
4089 panic("%s: %s #%lld allocated as %lld",
4090 "handle_written_inodeblock",
4091 "indirect pointer",
4092 (long long)(adp->ad_lbn - NDADDR12),
4093 dp2->di_ib[adp->ad_lbn - NDADDR12]);
4094 dp2->di_ib[adp->ad_lbn - NDADDR12] =
4095 adp->ad_newblkno;
4096 }
4097 }
4098 adp->ad_statead_list.wk_state &= ~UNDONE0x0002;
4099 adp->ad_statead_list.wk_state |= ATTACHED0x0001;
4100 hadchanges = 1;
4101 }
4102 if (hadchanges && (bp->b_flags & B_DELWRI0x00000080) == 0)
4103 stat_direct_blk_ptrs++;
4104 /*
4105 * Reset the file size to its most up-to-date value.
4106 */
4107 if (inodedep->id_savedsize == -1)
4108 panic("handle_written_inodeblock: bad size");
4109
4110 if (fstype == UM_UFS11) {
4111 if (dp1->di_size != inodedep->id_savedsize) {
4112 dp1->di_size = inodedep->id_savedsize;
4113 hadchanges = 1;
4114 }
4115 } else {
4116 if (dp2->di_size != inodedep->id_savedsize) {
4117 dp2->di_size = inodedep->id_savedsize;
4118 hadchanges = 1;
4119 }
4120 }
4121 inodedep->id_savedsize = -1;
4122 /*
4123 * If there were any rollbacks in the inode block, then it must be
4124 * marked dirty so that it will eventually get written back in
4125 * its correct form.
4126 */
4127 if (hadchanges)
4128 buf_dirty(bp);
4129 /*
4130 * Process any allocdirects that completed during the update.
4131 */
4132 if ((adp = TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first)) != NULL((void *)0))
4133 handle_allocdirect_partdone(adp);
4134 /*
4135 * Process deallocations that were held pending until the
4136 * inode had been written to disk. Freeing of the inode
4137 * is delayed until after all blocks have been freed to
4138 * avoid creation of new <vfsid, inum, lbn> triples
4139 * before the old ones have been deleted.
4140 */
4141 filefree = NULL((void *)0);
4142 while ((wk = LIST_FIRST(&inodedep->id_bufwait)((&inodedep->id_bufwait)->lh_first)) != NULL((void *)0)) {
4143 WORKLIST_REMOVE(wk);
4144 switch (wk->wk_type) {
4145
4146 case D_FREEFILE9:
4147 /*
4148 * We defer adding filefree to the worklist until
4149 * all other additions have been made to ensure
4150 * that it will be done after all the old blocks
4151 * have been freed.
4152 */
4153 if (filefree != NULL((void *)0))
4154 panic("handle_written_inodeblock: filefree");
4155 filefree = wk;
4156 continue;
4157
4158 case D_MKDIR11:
4159 handle_written_mkdir(WK_MKDIR(wk)((struct mkdir *)(wk)), MKDIR_PARENT0x0010);
4160 continue;
4161
4162 case D_DIRADD10:
4163 diradd_inode_written(WK_DIRADD(wk)((struct diradd *)(wk)), inodedep);
4164 continue;
4165
4166 case D_FREEBLKS8:
4167 wk->wk_state |= COMPLETE0x0004;
4168 if ((wk->wk_state & ALLCOMPLETE(0x0001 | 0x0004 | 0x0008)) != ALLCOMPLETE(0x0001 | 0x0004 | 0x0008))
4169 continue;
4170 /* FALLTHROUGH */
4171 case D_FREEFRAG7:
4172 case D_DIRREM12:
4173 add_to_worklist(wk);
4174 continue;
4175
4176 case D_NEWDIRBLK13:
4177 free_newdirblk(WK_NEWDIRBLK(wk)((struct newdirblk *)(wk)));
4178 continue;
4179
4180 default:
4181 panic("handle_written_inodeblock: Unknown type %s",
4182     TYPENAME(wk->wk_type));
4183 /* NOTREACHED */
4184 }
4185 }
4186 if (filefree != NULL((void *)0)) {
4187 if (free_inodedep(inodedep) == 0)
4188 panic("handle_written_inodeblock: live inodedep");
4189 add_to_worklist(filefree);
4190 return (0);
4191 }
4192
4193 /*
4194 * If no outstanding dependencies, free it.
4195 */
4196 if (free_inodedep(inodedep) ||
4197 TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first) == NULL((void *)0))
4198 return (0);
4199 return (hadchanges);
4200}
4201
4202/*
4203 * Process a diradd entry after its dependent inode has been written.
4204 * This routine must be called with splbio interrupts blocked.
4205 */
4206STATIC void
4207diradd_inode_written(struct diradd *dap, struct inodedep *inodedep)
4208{
4209 struct pagedep *pagedep;
4210
4211 splassert(IPL_BIO);
4212
4213 dap->da_stateda_list.wk_state |= COMPLETE0x0004;
4214 if ((dap->da_stateda_list.wk_state & ALLCOMPLETE(0x0001 | 0x0004 | 0x0008)) == ALLCOMPLETE(0x0001 | 0x0004 | 0x0008)) {
4215 if (dap->da_stateda_list.wk_state & DIRCHG0x0080)
4216 pagedep = dap->da_previousda_un.dau_previous->dm_pagedepdm_un.dmu_pagedep;
4217 else
4218 pagedep = dap->da_pagedepda_un.dau_pagedep;
4219 LIST_REMOVE(dap, da_pdlist);
4220 LIST_INSERT_HEAD(&pagedep->pd_pendinghd, dap, da_pdlist);
4221 }
4222 WORKLIST_INSERT(&inodedep->id_pendinghd, &dap->da_list);
4223}
4224
4225/*
4226 * Handle the completion of a mkdir dependency.
4227 */
4228STATIC void
4229handle_written_mkdir(struct mkdir *mkdir, int type)
4230{
4231 struct diradd *dap;
4232 struct pagedep *pagedep;
4233
4234 splassert(IPL_BIO);
4235
4236 if (mkdir->md_statemd_list.wk_state != type)
4237 panic("handle_written_mkdir: bad type");
4238 dap = mkdir->md_diradd;
4239 dap->da_stateda_list.wk_state &= ~type;
4240 if ((dap->da_stateda_list.wk_state & (MKDIR_PARENT0x0010 | MKDIR_BODY0x0020)) == 0)
4241 dap->da_stateda_list.wk_state |= DEPCOMPLETE0x0008;
4242 if ((dap->da_stateda_list.wk_state & ALLCOMPLETE(0x0001 | 0x0004 | 0x0008)) == ALLCOMPLETE(0x0001 | 0x0004 | 0x0008)) {
4243 if (dap->da_stateda_list.wk_state & DIRCHG0x0080)
4244 pagedep = dap->da_previousda_un.dau_previous->dm_pagedepdm_un.dmu_pagedep;
4245 else
4246 pagedep = dap->da_pagedepda_un.dau_pagedep;
4247 LIST_REMOVE(dap, da_pdlist);
4248 LIST_INSERT_HEAD(&pagedep->pd_pendinghd, dap, da_pdlist);
4249 }
4250 LIST_REMOVE(mkdir, md_mkdirs);
4251 WORKITEM_FREE(mkdir, D_MKDIR)softdep_freequeue_add((struct worklist *)mkdir);
4252}
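
[Editor's note] A sketch of the state transition above, using the flag values shown in this listing: a new directory's diradd waits on both its own first block (MKDIR_BODY) and its parent's inode (MKDIR_PARENT), and only when both writes have completed does it become DEPCOMPLETE:

#define MKDIR_PARENT	0x0010
#define MKDIR_BODY	0x0020
#define DEPCOMPLETE	0x0008

unsigned int
mkdir_written(unsigned int da_state, unsigned int type)
{
	da_state &= ~type;	/* this half of the dependency is done */
	if ((da_state & (MKDIR_PARENT | MKDIR_BODY)) == 0)
		da_state |= DEPCOMPLETE;
	return (da_state);
}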
4253
4254/*
4255 * Called from within softdep_disk_write_complete above.
4256 * A write operation was just completed. Removed inodes can
4257 * now be freed and associated block pointers may be committed.
4258 * Note that this routine is always called from interrupt level
4259 * with further splbio interrupts blocked.
4260 */
4261/* buffer containing the written page */
4262STATIC int
4263handle_written_filepage(struct pagedep *pagedep, struct buf *bp)
4264{
4265 struct dirrem *dirrem;
4266 struct diradd *dap, *nextdap;
4267 struct direct *ep;
4268 int i, chgs;
4269
4270 splassert(IPL_BIO);
4271
4272 if ((pagedep->pd_statepd_list.wk_state & IOSTARTED0x0200) == 0)
4273 panic("handle_written_filepage: not started");
4274 pagedep->pd_statepd_list.wk_state &= ~IOSTARTED0x0200;
4275 /*
4276 * Process any directory removals that have been committed.
4277 */
4278 while ((dirrem = LIST_FIRST(&pagedep->pd_dirremhd)((&pagedep->pd_dirremhd)->lh_first)) != NULL((void *)0)) {
4279 LIST_REMOVE(dirrem, dm_next);
4280 dirrem->dm_dirinumdm_un.dmu_dirinum = pagedep->pd_ino;
4281 add_to_worklist(&dirrem->dm_list);
4282 }
4283 /*
4284 * Free any directory additions that have been committed.
4285 * If it is a newly allocated block, we have to wait until
4286 * the on-disk directory inode claims the new block.
4287 */
4288 if ((pagedep->pd_statepd_list.wk_state & NEWBLOCK0x0800) == 0)
4289 while ((dap = LIST_FIRST(&pagedep->pd_pendinghd)((&pagedep->pd_pendinghd)->lh_first)) != NULL((void *)0))
4290 free_diradd(dap);
4291 /*
4292 * Uncommitted directory entries must be restored.
4293 */
4294 for (chgs = 0, i = 0; i < DAHASHSZ6; i++) {
4295 for (dap = LIST_FIRST(&pagedep->pd_diraddhd[i])((&pagedep->pd_diraddhd[i])->lh_first); dap;
4296 dap = nextdap) {
4297 nextdap = LIST_NEXT(dap, da_pdlist)((dap)->da_pdlist.le_next);
4298 if (dap->da_stateda_list.wk_state & ATTACHED0x0001)
4299 panic("handle_written_filepage: attached");
4300 ep = (struct direct *)
4301 ((char *)bp->b_data + dap->da_offset);
4302 ep->d_ino = dap->da_newinum;
4303 dap->da_stateda_list.wk_state &= ~UNDONE0x0002;
4304 dap->da_stateda_list.wk_state |= ATTACHED0x0001;
4305 chgs = 1;
4306 /*
4307 * If the inode referenced by the directory has
4308 * been written out, then the dependency can be
4309 * moved to the pending list.
4310 */
4311 if ((dap->da_stateda_list.wk_state & ALLCOMPLETE(0x0001 | 0x0004 | 0x0008)) == ALLCOMPLETE(0x0001 | 0x0004 | 0x0008)) {
4312 LIST_REMOVE(dap, da_pdlist);
4313 LIST_INSERT_HEAD(&pagedep->pd_pendinghd, dap,
4314     da_pdlist);
4315 }
4316 }
4317 }
4318 /*
4319 * If there were any rollbacks in the directory, then it must be
4320 * marked dirty so that it will eventually get written back in
4321 * its correct form.
4322 */
4323 if (chgs) {
4324 if ((bp->b_flags & B_DELWRI0x00000080) == 0)
4325 stat_dir_entry++;
4326 buf_dirty(bp);
4327 return (1);
4328 }
4329 /*
4330 * If we are not waiting for a new directory block to be
4331 * claimed by its inode, then the pagedep will be freed.
4332 * Otherwise it will remain to track any new entries on
4333 * the page in case they are fsync'ed.
4334 */
4335 if ((pagedep->pd_statepd_list.wk_state & NEWBLOCK0x0800) == 0) {
4336 LIST_REMOVE(pagedep, pd_hash);
4337 WORKITEM_FREE(pagedep, D_PAGEDEP)softdep_freequeue_add((struct worklist *)pagedep);
4338 }
4339 return (0);
4340}
4341
4342/*
4343 * Writing back in-core inode structures.
4344 *
4345 * The file system only accesses an inode's contents when it occupies an
4346 * "in-core" inode structure. These "in-core" structures are separate from
4347 * the page frames used to cache inode blocks. Only the latter are
4348 * transferred to/from the disk. So, when the updated contents of the
4349 * "in-core" inode structure are copied to the corresponding in-memory inode
4350 * block, the dependencies are also transferred. The following procedure is
4351 * called when copying a dirty "in-core" inode to a cached inode block.
4352 */
4353
4354/*
4355 * Called when an inode is loaded from disk. If the effective link count
4356 * differed from the actual link count when it was last flushed, then we
4357 * need to ensure that the correct effective link count is put back.
4358 */
4359/* the "in_core" copy of the inode */
4360void
4361softdep_load_inodeblock(struct inode *ip)
4362{
4363 struct inodedep *inodedep;
4364
4365 /*
4366 * Check for alternate nlink count.
4367 */
4368 ip->i_effnlink = DIP(ip, nlink);
4369 ACQUIRE_LOCK(&lk)(&lk)->lkt_spl = splraise(0x3);
4370 if (inodedep_lookup(ip->i_fsinode_u.fs, ip->i_number, 0, &inodedep) == 0) {
4371 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
4372 return;
4373 }
4374 ip->i_effnlink -= inodedep->id_nlinkdelta;
4375 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
4376}
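
[Editor's note] The adjustment above recovers the effective link count: the on-disk count minus the removals committed in memory but not yet written. For example, a file with two links on disk and one pending unlink loads with an effective count of one. A trivial sketch, names illustrative:

int
effective_nlink(int ondisk_nlink, int nlinkdelta)
{
	return (ondisk_nlink - nlinkdelta);
}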
4377
4378/*
4379 * This routine is called just before the "in-core" inode
4380 * information is to be copied to the in-memory inode block.
4381 * Recall that an inode block contains several inodes. If
4382 * the force flag is set, then the dependencies will be
4383 * cleared so that the update can always be made. Note that
4384 * the buffer is locked when this routine is called, so we
4385 * will never be in the middle of writing the inode block
4386 * to disk.
4387 */
4388/* the "in_core" copy of the inode */
4389/* the buffer containing the inode block */
4390/* nonzero => update must be allowed */
4391void
4392softdep_update_inodeblock(struct inode *ip, struct buf *bp, int waitfor)
4393{
4394 struct inodedep *inodedep;
4395 struct worklist *wk;
4396 int error, gotit;
4397
4398 /*
4399 * If the effective link count is not equal to the actual link
4400 * count, then we must track the difference in an inodedep while
4401 * the inode is (potentially) tossed out of the cache. Otherwise,
4402 * if there is no existing inodedep, then there are no dependencies
4403 * to track.
4404 */
4405 ACQUIRE_LOCK(&lk)(&lk)->lkt_spl = splraise(0x3);
4406 if (inodedep_lookup(ip->i_fsinode_u.fs, ip->i_number, 0, &inodedep) == 0) {
4407 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
4408 if (ip->i_effnlink != DIP(ip, nlink))
4409 panic("softdep_update_inodeblock: bad link count");
4410 return;
4411 }
4412 if (inodedep->id_nlinkdelta != DIP(ip, nlink) - ip->i_effnlink) {
4413 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
4414 panic("softdep_update_inodeblock: bad delta");
4415 }
4416 /*
4417 * Changes have been initiated. Anything depending on these
4418 * changes cannot occur until this inode has been written.
4419 */
4420 inodedep->id_stateid_list.wk_state &= ~COMPLETE0x0004;
4421 if ((inodedep->id_stateid_list.wk_state & ONWORKLIST0x8000) == 0)
4422 WORKLIST_INSERT(&bp->b_dep, &inodedep->id_list);
4423 /*
4424 * Any new dependencies associated with the incore inode must
4425 * now be moved to the list associated with the buffer holding
4426 * the in-memory copy of the inode. Once merged process any
4427 * allocdirects that are completed by the merger.
4428 */
4429 merge_inode_lists(inodedep);
4430 if (TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first) != NULL((void *)0))
4431 handle_allocdirect_partdone(TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first));
4432 /*
4433 * Now that the inode has been pushed into the buffer, the
4434 * operations dependent on the inode being written to disk
4435 * can be moved to the id_bufwait so that they will be
4436 * processed when the buffer I/O completes.
4437 */
4438 while ((wk = LIST_FIRST(&inodedep->id_inowait)((&inodedep->id_inowait)->lh_first)) != NULL((void *)0)) {
4439 WORKLIST_REMOVE(wk);
4440 WORKLIST_INSERT(&inodedep->id_bufwait, wk);
4441 }
4442 /*
4443 * Newly allocated inodes cannot be written until the bitmap
4444 * that allocates them has been written (indicated by
4445 * DEPCOMPLETE being set in id_state). If we are doing a
4446 * forced sync (e.g., an fsync on a file), we force the bitmap
4447 * to be written so that the update can be done.
4448 */
4449 do {
4450 if ((inodedep->id_stateid_list.wk_state & DEPCOMPLETE0x0008) != 0 || waitfor == 0) {
4451 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
4452 return;
4453 }
4454 bp = inodedep->id_buf;
4455 gotit = getdirtybuf(bp, MNT_WAIT1);
4456 } while (gotit == -1);
4457 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
4458 if (gotit && (error = bwrite(bp)) != 0)
4459 softdep_error("softdep_update_inodeblock: bwrite", error);
4460 if ((inodedep->id_stateid_list.wk_state & DEPCOMPLETE0x0008) == 0)
4461 panic("softdep_update_inodeblock: update failed");
4462}
4463
4464/*
4465 * Merge the new inode dependency list (id_newinoupdt) into the old
4466 * inode dependency list (id_inoupdt). This routine must be called
4467 * with splbio interrupts blocked.
4468 */
4469STATIC void
4470merge_inode_lists(struct inodedep *inodedep)
4471{
4472 struct allocdirect *listadp, *newadp;
4473
4474 splassert(IPL_BIO);
4475
4476 newadp = TAILQ_FIRST(&inodedep->id_newinoupdt)((&inodedep->id_newinoupdt)->tqh_first);
4477 for (listadp = TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first); listadp && newadp;) {
4478 if (listadp->ad_lbn < newadp->ad_lbn) {
4479 listadp = TAILQ_NEXT(listadp, ad_next)((listadp)->ad_next.tqe_next);
4480 continue;
4481 }
4482 TAILQ_REMOVE(&inodedep->id_newinoupdt, newadp, ad_next);
4483 TAILQ_INSERT_BEFORE(listadp, newadp, ad_next);
4484 if (listadp->ad_lbn == newadp->ad_lbn) {
4485 allocdirect_merge(&inodedep->id_inoupdt, newadp,
4486 listadp);
4487 listadp = newadp;
4488 }
4489 newadp = TAILQ_FIRST(&inodedep->id_newinoupdt)((&inodedep->id_newinoupdt)->tqh_first);
4490 }
4491 TAILQ_CONCAT(&inodedep->id_inoupdt, &inodedep->id_newinoupdt, ad_next);
4492}
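
[Editor's note] merge_inode_lists() above is a classic merge of two lbn-sorted lists, with the twist that colliding lbns are combined via allocdirect_merge(). A self-contained sketch of the ordering logic using plain arrays; collisions are simply kept adjacent here:

#include <stdio.h>

/* Merge two ascending lbn arrays into out; returns the merged count. */
int
merge_lbns(const int *a, int na, const int *b, int nb, int *out)
{
	int i = 0, j = 0, n = 0;

	while (i < na && j < nb)
		out[n++] = (a[i] <= b[j]) ? a[i++] : b[j++];
	while (i < na)
		out[n++] = a[i++];
	while (j < nb)
		out[n++] = b[j++];
	return (n);
}

int
main(void)
{
	int cur[] = { 0, 2, 5 }, fresh[] = { 1, 2, 7 }, out[6];
	int i, n = merge_lbns(cur, 3, fresh, 3, out);

	for (i = 0; i < n; i++)
		printf("%d ", out[i]);	/* prints: 0 1 2 2 5 7 */
	printf("\n");
	return (0);
}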
4493
4494/*
4495 * If we are doing an fsync, then we must ensure that any directory
4496 * entries for the inode have been written after the inode gets to disk.
4497 */
4498/* the "in_core" copy of the inode */
4499int
4500softdep_fsync(struct vnode *vp)
4501{
4502 struct inodedep *inodedep;
4503 struct pagedep *pagedep;
4504 struct worklist *wk;
4505 struct diradd *dap;
4506 struct mount *mnt;
4507 struct vnode *pvp;
4508 struct inode *ip;
4509 struct inode *pip;
4510 struct buf *bp;
4511 struct fs *fs;
4512 struct proc *p = CURPROC; /* XXX */
4513 int error, flushparent;
4514 ufsino_t parentino;
4515 daddr_t lbn;
4516
4517 ip = VTOI(vp)((struct inode *)(vp)->v_data);
4518 fs = ip->i_fsinode_u.fs;
4519 ACQUIRE_LOCK(&lk)(&lk)->lkt_spl = splraise(0x3);
4520 if (inodedep_lookup(fs, ip->i_number, 0, &inodedep) == 0) {
4521 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
4522 return (0);
4523 }
4524 if (LIST_FIRST(&inodedep->id_inowait)((&inodedep->id_inowait)->lh_first) != NULL((void *)0) ||
4525 LIST_FIRST(&inodedep->id_bufwait)((&inodedep->id_bufwait)->lh_first) != NULL((void *)0) ||
4526 TAILQ_FIRST(&inodedep->id_inoupdt)((&inodedep->id_inoupdt)->tqh_first) != NULL((void *)0) ||
4527 TAILQ_FIRST(&inodedep->id_newinoupdt)((&inodedep->id_newinoupdt)->tqh_first) != NULL((void *)0)) {
4528 FREE_LOCK(&lk)spllower((&lk)->lkt_spl);
4529 panic("softdep_fsync: pending ops");
4530 }
4531 for (error = 0, flushparent = 0; ; ) {
Although the value stored to 'flushparent' is used in the enclosing expression, the value is never actually read from 'flushparent'
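
The store flagged here is indeed dead: every read of flushparent (the test guarding UFS_UPDATE at line 4596) is preceded on the same iteration by the unconditional assignment at lines 4555-4559, and the paths that leave the loop before that assignment never read the variable. A minimal fix, offered as a sketch rather than as the change the tree actually took, is to drop the initializer and let the in-loop assignment be the only store:

    -	for (error = 0, flushparent = 0; ; ) {
    +	for (error = 0; ; ) {

If a compiler then warns that flushparent may be used uninitialized, narrowing the variable's scope to the loop body (declaring it just inside the for) makes the definite assignment obvious to both tools and readers.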
4532         if ((wk = LIST_FIRST(&inodedep->id_pendinghd)) == NULL)
4533             break;
4534         if (wk->wk_type != D_DIRADD) {
4535             FREE_LOCK(&lk);
4536             panic("softdep_fsync: Unexpected type %s",
4537                 TYPENAME(wk->wk_type));
4538         }
4539         dap = WK_DIRADD(wk);
4540         /*
4541          * Flush our parent if this directory entry has a MKDIR_PARENT
4542          * dependency or is contained in a newly allocated block.
4543          */
4544         if (dap->da_state & DIRCHG)
4545             pagedep = dap->da_previous->dm_pagedep;
4546         else
4547             pagedep = dap->da_pagedep;
4548         mnt = pagedep->pd_mnt;
4549         parentino = pagedep->pd_ino;
4550         lbn = pagedep->pd_lbn;
4551         if ((dap->da_state & (MKDIR_BODY | COMPLETE)) != COMPLETE) {
4552             FREE_LOCK(&lk);
4553             panic("softdep_fsync: dirty");
4554         }
4555         if ((dap->da_state & MKDIR_PARENT) ||
4556             (pagedep->pd_state & NEWBLOCK))
4557             flushparent = 1;
4558         else
4559             flushparent = 0;
4560         /*
4561          * If we are being fsync'ed as part of vgone'ing this vnode,
4562          * then we will not be able to release and recover the
4563          * vnode below, so we just have to give up on writing its
4564          * directory entry out. It will eventually be written, just
4565          * not now, but then the user was not asking to have it
4566          * written, so we are not breaking any promises.
4567          */
4568         mtx_enter(&vnode_mtx);
4569         if (vp->v_lflag & VXLOCK) {
4570             mtx_leave(&vnode_mtx);
4571             break;
4572         }
4573         mtx_leave(&vnode_mtx);
4574         /*
4575          * We prevent deadlock by always fetching inodes from the
4576          * root, moving down the directory tree. Thus, when fetching
4577          * our parent directory, we must unlock ourselves before
4578          * requesting the lock on our parent. See the comment in
4579          * ufs_lookup for details on possible races.
4580          */
4581         FREE_LOCK(&lk);
4582         VOP_UNLOCK(vp);
4583         error = VFS_VGET(mnt, parentino, &pvp);
4584         vn_lock(vp, LK_EXCLUSIVE | LK_RETRY);
4585         if (error != 0)
4586             return (error);
4587         /*
4588          * All MKDIR_PARENT dependencies and all the NEWBLOCK pagedeps
4589          * that are contained in direct blocks will be resolved by
4590          * doing a UFS_UPDATE. Pagedeps contained in indirect blocks
4591          * may require a complete sync'ing of the directory. So, we
4592          * try the cheap and fast UFS_UPDATE first, and if that fails,
4593          * then we do the slower VOP_FSYNC of the directory.
4594          */
4595         pip = VTOI(pvp);
4596         if (flushparent) {
4597             error = UFS_UPDATE(pip, 1);
4598             if (error) {
4599                 vput(pvp);
4600                 return (error);
4601             }
4602             if (pagedep->pd_state & NEWBLOCK) {
4603                 error = VOP_FSYNC(pvp, p->p_ucred, MNT_WAIT, p);
4604                 if (error) {
4605                     vput(pvp);
4606                     return (error);
4607                 }
4608             }
4609         }
4610         /*
4611          * Flush directory page containing the inode's name.
4612          */
4613         error = bread(pvp, lbn, fs->fs_bsize, &bp);
4614         if (error == 0) {
4615             bp->b_bcount = blksize(fs, pip, lbn);
4616             error = bwrite(bp);
4617         } else
4618             brelse(bp);
4619         vput(pvp);
4620         if (error != 0)
4621             return (error);
4622         ACQUIRE_LOCK(&lk);
4623         if (inodedep_lookup(fs, ip->i_number, 0, &inodedep) == 0)
4624             break;
4625     }
4626     FREE_LOCK(&lk);
4627     return (0);
4628 }
4629
4630 /*
4631  * Flush all the dirty bitmaps associated with the block device
4632  * before flushing the rest of the dirty blocks so as to reduce
4633  * the number of dependencies that will have to be rolled back.
4634  */
4635 void
4636 softdep_fsync_mountdev(struct vnode *vp, int waitfor)
4637 {
4638     struct buf *bp, *nbp;
4639     struct worklist *wk;
4640
4641     if (!vn_isdisk(vp, NULL))
4642         panic("softdep_fsync_mountdev: vnode not a disk");
4643     ACQUIRE_LOCK(&lk);
4644     LIST_FOREACH_SAFE(bp, &vp->v_dirtyblkhd, b_vnbufs, nbp) {
4645         /*
4646          * If it is already scheduled, skip to the next buffer.
4647          */
4648         splassert(IPL_BIO);
4649         if (bp->b_flags & B_BUSY)
4650             continue;
4651
4652         if ((bp->b_flags & B_DELWRI) == 0) {
4653             FREE_LOCK(&lk);
4654             panic("softdep_fsync_mountdev: not dirty");
4655         }
4656         /*
4657          * We are only interested in bitmaps with outstanding
4658          * dependencies.
4659          */
4660         if ((wk = LIST_FIRST(&bp->b_dep)) == NULL ||
4661             wk->wk_type != D_BMSAFEMAP) {
4662             continue;
4663         }
4664         bremfree(bp);
4665         buf_acquire(bp);
4666         FREE_LOCK(&lk);
4667         (void) bawrite(bp);
4668         ACQUIRE_LOCK(&lk);
4669         /*
4670          * Since we may have slept during the I/O, we need
4671          * to start from a known point.
4672          */
4673         nbp = LIST_FIRST(&vp->v_dirtyblkhd);
4674     }
4675     if (waitfor == MNT_WAIT)
4676         drain_output(vp, 1);
4677     FREE_LOCK(&lk);
4678 }
4679
4680 /*
4681  * This routine is called when we are trying to synchronously flush a
4682  * file. This routine must eliminate any filesystem metadata dependencies
4683  * so that the syncing routine can succeed by pushing the dirty blocks
4684  * associated with the file. If any I/O errors occur, they are returned.
4685  */
4686 int
4687 softdep_sync_metadata(struct vop_fsync_args *ap)
4688 {
4689     struct vnode *vp = ap->a_vp;
4690     struct pagedep *pagedep;
4691     struct allocdirect *adp;
4692     struct allocindir *aip;
4693     struct buf *bp, *nbp;
4694     struct worklist *wk;
4695     int i, gotit, error, waitfor;
4696
4697     /*
4698      * Check whether this vnode is involved in a filesystem
4699      * that is doing soft dependency processing.
4700      */
4701     if (!vn_isdisk(vp, NULL)) {
4702         if (!DOINGSOFTDEP(vp))
4703             return (0);
4704     } else
4705         if (vp->v_specmountpoint == NULL ||
4706             (vp->v_specmountpoint->mnt_flag & MNT_SOFTDEP) == 0)
4707             return (0);
4708     /*
4709      * Ensure that any direct block dependencies have been cleared.
4710      */
4711     ACQUIRE_LOCK(&lk);
4712     if ((error = flush_inodedep_deps(VTOI(vp)->i_fs, VTOI(vp)->i_number))) {
4713         FREE_LOCK(&lk);
4714         return (error);
4715     }
4716     /*
4717      * For most files, the only metadata dependencies are the
4718      * cylinder group maps that allocate their inode or blocks.
4719      * The block allocation dependencies can be found by traversing
4720      * the dependency lists for any buffers that remain on their
4721      * dirty buffer list. The inode allocation dependency will
4722      * be resolved when the inode is updated with MNT_WAIT.
4723      * This work is done in two passes. The first pass grabs most
4724      * of the buffers and begins asynchronously writing them. The
4725      * only way to wait for these asynchronous writes is to sleep
4726      * on the filesystem vnode which may stay busy for a long time
4727      * if the filesystem is active. So, instead, we make a second
4728      * pass over the dependencies blocking on each write. In the
4729      * usual case we will be blocking against a write that we
4730      * initiated, so when it is done the dependency will have been
4731      * resolved. Thus the second pass is expected to end quickly.
4732      */
4733     waitfor = MNT_NOWAIT;
4734 top:
4735     /*
4736      * We must wait for any I/O in progress to finish so that
4737      * all potential buffers on the dirty list will be visible.
4738      */
4739     drain_output(vp, 1);
4740     bp = LIST_FIRST(&vp->v_dirtyblkhd);
4741     gotit = getdirtybuf(bp, MNT_WAIT);
4742     if (gotit == 0) {
4743         FREE_LOCK(&lk);
4744         return (0);
4745     } else if (gotit == -1)
4746         goto top;
4747 loop:
4748     /*
4749      * As we hold the buffer locked, none of its dependencies
4750      * will disappear.
4751      */
4752     LIST_FOREACH(wk, &bp->b_dep, wk_list) {
4753         switch (wk->wk_type) {
4754
4755         case D_ALLOCDIRECT:
4756             adp = WK_ALLOCDIRECT(wk);
4757             if (adp->ad_state & DEPCOMPLETE)
4758                 break;
4759             nbp = adp->ad_buf;
4760             gotit = getdirtybuf(nbp, waitfor);
4761             if (gotit == 0)
4762                 break;
4763             else if (gotit == -1)
4764                 goto loop;
4765             FREE_LOCK(&lk);
4766             if (waitfor == MNT_NOWAIT) {
4767                 bawrite(nbp);
4768             } else if ((error = VOP_BWRITE(nbp)) != 0) {
4769                 bawrite(bp);
4770                 return (error);
4771             }
4772             ACQUIRE_LOCK(&lk);
4773             break;
4774
4775         case D_ALLOCINDIR:
4776             aip = WK_ALLOCINDIR(wk);
4777             if (aip->ai_state & DEPCOMPLETE)
4778                 break;
4779             nbp = aip->ai_buf;
4780             gotit = getdirtybuf(nbp, waitfor);
4781             if (gotit == 0)
4782                 break;
4783             else if (gotit == -1)
4784                 goto loop;
4785             FREE_LOCK(&lk);
4786             if (waitfor == MNT_NOWAIT) {
4787                 bawrite(nbp);
4788             } else if ((error = VOP_BWRITE(nbp)) != 0) {
4789                 bawrite(bp);
4790                 return (error);
4791             }
4792             ACQUIRE_LOCK(&lk);
4793             break;
4794
4795         case D_INDIRDEP:
4796         restart:
4797
4798             LIST_FOREACH(aip, &WK_INDIRDEP(wk)->ir_deplisthd, ai_next) {
4799                 if (aip->ai_state & DEPCOMPLETE)
4800                     continue;
4801                 nbp = aip->ai_buf;
4802                 if (getdirtybuf(nbp, MNT_WAIT) <= 0)
4803                     goto restart;
4804                 FREE_LOCK(&lk);
4805                 if ((error = VOP_BWRITE(nbp)) != 0) {
4806                     bawrite(bp);
4807                     return (error);
4808                 }
4809                 ACQUIRE_LOCK(&lk);
4810                 goto restart;
4811             }
4812             break;
4813
4814         case D_INODEDEP:
4815             if ((error = flush_inodedep_deps(WK_INODEDEP(wk)->id_fs,
4816                 WK_INODEDEP(wk)->id_ino)) != 0) {
4817                 FREE_LOCK(&lk);
4818                 bawrite(bp);
4819                 return (error);
4820             }
4821             break;
4822
4823         case D_PAGEDEP:
4824             /*
4825              * We are trying to sync a directory that may
4826              * have dependencies on both its own metadata
4827              * and/or dependencies on the inodes of any
4828              * recently allocated files. We walk its diradd
4829              * lists pushing out the associated inode.
4830              */
4831             pagedep = WK_PAGEDEP(wk);
4832             for (i = 0; i < DAHASHSZ; i++) {
4833                 if (LIST_FIRST(&pagedep->pd_diraddhd[i]) ==
4834                     NULL)
4835                     continue;
4836                 if ((error =
4837                     flush_pagedep_deps(vp, pagedep->pd_mnt,
4838                     &pagedep->pd_diraddhd[i]))) {
4839                     FREE_LOCK(&lk);
4840                     bawrite(bp);
4841                     return (error);
4842                 }
4843             }
4844             break;
4845
4846         case D_MKDIR:
4847             /*
4848              * This case should never happen if the vnode has
4849              * been properly sync'ed. However, if this function
4850              * is used at a place where the vnode has not yet
4851              * been sync'ed, this dependency can show up. So,
4852              * rather than panic, just flush it.
4853              */
4854             nbp = WK_MKDIR(wk)->md_buf;
4855             KASSERT(bp != nbp);
4856             gotit = getdirtybuf(nbp, waitfor);
4857             if (gotit == 0)
4858                 break;
4859             else if (gotit == -1)
4860                 goto loop;
4861             FREE_LOCK(&lk);
4862             if (waitfor == MNT_NOWAIT) {
4863                 bawrite(nbp);
4864             } else if ((error = VOP_BWRITE(nbp)) != 0) {
4865                 bawrite(bp);
4866                 return (error);
4867             }
4868             ACQUIRE_LOCK(&lk);
4869             break;
4870
4871         case D_BMSAFEMAP:
4872             /*
4873              * This case should never happen if the vnode has
4874              * been properly sync'ed. However, if this function
4875              * is used at a place where the vnode has not yet
4876              * been sync'ed, this dependency can show up. So,
4877              * rather than panic, just flush it.
4878              */
4879             nbp = WK_BMSAFEMAP(wk)->sm_buf;
4880             if (bp == nbp)
4881                 break;
4882             gotit = getdirtybuf(nbp, waitfor);
4883             if (gotit == 0)
4884                 break;
4885             else if (gotit == -1)
4886                 goto loop;
4887             FREE_LOCK(&lk);
4888             if (waitfor == MNT_NOWAIT) {
4889                 bawrite(nbp);
4890             } else if ((error = VOP_BWRITE(nbp)) != 0) {
4891                 bawrite(bp);
4892                 return (error);
4893             }
4894             ACQUIRE_LOCK(&lk);
4895             break;
4896
4897         default:
4898             FREE_LOCK(&lk);
4899             panic("softdep_sync_metadata: Unknown type %s",
4900                 TYPENAME(wk->wk_type));
4901             /* NOTREACHED */
4902         }
4903     }
4904     do {
4905         nbp = LIST_NEXT(bp, b_vnbufs);
4906         gotit = getdirtybuf(nbp, MNT_WAIT);
4907     } while (gotit == -1);
4908     FREE_LOCK(&lk);
4909     bawrite(bp);
4910     ACQUIRE_LOCK(&lk);
4911     if (nbp != NULL) {
4912         bp = nbp;
4913         goto loop;
4914     }
4915     /*
4916      * The brief unlock is to allow any pent up dependency
4917      * processing to be done. Then proceed with the second pass.
4918      */
4919     if (waitfor == MNT_NOWAIT) {
4920         waitfor = MNT_WAIT;
4921         FREE_LOCK(&lk);
4922         ACQUIRE_LOCK(&lk);
4923         goto top;
4924     }
4925
4926     /*
4927      * If we have managed to get rid of all the dirty buffers,
4928      * then we are done. For certain directories and block
4929      * devices, we may need to do further work.
4930      *
4931      * We must wait for any I/O in progress to finish so that
4932      * all potential buffers on the dirty list will be visible.
4933      */
4934     drain_output(vp, 1);
4935     if (LIST_EMPTY(&vp->v_dirtyblkhd)) {
4936         FREE_LOCK(&lk);
4937         return (0);
4938     }
4939
4940     FREE_LOCK(&lk);
4941     /*
4942      * If we are trying to sync a block device, some of its buffers may
4943      * contain metadata that cannot be written until the contents of some
4944      * partially written files have been written to disk. The only easy
4945      * way to accomplish this is to sync the entire filesystem (luckily
4946      * this happens rarely).
4947      */
4948     if (vn_isdisk(vp, NULL) &&
4949         vp->v_specmountpoint && !VOP_ISLOCKED(vp) &&
4950         (error = VFS_SYNC(vp->v_specmountpoint, MNT_WAIT, 0, ap->a_cred,
4951         ap->a_p)) != 0)
4952         return (error);
4953     return (0);
4954 }
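
The two-pass structure described in the comment at lines 4723-4731 recurs in flush_inodedep_deps() below. Reduced to its skeleton it looks like the following sketch; struct dep, start_write() and wait_write() are hypothetical names standing in for the buffer lists and for bawrite()/VOP_BWRITE(), not kernel interfaces:

    /* Hypothetical dependency record, for illustration only. */
    struct dep {
        struct dep *next;
        int complete;
    };

    /* Assumed helpers: start an async write / block until it is done. */
    void start_write(struct dep *);     /* like bawrite()           */
    int  wait_write(struct dep *);      /* like a blocking bwrite() */

    static int
    flush_two_pass(struct dep *head)
    {
        struct dep *d;
        int error, blocking = 0;        /* pass 1: async, pass 2: blocking */

        for (;;) {
            for (d = head; d != NULL; d = d->next) {
                if (d->complete)
                    continue;
                if (!blocking)
                    start_write(d);
                else if ((error = wait_write(d)) != 0)
                    return (error);
            }
            if (blocking)
                return (0);             /* pass 2 finished */
            blocking = 1;               /* pass 1 seeded the I/O; now wait */
        }
    }

The point of the shape is that pass 2 almost always blocks on writes pass 1 already started, so the blocking pass is short even though each wait is synchronous.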
4955
4956 /*
4957  * Flush the dependencies associated with an inodedep.
4958  * Called with splbio blocked.
4959  */
4960 STATIC int
4961 flush_inodedep_deps(struct fs *fs, ufsino_t ino)
4962 {
4963     struct inodedep *inodedep;
4964     struct allocdirect *adp;
4965     int gotit, error, waitfor;
4966     struct buf *bp;
4967
4968     splassert(IPL_BIO);
4969
4970     /*
4971      * This work is done in two passes. The first pass grabs most
4972      * of the buffers and begins asynchronously writing them. The
4973      * only way to wait for these asynchronous writes is to sleep
4974      * on the filesystem vnode which may stay busy for a long time
4975      * if the filesystem is active. So, instead, we make a second
4976      * pass over the dependencies blocking on each write. In the
4977      * usual case we will be blocking against a write that we
4978      * initiated, so when it is done the dependency will have been
4979      * resolved. Thus the second pass is expected to end quickly.
4980      * We give a brief window at the top of the loop to allow
4981      * any pending I/O to complete.
4982      */
4983     for (waitfor = MNT_NOWAIT; ; ) {
4984     retry_ino:
4985         FREE_LOCK(&lk);
4986         ACQUIRE_LOCK(&lk);
4987         if (inodedep_lookup(fs, ino, 0, &inodedep) == 0)
4988             return (0);
4989         TAILQ_FOREACH(adp, &inodedep->id_inoupdt, ad_next) {
4990             if (adp->ad_state & DEPCOMPLETE)
4991                 continue;
4992             bp = adp->ad_buf;
4993             gotit = getdirtybuf(bp, waitfor);
4994             if (gotit == 0) {
4995                 if (waitfor == MNT_NOWAIT)
4996                     continue;
4997                 break;
4998             } else if (gotit == -1)
4999                 goto retry_ino;
5000             FREE_LOCK(&lk);
5001             if (waitfor == MNT_NOWAIT) {
5002                 bawrite(bp);
5003             } else if ((error = VOP_BWRITE(bp)) != 0) {
5004                 ACQUIRE_LOCK(&lk);
5005                 return (error);
5006             }
5007             ACQUIRE_LOCK(&lk);
5008             break;
5009         }
5010         if (adp != NULL)
5011             continue;
5012     retry_newino:
5013         TAILQ_FOREACH(adp, &inodedep->id_newinoupdt, ad_next) {
5014             if (adp->ad_state & DEPCOMPLETE)
5015                 continue;
5016             bp = adp->ad_buf;
5017             gotit = getdirtybuf(bp, waitfor);
5018             if (gotit == 0) {
5019                 if (waitfor == MNT_NOWAIT)
5020                     continue;
5021                 break;
5022             } else if (gotit == -1)
5023                 goto retry_newino;
5024             FREE_LOCK(&lk);
5025             if (waitfor == MNT_NOWAIT) {
5026                 bawrite(bp);
5027             } else if ((error = VOP_BWRITE(bp)) != 0) {
5028                 ACQUIRE_LOCK(&lk);
5029                 return (error);
5030             }
5031             ACQUIRE_LOCK(&lk);
5032             break;
5033         }
5034         if (adp != NULL)
5035             continue;
5036         /*
5037          * If this was pass 2, we are done; otherwise go do pass 2.
5038          */
5039         if (waitfor == MNT_WAIT)
5040             break;
5041         waitfor = MNT_WAIT;
5042     }
5043     /*
5044      * Try freeing inodedep in case all dependencies have been removed.
5045      */
5046     if (inodedep_lookup(fs, ino, 0, &inodedep) != 0)
5047         (void) free_inodedep(inodedep);
5048     return (0);
5049 }
5050
5051 /*
5052  * Eliminate a pagedep dependency by flushing out all its diradd dependencies.
5053  * Called with splbio blocked.
5054  */
5055 STATIC int
5056 flush_pagedep_deps(struct vnode *pvp, struct mount *mp,
5057     struct diraddhd *diraddhdp)
5058 {
5059     struct proc *p = CURPROC;   /* XXX */
5060     struct worklist *wk;
5061     struct inodedep *inodedep;
5062     struct ufsmount *ump;
5063     struct diradd *dap;
5064     struct vnode *vp;
5065     int gotit, error = 0;
5066     struct buf *bp;
5067     ufsino_t inum;
5068
5069     splassert(IPL_BIO);
5070
5071     ump = VFSTOUFS(mp);
5072     while ((dap = LIST_FIRST(diraddhdp)) != NULL) {
5073         /*
5074          * Flush ourselves if this directory entry
5075          * has a MKDIR_PARENT dependency.
5076          */
5077         if (dap->da_state & MKDIR_PARENT) {
5078             FREE_LOCK(&lk);
5079             if ((error = UFS_UPDATE(VTOI(pvp), 1)))
5080                 break;
5081             ACQUIRE_LOCK(&lk);
5082             /*
5083              * If that cleared dependencies, go on to next.
5084              */
5085             if (dap != LIST_FIRST(diraddhdp))
5086                 continue;
5087             if (dap->da_state & MKDIR_PARENT) {
5088                 FREE_LOCK(&lk);
5089                 panic("flush_pagedep_deps: MKDIR_PARENT");
5090             }
5091         }
5092         /*
5093          * A newly allocated directory must have its "." and
5094          * ".." entries written out before its name can be
5095          * committed in its parent. We do not want or need
5096          * the full semantics of a synchronous VOP_FSYNC as
5097          * that may end up here again, once for each directory
5098          * level in the filesystem. Instead, we push the blocks
5099          * and wait for them to clear. We have to fsync twice
5100          * because the first call may choose to defer blocks
5101          * that still have dependencies, but deferral will
5102          * happen at most once.
5103          */
5104         inum = dap->da_newinum;
5105         if (dap->da_state & MKDIR_BODY) {
5106             FREE_LOCK(&lk);
5107             if ((error = VFS_VGET(mp, inum, &vp)) != 0)
5108                 break;
5109             if ((error = VOP_FSYNC(vp, p->p_ucred, MNT_NOWAIT, p)) ||
5110                 (error = VOP_FSYNC(vp, p->p_ucred, MNT_NOWAIT, p))) {
5111                 vput(vp);
5112                 break;
5113             }
5114             drain_output(vp, 0);
5115             /*
5116              * If first block is still dirty with a D_MKDIR
5117              * dependency then it needs to be written now.
5118              */
5119             for (;;) {
5120                 error = 0;
5121                 ACQUIRE_LOCK(&lk);
5122                 bp = incore(vp, 0);
5123                 if (bp == NULL) {
5124                     FREE_LOCK(&lk);
5125                     break;
5126                 }
5127                 LIST_FOREACH(wk, &bp->b_dep, wk_list)
5128                     if (wk->wk_type == D_MKDIR)
5129                         break;
5130                 if (wk) {
5131                     gotit = getdirtybuf(bp, MNT_WAIT);
5132                     FREE_LOCK(&lk);
5133                     if (gotit == -1)
5134                         continue;
5135                     if (gotit && (error = bwrite(bp)) != 0)
5136                         break;
5137                 } else
5138                     FREE_LOCK(&lk);
5139                 break;
5140             }
5141             vput(vp);
5142             /* Flushing of first block failed */
5143             if (error)
5144                 break;
5145             ACQUIRE_LOCK(&lk);
5146             /*
5147              * If that cleared dependencies, go on to next.
5148              */
5149             if (dap != LIST_FIRST(diraddhdp))
5150                 continue;
5151             if (dap->da_state & MKDIR_BODY) {
5152                 FREE_LOCK(&lk);
5153                 panic("flush_pagedep_deps: MKDIR_BODY");
5154             }
5155         }
5156         /*
5157          * Flush the inode on which the directory entry depends.
5158          * Having accounted for MKDIR_PARENT and MKDIR_BODY above,
5159          * the only remaining dependency is that the updated inode
5160          * count must get pushed to disk. The inode has already
5161          * been pushed into its inode buffer (via VOP_UPDATE) at
5162          * the time of the reference count change. So we need only
5163          * locate that buffer, ensure that there will be no rollback
5164          * caused by a bitmap dependency, then write the inode buffer.
5165          */
5166         if (inodedep_lookup(ump->um_fs, inum, 0, &inodedep) == 0) {
5167             FREE_LOCK(&lk);
5168             panic("flush_pagedep_deps: lost inode");
5169         }
5170         /*
5171          * If the inode still has bitmap dependencies,
5172          * push them to disk.
5173          */
5174     retry:
5175         if ((inodedep->id_state & DEPCOMPLETE) == 0) {
5176             bp = inodedep->id_buf;
5177             gotit = getdirtybuf(bp, MNT_WAIT);
5178             if (gotit == -1)
5179                 goto retry;
5180             FREE_LOCK(&lk);
5181             if (gotit && (error = bwrite(bp)) != 0)
5182                 break;
5183             ACQUIRE_LOCK(&lk);
5184             if (dap != LIST_FIRST(diraddhdp))
5185                 continue;
5186         }
5187         /*
5188          * If the inode is still sitting in a buffer waiting
5189          * to be written, push it to disk.
5190          */
5191         FREE_LOCK(&lk);
5192         if ((error = bread(ump->um_devvp,
5193             fsbtodb(ump->um_fs, ino_to_fsba(ump->um_fs, inum)),
5194             (int)ump->um_fs->fs_bsize, &bp)) != 0) {
5195             brelse(bp);
5196             break;
5197         }
5198         if ((error = bwrite(bp)) != 0)
5199             break;
5200         ACQUIRE_LOCK(&lk);
5201         /*
5202          * If we have failed to get rid of all the dependencies
5203          * then something is seriously wrong.
5204          */
5205         if (dap == LIST_FIRST(diraddhdp)) {
5206             FREE_LOCK(&lk);
5207             panic("flush_pagedep_deps: flush failed");
5208         }
5209     }
5210     if (error)
5211         ACQUIRE_LOCK(&lk);
5212     return (error);
5213 }
5214
5215 /*
5216  * A large burst of file addition or deletion activity can drive the
5217  * memory load excessively high. First attempt to slow things down
5218  * using the techniques below. If that fails, this routine requests
5219  * the offending operations to fall back to running synchronously
5220  * until the memory load returns to a reasonable level.
5221  */
5222 int
5223 softdep_slowdown(struct vnode *vp)
5224 {
5225     int max_softdeps_hard;
5226
5227     max_softdeps_hard = max_softdeps * 11 / 10;
5228     if (num_dirrem < max_softdeps_hard / 2 &&
5229         num_inodedep < max_softdeps_hard)
5230         return (0);
5231     stat_sync_limit_hit += 1;
5232     return (1);
5233 }
5234
5235 /*
5236  * If memory utilization has gotten too high, deliberately slow things
5237  * down and speed up the I/O processing.
5238  */
5239 STATIC int
5240 request_cleanup(int resource, int islocked)
5241 {
5242     struct proc *p = CURPROC;
5243     int s;
5244
5245     /*
5246      * We never hold up the filesystem syncer process.
5247      */
5248     if (p == filesys_syncer || (p->p_flag & P_SOFTDEP))
5249         return (0);
5250     /*
5251      * First check to see if the work list has gotten backlogged.
5252      * If it has, co-opt this process to help clean up two entries.
5253      * Because this process may hold inodes locked, we cannot
5254      * handle any remove requests that might block on a locked
5255      * inode as that could lead to deadlock. We set P_SOFTDEP
5256      * to avoid recursively processing the worklist.
5257      */
5258     if (num_on_worklist > max_softdeps / 10) {
5259         atomic_setbits_int(&p->p_flag, P_SOFTDEP);
5260         if (islocked)
5261             FREE_LOCK(&lk);
5262         process_worklist_item(NULL, NULL, LK_NOWAIT);
5263         process_worklist_item(NULL, NULL, LK_NOWAIT);
5264         atomic_clearbits_int(&p->p_flag, P_SOFTDEP);
5265         stat_worklist_push += 2;
5266         if (islocked)
5267             ACQUIRE_LOCK(&lk);
5268         return (1);
5269     }
5270     /*
5271      * Next, we attempt to speed up the syncer process. If that
5272      * is successful, then we allow the process to continue.
5273      */
5274     if (speedup_syncer())
5275         return (0);
5276     /*
5277      * If we are resource constrained on inode dependencies, try
5278      * flushing some dirty inodes. Otherwise, we are constrained
5279      * by file deletions, so try accelerating flushes of directories
5280      * with removal dependencies. We would like to do the cleanup
5281      * here, but we probably hold an inode locked at this point and
5282      * that might deadlock against one that we try to clean. So,
5283      * the best that we can do is request the syncer daemon to do
5284      * the cleanup for us.
5285      */
5286     switch (resource) {
5287
5288     case FLUSH_INODES:
5289         stat_ino_limit_push += 1;
5290         req_clear_inodedeps += 1;
5291         stat_countp = &stat_ino_limit_hit;
5292         break;
5293
5294     case FLUSH_REMOVE:
5295         stat_blk_limit_push += 1;
5296         req_clear_remove += 1;
5297         stat_countp = &stat_blk_limit_hit;
5298         break;
5299
5300     default:
5301         if (islocked)
5302             FREE_LOCK(&lk);
5303         panic("request_cleanup: unknown type");
5304     }
5305     /*
5306      * Hopefully the syncer daemon will catch up and awaken us.
5307      * We wait at most tickdelay before proceeding in any case.
5308      */
5309     if (islocked == 0)
5310         ACQUIRE_LOCK(&lk);
5311     proc_waiting += 1;
5312     if (!timeout_pending(&proc_waiting_timeout))
5313         timeout_add(&proc_waiting_timeout, tickdelay > 2 ? tickdelay : 2);
5314
5315     s = FREE_LOCK_INTERLOCKED(&lk);
5316     tsleep_nsec(&proc_waiting, PPAUSE, "softupdate", INFSLP);
5317     ACQUIRE_LOCK_INTERLOCKED(&lk, s);
5318     proc_waiting -= 1;
5319     if (islocked == 0)
5320         FREE_LOCK(&lk);
5321     return (1);
5322 }
5323
5324 /*
5325  * Awaken processes pausing in request_cleanup and clear proc_waiting
5326  * to indicate that there is no longer a timer running.
5327  */
5328 void
5329 pause_timer(void *arg)
5330 {
5331
5332     *stat_countp += 1;
5333     wakeup_one(&proc_waiting);
5334     if (proc_waiting > 0)
5335         timeout_add(&proc_waiting_timeout, tickdelay > 2 ? tickdelay : 2);
5336 }
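
request_cleanup() and pause_timer() form a bounded-wait handshake: the waiter bumps proc_waiting, arms a one-shot timeout, and sleeps; the timer wakes a waiter and re-arms itself only while waiters remain. A userland analogue of that shape, shown only as a sketch (the mutex/condvar names are hypothetical; the kernel code above uses tsleep_nsec/wakeup_one with the spl interlock instead), folds the timeout and the wakeup into one call:

    #include <pthread.h>
    #include <time.h>

    static pthread_mutex_t m = PTHREAD_MUTEX_INITIALIZER;
    static pthread_cond_t  cv = PTHREAD_COND_INITIALIZER;
    static int waiters;

    /* Wait for a wakeup, but never longer than delay_ns, then recheck. */
    static void
    bounded_wait(long delay_ns)
    {
        struct timespec ts;

        clock_gettime(CLOCK_REALTIME, &ts);
        ts.tv_nsec += delay_ns;
        ts.tv_sec += ts.tv_nsec / 1000000000L;
        ts.tv_nsec %= 1000000000L;

        pthread_mutex_lock(&m);
        waiters++;
        pthread_cond_timedwait(&cv, &m, &ts);   /* wakeup or timeout */
        waiters--;
        pthread_mutex_unlock(&m);
    }

The kernel cannot use a combined primitive here, which is why the timeout and the sleep channel are managed as two separate pieces of state.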
5337
5338 /*
5339  * Flush out a directory with at least one removal dependency in an effort to
5340  * reduce the number of dirrem, freefile, and freeblks dependency structures.
5341  */
5342 STATIC void
5343 clear_remove(struct proc *p)
5344 {
5345     struct pagedep_hashhead *pagedephd;
5346     struct pagedep *pagedep;
5347     static int next = 0;
5348     struct mount *mp;
5349     struct vnode *vp;
5350     int error, cnt;
5351     ufsino_t ino;
5352
5353     ACQUIRE_LOCK(&lk);
5354     for (cnt = 0; cnt <= pagedep_hash; cnt++) {
5355         pagedephd = &pagedep_hashtbl[next++];
5356         if (next > pagedep_hash)
5357             next = 0;
5358         LIST_FOREACH(pagedep, pagedephd, pd_hash) {
5359             if (LIST_FIRST(&pagedep->pd_dirremhd) == NULL)
5360                 continue;
5361             mp = pagedep->pd_mnt;
5362             ino = pagedep->pd_ino;
5363 #if 0
5364             if (vn_start_write(NULL, &mp, V_NOWAIT) != 0)
5365                 continue;
5366 #endif
5367             FREE_LOCK(&lk);
5368             if ((error = VFS_VGET(mp, ino, &vp)) != 0) {
5369                 softdep_error("clear_remove: vget", error);
5370 #if 0
5371                 vn_finished_write(mp);
5372 #endif
5373                 return;
5374             }
5375             if ((error = VOP_FSYNC(vp, p->p_ucred, MNT_NOWAIT, p)))
5376                 softdep_error("clear_remove: fsync", error);
5377             drain_output(vp, 0);
5378             vput(vp);
5379 #if 0
5380             vn_finished_write(mp);
5381 #endif
5382             return;
5383         }
5384     }
5385     FREE_LOCK(&lk);
5386 }
5387
5388 /*
5389  * Clear out a block of dirty inodes in an effort to reduce
5390  * the number of inodedep dependency structures.
5391  */
5392 STATIC void
5393 clear_inodedeps(struct proc *p)
5394 {
5395     struct inodedep_hashhead *inodedephd;
5396     struct inodedep *inodedep = NULL;
5397     static int next = 0;
5398     struct mount *mp;
5399     struct vnode *vp;
5400     struct fs *fs;
5401     int error, cnt;
5402     ufsino_t firstino, lastino, ino;
5403
5404     ACQUIRE_LOCK(&lk);
5405     /*
5406      * Pick a random inode dependency to be cleared.
5407      * We will then gather up all the inodes in its block
5408      * that have dependencies and flush them out.
5409      */
5410     for (cnt = 0; cnt <= inodedep_hash; cnt++) {
5411         inodedephd = &inodedep_hashtbl[next++];
5412         if (next > inodedep_hash)
5413             next = 0;
5414         if ((inodedep = LIST_FIRST(inodedephd)) != NULL)
5415             break;
5416     }
5417     if (inodedep == NULL) {
5418         FREE_LOCK(&lk);
5419         return;
5420     }
5421     /*
5422      * Ugly code to find mount point given pointer to superblock.
5423      */
5424     fs = inodedep->id_fs;
5425     TAILQ_FOREACH(mp, &mountlist, mnt_list)
5426         if ((mp->mnt_flag & MNT_SOFTDEP) && fs == VFSTOUFS(mp)->um_fs)
5427             break;
5428     /*
5429      * Find the last inode in the block with dependencies.
5430      */
5431     firstino = inodedep->id_ino & ~(INOPB(fs) - 1);
5432     for (lastino = firstino + INOPB(fs) - 1; lastino > firstino; lastino--)
5433         if (inodedep_lookup(fs, lastino, 0, &inodedep) != 0)
5434             break;
5435     /*
5436      * Asynchronously push all but the last inode with dependencies.
5437      * Synchronously push the last inode with dependencies to ensure
5438      * that the inode block gets written to free up the inodedeps.
5439      */
5440     for (ino = firstino; ino <= lastino; ino++) {
5441         if (inodedep_lookup(fs, ino, 0, &inodedep) == 0)
5442             continue;
5443         FREE_LOCK(&lk);
5444 #if 0
5445         if (vn_start_write(NULL, &mp, V_NOWAIT) != 0)
5446             continue;
5447 #endif
5448         if ((error = VFS_VGET(mp, ino, &vp)) != 0) {
5449             softdep_error("clear_inodedeps: vget", error);
5450 #if 0
5451             vn_finished_write(mp);
5452 #endif
5453             return;
5454         }
5455         if (ino == lastino) {
5456             if ((error = VOP_FSYNC(vp, p->p_ucred, MNT_WAIT, p)))
5457                 softdep_error("clear_inodedeps: fsync1", error);
5458         } else {
5459             if ((error = VOP_FSYNC(vp, p->p_ucred, MNT_NOWAIT, p)))
5460                 softdep_error("clear_inodedeps: fsync2", error);
5461             drain_output(vp, 0);
5462         }
5463         vput(vp);
5464 #if 0
5465         vn_finished_write(mp);
5466 #endif
5467         ACQUIRE_LOCK(&lk);
5468     }
5469     FREE_LOCK(&lk);
5470 }
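
The firstino/lastino computation at lines 5431-5434 rounds an inode number down to the first slot of its on-disk inode block, then scans backward from the block's last slot. The mask trick works because INOPB (inodes per block) is a power of two for FFS. For a hypothetical INOPB(fs) of 64 (the real value depends on the filesystem layout):

    /* Assuming INOPB(fs) == 64, for illustration only: */
    ufsino_t ino = 1000;
    ufsino_t firstino = ino & ~(64 - 1);   /* 1000 & ~63 == 960         */
    ufsino_t lastino = firstino + 64 - 1;  /* 1023; scan down toward 960 */

Everything in [firstino, lastino] shares one inode block, so flushing the last dirty inode in the range synchronously is what finally lets that block, and its inodedeps, go.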
5471
5472 /*
5473  * Function to determine if the buffer has outstanding dependencies
5474  * that will cause a roll-back if the buffer is written. If wantcount
5475  * is set, return the number of dependencies; otherwise just yes or no.
5476  */
5477 int
5478 softdep_count_dependencies(struct buf *bp, int wantcount, int islocked)
5479 {
5480     struct worklist *wk;
5481     struct inodedep *inodedep;
5482     struct indirdep *indirdep;
5483     struct allocindir *aip;
5484     struct pagedep *pagedep;
5485     struct diradd *dap;
5486     int i, retval;
5487
5488     retval = 0;
5489     if (!islocked)
5490         ACQUIRE_LOCK(&lk);
5491     LIST_FOREACH(wk, &bp->b_dep, wk_list) {
5492         switch (wk->wk_type) {
5493
5494         case D_INODEDEP:
5495             inodedep = WK_INODEDEP(wk);
5496             if ((inodedep->id_state & DEPCOMPLETE) == 0) {
5497                 /* bitmap allocation dependency */
5498                 retval += 1;
5499                 if (!wantcount)
5500                     goto out;
5501             }
5502             if (TAILQ_FIRST(&inodedep->id_inoupdt)) {
5503                 /* direct block pointer dependency */
5504                 retval += 1;
5505                 if (!wantcount)
5506                     goto out;
5507             }
5508             continue;
5509
5510         case D_INDIRDEP:
5511             indirdep = WK_INDIRDEP(wk);
5512
5513             LIST_FOREACH(aip, &indirdep->ir_deplisthd, ai_next) {
5514                 /* indirect block pointer dependency */
5515                 retval += 1;
5516                 if (!wantcount)
5517                     goto out;
5518             }
5519             continue;
5520
5521         case D_PAGEDEP:
5522             pagedep = WK_PAGEDEP(wk);
5523             for (i = 0; i < DAHASHSZ; i++) {
5524
5525                 LIST_FOREACH(dap, &pagedep->pd_diraddhd[i], da_pdlist) {
5526                     /* directory entry dependency */
5527                     retval += 1;
5528                     if (!wantcount)
5529                         goto out;
5530                 }
5531             }
5532             continue;
5533
5534         case D_BMSAFEMAP:
5535         case D_ALLOCDIRECT:
5536         case D_ALLOCINDIR:
5537         case D_MKDIR:
5538             /* never a dependency on these blocks */
5539             continue;
5540
5541         default:
5542             if (!islocked)
5543                 FREE_LOCK(&lk);
5544             panic("softdep_check_for_rollback: Unexpected type %s",
5545                 TYPENAME(wk->wk_type));
5546             /* NOTREACHED */
5547         }
5548     }
5549 out:
5550     if (!islocked)
5551         FREE_LOCK(&lk);
5552     return retval;
5553 }
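
The wantcount flag selects between a cheap boolean probe and a full count; a sketch of the two calling modes (the caller context and the nodelay/ndeps names are hypothetical):

    /* Boolean probe: the walk bails at the first dependency found. */
    if (softdep_count_dependencies(bp, 0, 0) != 0)
        nodelay = 0;                /* hypothetical caller flag */

    /* Exact count: wantcount != 0 makes the walk visit them all. */
    ndeps = softdep_count_dependencies(bp, 1, 0);

The early-out in the boolean mode matters because the D_INDIRDEP and D_PAGEDEP cases otherwise iterate whole dependency lists under the lock.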
5554
5555 /*
5556  * Acquire exclusive access to a buffer.
5557  * Must be called with splbio blocked.
5558  * Returns:
5559  *	1 if the buffer was acquired and is dirty;
5560  *	0 if the buffer was clean, or we would have slept but had MNT_NOWAIT;
5561  *	-1 if we slept and may try again (but not with this bp).
5562  */
5563 STATIC int
5564 getdirtybuf(struct buf *bp, int waitfor)
5565 {
5566     int s;
5567
5568     if (bp == NULL)
5569         return (0);
5570
5571     splassert(IPL_BIO);
5572
5573     if (bp->b_flags & B_BUSY) {
5574         if (waitfor != MNT_WAIT)
5575             return (0);
5576         bp->b_flags |= B_WANTED;
5577         s = FREE_LOCK_INTERLOCKED(&lk);
5578         tsleep_nsec(bp, PRIBIO + 1, "sdsdty", INFSLP);
5579         ACQUIRE_LOCK_INTERLOCKED(&lk, s);
5580         return (-1);
5581     }
5582     if ((bp->b_flags & B_DELWRI) == 0)
5583         return (0);
5584     bremfree(bp);
5585     buf_acquire(bp);
5586     return (1);
5587 }
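
The -1 return is the subtle case: the caller slept, so any pointer it derived from a list before the call may be stale. The callers above (softdep_update_inodeblock, flush_pagedep_deps, and others) all follow the same retry shape, restated here in isolation; inodedep stands for whatever stable anchor the caller re-fetches from:

    for (;;) {
        bp = inodedep->id_buf;          /* re-fetch after any sleep    */
        gotit = getdirtybuf(bp, MNT_WAIT);
        if (gotit != -1)                /* -1: we slept, state is stale */
            break;
    }
    if (gotit)                          /* 1: buffer is ours and dirty */
        error = bwrite(bp);
    /* 0: clean buffer (or would have slept under MNT_NOWAIT) */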
5588
5589 /*
5590  * Wait for pending output on a vnode to complete.
5591  * Must be called with vnode locked.
5592  */
5593 STATIC void
5594 drain_output(struct vnode *vp, int islocked)
5595 {
5596     int s;
5597
5598     if (!islocked)
5599         ACQUIRE_LOCK(&lk);
5600
5601     splassert(IPL_BIO);
5602
5603     while (vp->v_numoutput) {
5604         vp->v_bioflag |= VBIOWAIT;
5605         s = FREE_LOCK_INTERLOCKED(&lk);
5606         tsleep_nsec(&vp->v_numoutput, PRIBIO + 1, "drain_output", INFSLP);
5607         ACQUIRE_LOCK_INTERLOCKED(&lk, s);
5608     }
5609     if (!islocked)
5610         FREE_LOCK(&lk);
5611 }
5612
5613 /*
5614  * Called whenever a buffer that is being invalidated or reallocated
5615  * contains dependencies. This should only happen if an I/O error has
5616  * occurred. The routine is called with the buffer locked.
5617  */
5618 void
5619 softdep_deallocate_dependencies(struct buf *bp)
5620 {
5621
5622     if ((bp->b_flags & B_ERROR) == 0)
5623         panic("softdep_deallocate_dependencies: dangling deps");
5624     softdep_error(bp->b_vp->v_mount->mnt_stat.f_mntonname, bp->b_error);
5625     panic("softdep_deallocate_dependencies: unrecovered I/O error");
5626 }
5627
5628 /*
5629  * Function to handle asynchronous write errors in the filesystem.
5630  */
5631 void
5632 softdep_error(char *func, int error)
5633 {
5634
5635     /* XXX should do something better! */
5636     printf("%s: got error %d while accessing filesystem\n", func, error);
5637 }
5638
5639 #ifdef DDB
5640 #include <machine/db_machdep.h>
5641 #include <ddb/db_interface.h>
5642 #include <ddb/db_output.h>
5643
5644 void
5645 softdep_print(struct buf *bp, int full,
5646     int (*pr)(const char *, ...) __attribute__((__format__(__kprintf__,1,2))))
5647 {
5648     struct worklist *wk;
5649
5650     (*pr)(" deps:\n");
5651     LIST_FOREACH(wk, &bp->b_dep, wk_list)
5652         worklist_print(wk, full, pr);
5653 }
5654
5655 void
5656 worklist_print(struct worklist *wk, int full,
5657     int (*pr)(const char *, ...) __attribute__((__format__(__kprintf__,1,2))))
5658 {
5659     struct pagedep *pagedep;
5660     struct inodedep *inodedep;
5661     struct newblk *newblk;
5662     struct bmsafemap *bmsafemap;
5663     struct allocdirect *adp;
5664     struct indirdep *indirdep;
5665     struct allocindir *aip;
5666     struct freefrag *freefrag;
5667     struct freeblks *freeblks;
5668     struct freefile *freefile;
5669     struct diradd *dap;
5670     struct mkdir *mkdir;
5671     struct dirrem *dirrem;
5672     struct newdirblk *newdirblk;
5673     char prefix[33];
5674     int i;
5675
5676     for (prefix[i = 2 * MIN(16, full)] = '\0'; i--; prefix[i] = ' ')
5677         ;
5678
5679     (*pr)("%s%s(%p) state %b\n%s", prefix, TYPENAME(wk->wk_type), wk,
5680         wk->wk_state, DEP_BITS, prefix);
5681     switch (wk->wk_type) {
5682     case D_PAGEDEP:
5683         pagedep = WK_PAGEDEP(wk);
5684         (*pr)("mount %p ino %u lbn %lld\n", pagedep->pd_mnt,
5685             pagedep->pd_ino, (long long)pagedep->pd_lbn);
5686         break;
5687     case D_INODEDEP:
5688         inodedep = WK_INODEDEP(wk);
5689         (*pr)("fs %p ino %u nlinkdelta %u dino %p\n"
5690             "%s bp %p savsz %lld\n", inodedep->id_fs,
5691             inodedep->id_ino, inodedep->id_nlinkdelta,
5692             inodedep->id_un.idu_savedino1,
5693             prefix, inodedep->id_buf, inodedep->id_savedsize);
5694         break;
5695     case D_NEWBLK:
5696         newblk = WK_NEWBLK(wk);
5697         (*pr)("fs %p newblk %lld state %d bmsafemap %p\n",
5698             newblk->nb_fs, (long long)newblk->nb_newblkno,
5699             newblk->nb_state, newblk->nb_bmsafemap);
5700         break;
5701     case D_BMSAFEMAP:
5702         bmsafemap = WK_BMSAFEMAP(wk);
5703         (*pr)("buf %p\n", bmsafemap->sm_buf);
5704         break;
5705     case D_ALLOCDIRECT:
5706         adp = WK_ALLOCDIRECT(wk);
5707         (*pr)("lbn %lld newblk %lld oldblk %lld newsize %ld olsize "
5708             "%ld\n%s bp %p inodedep %p freefrag %p\n",
5709             (long long)adp->ad_lbn, (long long)adp->ad_newblkno,
5710             (long long)adp->ad_oldblkno, adp->ad_newsize,
5711             adp->ad_oldsize,
5712             prefix, adp->ad_buf, adp->ad_inodedep, adp->ad_freefrag);
5713         break;
5714     case D_INDIRDEP:
5715         indirdep = WK_INDIRDEP(wk);
5716         (*pr)("savedata %p savebp %p\n", indirdep->ir_saveddata,
5717             indirdep->ir_savebp);
5718         break;
5719     case D_ALLOCINDIR:
5720         aip = WK_ALLOCINDIR(wk);
5721         (*pr)("off %d newblk %lld oldblk %lld freefrag %p\n"
5722             "%s indirdep %p buf %p\n", aip->ai_offset,
5723             (long long)aip->ai_newblkno, (long long)aip->ai_oldblkno,
5724             aip->ai_freefrag, prefix, aip->ai_indirdep, aip->ai_buf);
5725         break;
5726     case D_FREEFRAG:
5727         freefrag = WK_FREEFRAG(wk);
5728         (*pr)("vnode %p mp %p blkno %lld fsize %ld ino %u\n",
5729             freefrag->ff_devvp, freefrag->ff_mnt,
5730             (long long)freefrag->ff_blkno, freefrag->ff_fragsize,
5731             freefrag->ff_inum);
5732         break;
5733     case D_FREEBLKS:
5734         freeblks = WK_FREEBLKS(wk);
5735         (*pr)("previno %u devvp %p mp %p oldsz %lld newsz %lld\n"
5736             "%s chkcnt %d uid %d\n", freeblks->fb_previousinum,
5737             freeblks->fb_devvp, freeblks->fb_mnt, freeblks->fb_oldsize,
5738             freeblks->fb_newsize,
5739             prefix, freeblks->fb_chkcnt, freeblks->fb_uid);
5740         break;
5741     case D_FREEFILE:
5742         freefile = WK_FREEFILE(wk);
5743         (*pr)("mode %x oldino %u vnode %p mp %p\n", freefile->fx_mode,
5744             freefile->fx_oldinum, freefile->fx_devvp, freefile->fx_mnt);
5745         break;
5746     case D_DIRADD:
5747         dap = WK_DIRADD(wk);
5748         (*pr)("off %d ino %u da_un %p\n", dap->da_offset,
5749             dap->da_newinum, dap->da_un.dau_previous);
5750         break;
5751     case D_MKDIR:
5752         mkdir = WK_MKDIR(wk);
5753         (*pr)("diradd %p bp %p\n", mkdir->md_diradd, mkdir->md_buf);
5754         break;
5755     case D_DIRREM:
5756         dirrem = WK_DIRREM(wk);
5757         (*pr)("mp %p ino %u dm_un %p\n", dirrem->dm_mnt,
5758             dirrem->dm_oldinum, dirrem->dm_un.dmu_pagedep);
5759         break;
5760     case D_NEWDIRBLK:
5761         newdirblk = WK_NEWDIRBLK(wk);
5762         (*pr)("pagedep %p\n", newdirblk->db_pagedep);
5763         break;
5764     }
5765 }
5766 #endif