xref: /original-bsd/sys/ufs/lfs/lfs_bio.c (revision 0842ddeb)
1 /*
2  * Copyright (c) 1991, 1993
3  *	The Regents of the University of California.  All rights reserved.
4  *
5  * %sccs.include.redist.c%
6  *
7  *	@(#)lfs_bio.c	8.9 (Berkeley) 05/20/95
8  */
9 
10 #include <sys/param.h>
11 #include <sys/proc.h>
12 #include <sys/buf.h>
13 #include <sys/vnode.h>
14 #include <sys/resourcevar.h>
15 #include <sys/mount.h>
16 #include <sys/kernel.h>
17 
18 #include <ufs/ufs/quota.h>
19 #include <ufs/ufs/inode.h>
20 #include <ufs/ufs/ufsmount.h>
21 
22 #include <ufs/lfs/lfs.h>
23 #include <ufs/lfs/lfs_extern.h>
24 
25 /*
26  * LFS block write function.
27  *
28  * XXX
29  * No write cost accounting is done.
30  * This is almost certainly wrong for synchronous operations and NFS.
31  */
32 int	lfs_allclean_wakeup;		/* Cleaner wakeup address. */
33 int	locked_queue_count;		/* XXX Count of locked-down buffers. */
34 int	lfs_writing;			/* Set if already kicked off a writer
35 					   because of buffer space */
36 /*
37 #define WRITE_THRESHHOLD	((nbuf >> 2) - 10)
38 #define WAIT_THRESHHOLD		((nbuf >> 1) - 10)
39 */
40 #define WAIT_THRESHHOLD         (nbuf - (nbuf >> 2) - 10)
41 #define WRITE_THRESHHOLD        ((nbuf >> 1) - 10)
42 #define LFS_BUFWAIT	2
43 
44 int
45 lfs_bwrite(ap)
46 	struct vop_bwrite_args /* {
47 		struct buf *a_bp;
48 	} */ *ap;
49 {
50 	register struct buf *bp = ap->a_bp;
51 	struct lfs *fs;
52 	struct inode *ip;
53 	int db, error, s;
54 
55 	/*
56 	 * Set the delayed write flag and use reassignbuf to move the buffer
57 	 * from the clean list to the dirty one.
58 	 *
59 	 * Set the B_LOCKED flag and unlock the buffer, causing brelse to move
60 	 * the buffer onto the LOCKED free list.  This is necessary, otherwise
61 	 * getnewbuf() would try to reclaim the buffers using bawrite, which
62 	 * isn't going to work.
63 	 *
64 	 * XXX we don't let meta-data writes run out of space because they can
65 	 * come from the segment writer.  We need to make sure that there is
66 	 * enough space reserved so that there's room to write meta-data
67 	 * blocks.
68 	 */
69 	if (!(bp->b_flags & B_LOCKED)) {
70 		fs = VFSTOUFS(bp->b_vp->v_mount)->um_lfs;
71 		db = fragstodb(fs, numfrags(fs, bp->b_bcount));
72 		while (!LFS_FITS(fs, db) && !IS_IFILE(bp) &&
73 		    bp->b_lblkno > 0) {
74 			/* Out of space, need cleaner to run */
75 			wakeup(&lfs_allclean_wakeup);
76 			if (error = tsleep(&fs->lfs_avail, PCATCH | PUSER,
77 			    "cleaner", NULL)) {
78 				brelse(bp);
79 				return (error);
80 			}
81 		}
82 		ip = VTOI((bp)->b_vp);
83 		if (!(ip->i_flag & IN_MODIFIED))
84 			++fs->lfs_uinodes;
85 		ip->i_flag |= IN_CHANGE | IN_MODIFIED | IN_UPDATE;
86 		fs->lfs_avail -= db;
87 		++locked_queue_count;
88 		bp->b_flags |= B_DELWRI | B_LOCKED;
89 		bp->b_flags &= ~(B_READ | B_ERROR);
90 		s = splbio();
91 		reassignbuf(bp, bp->b_vp);
92 		splx(s);
93 	}
94 	brelse(bp);
95 	return (0);
96 }
97 
98 /*
99  * XXX
100  * This routine flushes buffers out of the B_LOCKED queue when LFS has too
101  * many locked down.  Eventually the pageout daemon will simply call LFS
102  * when pages need to be reclaimed.  Note, we have one static count of locked
103  * buffers, so we can't have more than a single file system.  To make this
104  * work for multiple file systems, put the count into the mount structure.
105  */
106 void
107 lfs_flush()
108 {
109 	register struct mount *mp, *nmp;
110 	struct proc *p = curproc;	/* XXX */
111 
112 #ifdef DOSTATS
113 	++lfs_stats.write_exceeded;
114 #endif
115 	if (lfs_writing)
116 		return;
117 	lfs_writing = 1;
118 	simple_lock(&mountlist_slock);
119 	for (mp = mountlist.cqh_first; mp != (void *)&mountlist; mp = nmp) {
120 		if (vfs_busy(mp, LK_NOWAIT, &mountlist_slock, p)) {
121 			nmp = mp->mnt_list.cqe_next;
122 			continue;
123 		}
124 		if (mp->mnt_stat.f_type == lfs_mount_type &&
125 		    (mp->mnt_flag & MNT_RDONLY) == 0 &&
126 		    !((((struct ufsmount *)mp->mnt_data))->ufsmount_u.lfs)->lfs_dirops ) {
127 			/*
128 			 * We set the queue to 0 here because we are about to
129 			 * write all the dirty buffers we have.  If more come
130 			 * in while we're writing the segment, they may not
131 			 * get written, so we want the count to reflect these
132 			 * new writes after the segwrite completes.
133 			 */
134 #ifdef DOSTATS
135 			++lfs_stats.flush_invoked;
136 #endif
137 			lfs_segwrite(mp, 0);
138 		}
139 		simple_lock(&mountlist_slock);
140 		nmp = mp->mnt_list.cqe_next;
141 		vfs_unbusy(mp, p);
142 	}
143 	simple_unlock(&mountlist_slock);
144 	lfs_writing = 0;
145 }
146 
147 int
148 lfs_check(vp, blkno)
149 	struct vnode *vp;
150 	ufs_daddr_t blkno;
151 {
152 	extern int lfs_allclean_wakeup;
153 	int error;
154 
155 	error = 0;
156 	if (incore(vp, blkno))
157 		return (0);
158 	if (locked_queue_count > WRITE_THRESHHOLD)
159 		lfs_flush();
160 
161 	/* If out of buffers, wait on writer */
162 	while (locked_queue_count > WAIT_THRESHHOLD) {
163 #ifdef DOSTATS
164 	    ++lfs_stats.wait_exceeded;
165 #endif
166 	    error = tsleep(&locked_queue_count, PCATCH | PUSER, "buffers",
167 	        hz * LFS_BUFWAIT);
168 	}
169 
170 	return (error);
171 }
172