1 /* $NetBSD: ulfs_inode.c,v 1.26 2020/09/05 16:30:13 riastradh Exp $ */ 2 /* from NetBSD: ufs_inode.c,v 1.95 2015/06/13 14:56:45 hannken Exp */ 3 4 /* 5 * Copyright (c) 1991, 1993 6 * The Regents of the University of California. All rights reserved. 7 * (c) UNIX System Laboratories, Inc. 8 * All or some portions of this file are derived from material licensed 9 * to the University of California by American Telephone and Telegraph 10 * Co. or Unix System Laboratories, Inc. and are reproduced herein with 11 * the permission of UNIX System Laboratories, Inc. 12 * 13 * Redistribution and use in source and binary forms, with or without 14 * modification, are permitted provided that the following conditions 15 * are met: 16 * 1. Redistributions of source code must retain the above copyright 17 * notice, this list of conditions and the following disclaimer. 18 * 2. Redistributions in binary form must reproduce the above copyright 19 * notice, this list of conditions and the following disclaimer in the 20 * documentation and/or other materials provided with the distribution. 21 * 3. Neither the name of the University nor the names of its contributors 22 * may be used to endorse or promote products derived from this software 23 * without specific prior written permission. 24 * 25 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 26 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 27 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 28 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 29 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 30 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 31 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 32 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 33 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 34 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 35 * SUCH DAMAGE. 36 * 37 * @(#)ufs_inode.c 8.9 (Berkeley) 5/14/95 38 */ 39 40 #include <sys/cdefs.h> 41 __KERNEL_RCSID(0, "$NetBSD: ulfs_inode.c,v 1.26 2020/09/05 16:30:13 riastradh Exp $"); 42 43 #if defined(_KERNEL_OPT) 44 #include "opt_lfs.h" 45 #include "opt_quota.h" 46 #include "opt_uvmhist.h" 47 #endif 48 49 #include <sys/param.h> 50 #include <sys/systm.h> 51 #include <sys/proc.h> 52 #include <sys/vnode.h> 53 #include <sys/mount.h> 54 #include <sys/kernel.h> 55 #include <sys/namei.h> 56 #include <sys/kauth.h> 57 #include <sys/kmem.h> 58 59 #include <ufs/lfs/lfs.h> 60 #include <ufs/lfs/lfs_accessors.h> 61 #include <ufs/lfs/lfs_extern.h> 62 63 #include <ufs/lfs/ulfs_inode.h> 64 #include <ufs/lfs/ulfsmount.h> 65 #include <ufs/lfs/ulfs_extern.h> 66 #ifdef LFS_DIRHASH 67 #include <ufs/lfs/ulfs_dirhash.h> 68 #endif 69 #ifdef LFS_EXTATTR 70 #include <ufs/lfs/ulfs_extattr.h> 71 #endif 72 73 #ifdef UVMHIST 74 #include <uvm/uvm.h> 75 #endif 76 #include <uvm/uvm_page.h> 77 #include <uvm/uvm_stat.h> 78 79 /* 80 * Last reference to an inode. If necessary, write or delete it. 81 */ 82 int 83 ulfs_inactive(void *v) 84 { 85 struct vop_inactive_v2_args /* { 86 struct vnode *a_vp; 87 struct bool *a_recycle; 88 } */ *ap = v; 89 struct vnode *vp = ap->a_vp; 90 struct inode *ip = VTOI(vp); 91 mode_t mode; 92 int error = 0; 93 94 /* 95 * Ignore inodes related to stale file handles. 96 */ 97 if (ip->i_mode == 0) 98 goto out; 99 if (ip->i_nlink <= 0 && (vp->v_mount->mnt_flag & MNT_RDONLY) == 0) { 100 #ifdef LFS_EXTATTR 101 ulfs_extattr_vnode_inactive(vp, curlwp); 102 #endif 103 if (ip->i_size != 0) { 104 error = lfs_truncate(vp, (off_t)0, 0, NOCRED); 105 } 106 #if defined(LFS_QUOTA) || defined(LFS_QUOTA2) 107 (void)lfs_chkiq(ip, -1, NOCRED, 0); 108 #endif 109 DIP_ASSIGN(ip, rdev, 0); 110 mode = ip->i_mode; 111 ip->i_mode = 0; 112 ip->i_omode = mode; 113 DIP_ASSIGN(ip, mode, 0); 114 ip->i_state |= IN_CHANGE | IN_UPDATE; 115 /* 116 * Defer final inode free and update to ulfs_reclaim(). 117 */ 118 } 119 120 if (ip->i_state & (IN_CHANGE | IN_UPDATE | IN_MODIFIED)) { 121 lfs_update(vp, NULL, NULL, 0); 122 } 123 124 out: 125 /* 126 * If we are done with the inode, reclaim it 127 * so that it can be reused immediately. 128 */ 129 *ap->a_recycle = (ip->i_mode == 0); 130 131 return (error); 132 } 133 134 /* 135 * Reclaim an inode so that it can be used for other purposes. 136 */ 137 int 138 ulfs_reclaim(struct vnode *vp) 139 { 140 struct inode *ip = VTOI(vp); 141 142 /* XXX: do we really need two of these? */ 143 /* note: originally the first was inside a wapbl txn */ 144 lfs_update(vp, NULL, NULL, UPDATE_CLOSE); 145 lfs_update(vp, NULL, NULL, UPDATE_CLOSE); 146 147 if (ip->i_devvp) { 148 vrele(ip->i_devvp); 149 ip->i_devvp = 0; 150 } 151 #if defined(LFS_QUOTA) || defined(LFS_QUOTA2) 152 ulfsquota_free(ip); 153 #endif 154 #ifdef LFS_DIRHASH 155 if (ip->i_dirhash != NULL) 156 ulfsdirhash_free(ip); 157 #endif 158 return (0); 159 } 160 161 /* 162 * allocate a range of blocks in a file. 163 * after this function returns, any page entirely contained within the range 164 * will map to invalid data and thus must be overwritten before it is made 165 * accessible to others. 166 */ 167 168 int 169 ulfs_balloc_range(struct vnode *vp, off_t off, off_t len, kauth_cred_t cred, 170 int flags) 171 { 172 off_t neweof; /* file size after the operation */ 173 off_t neweob; /* offset next to the last block after the operation */ 174 off_t pagestart; /* starting offset of range covered by pgs */ 175 off_t eob; /* offset next to allocated blocks */ 176 struct uvm_object *uobj; 177 int i, delta, error, npages; 178 int bshift = vp->v_mount->mnt_fs_bshift; 179 int bsize = 1 << bshift; 180 int ppb = MAX(bsize >> PAGE_SHIFT, 1); 181 struct vm_page **pgs; 182 size_t pgssize; 183 UVMHIST_FUNC("ulfs_balloc_range"); UVMHIST_CALLED(ubchist); 184 UVMHIST_LOG(ubchist, "vp %#jx off 0x%jx len 0x%jx u_size 0x%jx", 185 (uintptr_t)vp, off, len, vp->v_size); 186 187 neweof = MAX(vp->v_size, off + len); 188 GOP_SIZE(vp, neweof, &neweob, 0); 189 190 error = 0; 191 uobj = &vp->v_uobj; 192 193 /* 194 * read or create pages covering the range of the allocation and 195 * keep them locked until the new block is allocated, so there 196 * will be no window where the old contents of the new block are 197 * visible to racing threads. 198 */ 199 200 pagestart = trunc_page(off) & ~(bsize - 1); 201 npages = MIN(ppb, (round_page(neweob) - pagestart) >> PAGE_SHIFT); 202 pgssize = npages * sizeof(struct vm_page *); 203 pgs = kmem_zalloc(pgssize, KM_SLEEP); 204 205 /* 206 * adjust off to be block-aligned. 207 */ 208 209 delta = off & (bsize - 1); 210 off -= delta; 211 len += delta; 212 213 genfs_node_wrlock(vp); 214 rw_enter(uobj->vmobjlock, RW_WRITER); 215 error = VOP_GETPAGES(vp, pagestart, pgs, &npages, 0, 216 VM_PROT_WRITE, 0, PGO_SYNCIO | PGO_PASTEOF | PGO_NOBLOCKALLOC | 217 PGO_NOTIMESTAMP | PGO_GLOCKHELD); 218 if (error) { 219 genfs_node_unlock(vp); 220 goto out; 221 } 222 223 /* 224 * now allocate the range. 225 */ 226 227 error = GOP_ALLOC(vp, off, len, flags, cred); 228 genfs_node_unlock(vp); 229 230 /* 231 * if the allocation succeeded, mark all pages dirty and clear 232 * PG_RDONLY on any pages that are now fully backed by disk blocks. 233 * if the allocation failed, we do not invalidate the pages since 234 * they might have already existed and been dirty, in which case we 235 * need to keep them around. if we created the pages, they will be 236 * clean and read-only, and leaving such pages in the cache won't 237 * cause any problems. 238 */ 239 240 GOP_SIZE(vp, off + len, &eob, 0); 241 rw_enter(uobj->vmobjlock, RW_WRITER); 242 for (i = 0; i < npages; i++) { 243 KASSERT((pgs[i]->flags & PG_RELEASED) == 0); 244 if (!error) { 245 if (off <= pagestart + (i << PAGE_SHIFT) && 246 pagestart + ((i + 1) << PAGE_SHIFT) <= eob) { 247 pgs[i]->flags &= ~PG_RDONLY; 248 } 249 uvm_pagemarkdirty(pgs[i], UVM_PAGE_STATUS_DIRTY); 250 } 251 uvm_pagelock(pgs[i]); 252 uvm_pageactivate(pgs[i]); 253 uvm_pageunlock(pgs[i]); 254 } 255 uvm_page_unbusy(pgs, npages); 256 rw_exit(uobj->vmobjlock); 257 258 out: 259 kmem_free(pgs, pgssize); 260 return error; 261 } 262