// SPDX-License-Identifier: GPL-2.0-or-later /* * Copyright (C) 2024, Alibaba Cloud */ #include #include #include "internal.h" #include "xattr.h" #include "../internal.h" static struct vfsmount *erofs_ishare_mnt; static inline bool erofs_is_ishare_inode(struct inode *inode) { /* assumed FS_ONDEMAND is excluded with FS_PAGE_CACHE_SHARE feature */ return inode->i_sb->s_type == &erofs_anon_fs_type; } static int erofs_ishare_iget5_eq(struct inode *inode, void *data) { struct erofs_inode_fingerprint *fp1 = &EROFS_I(inode)->fingerprint; struct erofs_inode_fingerprint *fp2 = data; return fp1->size == fp2->size && !memcmp(fp1->opaque, fp2->opaque, fp2->size); } static int erofs_ishare_iget5_set(struct inode *inode, void *data) { struct erofs_inode *vi = EROFS_I(inode); vi->fingerprint = *(struct erofs_inode_fingerprint *)data; INIT_LIST_HEAD(&vi->ishare_list); spin_lock_init(&vi->ishare_lock); return 0; } bool erofs_ishare_fill_inode(struct inode *inode) { struct erofs_sb_info *sbi = EROFS_SB(inode->i_sb); struct erofs_inode *vi = EROFS_I(inode); const struct address_space_operations *aops; struct erofs_inode_fingerprint fp; struct inode *sharedinode; unsigned long hash; aops = erofs_get_aops(inode, true); if (IS_ERR(aops)) return false; if (erofs_xattr_fill_inode_fingerprint(&fp, inode, sbi->domain_id)) return false; hash = xxh32(fp.opaque, fp.size, 0); sharedinode = iget5_locked(erofs_ishare_mnt->mnt_sb, hash, erofs_ishare_iget5_eq, erofs_ishare_iget5_set, &fp); if (!sharedinode) { kfree(fp.opaque); return false; } if (inode_state_read_once(sharedinode) & I_NEW) { sharedinode->i_mapping->a_ops = aops; sharedinode->i_size = vi->vfs_inode.i_size; unlock_new_inode(sharedinode); } else { kfree(fp.opaque); if (aops != sharedinode->i_mapping->a_ops) { iput(sharedinode); return false; } if (sharedinode->i_size != vi->vfs_inode.i_size) { _erofs_printk(inode->i_sb, KERN_WARNING "size(%lld:%lld) not matches for the same fingerprint\n", vi->vfs_inode.i_size, sharedinode->i_size); iput(sharedinode); return false; } } vi->sharedinode = sharedinode; INIT_LIST_HEAD(&vi->ishare_list); spin_lock(&EROFS_I(sharedinode)->ishare_lock); list_add(&vi->ishare_list, &EROFS_I(sharedinode)->ishare_list); spin_unlock(&EROFS_I(sharedinode)->ishare_lock); return true; } void erofs_ishare_free_inode(struct inode *inode) { struct erofs_inode *vi = EROFS_I(inode); struct inode *sharedinode = vi->sharedinode; if (!sharedinode) return; spin_lock(&EROFS_I(sharedinode)->ishare_lock); list_del(&vi->ishare_list); spin_unlock(&EROFS_I(sharedinode)->ishare_lock); iput(sharedinode); vi->sharedinode = NULL; } static int erofs_ishare_file_open(struct inode *inode, struct file *file) { struct inode *sharedinode = EROFS_I(inode)->sharedinode; struct file *realfile; if (file->f_flags & O_DIRECT) return -EINVAL; realfile = alloc_empty_backing_file(O_RDONLY|O_NOATIME, current_cred()); if (IS_ERR(realfile)) return PTR_ERR(realfile); ihold(sharedinode); realfile->f_op = &erofs_file_fops; realfile->f_inode = sharedinode; realfile->f_mapping = sharedinode->i_mapping; path_get(&file->f_path); backing_file_set_user_path(realfile, &file->f_path); file_ra_state_init(&realfile->f_ra, file->f_mapping); realfile->private_data = EROFS_I(inode); file->private_data = realfile; return 0; } static int erofs_ishare_file_release(struct inode *inode, struct file *file) { struct file *realfile = file->private_data; iput(realfile->f_inode); fput(realfile); file->private_data = NULL; return 0; } static ssize_t erofs_ishare_file_read_iter(struct kiocb *iocb, struct iov_iter *to) { struct file *realfile = iocb->ki_filp->private_data; struct kiocb dedup_iocb; ssize_t nread; if (!iov_iter_count(to)) return 0; kiocb_clone(&dedup_iocb, iocb, realfile); nread = filemap_read(&dedup_iocb, to, 0); iocb->ki_pos = dedup_iocb.ki_pos; return nread; } static int erofs_ishare_mmap(struct file *file, struct vm_area_struct *vma) { struct file *realfile = file->private_data; vma_set_file(vma, realfile); return generic_file_readonly_mmap(file, vma); } static int erofs_ishare_fadvise(struct file *file, loff_t offset, loff_t len, int advice) { return vfs_fadvise(file->private_data, offset, len, advice); } const struct file_operations erofs_ishare_fops = { .open = erofs_ishare_file_open, .llseek = generic_file_llseek, .read_iter = erofs_ishare_file_read_iter, .mmap = erofs_ishare_mmap, .release = erofs_ishare_file_release, .get_unmapped_area = thp_get_unmapped_area, .splice_read = filemap_splice_read, .fadvise = erofs_ishare_fadvise, }; struct inode *erofs_real_inode(struct inode *inode, bool *need_iput) { struct erofs_inode *vi, *vi_share; struct inode *realinode; *need_iput = false; if (!erofs_is_ishare_inode(inode)) return inode; vi_share = EROFS_I(inode); spin_lock(&vi_share->ishare_lock); /* fetch any one as real inode */ DBG_BUGON(list_empty(&vi_share->ishare_list)); list_for_each_entry(vi, &vi_share->ishare_list, ishare_list) { realinode = igrab(&vi->vfs_inode); if (realinode) { *need_iput = true; break; } } spin_unlock(&vi_share->ishare_lock); DBG_BUGON(!realinode); return realinode; } int __init erofs_init_ishare(void) { erofs_ishare_mnt = kern_mount(&erofs_anon_fs_type); return PTR_ERR_OR_ZERO(erofs_ishare_mnt); } void erofs_exit_ishare(void) { kern_unmount(erofs_ishare_mnt); }