/* devfs_fdesc_support.c */
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/types.h>
#include <sys/time.h>
#include <sys/proc_internal.h>
#include <sys/kernel.h>
#include <sys/resourcevar.h>
#include <sys/filedesc.h>
#include <sys/kauth.h>
#include <sys/vnode_internal.h>
#include <sys/malloc.h>
#include <sys/file_internal.h>
#include <sys/stat.h>
#include <sys/mount_internal.h>
#include <sys/namei.h>
#include <sys/dirent.h>
#include <sys/ubc.h>
#include <sys/socketvar.h>
#include <sys/pipe.h>
#include <sys/uio_internal.h>
#include <vfs/vfs_support.h>
#include <pexpert/pexpert.h>
#include <miscfs/devfs/fdesc.h>
#include <miscfs/devfs/devfs.h>
#include <miscfs/devfs/devfsdefs.h>
/*
 * Flag bits stored in fdcache_lock. fdesc_allocvp() sets FDL_LOCKED while it
 * is creating a new node and sets FDL_WANT before sleeping on a busy flag so
 * that the holder knows to issue a wakeup.
 */
#define FDL_WANT 0x01
#define FDL_LOCKED 0x02
static int fdcache_lock;
/*
 * Compile-time guard: when the three standard descriptor constants are not
 * consecutive, the bare text below is compiled and the build fails.
 */
#if (FD_STDIN != FD_STDOUT - 1) || (FD_STDOUT != FD_STDERR - 1)
FD_STDIN, FD_STDOUT, FD_STDERR must be a sequence n, n + 1, n + 2
#endif
/* Element count handed to hashinit() when the node hash table is created. */
#define NFDCACHE 3
/* Address of the hash chain for index ix (ix masked with fdhash). */
#define FD_NHASH(ix) \
(&fdhashtbl[(ix) & fdhash])
/* Hash table of fdesc nodes and its mask; both are set by devfs_fdesc_init(). */
LIST_HEAD(fdhashhead, fdescnode) * fdhashtbl;
u_long fdhash;
static int fdesc_attr(int fd, struct vnode_attr *vap, vfs_context_t a_context);
/*
 * Mutex taken by fdesc_lock()/fdesc_unlock(); it is also passed to msleep()
 * in fdesc_allocvp(). fdesc_lckgrp is the lock group it is initialised with.
 */
lck_mtx_t fdesc_mtx;
lck_grp_t *fdesc_lckgrp;
/* Acquire fdesc_mtx, the mutex guarding the fdesc hash table and fdcache_lock. */
static void
fdesc_lock(void)
{
lck_mtx_lock(&fdesc_mtx);
}
/* Release fdesc_mtx (counterpart of fdesc_lock()). */
static void
fdesc_unlock(void)
{
lck_mtx_unlock(&fdesc_mtx);
}
int
devfs_fdesc_init()
{
int error = 0;
devnode_t *rootdir = dev_root->de_dnp;
devdirent_t *direntp;
fdhashtbl = hashinit(NFDCACHE, M_CACHE, &fdhash);
fdesc_lckgrp = lck_grp_alloc_init("fdesc", NULL);
lck_mtx_init(&fdesc_mtx, fdesc_lckgrp, NULL);
DEVFS_LOCK();
dev_add_entry("fd", rootdir, DEV_DEVFD, NULL, NULL, NULL, &direntp);
devfs_fdesc_makelinks();
DEVFS_UNLOCK();
return error;
}
int
devfs_fdesc_makelinks()
{
int error = 0;
devdirent_t *stdin_ent = NULL, *stdout_ent = NULL, *stderr_ent = NULL;
devnode_t *root_devnode = dev_root->de_dnp;
char in[] = "stdin";
char out[] = "stdout";
char err[] = "stderr";
char zero[] = "fd/0";
char one[] = "fd/1";
char two[] = "fd/2";
if ((error = devfs_make_symlink(root_devnode, in, 0555, zero, &stdin_ent))) {
printf("Couldn't make stdin, err %d.\n", error);
goto bad;
}
if ((error = devfs_make_symlink(root_devnode, out, 0555, one, &stdout_ent))) {
printf("Couldn't make stdout, err %d.\n", error);
goto bad;
}
if ((error = devfs_make_symlink(root_devnode, err, 0555, two, &stderr_ent))) {
printf("Couldn't make stderr, err %d.\n", error);
goto bad;
}
return 0;
bad:
if (stdin_ent) {
dev_free_name(stdin_ent);
}
if (stdout_ent) {
dev_free_name(stdout_ent);
}
if (stderr_ent) {
dev_free_name(stderr_ent);
}
return error;
}
/*
 * Find or create the fdesc vnode identified by (ix, mp).
 *
 *   ftype  node type recorded in the new node's fd_type
 *   ix     index used both to pick the hash chain and to match nodes
 *   mp     mount the vnode must belong to
 *   vpp    out: the vnode that was found or created
 *   vtype  vnode type; written to v_type on a cache hit and passed to
 *          vnode_create() for a new node
 *   fdno   descriptor number recorded in the new node's fd_fd
 *
 * Returns 0 on success or the error from vnode_create().
 *
 * Locking: the hash chain is walked under fdesc_mtx. Creation of a new node
 * is serialised with the FDL_LOCKED/FDL_WANT bits in fdcache_lock so the
 * mutex can be dropped around the allocation and vnode_create().
 */
int
fdesc_allocvp(fdntype ftype, int ix, struct mount *mp, struct vnode **vpp, enum vtype vtype, int fdno)
{
	struct fdhashhead *fc;
	struct fdescnode *fd;
	struct vnode *vp;
	int error = 0;
	int vid = 0;
	struct vnode_fsparam vfsp;

	fdesc_lock();
	fc = FD_NHASH(ix);
loop:
	for (fd = fc->lh_first; fd != 0; fd = fd->fd_hash.le_next) {
		if (fd->fd_ix == ix && vnode_mount(fd->fd_vnode) == mp) {
			/*
			 * Snapshot the vnode pointer and its vid while the lock
			 * is held. fdesc_reclaim() frees the node under this
			 * same lock, so fd must not be touched once it is
			 * dropped.
			 */
			vp = fd->fd_vnode;
			vid = vnode_vid(vp);
			fdesc_unlock();
			if (vnode_getwithvid(vp, vid)) {
				/* Could not get the vnode with that vid; rescan the chain. */
				fdesc_lock();
				goto loop;
			}
			*vpp = vp;
			vp->v_type = (uint16_t)vtype;
			return error;
		}
	}

	/* Not cached: wait until no other thread is creating a node. */
	if (fdcache_lock & FDL_LOCKED) {
		fdcache_lock |= FDL_WANT;
		msleep((caddr_t) &fdcache_lock, &fdesc_mtx, PINOD, "fdesc_allocvp", NULL);
		/* Another thread may have inserted the node meanwhile. */
		goto loop;
	}
	fdcache_lock |= FDL_LOCKED;
	fdesc_unlock();

	MALLOC(fd, void *, sizeof(struct fdescnode), M_TEMP, M_WAITOK);

	vfsp.vnfs_mp = mp;
	vfsp.vnfs_vtype = vtype;
	vfsp.vnfs_str = "fdesc";
	vfsp.vnfs_dvp = NULL;
	vfsp.vnfs_fsnode = fd;
	vfsp.vnfs_cnp = NULL;
	vfsp.vnfs_vops = fdesc_vnodeop_p;
	vfsp.vnfs_rdev = 0;
	vfsp.vnfs_filesize = 0;
	vfsp.vnfs_flags = VNFS_NOCACHE | VNFS_CANTCACHE;
	vfsp.vnfs_marksystem = 0;
	vfsp.vnfs_markroot = 0;

	error = vnode_create(VNCREATE_FLAVOR, VCREATESIZE, &vfsp, vpp);
	if (error) {
		FREE(fd, M_TEMP);
		fdesc_lock();
		goto out;
	}

	(*vpp)->v_tag = VT_FDESC;
	fd->fd_vnode = *vpp;
	fd->fd_type = ftype;
	fd->fd_link = NULL;
	fd->fd_ix = ix;
	fd->fd_fd = fdno;

	fdesc_lock();
	LIST_INSERT_HEAD(fc, fd, fd_hash);
out:
	/* Entered with fdesc_mtx held: release the creation flag, wake waiters. */
	fdcache_lock &= ~FDL_LOCKED;
	if (fdcache_lock & FDL_WANT) {
		fdcache_lock &= ~FDL_WANT;
		wakeup((caddr_t) &fdcache_lock);
	}
	fdesc_unlock();
	return error;
}
/*
 * Lookup in the fd directory.
 *
 * "." yields the directory itself (after vnode_get()). Any other name is
 * parsed as a decimal descriptor number:
 *   - a name with a non-digit left over after parsing -> ENOENT
 *   - a number outside the calling process's descriptor table, an empty
 *     slot, or a slot marked UF_RESERVED              -> EBADF
 * Otherwise the matching fdesc vnode is obtained from fdesc_allocvp().
 * On every failure after the "." case *a_vpp is set to NULL.
 */
int
devfs_devfd_lookup(struct vnop_lookup_args *ap)
{
	struct componentname *comp = ap->a_cnp;
	struct vnode *dir = ap->a_dvp;
	struct vnode **result = ap->a_vpp;
	char *cursor = comp->cn_nameptr;
	struct proc *proc = vfs_context_proc(ap->a_context);
	const int table_size = proc->p_fd->fd_nfiles;
	struct vnode *found;
	int descriptor = 0;
	int rc;

	if (comp->cn_namelen == 1 && *cursor == '.') {
		*result = dir;
		return vnode_get(dir);
	}

	/* Accumulate digits; stop as soon as the value leaves the table range. */
	while (*cursor >= '0' && *cursor <= '9') {
		const int digit = *cursor - '0';

		cursor++;
		descriptor = 10 * descriptor + digit;
		if (descriptor >= table_size) {
			break;
		}
	}

	if (*cursor != '\0') {
		rc = ENOENT;
	} else if (descriptor < 0 || descriptor >= table_size ||
	    *fdfile(proc, descriptor) == NULL ||
	    (*fdflags(proc, descriptor) & UF_RESERVED)) {
		rc = EBADF;
	} else {
		rc = fdesc_allocvp(Fdesc, FD_DESC + descriptor, dir->v_mount, &found, VNON, descriptor);
		if (rc == 0) {
			*result = found;
			return 0;
		}
	}

	*result = NULL;
	return rc;
}
/*
 * Open of an fdesc vnode.
 *
 * Returns EINVAL when the context has no thread. For an Fdesc node the
 * node's descriptor number is stored in the calling thread's uu_dupfd and
 * ENODEV is returned (presumably a signal for the caller to duplicate that
 * descriptor -- confirm against the open path). Any other node type panics.
 */
int
fdesc_open(struct vnop_open_args *ap)
{
	thread_t caller = vfs_context_thread(ap->a_context);
	struct vnode *node_vp = ap->a_vp;
	uthread_t uthr;
	int rc = 0;

	if (caller == NULL) {
		return EINVAL;
	}

	uthr = get_bsdthread_info(caller);
	if (VTOFDESC(node_vp)->fd_type == Fdesc) {
		uthr->uu_dupfd = VTOFDESC(node_vp)->fd_fd;
		rc = ENODEV;
	} else {
		panic("Invalid type for fdesc node!");
	}
	return rc;
}
/*
 * Fill *vap with the attributes of whatever descriptor fd refers to in the
 * process of a_context.
 *
 *   vnode        -> authorize attribute/security read, then vnode_getattr();
 *                   for directories the execute bits are cleared from va_mode
 *   socket/pipe  -> soo_stat()/pipe_stat() into a struct stat, copied field
 *                   by field into vap
 *   anything else-> EBADF
 *
 * Returns 0 on success or the first error encountered. The fileproc
 * reference taken by fp_lookup() is dropped before returning.
 */
static int
fdesc_attr(int fd, struct vnode_attr *vap, vfs_context_t a_context)
{
	struct proc *owner = vfs_context_proc(a_context);
	struct fileproc *fp;
	struct stat sb;
	int rc;

	rc = fp_lookup(owner, fd, &fp, 0);
	if (rc != 0) {
		return rc;
	}

	switch (FILEGLOB_DTYPE(fp->fp_glob)) {
	case DTYPE_VNODE: {
		struct vnode *backing = (struct vnode *) fp->fp_glob->fg_data;

		rc = vnode_getwithref(backing);
		if (rc != 0) {
			break;
		}
		rc = vnode_authorize(backing, NULL,
		    KAUTH_VNODE_READ_ATTRIBUTES | KAUTH_VNODE_READ_SECURITY,
		    a_context);
		if (rc == 0) {
			rc = vnode_getattr(backing, vap, a_context);
		}
		/* Strip owner/group/other execute bits from directories. */
		if (rc == 0 && vap->va_type == VDIR) {
			vap->va_mode &= ~((VEXEC) | (VEXEC >> 3) | (VEXEC >> 6));
		}
		(void)vnode_put(backing);
		break;
	}
	case DTYPE_SOCKET:
	case DTYPE_PIPE:
#if SOCKETS
		if (FILEGLOB_DTYPE(fp->fp_glob) == DTYPE_SOCKET) {
			rc = soo_stat((struct socket *)fp->fp_glob->fg_data, (void *)&sb, 0);
		} else
#endif
		rc = pipe_stat((struct pipe *)fp->fp_glob->fg_data, (void *)&sb, 0);
		if (rc != 0) {
			break;
		}
		if (FILEGLOB_DTYPE(fp->fp_glob) == DTYPE_SOCKET) {
			VATTR_RETURN(vap, va_type, VSOCK);
		} else {
			VATTR_RETURN(vap, va_type, VFIFO);
		}
		/* Translate the stat result into vnode attributes. */
		VATTR_RETURN(vap, va_mode, sb.st_mode);
		VATTR_RETURN(vap, va_nlink, sb.st_nlink);
		VATTR_RETURN(vap, va_uid, sb.st_uid);
		VATTR_RETURN(vap, va_gid, sb.st_gid);
		VATTR_RETURN(vap, va_fsid, sb.st_dev);
		VATTR_RETURN(vap, va_fileid, sb.st_ino);
		VATTR_RETURN(vap, va_data_size, sb.st_size);
		VATTR_RETURN(vap, va_access_time, sb.st_atimespec);
		VATTR_RETURN(vap, va_modify_time, sb.st_mtimespec);
		VATTR_RETURN(vap, va_change_time, sb.st_ctimespec);
		VATTR_RETURN(vap, va_gen, sb.st_gen);
		VATTR_RETURN(vap, va_flags, sb.st_flags);
		VATTR_RETURN(vap, va_rdev, sb.st_rdev);
		VATTR_RETURN(vap, va_total_alloc, sb.st_blocks * sb.st_blksize);
		VATTR_RETURN(vap, va_acl, NULL);
		break;
	default:
		rc = EBADF;
	}

	fp_drop(owner, fd, fp, 0);
	return rc;
}
int
fdesc_getattr(struct vnop_getattr_args *ap)
{
struct vnode *vp = ap->a_vp;
struct vnode_attr *vap = ap->a_vap;
unsigned fd;
int error = 0;
switch (VTOFDESC(vp)->fd_type) {
case Fdesc:
fd = VTOFDESC(vp)->fd_fd;
error = fdesc_attr(fd, vap, ap->a_context);
break;
default:
panic("Invalid type for an fdesc node!\n");
break;
}
if (error == 0) {
vp->v_type = (uint16_t)vap->va_type;
vnode_setneedinactive(vp);
}
return error;
}
/*
 * setattr for an fdesc vnode: apply the requested attributes to the object
 * behind the node's descriptor.
 *
 *   vnode        -> forwarded to vnode_setattr()
 *   socket/pipe  -> accepted without doing anything (returns 0)
 *   anything else-> EBADF
 *
 * A node whose type is not Fdesc panics. The fileproc reference taken by
 * fp_lookup() is dropped before returning.
 */
int
fdesc_setattr(struct vnop_setattr_args *ap)
{
	struct proc *owner = vfs_context_proc(ap->a_context);
	struct fileproc *fp;
	unsigned descriptor;
	int rc;

	if (VTOFDESC(ap->a_vp)->fd_type != Fdesc) {
		panic("Invalid type for an fdesc node!\n");
		return EACCES;
	}

	descriptor = VTOFDESC(ap->a_vp)->fd_fd;
	rc = fp_lookup(owner, descriptor, &fp, 0);
	if (rc != 0) {
		return rc;
	}

	switch (FILEGLOB_DTYPE(fp->fp_glob)) {
	case DTYPE_VNODE: {
		struct vnode *backing = (struct vnode *) fp->fp_glob->fg_data;

		rc = vnode_getwithref(backing);
		if (rc == 0) {
			rc = vnode_setattr(backing, ap->a_vap, ap->a_context);
			(void)vnode_put(backing);
		}
		break;
	}
	case DTYPE_SOCKET:
	case DTYPE_PIPE:
		rc = 0;
		break;
	default:
		rc = EBADF;
		break;
	}

	fp_drop(owner, descriptor, fp, 0);
	return rc;
}
#define UIO_MX 16
int
devfs_devfd_readdir(struct vnop_readdir_args *ap)
{
struct uio *uio = ap->a_uio;
struct proc *p = current_proc();
off_t i;
int error;
if (ap->a_flags & (VNODE_READDIR_EXTENDED | VNODE_READDIR_REQSEEKOFF)) {
return EINVAL;
}
if (uio_resid(uio) < UIO_MX) {
return EINVAL;
}
i = uio->uio_offset / UIO_MX;
error = 0;
while (uio_resid(uio) >= UIO_MX) {
if (i >= p->p_fd->fd_nfiles || i < 0) {
break;
}
if (*fdfile(p, i) != NULL && !(*fdflags(p, i) & UF_RESERVED)) {
struct dirent d;
struct dirent *dp = &d;
bzero((caddr_t) dp, UIO_MX);
dp->d_namlen = (__uint8_t)scnprintf(dp->d_name, sizeof(dp->d_name),
"%lld", i);
dp->d_reclen = UIO_MX;
dp->d_type = DT_UNKNOWN;
dp->d_fileno = (ino_t)i + FD_STDIN;
error = uiomove((caddr_t) dp, UIO_MX, uio);
if (error) {
break;
}
}
i++;
}
uio->uio_offset = i * UIO_MX;
return error;
}
/* Reading through an fdesc vnode is not supported; always returns ENOTSUP. */
int
fdesc_read(__unused struct vnop_read_args *ap)
{
return ENOTSUP;
}
/* Writing through an fdesc vnode is not supported; always returns ENOTSUP. */
int
fdesc_write(__unused struct vnop_write_args *ap)
{
return ENOTSUP;
}
/* ioctl on an fdesc vnode is not supported; always returns ENOTSUP. */
int
fdesc_ioctl(__unused struct vnop_ioctl_args *ap)
{
return ENOTSUP;
}
/* select on an fdesc vnode is not supported; always returns ENOTSUP. */
int
fdesc_select(__unused struct vnop_select_args *ap)
{
return ENOTSUP;
}
/*
 * Inactive hook: reset the vnode's type to VNON (fdesc_getattr() sets it to
 * the type of the underlying descriptor). Always returns 0.
 */
int
fdesc_inactive(struct vnop_inactive_args *ap)
{
	ap->a_vp->v_type = VNON;
	return 0;
}
/*
 * Reclaim hook: with fdesc_mtx held, unlink the node from its hash chain,
 * free it and clear the vnode's v_data pointer. Always returns 0.
 */
int
fdesc_reclaim(struct vnop_reclaim_args *ap)
{
	struct vnode *dying = ap->a_vp;
	struct fdescnode *node = VTOFDESC(dying);

	fdesc_lock();
	LIST_REMOVE(node, fd_hash);
	FREE(dying->v_data, M_TEMP);
	dying->v_data = NULL;
	fdesc_unlock();

	return 0;
}
/*
 * pathconf for fdesc vnodes: store the limit selected by a_name in
 * *a_retval and return 0, or return EINVAL (leaving *a_retval untouched)
 * for names that are not handled here.
 */
int
fdesc_pathconf(struct vnop_pathconf_args *ap)
{
	int limit;

	switch (ap->a_name) {
	case _PC_LINK_MAX:
		limit = LINK_MAX;
		break;
	case _PC_MAX_CANON:
		limit = MAX_CANON;
		break;
	case _PC_MAX_INPUT:
		limit = MAX_INPUT;
		break;
	case _PC_PIPE_BUF:
		limit = PIPE_BUF;
		break;
	case _PC_CHOWN_RESTRICTED:
		limit = 200112;
		break;
	case _PC_VDISABLE:
		limit = _POSIX_VDISABLE;
		break;
	default:
		return EINVAL;
	}

	*ap->a_retval = limit;
	return 0;
}
/*
 * Generic "operation not supported" handler; always returns ENOTSUP.
 * It is installed as the strategy operation through the fdesc_strategy macro.
 */
int
fdesc_badop(void)
{
return ENOTSUP;
}
/* Generic function-pointer type every handler is cast to in the table below. */
#define VOPFUNC int (*)(void *)
/*
 * Operations with no dedicated implementation in this file are aliased to
 * shared handlers (eopnotsupp, nullop, nop_revoke, fdesc_badop), cast to
 * the argument type of the operation they stand in for.
 */
#define fdesc_create (int (*) (struct vnop_create_args *))eopnotsupp
#define fdesc_mknod (int (*) (struct vnop_mknod_args *))eopnotsupp
#define fdesc_close (int (*) (struct vnop_close_args *))nullop
#define fdesc_access (int (*) (struct vnop_access_args *))nullop
#define fdesc_mmap (int (*) (struct vnop_mmap_args *))eopnotsupp
#define fdesc_revoke nop_revoke
#define fdesc_fsync (int (*) (struct vnop_fsync_args *))nullop
#define fdesc_remove (int (*) (struct vnop_remove_args *))eopnotsupp
#define fdesc_link (int (*) (struct vnop_link_args *))eopnotsupp
#define fdesc_rename (int (*) (struct vnop_rename_args *))eopnotsupp
#define fdesc_mkdir (int (*) (struct vnop_mkdir_args *))eopnotsupp
#define fdesc_rmdir (int (*) (struct vnop_rmdir_args *))eopnotsupp
#define fdesc_symlink (int (*) (struct vnop_symlink_args *))eopnotsupp
#define fdesc_strategy (int (*) (struct vnop_strategy_args *))fdesc_badop
#define fdesc_advlock (int (*) (struct vnop_advlock_args *))eopnotsupp
#define fdesc_bwrite (int (*) (struct vnop_bwrite_args *))eopnotsupp
#define fdesc_blktooff (int (*) (struct vnop_blktooff_args *))eopnotsupp
#define fdesc_offtoblk (int (*) (struct vnop_offtoblk_args *))eopnotsupp
#define fdesc_blockmap (int (*) (struct vnop_blockmap_args *))eopnotsupp
/*
 * Operation vector for fdesc vnodes; fdesc_allocvp() passes it to
 * vnode_create() as vnfs_vops. It is referenced by
 * devfs_fdesc_vnodeop_opv_desc below.
 */
int(**fdesc_vnodeop_p)(void *);
const struct vnodeopv_entry_desc devfs_fdesc_vnodeop_entries[] = {
{ .opve_op = &vnop_default_desc, .opve_impl = (VOPFUNC)vn_default_error },
{ .opve_op = &vnop_lookup_desc, .opve_impl = (VOPFUNC)vn_default_error},
{ .opve_op = &vnop_create_desc, .opve_impl = (VOPFUNC)fdesc_create },
{ .opve_op = &vnop_mknod_desc, .opve_impl = (VOPFUNC)fdesc_mknod },
{ .opve_op = &vnop_open_desc, .opve_impl = (VOPFUNC)fdesc_open },
{ .opve_op = &vnop_close_desc, .opve_impl = (VOPFUNC)fdesc_close },
{ .opve_op = &vnop_access_desc, .opve_impl = (VOPFUNC)fdesc_access },
{ .opve_op = &vnop_getattr_desc, .opve_impl = (VOPFUNC)fdesc_getattr },
{ .opve_op = &vnop_setattr_desc, .opve_impl = (VOPFUNC)fdesc_setattr },
{ .opve_op = &vnop_read_desc, .opve_impl = (VOPFUNC)fdesc_read },
{ .opve_op = &vnop_write_desc, .opve_impl = (VOPFUNC)fdesc_write },
{ .opve_op = &vnop_ioctl_desc, .opve_impl = (VOPFUNC)fdesc_ioctl },
{ .opve_op = &vnop_select_desc, .opve_impl = (VOPFUNC)fdesc_select },
{ .opve_op = &vnop_revoke_desc, .opve_impl = (VOPFUNC)fdesc_revoke },
{ .opve_op = &vnop_mmap_desc, .opve_impl = (VOPFUNC)fdesc_mmap },
{ .opve_op = &vnop_fsync_desc, .opve_impl = (VOPFUNC)fdesc_fsync },
{ .opve_op = &vnop_remove_desc, .opve_impl = (VOPFUNC)fdesc_remove },
{ .opve_op = &vnop_link_desc, .opve_impl = (VOPFUNC)fdesc_link },
{ .opve_op = &vnop_rename_desc, .opve_impl = (VOPFUNC)fdesc_rename },
{ .opve_op = &vnop_mkdir_desc, .opve_impl = (VOPFUNC)fdesc_mkdir },
{ .opve_op = &vnop_rmdir_desc, .opve_impl = (VOPFUNC)fdesc_rmdir },
{ .opve_op = &vnop_symlink_desc, .opve_impl = (VOPFUNC)fdesc_symlink },
{ .opve_op = &vnop_readdir_desc, .opve_impl = (VOPFUNC)vn_default_error},
{ .opve_op = &vnop_readlink_desc, .opve_impl = (VOPFUNC)err_readlink},
{ .opve_op = &vnop_inactive_desc, .opve_impl = (VOPFUNC)fdesc_inactive },
{ .opve_op = &vnop_reclaim_desc, .opve_impl = (VOPFUNC)fdesc_reclaim },
{ .opve_op = &vnop_strategy_desc, .opve_impl = (VOPFUNC)fdesc_strategy },
{ .opve_op = &vnop_pathconf_desc, .opve_impl = (VOPFUNC)fdesc_pathconf },
{ .opve_op = &vnop_advlock_desc, .opve_impl = (VOPFUNC)fdesc_advlock },
{ .opve_op = &vnop_bwrite_desc, .opve_impl = (VOPFUNC)fdesc_bwrite },
{ .opve_op = &vnop_pagein_desc, .opve_impl = (VOPFUNC)err_pagein },
{ .opve_op = &vnop_pageout_desc, .opve_impl = (VOPFUNC)err_pageout },
{ .opve_op = &vnop_copyfile_desc, .opve_impl = (VOPFUNC)err_copyfile },
{ .opve_op = &vnop_blktooff_desc, .opve_impl = (VOPFUNC)fdesc_blktooff },
{ .opve_op = &vnop_blktooff_desc, .opve_impl = (VOPFUNC)fdesc_offtoblk },
{ .opve_op = &vnop_blockmap_desc, .opve_impl = (VOPFUNC)fdesc_blockmap },
{ .opve_op = (struct vnodeop_desc*)NULL, .opve_impl = (VOPFUNC)NULL }
};
/*
 * Descriptor pairing the fdesc operation vector pointer (fdesc_vnodeop_p)
 * with the entry table it is to be built from.
 */
const struct vnodeopv_desc devfs_fdesc_vnodeop_opv_desc =
{ .opv_desc_vector_p = &fdesc_vnodeop_p, .opv_desc_ops = devfs_fdesc_vnodeop_entries };