freebsd-nq/sys/i386/linux/linux_file.c
Doug Rabson d41979a063 Fix linux_getdents so that it can cope with filesystems which translate
the directory format (ext2fs, cd9660).  For these filesystems, it must use
cookies to find the correct offset to use for subsequent reads.  Without it,
linux /bin/ls tends to loop re-reading the same block over and over again.

2.2 candidate.
1997-04-05 14:50:56 +00:00

806 lines
19 KiB
C

/*-
* Copyright (c) 1994-1995 Søren Schmidt
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer
* in this position and unchanged.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. The name of the author may not be used to endorse or promote products
* derived from this software withough specific prior written permission
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
* IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
* $Id: linux_file.c,v 1.12 1997/03/24 11:24:29 bde Exp $
*/
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/sysproto.h>
#include <sys/fcntl.h>
#include <sys/file.h>
#include <sys/filedesc.h>
#include <sys/proc.h>
#include <sys/stat.h>
#include <sys/vnode.h>
#include <sys/malloc.h>
#include <sys/exec.h>
#include <sys/dirent.h>
#include <sys/sysproto.h>
#include <sys/conf.h>
#include <sys/tty.h>
#include <ufs/ufs/dir.h>
#include <i386/linux/linux.h>
#include <i386/linux/linux_proto.h>
#include <i386/linux/linux_util.h>
int
linux_creat(struct proc *p, struct linux_creat_args *args, int *retval)
{
struct open_args /* {
char *path;
int flags;
int mode;
} */ bsd_open_args;
caddr_t sg;
sg = stackgap_init();
CHECKALTCREAT(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): creat(%s, %d)\n",
p->p_pid, args->path, args->mode);
#endif
bsd_open_args.path = args->path;
bsd_open_args.mode = args->mode;
bsd_open_args.flags = O_WRONLY | O_CREAT | O_TRUNC;
return open(p, &bsd_open_args, retval);
}
int
linux_open(struct proc *p, struct linux_open_args *args, int *retval)
{
struct open_args /* {
char *path;
int flags;
int mode;
} */ bsd_open_args;
int error;
caddr_t sg;
sg = stackgap_init();
if (args->flags & LINUX_O_CREAT)
CHECKALTCREAT(p, &sg, args->path);
else
CHECKALTEXIST(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): open(%s, 0x%x, 0x%x)\n",
p->p_pid, args->path, args->flags, args->mode);
#endif
bsd_open_args.flags = 0;
if (args->flags & LINUX_O_RDONLY)
bsd_open_args.flags |= O_RDONLY;
if (args->flags & LINUX_O_WRONLY)
bsd_open_args.flags |= O_WRONLY;
if (args->flags & LINUX_O_RDWR)
bsd_open_args.flags |= O_RDWR;
if (args->flags & LINUX_O_NDELAY)
bsd_open_args.flags |= O_NONBLOCK;
if (args->flags & LINUX_O_APPEND)
bsd_open_args.flags |= O_APPEND;
if (args->flags & LINUX_O_SYNC)
bsd_open_args.flags |= O_FSYNC;
if (args->flags & LINUX_O_NONBLOCK)
bsd_open_args.flags |= O_NONBLOCK;
if (args->flags & LINUX_FASYNC)
bsd_open_args.flags |= O_ASYNC;
if (args->flags & LINUX_O_CREAT)
bsd_open_args.flags |= O_CREAT;
if (args->flags & LINUX_O_TRUNC)
bsd_open_args.flags |= O_TRUNC;
if (args->flags & LINUX_O_EXCL)
bsd_open_args.flags |= O_EXCL;
if (args->flags & LINUX_O_NOCTTY)
bsd_open_args.flags |= O_NOCTTY;
bsd_open_args.path = args->path;
bsd_open_args.mode = args->mode;
error = open(p, &bsd_open_args, retval);
if (!error && !(bsd_open_args.flags & O_NOCTTY) &&
SESS_LEADER(p) && !(p->p_flag & P_CONTROLT)) {
struct filedesc *fdp = p->p_fd;
struct file *fp = fdp->fd_ofiles[*retval];
if (fp->f_type == DTYPE_VNODE)
(fp->f_ops->fo_ioctl)(fp, TIOCSCTTY, (caddr_t) 0, p);
}
#ifdef DEBUG
printf("Linux-emul(%d): open returns error %d\n",
p->p_pid, error);
#endif
return error;
}
struct linux_flock {
short l_type;
short l_whence;
linux_off_t l_start;
linux_off_t l_len;
linux_pid_t l_pid;
};
static void
linux_to_bsd_flock(struct linux_flock *linux_flock, struct flock *bsd_flock)
{
switch (linux_flock->l_type) {
case LINUX_F_RDLCK:
bsd_flock->l_type = F_RDLCK;
break;
case LINUX_F_WRLCK:
bsd_flock->l_type = F_WRLCK;
break;
case LINUX_F_UNLCK:
bsd_flock->l_type = F_UNLCK;
break;
}
bsd_flock->l_whence = linux_flock->l_whence;
bsd_flock->l_start = (off_t)linux_flock->l_start;
bsd_flock->l_len = (off_t)linux_flock->l_len;
bsd_flock->l_pid = (pid_t)linux_flock->l_pid;
}
static void
bsd_to_linux_flock(struct flock *bsd_flock, struct linux_flock *linux_flock)
{
switch (bsd_flock->l_type) {
case F_RDLCK:
linux_flock->l_type = LINUX_F_RDLCK;
break;
case F_WRLCK:
linux_flock->l_type = LINUX_F_WRLCK;
break;
case F_UNLCK:
linux_flock->l_type = LINUX_F_UNLCK;
break;
}
linux_flock->l_whence = bsd_flock->l_whence;
linux_flock->l_start = (linux_off_t)bsd_flock->l_start;
linux_flock->l_len = (linux_off_t)bsd_flock->l_len;
linux_flock->l_pid = (linux_pid_t)bsd_flock->l_pid;
}
int
linux_fcntl(struct proc *p, struct linux_fcntl_args *args, int *retval)
{
int error, result;
struct fcntl_args /* {
int fd;
int cmd;
int arg;
} */ fcntl_args;
struct linux_flock linux_flock;
struct flock *bsd_flock;
struct filedesc *fdp;
struct file *fp;
struct vnode *vp;
struct vattr va;
long pgid;
struct pgrp *pgrp;
struct tty *tp, *(*d_tty) __P((dev_t));
caddr_t sg;
sg = stackgap_init();
bsd_flock = (struct flock *)stackgap_alloc(&sg, sizeof(struct flock));
d_tty = NULL;
#ifdef DEBUG
printf("Linux-emul(%d): fcntl(%d, %08x, *)\n",
p->p_pid, args->fd, args->cmd);
#endif
fcntl_args.fd = args->fd;
fcntl_args.arg = 0;
switch (args->cmd) {
case LINUX_F_DUPFD:
fcntl_args.cmd = F_DUPFD;
return fcntl(p, &fcntl_args, retval);
case LINUX_F_GETFD:
fcntl_args.cmd = F_GETFD;
return fcntl(p, &fcntl_args, retval);
case LINUX_F_SETFD:
fcntl_args.cmd = F_SETFD;
return fcntl(p, &fcntl_args, retval);
case LINUX_F_GETFL:
fcntl_args.cmd = F_GETFL;
error = fcntl(p, &fcntl_args, &result);
*retval = 0;
if (result & O_RDONLY) *retval |= LINUX_O_RDONLY;
if (result & O_WRONLY) *retval |= LINUX_O_WRONLY;
if (result & O_RDWR) *retval |= LINUX_O_RDWR;
if (result & O_NDELAY) *retval |= LINUX_O_NONBLOCK;
if (result & O_APPEND) *retval |= LINUX_O_APPEND;
if (result & O_FSYNC) *retval |= LINUX_O_SYNC;
return error;
case LINUX_F_SETFL:
if (args->arg & LINUX_O_NDELAY) fcntl_args.arg |= O_NONBLOCK;
if (args->arg & LINUX_O_APPEND) fcntl_args.arg |= O_APPEND;
if (args->arg & LINUX_O_SYNC) fcntl_args.arg |= O_FSYNC;
fcntl_args.cmd = F_SETFL;
return fcntl(p, &fcntl_args, retval);
case LINUX_F_GETLK:
if ((error = copyin((caddr_t)args->arg, (caddr_t)&linux_flock,
sizeof(struct linux_flock))))
return error;
linux_to_bsd_flock(&linux_flock, bsd_flock);
fcntl_args.cmd = F_GETLK;
fcntl_args.arg = (int)bsd_flock;
if (error = fcntl(p, &fcntl_args, retval))
return error;
bsd_to_linux_flock(bsd_flock, &linux_flock);
return copyout((caddr_t)&linux_flock, (caddr_t)args->arg,
sizeof(struct linux_flock));
case LINUX_F_SETLK:
if ((error = copyin((caddr_t)args->arg, (caddr_t)&linux_flock,
sizeof(struct linux_flock))))
return error;
linux_to_bsd_flock(&linux_flock, bsd_flock);
fcntl_args.cmd = F_SETLK;
fcntl_args.arg = (int)bsd_flock;
return fcntl(p, &fcntl_args, retval);
case LINUX_F_SETLKW:
if ((error = copyin((caddr_t)args->arg, (caddr_t)&linux_flock,
sizeof(struct linux_flock))))
return error;
linux_to_bsd_flock(&linux_flock, bsd_flock);
fcntl_args.cmd = F_SETLKW;
fcntl_args.arg = (int)bsd_flock;
return fcntl(p, &fcntl_args, retval);
case LINUX_F_SETOWN:
case LINUX_F_GETOWN:
/*
* We need to route around the normal fcntl() for these calls,
* since it uses TIOC{G,S}PGRP, which is too restrictive for
* Linux F_{G,S}ETOWN semantics. For sockets, this problem
* does not exist.
*/
fdp = p->p_fd;
if ((u_int)args->fd >= fdp->fd_nfiles ||
(fp = fdp->fd_ofiles[args->fd]) == NULL)
return EBADF;
if (fp->f_type == DTYPE_SOCKET) {
fcntl_args.cmd = args->cmd == LINUX_F_SETOWN ? F_SETOWN : F_GETOWN;
return fcntl(p, &fcntl_args, retval);
}
vp = (struct vnode *)fp->f_data;
if (vp->v_type != VCHR)
return EINVAL;
if ((error = VOP_GETATTR(vp, &va, p->p_ucred, p)))
return error;
d_tty = cdevsw[major(va.va_rdev)]->d_devtotty;
if (!d_tty || (!(tp = (*d_tty)(va.va_rdev))))
return EINVAL;
if (args->cmd == LINUX_F_GETOWN) {
retval[0] = tp->t_pgrp ? tp->t_pgrp->pg_id : NO_PID;
return 0;
}
if ((long)args->arg <= 0) {
pgid = -(long)args->arg;
} else {
struct proc *p1 = pfind((long)args->arg);
if (p1 == 0)
return (ESRCH);
pgid = (long)p1->p_pgrp->pg_id;
}
pgrp = pgfind(pgid);
if (pgrp == NULL || pgrp->pg_session != p->p_session)
return EPERM;
tp->t_pgrp = pgrp;
return 0;
}
return EINVAL;
}
int
linux_lseek(struct proc *p, struct linux_lseek_args *args, int *retval)
{
struct lseek_args /* {
int fd;
int pad;
off_t offset;
int whence;
} */ tmp_args;
int error;
#ifdef DEBUG
printf("Linux-emul(%d): lseek(%d, %d, %d)\n",
p->p_pid, args->fdes, args->off, args->whence);
#endif
tmp_args.fd = args->fdes;
tmp_args.offset = (off_t)args->off;
tmp_args.whence = args->whence;
error = lseek(p, &tmp_args, retval);
return error;
}
int
linux_llseek(struct proc *p, struct linux_llseek_args *args, int *retval)
{
struct lseek_args bsd_args;
int error;
off_t off;
#ifdef DEBUG
printf("Linux-emul(%d): llseek(%d, %d:%d, %d)\n",
p->p_pid, args->fd, args->ohigh, args->olow, args->whence);
#endif
off = (args->olow) | (((off_t) args->ohigh) << 32);
bsd_args.fd = args->fd;
bsd_args.offset = off;
bsd_args.whence = args->whence;
if ((error = lseek(p, &bsd_args, retval)))
return error;
if ((error = copyout(retval, (caddr_t)args->res, sizeof (off_t))))
return error;
retval[0] = 0;
return 0;
}
struct linux_dirent {
long dino;
linux_off_t doff;
unsigned short dreclen;
char dname[LINUX_NAME_MAX + 1];
};
#define LINUX_RECLEN(de,namlen) \
ALIGN((((char *)&(de)->dname - (char *)de) + (namlen) + 1))
int
linux_readdir(struct proc *p, struct linux_readdir_args *args, int *retval)
{
struct linux_getdents_args lda;
lda.fd = args->fd;
lda.dent = args->dent;
lda.count = 1;
return linux_getdents(p, &lda, retval);
}
int
linux_getdents(struct proc *p, struct linux_getdents_args *args, int *retval)
{
register struct dirent *bdp;
struct vnode *vp;
caddr_t inp, buf; /* BSD-format */
int len, reclen; /* BSD-format */
caddr_t outp; /* Linux-format */
int resid, linuxreclen=0; /* Linux-format */
struct file *fp;
struct uio auio;
struct iovec aiov;
struct vattr va;
off_t off;
struct linux_dirent linux_dirent;
int buflen, error, eofflag, nbytes, justone;
u_long *cookies = NULL, *cookiep;
int ncookies;
#ifdef DEBUG
printf("Linux-emul(%d): getdents(%d, *, %d)\n",
p->p_pid, args->fd, args->count);
#endif
if ((error = getvnode(p->p_fd, args->fd, &fp)) != 0) {
return (error);
}
if ((fp->f_flag & FREAD) == 0)
return (EBADF);
vp = (struct vnode *) fp->f_data;
if (vp->v_type != VDIR)
return (EINVAL);
if ((error = VOP_GETATTR(vp, &va, p->p_ucred, p))) {
return error;
}
nbytes = args->count;
if (nbytes == 1) {
nbytes = sizeof (struct linux_dirent);
justone = 1;
}
else
justone = 0;
off = fp->f_offset;
buflen = max(DIRBLKSIZ, nbytes);
buflen = min(buflen, MAXBSIZE);
buf = malloc(buflen, M_TEMP, M_WAITOK);
vn_lock(vp, LK_EXCLUSIVE | LK_RETRY, p);
again:
aiov.iov_base = buf;
aiov.iov_len = buflen;
auio.uio_iov = &aiov;
auio.uio_iovcnt = 1;
auio.uio_rw = UIO_READ;
auio.uio_segflg = UIO_SYSSPACE;
auio.uio_procp = p;
auio.uio_resid = buflen;
auio.uio_offset = off;
if (cookies) {
free(cookies, M_TEMP);
cookies = NULL;
}
error = VOP_READDIR(vp, &auio, fp->f_cred, &eofflag, &ncookies, &cookies);
if (error) {
goto out;
}
inp = buf;
outp = (caddr_t) args->dent;
resid = nbytes;
if ((len = buflen - auio.uio_resid) <= 0) {
goto eof;
}
cookiep = cookies;
if (cookies) {
/*
* When using cookies, the vfs has the option of reading from
* a different offset than that supplied (UFS truncates the
* offset to a block boundary to make sure that it never reads
* partway through a directory entry, even if the directory
* has been compacted).
*/
while (len > 0 && ncookies > 0 && *cookiep <= off) {
bdp = (struct dirent *) inp;
len -= bdp->d_reclen;
inp += bdp->d_reclen;
cookiep++;
ncookies--;
}
}
while (len > 0) {
if (cookiep && ncookies == 0)
break;
bdp = (struct dirent *) inp;
reclen = bdp->d_reclen;
if (reclen & 3) {
printf("linux_readdir: reclen=%d\n", reclen);
error = EFAULT;
goto out;
}
if (bdp->d_fileno == 0) {
inp += reclen;
if (cookiep) {
off = *cookiep++;
ncookies--;
} else
off += reclen;
len -= reclen;
continue;
}
linuxreclen = LINUX_RECLEN(&linux_dirent, bdp->d_namlen);
if (reclen > len || resid < linuxreclen) {
outp++;
break;
}
linux_dirent.dino = (long) bdp->d_fileno;
if (justone) {
/*
* old linux-style readdir usage.
*/
linux_dirent.doff = (linux_off_t) linuxreclen;
linux_dirent.dreclen = (u_short) bdp->d_namlen;
} else {
linux_dirent.doff = (linux_off_t) off;
linux_dirent.dreclen = (u_short) linuxreclen;
}
strcpy(linux_dirent.dname, bdp->d_name);
if ((error = copyout((caddr_t)&linux_dirent, outp, linuxreclen))) {
goto out;
}
inp += reclen;
if (cookiep) {
off = *cookiep++;
ncookies--;
} else
off += reclen;
outp += linuxreclen;
resid -= linuxreclen;
len -= reclen;
if (justone)
break;
}
if (outp == (caddr_t) args->dent)
goto again;
fp->f_offset = off;
if (justone)
nbytes = resid + linuxreclen;
eof:
*retval = nbytes - resid;
out:
if (cookies)
free(cookies, M_TEMP);
VOP_UNLOCK(vp, 0, p);
free(buf, M_TEMP);
return error;
}
/*
* These exist mainly for hooks for doing /compat/linux translation.
*/
int
linux_access(struct proc *p, struct linux_access_args *args, int *retval)
{
struct access_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): access(%s, %d)\n",
p->p_pid, args->path, args->flags);
#endif
bsd.path = args->path;
bsd.flags = args->flags;
return access(p, &bsd, retval);
}
int
linux_unlink(struct proc *p, struct linux_unlink_args *args, int *retval)
{
struct unlink_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): unlink(%s)\n",
p->p_pid, args->path);
#endif
bsd.path = args->path;
return unlink(p, &bsd, retval);
}
int
linux_chdir(struct proc *p, struct linux_chdir_args *args, int *retval)
{
struct chdir_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): chdir(%s)\n",
p->p_pid, args->path);
#endif
bsd.path = args->path;
return chdir(p, &bsd, retval);
}
int
linux_chmod(struct proc *p, struct linux_chmod_args *args, int *retval)
{
struct chmod_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): chmod(%s, %d)\n",
p->p_pid, args->path, args->mode);
#endif
bsd.path = args->path;
bsd.mode = args->mode;
return chmod(p, &bsd, retval);
}
int
linux_chown(struct proc *p, struct linux_chown_args *args, int *retval)
{
struct chown_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): chown(%s, %d, %d)\n",
p->p_pid, args->path, args->uid, args->gid);
#endif
bsd.path = args->path;
/* XXX size casts here */
bsd.uid = args->uid;
bsd.gid = args->gid;
return chown(p, &bsd, retval);
}
int
linux_mkdir(struct proc *p, struct linux_mkdir_args *args, int *retval)
{
struct mkdir_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTCREAT(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): mkdir(%s, %d)\n",
p->p_pid, args->path, args->mode);
#endif
bsd.path = args->path;
bsd.mode = args->mode;
return mkdir(p, &bsd, retval);
}
int
linux_rmdir(struct proc *p, struct linux_rmdir_args *args, int *retval)
{
struct rmdir_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): rmdir(%s)\n",
p->p_pid, args->path);
#endif
bsd.path = args->path;
return rmdir(p, &bsd, retval);
}
int
linux_rename(struct proc *p, struct linux_rename_args *args, int *retval)
{
struct rename_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->from);
CHECKALTCREAT(p, &sg, args->to);
#ifdef DEBUG
printf("Linux-emul(%d): rename(%s, %s)\n",
p->p_pid, args->from, args->to);
#endif
bsd.from = args->from;
bsd.to = args->to;
return rename(p, &bsd, retval);
}
int
linux_symlink(struct proc *p, struct linux_symlink_args *args, int *retval)
{
struct symlink_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->path);
CHECKALTCREAT(p, &sg, args->to);
#ifdef DEBUG
printf("Linux-emul(%d): symlink(%s, %s)\n",
p->p_pid, args->path, args->to);
#endif
bsd.path = args->path;
bsd.link = args->to;
return symlink(p, &bsd, retval);
}
int
linux_execve(struct proc *p, struct linux_execve_args *args, int *retval)
{
struct execve_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): execve(%s)\n",
p->p_pid, args->path);
#endif
bsd.fname = args->path;
bsd.argv = args->argp;
bsd.envv = args->envp;
return execve(p, &bsd, retval);
}
int
linux_readlink(struct proc *p, struct linux_readlink_args *args, int *retval)
{
struct readlink_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->name);
#ifdef DEBUG
printf("Linux-emul(%d): readlink(%s, 0x%x, %d)\n",
p->p_pid, args->name, args->buf, args->count);
#endif
bsd.path = args->name;
bsd.buf = args->buf;
bsd.count = args->count;
return readlink(p, &bsd, retval);
}
int
linux_truncate(struct proc *p, struct linux_truncate_args *args, int *retval)
{
struct otruncate_args bsd;
caddr_t sg;
sg = stackgap_init();
CHECKALTEXIST(p, &sg, args->path);
#ifdef DEBUG
printf("Linux-emul(%d): truncate(%s)\n",
p->p_pid, args->path);
#endif
bsd.path = args->path;
return otruncate(p, &bsd, retval);
}