/* * 32bit Socket syscall emulation. Based on arch/sparc64/kernel/sys_sparc32.c. * * Copyright (C) 2000 VA Linux Co * Copyright (C) 2000 Don Dugger * Copyright (C) 1999 Arun Sharma * Copyright (C) 1997,1998 Jakub Jelinek (jj@sunsite.mff.cuni.cz) * Copyright (C) 1997 David S. Miller (davem@caip.rutgers.edu) * Copyright (C) 2000 Hewlett-Packard Co. * Copyright (C) 2000 David Mosberger-Tang * Copyright (C) 2000,2001 Andi Kleen, SuSE Labs */ #include #include #include #include #include #include #include #include #include #include #include #include #include #include #define A(__x) ((unsigned long)(__x)) #define AA(__x) ((unsigned long)(__x)) extern asmlinkage long sys_getsockopt(int fd, int level, int optname, void * optval, int *optlen); static inline int iov_from_user_compat_to_kern(struct iovec *kiov, struct compat_iovec *uiov32, int niov) { int tot_len = 0; while(niov > 0) { u32 len, buf; if(get_user(len, &uiov32->iov_len) || get_user(buf, &uiov32->iov_base)) { tot_len = -EFAULT; break; } tot_len += len; kiov->iov_base = (void *)A(buf); kiov->iov_len = (__kernel_size_t) len; uiov32++; kiov++; niov--; } return tot_len; } int msghdr_from_user_compat_to_kern(struct msghdr *kmsg, struct compat_msghdr *umsg) { u32 tmp1, tmp2, tmp3; int err; err = get_user(tmp1, &umsg->msg_name); err |= __get_user(tmp2, &umsg->msg_iov); err |= __get_user(tmp3, &umsg->msg_control); if (err) return -EFAULT; kmsg->msg_name = (void *)A(tmp1); kmsg->msg_iov = (struct iovec *)A(tmp2); kmsg->msg_control = (void *)A(tmp3); err = get_user(kmsg->msg_namelen, &umsg->msg_namelen); err |= get_user(kmsg->msg_iovlen, &umsg->msg_iovlen); err |= get_user(kmsg->msg_controllen, &umsg->msg_controllen); err |= get_user(kmsg->msg_flags, &umsg->msg_flags); return err; } /* I've named the args so it is easy to tell whose space the pointers are in. */ int verify_compat_iovec(struct msghdr *kern_msg, struct iovec *kern_iov, char *kern_address, int mode) { int tot_len; if(kern_msg->msg_namelen) { if(mode==VERIFY_READ) { int err = move_addr_to_kernel(kern_msg->msg_name, kern_msg->msg_namelen, kern_address); if(err < 0) return err; } kern_msg->msg_name = kern_address; } else kern_msg->msg_name = NULL; if(kern_msg->msg_iovlen > UIO_FASTIOV) { kern_iov = kmalloc(kern_msg->msg_iovlen * sizeof(struct iovec), GFP_KERNEL); if(!kern_iov) return -ENOMEM; } tot_len = iov_from_user_compat_to_kern(kern_iov, (struct compat_iovec *)kern_msg->msg_iov, kern_msg->msg_iovlen); if(tot_len >= 0) kern_msg->msg_iov = kern_iov; else if(kern_msg->msg_iovlen > UIO_FASTIOV) kfree(kern_iov); return tot_len; } /* There is a lot of hair here because the alignment rules (and * thus placement) of cmsg headers and length are different for * 32-bit apps. -DaveM */ int cmsghdr_from_user_compat_to_kern(struct msghdr *kmsg, unsigned char *stackbuf, int stackbuf_size) { struct compat_cmsghdr *ucmsg; struct cmsghdr *kcmsg, *kcmsg_base; compat_size_t ucmlen; __kernel_size_t kcmlen, tmp; kcmlen = 0; kcmsg_base = kcmsg = (struct cmsghdr *)stackbuf; ucmsg = CMSG_COMPAT_FIRSTHDR(kmsg); while(ucmsg != NULL) { if(get_user(ucmlen, &ucmsg->cmsg_len)) return -EFAULT; /* Catch bogons. */ if(CMSG_COMPAT_ALIGN(ucmlen) < CMSG_COMPAT_ALIGN(sizeof(struct compat_cmsghdr))) return -EINVAL; if((unsigned long)(((char *)ucmsg - (char *)kmsg->msg_control) + ucmlen) > kmsg->msg_controllen) return -EINVAL; tmp = ((ucmlen - CMSG_COMPAT_ALIGN(sizeof(*ucmsg))) + CMSG_ALIGN(sizeof(struct cmsghdr))); kcmlen += tmp; ucmsg = CMSG_COMPAT_NXTHDR(kmsg, ucmsg, ucmlen); } if(kcmlen == 0) return -EINVAL; /* The kcmlen holds the 64-bit version of the control length. * It may not be modified as we do not stick it into the kmsg * until we have successfully copied over all of the data * from the user. */ if(kcmlen > stackbuf_size) kcmsg_base = kcmsg = kmalloc(kcmlen, GFP_KERNEL); if(kcmsg == NULL) return -ENOBUFS; /* Now copy them over neatly. */ memset(kcmsg, 0, kcmlen); ucmsg = CMSG_COMPAT_FIRSTHDR(kmsg); while(ucmsg != NULL) { __get_user(ucmlen, &ucmsg->cmsg_len); tmp = ((ucmlen - CMSG_COMPAT_ALIGN(sizeof(*ucmsg))) + CMSG_ALIGN(sizeof(struct cmsghdr))); kcmsg->cmsg_len = tmp; __get_user(kcmsg->cmsg_level, &ucmsg->cmsg_level); __get_user(kcmsg->cmsg_type, &ucmsg->cmsg_type); /* Copy over the data. */ if(copy_from_user(CMSG_DATA(kcmsg), CMSG_COMPAT_DATA(ucmsg), (ucmlen - CMSG_COMPAT_ALIGN(sizeof(*ucmsg))))) goto out_free_efault; /* Advance. */ kcmsg = (struct cmsghdr *)((char *)kcmsg + CMSG_ALIGN(tmp)); ucmsg = CMSG_COMPAT_NXTHDR(kmsg, ucmsg, ucmlen); } /* Ok, looks like we made it. Hook it up and return success. */ kmsg->msg_control = kcmsg_base; kmsg->msg_controllen = kcmlen; return 0; out_free_efault: if(kcmsg_base != (struct cmsghdr *)stackbuf) kfree(kcmsg_base); return -EFAULT; } int put_cmsg_compat(struct msghdr *kmsg, int level, int type, int len, void *data) { struct compat_cmsghdr *cm = (struct compat_cmsghdr *) kmsg->msg_control; struct compat_cmsghdr cmhdr; int cmlen = CMSG_COMPAT_LEN(len); if(cm == NULL || kmsg->msg_controllen < sizeof(*cm)) { kmsg->msg_flags |= MSG_CTRUNC; return 0; /* XXX: return error? check spec. */ } if(kmsg->msg_controllen < cmlen) { kmsg->msg_flags |= MSG_CTRUNC; cmlen = kmsg->msg_controllen; } cmhdr.cmsg_level = level; cmhdr.cmsg_type = type; cmhdr.cmsg_len = cmlen; if(copy_to_user(cm, &cmhdr, sizeof cmhdr)) return -EFAULT; if(copy_to_user(CMSG_COMPAT_DATA(cm), data, cmlen - sizeof(struct compat_cmsghdr))) return -EFAULT; cmlen = CMSG_COMPAT_SPACE(len); kmsg->msg_control += cmlen; kmsg->msg_controllen -= cmlen; return 0; } void scm_detach_fds_compat(struct msghdr *kmsg, struct scm_cookie *scm) { struct compat_cmsghdr *cm = (struct compat_cmsghdr *) kmsg->msg_control; int fdmax = (kmsg->msg_controllen - sizeof(struct compat_cmsghdr)) / sizeof(int); int fdnum = scm->fp->count; struct file **fp = scm->fp->fp; int *cmfptr; int err = 0, i; if (fdnum < fdmax) fdmax = fdnum; for (i = 0, cmfptr = (int *) CMSG_COMPAT_DATA(cm); i < fdmax; i++, cmfptr++) { int new_fd; err = get_unused_fd(); if (err < 0) break; new_fd = err; err = put_user(new_fd, cmfptr); if (err) { put_unused_fd(new_fd); break; } /* Bump the usage count and install the file. */ get_file(fp[i]); fd_install(new_fd, fp[i]); } if (i > 0) { int cmlen = CMSG_COMPAT_LEN(i * sizeof(int)); if (!err) err = put_user(SOL_SOCKET, &cm->cmsg_level); if (!err) err = put_user(SCM_RIGHTS, &cm->cmsg_type); if (!err) err = put_user(cmlen, &cm->cmsg_len); if (!err) { cmlen = CMSG_COMPAT_SPACE(i * sizeof(int)); kmsg->msg_control += cmlen; kmsg->msg_controllen -= cmlen; } } if (i < fdnum) kmsg->msg_flags |= MSG_CTRUNC; /* * All of the files that fit in the message have had their * usage counts incremented, so we just free the list. */ __scm_destroy(scm); } /* In these cases we (currently) can just copy to data over verbatim * because all CMSGs created by the kernel have well defined types which * have the same layout in both the 32-bit and 64-bit API. One must add * some special cased conversions here if we start sending control messages * with incompatible types. * * SCM_RIGHTS and SCM_CREDENTIALS are done by hand in recvmsg_compat right after * we do our work. The remaining cases are: * * SOL_IP IP_PKTINFO struct in_pktinfo 32-bit clean * IP_TTL int 32-bit clean * IP_TOS __u8 32-bit clean * IP_RECVOPTS variable length 32-bit clean * IP_RETOPTS variable length 32-bit clean * (these last two are clean because the types are defined * by the IPv4 protocol) * IP_RECVERR struct sock_extended_err + * struct sockaddr_in 32-bit clean * SOL_IPV6 IPV6_RECVERR struct sock_extended_err + * struct sockaddr_in6 32-bit clean * IPV6_PKTINFO struct in6_pktinfo 32-bit clean * IPV6_HOPLIMIT int 32-bit clean * IPV6_FLOWINFO u32 32-bit clean * IPV6_HOPOPTS ipv6 hop exthdr 32-bit clean * IPV6_DSTOPTS ipv6 dst exthdr(s) 32-bit clean * IPV6_RTHDR ipv6 routing exthdr 32-bit clean * IPV6_AUTHHDR ipv6 auth exthdr 32-bit clean */ void cmsg_compat_recvmsg_fixup(struct msghdr *kmsg, unsigned long orig_cmsg_uptr) { unsigned char *workbuf, *wp; unsigned long bufsz, space_avail; struct cmsghdr *ucmsg; bufsz = ((unsigned long)kmsg->msg_control) - orig_cmsg_uptr; space_avail = kmsg->msg_controllen + bufsz; wp = workbuf = kmalloc(bufsz, GFP_KERNEL); if(workbuf == NULL) goto fail; /* To make this more sane we assume the kernel sends back properly * formatted control messages. Because of how the kernel will truncate * the cmsg_len for MSG_TRUNC cases, we need not check that case either. */ ucmsg = (struct cmsghdr *) orig_cmsg_uptr; while(((unsigned long)ucmsg) <= (((unsigned long)kmsg->msg_control) - sizeof(struct cmsghdr))) { struct compat_cmsghdr *kcmsg_compat = (struct compat_cmsghdr *) wp; int clen64, clen32; /* UCMSG is the 64-bit format CMSG entry in user-space. * KCMSG_COMPAT is within the kernel space temporary buffer * we use to convert into a 32-bit style CMSG. */ __get_user(kcmsg_compat->cmsg_len, &ucmsg->cmsg_len); __get_user(kcmsg_compat->cmsg_level, &ucmsg->cmsg_level); __get_user(kcmsg_compat->cmsg_type, &ucmsg->cmsg_type); clen64 = kcmsg_compat->cmsg_len; copy_from_user(CMSG_COMPAT_DATA(kcmsg_compat), CMSG_DATA(ucmsg), clen64 - CMSG_ALIGN(sizeof(*ucmsg))); clen32 = ((clen64 - CMSG_ALIGN(sizeof(*ucmsg))) + CMSG_COMPAT_ALIGN(sizeof(struct compat_cmsghdr))); kcmsg_compat->cmsg_len = clen32; ucmsg = (struct cmsghdr *) (((char *)ucmsg) + CMSG_ALIGN(clen64)); wp = (((char *)kcmsg_compat) + CMSG_COMPAT_ALIGN(clen32)); } /* Copy back fixed up data, and adjust pointers. */ bufsz = (wp - workbuf); copy_to_user((void *)orig_cmsg_uptr, workbuf, bufsz); kmsg->msg_control = (struct cmsghdr *) (((char *)orig_cmsg_uptr) + bufsz); kmsg->msg_controllen = space_avail - bufsz; kfree(workbuf); return; fail: /* If we leave the 64-bit format CMSG chunks in there, * the application could get confused and crash. So to * ensure greater recovery, we report no CMSGs. */ kmsg->msg_controllen += bufsz; kmsg->msg_control = (void *) orig_cmsg_uptr; } extern asmlinkage int sys_setsockopt(int fd, int level, int optname, char *optval, int optlen); static int do_netfilter_replace(int fd, int level, int optname, char *optval, int optlen) { struct ipt_replace32 { char name[IPT_TABLE_MAXNAMELEN]; __u32 valid_hooks; __u32 num_entries; __u32 size; __u32 hook_entry[NF_IP_NUMHOOKS]; __u32 underflow[NF_IP_NUMHOOKS]; __u32 num_counters; __u32 counters; struct ipt_entry entries[0]; } *repl32 = (struct ipt_replace32 *)optval; struct ipt_replace *krepl; struct ipt_counters *counters32; __u32 origsize; unsigned int kreplsize, kcountersize; mm_segment_t old_fs; int ret; if (optlen < sizeof(repl32)) return -EINVAL; if (copy_from_user(&origsize, &repl32->size, sizeof(origsize))) return -EFAULT; kreplsize = sizeof(*krepl) + origsize; kcountersize = krepl->num_counters * sizeof(struct ipt_counters); /* Hack: Causes ipchains to give correct error msg --RR */ if (optlen != kreplsize) return -ENOPROTOOPT; krepl = (struct ipt_replace *)kmalloc(kreplsize, GFP_KERNEL); if (krepl == NULL) return -ENOMEM; if (copy_from_user(krepl, optval, kreplsize)) { kfree(krepl); return -EFAULT; } counters32 = (struct ipt_counters *)AA( ((struct ipt_replace32 *)krepl)->counters); kcountersize = krepl->num_counters * sizeof(struct ipt_counters); krepl->counters = (struct ipt_counters *)kmalloc( kcountersize, GFP_KERNEL); if (krepl->counters == NULL) { kfree(krepl); return -ENOMEM; } old_fs = get_fs(); set_fs(KERNEL_DS); ret = sys_setsockopt(fd, level, optname, (char *)krepl, kreplsize); set_fs(old_fs); if (ret == 0 && copy_to_user(counters32, krepl->counters, kcountersize)) ret = -EFAULT; kfree(krepl->counters); kfree(krepl); return ret; } static int do_set_attach_filter(int fd, int level, int optname, char *optval, int optlen) { struct sock_fprog32 { __u16 len; __u32 filter; } *fprog32 = (struct sock_fprog32 *)optval; struct sock_fprog kfprog; struct sock_filter *kfilter; unsigned int fsize; mm_segment_t old_fs; __u32 uptr; int ret; if (get_user(kfprog.len, &fprog32->len) || __get_user(uptr, &fprog32->filter)) return -EFAULT; kfprog.filter = (struct sock_filter *)A(uptr); fsize = kfprog.len * sizeof(struct sock_filter); kfilter = (struct sock_filter *)kmalloc(fsize, GFP_KERNEL); if (kfilter == NULL) return -ENOMEM; if (copy_from_user(kfilter, kfprog.filter, fsize)) { kfree(kfilter); return -EFAULT; } kfprog.filter = kfilter; old_fs = get_fs(); set_fs(KERNEL_DS); ret = sys_setsockopt(fd, level, optname, (char *)&kfprog, sizeof(kfprog)); set_fs(old_fs); kfree(kfilter); return ret; } static int do_set_icmpv6_filter(int fd, int level, int optname, char *optval, int optlen) { struct icmp6_filter kfilter; mm_segment_t old_fs; int ret, i; if (copy_from_user(&kfilter, optval, sizeof(kfilter))) return -EFAULT; for (i = 0; i < 8; i += 2) { u32 tmp = kfilter.data[i]; kfilter.data[i] = kfilter.data[i + 1]; kfilter.data[i + 1] = tmp; } old_fs = get_fs(); set_fs(KERNEL_DS); ret = sys_setsockopt(fd, level, optname, (char *) &kfilter, sizeof(kfilter)); set_fs(old_fs); return ret; } static int do_set_sock_timeout(int fd, int level, int optname, char *optval, int optlen) { struct compat_timeval *up = (struct compat_timeval *) optval; struct timeval ktime; mm_segment_t old_fs; int err; if (optlen < sizeof(*up)) return -EINVAL; if (get_user(ktime.tv_sec, &up->tv_sec) || __get_user(ktime.tv_usec, &up->tv_usec)) return -EFAULT; old_fs = get_fs(); set_fs(KERNEL_DS); err = sys_setsockopt(fd, level, optname, (char *) &ktime, sizeof(ktime)); set_fs(old_fs); return err; } asmlinkage int compat_sys_setsockopt(int fd, int level, int optname, char *optval, int optlen) { if (optname == IPT_SO_SET_REPLACE) return do_netfilter_replace(fd, level, optname, optval, optlen); if (optname == SO_ATTACH_FILTER) return do_set_attach_filter(fd, level, optname, optval, optlen); if (optname == SO_RCVTIMEO || optname == SO_SNDTIMEO) return do_set_sock_timeout(fd, level, optname, optval, optlen); if (level == SOL_ICMPV6 && optname == ICMPV6_FILTER) return do_set_icmpv6_filter(fd, level, optname, optval, optlen); return sys_setsockopt(fd, level, optname, optval, optlen); } static int do_get_sock_timeout(int fd, int level, int optname, char *optval, int *optlen) { struct compat_timeval *up = (struct compat_timeval *) optval; struct timeval ktime; mm_segment_t old_fs; int len, err; if (get_user(len, optlen)) return -EFAULT; if (len < sizeof(*up)) return -EINVAL; len = sizeof(ktime); old_fs = get_fs(); set_fs(KERNEL_DS); err = sys_getsockopt(fd, level, optname, (char *) &ktime, &len); set_fs(old_fs); if (!err) { if (put_user(sizeof(*up), optlen) || put_user(ktime.tv_sec, &up->tv_sec) || __put_user(ktime.tv_usec, &up->tv_usec)) err = -EFAULT; } return err; } asmlinkage long compat_sys_getsockopt(int fd, int level, int optname, char *optval, int *optlen) { if (optname == SO_RCVTIMEO || optname == SO_SNDTIMEO) return do_get_sock_timeout(fd, level, optname, optval, optlen); return sys_getsockopt(fd, level, optname, optval, optlen); } /* Argument list sizes for compat_sys_socketcall */ #define AL(x) ((x) * sizeof(u32)) static unsigned char nas[18]={AL(0),AL(3),AL(3),AL(3),AL(2),AL(3), AL(3),AL(3),AL(4),AL(4),AL(4),AL(6), AL(6),AL(2),AL(5),AL(5),AL(3),AL(3)}; #undef AL extern asmlinkage long sys_bind(int fd, struct sockaddr *umyaddr, int addrlen); extern asmlinkage long sys_connect(int fd, struct sockaddr *uservaddr, int addrlen); extern asmlinkage long sys_accept(int fd, struct sockaddr *upeer_sockaddr, int *upeer_addrlen); extern asmlinkage long sys_getsockname(int fd, struct sockaddr *usockaddr, int *usockaddr_len); extern asmlinkage long sys_getpeername(int fd, struct sockaddr *usockaddr, int *usockaddr_len); extern asmlinkage long sys_send(int fd, void *buff, size_t len, unsigned flags); extern asmlinkage long sys_sendto(int fd, u32 buff, compat_size_t len, unsigned flags, u32 addr, int addr_len); extern asmlinkage long sys_recv(int fd, void *ubuf, size_t size, unsigned flags); extern asmlinkage long sys_recvfrom(int fd, u32 ubuf, compat_size_t size, unsigned flags, u32 addr, u32 addr_len); extern asmlinkage long sys_socket(int family, int type, int protocol); extern asmlinkage long sys_socketpair(int family, int type, int protocol, int usockvec[2]); extern asmlinkage long sys_shutdown(int fd, int how); extern asmlinkage long sys_listen(int fd, int backlog); asmlinkage long compat_sys_sendmsg(int fd, struct compat_msghdr *msg, unsigned flags) { return sys_sendmsg(fd, (struct msghdr *)msg, flags | MSG_CMSG_COMPAT); } asmlinkage long compat_sys_recvmsg(int fd, struct compat_msghdr *msg, unsigned int flags) { return sys_recvmsg(fd, (struct msghdr *)msg, flags | MSG_CMSG_COMPAT); } asmlinkage long compat_sys_socketcall(int call, u32 *args) { int ret; u32 a[6]; u32 a0, a1; if (call < SYS_SOCKET || call > SYS_RECVMSG) return -EINVAL; if (copy_from_user(a, args, nas[call])) return -EFAULT; a0 = a[0]; a1 = a[1]; switch(call) { case SYS_SOCKET: ret = sys_socket(a0, a1, a[2]); break; case SYS_BIND: ret = sys_bind(a0, (struct sockaddr *)A(a1), a[2]); break; case SYS_CONNECT: ret = sys_connect(a0, (struct sockaddr *)A(a1), a[2]); break; case SYS_LISTEN: ret = sys_listen(a0, a1); break; case SYS_ACCEPT: ret = sys_accept(a0, (struct sockaddr *)A(a1), (int *)A(a[2])); break; case SYS_GETSOCKNAME: ret = sys_getsockname(a0, (struct sockaddr *)A(a1), (int *)A(a[2])); break; case SYS_GETPEERNAME: ret = sys_getpeername(a0, (struct sockaddr *)A(a1), (int *)A(a[2])); break; case SYS_SOCKETPAIR: ret = sys_socketpair(a0, a1, a[2], (int *)A(a[3])); break; case SYS_SEND: ret = sys_send(a0, (void *)A(a1), a[2], a[3]); break; case SYS_SENDTO: ret = sys_sendto(a0, a1, a[2], a[3], a[4], a[5]); break; case SYS_RECV: ret = sys_recv(a0, (void *)A(a1), a[2], a[3]); break; case SYS_RECVFROM: ret = sys_recvfrom(a0, a1, a[2], a[3], a[4], a[5]); break; case SYS_SHUTDOWN: ret = sys_shutdown(a0,a1); break; case SYS_SETSOCKOPT: ret = compat_sys_setsockopt(a0, a1, a[2], (char *)A(a[3]), a[4]); break; case SYS_GETSOCKOPT: ret = compat_sys_getsockopt(a0, a1, a[2], (char *)(u64)a[3], (int *)(u64)a[4]); break; case SYS_SENDMSG: ret = compat_sys_sendmsg(a0, (struct compat_msghdr *)A(a1), a[2]); break; case SYS_RECVMSG: ret = compat_sys_recvmsg(a0, (struct compat_msghdr *)A(a1), a[2]); break; default: ret = -EINVAL; break; } return ret; }