4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
20 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
21 * CA 95054 USA or visit www.sun.com if you need additional information or
27 * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
28 * Use is subject to license terms.
30 * Copyright (c) 2012, Intel Corporation.
33 * This file is part of Lustre, http://www.lustre.org/
34 * Lustre is a trademark of Sun Microsystems, Inc.
36 #define DEBUG_SUBSYSTEM S_LNET
38 #include <libcfs/libcfs.h>
39 #include <libcfs/libcfs.h>
43 #include <linux/file.h>
44 /* For sys_open & sys_close */
45 #include <linux/syscalls.h>
/*
 * sk_sleep(): takes a struct sock and yields a wait_queue_head_t pointer.
 * Callers in this file pass sock->sk and use the result with
 * add_wait_queue(), remove_wait_queue() and wake_up_all().
 * NOTE(review): only the signature is visible here; the body is not shown.
 */
48 static inline wait_queue_head_t *sk_sleep(struct sock *sk)
/*
 * libcfs_sock_ioctl(): issue ioctl cmd with argument arg on a
 * PF_INET/SOCK_STREAM socket that is created inside this function.
 *
 * The socket is attached to a struct file (through sock_map_fd() or
 * sock_alloc_file(), selected at build time) and the request goes through
 * that file's unlocked_ioctl handler when one is set.
 *
 * NOTE(review): cleanup of the socket/file, any set_fs() switching and the
 * return statement are not visible in this excerpt; presumably rc is
 * returned -- confirm against the full function.
 */
55 libcfs_sock_ioctl(int cmd, unsigned long arg)
/* current address limit as reported by get_fs() */
57 mm_segment_t oldmm = get_fs();
61 struct file *sock_filp;
63 rc = sock_create (PF_INET, SOCK_STREAM, 0, &sock);
65 CERROR ("Can't create socket: %d\n", rc);
/* build without sock_alloc_file(): map the socket to a file descriptor */
69 #if !defined(HAVE_SOCK_ALLOC_FILE) && !defined(HAVE_SOCK_ALLOC_FILE_3ARGS)
70 fd = sock_map_fd(sock, 0);
/* build with sock_alloc_file(): some kernels take a third argument */
78 # ifdef HAVE_SOCK_ALLOC_FILE_3ARGS
79 sock_filp = sock_alloc_file(sock, 0, NULL);
81 sock_filp = sock_alloc_file(sock, 0);
/* dispatch only when the file operations provide unlocked_ioctl */
91 if (sock_filp->f_op->unlocked_ioctl)
92 rc = sock_filp->f_op->unlocked_ioctl(sock_filp, cmd, arg);
/*
 * libcfs_ipif_query(): look up interface name through libcfs_sock_ioctl().
 *
 * Three requests are made in order: SIOCGIFFLAGS (flags, tested for IFF_UP),
 * SIOCGIFADDR (IPv4 address) and SIOCGIFNETMASK (IPv4 netmask).  Each
 * failure is logged with CERROR.
 *
 * NOTE(review): the stores through up, ip and mask, the byte-order
 * conversion of val and the return statements are not visible in this
 * excerpt; presumably the results are handed back through those pointers.
 */
105 libcfs_ipif_query (char *name, int *up, __u32 *ip, __u32 *mask)
/* a name of IFNAMSIZ or more characters is reported as too long */
112 nob = strnlen(name, IFNAMSIZ);
113 if (nob == IFNAMSIZ) {
114 CERROR("Interface name %s too long\n", name);
/* build-time check that ifr_name can hold IFNAMSIZ bytes */
118 CLASSERT (sizeof(ifr.ifr_name) >= IFNAMSIZ);
/* ifr_name is refilled, with a length check, before every ioctl below */
120 if (strlen(name) > sizeof(ifr.ifr_name)-1)
122 strncpy(ifr.ifr_name, name, sizeof(ifr.ifr_name));
/* step 1: interface flags */
124 rc = libcfs_sock_ioctl(SIOCGIFFLAGS, (unsigned long)&ifr);
127 CERROR("Can't get flags for interface %s\n", name);
/* interface is not up: logged at D_NET level (follow-up action not visible) */
131 if ((ifr.ifr_flags & IFF_UP) == 0) {
132 CDEBUG(D_NET, "Interface %s down\n", name);
/* step 2: IPv4 address */
140 if (strlen(name) > sizeof(ifr.ifr_name)-1)
142 strncpy(ifr.ifr_name, name, sizeof(ifr.ifr_name));
144 ifr.ifr_addr.sa_family = AF_INET;
145 rc = libcfs_sock_ioctl(SIOCGIFADDR, (unsigned long)&ifr);
148 CERROR("Can't get IP address for interface %s\n", name);
/* raw s_addr as filled in by the ioctl */
152 val = ((struct sockaddr_in *)&ifr.ifr_addr)->sin_addr.s_addr;
/* step 3: IPv4 netmask */
155 if (strlen(name) > sizeof(ifr.ifr_name)-1)
157 strncpy(ifr.ifr_name, name, sizeof(ifr.ifr_name));
159 ifr.ifr_addr.sa_family = AF_INET;
160 rc = libcfs_sock_ioctl(SIOCGIFNETMASK, (unsigned long)&ifr);
163 CERROR("Can't get netmask for interface %s\n", name);
167 val = ((struct sockaddr_in *)&ifr.ifr_netmask)->sin_addr.s_addr;
173 EXPORT_SYMBOL(libcfs_ipif_query);
/*
 * libcfs_ipif_enumerate(): list interfaces with SIOCGIFCONF and build an
 * array of interface-name strings.
 *
 * The ifreq buffer starts with room for 16 entries and is capped at
 * PAGE_CACHE_SIZE bytes.  Every name string is allocated with IFNAMSIZ
 * bytes, which matches what libcfs_ipif_free_enumeration() frees.
 *
 * NOTE(review): the retry loop header, the growth of nalloc, the store
 * through namesp and the return statements are not visible in this excerpt.
 */
176 libcfs_ipif_enumerate (char ***namesp)
178 /* Allocate and fill in 'names', returning # interfaces/error */
190 nalloc = 16; /* first guess at max interfaces */
/* never ask for more than one page worth of ifreq entries */
193 if (nalloc * sizeof(*ifr) > PAGE_CACHE_SIZE) {
195 nalloc = PAGE_CACHE_SIZE/sizeof(*ifr);
196 CWARN("Too many interfaces: only enumerating first %d\n",
200 LIBCFS_ALLOC(ifr, nalloc * sizeof(*ifr));
202 CERROR ("ENOMEM enumerating up to %d interfaces\n", nalloc);
/* hand the ifreq array to SIOCGIFCONF as its output buffer */
207 ifc.ifc_buf = (char *)ifr;
208 ifc.ifc_len = nalloc * sizeof(*ifr);
210 rc = libcfs_sock_ioctl(SIOCGIFCONF, (unsigned long)&ifc);
213 CERROR ("Error %d enumerating interfaces\n", rc);
/* ifc_len now holds the number of bytes filled in */
219 nfound = ifc.ifc_len/sizeof(*ifr);
220 LASSERT (nfound <= nalloc);
/* buffer not full, or already capped: presumably stop retrying here */
222 if (nfound < nalloc || toobig)
/* presumably frees the buffer before a retry with a larger one */
225 LIBCFS_FREE(ifr, nalloc * sizeof(*ifr));
232 LIBCFS_ALLOC(names, nfound * sizeof(*names));
238 for (i = 0; i < nfound; i++) {
240 nob = strnlen (ifr[i].ifr_name, IFNAMSIZ);
241 if (nob == IFNAMSIZ) {
242 /* no space for terminating NUL */
243 CERROR("interface name %.*s too long (%d max)\n",
244 nob, ifr[i].ifr_name, IFNAMSIZ);
249 LIBCFS_ALLOC(names[i], IFNAMSIZ);
250 if (names[i] == NULL) {
/* copies nob bytes only; NOTE(review): termination of names[i] is not visible here */
255 memcpy(names[i], ifr[i].ifr_name, nob);
/* presumably the failure path: release whatever names were allocated */
264 libcfs_ipif_free_enumeration(names, nfound);
266 LIBCFS_FREE(ifr, nalloc * sizeof(*ifr));
271 EXPORT_SYMBOL(libcfs_ipif_enumerate);
/*
 * libcfs_ipif_free_enumeration(): free an array of n interface names.
 *
 * Entries are freed as IFNAMSIZ-byte allocations, stopping at the first
 * NULL entry (or after n entries); then the pointer array itself, sized
 * n * sizeof(*names), is freed.
 */
274 libcfs_ipif_free_enumeration (char **names, int n)
/* a NULL slot ends the walk, so a partially filled array can be passed */
280 for (i = 0; i < n && names[i] != NULL; i++)
281 LIBCFS_FREE(names[i], IFNAMSIZ);
283 LIBCFS_FREE(names, n * sizeof(*names));
286 EXPORT_SYMBOL(libcfs_ipif_free_enumeration);
/*
 * libcfs_sock_write(): send nob bytes starting at buffer on sock.
 *
 * timeout is multiplied by the number of jiffies in one second, i.e. it is
 * expressed in seconds.  A zero timeout makes the send non-blocking
 * (MSG_DONTWAIT).  Before sending, SO_SNDTIMEO is set to the time still
 * remaining; after sending, the elapsed jiffies are subtracted from the
 * remaining budget.  A zero result from kernel_sendmsg() is reported as
 * -ECONNABORTED.
 *
 * NOTE(review): the loop header, the iov setup, the set_fs() handling and
 * the remaining return statements are not visible in this excerpt.
 */
289 libcfs_sock_write (struct socket *sock, void *buffer, int nob, int timeout)
292 mm_segment_t oldmm = get_fs();
/* total time budget in jiffies */
293 long jiffies_left = timeout * msecs_to_jiffies(MSEC_PER_SEC);
298 /* Caller may pass a zero timeout if she thinks the socket buffer is
299 * empty enough to take the whole message immediately */
306 struct msghdr msg = {
307 .msg_flags = (timeout == 0) ? MSG_DONTWAIT : 0
311 /* Set send timeout to remaining time */
/* split the remaining jiffies into whole seconds and a sub-second part */
312 tv = (struct timeval) {
313 .tv_sec = jiffies_left /
314 msecs_to_jiffies(MSEC_PER_SEC),
315 .tv_usec = ((jiffies_left %
316 msecs_to_jiffies(MSEC_PER_SEC)) *
318 msecs_to_jiffies(MSEC_PER_SEC)
321 rc = sock_setsockopt(sock, SOL_SOCKET, SO_SNDTIMEO,
322 (char *)&tv, sizeof(tv));
325 CERROR("Can't set socket send timeout "
327 (long)tv.tv_sec, (int)tv.tv_usec, rc);
333 rc = kernel_sendmsg(sock, &msg, &iov, 1, nob);
/* charge the time spent in the send against the budget */
334 jiffies_left -= jiffies - then;
343 CERROR ("Unexpected zero rc\n");
344 return (-ECONNABORTED);
/* budget exhausted (resulting action not visible here) */
347 if (jiffies_left <= 0)
/* skip past the rc bytes just sent */
350 buffer = ((char *)buffer) + rc;
356 EXPORT_SYMBOL(libcfs_sock_write);
/*
 * libcfs_sock_read(): receive nob bytes into buffer from sock.
 *
 * timeout is multiplied by the number of jiffies in one second, i.e. it is
 * expressed in seconds, and must yield a positive budget (asserted).
 * Before receiving, SO_RCVTIMEO is set to the time still remaining; after
 * receiving, the elapsed jiffies are subtracted from the budget.
 *
 * NOTE(review): the loop header, the iov setup, the handling of rc, the
 * set_fs() handling and the return statements are not visible in this
 * excerpt.
 */
359 libcfs_sock_read (struct socket *sock, void *buffer, int nob, int timeout)
362 mm_segment_t oldmm = get_fs();
/* total time budget in jiffies */
363 long jiffies_left = timeout * msecs_to_jiffies(MSEC_PER_SEC);
/* unlike the write path, a zero timeout is not accepted here */
368 LASSERT(jiffies_left > 0);
375 struct msghdr msg = {
379 /* Set receive timeout to remaining time */
/* split the remaining jiffies into whole seconds and a sub-second part */
380 tv = (struct timeval) {
381 .tv_sec = jiffies_left / msecs_to_jiffies(MSEC_PER_SEC),
382 .tv_usec = ((jiffies_left %
383 msecs_to_jiffies(MSEC_PER_SEC)) *
385 msecs_to_jiffies(MSEC_PER_SEC)
388 rc = sock_setsockopt(sock, SOL_SOCKET, SO_RCVTIMEO,
389 (char *)&tv, sizeof(tv));
392 CERROR("Can't set socket recv timeout %ld.%06d: %d\n",
393 (long)tv.tv_sec, (int)tv.tv_usec, rc);
398 rc = kernel_recvmsg(sock, &msg, &iov, 1, nob, 0);
/* charge the time spent in the receive against the budget */
399 jiffies_left -= jiffies - then;
/* skip past the rc bytes just received */
407 buffer = ((char *)buffer) + rc;
/* budget exhausted (resulting action not visible here) */
413 if (jiffies_left <= 0)
418 EXPORT_SYMBOL(libcfs_sock_read);
/*
 * libcfs_sock_create(): create a PF_INET/SOCK_STREAM socket, set
 * SO_REUSEADDR on it and, when local_ip or local_port is non-zero, bind it.
 *
 * local_ip and local_port are converted with htonl()/htons() before use,
 * so they are taken in host byte order; a zero local_ip binds to
 * INADDR_ANY.  A bind failure of -EADDRINUSE is only logged at D_NET
 * level, other bind failures are logged with CERROR.
 *
 * NOTE(review): the stores through sockp and fatal, the cleanup path and
 * the return statements are not visible in this excerpt.
 */
421 libcfs_sock_create (struct socket **sockp, int *fatal,
422 __u32 local_ip, int local_port)
424 struct sockaddr_in locaddr;
428 mm_segment_t oldmm = get_fs();
430 /* All errors are fatal except bind failure if the port is in use */
433 rc = sock_create (PF_INET, SOCK_STREAM, 0, &sock);
436 CERROR ("Can't create socket: %d\n", rc);
442 rc = sock_setsockopt(sock, SOL_SOCKET, SO_REUSEADDR,
443 (char *)&option, sizeof (option));
446 CERROR("Can't set SO_REUSEADDR for socket: %d\n", rc);
/* bind only when the caller asked for a specific address or port */
450 if (local_ip != 0 || local_port != 0) {
451 memset(&locaddr, 0, sizeof(locaddr));
452 locaddr.sin_family = AF_INET;
453 locaddr.sin_port = htons(local_port);
454 locaddr.sin_addr.s_addr = (local_ip == 0) ?
455 INADDR_ANY : htonl(local_ip);
457 rc = sock->ops->bind(sock, (struct sockaddr *)&locaddr,
/* port already taken: the one case the comment above calls non-fatal */
459 if (rc == -EADDRINUSE) {
460 CDEBUG(D_NET, "Port %d already in use\n", local_port);
465 CERROR("Error trying to bind to port %d: %d\n",
/*
 * libcfs_sock_setbuf(): set the send and/or receive buffer size of sock.
 *
 * SO_SNDBUF is set only when txbufsize is non-zero and SO_RCVBUF only when
 * rxbufsize is non-zero, so a zero argument leaves that buffer untouched.
 * Failures are logged with CERROR.
 *
 * NOTE(review): the assignment of option, the set_fs() handling and the
 * return statements are not visible in this excerpt.
 */
479 libcfs_sock_setbuf (struct socket *sock, int txbufsize, int rxbufsize)
481 mm_segment_t oldmm = get_fs();
/* zero means: do not change the send buffer */
485 if (txbufsize != 0) {
488 rc = sock_setsockopt(sock, SOL_SOCKET, SO_SNDBUF,
489 (char *)&option, sizeof (option));
492 CERROR ("Can't set send buffer %d: %d\n",
/* zero means: do not change the receive buffer */
498 if (rxbufsize != 0) {
501 rc = sock_setsockopt (sock, SOL_SOCKET, SO_RCVBUF,
502 (char *)&option, sizeof (option));
505 CERROR ("Can't set receive buffer %d: %d\n",
514 EXPORT_SYMBOL(libcfs_sock_setbuf);
/*
 * libcfs_sock_getaddr(): fetch an IPv4 address and port of sock through
 * its getname operation.
 *
 * remote selects which end is queried; the error message names it peer
 * when remote is non-zero and local otherwise.  The values stored through
 * ip and port are converted with ntohl()/ntohs(), i.e. they are in host
 * byte order.
 *
 * NOTE(review): the remaining getname arguments, any NULL checks on ip and
 * port, and the return statements are not visible in this excerpt.
 */
517 libcfs_sock_getaddr (struct socket *sock, int remote, __u32 *ip, int *port)
519 struct sockaddr_in sin;
520 int len = sizeof (sin);
523 rc = sock->ops->getname (sock, (struct sockaddr *)&sin, &len,
526 CERROR ("Error %d getting sock %s IP/port\n",
527 rc, remote ? "peer" : "local");
/* network to host byte order */
532 *ip = ntohl (sin.sin_addr.s_addr);
535 *port = ntohs (sin.sin_port);
540 EXPORT_SYMBOL(libcfs_sock_getaddr);
/*
 * libcfs_sock_getbuf(): report the current buffer sizes of sock.
 *
 * Each output pointer is optional: *txbufsize receives sock->sk->sk_sndbuf
 * and *rxbufsize receives sock->sk->sk_rcvbuf, but only when the
 * corresponding pointer is not NULL.
 *
 * NOTE(review): the return statement is not visible in this excerpt.
 */
543 libcfs_sock_getbuf (struct socket *sock, int *txbufsize, int *rxbufsize)
546 if (txbufsize != NULL) {
547 *txbufsize = sock->sk->sk_sndbuf;
550 if (rxbufsize != NULL) {
551 *rxbufsize = sock->sk->sk_rcvbuf;
557 EXPORT_SYMBOL(libcfs_sock_getbuf);
/*
 * libcfs_sock_listen(): create a socket bound to local_ip/local_port with
 * libcfs_sock_create() and put it into listening state with the given
 * backlog.
 *
 * The visible error paths log a port-in-use message for the create step
 * and, for the listen step, log the failure and release *sockp.
 *
 * NOTE(review): the conditions guarding those error paths and the return
 * statements are not visible in this excerpt.
 */
560 libcfs_sock_listen (struct socket **sockp,
561 __u32 local_ip, int local_port, int backlog)
566 rc = libcfs_sock_create(sockp, &fatal, local_ip, local_port);
569 CERROR("Can't create socket: port %d already in use\n",
574 rc = (*sockp)->ops->listen(*sockp, backlog);
578 CERROR("Can't set listen backlog %d: %d\n", backlog, rc);
/* the socket created above is dropped on this path */
579 sock_release(*sockp);
583 EXPORT_SYMBOL(libcfs_sock_listen);
/*
 * libcfs_sock_accept(): accept a connection on sock into a socket obtained
 * from sock_create_lite().
 *
 * The new socket reuses the ops of sock.  The current task puts itself on
 * the wait queue of sock->sk in TASK_INTERRUPTIBLE state, attempts a
 * non-blocking accept (O_NONBLOCK), and a second accept attempt follows
 * the wait step; afterwards the task leaves the wait queue and returns to
 * TASK_RUNNING.  A visible path releases newsock.
 *
 * NOTE(review): the condition that triggers the wait, the sleep call
 * itself, the store through newsockp and the return statements are not
 * visible in this excerpt.
 */
586 libcfs_sock_accept (struct socket **newsockp, struct socket *sock)
589 struct socket *newsock;
592 init_waitqueue_entry(&wait, current);
594 /* XXX this should add a ref to sock->ops->owner, if
595 * TCP could be a module */
/* NOTE(review): family is PF_PACKET while the protocol is IPPROTO_TCP -- confirm intent */
596 rc = sock_create_lite(PF_PACKET, sock->type, IPPROTO_TCP, &newsock);
598 CERROR("Can't allocate socket\n");
602 newsock->ops = sock->ops;
/* queue ourselves before trying, so a wake-up on this queue is not missed */
604 set_current_state(TASK_INTERRUPTIBLE);
605 add_wait_queue(sk_sleep(sock->sk), &wait);
607 rc = sock->ops->accept(sock, newsock, O_NONBLOCK);
609 /* Nothing ready, so wait for activity */
611 rc = sock->ops->accept(sock, newsock, O_NONBLOCK);
614 remove_wait_queue(sk_sleep(sock->sk), &wait);
615 set_current_state(TASK_RUNNING);
/* presumably the failure path: drop the socket allocated above */
624 sock_release(newsock);
628 EXPORT_SYMBOL(libcfs_sock_accept);
/*
 * libcfs_sock_abort_accept(): wake every task waiting on the wait queue of
 * sock->sk.  This is the same queue libcfs_sock_accept() adds itself to
 * around its accept attempts.
 */
631 libcfs_sock_abort_accept (struct socket *sock)
633 wake_up_all(sk_sleep(sock->sk));
636 EXPORT_SYMBOL(libcfs_sock_abort_accept);
/*
 * libcfs_sock_connect(): create a socket with libcfs_sock_create() (bound
 * to local_ip/local_port as that function decides) and connect it to
 * peer_ip/peer_port.
 *
 * peer_ip and peer_port are converted with htonl()/htons() before use, so
 * they are taken in host byte order.  After the connect attempt *fatal is
 * set to 0 only for -EADDRNOTAVAIL and to 1 for any other rc on that path;
 * the error is logged and *sockp is released.
 *
 * NOTE(review): the remaining connect arguments, the success test after
 * connect and the return statements are not visible in this excerpt.
 */
639 libcfs_sock_connect (struct socket **sockp, int *fatal,
640 __u32 local_ip, int local_port,
641 __u32 peer_ip, int peer_port)
643 struct sockaddr_in srvaddr;
646 rc = libcfs_sock_create(sockp, fatal, local_ip, local_port);
650 memset (&srvaddr, 0, sizeof (srvaddr));
651 srvaddr.sin_family = AF_INET;
652 srvaddr.sin_port = htons(peer_port);
653 srvaddr.sin_addr.s_addr = htonl(peer_ip);
655 rc = (*sockp)->ops->connect(*sockp,
656 (struct sockaddr *)&srvaddr, sizeof(srvaddr),
661 /* EADDRNOTAVAIL probably means we're already connected to the same
662 * peer/port on the same local port on a differently typed
663 * connection. Let our caller retry with a different local
665 *fatal = !(rc == -EADDRNOTAVAIL);
667 CDEBUG_LIMIT(*fatal ? D_NETERROR : D_NET,
668 "Error %d connecting %u.%u.%u.%u/%d -> %u.%u.%u.%u/%d\n", rc,
669 HIPQUAD(local_ip), local_port, HIPQUAD(peer_ip), peer_port);
671 sock_release(*sockp);
675 EXPORT_SYMBOL(libcfs_sock_connect);
/*
 * libcfs_sock_release(): exported helper taking the socket to dispose of.
 * NOTE(review): the body is not visible in this excerpt; presumably it
 * forwards to sock_release() as the other functions here do -- confirm.
 */
678 libcfs_sock_release (struct socket *sock)
683 EXPORT_SYMBOL(libcfs_sock_release);