xref: /original-bsd/sys/kern/uipc_usrreq.c (revision e4dd4c49)
1 /*
2  * Copyright (c) 1982, 1986, 1989 Regents of the University of California.
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms are permitted
6  * provided that the above copyright notice and this paragraph are
7  * duplicated in all such forms and that any documentation,
8  * advertising materials, and other materials related to such
9  * distribution and use acknowledge that the software was developed
10  * by the University of California, Berkeley.  The name of the
11  * University may not be used to endorse or promote products derived
12  * from this software without specific prior written permission.
13  * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR
14  * IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED
15  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
16  *
17  *	@(#)uipc_usrreq.c	7.15 (Berkeley) 04/16/90
18  */
19 
20 #include "param.h"
21 #include "user.h"
22 #include "domain.h"
23 #include "protosw.h"
24 #include "socket.h"
25 #include "socketvar.h"
26 #include "unpcb.h"
27 #include "un.h"
28 #include "vnode.h"
29 #include "mount.h"
30 #include "file.h"
31 #include "stat.h"
32 #include "mbuf.h"	/* XXX must appear after mount.h */
33 
34 /*
35  * Unix communications domain.
36  *
37  * TODO:
38  *	SEQPACKET, RDM
39  *	rethink name space problems
40  *	need a proper out-of-band
41  */
/*
 * Placeholder address for sockets that have no bound name.  In this file
 * it is copied out by PRU_ACCEPT when no peer address is available and is
 * used as the source address of datagrams sent from an unbound socket.
 */
struct	sockaddr sun_noname = { sizeof(sun_noname), AF_UNIX };
/*
 * Next fake inode number to hand out; PRU_SENSE assigns one to a pcb the
 * first time it finds that pcb's unp_ino still zero.
 */
ino_t	unp_ino;			/* prototype for fake inode numbers */
44 
/*
 * User-request entry point for the Unix communications domain:
 * carry out the PRU_* request `req' on socket `so'.
 *
 *	so	socket the request applies to; it must already have a
 *		protocol control block for every request but PRU_ATTACH.
 *	req	PRU_* request code.
 *	m	data mbuf chain for PRU_SEND; PRU_SENSE treats it as a
 *		struct stat pointer instead.
 *	nam	address mbuf: the name to bind/connect/send to, or the
 *		buffer filled in by PRU_ACCEPT, PRU_SOCKADDR and
 *		PRU_PEERADDR.  PRU_CONNECT2 treats it as the second socket.
 *	control	control-message mbuf; a non-empty one is accepted only
 *		together with PRU_SEND.
 *
 * Returns 0 or an errno value.  Every path that leaves through the
 * `release' label frees whatever `control' and `m' still point to;
 * PRU_CONTROL, PRU_SENSE and PRU_RCVOOB return directly and free nothing.
 */
/*ARGSUSED*/
uipc_usrreq(so, req, m, nam, control)
	struct socket *so;
	int req;
	struct mbuf *m, *nam, *control;
{
	struct unpcb *unp = sotounpcb(so);
	register struct socket *so2;
	register int error = 0;

	/*
	 * NOTE(review): this early return bypasses the m_freem() calls at
	 * `release'; presumably the arguments are not mbufs for
	 * PRU_CONTROL -- confirm against the caller.
	 */
	if (req == PRU_CONTROL)
		return (EOPNOTSUPP);
	/* Only PRU_SEND may be accompanied by non-empty control data. */
	if (req != PRU_SEND && control && control->m_len) {
		error = EOPNOTSUPP;
		goto release;
	}
	/* Everything except PRU_ATTACH needs an existing control block. */
	if (unp == 0 && req != PRU_ATTACH) {
		error = EINVAL;
		goto release;
	}
	switch (req) {

	case PRU_ATTACH:
		if (unp) {
			error = EISCONN;
			break;
		}
		error = unp_attach(so);
		break;

	case PRU_DETACH:
		unp_detach(unp);
		break;

	case PRU_BIND:
		error = unp_bind(unp, nam);
		break;

	case PRU_LISTEN:
		/* Refuse to listen unless the pcb has a vnode (see unp_bind). */
		if (unp->unp_vnode == 0)
			error = EINVAL;
		break;

	case PRU_CONNECT:
		error = unp_connect(so, nam);
		break;

	case PRU_CONNECT2:
		/* Here `nam' carries the second socket, not an address mbuf. */
		error = unp_connect2(so, (struct socket *)nam);
		break;

	case PRU_DISCONNECT:
		unp_disconnect(unp);
		break;

	case PRU_ACCEPT:
		/*
		 * Pass back name of connected socket,
		 * if it was bound and we are still connected
		 * (our peer may have closed already!).
		 */
		if (unp->unp_conn && unp->unp_conn->unp_addr) {
			nam->m_len = unp->unp_conn->unp_addr->m_len;
			bcopy(mtod(unp->unp_conn->unp_addr, caddr_t),
			    mtod(nam, caddr_t), (unsigned)nam->m_len);
		} else {
			/* No peer name available: hand back the placeholder. */
			nam->m_len = sizeof(sun_noname);
			*(mtod(nam, struct sockaddr *)) = sun_noname;
		}
		break;

	case PRU_SHUTDOWN:
		socantsendmore(so);
		unp_usrclosed(unp);
		break;

	case PRU_RCVD:
		switch (so->so_type) {

		case SOCK_DGRAM:
			panic("uipc 1");
			/*NOTREACHED*/

		case SOCK_STREAM:
			/* rcv: our receive buffer; snd: the peer's send buffer. */
#define	rcv (&so->so_rcv)
#define snd (&so2->so_snd)
			if (unp->unp_conn == 0)
				break;
			so2 = unp->unp_conn->unp_socket;
			/*
			 * Adjust backpressure on sender
			 * and wakeup any waiting to write.
			 */
			/*
			 * unp_mbcnt/unp_cc remember the receive-buffer counts
			 * seen at the previous adjustment; the difference is
			 * credited back to the peer's send limits.
			 */
			snd->sb_mbmax += unp->unp_mbcnt - rcv->sb_mbcnt;
			unp->unp_mbcnt = rcv->sb_mbcnt;
			snd->sb_hiwat += unp->unp_cc - rcv->sb_cc;
			unp->unp_cc = rcv->sb_cc;
			sowwakeup(so2);
#undef snd
#undef rcv
			break;

		default:
			panic("uipc 2");
		}
		break;

	case PRU_SEND:
		/*
		 * Convert any descriptors named in the control message
		 * before queueing it; on failure the release path frees
		 * both control and data.
		 */
		if (control && (error = unp_internalize(control)))
			break;
		switch (so->so_type) {

		case SOCK_DGRAM: {
			struct sockaddr *from;

			/*
			 * A send with an explicit destination connects for
			 * the duration of this one datagram and disconnects
			 * again below; it is refused on a connected socket.
			 */
			if (nam) {
				if (unp->unp_conn) {
					error = EISCONN;
					break;
				}
				error = unp_connect(so, nam);
				if (error)
					break;
			} else {
				if (unp->unp_conn == 0) {
					error = ENOTCONN;
					break;
				}
			}
			so2 = unp->unp_conn->unp_socket;
			/* Source address: our bound name, else the placeholder. */
			if (unp->unp_addr)
				from = mtod(unp->unp_addr, struct sockaddr *);
			else
				from = &sun_noname;
			if (sbappendaddr(&so2->so_rcv, from, m, control)) {
				sorwakeup(so2);
				/*
				 * Clear both pointers so the release path does
				 * not free mbufs that were just queued.
				 */
				m = 0;
				control = 0;
			} else
				error = ENOBUFS;
			if (nam)
				unp_disconnect(unp);
			break;
		}

		case SOCK_STREAM:
			/* rcv: the peer's receive buffer; snd: our send buffer. */
#define	rcv (&so2->so_rcv)
#define	snd (&so->so_snd)
			if (so->so_state & SS_CANTSENDMORE) {
				error = EPIPE;
				break;
			}
			if (unp->unp_conn == 0)
				panic("uipc 3");
			so2 = unp->unp_conn->unp_socket;
			/*
			 * Send to paired receive port, and then reduce
			 * send buffer hiwater marks to maintain backpressure.
			 * Wake up readers.
			 */
			if (control) {
				(void)sbappendcontrol(rcv, m, control);
				control = 0;
			} else
				sbappend(rcv, m);
			/*
			 * Charge the growth of the peer's receive buffer
			 * against our own send limits, and record the new
			 * counts in the peer's pcb for PRU_RCVD to undo.
			 */
			snd->sb_mbmax -=
			    rcv->sb_mbcnt - unp->unp_conn->unp_mbcnt;
			unp->unp_conn->unp_mbcnt = rcv->sb_mbcnt;
			snd->sb_hiwat -= rcv->sb_cc - unp->unp_conn->unp_cc;
			unp->unp_conn->unp_cc = rcv->sb_cc;
			sorwakeup(so2);
			/* Data has been queued; keep release from freeing it. */
			m = 0;
#undef snd
#undef rcv
			break;

		default:
			panic("uipc 4");
		}
		break;

	case PRU_ABORT:
		unp_drop(unp, ECONNABORTED);
		break;

	case PRU_SENSE:
		/*
		 * `m' is used as a struct stat pointer here, and the direct
		 * return below skips the m_freem() calls at `release'.
		 */
		((struct stat *) m)->st_blksize = so->so_snd.sb_hiwat;
		if (so->so_type == SOCK_STREAM && unp->unp_conn != 0) {
			so2 = unp->unp_conn->unp_socket;
			((struct stat *) m)->st_blksize += so2->so_rcv.sb_cc;
		}
		((struct stat *) m)->st_dev = NODEV;
		/* Assign a fake inode number the first time one is needed. */
		if (unp->unp_ino == 0)
			unp->unp_ino = unp_ino++;
		((struct stat *) m)->st_ino = unp->unp_ino;
		return (0);

	case PRU_RCVOOB:
		/* Returns directly: nothing is freed for this request. */
		return (EOPNOTSUPP);

	case PRU_SENDOOB:
		error = EOPNOTSUPP;
		break;

	case PRU_SOCKADDR:
		/* Copy out our bound name; zero length if unbound. */
		if (unp->unp_addr) {
			nam->m_len = unp->unp_addr->m_len;
			bcopy(mtod(unp->unp_addr, caddr_t),
			    mtod(nam, caddr_t), (unsigned)nam->m_len);
		} else
			nam->m_len = 0;
		break;

	case PRU_PEERADDR:
		/* Copy out the peer's bound name; zero length if none. */
		if (unp->unp_conn && unp->unp_conn->unp_addr) {
			nam->m_len = unp->unp_conn->unp_addr->m_len;
			bcopy(mtod(unp->unp_conn->unp_addr, caddr_t),
			    mtod(nam, caddr_t), (unsigned)nam->m_len);
		} else
			nam->m_len = 0;
		break;

	case PRU_SLOWTIMO:
		break;

	default:
		panic("piusrreq");
	}
release:
	/* Free whatever was not handed on to a socket buffer above. */
	if (control)
		m_freem(control);
	if (m)
		m_freem(m);
	return (error);
}
280 
281 /*
282  * Both send and receive buffers are allocated PIPSIZ bytes of buffering
283  * for stream sockets, although the total for sender and receiver is
284  * actually only PIPSIZ.
285  * Datagram sockets really use the sendspace as the maximum datagram size,
286  * and don't really want to reserve the sendspace.  Their recvspace should
287  * be large enough for at least one max-size datagram plus address.
288  */
#define	PIPSIZ	4096
/* Defaults passed to soreserve() by unp_attach() for stream sockets. */
u_long	unpst_sendspace = PIPSIZ;
u_long	unpst_recvspace = PIPSIZ;
/* Defaults passed to soreserve() by unp_attach() for datagram sockets. */
u_long	unpdg_sendspace = 2*1024;	/* really max datagram size */
u_long	unpdg_recvspace = 4*1024;

/*
 * Incremented for every descriptor converted by unp_internalize() and
 * decremented by unp_externalize() and unp_discard(); unp_detach() runs
 * the garbage collector only while it is non-zero.
 */
int	unp_rights;			/* file descriptors in flight */
296 
297 unp_attach(so)
298 	struct socket *so;
299 {
300 	register struct mbuf *m;
301 	register struct unpcb *unp;
302 	int error;
303 
304 	if (so->so_snd.sb_hiwat == 0 || so->so_rcv.sb_hiwat == 0) {
305 		switch (so->so_type) {
306 
307 		case SOCK_STREAM:
308 			error = soreserve(so, unpst_sendspace, unpst_recvspace);
309 			break;
310 
311 		case SOCK_DGRAM:
312 			error = soreserve(so, unpdg_sendspace, unpdg_recvspace);
313 			break;
314 		}
315 		if (error)
316 			return (error);
317 	}
318 	m = m_getclr(M_DONTWAIT, MT_PCB);
319 	if (m == NULL)
320 		return (ENOBUFS);
321 	unp = mtod(m, struct unpcb *);
322 	so->so_pcb = (caddr_t)unp;
323 	unp->unp_socket = so;
324 	return (0);
325 }
326 
327 unp_detach(unp)
328 	register struct unpcb *unp;
329 {
330 
331 	if (unp->unp_vnode) {
332 		unp->unp_vnode->v_socket = 0;
333 		vrele(unp->unp_vnode);
334 		unp->unp_vnode = 0;
335 	}
336 	if (unp->unp_conn)
337 		unp_disconnect(unp);
338 	while (unp->unp_refs)
339 		unp_drop(unp->unp_refs, ECONNRESET);
340 	soisdisconnected(unp->unp_socket);
341 	unp->unp_socket->so_pcb = 0;
342 	m_freem(unp->unp_addr);
343 	(void) m_free(dtom(unp));
344 	if (unp_rights)
345 		unp_gc();
346 }
347 
348 unp_bind(unp, nam)
349 	struct unpcb *unp;
350 	struct mbuf *nam;
351 {
352 	struct sockaddr_un *soun = mtod(nam, struct sockaddr_un *);
353 	register struct vnode *vp;
354 	register struct nameidata *ndp = &u.u_nd;
355 	struct vattr vattr;
356 	int error;
357 
358 	ndp->ni_dirp = soun->sun_path;
359 	if (unp->unp_vnode != NULL)
360 		return (EINVAL);
361 	if (nam->m_len == MLEN) {
362 		if (*(mtod(nam, caddr_t) + nam->m_len - 1) != 0)
363 			return (EINVAL);
364 	} else
365 		*(mtod(nam, caddr_t) + nam->m_len) = 0;
366 /* SHOULD BE ABLE TO ADOPT EXISTING AND wakeup() ALA FIFO's */
367 	ndp->ni_nameiop = CREATE | FOLLOW | LOCKPARENT;
368 	ndp->ni_segflg = UIO_SYSSPACE;
369 	if (error = namei(ndp))
370 		return (error);
371 	vp = ndp->ni_vp;
372 	if (vp != NULL) {
373 		VOP_ABORTOP(ndp);
374 		return (EADDRINUSE);
375 	}
376 	vattr_null(&vattr);
377 	vattr.va_type = VSOCK;
378 	vattr.va_mode = 0777;
379 	if (error = VOP_CREATE(ndp, &vattr))
380 		return (error);
381 	vp = ndp->ni_vp;
382 	vp->v_socket = unp->unp_socket;
383 	unp->unp_vnode = vp;
384 	unp->unp_addr = m_copy(nam, 0, (int)M_COPYALL);
385 	VOP_UNLOCK(vp);
386 	return (0);
387 }
388 
/*
 * Connect socket `so' to the socket bound to the pathname in `nam'.
 *
 * The name is NUL-terminated in place and looked up with namei().  It
 * must resolve to a VSOCK vnode that passes a VWRITE access check and
 * still has a socket attached, and that socket must be of the same type
 * as `so'.  For protocols flagged PR_CONNREQUIRED the target must have
 * SO_ACCEPTCONN set; a fresh socket is then created with sonewconn(),
 * given a copy of the target's bound address, and used as the peer.
 *
 * Returns 0 or an errno value: EMSGSIZE when the name runs to the end of
 * the mbuf without a terminating NUL, the error from namei() or
 * VOP_ACCESS(), ENOTSOCK, ECONNREFUSED, EPROTOTYPE, or whatever
 * unp_connect2() returns.
 */
unp_connect(so, nam)
	struct socket *so;
	struct mbuf *nam;
{
	register struct sockaddr_un *soun = mtod(nam, struct sockaddr_un *);
	register struct vnode *vp;
	register struct socket *so2, *so3;
	register struct nameidata *ndp = &u.u_nd;
	struct unpcb *unp2, *unp3;
	int error;

	ndp->ni_dirp = soun->sun_path;
	/*
	 * If the name ends exactly at the end of the mbuf's data area there
	 * is no room to add a terminator, so it must already have one.
	 */
	if (nam->m_data + nam->m_len == &nam->m_dat[MLEN]) {	/* XXX */
		if (*(mtod(nam, caddr_t) + nam->m_len - 1) != 0)
			return (EMSGSIZE);
	} else
		*(mtod(nam, caddr_t) + nam->m_len) = 0;
	ndp->ni_nameiop = LOOKUP | FOLLOW | LOCKLEAF;
	ndp->ni_segflg = UIO_SYSSPACE;
	if (error = namei(ndp))
		return (error);
	vp = ndp->ni_vp;
	if (vp->v_type != VSOCK) {
		error = ENOTSOCK;
		goto bad;
	}
	if (error = VOP_ACCESS(vp, VWRITE, ndp->ni_cred))
		goto bad;
	so2 = vp->v_socket;
	/* The node exists but no socket is attached to it any more. */
	if (so2 == 0) {
		error = ECONNREFUSED;
		goto bad;
	}
	if (so->so_type != so2->so_type) {
		error = EPROTOTYPE;
		goto bad;
	}
	if (so->so_proto->pr_flags & PR_CONNREQUIRED) {
		if ((so2->so_options & SO_ACCEPTCONN) == 0 ||
		    (so3 = sonewconn(so2, 0)) == 0) {
			error = ECONNREFUSED;
			goto bad;
		}
		unp2 = sotounpcb(so2);
		unp3 = sotounpcb(so3);
		/* The new socket inherits a copy of the listener's name. */
		if (unp2->unp_addr)
			unp3->unp_addr =
				  m_copy(unp2->unp_addr, 0, (int)M_COPYALL);
		/* Connect to the newly created socket, not the listener. */
		so2 = so3;
	}
	error = unp_connect2(so, so2);
bad:
	/* Common exit, success included: release the vnode from namei(). */
	vput(vp);
	return (error);
}
444 
445 unp_connect2(so, so2)
446 	register struct socket *so;
447 	register struct socket *so2;
448 {
449 	register struct unpcb *unp = sotounpcb(so);
450 	register struct unpcb *unp2;
451 
452 	if (so2->so_type != so->so_type)
453 		return (EPROTOTYPE);
454 	unp2 = sotounpcb(so2);
455 	unp->unp_conn = unp2;
456 	switch (so->so_type) {
457 
458 	case SOCK_DGRAM:
459 		unp->unp_nextref = unp2->unp_refs;
460 		unp2->unp_refs = unp;
461 		soisconnected(so);
462 		break;
463 
464 	case SOCK_STREAM:
465 		unp2->unp_conn = unp;
466 		soisconnected(so);
467 		soisconnected(so2);
468 		break;
469 
470 	default:
471 		panic("unp_connect2");
472 	}
473 	return (0);
474 }
475 
476 unp_disconnect(unp)
477 	struct unpcb *unp;
478 {
479 	register struct unpcb *unp2 = unp->unp_conn;
480 
481 	if (unp2 == 0)
482 		return;
483 	unp->unp_conn = 0;
484 	switch (unp->unp_socket->so_type) {
485 
486 	case SOCK_DGRAM:
487 		if (unp2->unp_refs == unp)
488 			unp2->unp_refs = unp->unp_nextref;
489 		else {
490 			unp2 = unp2->unp_refs;
491 			for (;;) {
492 				if (unp2 == 0)
493 					panic("unp_disconnect");
494 				if (unp2->unp_nextref == unp)
495 					break;
496 				unp2 = unp2->unp_nextref;
497 			}
498 			unp2->unp_nextref = unp->unp_nextref;
499 		}
500 		unp->unp_nextref = 0;
501 		unp->unp_socket->so_state &= ~SS_ISCONNECTED;
502 		break;
503 
504 	case SOCK_STREAM:
505 		soisdisconnected(unp->unp_socket);
506 		unp2->unp_conn = 0;
507 		soisdisconnected(unp2->unp_socket);
508 		break;
509 	}
510 }
511 
#ifdef notdef
/*
 * Compiled only when `notdef' is defined: abort a connection by simply
 * detaching the control block.  (PRU_ABORT in uipc_usrreq() calls
 * unp_drop() rather than this routine.)
 */
unp_abort(unp)
	struct unpcb *unp;
{

	unp_detach(unp);
}
#endif
520 
/*
 * Called for PRU_SHUTDOWN, after socantsendmore() has been applied to
 * the socket.  There is currently nothing further to do, so the body is
 * empty and the argument is unused.
 */
/*ARGSUSED*/
unp_usrclosed(unp)
	struct unpcb *unp;
{

}
527 
528 unp_drop(unp, errno)
529 	struct unpcb *unp;
530 	int errno;
531 {
532 	struct socket *so = unp->unp_socket;
533 
534 	so->so_error = errno;
535 	unp_disconnect(unp);
536 	if (so->so_head) {
537 		so->so_pcb = (caddr_t) 0;
538 		m_freem(unp->unp_addr);
539 		(void) m_free(dtom(unp));
540 		sofree(so);
541 	}
542 }
543 
#ifdef notdef
/*
 * Compiled only when `notdef' is defined: empty placeholder that takes
 * no arguments and does nothing.
 */
unp_drain()
{

}
#endif
550 
551 unp_externalize(rights)
552 	struct mbuf *rights;
553 {
554 	register int i;
555 	register struct cmsghdr *cm = mtod(rights, struct cmsghdr *);
556 	register struct file **rp = (struct file **)(cm + 1);
557 	register struct file *fp;
558 	int newfds = (cm->cmsg_len - sizeof(*cm)) / sizeof (int);
559 	int f;
560 
561 	if (newfds > ufavail()) {
562 		for (i = 0; i < newfds; i++) {
563 			fp = *rp;
564 			unp_discard(fp);
565 			*rp++ = 0;
566 		}
567 		return (EMSGSIZE);
568 	}
569 	for (i = 0; i < newfds; i++) {
570 		if (ufalloc(0, &f))
571 			panic("unp_externalize");
572 		fp = *rp;
573 		u.u_ofile[f] = fp;
574 		fp->f_msgcount--;
575 		unp_rights--;
576 		*(int *)rp++ = f;
577 	}
578 	return (0);
579 }
580 
581 unp_internalize(control)
582 	struct mbuf *control;
583 {
584 	register struct cmsghdr *cm = mtod(control, struct cmsghdr *);
585 	register struct file **rp;
586 	register struct file *fp;
587 	register int i, fd;
588 	int oldfds;
589 
590 	if (cm->cmsg_type != SCM_RIGHTS || cm->cmsg_level != SOL_SOCKET ||
591 	    cm->cmsg_len != control->m_len)
592 		return (EINVAL);
593 	oldfds = (cm->cmsg_len - sizeof (*cm)) / sizeof (int);
594 	rp = (struct file **)(cm + 1);
595 	for (i = 0; i < oldfds; i++) {
596 		fd = *(int *)rp++;
597 		if ((unsigned)fd >= NOFILE || u.u_ofile[fd] == NULL)
598 			return (EBADF);
599 	}
600 	rp = (struct file **)(cm + 1);
601 	for (i = 0; i < oldfds; i++) {
602 		fp = u.u_ofile[*(int *)rp];
603 		*rp++ = fp;
604 		fp->f_count++;
605 		fp->f_msgcount++;
606 		unp_rights++;
607 	}
608 	return (0);
609 }
610 
/*
 * Garbage-collector state: unp_defer counts files currently flagged
 * FDEFER (raised by unp_mark(), lowered by unp_gc() as it picks each
 * one up); unp_gcing is non-zero while unp_gc() is running and makes a
 * nested call return immediately.
 */
int	unp_defer, unp_gcing;
/* Declared here because unp_gc() passes it to unp_scan() before its definition. */
int	unp_mark();
extern	struct domain unixdomain;
614 
/*
 * Garbage-collect files that are referenced only by rights messages
 * which no marked file's receive buffer holds.
 *
 * Mark phase: after clearing FMARK and FDEFER on every file table entry,
 * repeatedly sweep the table.  A file is marked when it has references
 * other than those held by in-flight messages (f_count != f_msgcount),
 * or when unp_mark() flagged it because a marked socket's receive buffer
 * carries it.  Each newly marked Unix-domain socket with PR_RIGHTS has
 * its receive buffer scanned in turn, and the sweep repeats until no
 * deferred files remain.
 *
 * Sweep phase: every file whose references are all held by messages
 * (f_count == f_msgcount) and that was never marked has those message
 * references discarded one at a time.
 *
 * Does nothing when a collection is already in progress.
 */
unp_gc()
{
	register struct file *fp;
	register struct socket *so;

	if (unp_gcing)
		return;
	unp_gcing = 1;
restart:
	unp_defer = 0;
	for (fp = file; fp < fileNFILE; fp++)
		fp->f_flag &= ~(FMARK|FDEFER);
	do {
		for (fp = file; fp < fileNFILE; fp++) {
			if (fp->f_count == 0)
				continue;
			if (fp->f_flag & FDEFER) {
				/* Flagged by unp_mark(): scan it on this pass. */
				fp->f_flag &= ~FDEFER;
				unp_defer--;
			} else {
				if (fp->f_flag & FMARK)
					continue;
				/* All references are held by messages: not a root. */
				if (fp->f_count == fp->f_msgcount)
					continue;
				fp->f_flag |= FMARK;
			}
			/* Only Unix-domain sockets that pass rights are scanned. */
			if (fp->f_type != DTYPE_SOCKET ||
			    (so = (struct socket *)fp->f_data) == 0)
				continue;
			if (so->so_proto->pr_domain != &unixdomain ||
			    (so->so_proto->pr_flags&PR_RIGHTS) == 0)
				continue;
			/*
			 * The receive buffer is locked: wait on it, then
			 * start the whole mark phase over from scratch.
			 */
			if (so->so_rcv.sb_flags & SB_LOCK) {
				sbwait(&so->so_rcv);
				goto restart;
			}
			unp_scan(so->so_rcv.sb_mb, unp_mark);
		}
	} while (unp_defer);
	for (fp = file; fp < fileNFILE; fp++) {
		if (fp->f_count == 0)
			continue;
		if (fp->f_count == fp->f_msgcount && (fp->f_flag & FMARK) == 0)
			while (fp->f_msgcount)
				unp_discard(fp);
	}
	unp_gcing = 0;
}
663 
/*
 * Discard every file reference carried by rights messages in the mbuf
 * chain `m'.  A null chain is ignored.
 */
unp_dispose(m)
	struct mbuf *m;
{
	int unp_discard();

	if (m == 0)
		return;
	unp_scan(m, unp_discard);
}
672 
673 unp_scan(m0, op)
674 	register struct mbuf *m0;
675 	int (*op)();
676 {
677 	register struct mbuf *m;
678 	register struct file **rp;
679 	register struct cmsghdr *cm;
680 	register int i;
681 	int qfds;
682 
683 	while (m0) {
684 		for (m = m0; m; m = m->m_next)
685 			if (m->m_type == MT_CONTROL &&
686 			    m->m_len >= sizeof(*cm)) {
687 				cm = mtod(m, struct cmsghdr *);
688 				if (cm->cmsg_level != SOL_SOCKET ||
689 				    cm->cmsg_type != SCM_RIGHTS)
690 					continue;
691 				qfds = (cm->cmsg_len - sizeof *cm)
692 						/ sizeof (struct file *);
693 				rp = (struct file **)(cm + 1);
694 				for (i = 0; i < qfds; i++)
695 					(*op)(*rp++);
696 				break;		/* XXX, but saves time */
697 			}
698 		m0 = m0->m_act;
699 	}
700 }
701 
702 unp_mark(fp)
703 	struct file *fp;
704 {
705 
706 	if (fp->f_flag & FMARK)
707 		return;
708 	unp_defer++;
709 	fp->f_flag |= (FMARK|FDEFER);
710 }
711 
712 unp_discard(fp)
713 	struct file *fp;
714 {
715 
716 	fp->f_msgcount--;
717 	unp_rights--;
718 	(void) closef(fp);
719 }
720