db_sockets.c 43 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492
  1. /* -*- mode:c; c-file-style:"k&r"; c-basic-offset: 4; tab-width:4; indent-tabs-mode:nil; mode:auto-fill; fill-column:78; -*- */
  2. /* vim: set ts=4 sw=4 et tw=78 fo=cqt wm=0: */
  3. /* Copyright (C) 2014 Stony Brook University
  4. This file is part of Graphene Library OS.
  5. Graphene Library OS is free software: you can redistribute it and/or
  6. modify it under the terms of the GNU Lesser General Public License
  7. as published by the Free Software Foundation, either version 3 of the
  8. License, or (at your option) any later version.
  9. Graphene Library OS is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU Lesser General Public License for more details.
  13. You should have received a copy of the GNU Lesser General Public License
  14. along with this program. If not, see <http://www.gnu.org/licenses/>. */
/*
 * db_sockets.c
 *
 * This file contains operations for streams with URIs that start with
 * "tcp:", "tcp.srv:", "udp:", "udp.srv:".
 */
  21. #include "pal_defs.h"
  22. #include "pal_linux_defs.h"
  23. #include "pal.h"
  24. #include "pal_internal.h"
  25. #include "pal_linux.h"
  26. #include "pal_debug.h"
  27. #include "pal_security.h"
  28. #include "pal_error.h"
  29. #include "api.h"
  30. #include "graphene.h"
  31. #include <linux/types.h>
  32. #include <linux/poll.h>
  33. typedef __kernel_pid_t pid_t;
  34. #include <asm/fcntl.h>
  35. #include <sys/socket.h>
  36. #include <linux/in.h>
  37. #include <linux/in6.h>
  38. #include <linux/time.h>
  39. #include <netinet/tcp.h>
  40. #include <asm/errno.h>
  41. #ifndef SOL_TCP
  42. # define SOL_TCP 6
  43. #endif
  44. #ifndef TCP_NODELAY
  45. # define TCP_NODELAY 1
  46. #endif
  47. #ifndef TCP_CORK
  48. # define TCP_CORK 3
  49. #endif
  50. #ifndef SOL_IPV6
  51. # define SOL_IPV6 41
  52. #endif
/* 96 bytes is the minimal size of a buffer that can store an IPv4/IPv6
   address */
  55. #define PAL_SOCKADDR_SIZE 96
  56. static size_t addr_size(const struct sockaddr* addr) {
  57. switch (addr->sa_family) {
  58. case AF_INET:
  59. return sizeof(struct sockaddr_in);
  60. case AF_INET6:
  61. return sizeof(struct sockaddr_in6);
  62. default:
  63. return 0;
  64. }
  65. }
  66. /* parsing the string of uri, and fill in the socket address structure.
  67. the latest pointer of uri, length of socket address are returned. */
  68. static int inet_parse_uri (char ** uri, struct sockaddr * addr, size_t * addrlen)
  69. {
  70. char * tmp = *uri, * end;
  71. char * addr_str = NULL, * port_str;
  72. int af;
  73. void * addr_buf;
  74. size_t addr_len;
  75. __be16 * port_buf;
  76. size_t slen;
  77. if (tmp[0] == '[') {
  78. /* for IPv6, the address will be in the form of
  79. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  80. struct sockaddr_in6 * addr_in6 = (struct sockaddr_in6 *) addr;
  81. slen = sizeof(struct sockaddr_in6);
  82. memset(addr, 0, slen);
  83. end = strchr(tmp + 1, ']');
  84. if (!end || *(end + 1) != ':')
  85. goto inval;
  86. addr_str = tmp + 1;
  87. addr_len = end - tmp - 1;
  88. port_str = end + 2;
  89. for (end = port_str ; *end >= '0' && *end <= '9' ; end++);
  90. addr_in6->sin6_family = af = AF_INET6;
  91. addr_buf = &addr_in6->sin6_addr.s6_addr;
  92. port_buf = &addr_in6->sin6_port;
  93. } else {
  94. /* for IP, the address will be in the form of "x.x.x.x:port". */
  95. struct sockaddr_in * addr_in = (struct sockaddr_in *) addr;
  96. slen = sizeof(struct sockaddr_in);
  97. memset(addr, 0, slen);
  98. end = strchr(tmp, ':');
  99. if (!end)
  100. goto inval;
  101. addr_str = tmp;
  102. addr_len = end - tmp;
  103. port_str = end + 1;
  104. for (end = port_str ; *end >= '0' && *end <= '9' ; end++);
  105. addr_in->sin_family = af = AF_INET;
  106. addr_buf = &addr_in->sin_addr.s_addr;
  107. port_buf = &addr_in->sin_port;
  108. }
  109. if (af == AF_INET) {
  110. if (!inet_pton4(addr_str, addr_len, addr_buf))
  111. goto inval;
  112. } else {
  113. if (!inet_pton6(addr_str, addr_len, addr_buf))
  114. goto inval;
  115. }
  116. *port_buf = __htons(atoi(port_str));
  117. *uri = *end ? end + 1 : NULL;
  118. if (addrlen)
  119. *addrlen = slen;
  120. return 0;
  121. inval:
  122. return -PAL_ERROR_INVAL;
  123. }
  124. /* create the string of uri from the given socket address */
  125. static int inet_create_uri (char * uri, size_t count, struct sockaddr * addr,
  126. size_t addrlen)
  127. {
  128. size_t len = 0;
  129. if (addr->sa_family == AF_INET) {
  130. if (addrlen != sizeof(struct sockaddr_in))
  131. return -PAL_ERROR_INVAL;
  132. struct sockaddr_in * addr_in = (struct sockaddr_in *) addr;
  133. char * addr = (char *) &addr_in->sin_addr.s_addr;
  134. /* for IP, the address will be in the form of "x.x.x.x:port". */
  135. len = snprintf(uri, count, "%u.%u.%u.%u:%u",
  136. (unsigned char) addr[0],
  137. (unsigned char) addr[1],
  138. (unsigned char) addr[2],
  139. (unsigned char) addr[3],
  140. __ntohs(addr_in->sin_port));
  141. } else if (addr->sa_family == AF_INET6) {
  142. if (addrlen != sizeof(struct sockaddr_in6))
  143. return -PAL_ERROR_INVAL;
  144. struct sockaddr_in6 * addr_in6 = (struct sockaddr_in6 *) addr;
  145. unsigned short * addr = (unsigned short *) &addr_in6->sin6_addr.s6_addr;
  146. /* for IPv6, the address will be in the form of
  147. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  148. len = snprintf(uri, count, "[%04x:%04x:%04x:%04x:%04x:%04x:%04x:%04x]:%u",
  149. addr[0], addr[1], addr[2], addr[3],
  150. addr[4], addr[5], addr[6], addr[7],
  151. __ntohs(addr_in6->sin6_port));
  152. } else {
  153. return -PAL_ERROR_INVAL;
  154. }
  155. if (len >= count)
  156. return -PAL_ERROR_TOOLONG;
  157. return len;
  158. }
  159. /* parse the uri for a socket stream. The uri might have both binding
  160. address and connecting address, or connecting address only. The form
  161. of uri will be either "bind-addr:bind-port:connect-addr:connect-port"
  162. or "addr:port". */
  163. static int socket_parse_uri (char * uri,
  164. struct sockaddr ** bind_addr, size_t * bind_addrlen,
  165. struct sockaddr ** dest_addr, size_t * dest_addrlen)
  166. {
  167. int ret;
  168. if (!bind_addr && !dest_addr)
  169. return 0;
  170. if (!uri || !(*uri)) {
  171. if (bind_addr)
  172. *bind_addr = NULL;
  173. if (bind_addrlen)
  174. *bind_addrlen = 0;
  175. if (dest_addr)
  176. *dest_addr = NULL;
  177. if (dest_addrlen)
  178. *dest_addrlen = 0;
  179. return 0;
  180. }
  181. /* at least parse uri once */
  182. if ((ret = inet_parse_uri(&uri, bind_addr ? *bind_addr : *dest_addr,
  183. bind_addr ? bind_addrlen : dest_addrlen)) < 0)
  184. return ret;
  185. if (!(bind_addr && dest_addr))
  186. return 0;
  187. /* if you reach here, it can only be connection address */
  188. if (!uri || (ret = inet_parse_uri(&uri, *dest_addr, dest_addrlen)) < 0) {
  189. *dest_addr = *bind_addr;
  190. *dest_addrlen = *bind_addrlen;
  191. *bind_addr = NULL;
  192. *bind_addrlen = 0;
  193. }
  194. return 0;
  195. }
  196. /* fill in the PAL handle based on the file descriptors and address given. */
  197. static inline
  198. PAL_HANDLE socket_create_handle (int type, int fd, int options,
  199. struct sockaddr * bind_addr, size_t bind_addrlen,
  200. struct sockaddr * dest_addr, size_t dest_addrlen)
  201. {
  202. PAL_HANDLE hdl = malloc(HANDLE_SIZE(sock) + (bind_addr ? bind_addrlen : 0) +
  203. (dest_addr ? dest_addrlen : 0));
  204. if (!hdl)
  205. return NULL;
  206. memset(hdl, 0, sizeof(struct pal_handle));
  207. init_handle_hdr(HANDLE_HDR(hdl), type);
  208. HANDLE_HDR(hdl)->flags |= RFD(0)|(type != pal_type_tcpsrv ? WFD(0) : 0);
  209. hdl->sock.fd = fd;
  210. void * addr = (void *) hdl + HANDLE_SIZE(sock);
  211. if (bind_addr) {
  212. hdl->sock.bind = (PAL_PTR) addr;
  213. memcpy(addr, bind_addr, bind_addrlen);
  214. addr += bind_addrlen;
  215. } else {
  216. hdl->sock.bind = (PAL_PTR) NULL;
  217. }
  218. if (dest_addr) {
  219. hdl->sock.conn = (PAL_PTR) addr;
  220. memcpy(addr, dest_addr, dest_addrlen);
  221. addr += dest_addrlen;
  222. } else {
  223. hdl->sock.conn = (PAL_PTR) NULL;
  224. }
  225. hdl->sock.nonblocking = (options & PAL_OPTION_NONBLOCK) ?
  226. PAL_TRUE : PAL_FALSE;
  227. hdl->sock.linger = 0;
  228. if (type == pal_type_tcpsrv) {
  229. hdl->sock.receivebuf = 0;
  230. hdl->sock.sendbuf = 0;
  231. } else {
  232. int ret, val;
  233. socklen_t len = sizeof(int);
  234. ret = INLINE_SYSCALL(getsockopt, 5, fd, SOL_SOCKET, SO_RCVBUF,
  235. &val, &len);
  236. hdl->sock.receivebuf = IS_ERR(ret) ? 0 : val;
  237. ret = INLINE_SYSCALL(getsockopt, 5, fd, SOL_SOCKET, SO_SNDBUF,
  238. &val, &len);
  239. hdl->sock.sendbuf = IS_ERR(ret) ? 0 : val;
  240. }
  241. hdl->sock.receivetimeout = 0;
  242. hdl->sock.sendtimeout = 0;
  243. hdl->sock.tcp_cork = PAL_FALSE;
  244. hdl->sock.tcp_keepalive = PAL_FALSE;
  245. hdl->sock.tcp_nodelay = PAL_FALSE;
  246. return hdl;
  247. }
  248. static bool check_zero (void * mem, size_t size)
  249. {
  250. void * p = mem, * q = mem + size;
  251. while (p < q) {
  252. if (p <= q - sizeof(long)) {
  253. if (*(long *) p)
  254. return false;
  255. p += sizeof(long);
  256. } else if (p <= q - sizeof(int)) {
  257. if (*(int *) p)
  258. return false;
  259. p += sizeof(int);
  260. } else if (p <= q - sizeof(short)) {
  261. if (*(short *) p)
  262. return false;
  263. p += sizeof(short);
  264. } else {
  265. if (*(char *) p)
  266. return false;
  267. p++;
  268. }
  269. }
  270. return true;
  271. }
  272. /* check if an address is "Any" */
  273. static bool check_any_addr (struct sockaddr * addr)
  274. {
  275. if (addr->sa_family == AF_INET) {
  276. struct sockaddr_in * addr_in =
  277. (struct sockaddr_in *) addr;
  278. return addr_in->sin_port == 0 &&
  279. check_zero(&addr_in->sin_addr,
  280. sizeof(addr_in->sin_addr));
  281. } else if (addr->sa_family == AF_INET6) {
  282. struct sockaddr_in6 * addr_in6 =
  283. (struct sockaddr_in6 *) addr;
  284. return addr_in6->sin6_port == 0 &&
  285. check_zero(&addr_in6->sin6_addr,
  286. sizeof(addr_in6->sin6_addr));
  287. }
  288. return false;
  289. }
  290. /* listen on a tcp socket */
  291. static int tcp_listen (PAL_HANDLE * handle, char * uri, int options)
  292. {
  293. struct sockaddr buffer, * bind_addr = &buffer;
  294. size_t bind_addrlen;
  295. int ret, fd = -1;
  296. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  297. NULL, NULL)) < 0)
  298. return ret;
  299. assert(bind_addr);
  300. assert(bind_addrlen == addr_size(bind_addr));
  301. #if ALLOW_BIND_ANY == 0
  302. /* the socket need to have a binding address, a null address or an
  303. any address is not allowed */
  304. if (check_any_addr(bind_addr))
  305. return -PAL_ERROR_INVAL;
  306. #endif
  307. fd = INLINE_SYSCALL(socket, 3, bind_addr->sa_family,
  308. SOCK_STREAM|SOCK_CLOEXEC|options, 0);
  309. if (IS_ERR(fd))
  310. return -PAL_ERROR_DENIED;
  311. if (bind_addr->sa_family == AF_INET6) {
  312. int ipv6only = 1;
  313. INLINE_SYSCALL(setsockopt, 5, fd, SOL_IPV6, IPV6_V6ONLY, &ipv6only,
  314. sizeof(int));
  315. }
  316. /* must set the socket to be reuseable */
  317. int reuseaddr = 1;
  318. INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_REUSEADDR, &reuseaddr,
  319. sizeof(int));
  320. ret = INLINE_SYSCALL(bind, 3, fd, bind_addr, bind_addrlen);
  321. if (IS_ERR(ret)) {
  322. switch(ERRNO(ret)) {
  323. case EINVAL:
  324. ret = -PAL_ERROR_INVAL;
  325. goto failed;
  326. case EADDRINUSE:
  327. ret = -PAL_ERROR_STREAMEXIST;
  328. goto failed;
  329. default:
  330. ret = -PAL_ERROR_DENIED;
  331. goto failed;
  332. }
  333. }
  334. if (check_any_addr(bind_addr)) {
  335. /* call getsockname to get socket address */
  336. if ((ret = INLINE_SYSCALL(getsockname, 3, fd,
  337. bind_addr, &bind_addrlen)) < 0)
  338. goto failed;
  339. }
  340. ret = INLINE_SYSCALL(listen, 2, fd, DEFAULT_BACKLOG);
  341. if (IS_ERR(ret))
  342. return -PAL_ERROR_DENIED;
  343. *handle = socket_create_handle(pal_type_tcpsrv, fd, options,
  344. bind_addr, bind_addrlen, NULL, 0);
  345. if (!(*handle)) {
  346. ret = -PAL_ERROR_NOMEM;
  347. goto failed;
  348. }
  349. return 0;
  350. failed:
  351. INLINE_SYSCALL(close, 1, fd);
  352. return ret;
  353. }
  354. /* accept a tcp connection */
  355. static int tcp_accept (PAL_HANDLE handle, PAL_HANDLE * client)
  356. {
  357. if (!IS_HANDLE_TYPE(handle, tcpsrv) ||
  358. !handle->sock.bind || handle->sock.conn)
  359. return -PAL_ERROR_NOTSERVER;
  360. if (handle->sock.fd == PAL_IDX_POISON)
  361. return -PAL_ERROR_BADHANDLE;
  362. struct sockaddr * bind_addr = (struct sockaddr *) handle->sock.bind;
  363. size_t bind_addrlen = addr_size(bind_addr);
  364. struct sockaddr buffer;
  365. socklen_t addrlen = sizeof(struct sockaddr);
  366. int ret = 0;
  367. int newfd = INLINE_SYSCALL(accept4, 4, handle->sock.fd, &buffer,
  368. &addrlen, O_CLOEXEC);
  369. if (IS_ERR(newfd))
  370. switch(ERRNO(newfd)) {
  371. case EWOULDBLOCK:
  372. return -PAL_ERROR_TRYAGAIN;
  373. case ECONNABORTED:
  374. return -PAL_ERROR_STREAMNOTEXIST;
  375. default:
  376. return unix_to_pal_error(ERRNO(newfd));
  377. }
  378. struct sockaddr * dest_addr = &buffer;
  379. size_t dest_addrlen = addrlen;
  380. *client = socket_create_handle(pal_type_tcp, newfd, 0,
  381. bind_addr, bind_addrlen,
  382. dest_addr, dest_addrlen);
  383. if (!(*client)) {
  384. ret = -PAL_ERROR_NOMEM;
  385. goto failed;
  386. }
  387. return 0;
  388. failed:
  389. INLINE_SYSCALL(close, 1, newfd);
  390. return ret;
  391. }
  392. /* connect on a tcp socket */
  393. static int tcp_connect (PAL_HANDLE * handle, char * uri, int options)
  394. {
  395. struct sockaddr buffer[3];
  396. struct sockaddr * bind_addr = buffer, * dest_addr = buffer + 1;
  397. size_t bind_addrlen, dest_addrlen;
  398. int ret, fd = -1;
  399. /* accepting two kind of different uri:
  400. dest-ip:dest-port or bind-ip:bind-port:dest-ip:dest-port */
  401. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  402. &dest_addr, &dest_addrlen)) < 0)
  403. return ret;
  404. if (!dest_addr)
  405. return -PAL_ERROR_INVAL;
  406. if (bind_addr && bind_addr->sa_family != dest_addr->sa_family)
  407. return -PAL_ERROR_INVAL;
  408. fd = INLINE_SYSCALL(socket, 3, dest_addr->sa_family,
  409. SOCK_STREAM|SOCK_CLOEXEC|options, 0);
  410. if (IS_ERR(fd))
  411. return -PAL_ERROR_DENIED;
  412. if (bind_addr) {
  413. if (IS_ERR(ret)) {
  414. INLINE_SYSCALL(close, 1, fd);
  415. switch (ERRNO(ret)) {
  416. case EADDRINUSE:
  417. ret = -PAL_ERROR_STREAMEXIST;
  418. goto failed;
  419. case EADDRNOTAVAIL:
  420. ret = -PAL_ERROR_ADDRNOTEXIST;
  421. goto failed;
  422. default:
  423. ret = unix_to_pal_error(ERRNO(ret));
  424. goto failed;
  425. }
  426. }
  427. }
  428. if (dest_addr->sa_family == AF_INET6) {
  429. int ipv6only = 1;
  430. INLINE_SYSCALL(setsockopt, 5, fd, SOL_IPV6, IPV6_V6ONLY, &ipv6only,
  431. sizeof(int));
  432. }
  433. ret = INLINE_SYSCALL(connect, 3, fd, dest_addr, dest_addrlen);
  434. if (IS_ERR(ret) && ERRNO(ret) == EINPROGRESS) {
  435. struct pollfd pfd = { .fd = fd, .events = POLLOUT, .revents = 0 };
  436. ret = INLINE_SYSCALL(ppoll, 5, &pfd, 1, NULL, NULL, 0);
  437. }
  438. if (IS_ERR(ret)) {
  439. ret = unix_to_pal_error(ERRNO(ret));
  440. goto failed;
  441. }
  442. if (!bind_addr) {
  443. /* save some space to get socket address */
  444. bind_addr = buffer + 2;
  445. bind_addrlen = sizeof(struct sockaddr);
  446. /* call getsockname to get socket address */
  447. if ((ret = INLINE_SYSCALL(getsockname, 3, fd,
  448. bind_addr, &bind_addrlen)) < 0)
  449. bind_addr = NULL;
  450. }
  451. *handle = socket_create_handle(pal_type_tcp, fd, options,
  452. bind_addr, bind_addrlen,
  453. dest_addr, dest_addrlen);
  454. if (!(*handle)) {
  455. ret = -PAL_ERROR_NOMEM;
  456. goto failed;
  457. }
  458. return 0;
  459. failed:
  460. INLINE_SYSCALL(close, 1, fd);
  461. return ret;
  462. }
  463. /* 'open' operation of tcp stream */
  464. static int tcp_open (PAL_HANDLE *handle, const char * type, const char * uri,
  465. int access, int share, int create, int options)
  466. {
  467. if (!WITHIN_MASK(access, PAL_ACCESS_MASK) ||
  468. !WITHIN_MASK(share, PAL_SHARE_MASK) ||
  469. !WITHIN_MASK(create, PAL_CREATE_MASK))
  470. return -PAL_ERROR_INVAL;
  471. size_t uri_len = strlen(uri) + 1;
  472. if (uri_len > PAL_SOCKADDR_SIZE)
  473. return -PAL_ERROR_TOOLONG;
  474. char uri_buf[PAL_SOCKADDR_SIZE];
  475. memcpy(uri_buf, uri, uri_len);
  476. if (strcmp_static(type, "tcp.srv"))
  477. return tcp_listen(handle, uri_buf, options);
  478. if (strcmp_static(type, "tcp"))
  479. return tcp_connect(handle, uri_buf, options);
  480. return -PAL_ERROR_NOTSUPPORT;
  481. }
  482. /* 'read' operation of tcp stream */
  483. static int64_t tcp_read (PAL_HANDLE handle, uint64_t offset, size_t len,
  484. void * buf)
  485. {
  486. if (offset)
  487. return -PAL_ERROR_INVAL;
  488. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  489. return -PAL_ERROR_NOTCONNECTION;
  490. if (handle->sock.fd == PAL_IDX_POISON)
  491. return -PAL_ERROR_ENDOFSTREAM;
  492. struct msghdr hdr;
  493. struct iovec iov;
  494. iov.iov_base = buf;
  495. iov.iov_len = len;
  496. hdr.msg_name = NULL;
  497. hdr.msg_namelen = 0;
  498. hdr.msg_iov = &iov;
  499. hdr.msg_iovlen = 1;
  500. hdr.msg_control = NULL;
  501. hdr.msg_controllen = 0;
  502. hdr.msg_flags = 0;
  503. int64_t bytes = INLINE_SYSCALL(recvmsg, 3, handle->sock.fd, &hdr, 0);
  504. if (IS_ERR(bytes))
  505. return unix_to_pal_error(ERRNO(bytes));
  506. if (!bytes)
  507. return -PAL_ERROR_ENDOFSTREAM;
  508. return bytes;
  509. }
  510. /* write' operation of tcp stream */
  511. static int64_t tcp_write (PAL_HANDLE handle, uint64_t offset, size_t len,
  512. const void * buf)
  513. {
  514. if (offset)
  515. return -PAL_ERROR_INVAL;
  516. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  517. return -PAL_ERROR_NOTCONNECTION;
  518. if (handle->sock.fd == PAL_IDX_POISON)
  519. return -PAL_ERROR_CONNFAILED;
  520. struct msghdr hdr;
  521. struct iovec iov;
  522. iov.iov_base = (void *) buf;
  523. iov.iov_len = len;
  524. hdr.msg_name = NULL;
  525. hdr.msg_namelen = 0;
  526. hdr.msg_iov = &iov;
  527. hdr.msg_iovlen = 1;
  528. hdr.msg_control = NULL;
  529. hdr.msg_controllen = 0;
  530. hdr.msg_flags = 0;
  531. int64_t bytes = INLINE_SYSCALL(sendmsg, 3, handle->sock.fd, &hdr, MSG_NOSIGNAL);
  532. if (!IS_ERR(bytes) && (size_t)bytes == len)
  533. HANDLE_HDR(handle)->flags |= WRITABLE(0);
  534. else
  535. HANDLE_HDR(handle)->flags &= ~WRITABLE(0);
  536. if (IS_ERR(bytes))
  537. bytes = unix_to_pal_error(ERRNO(bytes));
  538. return bytes;
  539. }
  540. /* used by 'open' operation of tcp stream for bound socket */
  541. static int udp_bind (PAL_HANDLE * handle, char * uri, int options)
  542. {
  543. struct sockaddr buffer, * bind_addr = &buffer;
  544. size_t bind_addrlen;
  545. int ret = 0, fd = -1;
  546. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  547. NULL, NULL)) < 0)
  548. return ret;
  549. assert(bind_addr);
  550. assert(bind_addrlen == addr_size(bind_addr));
  551. #if ALLOW_BIND_ANY == 0
  552. /* the socket need to have a binding address, a null address or an
  553. any address is not allowed */
  554. if (check_any_addr(bind_addr))
  555. return -PAL_ERROR_INVAL;
  556. #endif
  557. fd = INLINE_SYSCALL(socket, 3, bind_addr->sa_family,
  558. SOCK_DGRAM|SOCK_CLOEXEC|options, 0);
  559. if (IS_ERR(fd))
  560. return -PAL_ERROR_DENIED;
  561. if (bind_addr->sa_family == AF_INET6) {
  562. int ipv6only = 1;
  563. INLINE_SYSCALL(setsockopt, 5, fd, SOL_IPV6, IPV6_V6ONLY, &ipv6only,
  564. sizeof(int));
  565. }
  566. ret = INLINE_SYSCALL(bind, 3, fd, bind_addr, bind_addrlen);
  567. if (IS_ERR(ret)) {
  568. switch (ERRNO(ret)) {
  569. case EADDRINUSE:
  570. ret = -PAL_ERROR_STREAMEXIST;
  571. goto failed;
  572. case EADDRNOTAVAIL:
  573. ret = -PAL_ERROR_ADDRNOTEXIST;
  574. goto failed;
  575. default:
  576. ret = unix_to_pal_error(ERRNO(ret));
  577. goto failed;
  578. }
  579. }
  580. *handle = socket_create_handle(pal_type_udpsrv, fd, options,
  581. bind_addr, bind_addrlen, NULL, 0);
  582. if (!(*handle)) {
  583. ret = -ENOMEM;
  584. goto failed;
  585. }
  586. return 0;
  587. failed:
  588. INLINE_SYSCALL(close, 1, fd);
  589. return ret;
  590. }
  591. /* used by 'open' operation of tcp stream for connected socket */
  592. static int udp_connect (PAL_HANDLE * handle, char * uri, int options)
  593. {
  594. struct sockaddr buffer[2];
  595. struct sockaddr * bind_addr = buffer, * dest_addr = buffer + 1;
  596. size_t bind_addrlen, dest_addrlen;
  597. int ret, fd = -1;
  598. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  599. &dest_addr, &dest_addrlen)) < 0)
  600. return ret;
  601. #if ALLOW_BIND_ANY == 0
  602. /* the socket need to have a binding address, a null address or an
  603. any address is not allowed */
  604. if (bind_addr && check_any_addr(bind_addr))
  605. return -PAL_ERROR_INVAL;
  606. #endif
  607. fd = INLINE_SYSCALL(socket, 3, dest_addr ? dest_addr->sa_family : AF_INET,
  608. SOCK_DGRAM|SOCK_CLOEXEC|options, 0);
  609. if (IS_ERR(fd))
  610. return -PAL_ERROR_DENIED;
  611. if (dest_addr && dest_addr->sa_family == AF_INET6) {
  612. int ipv6only = 1;
  613. INLINE_SYSCALL(setsockopt, 5, fd, SOL_IPV6, IPV6_V6ONLY, &ipv6only,
  614. sizeof(int));
  615. }
  616. if (bind_addr) {
  617. ret = INLINE_SYSCALL(bind, 3, fd, bind_addr, bind_addrlen);
  618. if (IS_ERR(ret)) {
  619. switch (ERRNO(ret)) {
  620. case EADDRINUSE:
  621. ret = -PAL_ERROR_STREAMEXIST;
  622. goto failed;
  623. case EADDRNOTAVAIL:
  624. ret = -PAL_ERROR_ADDRNOTEXIST;
  625. goto failed;
  626. default:
  627. ret = unix_to_pal_error(ERRNO(ret));
  628. goto failed;
  629. }
  630. }
  631. }
  632. *handle = socket_create_handle(dest_addr ? pal_type_udp : pal_type_udpsrv,
  633. fd, options,
  634. bind_addr, bind_addrlen,
  635. dest_addr, dest_addrlen);
  636. if (!(*handle)) {
  637. ret = -ENOMEM;
  638. goto failed;
  639. }
  640. return 0;
  641. failed:
  642. INLINE_SYSCALL(close, 1, fd);
  643. return ret;
  644. }
  645. static int udp_open (PAL_HANDLE *hdl, const char * type, const char * uri,
  646. int access, int share, int create, int options)
  647. {
  648. if (!WITHIN_MASK(access, PAL_ACCESS_MASK) ||
  649. !WITHIN_MASK(share, PAL_SHARE_MASK) ||
  650. !WITHIN_MASK(create, PAL_CREATE_MASK) ||
  651. !WITHIN_MASK(options, PAL_OPTION_MASK))
  652. return -PAL_ERROR_INVAL;
  653. char buf[PAL_SOCKADDR_SIZE];
  654. size_t len = strlen(uri);
  655. if (len >= PAL_SOCKADDR_SIZE)
  656. return -PAL_ERROR_TOOLONG;
  657. memcpy(buf, uri, len + 1);
  658. if (strcmp_static(type, "udp.srv"))
  659. return udp_bind(hdl, buf, options);
  660. if (strcmp_static(type, "udp"))
  661. return udp_connect(hdl, buf, options);
  662. return -PAL_ERROR_NOTSUPPORT;
  663. }
  664. static int64_t udp_receive (PAL_HANDLE handle, uint64_t offset, size_t len,
  665. void * buf)
  666. {
  667. if (offset)
  668. return -PAL_ERROR_INVAL;
  669. if (!IS_HANDLE_TYPE(handle, udp))
  670. return -PAL_ERROR_NOTCONNECTION;
  671. if (handle->sock.fd == PAL_IDX_POISON)
  672. return -PAL_ERROR_BADHANDLE;
  673. struct msghdr hdr;
  674. struct iovec iov;
  675. iov.iov_base = buf;
  676. iov.iov_len = len;
  677. hdr.msg_name = NULL;
  678. hdr.msg_namelen = 0;
  679. hdr.msg_iov = &iov;
  680. hdr.msg_iovlen = 1;
  681. hdr.msg_control = NULL;
  682. hdr.msg_controllen = 0;
  683. hdr.msg_flags = 0;
  684. int64_t bytes = INLINE_SYSCALL(recvmsg, 3, handle->sock.fd, &hdr, 0);
  685. if (IS_ERR(bytes))
  686. return unix_to_pal_error(ERRNO(bytes));
  687. return bytes;
  688. }
  689. static int64_t udp_receivebyaddr (PAL_HANDLE handle, uint64_t offset, size_t len,
  690. void * buf, char * addr, size_t addrlen)
  691. {
  692. if (offset)
  693. return -PAL_ERROR_INVAL;
  694. if (!IS_HANDLE_TYPE(handle, udpsrv))
  695. return -PAL_ERROR_NOTCONNECTION;
  696. if (handle->sock.fd == PAL_IDX_POISON)
  697. return -PAL_ERROR_BADHANDLE;
  698. struct sockaddr conn_addr;
  699. socklen_t conn_addrlen = sizeof(struct sockaddr);
  700. struct msghdr hdr;
  701. struct iovec iov;
  702. iov.iov_base = buf;
  703. iov.iov_len = len;
  704. hdr.msg_name = &conn_addr;
  705. hdr.msg_namelen = conn_addrlen;
  706. hdr.msg_iov = &iov;
  707. hdr.msg_iovlen = 1;
  708. hdr.msg_control = NULL;
  709. hdr.msg_controllen = 0;
  710. hdr.msg_flags = 0;
  711. int64_t bytes = INLINE_SYSCALL(recvmsg, 3, handle->sock.fd, &hdr, 0);
  712. if (IS_ERR(bytes))
  713. return unix_to_pal_error(ERRNO(bytes));
  714. char * addr_uri = strcpy_static(addr, "udp:", addrlen);
  715. if (!addr_uri)
  716. return -PAL_ERROR_OVERFLOW;
  717. int ret = inet_create_uri(addr_uri, addr + addrlen - addr_uri, &conn_addr,
  718. hdr.msg_namelen);
  719. if (ret < 0)
  720. return ret;
  721. return bytes;
  722. }
  723. static int64_t udp_send (PAL_HANDLE handle, uint64_t offset, size_t len,
  724. const void * buf)
  725. {
  726. if (offset)
  727. return -PAL_ERROR_INVAL;
  728. if (!IS_HANDLE_TYPE(handle, udp))
  729. return -PAL_ERROR_NOTCONNECTION;
  730. if (handle->sock.fd == PAL_IDX_POISON)
  731. return -PAL_ERROR_BADHANDLE;
  732. struct msghdr hdr;
  733. struct iovec iov;
  734. iov.iov_base = (void *) buf;
  735. iov.iov_len = len;
  736. hdr.msg_name = (void *) handle->sock.conn;
  737. hdr.msg_namelen = addr_size((struct sockaddr *) handle->sock.conn);
  738. hdr.msg_iov = &iov;
  739. hdr.msg_iovlen = 1;
  740. hdr.msg_control = NULL;
  741. hdr.msg_controllen = 0;
  742. hdr.msg_flags = 0;
  743. int64_t bytes = INLINE_SYSCALL(sendmsg, 3, handle->sock.fd, &hdr, MSG_NOSIGNAL);
  744. if (!IS_ERR(bytes) && (size_t)bytes == len)
  745. HANDLE_HDR(handle)->flags |= WRITABLE(0);
  746. else
  747. HANDLE_HDR(handle)->flags &= ~WRITABLE(0);
  748. if (IS_ERR(bytes))
  749. bytes = unix_to_pal_error(ERRNO(bytes));
  750. return bytes;
  751. }
  752. static int64_t udp_sendbyaddr (PAL_HANDLE handle, uint64_t offset, size_t len,
  753. const void * buf, const char * addr, size_t addrlen)
  754. {
  755. if (offset)
  756. return -PAL_ERROR_INVAL;
  757. if (!IS_HANDLE_TYPE(handle, udpsrv))
  758. return -PAL_ERROR_NOTCONNECTION;
  759. if (handle->sock.fd == PAL_IDX_POISON)
  760. return -PAL_ERROR_BADHANDLE;
  761. if (!strpartcmp_static(addr, "udp:"))
  762. return -PAL_ERROR_INVAL;
  763. addr += static_strlen("udp:");
  764. addrlen -= static_strlen("udp:");
  765. char * addrbuf = __alloca(addrlen);
  766. memcpy(addrbuf, addr, addrlen);
  767. struct sockaddr conn_addr;
  768. size_t conn_addrlen;
  769. int ret = inet_parse_uri(&addrbuf, &conn_addr, &conn_addrlen);
  770. if (ret < 0)
  771. return ret;
  772. struct msghdr hdr;
  773. struct iovec iov;
  774. iov.iov_base = (void *) buf;
  775. iov.iov_len = len;
  776. hdr.msg_name = &conn_addr;
  777. hdr.msg_namelen = conn_addrlen;
  778. hdr.msg_iov = &iov;
  779. hdr.msg_iovlen = 1;
  780. hdr.msg_control = NULL;
  781. hdr.msg_controllen = 0;
  782. hdr.msg_flags = 0;
  783. int64_t bytes = INLINE_SYSCALL(sendmsg, 3, handle->sock.fd, &hdr, MSG_NOSIGNAL);
  784. if (!IS_ERR(bytes) && (size_t)bytes == len)
  785. HANDLE_HDR(handle)->flags |= WRITABLE(0);
  786. else
  787. HANDLE_HDR(handle)->flags &= ~WRITABLE(0);
  788. if (IS_ERR(bytes))
  789. bytes = unix_to_pal_error(ERRNO(bytes));
  790. return bytes;
  791. }
  792. static int socket_delete (PAL_HANDLE handle, int access)
  793. {
  794. if (handle->sock.fd == PAL_IDX_POISON)
  795. return 0;
  796. if (!IS_HANDLE_TYPE(handle, tcp) && access)
  797. return -PAL_ERROR_INVAL;
  798. if (IS_HANDLE_TYPE(handle, tcp) || IS_HANDLE_TYPE(handle, tcpsrv)) {
  799. int shutdown;
  800. switch (access) {
  801. case 0:
  802. shutdown = SHUT_RDWR;
  803. break;
  804. case PAL_DELETE_RD:
  805. shutdown = SHUT_RD;
  806. break;
  807. case PAL_DELETE_WR:
  808. shutdown = SHUT_WR;
  809. break;
  810. default:
  811. return -PAL_ERROR_INVAL;
  812. }
  813. INLINE_SYSCALL(shutdown, 2, handle->sock.fd, shutdown);
  814. }
  815. return 0;
  816. }
  817. struct __kernel_linger {
  818. int l_onoff;
  819. int l_linger;
  820. };
  821. static int socket_close (PAL_HANDLE handle)
  822. {
  823. if (handle->sock.fd != PAL_IDX_POISON) {
  824. struct __kernel_linger l;
  825. l.l_onoff = 1;
  826. l.l_linger = 0;
  827. INLINE_SYSCALL(setsockopt, 5, handle->sock.fd, SOL_SOCKET, SO_LINGER,
  828. &l, sizeof(struct __kernel_linger));
  829. INLINE_SYSCALL(close, 1, handle->sock.fd);
  830. handle->sock.fd = PAL_IDX_POISON;
  831. }
  832. if (handle->sock.bind)
  833. handle->sock.bind = (PAL_PTR) NULL;
  834. if (handle->sock.conn)
  835. handle->sock.conn = (PAL_PTR) NULL;
  836. return 0;
  837. }
  838. #ifndef FIONREAD
  839. # define FIONREAD 0x541B
  840. #endif
  841. static int socket_attrquerybyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  842. {
  843. if (handle->sock.fd == PAL_IDX_POISON)
  844. return -PAL_ERROR_BADHANDLE;
  845. attr->handle_type = HANDLE_HDR(handle)->type;
  846. attr->disconnected = HANDLE_HDR(handle)->flags & ERROR(0);
  847. attr->nonblocking = handle->sock.nonblocking;
  848. attr->writable = HANDLE_HDR(handle)->flags & WRITABLE(0);
  849. attr->pending_size = 0; /* fill in later */
  850. attr->socket.linger = handle->sock.linger;
  851. attr->socket.receivebuf = handle->sock.receivebuf;
  852. attr->socket.sendbuf = handle->sock.sendbuf;
  853. attr->socket.receivetimeout = handle->sock.receivetimeout;
  854. attr->socket.sendtimeout = handle->sock.sendtimeout;
  855. attr->socket.tcp_cork = handle->sock.tcp_cork;
  856. attr->socket.tcp_keepalive = handle->sock.tcp_keepalive;
  857. attr->socket.tcp_nodelay = handle->sock.tcp_nodelay;
  858. int fd = handle->sock.fd, ret, val;
  859. if (!IS_HANDLE_TYPE(handle, tcpsrv)) {
  860. /* try use ioctl FIONEAD to get the size of socket */
  861. ret = INLINE_SYSCALL(ioctl, 3, fd, FIONREAD, &val);
  862. if (IS_ERR(ret))
  863. return unix_to_pal_error(ERRNO(ret));
  864. attr->pending_size = val;
  865. }
  866. struct pollfd pfd = { .fd = fd, .events = POLLIN, .revents = 0 };
  867. struct timespec tp = { 0, 0 };
  868. ret = INLINE_SYSCALL(ppoll, 5, &pfd, 1, &tp, NULL, 0);
  869. attr->readable = (ret == 1 && pfd.revents == POLLIN);
  870. return 0;
  871. }
  872. static int socket_attrsetbyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  873. {
  874. if (handle->sock.fd == PAL_IDX_POISON)
  875. return -PAL_ERROR_BADHANDLE;
  876. int fd = handle->sock.fd, ret, val;
  877. if (attr->nonblocking != handle->sock.nonblocking) {
  878. ret = INLINE_SYSCALL(fcntl, 3, fd, F_SETFL,
  879. attr->nonblocking ? O_NONBLOCK : 0);
  880. if (IS_ERR(ret))
  881. return unix_to_pal_error(ERRNO(ret));
  882. handle->sock.nonblocking = attr->nonblocking;
  883. }
  884. if (IS_HANDLE_TYPE(handle, tcpsrv)) {
  885. if (attr->socket.linger != handle->sock.linger) {
  886. struct __kernel_linger l;
  887. l.l_onoff = attr->socket.linger ? 1 : 0;
  888. l.l_linger = attr->socket.linger;
  889. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_LINGER,
  890. &l, sizeof(struct __kernel_linger));
  891. if (IS_ERR(ret))
  892. return unix_to_pal_error(ERRNO(ret));
  893. handle->sock.linger = attr->socket.linger;
  894. }
  895. if (attr->socket.receivebuf != handle->sock.receivebuf) {
  896. int val = attr->socket.receivebuf;
  897. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_RCVBUF,
  898. &val, sizeof(int));
  899. if (IS_ERR(ret))
  900. return unix_to_pal_error(ERRNO(ret));
  901. handle->sock.receivebuf = attr->socket.receivebuf;
  902. }
  903. if (attr->socket.sendbuf != handle->sock.sendbuf) {
  904. int val = attr->socket.sendbuf;
  905. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_SNDBUF,
  906. &val, sizeof(int));
  907. if (IS_ERR(ret))
  908. return unix_to_pal_error(ERRNO(ret));
  909. handle->sock.sendbuf = attr->socket.sendbuf;
  910. }
  911. if (attr->socket.receivetimeout != handle->sock.receivetimeout) {
  912. int val = attr->socket.receivetimeout;
  913. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_RCVTIMEO,
  914. &val, sizeof(int));
  915. if (IS_ERR(ret))
  916. return unix_to_pal_error(ERRNO(ret));
  917. handle->sock.receivetimeout = attr->socket.receivetimeout;
  918. }
  919. if (attr->socket.sendtimeout != handle->sock.sendtimeout) {
  920. int val = attr->socket.sendtimeout;
  921. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_SNDTIMEO,
  922. &val, sizeof(int));
  923. if (IS_ERR(ret))
  924. return unix_to_pal_error(ERRNO(ret));
  925. handle->sock.sendtimeout = attr->socket.sendtimeout;
  926. }
  927. }
  928. if (IS_HANDLE_TYPE(handle, tcp) || IS_HANDLE_TYPE(handle, tcpsrv)) {
  929. if (attr->socket.tcp_cork != handle->sock.tcp_cork) {
  930. val = attr->socket.tcp_cork ? 1 : 0;
  931. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_TCP, TCP_CORK,
  932. &val, sizeof(int));
  933. if (IS_ERR(ret))
  934. return unix_to_pal_error(ERRNO(ret));
  935. handle->sock.tcp_cork = attr->socket.tcp_cork;
  936. }
  937. if (attr->socket.tcp_keepalive != handle->sock.tcp_keepalive) {
  938. val = attr->socket.tcp_keepalive ? 1 : 0;
  939. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_KEEPALIVE,
  940. &val, sizeof(int));
  941. if (IS_ERR(ret))
  942. return unix_to_pal_error(ERRNO(ret));
  943. handle->sock.tcp_keepalive = attr->socket.tcp_keepalive;
  944. }
  945. if (attr->socket.tcp_nodelay != handle->sock.tcp_nodelay) {
  946. val = attr->socket.tcp_nodelay ? 1 : 0;
  947. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_TCP, TCP_NODELAY,
  948. &val, sizeof(int));
  949. if (IS_ERR(ret))
  950. return unix_to_pal_error(ERRNO(ret));
  951. handle->sock.tcp_nodelay = attr->socket.tcp_nodelay;
  952. }
  953. }
  954. return 0;
  955. }
  956. static int socket_getname (PAL_HANDLE handle, char * buffer, size_t count)
  957. {
  958. size_t old_count = count;
  959. int ret;
  960. const char * prefix = NULL;
  961. size_t prefix_len = 0;
  962. struct sockaddr * bind_addr = NULL, * dest_addr = NULL;
  963. switch (PAL_GET_TYPE(handle)) {
  964. case pal_type_tcpsrv:
  965. prefix_len = static_strlen("tcp.srv");
  966. prefix = "tcp.srv";
  967. bind_addr = (struct sockaddr *) handle->sock.bind;
  968. break;
  969. case pal_type_tcp:
  970. prefix_len = static_strlen("tcp");
  971. prefix = "tcp";
  972. bind_addr = (struct sockaddr *) handle->sock.bind;
  973. dest_addr = (struct sockaddr *) handle->sock.conn;
  974. break;
  975. case pal_type_udpsrv:
  976. prefix_len = static_strlen("udp.srv");
  977. prefix = "udp.srv";
  978. bind_addr = (struct sockaddr *) handle->sock.bind;
  979. break;
  980. case pal_type_udp:
  981. prefix_len = static_strlen("udp");
  982. prefix = "udp";
  983. bind_addr = (struct sockaddr *) handle->sock.bind;
  984. dest_addr = (struct sockaddr *) handle->sock.conn;
  985. break;
  986. default:
  987. return -PAL_ERROR_INVAL;
  988. }
  989. if (prefix_len >= count)
  990. return -PAL_ERROR_OVERFLOW;
  991. memcpy(buffer, prefix, prefix_len + 1);
  992. buffer += prefix_len;
  993. count -= prefix_len;
  994. for (int i = 0 ; i < 2 ; i++) {
  995. struct sockaddr * addr = i ? dest_addr : bind_addr;
  996. if (addr) {
  997. if (count <= 1)
  998. return -PAL_ERROR_OVERFLOW;
  999. buffer[0] = ':';
  1000. buffer[1] = 0;
  1001. buffer++;
  1002. count--;
  1003. if ((ret = inet_create_uri(buffer, count, addr,
  1004. addr_size(addr))) < 0)
  1005. return ret;
  1006. buffer += ret;
  1007. count -= ret;
  1008. }
  1009. }
  1010. return old_count - count;
  1011. }
  1012. struct handle_ops tcp_ops = {
  1013. .getname = &socket_getname,
  1014. .open = &tcp_open,
  1015. .waitforclient = &tcp_accept,
  1016. .read = &tcp_read,
  1017. .write = &tcp_write,
  1018. .delete = &socket_delete,
  1019. .close = &socket_close,
  1020. .attrquerybyhdl = &socket_attrquerybyhdl,
  1021. .attrsetbyhdl = &socket_attrsetbyhdl,
  1022. };
  1023. struct handle_ops udp_ops = {
  1024. .getname = &socket_getname,
  1025. .open = &udp_open,
  1026. .read = &udp_receive,
  1027. .write = &udp_send,
  1028. .delete = &socket_delete,
  1029. .close = &socket_close,
  1030. .attrquerybyhdl = &socket_attrquerybyhdl,
  1031. .attrsetbyhdl = &socket_attrsetbyhdl,
  1032. };
  1033. struct handle_ops udpsrv_ops = {
  1034. .getname = &socket_getname,
  1035. .open = &udp_open,
  1036. .readbyaddr = &udp_receivebyaddr,
  1037. .writebyaddr = &udp_sendbyaddr,
  1038. .delete = &socket_delete,
  1039. .close = &socket_close,
  1040. .attrquerybyhdl = &socket_attrquerybyhdl,
  1041. .attrsetbyhdl = &socket_attrsetbyhdl,
  1042. };
  1043. PAL_HANDLE _DkBroadcastStreamOpen (void)
  1044. {
  1045. if (!pal_sec.mcast_port) {
  1046. unsigned short mcast_port;
  1047. _DkFastRandomBitsRead(&mcast_port, sizeof(unsigned short));
  1048. pal_sec.mcast_port = mcast_port > 1024 ? mcast_port : mcast_port + 1024;
  1049. }
  1050. struct sockaddr_in addr;
  1051. int ret = 0;
  1052. addr.sin_family = AF_INET;
  1053. addr.sin_addr.s_addr = INADDR_ANY;
  1054. addr.sin_port = __htons(pal_sec.mcast_port);
  1055. /* set up server (sender) side */
  1056. int srv = INLINE_SYSCALL(socket, 3, AF_INET, SOCK_DGRAM|SOCK_CLOEXEC, 0);
  1057. if (IS_ERR(srv))
  1058. goto err;
  1059. ret = INLINE_SYSCALL(setsockopt, 5, srv, IPPROTO_IP, IP_MULTICAST_IF,
  1060. &addr.sin_addr.s_addr, sizeof(addr.sin_addr.s_addr));
  1061. if (IS_ERR(ret))
  1062. goto err_srv;
  1063. /* set up client (receiver) side */
  1064. int cli = INLINE_SYSCALL(socket, 3, AF_INET, SOCK_DGRAM|SOCK_CLOEXEC, 0);
  1065. if (IS_ERR(cli))
  1066. goto err_srv;
  1067. int reuse = 1;
  1068. INLINE_SYSCALL(setsockopt, 5, cli, SOL_SOCKET, SO_REUSEADDR,
  1069. &reuse, sizeof(reuse));
  1070. ret = INLINE_SYSCALL(bind, 3, cli, &addr, sizeof(addr));
  1071. if (IS_ERR(ret))
  1072. goto err_cli;
  1073. ret = INLINE_SYSCALL(setsockopt, 5, cli, IPPROTO_IP, IP_MULTICAST_IF,
  1074. &addr.sin_addr.s_addr, sizeof(addr.sin_addr.s_addr));
  1075. if (IS_ERR(ret))
  1076. goto err_cli;
  1077. inet_pton4(GRAPHENE_MCAST_GROUP, sizeof(GRAPHENE_MCAST_GROUP) - 1,
  1078. &addr.sin_addr.s_addr);
  1079. struct ip_mreq group;
  1080. group.imr_multiaddr.s_addr = addr.sin_addr.s_addr;
  1081. group.imr_interface.s_addr = INADDR_ANY;
  1082. ret = INLINE_SYSCALL(setsockopt, 5, cli, IPPROTO_IP, IP_ADD_MEMBERSHIP,
  1083. &group, sizeof(group));
  1084. if (IS_ERR(ret))
  1085. goto err_cli;
  1086. PAL_HANDLE hdl = malloc(HANDLE_SIZE(mcast));
  1087. SET_HANDLE_TYPE(hdl, mcast);
  1088. HANDLE_HDR(hdl)->flags |= WFD(1)|WRITABLE(1);
  1089. hdl->mcast.srv = srv;
  1090. hdl->mcast.cli = cli;
  1091. hdl->mcast.port = (PAL_NUM) pal_sec.mcast_port;
  1092. hdl->mcast.nonblocking = PAL_FALSE;
  1093. hdl->mcast.addr = (PAL_PTR) malloc_copy(&addr, sizeof(addr));
  1094. return hdl;
  1095. err_cli:
  1096. INLINE_SYSCALL(close, 1, cli);
  1097. err_srv:
  1098. INLINE_SYSCALL(close, 1, srv);
  1099. err:
  1100. return NULL;
  1101. }
  1102. static int64_t mcast_send (PAL_HANDLE handle, uint64_t offset, uint64_t size,
  1103. const void * buf)
  1104. {
  1105. if (offset)
  1106. return -PAL_ERROR_INVAL;
  1107. if (handle->mcast.srv == PAL_IDX_POISON)
  1108. return -PAL_ERROR_BADHANDLE;
  1109. struct msghdr hdr;
  1110. struct iovec iov;
  1111. iov.iov_base = (void *) buf;
  1112. iov.iov_len = size;
  1113. hdr.msg_name = (char *) handle->mcast.addr;
  1114. hdr.msg_namelen = sizeof(struct sockaddr_in);
  1115. hdr.msg_iov = &iov;
  1116. hdr.msg_iovlen = 1;
  1117. hdr.msg_control = NULL;
  1118. hdr.msg_controllen = 0;
  1119. hdr.msg_flags = 0;
  1120. int64_t bytes = INLINE_SYSCALL(sendmsg, 3, handle->mcast.srv, &hdr,
  1121. MSG_NOSIGNAL);
  1122. if (IS_ERR(bytes))
  1123. switch(ERRNO(bytes)) {
  1124. case ECONNRESET:
  1125. case EPIPE:
  1126. return -PAL_ERROR_CONNFAILED;
  1127. case EAGAIN:
  1128. HANDLE_HDR(handle)->flags &= ~WRITABLE(1);
  1129. /* fallthrough */
  1130. default:
  1131. return unix_to_pal_error(ERRNO(bytes));
  1132. }
  1133. assert(!IS_ERR(bytes));
  1134. if ((size_t)bytes == size)
  1135. HANDLE_HDR(handle)->flags |= WRITABLE(1);
  1136. else
  1137. HANDLE_HDR(handle)->flags &= ~WRITABLE(1);
  1138. return bytes;
  1139. }
  1140. static int64_t mcast_receive (PAL_HANDLE handle, uint64_t offset, size_t size,
  1141. void * buf)
  1142. {
  1143. if (offset)
  1144. return -PAL_ERROR_INVAL;
  1145. if (handle->mcast.cli == PAL_IDX_POISON)
  1146. return -PAL_ERROR_BADHANDLE;
  1147. struct msghdr hdr;
  1148. struct iovec iov;
  1149. iov.iov_base = buf;
  1150. iov.iov_len = size;
  1151. hdr.msg_name = NULL;
  1152. hdr.msg_namelen = 0;
  1153. hdr.msg_iov = &iov;
  1154. hdr.msg_iovlen = 1;
  1155. hdr.msg_control = NULL;
  1156. hdr.msg_controllen = 0;
  1157. hdr.msg_flags = 0;
  1158. int64_t bytes = INLINE_SYSCALL(recvmsg, 3, handle->mcast.cli, &hdr, 0);
  1159. if (IS_ERR(bytes))
  1160. return -PAL_ERROR_DENIED;
  1161. return bytes;
  1162. }
  1163. static int mcast_attrquerybyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  1164. {
  1165. int ret, val;
  1166. if (handle->mcast.cli == PAL_IDX_POISON)
  1167. return -PAL_ERROR_BADHANDLE;
  1168. ret = INLINE_SYSCALL(ioctl, 3, handle->mcast.cli, FIONREAD, &val);
  1169. if (IS_ERR(ret))
  1170. return unix_to_pal_error(ERRNO(ret));
  1171. attr->handle_type = pal_type_mcast;
  1172. attr->disconnected = HANDLE_HDR(handle)->flags & (ERROR(0)|ERROR(1));
  1173. attr->nonblocking = handle->mcast.nonblocking;
  1174. attr->readable = !!val;
  1175. attr->writable = HANDLE_HDR(handle)->flags & WRITABLE(1);
  1176. attr->runnable = PAL_FALSE;
  1177. attr->pending_size = val;
  1178. return 0;
  1179. }
  1180. static int mcast_attrsetbyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  1181. {
  1182. if (handle->mcast.cli == PAL_IDX_POISON)
  1183. return -PAL_ERROR_BADHANDLE;
  1184. int ret;
  1185. PAL_BOL * nonblocking = &handle->mcast.nonblocking;
  1186. if (attr->nonblocking != *nonblocking) {
  1187. ret = INLINE_SYSCALL(fcntl, 3, handle->mcast.cli, F_SETFL,
  1188. *nonblocking ? O_NONBLOCK : 0);
  1189. if (IS_ERR(ret))
  1190. return unix_to_pal_error(ERRNO(ret));
  1191. *nonblocking = attr->nonblocking;
  1192. }
  1193. return 0;
  1194. }
  1195. struct handle_ops mcast_ops = {
  1196. .write = &mcast_send,
  1197. .read = &mcast_receive,
  1198. .attrquerybyhdl = &mcast_attrquerybyhdl,
  1199. .attrsetbyhdl = &mcast_attrsetbyhdl,
  1200. };