db_sockets.c 42 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451
  1. /* -*- mode:c; c-file-style:"k&r"; c-basic-offset: 4; tab-width:4; indent-tabs-mode:nil; mode:auto-fill; fill-column:78; -*- */
  2. /* vim: set ts=4 sw=4 et tw=78 fo=cqt wm=0: */
  3. /* Copyright (C) 2014 Stony Brook University
  4. This file is part of Graphene Library OS.
  5. Graphene Library OS is free software: you can redistribute it and/or
  6. modify it under the terms of the GNU Lesser General Public License
  7. as published by the Free Software Foundation, either version 3 of the
  8. License, or (at your option) any later version.
  9. Graphene Library OS is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU Lesser General Public License for more details.
  13. You should have received a copy of the GNU Lesser General Public License
  14. along with this program. If not, see <http://www.gnu.org/licenses/>. */
  /*
   * db_sockets.c
   *
   * This file contains the operations for streams with URIs that start with
   * "tcp:", "tcp.srv:", "udp:", "udp.srv:".
   */
  21. #include "pal_defs.h"
  22. #include "pal_linux_defs.h"
  23. #include "pal.h"
  24. #include "pal_internal.h"
  25. #include "pal_linux.h"
  26. #include "pal_debug.h"
  27. #include "pal_security.h"
  28. #include "pal_error.h"
  29. #include "api.h"
  30. #include "graphene.h"
  31. #include <linux/types.h>
  32. #include <linux/poll.h>
  33. typedef __kernel_pid_t pid_t;
  34. #include <asm/fcntl.h>
  35. #include <sys/socket.h>
  36. #include <linux/in.h>
  37. #include <linux/in6.h>
  38. #include <netinet/tcp.h>
  39. #include <asm/errno.h>
  40. #ifndef SOL_TCP
  41. # define SOL_TCP 6
  42. #endif
  43. #ifndef TCP_NODELAY
  44. # define TCP_NODELAY 1
  45. #endif
  46. #ifndef TCP_CORK
  47. # define TCP_CORK 3
  48. #endif
  49. #ifndef SOL_IPV6
  50. # define SOL_IPV6 41
  51. #endif
  /* 96 bytes is the minimum size of a buffer that can store an IPv4/IPv6
     address */
  54. #define PAL_SOCKADDR_SIZE 96
  /* Return the size, in bytes, of the concrete address structure selected by
     addr->sa_family: sizeof(struct sockaddr_in) for AF_INET,
     sizeof(struct sockaddr_in6) for AF_INET6, and 0 for any other family. */
  static inline int addr_size (struct sockaddr * addr)
  {
      if (addr->sa_family == AF_INET)
          return sizeof(struct sockaddr_in);

      if (addr->sa_family == AF_INET6)
          return sizeof(struct sockaddr_in6);

      return 0;
  }
  66. /* parsing the string of uri, and fill in the socket address structure.
  67. the latest pointer of uri, length of socket address are returned. */
  68. static int inet_parse_uri (char ** uri, struct sockaddr * addr, int * addrlen)
  69. {
  70. char * tmp = *uri, * end;
  71. char * addr_str = NULL, * port_str;
  72. int af;
  73. void * addr_buf;
  74. int addr_len;
  75. __be16 * port_buf;
  76. int slen;
  77. if (tmp[0] == '[') {
  78. /* for IPv6, the address will be in the form of
  79. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  80. struct sockaddr_in6 * addr_in6 = (struct sockaddr_in6 *) addr;
  81. slen = sizeof(struct sockaddr_in6);
  82. memset(addr, 0, slen);
  83. end = strchr(tmp + 1, ']');
  84. if (!end || *(end + 1) != ':')
  85. goto inval;
  86. addr_str = tmp + 1;
  87. addr_len = end - tmp - 1;
  88. port_str = end + 2;
  89. for (end = port_str ; *end >= '0' && *end <= '9' ; end++);
  90. addr_in6->sin6_family = af = AF_INET6;
  91. addr_buf = &addr_in6->sin6_addr.s6_addr;
  92. port_buf = &addr_in6->sin6_port;
  93. } else {
  94. /* for IP, the address will be in the form of "x.x.x.x:port". */
  95. struct sockaddr_in * addr_in = (struct sockaddr_in *) addr;
  96. slen = sizeof(struct sockaddr_in);
  97. memset(addr, 0, slen);
  98. end = strchr(tmp, ':');
  99. if (!end)
  100. goto inval;
  101. addr_str = tmp;
  102. addr_len = end - tmp;
  103. port_str = end + 1;
  104. for (end = port_str ; *end >= '0' && *end <= '9' ; end++);
  105. addr_in->sin_family = af = AF_INET;
  106. addr_buf = &addr_in->sin_addr.s_addr;
  107. port_buf = &addr_in->sin_port;
  108. }
  109. if (af == AF_INET) {
  110. if (!inet_pton4(addr_str, addr_len, addr_buf))
  111. goto inval;
  112. } else {
  113. if (!inet_pton6(addr_str, addr_len, addr_buf))
  114. goto inval;
  115. }
  116. *port_buf = __htons(atoi(port_str));
  117. *uri = *end ? end + 1 : NULL;
  118. if (addrlen)
  119. *addrlen = slen;
  120. return 0;
  121. inval:
  122. return -PAL_ERROR_INVAL;
  123. }
  124. /* create the string of uri from the given socket address */
  125. static int inet_create_uri (char * uri, int count, struct sockaddr * addr,
  126. int addrlen)
  127. {
  128. int len = 0;
  129. if (addr->sa_family == AF_INET) {
  130. if (addrlen != sizeof(struct sockaddr_in))
  131. return PAL_ERROR_INVAL;
  132. struct sockaddr_in * addr_in = (struct sockaddr_in *) addr;
  133. char * addr = (char *) &addr_in->sin_addr.s_addr;
  134. /* for IP, the address will be in the form of "x.x.x.x:port". */
  135. len = snprintf(uri, count, "%u.%u.%u.%u:%u",
  136. (unsigned char) addr[0],
  137. (unsigned char) addr[1],
  138. (unsigned char) addr[2],
  139. (unsigned char) addr[3],
  140. __ntohs(addr_in->sin_port));
  141. } else if (addr->sa_family == AF_INET6) {
  142. if (addrlen != sizeof(struct sockaddr_in6))
  143. return PAL_ERROR_INVAL;
  144. struct sockaddr_in6 * addr_in6 = (struct sockaddr_in6 *) addr;
  145. unsigned short * addr = (unsigned short *) &addr_in6->sin6_addr.s6_addr;
  146. /* for IPv6, the address will be in the form of
  147. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  148. len = snprintf(uri, count, "[%04x:%04x:%04x:%04x:%04x:%04x:%04x:%04x]:%u",
  149. addr[0], addr[1], addr[2], addr[3],
  150. addr[4], addr[5], addr[6], addr[7],
  151. __ntohs(addr_in6->sin6_port));
  152. } else {
  153. return -PAL_ERROR_INVAL;
  154. }
  155. if (len >= count)
  156. return -PAL_ERROR_TOOLONG;
  157. return len;
  158. }
  /* Split the uri of a socket stream into a binding address and a connecting
     address.  The uri is either "bind-addr:bind-port:connect-addr:connect-port"
     or just "addr:port".

     Each of bind_addr / dest_addr may be NULL when the caller is not
     interested in that address; when both are NULL nothing is parsed.  A
     non-NULL argument points to a pointer to caller-provided storage which
     is filled in; the pointer itself is reset to NULL when the uri carries
     no such address.

     When both addresses are requested but only one can be parsed from the
     uri, that address is reported as the connecting address and the binding
     address is reported as absent.

     Returns 0 on success or the negative error of the first failed parse. */
  static int socket_parse_uri (char * uri,
                               struct sockaddr ** bind_addr, int * bind_addrlen,
                               struct sockaddr ** dest_addr, int * dest_addrlen)
  {
      if (!bind_addr && !dest_addr)
          return 0;

      /* empty uri: no address at all */
      if (!uri || !(*uri)) {
          if (bind_addr)
              *bind_addr = NULL;
          if (dest_addr)
              *dest_addr = NULL;
          return 0;
      }

      /* the first element goes to the binding address when it is requested,
         otherwise to the connecting address */
      struct sockaddr ** first = bind_addr ? bind_addr : dest_addr;
      int * first_len = bind_addr ? bind_addrlen : dest_addrlen;

      int ret = inet_parse_uri(&uri, *first, first_len);
      if (ret < 0)
          return ret;

      /* only one address requested: done */
      if (!bind_addr || !dest_addr)
          return 0;

      /* try to read a second element as the connecting address */
      if (uri && inet_parse_uri(&uri, *dest_addr, dest_addrlen) >= 0)
          return 0;

      /* there is only one address, so it is the connecting address */
      *dest_addr = *bind_addr;
      *dest_addrlen = *bind_addrlen;
      *bind_addr = NULL;
      *bind_addrlen = 0;
      return 0;
  }
  192. /* fill in the PAL handle based on the file descriptors and address given. */
  193. static inline
  194. PAL_HANDLE socket_create_handle (int type, int fd, int options,
  195. struct sockaddr * bind_addr, int bind_addrlen,
  196. struct sockaddr * dest_addr, int dest_addrlen)
  197. {
  198. PAL_HANDLE hdl = malloc(HANDLE_SIZE(sock) + (bind_addr ? bind_addrlen : 0) +
  199. (dest_addr ? dest_addrlen : 0));
  200. if (!hdl)
  201. return NULL;
  202. memset(hdl, 0, sizeof(struct pal_handle));
  203. init_handle_hdr(HANDLE_HDR(hdl), type);
  204. HANDLE_HDR(hdl)->flags |= RFD(0)|(type != pal_type_tcpsrv ? WFD(0) : 0);
  205. hdl->sock.fd = fd;
  206. void * addr = (void *) hdl + HANDLE_SIZE(sock);
  207. if (bind_addr) {
  208. hdl->sock.bind = (PAL_PTR) addr;
  209. memcpy(addr, bind_addr, bind_addrlen);
  210. addr += bind_addrlen;
  211. } else {
  212. hdl->sock.bind = (PAL_PTR) NULL;
  213. }
  214. if (dest_addr) {
  215. hdl->sock.conn = (PAL_PTR) addr;
  216. memcpy(addr, dest_addr, dest_addrlen);
  217. addr += dest_addrlen;
  218. } else {
  219. hdl->sock.conn = (PAL_PTR) NULL;
  220. }
  221. hdl->sock.nonblocking = (options & PAL_OPTION_NONBLOCK) ?
  222. PAL_TRUE : PAL_FALSE;
  223. hdl->sock.linger = 0;
  224. if (type == pal_type_tcpsrv) {
  225. hdl->sock.receivebuf = 0;
  226. hdl->sock.sendbuf = 0;
  227. } else {
  228. int ret, val, len = sizeof(int);
  229. ret = INLINE_SYSCALL(getsockopt, 5, fd, SOL_SOCKET, SO_RCVBUF,
  230. &val, &len);
  231. hdl->sock.receivebuf = IS_ERR(ret) ? 0 : val;
  232. ret = INLINE_SYSCALL(getsockopt, 5, fd, SOL_SOCKET, SO_SNDBUF,
  233. &val, &len);
  234. hdl->sock.sendbuf = IS_ERR(ret) ? 0 : val;
  235. }
  236. hdl->sock.receivetimeout = 0;
  237. hdl->sock.sendtimeout = 0;
  238. hdl->sock.tcp_cork = PAL_FALSE;
  239. hdl->sock.tcp_keepalive = PAL_FALSE;
  240. hdl->sock.tcp_nodelay = PAL_FALSE;
  241. return hdl;
  242. }
  /* Return true when all 'size' bytes starting at 'mem' are zero (trivially
     true for size 0), false as soon as a non-zero byte is found.

     The buffer is scanned one byte at a time: it carries no alignment
     guarantee, and it may be shorter than a machine word, so wider loads or
     pointer arithmetic relative to the end of the buffer are avoided. */
  static bool check_zero (void * mem, size_t size)
  {
      const unsigned char * bytes = mem;
      size_t i;

      for (i = 0 ; i < size ; i++)
          if (bytes[i])
              return false;

      return true;
  }
  /* Tell whether an address is the "any" address: for AF_INET and AF_INET6
     this is true only when the port is 0 and every byte of the address is
     zero.  Other address families are never "any". */
  static bool check_any_addr (struct sockaddr * addr)
  {
      switch (addr->sa_family) {
          case AF_INET: {
              struct sockaddr_in * in4 = (struct sockaddr_in *) addr;

              if (in4->sin_port != 0)
                  return false;
              return check_zero(&in4->sin_addr, sizeof(in4->sin_addr));
          }

          case AF_INET6: {
              struct sockaddr_in6 * in6 = (struct sockaddr_in6 *) addr;

              if (in6->sin6_port != 0)
                  return false;
              return check_zero(&in6->sin6_addr, sizeof(in6->sin6_addr));
          }

          default:
              return false;
      }
  }
  285. /* listen on a tcp socket */
  286. static int tcp_listen (PAL_HANDLE * handle, char * uri, int options)
  287. {
  288. struct sockaddr buffer, * bind_addr = &buffer;
  289. int bind_addrlen;
  290. int ret, fd = -1;
  291. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  292. NULL, NULL)) < 0)
  293. return ret;
  294. assert(bind_addr);
  295. assert(bind_addrlen == addr_size(bind_addr));
  296. #if ALLOW_BIND_ANY == 0
  297. /* the socket need to have a binding address, a null address or an
  298. any address is not allowed */
  299. if (check_any_addr(bind_addr))
  300. return -PAL_ERROR_INVAL;
  301. #endif
  302. fd = INLINE_SYSCALL(socket, 3, bind_addr->sa_family,
  303. SOCK_STREAM|SOCK_CLOEXEC|options, 0);
  304. if (IS_ERR(fd))
  305. return -PAL_ERROR_DENIED;
  306. if (bind_addr->sa_family == AF_INET6) {
  307. int ipv6only = 1;
  308. INLINE_SYSCALL(setsockopt, 5, fd, SOL_IPV6, IPV6_V6ONLY, &ipv6only,
  309. sizeof(int));
  310. }
  311. /* must set the socket to be reuseable */
  312. int reuseaddr = 1;
  313. INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_REUSEADDR, &reuseaddr,
  314. sizeof(int));
  315. ret = INLINE_SYSCALL(bind, 3, fd, bind_addr, bind_addrlen);
  316. if (IS_ERR(ret)) {
  317. switch(ERRNO(ret)) {
  318. case EINVAL:
  319. ret = -PAL_ERROR_INVAL;
  320. goto failed;
  321. case EADDRINUSE:
  322. ret = -PAL_ERROR_STREAMEXIST;
  323. goto failed;
  324. default:
  325. ret = -PAL_ERROR_DENIED;
  326. goto failed;
  327. }
  328. }
  329. if (check_any_addr(bind_addr)) {
  330. /* call getsockname to get socket address */
  331. if ((ret = INLINE_SYSCALL(getsockname, 3, fd,
  332. bind_addr, &bind_addrlen)) < 0)
  333. goto failed;
  334. }
  335. ret = INLINE_SYSCALL(listen, 2, fd, DEFAULT_BACKLOG);
  336. if (IS_ERR(ret))
  337. return -PAL_ERROR_DENIED;
  338. *handle = socket_create_handle(pal_type_tcpsrv, fd, options,
  339. bind_addr, bind_addrlen, NULL, 0);
  340. if (!(*handle)) {
  341. ret = -PAL_ERROR_NOMEM;
  342. goto failed;
  343. }
  344. return 0;
  345. failed:
  346. INLINE_SYSCALL(close, 1, fd);
  347. return ret;
  348. }
  349. /* accept a tcp connection */
  350. static int tcp_accept (PAL_HANDLE handle, PAL_HANDLE * client)
  351. {
  352. if (!IS_HANDLE_TYPE(handle, tcpsrv) ||
  353. !handle->sock.bind || handle->sock.conn)
  354. return -PAL_ERROR_NOTSERVER;
  355. if (handle->sock.fd == PAL_IDX_POISON)
  356. return -PAL_ERROR_BADHANDLE;
  357. struct sockaddr * bind_addr = (struct sockaddr *) handle->sock.bind;
  358. int bind_addrlen = addr_size(bind_addr);
  359. struct sockaddr buffer;
  360. socklen_t addrlen = sizeof(struct sockaddr);
  361. int ret = 0;
  362. int newfd = INLINE_SYSCALL(accept4, 4, handle->sock.fd, &buffer,
  363. &addrlen, O_CLOEXEC);
  364. if (IS_ERR(newfd))
  365. switch(ERRNO(newfd)) {
  366. case EWOULDBLOCK:
  367. return -PAL_ERROR_TRYAGAIN;
  368. case ECONNABORTED:
  369. return -PAL_ERROR_STREAMNOTEXIST;
  370. default:
  371. return unix_to_pal_error(ERRNO(newfd));
  372. }
  373. struct sockaddr * dest_addr = &buffer;
  374. int dest_addrlen = addrlen;
  375. *client = socket_create_handle(pal_type_tcp, newfd, 0,
  376. bind_addr, bind_addrlen,
  377. dest_addr, dest_addrlen);
  378. if (!(*client)) {
  379. ret = -PAL_ERROR_NOMEM;
  380. goto failed;
  381. }
  382. return 0;
  383. failed:
  384. INLINE_SYSCALL(close, 1, newfd);
  385. return ret;
  386. }
  387. /* connect on a tcp socket */
  388. static int tcp_connect (PAL_HANDLE * handle, char * uri, int options)
  389. {
  390. struct sockaddr buffer[3];
  391. struct sockaddr * bind_addr = buffer, * dest_addr = buffer + 1;
  392. int bind_addrlen, dest_addrlen;
  393. int ret, fd = -1;
  394. /* accepting two kind of different uri:
  395. dest-ip:dest-port or bind-ip:bind-port:dest-ip:dest-port */
  396. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  397. &dest_addr, &dest_addrlen)) < 0)
  398. return ret;
  399. if (!dest_addr)
  400. return -PAL_ERROR_INVAL;
  401. if (bind_addr && bind_addr->sa_family != dest_addr->sa_family)
  402. return -PAL_ERROR_INVAL;
  403. fd = INLINE_SYSCALL(socket, 3, dest_addr->sa_family,
  404. SOCK_STREAM|SOCK_CLOEXEC|options, 0);
  405. if (IS_ERR(fd))
  406. return -PAL_ERROR_DENIED;
  407. if (bind_addr) {
  408. if (IS_ERR(ret)) {
  409. INLINE_SYSCALL(close, 1, fd);
  410. switch (ERRNO(ret)) {
  411. case EADDRINUSE:
  412. ret = -PAL_ERROR_STREAMEXIST;
  413. goto failed;
  414. case EADDRNOTAVAIL:
  415. ret = -PAL_ERROR_ADDRNOTEXIST;
  416. goto failed;
  417. default:
  418. ret = unix_to_pal_error(ERRNO(ret));
  419. goto failed;
  420. }
  421. }
  422. }
  423. if (dest_addr->sa_family == AF_INET6) {
  424. int ipv6only = 1;
  425. INLINE_SYSCALL(setsockopt, 5, fd, SOL_IPV6, IPV6_V6ONLY, &ipv6only,
  426. sizeof(int));
  427. }
  428. ret = INLINE_SYSCALL(connect, 3, fd, dest_addr, dest_addrlen);
  429. if (IS_ERR(ret) && ERRNO(ret) == EINPROGRESS) {
  430. struct pollfd pfd = { .fd = fd, .events = POLLOUT, .revents = 0 };
  431. ret = INLINE_SYSCALL(ppoll, 5, &pfd, 1, NULL, NULL, 0);
  432. }
  433. if (IS_ERR(ret)) {
  434. ret = unix_to_pal_error(ERRNO(ret));
  435. goto failed;
  436. }
  437. if (!bind_addr) {
  438. /* save some space to get socket address */
  439. bind_addr = buffer + 2;
  440. bind_addrlen = sizeof(struct sockaddr);
  441. /* call getsockname to get socket address */
  442. if ((ret = INLINE_SYSCALL(getsockname, 3, fd,
  443. bind_addr, &bind_addrlen)) < 0)
  444. bind_addr = NULL;
  445. }
  446. *handle = socket_create_handle(pal_type_tcp, fd, options,
  447. bind_addr, bind_addrlen,
  448. dest_addr, dest_addrlen);
  449. if (!(*handle)) {
  450. ret = -PAL_ERROR_NOMEM;
  451. goto failed;
  452. }
  453. return 0;
  454. failed:
  455. INLINE_SYSCALL(close, 1, fd);
  456. return ret;
  457. }
  458. /* 'open' operation of tcp stream */
  459. static int tcp_open (PAL_HANDLE *handle, const char * type, const char * uri,
  460. int access, int share, int create, int options)
  461. {
  462. int uri_len = strlen(uri) + 1;
  463. if (uri_len > PAL_SOCKADDR_SIZE)
  464. return -PAL_ERROR_TOOLONG;
  465. char uri_buf[PAL_SOCKADDR_SIZE];
  466. memcpy(uri_buf, uri, uri_len);
  467. if (strpartcmp_static(type, "tcp.srv:"))
  468. return tcp_listen(handle, uri_buf, options);
  469. if (strpartcmp_static(type, "tcp:"))
  470. return tcp_connect(handle, uri_buf, options);
  471. return -PAL_ERROR_NOTSUPPORT;
  472. }
  473. /* 'read' operation of tcp stream */
  474. static int64_t tcp_read (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  475. void * buf)
  476. {
  477. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  478. return -PAL_ERROR_NOTCONNECTION;
  479. if (handle->sock.fd == PAL_IDX_POISON)
  480. return -PAL_ERROR_ENDOFSTREAM;
  481. struct msghdr hdr;
  482. struct iovec iov;
  483. iov.iov_base = buf;
  484. iov.iov_len = len;
  485. hdr.msg_name = NULL;
  486. hdr.msg_namelen = 0;
  487. hdr.msg_iov = &iov;
  488. hdr.msg_iovlen = 1;
  489. hdr.msg_control = NULL;
  490. hdr.msg_controllen = 0;
  491. hdr.msg_flags = 0;
  492. int64_t bytes = INLINE_SYSCALL(recvmsg, 3, handle->sock.fd, &hdr, 0);
  493. if (IS_ERR(bytes))
  494. return unix_to_pal_error(ERRNO(bytes));
  495. if (!bytes)
  496. return -PAL_ERROR_ENDOFSTREAM;
  497. return bytes;
  498. }
  499. /* write' operation of tcp stream */
  500. static int64_t tcp_write (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  501. const void * buf)
  502. {
  503. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  504. return -PAL_ERROR_NOTCONNECTION;
  505. if (handle->sock.fd == PAL_IDX_POISON)
  506. return -PAL_ERROR_CONNFAILED;
  507. struct msghdr hdr;
  508. struct iovec iov;
  509. iov.iov_base = (void *) buf;
  510. iov.iov_len = len;
  511. hdr.msg_name = NULL;
  512. hdr.msg_namelen = 0;
  513. hdr.msg_iov = &iov;
  514. hdr.msg_iovlen = 1;
  515. hdr.msg_control = NULL;
  516. hdr.msg_controllen = 0;
  517. hdr.msg_flags = 0;
  518. int64_t bytes = INLINE_SYSCALL(sendmsg, 3, handle->sock.fd, &hdr, MSG_NOSIGNAL);
  519. if (IS_ERR(bytes))
  520. bytes = unix_to_pal_error(ERRNO(bytes));
  521. if (bytes == len)
  522. HANDLE_HDR(handle)->flags |= WRITEABLE(0);
  523. else
  524. HANDLE_HDR(handle)->flags &= ~WRITEABLE(0);
  525. return bytes;
  526. }
  527. /* used by 'open' operation of tcp stream for bound socket */
  528. static int udp_bind (PAL_HANDLE * handle, char * uri, int options)
  529. {
  530. struct sockaddr buffer, * bind_addr = &buffer;
  531. int bind_addrlen;
  532. int ret = 0, fd = -1;
  533. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  534. NULL, NULL)) < 0)
  535. return ret;
  536. assert(bind_addr);
  537. assert(bind_addrlen == addr_size(bind_addr));
  538. #if ALLOW_BIND_ANY == 0
  539. /* the socket need to have a binding address, a null address or an
  540. any address is not allowed */
  541. if (check_any_addr(bind_addr))
  542. return -PAL_ERROR_INVAL;
  543. #endif
  544. fd = INLINE_SYSCALL(socket, 3, bind_addr->sa_family,
  545. SOCK_DGRAM|SOCK_CLOEXEC|options, 0);
  546. if (IS_ERR(fd))
  547. return -PAL_ERROR_DENIED;
  548. if (bind_addr->sa_family == AF_INET6) {
  549. int ipv6only = 1;
  550. INLINE_SYSCALL(setsockopt, 5, fd, SOL_IPV6, IPV6_V6ONLY, &ipv6only,
  551. sizeof(int));
  552. }
  553. ret = INLINE_SYSCALL(bind, 3, fd, bind_addr, bind_addrlen);
  554. if (IS_ERR(ret)) {
  555. switch (ERRNO(ret)) {
  556. case EADDRINUSE:
  557. ret = -PAL_ERROR_STREAMEXIST;
  558. goto failed;
  559. case EADDRNOTAVAIL:
  560. ret = -PAL_ERROR_ADDRNOTEXIST;
  561. goto failed;
  562. default:
  563. ret = unix_to_pal_error(ERRNO(ret));
  564. goto failed;
  565. }
  566. }
  567. *handle = socket_create_handle(pal_type_udpsrv, fd, options,
  568. bind_addr, bind_addrlen, NULL, 0);
  569. if (!(*handle)) {
  570. ret = -ENOMEM;
  571. goto failed;
  572. }
  573. return 0;
  574. failed:
  575. INLINE_SYSCALL(close, 1, fd);
  576. return ret;
  577. }
  578. /* used by 'open' operation of tcp stream for connected socket */
  579. static int udp_connect (PAL_HANDLE * handle, char * uri, int options)
  580. {
  581. struct sockaddr buffer[2];
  582. struct sockaddr * bind_addr = buffer, * dest_addr = buffer + 1;
  583. int bind_addrlen, dest_addrlen;
  584. int ret, fd = -1;
  585. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  586. &dest_addr, &dest_addrlen)) < 0)
  587. return ret;
  588. #if ALLOW_BIND_ANY == 0
  589. /* the socket need to have a binding address, a null address or an
  590. any address is not allowed */
  591. if (bind_addr && check_any_addr(bind_addr))
  592. return -PAL_ERROR_INVAL;
  593. #endif
  594. fd = INLINE_SYSCALL(socket, 3, dest_addr ? dest_addr->sa_family : AF_INET,
  595. SOCK_DGRAM|SOCK_CLOEXEC|options, 0);
  596. if (IS_ERR(fd))
  597. return -PAL_ERROR_DENIED;
  598. if (dest_addr->sa_family == AF_INET6) {
  599. int ipv6only = 1;
  600. INLINE_SYSCALL(setsockopt, 5, fd, SOL_IPV6, IPV6_V6ONLY, &ipv6only,
  601. sizeof(int));
  602. }
  603. if (bind_addr) {
  604. ret = INLINE_SYSCALL(bind, 3, fd, bind_addr, bind_addrlen);
  605. if (IS_ERR(ret)) {
  606. switch (ERRNO(ret)) {
  607. case EADDRINUSE:
  608. ret = -PAL_ERROR_STREAMEXIST;
  609. goto failed;
  610. case EADDRNOTAVAIL:
  611. ret = -PAL_ERROR_ADDRNOTEXIST;
  612. goto failed;
  613. default:
  614. ret = unix_to_pal_error(ERRNO(ret));
  615. goto failed;
  616. }
  617. }
  618. }
  619. *handle = socket_create_handle(dest_addr ? pal_type_udp : pal_type_udpsrv,
  620. fd, options,
  621. bind_addr, bind_addrlen,
  622. dest_addr, dest_addrlen);
  623. if (!(*handle)) {
  624. ret = -ENOMEM;
  625. goto failed;
  626. }
  627. return 0;
  628. failed:
  629. INLINE_SYSCALL(close, 1, fd);
  630. return ret;
  631. }
  632. static int udp_open (PAL_HANDLE *hdl, const char * type, const char * uri,
  633. int access, int share, int create, int options)
  634. {
  635. char buf[PAL_SOCKADDR_SIZE];
  636. int len = strlen(uri);
  637. if (len >= PAL_SOCKADDR_SIZE)
  638. return -PAL_ERROR_TOOLONG;
  639. memcpy(buf, uri, len + 1);
  640. options &= PAL_OPTION_MASK;
  641. if (strpartcmp_static(type, "udp.srv:"))
  642. return udp_bind(hdl, buf, options);
  643. if (strpartcmp_static(type, "udp:"))
  644. return udp_connect(hdl, buf, options);
  645. return -PAL_ERROR_NOTSUPPORT;
  646. }
  647. static int64_t udp_receive (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  648. void * buf)
  649. {
  650. if (!IS_HANDLE_TYPE(handle, udp))
  651. return -PAL_ERROR_NOTCONNECTION;
  652. if (handle->sock.fd == PAL_IDX_POISON)
  653. return -PAL_ERROR_BADHANDLE;
  654. struct msghdr hdr;
  655. struct iovec iov;
  656. iov.iov_base = buf;
  657. iov.iov_len = len;
  658. hdr.msg_name = NULL;
  659. hdr.msg_namelen = 0;
  660. hdr.msg_iov = &iov;
  661. hdr.msg_iovlen = 1;
  662. hdr.msg_control = NULL;
  663. hdr.msg_controllen = 0;
  664. hdr.msg_flags = 0;
  665. int64_t bytes = INLINE_SYSCALL(recvmsg, 3, handle->sock.fd, &hdr, 0);
  666. if (IS_ERR(bytes))
  667. return unix_to_pal_error(ERRNO(bytes));
  668. return bytes;
  669. }
  670. static int64_t udp_receivebyaddr (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  671. void * buf, char * addr, int addrlen)
  672. {
  673. if (!IS_HANDLE_TYPE(handle, udpsrv))
  674. return -PAL_ERROR_NOTCONNECTION;
  675. if (handle->sock.fd == PAL_IDX_POISON)
  676. return -PAL_ERROR_BADHANDLE;
  677. struct sockaddr conn_addr;
  678. socklen_t conn_addrlen = sizeof(struct sockaddr);
  679. struct msghdr hdr;
  680. struct iovec iov;
  681. iov.iov_base = buf;
  682. iov.iov_len = len;
  683. hdr.msg_name = &conn_addr;
  684. hdr.msg_namelen = conn_addrlen;
  685. hdr.msg_iov = &iov;
  686. hdr.msg_iovlen = 1;
  687. hdr.msg_control = NULL;
  688. hdr.msg_controllen = 0;
  689. hdr.msg_flags = 0;
  690. int64_t bytes = INLINE_SYSCALL(recvmsg, 3, handle->sock.fd, &hdr, 0);
  691. if (IS_ERR(bytes))
  692. return unix_to_pal_error(ERRNO(bytes));
  693. char * addr_uri = strcpy_static(addr, "udp:", addrlen);
  694. if (!addr_uri)
  695. return -PAL_ERROR_OVERFLOW;
  696. int ret = inet_create_uri(addr_uri, addr + addrlen - addr_uri, &conn_addr,
  697. hdr.msg_namelen);
  698. if (ret < 0)
  699. return ret;
  700. return bytes;
  701. }
  702. static int64_t udp_send (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  703. const void * buf)
  704. {
  705. if (!IS_HANDLE_TYPE(handle, udp))
  706. return -PAL_ERROR_NOTCONNECTION;
  707. if (handle->sock.fd == PAL_IDX_POISON)
  708. return -PAL_ERROR_BADHANDLE;
  709. struct msghdr hdr;
  710. struct iovec iov;
  711. iov.iov_base = (void *) buf;
  712. iov.iov_len = len;
  713. hdr.msg_name = (void *) handle->sock.conn;
  714. hdr.msg_namelen = addr_size((struct sockaddr *) handle->sock.conn);
  715. hdr.msg_iov = &iov;
  716. hdr.msg_iovlen = 1;
  717. hdr.msg_control = NULL;
  718. hdr.msg_controllen = 0;
  719. hdr.msg_flags = 0;
  720. int64_t bytes = INLINE_SYSCALL(sendmsg, 3, handle->sock.fd, &hdr, MSG_NOSIGNAL);
  721. if (IS_ERR(bytes))
  722. bytes = unix_to_pal_error(ERRNO(bytes));
  723. if (bytes == len)
  724. HANDLE_HDR(handle)->flags |= WRITEABLE(0);
  725. else
  726. HANDLE_HDR(handle)->flags &= ~WRITEABLE(0);
  727. return bytes;
  728. }
  729. static int64_t udp_sendbyaddr (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  730. const void * buf, const char * addr, int addrlen)
  731. {
  732. if (!IS_HANDLE_TYPE(handle, udpsrv))
  733. return -PAL_ERROR_NOTCONNECTION;
  734. if (handle->sock.fd == PAL_IDX_POISON)
  735. return -PAL_ERROR_BADHANDLE;
  736. if (!strpartcmp_static(addr, "udp:"))
  737. return -PAL_ERROR_INVAL;
  738. addr += static_strlen("udp:");
  739. addrlen -= static_strlen("udp:");
  740. char * addrbuf = __alloca(addrlen);
  741. memcpy(addrbuf, addr, addrlen);
  742. struct sockaddr conn_addr;
  743. int conn_addrlen;
  744. int ret = inet_parse_uri(&addrbuf, &conn_addr, &conn_addrlen);
  745. if (ret < 0)
  746. return ret;
  747. struct msghdr hdr;
  748. struct iovec iov;
  749. iov.iov_base = (void *) buf;
  750. iov.iov_len = len;
  751. hdr.msg_name = &conn_addr;
  752. hdr.msg_namelen = conn_addrlen;
  753. hdr.msg_iov = &iov;
  754. hdr.msg_iovlen = 1;
  755. hdr.msg_control = NULL;
  756. hdr.msg_controllen = 0;
  757. hdr.msg_flags = 0;
  758. int64_t bytes = INLINE_SYSCALL(sendmsg, 3, handle->sock.fd, &hdr, MSG_NOSIGNAL);
  759. if (IS_ERR(bytes))
  760. bytes = unix_to_pal_error(ERRNO(bytes));
  761. if (bytes == len)
  762. HANDLE_HDR(handle)->flags |= WRITEABLE(0);
  763. else
  764. HANDLE_HDR(handle)->flags &= ~WRITEABLE(0);
  765. return bytes;
  766. }
  767. static int socket_delete (PAL_HANDLE handle, int access)
  768. {
  769. if (handle->sock.fd == PAL_IDX_POISON)
  770. return 0;
  771. if (!IS_HANDLE_TYPE(handle, tcp) && access)
  772. return -PAL_ERROR_INVAL;
  773. if (IS_HANDLE_TYPE(handle, tcp) || IS_HANDLE_TYPE(handle, tcpsrv)) {
  774. int shutdown;
  775. switch (access) {
  776. case 0:
  777. shutdown = SHUT_RDWR;
  778. break;
  779. case PAL_DELETE_RD:
  780. shutdown = SHUT_RD;
  781. break;
  782. case PAL_DELETE_WR:
  783. shutdown = SHUT_WR;
  784. break;
  785. default:
  786. return -PAL_ERROR_INVAL;
  787. }
  788. INLINE_SYSCALL(shutdown, 2, handle->sock.fd, shutdown);
  789. }
  790. return 0;
  791. }
  792. struct __kernel_linger {
  793. int l_onoff;
  794. int l_linger;
  795. };
  796. static int socket_close (PAL_HANDLE handle)
  797. {
  798. if (handle->sock.fd != PAL_IDX_POISON) {
  799. struct __kernel_linger l;
  800. l.l_onoff = 1;
  801. l.l_linger = 0;
  802. INLINE_SYSCALL(setsockopt, 5, handle->sock.fd, SOL_SOCKET, SO_LINGER,
  803. &l, sizeof(struct __kernel_linger));
  804. INLINE_SYSCALL(close, 1, handle->sock.fd);
  805. handle->sock.fd = PAL_IDX_POISON;
  806. }
  807. if (handle->sock.bind)
  808. handle->sock.bind = (PAL_PTR) NULL;
  809. if (handle->sock.conn)
  810. handle->sock.conn = (PAL_PTR) NULL;
  811. return 0;
  812. }
  813. #ifndef FIONREAD
  814. # define FIONREAD 0x541B
  815. #endif
  816. static int socket_attrquerybyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  817. {
  818. if (handle->sock.fd == PAL_IDX_POISON)
  819. return -PAL_ERROR_BADHANDLE;
  820. attr->handle_type = HANDLE_HDR(handle)->type;
  821. attr->disconnected = HANDLE_HDR(handle)->flags & ERROR(0);
  822. attr->nonblocking = handle->sock.nonblocking;
  823. attr->writeable = HANDLE_HDR(handle)->flags & WRITEABLE(0);
  824. attr->pending_size = 0; /* fill in later */
  825. attr->socket.linger = handle->sock.linger;
  826. attr->socket.receivebuf = handle->sock.receivebuf;
  827. attr->socket.sendbuf = handle->sock.sendbuf;
  828. attr->socket.receivetimeout = handle->sock.receivetimeout;
  829. attr->socket.sendtimeout = handle->sock.sendtimeout;
  830. attr->socket.tcp_cork = handle->sock.tcp_cork;
  831. attr->socket.tcp_keepalive = handle->sock.tcp_keepalive;
  832. attr->socket.tcp_nodelay = handle->sock.tcp_nodelay;
  833. int fd = handle->sock.fd, ret, val;
  834. if (!IS_HANDLE_TYPE(handle, tcpsrv)) {
  835. /* try use ioctl FIONEAD to get the size of socket */
  836. ret = INLINE_SYSCALL(ioctl, 3, fd, FIONREAD, &val);
  837. if (IS_ERR(ret))
  838. return unix_to_pal_error(ERRNO(ret));
  839. attr->pending_size = val;
  840. }
  841. struct pollfd pfd = { .fd = fd, .events = POLLIN, .revents = 0 };
  842. struct timespec tp = { 0, 0 };
  843. ret = INLINE_SYSCALL(ppoll, 5, &pfd, 1, &tp, NULL, 0);
  844. attr->readable = (ret == 1 && pfd.revents == POLLIN);
  845. return 0;
  846. }
  847. static int socket_attrsetbyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  848. {
  849. if (handle->sock.fd == PAL_IDX_POISON)
  850. return -PAL_ERROR_BADHANDLE;
  851. int fd = handle->sock.fd, ret, val;
  852. if (attr->nonblocking != handle->sock.nonblocking) {
  853. ret = INLINE_SYSCALL(fcntl, 3, fd, F_SETFL,
  854. attr->nonblocking ? O_NONBLOCK : 0);
  855. if (IS_ERR(ret))
  856. return unix_to_pal_error(ERRNO(ret));
  857. handle->sock.nonblocking = attr->nonblocking;
  858. }
  859. if (IS_HANDLE_TYPE(handle, tcpsrv)) {
  860. if (attr->socket.linger != handle->sock.linger) {
  861. struct __kernel_linger l;
  862. l.l_onoff = attr->socket.linger ? 1 : 0;
  863. l.l_linger = attr->socket.linger;
  864. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_LINGER,
  865. &l, sizeof(struct __kernel_linger));
  866. if (IS_ERR(ret))
  867. return unix_to_pal_error(ERRNO(ret));
  868. handle->sock.linger = attr->socket.linger;
  869. }
  870. if (attr->socket.receivebuf != handle->sock.receivebuf) {
  871. int val = attr->socket.receivebuf;
  872. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_RCVBUF,
  873. &val, sizeof(int));
  874. if (IS_ERR(ret))
  875. return unix_to_pal_error(ERRNO(ret));
  876. handle->sock.receivebuf = attr->socket.receivebuf;
  877. }
  878. if (attr->socket.sendbuf != handle->sock.sendbuf) {
  879. int val = attr->socket.sendbuf;
  880. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_SNDBUF,
  881. &val, sizeof(int));
  882. if (IS_ERR(ret))
  883. return unix_to_pal_error(ERRNO(ret));
  884. handle->sock.sendbuf = attr->socket.sendbuf;
  885. }
  886. if (attr->socket.receivetimeout != handle->sock.receivetimeout) {
  887. int val = attr->socket.receivetimeout;
  888. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_RCVTIMEO,
  889. &val, sizeof(int));
  890. if (IS_ERR(ret))
  891. return unix_to_pal_error(ERRNO(ret));
  892. handle->sock.receivetimeout = attr->socket.receivetimeout;
  893. }
  894. if (attr->socket.sendtimeout != handle->sock.sendtimeout) {
  895. int val = attr->socket.sendtimeout;
  896. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_SNDTIMEO,
  897. &val, sizeof(int));
  898. if (IS_ERR(ret))
  899. return unix_to_pal_error(ERRNO(ret));
  900. handle->sock.sendtimeout = attr->socket.sendtimeout;
  901. }
  902. }
  903. if (IS_HANDLE_TYPE(handle, tcp) || IS_HANDLE_TYPE(handle, tcpsrv)) {
  904. if (attr->socket.tcp_cork != handle->sock.tcp_cork) {
  905. val = attr->socket.tcp_cork ? 1 : 0;
  906. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_TCP, TCP_CORK,
  907. &val, sizeof(int));
  908. if (IS_ERR(ret))
  909. return unix_to_pal_error(ERRNO(ret));
  910. handle->sock.tcp_cork = attr->socket.tcp_cork;
  911. }
  912. if (attr->socket.tcp_keepalive != handle->sock.tcp_keepalive) {
  913. val = attr->socket.tcp_keepalive ? 1 : 0;
  914. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_SOCKET, SO_KEEPALIVE,
  915. &val, sizeof(int));
  916. if (IS_ERR(ret))
  917. return unix_to_pal_error(ERRNO(ret));
  918. handle->sock.tcp_keepalive = attr->socket.tcp_keepalive;
  919. }
  920. if (attr->socket.tcp_nodelay != handle->sock.tcp_nodelay) {
  921. val = attr->socket.tcp_nodelay ? 1 : 0;
  922. ret = INLINE_SYSCALL(setsockopt, 5, fd, SOL_TCP, TCP_NODELAY,
  923. &val, sizeof(int));
  924. if (IS_ERR(ret))
  925. return unix_to_pal_error(ERRNO(ret));
  926. handle->sock.tcp_nodelay = attr->socket.tcp_nodelay;
  927. }
  928. }
  929. return 0;
  930. }
  931. static int socket_getname (PAL_HANDLE handle, char * buffer, int count)
  932. {
  933. int old_count = count;
  934. int ret;
  935. const char * prefix = NULL;
  936. int prefix_len = 0;
  937. struct sockaddr * bind_addr = NULL, * dest_addr = NULL;
  938. switch (PAL_GET_TYPE(handle)) {
  939. case pal_type_tcpsrv:
  940. prefix_len = static_strlen("tcp.srv");
  941. prefix = "tcp.srv";
  942. bind_addr = (struct sockaddr *) handle->sock.bind;
  943. break;
  944. case pal_type_tcp:
  945. prefix_len = static_strlen("tcp");
  946. prefix = "tcp";
  947. bind_addr = (struct sockaddr *) handle->sock.bind;
  948. dest_addr = (struct sockaddr *) handle->sock.conn;
  949. break;
  950. case pal_type_udpsrv:
  951. prefix_len = static_strlen("udp.srv");
  952. prefix = "udp.srv";
  953. bind_addr = (struct sockaddr *) handle->sock.bind;
  954. break;
  955. case pal_type_udp:
  956. prefix_len = static_strlen("udp");
  957. prefix = "udp";
  958. bind_addr = (struct sockaddr *) handle->sock.bind;
  959. dest_addr = (struct sockaddr *) handle->sock.conn;
  960. break;
  961. default:
  962. return -PAL_ERROR_INVAL;
  963. }
  964. if (prefix_len >= count)
  965. return -PAL_ERROR_OVERFLOW;
  966. memcpy(buffer, prefix, prefix_len + 1);
  967. buffer += prefix_len;
  968. count -= prefix_len;
  969. for (int i = 0 ; i < 2 ; i++) {
  970. struct sockaddr * addr = i ? dest_addr : bind_addr;
  971. if (addr) {
  972. if (count <= 1)
  973. return -PAL_ERROR_OVERFLOW;
  974. buffer[0] = ':';
  975. buffer[1] = 0;
  976. buffer++;
  977. count--;
  978. if ((ret = inet_create_uri(buffer, count, addr,
  979. addr_size(addr))) < 0)
  980. return ret;
  981. buffer += ret;
  982. count -= ret;
  983. }
  984. }
  985. return old_count - count;
  986. }
  987. struct handle_ops tcp_ops = {
  988. .getname = &socket_getname,
  989. .open = &tcp_open,
  990. .waitforclient = &tcp_accept,
  991. .read = &tcp_read,
  992. .write = &tcp_write,
  993. .delete = &socket_delete,
  994. .close = &socket_close,
  995. .attrquerybyhdl = &socket_attrquerybyhdl,
  996. .attrsetbyhdl = &socket_attrsetbyhdl,
  997. };
  998. struct handle_ops udp_ops = {
  999. .getname = &socket_getname,
  1000. .open = &udp_open,
  1001. .read = &udp_receive,
  1002. .write = &udp_send,
  1003. .delete = &socket_delete,
  1004. .close = &socket_close,
  1005. .attrquerybyhdl = &socket_attrquerybyhdl,
  1006. .attrsetbyhdl = &socket_attrsetbyhdl,
  1007. };
  1008. struct handle_ops udpsrv_ops = {
  1009. .getname = &socket_getname,
  1010. .open = &udp_open,
  1011. .readbyaddr = &udp_receivebyaddr,
  1012. .writebyaddr = &udp_sendbyaddr,
  1013. .delete = &socket_delete,
  1014. .close = &socket_close,
  1015. .attrquerybyhdl = &socket_attrquerybyhdl,
  1016. .attrsetbyhdl = &socket_attrsetbyhdl,
  1017. };
  1018. PAL_HANDLE _DkBroadcastStreamOpen (void)
  1019. {
  1020. if (!pal_sec.mcast_port) {
  1021. unsigned short mcast_port;
  1022. _DkFastRandomBitsRead(&mcast_port, sizeof(unsigned short));
  1023. pal_sec.mcast_port = mcast_port > 1024 ? mcast_port : mcast_port + 1024;
  1024. }
  1025. struct sockaddr_in addr;
  1026. int ret = 0;
  1027. addr.sin_family = AF_INET;
  1028. addr.sin_addr.s_addr = INADDR_ANY;
  1029. addr.sin_port = __htons(pal_sec.mcast_port);
  1030. /* set up server (sender) side */
  1031. int srv = INLINE_SYSCALL(socket, 3, AF_INET, SOCK_DGRAM|SOCK_CLOEXEC, 0);
  1032. if (IS_ERR(srv))
  1033. goto err;
  1034. ret = INLINE_SYSCALL(setsockopt, 5, srv, IPPROTO_IP, IP_MULTICAST_IF,
  1035. &addr.sin_addr.s_addr, sizeof(addr.sin_addr.s_addr));
  1036. if (IS_ERR(ret))
  1037. goto err_srv;
  1038. /* set up client (receiver) side */
  1039. int cli = INLINE_SYSCALL(socket, 3, AF_INET, SOCK_DGRAM|SOCK_CLOEXEC, 0);
  1040. if (IS_ERR(cli))
  1041. goto err_srv;
  1042. int reuse = 1;
  1043. INLINE_SYSCALL(setsockopt, 5, cli, SOL_SOCKET, SO_REUSEADDR,
  1044. &reuse, sizeof(reuse));
  1045. ret = INLINE_SYSCALL(bind, 3, cli, &addr, sizeof(addr));
  1046. if (IS_ERR(ret))
  1047. goto err_cli;
  1048. ret = INLINE_SYSCALL(setsockopt, 5, cli, IPPROTO_IP, IP_MULTICAST_IF,
  1049. &addr.sin_addr.s_addr, sizeof(addr.sin_addr.s_addr));
  1050. if (IS_ERR(ret))
  1051. goto err_cli;
  1052. inet_pton4(GRAPHENE_MCAST_GROUP, sizeof(GRAPHENE_MCAST_GROUP) - 1,
  1053. &addr.sin_addr.s_addr);
  1054. struct ip_mreq group;
  1055. group.imr_multiaddr.s_addr = addr.sin_addr.s_addr;
  1056. group.imr_interface.s_addr = INADDR_ANY;
  1057. ret = INLINE_SYSCALL(setsockopt, 5, cli, IPPROTO_IP, IP_ADD_MEMBERSHIP,
  1058. &group, sizeof(group));
  1059. if (IS_ERR(ret))
  1060. goto err_cli;
  1061. PAL_HANDLE hdl = malloc(HANDLE_SIZE(mcast));
  1062. SET_HANDLE_TYPE(hdl, mcast);
  1063. HANDLE_HDR(hdl)->flags |= WFD(1)|WRITEABLE(1);
  1064. hdl->mcast.srv = srv;
  1065. hdl->mcast.cli = cli;
  1066. hdl->mcast.port = (PAL_NUM) pal_sec.mcast_port;
  1067. hdl->mcast.nonblocking = PAL_FALSE;
  1068. hdl->mcast.addr = (PAL_PTR) malloc_copy(&addr, sizeof(addr));
  1069. return hdl;
  1070. err_cli:
  1071. INLINE_SYSCALL(close, 1, cli);
  1072. err_srv:
  1073. INLINE_SYSCALL(close, 1, srv);
  1074. err:
  1075. return NULL;
  1076. }
  1077. static int64_t mcast_send (PAL_HANDLE handle, uint64_t offset, uint64_t size,
  1078. const void * buf)
  1079. {
  1080. if (handle->mcast.srv == PAL_IDX_POISON)
  1081. return -PAL_ERROR_BADHANDLE;
  1082. struct msghdr hdr;
  1083. struct iovec iov;
  1084. iov.iov_base = (void *) buf;
  1085. iov.iov_len = size;
  1086. hdr.msg_name = (char *) handle->mcast.addr;
  1087. hdr.msg_namelen = sizeof(struct sockaddr_in);
  1088. hdr.msg_iov = &iov;
  1089. hdr.msg_iovlen = 1;
  1090. hdr.msg_control = NULL;
  1091. hdr.msg_controllen = 0;
  1092. hdr.msg_flags = 0;
  1093. int64_t bytes = INLINE_SYSCALL(sendmsg, 3, handle->mcast.srv, &hdr,
  1094. MSG_NOSIGNAL);
  1095. if (IS_ERR(bytes))
  1096. switch(ERRNO(bytes)) {
  1097. case ECONNRESET:
  1098. case EPIPE:
  1099. return -PAL_ERROR_CONNFAILED;
  1100. case EAGAIN:
  1101. HANDLE_HDR(handle)->flags &= ~WRITEABLE(1);
  1102. default:
  1103. return unix_to_pal_error(ERRNO(bytes));
  1104. }
  1105. if (bytes == size)
  1106. HANDLE_HDR(handle)->flags |= WRITEABLE(1);
  1107. else
  1108. HANDLE_HDR(handle)->flags &= ~WRITEABLE(1);
  1109. return bytes;
  1110. }
  1111. static int64_t mcast_receive (PAL_HANDLE handle, uint64_t offset, uint64_t size,
  1112. void * buf)
  1113. {
  1114. if (handle->mcast.cli == PAL_IDX_POISON)
  1115. return -PAL_ERROR_BADHANDLE;
  1116. struct msghdr hdr;
  1117. struct iovec iov;
  1118. iov.iov_base = buf;
  1119. iov.iov_len = size;
  1120. hdr.msg_name = NULL;
  1121. hdr.msg_namelen = 0;
  1122. hdr.msg_iov = &iov;
  1123. hdr.msg_iovlen = 1;
  1124. hdr.msg_control = NULL;
  1125. hdr.msg_controllen = 0;
  1126. hdr.msg_flags = 0;
  1127. int64_t bytes = INLINE_SYSCALL(recvmsg, 3, handle->mcast.cli, &hdr, 0);
  1128. if (IS_ERR(bytes))
  1129. return -PAL_ERROR_DENIED;
  1130. return bytes;
  1131. }
  1132. static int mcast_attrquerybyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  1133. {
  1134. int ret, val;
  1135. if (handle->mcast.cli == PAL_IDX_POISON)
  1136. return -PAL_ERROR_BADHANDLE;
  1137. ret = INLINE_SYSCALL(ioctl, 3, handle->mcast.cli, FIONREAD, &val);
  1138. if (IS_ERR(ret))
  1139. return unix_to_pal_error(ERRNO(ret));
  1140. attr->handle_type = pal_type_mcast;
  1141. attr->disconnected = HANDLE_HDR(handle)->flags & (ERROR(0)|ERROR(1));
  1142. attr->nonblocking = handle->mcast.nonblocking;
  1143. attr->readable = !!val;
  1144. attr->writeable = HANDLE_HDR(handle)->flags & WRITEABLE(1);
  1145. attr->runnable = PAL_FALSE;
  1146. attr->pending_size = val;
  1147. return 0;
  1148. }
  1149. static int mcast_attrsetbyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  1150. {
  1151. if (handle->mcast.cli == PAL_IDX_POISON)
  1152. return -PAL_ERROR_BADHANDLE;
  1153. int ret;
  1154. PAL_BOL * nonblocking = &handle->mcast.nonblocking;
  1155. if (attr->nonblocking != *nonblocking) {
  1156. ret = INLINE_SYSCALL(fcntl, 3, handle->mcast.cli, F_SETFL,
  1157. *nonblocking ? O_NONBLOCK : 0);
  1158. if (IS_ERR(ret))
  1159. return unix_to_pal_error(ERRNO(ret));
  1160. *nonblocking = attr->nonblocking;
  1161. }
  1162. return 0;
  1163. }
  1164. struct handle_ops mcast_ops = {
  1165. .write = &mcast_send,
  1166. .read = &mcast_receive,
  1167. .attrquerybyhdl = &mcast_attrquerybyhdl,
  1168. .attrsetbyhdl = &mcast_attrsetbyhdl,
  1169. };