db_sockets.c 34 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161
  1. /* -*- mode:c; c-file-style:"k&r"; c-basic-offset: 4; tab-width:4; indent-tabs-mode:nil; mode:auto-fill; fill-column:78; -*- */
  2. /* vim: set ts=4 sw=4 et tw=78 fo=cqt wm=0: */
  3. /* Copyright (C) 2014 Stony Brook University
  4. This file is part of Graphene Library OS.
  5. Graphene Library OS is free software: you can redistribute it and/or
  6. modify it under the terms of the GNU Lesser General Public License
  7. as published by the Free Software Foundation, either version 3 of the
  8. License, or (at your option) any later version.
  9. Graphene Library OS is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU Lesser General Public License for more details.
  13. You should have received a copy of the GNU Lesser General Public License
  14. along with this program. If not, see <http://www.gnu.org/licenses/>. */
/*
 * db_sockets.c
 *
 * This file contains operations for streams with URIs that start with
 * "tcp:", "tcp.srv:", "udp:", "udp.srv:".
 */
  21. #include "pal_defs.h"
  22. #include "pal_linux_defs.h"
  23. #include "pal.h"
  24. #include "pal_internal.h"
  25. #include "pal_linux.h"
  26. #include "pal_debug.h"
  27. #include "pal_security.h"
  28. #include "pal_error.h"
  29. #include "api.h"
  30. #include <linux/types.h>
  31. #include <linux/poll.h>
  32. #include <linux/in.h>
  33. #include <linux/in6.h>
  34. typedef __kernel_pid_t pid_t;
  35. #include <asm/fcntl.h>
  36. #include <asm-generic/socket.h>
  37. #ifndef SOL_TCP
  38. # define SOL_TCP 6
  39. #endif
  40. #ifndef TCP_NODELAY
  41. # define TCP_NODELAY 1
  42. #endif
  43. #ifndef TCP_CORK
  44. # define TCP_CORK 3
  45. #endif
  46. /* 96 bytes is the minimal size of buffer to store a IPv4/IPv6
  47. address */
  48. #define PAL_SOCKADDR_SIZE 96
  49. static inline int addr_size (struct sockaddr * addr)
  50. {
  51. switch (addr->sa_family) {
  52. case AF_INET:
  53. return sizeof(struct sockaddr_in);
  54. case AF_INET6:
  55. return sizeof(struct sockaddr_in6);
  56. default:
  57. return 0;
  58. }
  59. }
  60. /* parsing the string of uri, and fill in the socket address structure.
  61. the latest pointer of uri, length of socket address are returned. */
  62. static int inet_parse_uri (char ** uri, struct sockaddr * addr, unsigned int * addrlen)
  63. {
  64. char * tmp = *uri, * end;
  65. char * addr_str = NULL, * port_str;
  66. int af;
  67. void * addr_buf;
  68. int addr_len;
  69. __be16 * port_buf;
  70. int slen;
  71. if (tmp[0] == '[') {
  72. /* for IPv6, the address will be in the form of
  73. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  74. struct sockaddr_in6 * addr_in6 = (struct sockaddr_in6 *) addr;
  75. slen = sizeof(struct sockaddr_in6);
  76. memset(addr, 0, slen);
  77. end = strchr(tmp + 1, ']');
  78. if (!end || *(end + 1) != ':')
  79. goto inval;
  80. addr_str = tmp + 1;
  81. addr_len = end - tmp - 1;
  82. port_str = end + 2;
  83. for (end = port_str ; *end >= '0' && *end <= '9' ; end++);
  84. addr_in6->sin6_family = af = AF_INET6;
  85. addr_buf = &addr_in6->sin6_addr.s6_addr;
  86. port_buf = &addr_in6->sin6_port;
  87. } else {
  88. /* for IP, the address will be in the form of "x.x.x.x:port". */
  89. struct sockaddr_in * addr_in = (struct sockaddr_in *) addr;
  90. slen = sizeof(struct sockaddr_in);
  91. memset(addr, 0, slen);
  92. end = strchr(tmp, ':');
  93. if (!end)
  94. goto inval;
  95. addr_str = tmp;
  96. addr_len = end - tmp;
  97. port_str = end + 1;
  98. for (end = port_str ; *end >= '0' && *end <= '9' ; end++);
  99. addr_in->sin_family = af = AF_INET;
  100. addr_buf = &addr_in->sin_addr.s_addr;
  101. port_buf = &addr_in->sin_port;
  102. }
  103. if (af == AF_INET) {
  104. if (!inet_pton4(addr_str, addr_len, addr_buf))
  105. goto inval;
  106. } else {
  107. if (!inet_pton6(addr_str, addr_len, addr_buf))
  108. goto inval;
  109. }
  110. *port_buf = __htons(atoi(port_str));
  111. *uri = *end ? end + 1 : NULL;
  112. if (addrlen)
  113. *addrlen = slen;
  114. return 0;
  115. inval:
  116. return -PAL_ERROR_INVAL;
  117. }
  118. /* create the string of uri from the given socket address */
  119. static int inet_create_uri (char * uri, int count, struct sockaddr * addr,
  120. int addrlen)
  121. {
  122. int len = 0;
  123. if (addr->sa_family == AF_INET) {
  124. if (addrlen != sizeof(struct sockaddr_in))
  125. return PAL_ERROR_INVAL;
  126. struct sockaddr_in * addr_in = (struct sockaddr_in *) addr;
  127. char * addr = (char *) &addr_in->sin_addr.s_addr;
  128. /* for IP, the address will be in the form of "x.x.x.x:port". */
  129. len = snprintf(uri, count, "%u.%u.%u.%u:%u",
  130. (unsigned char) addr[0],
  131. (unsigned char) addr[1],
  132. (unsigned char) addr[2],
  133. (unsigned char) addr[3],
  134. __ntohs(addr_in->sin_port));
  135. } else if (addr->sa_family == AF_INET6) {
  136. if (addrlen != sizeof(struct sockaddr_in6))
  137. return PAL_ERROR_INVAL;
  138. struct sockaddr_in6 * addr_in6 = (struct sockaddr_in6 *) addr;
  139. unsigned short * addr = (unsigned short *) &addr_in6->sin6_addr.s6_addr;
  140. /* for IPv6, the address will be in the form of
  141. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  142. len = snprintf(uri, count, "[%04x:%04x:%04x:%04x:%04x:%04x:%04x:%04x]:%u",
  143. addr[0], addr[1], addr[2], addr[3],
  144. addr[4], addr[5], addr[6], addr[7],
  145. __ntohs(addr_in6->sin6_port));
  146. } else {
  147. return -PAL_ERROR_INVAL;
  148. }
  149. if (len >= count)
  150. return -PAL_ERROR_TOOLONG;
  151. return len;
  152. }
  153. /* parse the uri for a socket stream. The uri might have both binding
  154. address and connecting address, or connecting address only. The form
  155. of uri will be either "bind-addr:bind-port:connect-addr:connect-port"
  156. or "addr:port". */
  157. static int socket_parse_uri (char * uri,
  158. struct sockaddr ** bind_addr, unsigned int * bind_addrlen,
  159. struct sockaddr ** dest_addr, unsigned int * dest_addrlen)
  160. {
  161. int ret;
  162. if (!bind_addr && !dest_addr)
  163. return 0;
  164. if (!uri || !(*uri)) {
  165. if (bind_addr)
  166. *bind_addr = NULL;
  167. if (dest_addr)
  168. *dest_addr = NULL;
  169. return 0;
  170. }
  171. /* at least parse uri once */
  172. if ((ret = inet_parse_uri(&uri, bind_addr ? *bind_addr : *dest_addr,
  173. bind_addr ? bind_addrlen : dest_addrlen)) < 0)
  174. return ret;
  175. if (!(bind_addr && dest_addr))
  176. return 0;
  177. /* if you reach here, it can only be connection address */
  178. if (!uri || (ret = inet_parse_uri(&uri, *dest_addr, dest_addrlen)) < 0) {
  179. *dest_addr = *bind_addr;
  180. *dest_addrlen = *bind_addrlen;
  181. *bind_addr = NULL;
  182. *bind_addrlen = 0;
  183. }
  184. return 0;
  185. }
  186. /* fill in the PAL handle based on the file descriptors and address given. */
  187. static inline
  188. PAL_HANDLE socket_create_handle (int type, int fd, int options,
  189. struct sockaddr * bind_addr,
  190. unsigned int bind_addrlen,
  191. struct sockaddr * dest_addr,
  192. unsigned int dest_addrlen,
  193. struct sockopt * sock_options)
  194. {
  195. PAL_HANDLE hdl = malloc(HANDLE_SIZE(sock) + (bind_addr ? bind_addrlen : 0) +
  196. (dest_addr ? dest_addrlen : 0));
  197. if (!hdl)
  198. return NULL;
  199. memset(hdl, 0, sizeof(struct pal_handle));
  200. init_handle_hdr(HANDLE_HDR(hdl), type);
  201. HANDLE_HDR(hdl)->flags |= RFD(0)|(type != pal_type_tcpsrv ? WFD(0) : 0);
  202. hdl->sock.fd = fd;
  203. void * addr = (void *) hdl + HANDLE_SIZE(sock);
  204. if (bind_addr) {
  205. hdl->sock.bind = (PAL_PTR) addr;
  206. memcpy(addr, bind_addr, bind_addrlen);
  207. addr += bind_addrlen;
  208. } else {
  209. hdl->sock.bind = (PAL_PTR) NULL;
  210. }
  211. if (dest_addr) {
  212. hdl->sock.conn = (PAL_PTR) addr;
  213. memcpy(addr, dest_addr, dest_addrlen);
  214. addr += dest_addrlen;
  215. } else {
  216. hdl->sock.conn = (PAL_PTR) NULL;
  217. }
  218. hdl->sock.nonblocking = (options & PAL_OPTION_NONBLOCK) ?
  219. PAL_TRUE : PAL_FALSE;
  220. hdl->sock.linger = sock_options->linger;
  221. hdl->sock.receivebuf = sock_options->receivebuf;
  222. hdl->sock.sendbuf = sock_options->sendbuf;
  223. hdl->sock.receivetimeout = sock_options->receivetimeout;
  224. hdl->sock.sendtimeout = sock_options->sendtimeout;
  225. hdl->sock.tcp_cork = sock_options->tcp_cork;
  226. hdl->sock.tcp_keepalive = sock_options->tcp_keepalive;
  227. hdl->sock.tcp_nodelay = sock_options->tcp_nodelay;
  228. return hdl;
  229. }
  230. #if ALLOW_BIND_ANY == 0
  231. static bool check_zero (void * mem, size_t size)
  232. {
  233. void * p = mem, * q = mem + size;
  234. while (p < q) {
  235. if (p <= q - sizeof(long)) {
  236. if (*(long *) p)
  237. return false;
  238. p += sizeof(long);
  239. } else if (p <= q - sizeof(int)) {
  240. if (*(int *) p)
  241. return false;
  242. p += sizeof(int);
  243. } else if (p <= q - sizeof(short)) {
  244. if (*(short *) p)
  245. return false;
  246. p += sizeof(short);
  247. } else {
  248. if (*(char *) p)
  249. return false;
  250. p++;
  251. }
  252. }
  253. return true;
  254. }
  255. /* check if an address is "Any" */
  256. static bool check_any_addr (struct sockaddr * addr)
  257. {
  258. if (addr->sa_family == AF_INET) {
  259. struct sockaddr_in * addr_in =
  260. (struct sockaddr_in *) addr;
  261. return addr_in->sin_port == 0 &&
  262. check_zero(&addr_in->sin_addr,
  263. sizeof(addr_in->sin_addr));
  264. } else if (addr->sa_family == AF_INET6) {
  265. struct sockaddr_in6 * addr_in6 =
  266. (struct sockaddr_in6 *) addr;
  267. return addr_in6->sin6_port == 0 &&
  268. check_zero(&addr_in6->sin6_addr,
  269. sizeof(addr_in6->sin6_addr));
  270. }
  271. return false;
  272. }
  273. #endif
  274. static inline int sock_type (int type, int options)
  275. {
  276. if (options & PAL_OPTION_NONBLOCK)
  277. type |= SOCK_NONBLOCK;
  278. return type;
  279. }
  280. /* listen on a tcp socket */
  281. static int tcp_listen (PAL_HANDLE * handle, char * uri, int options)
  282. {
  283. struct sockaddr buffer, * bind_addr = &buffer;
  284. unsigned int bind_addrlen;
  285. int ret;
  286. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  287. NULL, NULL)) < 0)
  288. return ret;
  289. #if ALLOW_BIND_ANY == 0
  290. /* the socket need to have a binding address, a null address or an
  291. any address is not allowed */
  292. if (addr_check_any(bind_addr))
  293. return -PAL_ERROR_INVAL;
  294. #endif
  295. struct sockopt sock_options;
  296. ret = ocall_sock_listen(bind_addr->sa_family,
  297. sock_type(SOCK_STREAM, options), 0,
  298. bind_addr, bind_addrlen,
  299. &sock_options);
  300. if (ret < 0)
  301. return ret;
  302. *handle = socket_create_handle(pal_type_tcpsrv, ret, options,
  303. bind_addr, bind_addrlen, NULL, 0,
  304. &sock_options);
  305. if (!(*handle)) {
  306. ocall_close(ret);
  307. return -PAL_ERROR_NOMEM;
  308. }
  309. return 0;
  310. }
  311. /* accept a tcp connection */
  312. static int tcp_accept (PAL_HANDLE handle, PAL_HANDLE * client)
  313. {
  314. if (!IS_HANDLE_TYPE(handle, tcpsrv) ||
  315. !handle->sock.bind || handle->sock.conn)
  316. return -PAL_ERROR_NOTSERVER;
  317. if (handle->sock.fd == PAL_IDX_POISON)
  318. return -PAL_ERROR_BADHANDLE;
  319. struct sockaddr * bind_addr = (struct sockaddr *) handle->sock.bind;
  320. unsigned int bind_addrlen = addr_size(bind_addr);
  321. struct sockaddr dest_addr;
  322. unsigned int dest_addrlen = sizeof(struct sockaddr);
  323. int ret = 0;
  324. struct sockopt sock_options;
  325. ret = ocall_sock_accept(handle->sock.fd, &dest_addr, &dest_addrlen,
  326. &sock_options);
  327. if (ret < 0)
  328. return ret;
  329. *client = socket_create_handle(pal_type_tcp, ret, 0, bind_addr,
  330. bind_addrlen,
  331. &dest_addr, dest_addrlen,
  332. &sock_options);
  333. if (!(*client)) {
  334. ocall_close(ret);
  335. return -PAL_ERROR_NOMEM;
  336. }
  337. return 0;
  338. }
  339. /* connect on a tcp socket */
  340. static int tcp_connect (PAL_HANDLE * handle, char * uri, int options)
  341. {
  342. struct sockaddr buffer[2];
  343. struct sockaddr * bind_addr = buffer, * dest_addr = buffer + 1;
  344. unsigned int bind_addrlen, dest_addrlen;
  345. int ret;
  346. /* accepting two kind of different uri:
  347. dest-ip:dest-port or bind-ip:bind-port:dest-ip:dest-port */
  348. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  349. &dest_addr, &dest_addrlen)) < 0)
  350. return ret;
  351. if (!dest_addr)
  352. return -PAL_ERROR_INVAL;
  353. if (bind_addr && bind_addr->sa_family != dest_addr->sa_family)
  354. return -PAL_ERROR_INVAL;
  355. #if ALLOW_BIND_ANY == 0
  356. /* the socket need to have a binding address, a null address or an
  357. any address is not allowed */
  358. if (bind_addr && addr_check_any(bind_addr))
  359. return -PAL_ERROR_INVAL;
  360. #endif
  361. struct sockopt sock_options;
  362. ret = ocall_sock_connect(dest_addr->sa_family,
  363. sock_type(SOCK_STREAM, options), 0,
  364. dest_addr, dest_addrlen,
  365. bind_addr, &bind_addrlen, &sock_options);
  366. if (ret < 0)
  367. return ret;
  368. *handle = socket_create_handle(pal_type_tcp, ret, options,
  369. bind_addr, bind_addrlen,
  370. dest_addr, dest_addrlen,
  371. &sock_options);
  372. if (!(*handle)) {
  373. ocall_close(ret);
  374. return -PAL_ERROR_NOMEM;
  375. }
  376. return 0;
  377. }
  378. /* 'open' operation of tcp stream */
  379. static int tcp_open (PAL_HANDLE *handle, const char * type, const char * uri,
  380. int access, int share, int create, int options)
  381. {
  382. int uri_len = strlen(uri) + 1;
  383. if (uri_len > PAL_SOCKADDR_SIZE)
  384. return -PAL_ERROR_TOOLONG;
  385. char uri_buf[PAL_SOCKADDR_SIZE];
  386. memcpy(uri_buf, uri, uri_len);
  387. if (strpartcmp_static(type, "tcp.srv:"))
  388. return tcp_listen(handle, uri_buf, options);
  389. if (strpartcmp_static(type, "tcp:"))
  390. return tcp_connect(handle, uri_buf, options);
  391. return -PAL_ERROR_NOTSUPPORT;
  392. }
  393. /* 'read' operation of tcp stream */
  394. static int64_t tcp_read (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  395. void * buf)
  396. {
  397. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  398. return -PAL_ERROR_NOTCONNECTION;
  399. if (handle->sock.fd == PAL_IDX_POISON)
  400. return -PAL_ERROR_ENDOFSTREAM;
  401. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  402. return -PAL_ERROR_INVAL;
  403. int bytes = ocall_sock_recv(handle->sock.fd, buf, len, NULL, NULL);
  404. if (bytes < 0)
  405. return bytes;
  406. if (!bytes)
  407. return -PAL_ERROR_ENDOFSTREAM;
  408. return bytes;
  409. }
  410. /* write' operation of tcp stream */
  411. static int64_t tcp_write (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  412. const void * buf)
  413. {
  414. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  415. return -PAL_ERROR_NOTCONNECTION;
  416. if (handle->sock.fd == PAL_IDX_POISON)
  417. return -PAL_ERROR_CONNFAILED;
  418. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  419. return -PAL_ERROR_INVAL;
  420. int bytes = ocall_sock_send(handle->sock.fd, buf, len, NULL, 0);
  421. if (bytes == -PAL_ERROR_TRYAGAIN)
  422. HANDLE_HDR(handle)->flags &= ~WRITEABLE(0);
  423. if (bytes < 0)
  424. return bytes;
  425. if (bytes == len)
  426. HANDLE_HDR(handle)->flags |= WRITEABLE(0);
  427. else
  428. HANDLE_HDR(handle)->flags &= ~WRITEABLE(0);
  429. return bytes;
  430. }
  431. /* used by 'open' operation of tcp stream for bound socket */
  432. static int udp_bind (PAL_HANDLE * handle, char * uri, int options)
  433. {
  434. struct sockaddr buffer, * bind_addr = &buffer;
  435. unsigned int bind_addrlen;
  436. int ret = 0;
  437. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  438. NULL, NULL)) < 0)
  439. return ret;
  440. assert(bind_addr);
  441. assert(bind_addrlen == addr_size(bind_addr));
  442. #if ALLOW_BIND_ANY == 0
  443. /* the socket need to have a binding address, a null address or an
  444. any address is not allowed */
  445. if (addr_check_any(bind_addr))
  446. return -PAL_ERROR_INVAL;
  447. #endif
  448. struct sockopt sock_options;
  449. ret = ocall_sock_listen(bind_addr->sa_family,
  450. sock_type(SOCK_DGRAM, options), 0,
  451. bind_addr, bind_addrlen, &sock_options);
  452. if (ret < 0)
  453. return ret;
  454. *handle = socket_create_handle(pal_type_udpsrv, ret, options,
  455. bind_addr, bind_addrlen, NULL, 0,
  456. &sock_options);
  457. if (!(*handle)) {
  458. ocall_close(ret);
  459. return -PAL_ERROR_NOMEM;
  460. }
  461. return 0;
  462. }
  463. /* used by 'open' operation of tcp stream for connected socket */
  464. static int udp_connect (PAL_HANDLE * handle, char * uri, int options)
  465. {
  466. struct sockaddr buffer[2];
  467. struct sockaddr * bind_addr = buffer, * dest_addr = buffer + 1;
  468. unsigned int bind_addrlen, dest_addrlen;
  469. int ret;
  470. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  471. &dest_addr, &dest_addrlen)) < 0)
  472. return ret;
  473. #if ALLOW_BIND_ANY == 0
  474. /* the socket need to have a binding address, a null address or an
  475. any address is not allowed */
  476. if (bind_addr && addr_check_any(bind_addr))
  477. return -PAL_ERROR_INVAL;
  478. #endif
  479. struct sockopt sock_options;
  480. ret = ocall_sock_connect(dest_addr ? dest_addr->sa_family : AF_INET,
  481. sock_type(SOCK_DGRAM, options), 0,
  482. dest_addr, dest_addrlen,
  483. bind_addr, &bind_addrlen, &sock_options);
  484. if (ret < 0)
  485. return ret;
  486. *handle = socket_create_handle(dest_addr ? pal_type_udp :
  487. pal_type_udpsrv, ret, options,
  488. bind_addr, bind_addrlen,
  489. dest_addr, dest_addrlen,
  490. &sock_options);
  491. if (!(*handle)) {
  492. ocall_close(ret);
  493. return -PAL_ERROR_NOMEM;
  494. }
  495. return 0;
  496. }
  497. static int udp_open (PAL_HANDLE *hdl, const char * type, const char * uri,
  498. int access, int share, int create, int options)
  499. {
  500. char buf[PAL_SOCKADDR_SIZE];
  501. int len = strlen(uri);
  502. if (len >= PAL_SOCKADDR_SIZE)
  503. return -PAL_ERROR_TOOLONG;
  504. memcpy(buf, uri, len + 1);
  505. options &= PAL_OPTION_MASK;
  506. if (strpartcmp_static(type, "udp.srv:"))
  507. return udp_bind(hdl, buf, options);
  508. if (strpartcmp_static(type, "udp:"))
  509. return udp_connect(hdl, buf, options);
  510. return -PAL_ERROR_NOTSUPPORT;
  511. }
  512. static int64_t udp_receive (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  513. void * buf)
  514. {
  515. if (!IS_HANDLE_TYPE(handle, udp))
  516. return -PAL_ERROR_NOTCONNECTION;
  517. if (handle->sock.fd == PAL_IDX_POISON)
  518. return -PAL_ERROR_BADHANDLE;
  519. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  520. return -PAL_ERROR_INVAL;
  521. return ocall_sock_recv(handle->sock.fd, buf, len, NULL, NULL);
  522. }
  523. static int64_t udp_receivebyaddr (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  524. void * buf, char * addr, int addrlen)
  525. {
  526. if (!IS_HANDLE_TYPE(handle, udpsrv))
  527. return -PAL_ERROR_NOTCONNECTION;
  528. if (handle->sock.fd == PAL_IDX_POISON)
  529. return -PAL_ERROR_BADHANDLE;
  530. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  531. return -PAL_ERROR_INVAL;
  532. struct sockaddr conn_addr;
  533. socklen_t conn_addrlen = sizeof(struct sockaddr);
  534. int bytes = ocall_sock_recv(handle->sock.fd, buf, len, &conn_addr,
  535. &conn_addrlen);
  536. if (bytes < 0)
  537. return bytes;
  538. char * addr_uri = strcpy_static(addr, "udp:", addrlen);
  539. if (!addr_uri)
  540. return -PAL_ERROR_OVERFLOW;
  541. int ret = inet_create_uri(addr_uri, addr + addrlen - addr_uri, &conn_addr,
  542. conn_addrlen);
  543. if (ret < 0)
  544. return ret;
  545. return bytes;
  546. }
  547. static int64_t udp_send (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  548. const void * buf)
  549. {
  550. if (!IS_HANDLE_TYPE(handle, udp))
  551. return -PAL_ERROR_NOTCONNECTION;
  552. if (handle->sock.fd == PAL_IDX_POISON)
  553. return -PAL_ERROR_BADHANDLE;
  554. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  555. return -PAL_ERROR_INVAL;
  556. int bytes = ocall_sock_send(handle->sock.fd, buf, len, NULL, 0);
  557. if (bytes == -PAL_ERROR_TRYAGAIN)
  558. HANDLE_HDR(handle)->flags &= ~WRITEABLE(0);
  559. if (bytes < 0)
  560. return bytes;
  561. if (bytes == len)
  562. HANDLE_HDR(handle)->flags |= WRITEABLE(0);
  563. else
  564. HANDLE_HDR(handle)->flags &= ~WRITEABLE(0);
  565. return bytes;
  566. }
  567. static int64_t udp_sendbyaddr (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  568. const void * buf, const char * addr, int addrlen)
  569. {
  570. if (!IS_HANDLE_TYPE(handle, udpsrv))
  571. return -PAL_ERROR_NOTCONNECTION;
  572. if (handle->sock.fd == PAL_IDX_POISON)
  573. return -PAL_ERROR_BADHANDLE;
  574. if (!strpartcmp_static(addr, "udp:"))
  575. return -PAL_ERROR_INVAL;
  576. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  577. return -PAL_ERROR_INVAL;
  578. addr += static_strlen("udp:");
  579. addrlen -= static_strlen("udp:");
  580. char * addrbuf = __alloca(addrlen);
  581. memcpy(addrbuf, addr, addrlen);
  582. struct sockaddr conn_addr;
  583. unsigned int conn_addrlen = sizeof(struct sockaddr);
  584. int ret = inet_parse_uri(&addrbuf, &conn_addr, &conn_addrlen);
  585. if (ret < 0)
  586. return ret;
  587. int bytes = ocall_sock_send(handle->sock.fd, buf, len, &conn_addr,
  588. conn_addrlen);
  589. if (bytes == -PAL_ERROR_TRYAGAIN)
  590. HANDLE_HDR(handle)->flags &= ~WRITEABLE(0);
  591. if (bytes < 0)
  592. return bytes;
  593. if (bytes == len)
  594. HANDLE_HDR(handle)->flags |= WRITEABLE(0);
  595. else
  596. HANDLE_HDR(handle)->flags &= ~WRITEABLE(0);
  597. return bytes;
  598. }
  599. static int socket_delete (PAL_HANDLE handle, int access)
  600. {
  601. if (handle->sock.fd == PAL_IDX_POISON)
  602. return 0;
  603. if (!IS_HANDLE_TYPE(handle, tcp) && access)
  604. return -PAL_ERROR_INVAL;
  605. if (IS_HANDLE_TYPE(handle, tcp) || IS_HANDLE_TYPE(handle, tcpsrv)) {
  606. int shutdown;
  607. switch (access) {
  608. case 0:
  609. shutdown = SHUT_RDWR;
  610. break;
  611. case PAL_DELETE_RD:
  612. shutdown = SHUT_RD;
  613. break;
  614. case PAL_DELETE_WR:
  615. shutdown = SHUT_WR;
  616. break;
  617. default:
  618. return -PAL_ERROR_INVAL;
  619. }
  620. ocall_sock_shutdown(handle->sock.fd, shutdown);
  621. }
  622. return 0;
  623. }
  624. static int socket_close (PAL_HANDLE handle)
  625. {
  626. if (handle->sock.fd != PAL_IDX_POISON) {
  627. ocall_close(handle->sock.fd);
  628. handle->sock.fd = PAL_IDX_POISON;
  629. }
  630. if (handle->sock.bind)
  631. handle->sock.bind = (PAL_PTR) NULL;
  632. if (handle->sock.conn)
  633. handle->sock.conn = (PAL_PTR) NULL;
  634. return 0;
  635. }
  636. static int socket_attrquerybyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  637. {
  638. if (handle->sock.fd == PAL_IDX_POISON)
  639. return -PAL_ERROR_BADHANDLE;
  640. attr->handle_type = HANDLE_HDR(handle)->type;
  641. attr->disconnected = HANDLE_HDR(handle)->flags & ERROR(0);
  642. attr->nonblocking = handle->sock.nonblocking;
  643. attr->writeable = HANDLE_HDR(handle)->flags & WRITEABLE(0);
  644. attr->pending_size = 0; /* fill in later */
  645. attr->socket.linger = handle->sock.linger;
  646. attr->socket.receivebuf = handle->sock.receivebuf;
  647. attr->socket.sendbuf = handle->sock.sendbuf;
  648. attr->socket.receivetimeout = handle->sock.receivetimeout;
  649. attr->socket.sendtimeout = handle->sock.sendtimeout;
  650. attr->socket.tcp_cork = handle->sock.tcp_cork;
  651. attr->socket.tcp_keepalive = handle->sock.tcp_keepalive;
  652. attr->socket.tcp_nodelay = handle->sock.tcp_nodelay;
  653. int fd = handle->sock.fd, ret;
  654. if (!IS_HANDLE_TYPE(handle, tcpsrv)) {
  655. /* try use ioctl FIONEAD to get the size of socket */
  656. ret = ocall_fionread(fd);
  657. if (ret < 0)
  658. return ret;
  659. attr->pending_size = ret;
  660. }
  661. struct pollfd pfd = { .fd = fd, .events = POLLIN, .revents = 0 };
  662. unsigned long waittime = 0;
  663. ret = ocall_poll(&pfd, 1, &waittime);
  664. if (ret < 0)
  665. return ret;
  666. attr->readable = (ret == 1 && pfd.revents == POLLIN);
  667. return 0;
  668. }
  669. static int socket_attrsetbyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  670. {
  671. if (handle->sock.fd == PAL_IDX_POISON)
  672. return -PAL_ERROR_BADHANDLE;
  673. int fd = handle->sock.fd, ret, val;
  674. if (attr->nonblocking != handle->sock.nonblocking) {
  675. ret = ocall_fsetnonblock(fd, attr->nonblocking);
  676. if (ret < 0)
  677. return ret;
  678. handle->sock.nonblocking = attr->nonblocking;
  679. }
  680. if (HANDLE_TYPE(handle) != pal_type_tcpsrv) {
  681. struct __kernel_linger {
  682. int l_onoff;
  683. int l_linger;
  684. };
  685. if (attr->socket.linger != handle->sock.linger) {
  686. struct __kernel_linger l;
  687. l.l_onoff = attr->socket.linger ? 1 : 0;
  688. l.l_linger = attr->socket.linger;
  689. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_LINGER, &l,
  690. sizeof(struct __kernel_linger));
  691. if (ret < 0)
  692. return ret;
  693. handle->sock.linger = attr->socket.linger;
  694. }
  695. if (attr->socket.receivebuf != handle->sock.receivebuf) {
  696. val = attr->socket.receivebuf;
  697. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_RCVBUF, &val,
  698. sizeof(int));
  699. if (ret < 0)
  700. return ret;
  701. handle->sock.receivebuf = attr->socket.receivebuf;
  702. }
  703. if (attr->socket.sendbuf != handle->sock.sendbuf) {
  704. val = attr->socket.sendbuf;
  705. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_SNDBUF,
  706. &val, sizeof(int));
  707. if (ret < 0)
  708. return ret;
  709. handle->sock.sendbuf = attr->socket.sendbuf;
  710. }
  711. if (attr->socket.receivetimeout != handle->sock.receivetimeout) {
  712. val = attr->socket.receivetimeout;
  713. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_RCVTIMEO,
  714. &val, sizeof(int));
  715. if (ret < 0)
  716. return ret;
  717. handle->sock.receivetimeout = attr->socket.receivetimeout;
  718. }
  719. if (attr->socket.sendtimeout != handle->sock.sendtimeout) {
  720. val = attr->socket.sendtimeout;
  721. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_SNDTIMEO,
  722. &val, sizeof(int));
  723. if (ret < 0)
  724. return ret;
  725. handle->sock.sendtimeout = attr->socket.sendtimeout;
  726. }
  727. }
  728. if (HANDLE_TYPE(handle) == pal_type_tcp ||
  729. HANDLE_TYPE(handle) == pal_type_tcpsrv) {
  730. if (attr->socket.tcp_cork != handle->sock.tcp_cork) {
  731. val = attr->socket.tcp_cork ? 1 : 0;
  732. ret = ocall_sock_setopt(fd, SOL_TCP, TCP_CORK,
  733. &val, sizeof(int));
  734. if (ret < 0)
  735. return ret;
  736. handle->sock.tcp_cork = attr->socket.tcp_cork;
  737. }
  738. if (attr->socket.tcp_keepalive != handle->sock.tcp_keepalive) {
  739. val = attr->socket.tcp_keepalive ? 1 : 0;
  740. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_KEEPALIVE,
  741. &val, sizeof(int));
  742. if (ret < 0)
  743. return ret;
  744. handle->sock.tcp_keepalive = attr->socket.tcp_keepalive;
  745. }
  746. if (attr->socket.tcp_nodelay != handle->sock.tcp_nodelay) {
  747. val = attr->socket.tcp_nodelay ? 1 : 0;
  748. ret = ocall_sock_setopt(fd, SOL_TCP, TCP_NODELAY,
  749. &val, sizeof(int));
  750. if (ret < 0)
  751. return ret;
  752. handle->sock.tcp_nodelay = attr->socket.tcp_nodelay;
  753. }
  754. }
  755. return 0;
  756. }
  757. static int socket_getname (PAL_HANDLE handle, char * buffer, int count)
  758. {
  759. int old_count = count;
  760. int ret;
  761. const char * prefix = NULL;
  762. int prefix_len = 0;
  763. struct sockaddr * bind_addr = NULL, * dest_addr = NULL;
  764. switch (HANDLE_TYPE(handle)) {
  765. case pal_type_tcpsrv:
  766. prefix_len = static_strlen("tcp.srv");
  767. prefix = "tcp.srv";
  768. bind_addr = (struct sockaddr *) handle->sock.bind;
  769. break;
  770. case pal_type_tcp:
  771. prefix_len = static_strlen("tcp");
  772. prefix = "tcp";
  773. bind_addr = (struct sockaddr *) handle->sock.bind;
  774. dest_addr = (struct sockaddr *) handle->sock.conn;
  775. break;
  776. case pal_type_udpsrv:
  777. prefix_len = static_strlen("udp.srv");
  778. prefix = "udp.srv";
  779. bind_addr = (struct sockaddr *) handle->sock.bind;
  780. break;
  781. case pal_type_udp:
  782. prefix_len = static_strlen("udp");
  783. prefix = "udp";
  784. bind_addr = (struct sockaddr *) handle->sock.bind;
  785. dest_addr = (struct sockaddr *) handle->sock.conn;
  786. break;
  787. default:
  788. return -PAL_ERROR_INVAL;
  789. }
  790. if (prefix_len >= count)
  791. return -PAL_ERROR_OVERFLOW;
  792. memcpy(buffer, prefix, prefix_len + 1);
  793. buffer += prefix_len;
  794. count -= prefix_len;
  795. for (int i = 0 ; i < 2 ; i++) {
  796. struct sockaddr * addr = i ? dest_addr : bind_addr;
  797. if (addr) {
  798. if (count <= 1)
  799. return -PAL_ERROR_OVERFLOW;
  800. buffer[0] = ':';
  801. buffer[1] = 0;
  802. buffer++;
  803. count--;
  804. if ((ret = inet_create_uri(buffer, count, addr,
  805. addr_size(addr))) < 0)
  806. return ret;
  807. buffer += ret;
  808. count -= ret;
  809. }
  810. }
  811. return old_count - count;
  812. }
  813. struct handle_ops tcp_ops = {
  814. .getname = &socket_getname,
  815. .open = &tcp_open,
  816. .waitforclient = &tcp_accept,
  817. .read = &tcp_read,
  818. .write = &tcp_write,
  819. .delete = &socket_delete,
  820. .close = &socket_close,
  821. .attrquerybyhdl = &socket_attrquerybyhdl,
  822. .attrsetbyhdl = &socket_attrsetbyhdl,
  823. };
  824. struct handle_ops udp_ops = {
  825. .getname = &socket_getname,
  826. .open = &udp_open,
  827. .read = &udp_receive,
  828. .write = &udp_send,
  829. .delete = &socket_delete,
  830. .close = &socket_close,
  831. .attrquerybyhdl = &socket_attrquerybyhdl,
  832. .attrsetbyhdl = &socket_attrsetbyhdl,
  833. };
  834. struct handle_ops udpsrv_ops = {
  835. .getname = &socket_getname,
  836. .open = &udp_open,
  837. .readbyaddr = &udp_receivebyaddr,
  838. .writebyaddr = &udp_sendbyaddr,
  839. .delete = &socket_delete,
  840. .close = &socket_close,
  841. .attrquerybyhdl = &socket_attrquerybyhdl,
  842. .attrsetbyhdl = &socket_attrsetbyhdl,
  843. };
  844. PAL_HANDLE _DkBroadcastStreamOpen (void)
  845. {
  846. PAL_HANDLE hdl = malloc(HANDLE_SIZE(file));
  847. SET_HANDLE_TYPE(hdl, mcast);
  848. HANDLE_HDR(hdl)->flags |= RFD(0)|WFD(1)|WRITEABLE(1);
  849. hdl->mcast.port = pal_sec.mcast_port;
  850. hdl->mcast.srv = pal_sec.mcast_srv;
  851. hdl->mcast.cli = pal_sec.mcast_cli;
  852. return hdl;
  853. }
  854. static int64_t mcast_send (PAL_HANDLE handle, uint64_t offset, uint64_t size,
  855. const void * buf)
  856. {
  857. if (handle->mcast.srv == PAL_IDX_POISON)
  858. return -PAL_ERROR_BADHANDLE;
  859. if (size >= (1ULL << (sizeof(unsigned int) * 8)))
  860. return -PAL_ERROR_INVAL;
  861. int bytes = ocall_sock_send(handle->mcast.srv, buf, size,
  862. NULL, 0);
  863. if (bytes == -PAL_ERROR_TRYAGAIN)
  864. HANDLE_HDR(handle)->flags &= ~WRITEABLE(1);
  865. if (bytes < 0)
  866. return bytes;
  867. if (bytes == size)
  868. HANDLE_HDR(handle)->flags |= WRITEABLE(1);
  869. else
  870. HANDLE_HDR(handle)->flags &= ~WRITEABLE(1);
  871. return bytes;
  872. }
  873. static int64_t mcast_receive (PAL_HANDLE handle, uint64_t offset, uint64_t size,
  874. void * buf)
  875. {
  876. if (handle->mcast.cli == PAL_IDX_POISON)
  877. return -PAL_ERROR_BADHANDLE;
  878. if (size >= (1ULL << (sizeof(unsigned int) * 8)))
  879. return -PAL_ERROR_INVAL;
  880. int bytes = ocall_sock_recv(handle->mcast.cli, buf, size, NULL,
  881. NULL);
  882. if (bytes == -PAL_ERROR_TRYAGAIN)
  883. HANDLE_HDR(handle)->flags &= ~WRITEABLE(1);
  884. return bytes;
  885. }
  886. static int mcast_close (PAL_HANDLE handle)
  887. {
  888. if (handle->mcast.srv != PAL_IDX_POISON) {
  889. ocall_close(handle->mcast.srv);
  890. handle->mcast.srv = PAL_IDX_POISON;
  891. }
  892. if (handle->mcast.cli != PAL_IDX_POISON) {
  893. ocall_close(handle->mcast.cli);
  894. handle->mcast.cli = PAL_IDX_POISON;
  895. }
  896. return 0;
  897. }
  898. static int mcast_attrquerybyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  899. {
  900. if (handle->mcast.cli == PAL_IDX_POISON)
  901. return -PAL_ERROR_BADHANDLE;
  902. int ret = ocall_fionread(handle->mcast.cli);
  903. if (ret < 0)
  904. return ret;
  905. memset(attr, 0, sizeof(PAL_STREAM_ATTR));
  906. attr->pending_size = ret;
  907. attr->disconnected = HANDLE_HDR(handle)->flags & (ERROR(0)|ERROR(1));
  908. attr->readable = (attr->pending_size > 0);
  909. attr->writeable = HANDLE_HDR(handle)->flags & WRITEABLE(1);
  910. attr->nonblocking = handle->mcast.nonblocking;
  911. return 0;
  912. }
  913. static int mcast_attrsetbyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  914. {
  915. if (handle->mcast.cli == PAL_IDX_POISON)
  916. return -PAL_ERROR_BADHANDLE;
  917. PAL_BOL * nonblocking = &handle->mcast.nonblocking;
  918. if (attr->nonblocking != *nonblocking) {
  919. int ret = ocall_fsetnonblock(handle->mcast.cli, *nonblocking);
  920. if (ret < 0)
  921. return ret;
  922. *nonblocking = attr->nonblocking;
  923. }
  924. return 0;
  925. }
  926. struct handle_ops mcast_ops = {
  927. .write = &mcast_send,
  928. .read = &mcast_receive,
  929. .close = &mcast_close,
  930. .attrquerybyhdl = &mcast_attrquerybyhdl,
  931. .attrsetbyhdl = &mcast_attrsetbyhdl,
  932. };