db_sockets.c 36 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208
  1. /* -*- mode:c; c-file-style:"k&r"; c-basic-offset: 4; tab-width:4; indent-tabs-mode:nil; mode:auto-fill; fill-column:78; -*- */
  2. /* vim: set ts=4 sw=4 et tw=78 fo=cqt wm=0: */
  3. /* Copyright (C) 2014 Stony Brook University
  4. This file is part of Graphene Library OS.
  5. Graphene Library OS is free software: you can redistribute it and/or
  6. modify it under the terms of the GNU Lesser General Public License
  7. as published by the Free Software Foundation, either version 3 of the
  8. License, or (at your option) any later version.
  9. Graphene Library OS is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU Lesser General Public License for more details.
  13. You should have received a copy of the GNU Lesser General Public License
  14. along with this program. If not, see <http://www.gnu.org/licenses/>. */
  15. /*
  16. * db_socket.c
  17. *
  * This file contains operations for streams with URIs that start with
  19. * "tcp:", "tcp.srv:", "udp:", "udp.srv:".
  20. */
  21. #include "pal_defs.h"
  22. #include "pal_linux_defs.h"
  23. #include "pal.h"
  24. #include "pal_internal.h"
  25. #include "pal_linux.h"
  26. #include "pal_linux_error.h"
  27. #include "pal_debug.h"
  28. #include "pal_security.h"
  29. #include "pal_error.h"
  30. #include "api.h"
  31. #include <linux/types.h>
  32. #include <linux/poll.h>
  33. #include <linux/in.h>
  34. #include <linux/in6.h>
  35. typedef __kernel_pid_t pid_t;
  36. #include <asm/fcntl.h>
  37. #include <asm-generic/socket.h>
  38. #ifndef SOL_TCP
  39. # define SOL_TCP 6
  40. #endif
  41. #ifndef TCP_NODELAY
  42. # define TCP_NODELAY 1
  43. #endif
  44. #ifndef TCP_CORK
  45. # define TCP_CORK 3
  46. #endif
  47. /* 96 bytes is the minimal size of buffer to store a IPv4/IPv6
  48. address */
  49. #define PAL_SOCKADDR_SIZE 96
  /* Return the size of the concrete socket address structure selected by
   * addr->sa_family: sizeof(struct sockaddr_in) for AF_INET,
   * sizeof(struct sockaddr_in6) for AF_INET6, and 0 for any other family. */
  static size_t addr_size(const struct sockaddr* addr) {
      if (addr->sa_family == AF_INET)
          return sizeof(struct sockaddr_in);

      if (addr->sa_family == AF_INET6)
          return sizeof(struct sockaddr_in6);

      return 0;
  }
  60. /* parsing the string of uri, and fill in the socket address structure.
  61. the latest pointer of uri, length of socket address are returned. */
  62. static int inet_parse_uri (char ** uri, struct sockaddr * addr, unsigned int * addrlen)
  63. {
  64. char * tmp = *uri, * end;
  65. char * addr_str = NULL, * port_str;
  66. int af;
  67. void * addr_buf;
  68. int addr_len;
  69. __be16 * port_buf;
  70. int slen;
  71. if (tmp[0] == '[') {
  72. /* for IPv6, the address will be in the form of
  73. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  74. struct sockaddr_in6 * addr_in6 = (struct sockaddr_in6 *) addr;
  75. slen = sizeof(struct sockaddr_in6);
  76. memset(addr, 0, slen);
  77. end = strchr(tmp + 1, ']');
  78. if (!end || *(end + 1) != ':')
  79. goto inval;
  80. addr_str = tmp + 1;
  81. addr_len = end - tmp - 1;
  82. port_str = end + 2;
  83. for (end = port_str ; *end >= '0' && *end <= '9' ; end++);
  84. addr_in6->sin6_family = af = AF_INET6;
  85. addr_buf = &addr_in6->sin6_addr.s6_addr;
  86. port_buf = &addr_in6->sin6_port;
  87. } else {
  88. /* for IP, the address will be in the form of "x.x.x.x:port". */
  89. struct sockaddr_in * addr_in = (struct sockaddr_in *) addr;
  90. slen = sizeof(struct sockaddr_in);
  91. memset(addr, 0, slen);
  92. end = strchr(tmp, ':');
  93. if (!end)
  94. goto inval;
  95. addr_str = tmp;
  96. addr_len = end - tmp;
  97. port_str = end + 1;
  98. for (end = port_str ; *end >= '0' && *end <= '9' ; end++);
  99. addr_in->sin_family = af = AF_INET;
  100. addr_buf = &addr_in->sin_addr.s_addr;
  101. port_buf = &addr_in->sin_port;
  102. }
  103. if (af == AF_INET) {
  104. if (!inet_pton4(addr_str, addr_len, addr_buf))
  105. goto inval;
  106. } else {
  107. if (!inet_pton6(addr_str, addr_len, addr_buf))
  108. goto inval;
  109. }
  110. *port_buf = __htons(atoi(port_str));
  111. *uri = *end ? end + 1 : NULL;
  112. if (addrlen)
  113. *addrlen = slen;
  114. return 0;
  115. inval:
  116. return -PAL_ERROR_INVAL;
  117. }
  118. /* create the string of uri from the given socket address */
  119. static int inet_create_uri (char * uri, int count, struct sockaddr * addr,
  120. int addrlen)
  121. {
  122. int len = 0;
  123. if (addr->sa_family == AF_INET) {
  124. if (addrlen != sizeof(struct sockaddr_in))
  125. return -PAL_ERROR_INVAL;
  126. struct sockaddr_in * addr_in = (struct sockaddr_in *) addr;
  127. char * addr = (char *) &addr_in->sin_addr.s_addr;
  128. /* for IP, the address will be in the form of "x.x.x.x:port". */
  129. len = snprintf(uri, count, "%u.%u.%u.%u:%u",
  130. (unsigned char) addr[0],
  131. (unsigned char) addr[1],
  132. (unsigned char) addr[2],
  133. (unsigned char) addr[3],
  134. __ntohs(addr_in->sin_port));
  135. } else if (addr->sa_family == AF_INET6) {
  136. if (addrlen != sizeof(struct sockaddr_in6))
  137. return -PAL_ERROR_INVAL;
  138. struct sockaddr_in6 * addr_in6 = (struct sockaddr_in6 *) addr;
  139. unsigned short * addr = (unsigned short *) &addr_in6->sin6_addr.s6_addr;
  140. /* for IPv6, the address will be in the form of
  141. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  142. len = snprintf(uri, count, "[%04x:%04x:%04x:%04x:%04x:%04x:%04x:%04x]:%u",
  143. addr[0], addr[1], addr[2], addr[3],
  144. addr[4], addr[5], addr[6], addr[7],
  145. __ntohs(addr_in6->sin6_port));
  146. } else {
  147. return -PAL_ERROR_INVAL;
  148. }
  149. if (len >= count)
  150. return -PAL_ERROR_TOOLONG;
  151. return len;
  152. }
  /* Parse the uri of a socket stream.
   *
   * The uri is either "bind-addr:bind-port:connect-addr:connect-port" or a
   * single "addr:port". bind_addr / dest_addr point to caller-provided
   * address buffers (either pair may be NULL when the caller is not
   * interested in it); the parsed addresses are stored into those buffers.
   *
   * - If both pointers are NULL nothing is done.
   * - If the uri is NULL or empty, every non-NULL output is reset to
   *   NULL / 0.
   * - If both pairs are requested but the uri holds a single address (or the
   *   second one fails to parse), that address is reported as the
   *   destination and *bind_addr is set to NULL.
   *
   * Returns 0 on success, or the negative error of the first parse.
   */
  static int socket_parse_uri (char * uri,
                               struct sockaddr ** bind_addr, unsigned int * bind_addrlen,
                               struct sockaddr ** dest_addr, unsigned int * dest_addrlen)
  {
      if (!bind_addr && !dest_addr)
          return 0;

      if (!uri || !(*uri)) {
          if (bind_addr)
              *bind_addr = NULL;
          if (bind_addrlen)
              *bind_addrlen = 0;
          if (dest_addr)
              *dest_addr = NULL;
          if (dest_addrlen)
              *dest_addrlen = 0;
          return 0;
      }

      /* the first address goes to the bind slot if requested, otherwise to
         the destination slot */
      struct sockaddr * first_addr = bind_addr ? *bind_addr : *dest_addr;
      unsigned int * first_len = bind_addr ? bind_addrlen : dest_addrlen;

      int ret = inet_parse_uri(&uri, first_addr, first_len);
      if (ret < 0)
          return ret;

      if (!bind_addr || !dest_addr)
          return 0;

      /* anything left in the uri can only be the connection address */
      int have_second = 0;
      if (uri) {
          ret = inet_parse_uri(&uri, *dest_addr, dest_addrlen);
          have_second = !(ret < 0);
      }

      if (!have_second) {
          /* only one address was given: it is the destination */
          *dest_addr = *bind_addr;
          *dest_addrlen = *bind_addrlen;
          *bind_addr = NULL;
          *bind_addrlen = 0;
      }

      return 0;
  }
  190. /* fill in the PAL handle based on the file descriptors and address given. */
  191. static inline
  192. PAL_HANDLE socket_create_handle (int type, int fd, int options,
  193. struct sockaddr * bind_addr,
  194. unsigned int bind_addrlen,
  195. struct sockaddr * dest_addr,
  196. unsigned int dest_addrlen,
  197. struct sockopt * sock_options)
  198. {
  199. PAL_HANDLE hdl = malloc(HANDLE_SIZE(sock) + (bind_addr ? bind_addrlen : 0) +
  200. (dest_addr ? dest_addrlen : 0));
  201. if (!hdl)
  202. return NULL;
  203. memset(hdl, 0, sizeof(struct pal_handle));
  204. init_handle_hdr(HANDLE_HDR(hdl), type);
  205. HANDLE_HDR(hdl)->flags |= RFD(0)|(type != pal_type_tcpsrv ? WFD(0) : 0);
  206. hdl->sock.fd = fd;
  207. void * addr = (void *) hdl + HANDLE_SIZE(sock);
  208. if (bind_addr) {
  209. hdl->sock.bind = (PAL_PTR) addr;
  210. memcpy(addr, bind_addr, bind_addrlen);
  211. addr += bind_addrlen;
  212. } else {
  213. hdl->sock.bind = (PAL_PTR) NULL;
  214. }
  215. if (dest_addr) {
  216. hdl->sock.conn = (PAL_PTR) addr;
  217. memcpy(addr, dest_addr, dest_addrlen);
  218. addr += dest_addrlen;
  219. } else {
  220. hdl->sock.conn = (PAL_PTR) NULL;
  221. }
  222. hdl->sock.nonblocking = (options & PAL_OPTION_NONBLOCK) ?
  223. PAL_TRUE : PAL_FALSE;
  224. hdl->sock.linger = sock_options->linger;
  225. hdl->sock.receivebuf = sock_options->receivebuf;
  226. hdl->sock.sendbuf = sock_options->sendbuf;
  227. hdl->sock.receivetimeout = sock_options->receivetimeout;
  228. hdl->sock.sendtimeout = sock_options->sendtimeout;
  229. hdl->sock.tcp_cork = sock_options->tcp_cork;
  230. hdl->sock.tcp_keepalive = sock_options->tcp_keepalive;
  231. hdl->sock.tcp_nodelay = sock_options->tcp_nodelay;
  232. return hdl;
  233. }
  234. #if ALLOW_BIND_ANY == 0
  /* Return true when all `size` bytes starting at `mem` are zero (an empty
   * region counts as all-zero), false as soon as a non-zero byte is found.
   *
   * The region is inspected byte by byte: the callers pass addresses of
   * fields inside socket address structures, which are not guaranteed to be
   * aligned for wider loads. */
  static bool check_zero (void * mem, size_t size)
  {
      const unsigned char * bytes = mem;

      for (size_t i = 0 ; i < size ; i++) {
          if (bytes[i])
              return false;
      }

      return true;
  }
  /* Check whether an address is "Any": the port is 0 and every byte of the
   * IPv4 / IPv6 address is zero. Addresses of any other family are never
   * treated as "Any". */
  static bool check_any_addr (struct sockaddr * addr)
  {
      switch (addr->sa_family) {
          case AF_INET: {
              struct sockaddr_in * in4 = (struct sockaddr_in *) addr;

              if (in4->sin_port != 0)
                  return false;
              return check_zero(&in4->sin_addr, sizeof(in4->sin_addr));
          }
          case AF_INET6: {
              struct sockaddr_in6 * in6 = (struct sockaddr_in6 *) addr;

              if (in6->sin6_port != 0)
                  return false;
              return check_zero(&in6->sin6_addr, sizeof(in6->sin6_addr));
          }
          default:
              return false;
      }
  }
  277. #endif
  278. static inline int sock_type (int type, int options)
  279. {
  280. if (options & PAL_OPTION_NONBLOCK)
  281. type |= SOCK_NONBLOCK;
  282. return type;
  283. }
  284. /* listen on a tcp socket */
  285. static int tcp_listen (PAL_HANDLE * handle, char * uri, int options)
  286. {
  287. struct sockaddr buffer, * bind_addr = &buffer;
  288. unsigned int bind_addrlen;
  289. int ret;
  290. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  291. NULL, NULL)) < 0)
  292. return ret;
  293. #if ALLOW_BIND_ANY == 0
  294. /* the socket need to have a binding address, a null address or an
  295. any address is not allowed */
  296. if (check_any_addr(bind_addr))
  297. return -PAL_ERROR_INVAL;
  298. #endif
  299. struct sockopt sock_options;
  300. ret = ocall_sock_listen(bind_addr->sa_family,
  301. sock_type(SOCK_STREAM, options), 0,
  302. bind_addr, &bind_addrlen,
  303. &sock_options);
  304. if (IS_ERR(ret))
  305. return unix_to_pal_error(ERRNO(ret));
  306. *handle = socket_create_handle(pal_type_tcpsrv, ret, options,
  307. bind_addr, bind_addrlen, NULL, 0,
  308. &sock_options);
  309. if (!(*handle)) {
  310. ocall_close(ret);
  311. return -PAL_ERROR_NOMEM;
  312. }
  313. return 0;
  314. }
  315. /* accept a tcp connection */
  316. static int tcp_accept (PAL_HANDLE handle, PAL_HANDLE * client)
  317. {
  318. if (!IS_HANDLE_TYPE(handle, tcpsrv) ||
  319. !handle->sock.bind || handle->sock.conn)
  320. return -PAL_ERROR_NOTSERVER;
  321. if (handle->sock.fd == PAL_IDX_POISON)
  322. return -PAL_ERROR_BADHANDLE;
  323. struct sockaddr * bind_addr = (struct sockaddr *) handle->sock.bind;
  324. unsigned int bind_addrlen = addr_size(bind_addr);
  325. struct sockaddr dest_addr;
  326. unsigned int dest_addrlen = sizeof(struct sockaddr);
  327. int ret = 0;
  328. struct sockopt sock_options;
  329. ret = ocall_sock_accept(handle->sock.fd, &dest_addr, &dest_addrlen,
  330. &sock_options);
  331. if (IS_ERR(ret))
  332. return unix_to_pal_error(ERRNO(ret));
  333. *client = socket_create_handle(pal_type_tcp, ret, 0, bind_addr,
  334. bind_addrlen,
  335. &dest_addr, dest_addrlen,
  336. &sock_options);
  337. if (!(*client)) {
  338. ocall_close(ret);
  339. return -PAL_ERROR_NOMEM;
  340. }
  341. return 0;
  342. }
  343. /* connect on a tcp socket */
  344. static int tcp_connect (PAL_HANDLE * handle, char * uri, int options)
  345. {
  346. struct sockaddr buffer[2];
  347. struct sockaddr * bind_addr = buffer, * dest_addr = buffer + 1;
  348. unsigned int bind_addrlen, dest_addrlen;
  349. int ret;
  350. /* accepting two kind of different uri:
  351. dest-ip:dest-port or bind-ip:bind-port:dest-ip:dest-port */
  352. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  353. &dest_addr, &dest_addrlen)) < 0)
  354. return ret;
  355. if (!dest_addr)
  356. return -PAL_ERROR_INVAL;
  357. if (bind_addr && bind_addr->sa_family != dest_addr->sa_family)
  358. return -PAL_ERROR_INVAL;
  359. #if ALLOW_BIND_ANY == 0
  360. /* the socket need to have a binding address, a null address or an
  361. any address is not allowed */
  362. if (bind_addr && addr_check_any(bind_addr))
  363. return -PAL_ERROR_INVAL;
  364. #endif
  365. struct sockopt sock_options;
  366. ret = ocall_sock_connect(dest_addr->sa_family,
  367. sock_type(SOCK_STREAM, options), 0,
  368. dest_addr, dest_addrlen,
  369. bind_addr, &bind_addrlen, &sock_options);
  370. if (IS_ERR(ret))
  371. return unix_to_pal_error(ERRNO(ret));
  372. *handle = socket_create_handle(pal_type_tcp, ret, options,
  373. bind_addr, bind_addrlen,
  374. dest_addr, dest_addrlen,
  375. &sock_options);
  376. if (!(*handle)) {
  377. ocall_close(ret);
  378. return -PAL_ERROR_NOMEM;
  379. }
  380. return 0;
  381. }
  382. /* 'open' operation of tcp stream */
  383. static int tcp_open (PAL_HANDLE *handle, const char * type, const char * uri,
  384. int access, int share, int create, int options)
  385. {
  386. if (!WITHIN_MASK(access, PAL_ACCESS_MASK) ||
  387. !WITHIN_MASK(share, PAL_SHARE_MASK) ||
  388. !WITHIN_MASK(create, PAL_CREATE_MASK) ||
  389. !WITHIN_MASK(options, PAL_OPTION_MASK))
  390. return -PAL_ERROR_INVAL;
  391. int uri_len = strlen(uri) + 1;
  392. if (uri_len > PAL_SOCKADDR_SIZE)
  393. return -PAL_ERROR_TOOLONG;
  394. char uri_buf[PAL_SOCKADDR_SIZE];
  395. memcpy(uri_buf, uri, uri_len);
  396. if (strcmp_static(type, "tcp.srv"))
  397. return tcp_listen(handle, uri_buf, options);
  398. if (strcmp_static(type, "tcp"))
  399. return tcp_connect(handle, uri_buf, options);
  400. return -PAL_ERROR_NOTSUPPORT;
  401. }
  402. /* 'read' operation of tcp stream */
  403. static int64_t tcp_read (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  404. void * buf)
  405. {
  406. if (offset)
  407. return -PAL_ERROR_INVAL;
  408. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  409. return -PAL_ERROR_NOTCONNECTION;
  410. if (handle->sock.fd == PAL_IDX_POISON)
  411. return -PAL_ERROR_ENDOFSTREAM;
  412. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  413. return -PAL_ERROR_INVAL;
  414. int bytes = ocall_sock_recv(handle->sock.fd, buf, len, NULL, NULL);
  415. if (IS_ERR(bytes))
  416. return unix_to_pal_error(ERRNO(bytes));
  417. if (!bytes)
  418. return -PAL_ERROR_ENDOFSTREAM;
  419. return bytes;
  420. }
  421. /* write' operation of tcp stream */
  422. static int64_t tcp_write (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  423. const void * buf)
  424. {
  425. if (offset)
  426. return -PAL_ERROR_INVAL;
  427. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  428. return -PAL_ERROR_NOTCONNECTION;
  429. if (handle->sock.fd == PAL_IDX_POISON)
  430. return -PAL_ERROR_CONNFAILED;
  431. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  432. return -PAL_ERROR_INVAL;
  433. int bytes = ocall_sock_send(handle->sock.fd, buf, len, NULL, 0);
  434. if (IS_ERR(bytes)) {
  435. bytes = unix_to_pal_error(ERRNO(bytes));
  436. if (bytes == -PAL_ERROR_TRYAGAIN)
  437. HANDLE_HDR(handle)->flags &= ~WRITABLE(0);
  438. return bytes;
  439. }
  440. if ((uint64_t)bytes == len)
  441. HANDLE_HDR(handle)->flags |= WRITABLE(0);
  442. else
  443. HANDLE_HDR(handle)->flags &= ~WRITABLE(0);
  444. return bytes;
  445. }
  446. /* used by 'open' operation of tcp stream for bound socket */
  447. static int udp_bind (PAL_HANDLE * handle, char * uri, int options)
  448. {
  449. struct sockaddr buffer, * bind_addr = &buffer;
  450. unsigned int bind_addrlen;
  451. int ret = 0;
  452. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  453. NULL, NULL)) < 0)
  454. return ret;
  455. assert(bind_addr);
  456. assert(bind_addrlen == addr_size(bind_addr));
  457. #if ALLOW_BIND_ANY == 0
  458. /* the socket need to have a binding address, a null address or an
  459. any address is not allowed */
  460. if (addr_check_any(bind_addr))
  461. return -PAL_ERROR_INVAL;
  462. #endif
  463. struct sockopt sock_options;
  464. ret = ocall_sock_listen(bind_addr->sa_family,
  465. sock_type(SOCK_DGRAM, options), 0,
  466. bind_addr, &bind_addrlen, &sock_options);
  467. if (IS_ERR(ret))
  468. return unix_to_pal_error(ERRNO(ret));
  469. *handle = socket_create_handle(pal_type_udpsrv, ret, options,
  470. bind_addr, bind_addrlen, NULL, 0,
  471. &sock_options);
  472. if (!(*handle)) {
  473. ocall_close(ret);
  474. return -PAL_ERROR_NOMEM;
  475. }
  476. return 0;
  477. }
  478. /* used by 'open' operation of tcp stream for connected socket */
  479. static int udp_connect (PAL_HANDLE * handle, char * uri, int options)
  480. {
  481. struct sockaddr buffer[2];
  482. struct sockaddr * bind_addr = buffer, * dest_addr = buffer + 1;
  483. unsigned int bind_addrlen, dest_addrlen;
  484. int ret;
  485. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen,
  486. &dest_addr, &dest_addrlen)) < 0)
  487. return ret;
  488. #if ALLOW_BIND_ANY == 0
  489. /* the socket need to have a binding address, a null address or an
  490. any address is not allowed */
  491. if (bind_addr && addr_check_any(bind_addr))
  492. return -PAL_ERROR_INVAL;
  493. #endif
  494. struct sockopt sock_options;
  495. ret = ocall_sock_connect(dest_addr ? dest_addr->sa_family : AF_INET,
  496. sock_type(SOCK_DGRAM, options), 0,
  497. dest_addr, dest_addrlen,
  498. bind_addr, &bind_addrlen, &sock_options);
  499. if (IS_ERR(ret))
  500. return unix_to_pal_error(ERRNO(ret));
  501. *handle = socket_create_handle(dest_addr ? pal_type_udp :
  502. pal_type_udpsrv, ret, options,
  503. bind_addr, bind_addrlen,
  504. dest_addr, dest_addrlen,
  505. &sock_options);
  506. if (!(*handle)) {
  507. ocall_close(ret);
  508. return -PAL_ERROR_NOMEM;
  509. }
  510. return 0;
  511. }
  512. static int udp_open (PAL_HANDLE *hdl, const char * type, const char * uri,
  513. int access, int share, int create, int options)
  514. {
  515. if (!WITHIN_MASK(access, PAL_ACCESS_MASK) ||
  516. !WITHIN_MASK(share, PAL_SHARE_MASK) ||
  517. !WITHIN_MASK(create, PAL_CREATE_MASK) ||
  518. !WITHIN_MASK(options, PAL_OPTION_MASK))
  519. return -PAL_ERROR_INVAL;
  520. char buf[PAL_SOCKADDR_SIZE];
  521. int len = strlen(uri);
  522. if (len >= PAL_SOCKADDR_SIZE)
  523. return -PAL_ERROR_TOOLONG;
  524. memcpy(buf, uri, len + 1);
  525. if (strcmp_static(type, "udp.srv"))
  526. return udp_bind(hdl, buf, options);
  527. if (strcmp_static(type, "udp"))
  528. return udp_connect(hdl, buf, options);
  529. return -PAL_ERROR_NOTSUPPORT;
  530. }
  531. static int64_t udp_receive (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  532. void * buf)
  533. {
  534. if (offset)
  535. return -PAL_ERROR_INVAL;
  536. if (!IS_HANDLE_TYPE(handle, udp))
  537. return -PAL_ERROR_NOTCONNECTION;
  538. if (handle->sock.fd == PAL_IDX_POISON)
  539. return -PAL_ERROR_BADHANDLE;
  540. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  541. return -PAL_ERROR_INVAL;
  542. int ret = ocall_sock_recv(handle->sock.fd, buf, len, NULL, NULL);
  543. return IS_ERR(ret) ? unix_to_pal_error(ERRNO(ret)) : ret;
  544. }
  545. static int64_t udp_receivebyaddr (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  546. void * buf, char * addr, size_t addrlen)
  547. {
  548. if (offset)
  549. return -PAL_ERROR_INVAL;
  550. if (!IS_HANDLE_TYPE(handle, udpsrv))
  551. return -PAL_ERROR_NOTCONNECTION;
  552. if (handle->sock.fd == PAL_IDX_POISON)
  553. return -PAL_ERROR_BADHANDLE;
  554. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  555. return -PAL_ERROR_INVAL;
  556. struct sockaddr conn_addr;
  557. socklen_t conn_addrlen = sizeof(struct sockaddr);
  558. int bytes = ocall_sock_recv(handle->sock.fd, buf, len, &conn_addr,
  559. &conn_addrlen);
  560. if (IS_ERR(bytes))
  561. return unix_to_pal_error(ERRNO(bytes));
  562. char * addr_uri = strcpy_static(addr, "udp:", addrlen);
  563. if (!addr_uri)
  564. return -PAL_ERROR_OVERFLOW;
  565. int ret = inet_create_uri(addr_uri, addr + addrlen - addr_uri, &conn_addr,
  566. conn_addrlen);
  567. if (ret < 0)
  568. return ret;
  569. return bytes;
  570. }
  571. static int64_t udp_send (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  572. const void * buf)
  573. {
  574. if (offset)
  575. return -PAL_ERROR_INVAL;
  576. if (!IS_HANDLE_TYPE(handle, udp))
  577. return -PAL_ERROR_NOTCONNECTION;
  578. if (handle->sock.fd == PAL_IDX_POISON)
  579. return -PAL_ERROR_BADHANDLE;
  580. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  581. return -PAL_ERROR_INVAL;
  582. int bytes = ocall_sock_send(handle->sock.fd, buf, len, NULL, 0);
  583. if (IS_ERR(bytes)) {
  584. bytes = unix_to_pal_error(ERRNO(bytes));
  585. if (bytes == -PAL_ERROR_TRYAGAIN)
  586. HANDLE_HDR(handle)->flags &= ~WRITABLE(0);
  587. return bytes;
  588. }
  589. if ((uint64_t)bytes == len)
  590. HANDLE_HDR(handle)->flags |= WRITABLE(0);
  591. else
  592. HANDLE_HDR(handle)->flags &= ~WRITABLE(0);
  593. return bytes;
  594. }
  595. static int64_t udp_sendbyaddr (PAL_HANDLE handle, uint64_t offset, uint64_t len,
  596. const void * buf, const char * addr, size_t addrlen)
  597. {
  598. if (offset)
  599. return -PAL_ERROR_INVAL;
  600. if (!IS_HANDLE_TYPE(handle, udpsrv))
  601. return -PAL_ERROR_NOTCONNECTION;
  602. if (handle->sock.fd == PAL_IDX_POISON)
  603. return -PAL_ERROR_BADHANDLE;
  604. if (!strpartcmp_static(addr, "udp:"))
  605. return -PAL_ERROR_INVAL;
  606. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  607. return -PAL_ERROR_INVAL;
  608. addr += static_strlen("udp:");
  609. addrlen -= static_strlen("udp:");
  610. char * addrbuf = __alloca(addrlen);
  611. memcpy(addrbuf, addr, addrlen);
  612. struct sockaddr conn_addr;
  613. unsigned int conn_addrlen = sizeof(struct sockaddr);
  614. int ret = inet_parse_uri(&addrbuf, &conn_addr, &conn_addrlen);
  615. if (ret < 0)
  616. return ret;
  617. int bytes = ocall_sock_send(handle->sock.fd, buf, len, &conn_addr,
  618. conn_addrlen);
  619. if (IS_ERR(bytes)) {
  620. bytes = unix_to_pal_error(ERRNO(bytes));
  621. if (bytes == -PAL_ERROR_TRYAGAIN)
  622. HANDLE_HDR(handle)->flags &= ~WRITABLE(0);
  623. return bytes;
  624. }
  625. if ((uint64_t)bytes == len)
  626. HANDLE_HDR(handle)->flags |= WRITABLE(0);
  627. else
  628. HANDLE_HDR(handle)->flags &= ~WRITABLE(0);
  629. return bytes;
  630. }
  631. static int socket_delete (PAL_HANDLE handle, int access)
  632. {
  633. if (handle->sock.fd == PAL_IDX_POISON)
  634. return 0;
  635. if (!IS_HANDLE_TYPE(handle, tcp) && access)
  636. return -PAL_ERROR_INVAL;
  637. if (IS_HANDLE_TYPE(handle, tcp) || IS_HANDLE_TYPE(handle, tcpsrv)) {
  638. int shutdown;
  639. switch (access) {
  640. case 0:
  641. shutdown = SHUT_RDWR;
  642. break;
  643. case PAL_DELETE_RD:
  644. shutdown = SHUT_RD;
  645. break;
  646. case PAL_DELETE_WR:
  647. shutdown = SHUT_WR;
  648. break;
  649. default:
  650. return -PAL_ERROR_INVAL;
  651. }
  652. ocall_sock_shutdown(handle->sock.fd, shutdown);
  653. }
  654. return 0;
  655. }
  656. static int socket_close (PAL_HANDLE handle)
  657. {
  658. if (handle->sock.fd != PAL_IDX_POISON) {
  659. ocall_close(handle->sock.fd);
  660. handle->sock.fd = PAL_IDX_POISON;
  661. }
  662. if (handle->sock.bind)
  663. handle->sock.bind = (PAL_PTR) NULL;
  664. if (handle->sock.conn)
  665. handle->sock.conn = (PAL_PTR) NULL;
  666. return 0;
  667. }
  668. static int socket_attrquerybyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  669. {
  670. if (handle->sock.fd == PAL_IDX_POISON)
  671. return -PAL_ERROR_BADHANDLE;
  672. attr->handle_type = HANDLE_HDR(handle)->type;
  673. attr->disconnected = HANDLE_HDR(handle)->flags & ERROR(0);
  674. attr->nonblocking = handle->sock.nonblocking;
  675. attr->writable = HANDLE_HDR(handle)->flags & WRITABLE(0);
  676. attr->pending_size = 0; /* fill in later */
  677. attr->socket.linger = handle->sock.linger;
  678. attr->socket.receivebuf = handle->sock.receivebuf;
  679. attr->socket.sendbuf = handle->sock.sendbuf;
  680. attr->socket.receivetimeout = handle->sock.receivetimeout;
  681. attr->socket.sendtimeout = handle->sock.sendtimeout;
  682. attr->socket.tcp_cork = handle->sock.tcp_cork;
  683. attr->socket.tcp_keepalive = handle->sock.tcp_keepalive;
  684. attr->socket.tcp_nodelay = handle->sock.tcp_nodelay;
  685. int fd = handle->sock.fd, ret;
  686. if (!IS_HANDLE_TYPE(handle, tcpsrv)) {
  687. /* try use ioctl FIONEAD to get the size of socket */
  688. ret = ocall_fionread(fd);
  689. if (IS_ERR(ret))
  690. return unix_to_pal_error(ERRNO(ret));
  691. attr->pending_size = ret;
  692. }
  693. struct pollfd pfd = { .fd = fd, .events = POLLIN, .revents = 0 };
  694. int64_t waittime = 0;
  695. ret = ocall_poll(&pfd, 1, &waittime);
  696. if (IS_ERR(ret))
  697. return unix_to_pal_error(ERRNO(ret));
  698. attr->readable = (ret == 1 && pfd.revents == POLLIN);
  699. return 0;
  700. }
  701. static int socket_attrsetbyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  702. {
  703. if (handle->sock.fd == PAL_IDX_POISON)
  704. return -PAL_ERROR_BADHANDLE;
  705. int fd = handle->sock.fd, ret, val;
  706. if (attr->nonblocking != handle->sock.nonblocking) {
  707. ret = ocall_fsetnonblock(fd, attr->nonblocking);
  708. if (IS_ERR(ret))
  709. return unix_to_pal_error(ERRNO(ret));
  710. handle->sock.nonblocking = attr->nonblocking;
  711. }
  712. if (HANDLE_TYPE(handle) != pal_type_tcpsrv) {
  713. struct __kernel_linger {
  714. int l_onoff;
  715. int l_linger;
  716. };
  717. if (attr->socket.linger != handle->sock.linger) {
  718. struct __kernel_linger l;
  719. l.l_onoff = attr->socket.linger ? 1 : 0;
  720. l.l_linger = attr->socket.linger;
  721. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_LINGER, &l,
  722. sizeof(struct __kernel_linger));
  723. if (IS_ERR(ret))
  724. return unix_to_pal_error(ERRNO(ret));
  725. handle->sock.linger = attr->socket.linger;
  726. }
  727. if (attr->socket.receivebuf != handle->sock.receivebuf) {
  728. val = attr->socket.receivebuf;
  729. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_RCVBUF, &val,
  730. sizeof(int));
  731. if (IS_ERR(ret))
  732. return unix_to_pal_error(ERRNO(ret));
  733. handle->sock.receivebuf = attr->socket.receivebuf;
  734. }
  735. if (attr->socket.sendbuf != handle->sock.sendbuf) {
  736. val = attr->socket.sendbuf;
  737. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_SNDBUF,
  738. &val, sizeof(int));
  739. if (IS_ERR(ret))
  740. return unix_to_pal_error(ERRNO(ret));
  741. handle->sock.sendbuf = attr->socket.sendbuf;
  742. }
  743. if (attr->socket.receivetimeout != handle->sock.receivetimeout) {
  744. val = attr->socket.receivetimeout;
  745. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_RCVTIMEO,
  746. &val, sizeof(int));
  747. if (IS_ERR(ret))
  748. return unix_to_pal_error(ERRNO(ret));
  749. handle->sock.receivetimeout = attr->socket.receivetimeout;
  750. }
  751. if (attr->socket.sendtimeout != handle->sock.sendtimeout) {
  752. val = attr->socket.sendtimeout;
  753. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_SNDTIMEO,
  754. &val, sizeof(int));
  755. if (IS_ERR(ret))
  756. return unix_to_pal_error(ERRNO(ret));
  757. handle->sock.sendtimeout = attr->socket.sendtimeout;
  758. }
  759. }
  760. if (HANDLE_TYPE(handle) == pal_type_tcp ||
  761. HANDLE_TYPE(handle) == pal_type_tcpsrv) {
  762. if (attr->socket.tcp_cork != handle->sock.tcp_cork) {
  763. val = attr->socket.tcp_cork ? 1 : 0;
  764. ret = ocall_sock_setopt(fd, SOL_TCP, TCP_CORK,
  765. &val, sizeof(int));
  766. if (IS_ERR(ret))
  767. return unix_to_pal_error(ERRNO(ret));
  768. handle->sock.tcp_cork = attr->socket.tcp_cork;
  769. }
  770. if (attr->socket.tcp_keepalive != handle->sock.tcp_keepalive) {
  771. val = attr->socket.tcp_keepalive ? 1 : 0;
  772. ret = ocall_sock_setopt(fd, SOL_SOCKET, SO_KEEPALIVE,
  773. &val, sizeof(int));
  774. if (IS_ERR(ret))
  775. return unix_to_pal_error(ERRNO(ret));
  776. handle->sock.tcp_keepalive = attr->socket.tcp_keepalive;
  777. }
  778. if (attr->socket.tcp_nodelay != handle->sock.tcp_nodelay) {
  779. val = attr->socket.tcp_nodelay ? 1 : 0;
  780. ret = ocall_sock_setopt(fd, SOL_TCP, TCP_NODELAY,
  781. &val, sizeof(int));
  782. if (IS_ERR(ret))
  783. return unix_to_pal_error(ERRNO(ret));
  784. handle->sock.tcp_nodelay = attr->socket.tcp_nodelay;
  785. }
  786. }
  787. return 0;
  788. }
  789. static int socket_getname (PAL_HANDLE handle, char * buffer, size_t count)
  790. {
  791. int old_count = count;
  792. int ret;
  793. const char * prefix = NULL;
  794. size_t prefix_len = 0;
  795. struct sockaddr * bind_addr = NULL, * dest_addr = NULL;
  796. switch (HANDLE_TYPE(handle)) {
  797. case pal_type_tcpsrv:
  798. prefix_len = static_strlen("tcp.srv");
  799. prefix = "tcp.srv";
  800. bind_addr = (struct sockaddr *) handle->sock.bind;
  801. break;
  802. case pal_type_tcp:
  803. prefix_len = static_strlen("tcp");
  804. prefix = "tcp";
  805. bind_addr = (struct sockaddr *) handle->sock.bind;
  806. dest_addr = (struct sockaddr *) handle->sock.conn;
  807. break;
  808. case pal_type_udpsrv:
  809. prefix_len = static_strlen("udp.srv");
  810. prefix = "udp.srv";
  811. bind_addr = (struct sockaddr *) handle->sock.bind;
  812. break;
  813. case pal_type_udp:
  814. prefix_len = static_strlen("udp");
  815. prefix = "udp";
  816. bind_addr = (struct sockaddr *) handle->sock.bind;
  817. dest_addr = (struct sockaddr *) handle->sock.conn;
  818. break;
  819. default:
  820. return -PAL_ERROR_INVAL;
  821. }
  822. if (prefix_len >= count)
  823. return -PAL_ERROR_OVERFLOW;
  824. memcpy(buffer, prefix, prefix_len + 1);
  825. buffer += prefix_len;
  826. count -= prefix_len;
  827. for (int i = 0 ; i < 2 ; i++) {
  828. struct sockaddr * addr = i ? dest_addr : bind_addr;
  829. if (addr) {
  830. if (count <= 1)
  831. return -PAL_ERROR_OVERFLOW;
  832. buffer[0] = ':';
  833. buffer[1] = 0;
  834. buffer++;
  835. count--;
  836. if ((ret = inet_create_uri(buffer, count, addr,
  837. addr_size(addr))) < 0)
  838. return ret;
  839. buffer += ret;
  840. count -= ret;
  841. }
  842. }
  843. return old_count - count;
  844. }
  845. struct handle_ops tcp_ops = {
  846. .getname = &socket_getname,
  847. .open = &tcp_open,
  848. .waitforclient = &tcp_accept,
  849. .read = &tcp_read,
  850. .write = &tcp_write,
  851. .delete = &socket_delete,
  852. .close = &socket_close,
  853. .attrquerybyhdl = &socket_attrquerybyhdl,
  854. .attrsetbyhdl = &socket_attrsetbyhdl,
  855. };
  856. struct handle_ops udp_ops = {
  857. .getname = &socket_getname,
  858. .open = &udp_open,
  859. .read = &udp_receive,
  860. .write = &udp_send,
  861. .delete = &socket_delete,
  862. .close = &socket_close,
  863. .attrquerybyhdl = &socket_attrquerybyhdl,
  864. .attrsetbyhdl = &socket_attrsetbyhdl,
  865. };
  866. struct handle_ops udpsrv_ops = {
  867. .getname = &socket_getname,
  868. .open = &udp_open,
  869. .readbyaddr = &udp_receivebyaddr,
  870. .writebyaddr = &udp_sendbyaddr,
  871. .delete = &socket_delete,
  872. .close = &socket_close,
  873. .attrquerybyhdl = &socket_attrquerybyhdl,
  874. .attrsetbyhdl = &socket_attrsetbyhdl,
  875. };
  876. PAL_HANDLE _DkBroadcastStreamOpen (void)
  877. {
  878. PAL_HANDLE hdl = malloc(HANDLE_SIZE(file));
  879. SET_HANDLE_TYPE(hdl, mcast);
  880. HANDLE_HDR(hdl)->flags |= RFD(0)|WFD(1)|WRITABLE(1);
  881. hdl->mcast.port = pal_sec.mcast_port;
  882. hdl->mcast.srv = pal_sec.mcast_srv;
  883. hdl->mcast.cli = pal_sec.mcast_cli;
  884. return hdl;
  885. }
  886. static int64_t mcast_send (PAL_HANDLE handle, uint64_t offset, uint64_t size,
  887. const void * buf)
  888. {
  889. if (offset)
  890. return -PAL_ERROR_INVAL;
  891. if (handle->mcast.srv == PAL_IDX_POISON)
  892. return -PAL_ERROR_BADHANDLE;
  893. if (size >= (1ULL << (sizeof(unsigned int) * 8)))
  894. return -PAL_ERROR_INVAL;
  895. int bytes = ocall_sock_send(handle->mcast.srv, buf, size,
  896. NULL, 0);
  897. if (IS_ERR(bytes)) {
  898. bytes = unix_to_pal_error(ERRNO(bytes));
  899. if (bytes == -PAL_ERROR_TRYAGAIN)
  900. HANDLE_HDR(handle)->flags &= ~WRITABLE(1);
  901. return bytes;
  902. }
  903. if ((uint64_t)bytes == size)
  904. HANDLE_HDR(handle)->flags |= WRITABLE(1);
  905. else
  906. HANDLE_HDR(handle)->flags &= ~WRITABLE(1);
  907. return bytes;
  908. }
  909. static int64_t mcast_receive (PAL_HANDLE handle, uint64_t offset, uint64_t size,
  910. void * buf)
  911. {
  912. if (offset)
  913. return -PAL_ERROR_INVAL;
  914. if (handle->mcast.cli == PAL_IDX_POISON)
  915. return -PAL_ERROR_BADHANDLE;
  916. if (size >= (1ULL << (sizeof(unsigned int) * 8)))
  917. return -PAL_ERROR_INVAL;
  918. int bytes = ocall_sock_recv(handle->mcast.cli, buf, size, NULL,
  919. NULL);
  920. if (IS_ERR(bytes))
  921. bytes = unix_to_pal_error(ERRNO(bytes));
  922. if (bytes == -PAL_ERROR_TRYAGAIN)
  923. HANDLE_HDR(handle)->flags &= ~WRITABLE(1);
  924. return bytes;
  925. }
  926. static int mcast_close (PAL_HANDLE handle)
  927. {
  928. if (handle->mcast.srv != PAL_IDX_POISON) {
  929. ocall_close(handle->mcast.srv);
  930. handle->mcast.srv = PAL_IDX_POISON;
  931. }
  932. if (handle->mcast.cli != PAL_IDX_POISON) {
  933. ocall_close(handle->mcast.cli);
  934. handle->mcast.cli = PAL_IDX_POISON;
  935. }
  936. return 0;
  937. }
  938. static int mcast_attrquerybyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  939. {
  940. if (handle->mcast.cli == PAL_IDX_POISON)
  941. return -PAL_ERROR_BADHANDLE;
  942. int ret = ocall_fionread(handle->mcast.cli);
  943. if (IS_ERR(ret))
  944. return unix_to_pal_error(ERRNO(ret));
  945. memset(attr, 0, sizeof(PAL_STREAM_ATTR));
  946. attr->pending_size = ret;
  947. attr->disconnected = HANDLE_HDR(handle)->flags & (ERROR(0)|ERROR(1));
  948. attr->readable = (attr->pending_size > 0);
  949. attr->writable = HANDLE_HDR(handle)->flags & WRITABLE(1);
  950. attr->nonblocking = handle->mcast.nonblocking;
  951. return 0;
  952. }
  953. static int mcast_attrsetbyhdl (PAL_HANDLE handle, PAL_STREAM_ATTR * attr)
  954. {
  955. if (handle->mcast.cli == PAL_IDX_POISON)
  956. return -PAL_ERROR_BADHANDLE;
  957. PAL_BOL * nonblocking = &handle->mcast.nonblocking;
  958. if (attr->nonblocking != *nonblocking) {
  959. int ret = ocall_fsetnonblock(handle->mcast.cli, *nonblocking);
  960. if (IS_ERR(ret))
  961. return unix_to_pal_error(ERRNO(ret));
  962. *nonblocking = attr->nonblocking;
  963. }
  964. return 0;
  965. }
  966. struct handle_ops mcast_ops = {
  967. .write = &mcast_send,
  968. .read = &mcast_receive,
  969. .close = &mcast_close,
  970. .attrquerybyhdl = &mcast_attrquerybyhdl,
  971. .attrsetbyhdl = &mcast_attrsetbyhdl,
  972. };