db_sockets.c 31 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009
  1. /* Copyright (C) 2014 Stony Brook University
  2. This file is part of Graphene Library OS.
  3. Graphene Library OS is free software: you can redistribute it and/or
  4. modify it under the terms of the GNU Lesser General Public License
  5. as published by the Free Software Foundation, either version 3 of the
  6. License, or (at your option) any later version.
  7. Graphene Library OS is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU Lesser General Public License for more details.
  11. You should have received a copy of the GNU Lesser General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>. */
  13. /*
  14. * db_socket.c
  15. *
  16. * This file contains operations for streams with URIs that start with
  17. * "tcp:", "tcp.srv:", "udp:", "udp.srv:".
  18. */
  19. #include <linux/in.h>
  20. #include <linux/in6.h>
  21. #include <linux/poll.h>
  22. #include <linux/types.h>
  23. #include "api.h"
  24. #include "pal.h"
  25. #include "pal_debug.h"
  26. #include "pal_defs.h"
  27. #include "pal_error.h"
  28. #include "pal_internal.h"
  29. #include "pal_linux.h"
  30. #include "pal_linux_defs.h"
  31. #include "pal_linux_error.h"
  32. #include "pal_security.h"
  33. typedef __kernel_pid_t pid_t;
  34. #include <asm-generic/socket.h>
  35. #include <asm/fcntl.h>
  36. #ifndef SOL_TCP
  37. #define SOL_TCP 6
  38. #endif
  39. #ifndef TCP_NODELAY
  40. #define TCP_NODELAY 1
  41. #endif
  42. #ifndef TCP_CORK
  43. #define TCP_CORK 3
  44. #endif
  45. /* 96 bytes is the minimal size of a buffer to store an IPv4/IPv6
  46. address */
  47. #define PAL_SOCKADDR_SIZE 96
  /* Return the size of the concrete address structure selected by addr->sa_family:
   * sizeof(struct sockaddr_in) for AF_INET, sizeof(struct sockaddr_in6) for AF_INET6,
   * and 0 for every other family. */
  static size_t addr_size(const struct sockaddr* addr) {
      if (addr->sa_family == AF_INET)
          return sizeof(struct sockaddr_in);

      if (addr->sa_family == AF_INET6)
          return sizeof(struct sockaddr_in6);

      return 0;
  }
  58. /* parsing the string of uri, and fill in the socket address structure.
  59. the latest pointer of uri, length of socket address are returned. */
  60. static int inet_parse_uri(char** uri, struct sockaddr* addr, unsigned int* addrlen) {
  61. char* tmp = *uri;
  62. char* end;
  63. char* addr_str = NULL;
  64. char* port_str;
  65. int af;
  66. void* addr_buf;
  67. int addr_len;
  68. __be16* port_buf;
  69. int slen;
  70. if (tmp[0] == '[') {
  71. /* for IPv6, the address will be in the form of
  72. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  73. struct sockaddr_in6* addr_in6 = (struct sockaddr_in6*)addr;
  74. slen = sizeof(struct sockaddr_in6);
  75. memset(addr, 0, slen);
  76. end = strchr(tmp + 1, ']');
  77. if (!end || *(end + 1) != ':')
  78. goto inval;
  79. addr_str = tmp + 1;
  80. addr_len = end - tmp - 1;
  81. port_str = end + 2;
  82. for (end = port_str; *end >= '0' && *end <= '9'; end++)
  83. ;
  84. addr_in6->sin6_family = af = AF_INET6;
  85. addr_buf = &addr_in6->sin6_addr.s6_addr;
  86. port_buf = &addr_in6->sin6_port;
  87. } else {
  88. /* for IP, the address will be in the form of "x.x.x.x:port". */
  89. struct sockaddr_in* addr_in = (struct sockaddr_in*)addr;
  90. slen = sizeof(struct sockaddr_in);
  91. memset(addr, 0, slen);
  92. end = strchr(tmp, ':');
  93. if (!end)
  94. goto inval;
  95. addr_str = tmp;
  96. addr_len = end - tmp;
  97. port_str = end + 1;
  98. for (end = port_str; *end >= '0' && *end <= '9'; end++)
  99. ;
  100. addr_in->sin_family = af = AF_INET;
  101. addr_buf = &addr_in->sin_addr.s_addr;
  102. port_buf = &addr_in->sin_port;
  103. }
  104. if (af == AF_INET) {
  105. if (!inet_pton4(addr_str, addr_len, addr_buf))
  106. goto inval;
  107. } else {
  108. if (!inet_pton6(addr_str, addr_len, addr_buf))
  109. goto inval;
  110. }
  111. *port_buf = __htons(atoi(port_str));
  112. *uri = *end ? end + 1 : NULL;
  113. if (addrlen)
  114. *addrlen = slen;
  115. return 0;
  116. inval:
  117. return -PAL_ERROR_INVAL;
  118. }
  119. /* create the string of uri from the given socket address */
  120. static int inet_create_uri(char* uri, int count, struct sockaddr* addr, int addrlen) {
  121. int len = 0;
  122. if (addr->sa_family == AF_INET) {
  123. if (addrlen != sizeof(struct sockaddr_in))
  124. return -PAL_ERROR_INVAL;
  125. struct sockaddr_in* addr_in = (struct sockaddr_in*)addr;
  126. char* addr = (char*)&addr_in->sin_addr.s_addr;
  127. /* for IP, the address will be in the form of "x.x.x.x:port". */
  128. len = snprintf(uri, count, "%u.%u.%u.%u:%u", (unsigned char)addr[0], (unsigned char)addr[1],
  129. (unsigned char)addr[2], (unsigned char)addr[3], __ntohs(addr_in->sin_port));
  130. } else if (addr->sa_family == AF_INET6) {
  131. if (addrlen != sizeof(struct sockaddr_in6))
  132. return -PAL_ERROR_INVAL;
  133. struct sockaddr_in6* addr_in6 = (struct sockaddr_in6*)addr;
  134. unsigned short* addr = (unsigned short*)&addr_in6->sin6_addr.s6_addr;
  135. /* for IPv6, the address will be in the form of
  136. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  137. len = snprintf(uri, count, "[%04x:%04x:%04x:%04x:%04x:%04x:%04x:%04x]:%u", addr[0], addr[1],
  138. addr[2], addr[3], addr[4], addr[5], addr[6], addr[7],
  139. __ntohs(addr_in6->sin6_port));
  140. } else {
  141. return -PAL_ERROR_INVAL;
  142. }
  143. if (len >= count)
  144. return -PAL_ERROR_TOOLONG;
  145. return len;
  146. }
  /*
   * Split a socket URI into a binding address and/or a destination address.
   *
   * The URI is either "bind-addr:bind-port:connect-addr:connect-port" or just "addr:port".
   * bind_addr/dest_addr point at caller-owned buffers (either pair may be NULL when the caller
   * does not want that address); the matching *_addrlen receives the parsed size.
   *
   * - With neither output requested, nothing is parsed and 0 is returned.
   * - With a NULL or empty uri, every supplied output is reset to NULL / 0.
   * - When both outputs are requested but only one address can be parsed, that address is
   *   reported as the destination and the binding address is reset to NULL / 0.
   *
   * Returns 0 on success or the negative error from inet_parse_uri() for the first address.
   */
  static int socket_parse_uri(char* uri, struct sockaddr** bind_addr, unsigned int* bind_addrlen,
                              struct sockaddr** dest_addr, unsigned int* dest_addrlen) {
      if (!bind_addr && !dest_addr)
          return 0;

      if (!uri || !*uri) {
          if (bind_addr)
              *bind_addr = NULL;
          if (bind_addrlen)
              *bind_addrlen = 0;
          if (dest_addr)
              *dest_addr = NULL;
          if (dest_addrlen)
              *dest_addrlen = 0;
          return 0;
      }

      /* the first address goes into the binding slot when there is one, else the destination */
      struct sockaddr* first_addr;
      unsigned int* first_addrlen;
      if (bind_addr) {
          first_addr    = *bind_addr;
          first_addrlen = bind_addrlen;
      } else {
          first_addr    = *dest_addr;
          first_addrlen = dest_addrlen;
      }

      int ret = inet_parse_uri(&uri, first_addr, first_addrlen);
      if (ret < 0)
          return ret;

      if (!bind_addr || !dest_addr)
          return 0;

      /* try to read a second address; a failure here is not an error */
      int have_second = 0;
      if (uri) {
          ret = inet_parse_uri(&uri, *dest_addr, dest_addrlen);
          have_second = ret >= 0;
      }

      if (!have_second) {
          /* only one address was given: it is the connection address, not the binding one */
          *dest_addr    = *bind_addr;
          *dest_addrlen = *bind_addrlen;
          *bind_addr    = NULL;
          *bind_addrlen = 0;
      }

      return 0;
  }
  182. /* fill in the PAL handle based on the file descriptors and address given. */
  183. static inline PAL_HANDLE socket_create_handle(int type, int fd, int options,
  184. struct sockaddr* bind_addr, unsigned int bind_addrlen,
  185. struct sockaddr* dest_addr, unsigned int dest_addrlen,
  186. struct sockopt* sock_options) {
  187. PAL_HANDLE hdl =
  188. malloc(HANDLE_SIZE(sock) + (bind_addr ? bind_addrlen : 0) + (dest_addr ? dest_addrlen : 0));
  189. if (!hdl)
  190. return NULL;
  191. memset(hdl, 0, sizeof(struct pal_handle));
  192. init_handle_hdr(HANDLE_HDR(hdl), type);
  193. HANDLE_HDR(hdl)->flags |= RFD(0) | (type != pal_type_tcpsrv ? WFD(0) : 0);
  194. hdl->sock.fd = fd;
  195. void* addr = (void*)hdl + HANDLE_SIZE(sock);
  196. if (bind_addr) {
  197. hdl->sock.bind = (PAL_PTR)addr;
  198. memcpy(addr, bind_addr, bind_addrlen);
  199. addr += bind_addrlen;
  200. } else {
  201. hdl->sock.bind = (PAL_PTR)NULL;
  202. }
  203. if (dest_addr) {
  204. hdl->sock.conn = (PAL_PTR)addr;
  205. memcpy(addr, dest_addr, dest_addrlen);
  206. addr += dest_addrlen;
  207. } else {
  208. hdl->sock.conn = (PAL_PTR)NULL;
  209. }
  210. hdl->sock.nonblocking = (options & PAL_OPTION_NONBLOCK) ? PAL_TRUE : PAL_FALSE;
  211. hdl->sock.linger = sock_options->linger;
  212. hdl->sock.receivebuf = sock_options->receivebuf;
  213. hdl->sock.sendbuf = sock_options->sendbuf;
  214. hdl->sock.receivetimeout = sock_options->receivetimeout;
  215. hdl->sock.sendtimeout = sock_options->sendtimeout;
  216. hdl->sock.tcp_cork = sock_options->tcp_cork;
  217. hdl->sock.tcp_keepalive = sock_options->tcp_keepalive;
  218. hdl->sock.tcp_nodelay = sock_options->tcp_nodelay;
  219. return hdl;
  220. }
  221. #if ALLOW_BIND_ANY == 0
  /*
   * Report whether the size bytes starting at mem are all zero.
   *
   * The region is scanned one byte at a time, so mem needs no particular alignment and no
   * address outside [mem, mem + size) is ever formed or read. An empty region (size == 0)
   * counts as all-zero.
   */
  static bool check_zero(void* mem, size_t size) {
      const unsigned char* bytes = mem;

      for (size_t i = 0; i < size; i++) {
          if (bytes[i])
              return false;
      }

      return true;
  }
  /* Tell whether addr is the "any" address: for AF_INET and AF_INET6 that means a zero port
   * together with an all-zero address field. Every other family yields false. */
  static bool check_any_addr(struct sockaddr* addr) {
      switch (addr->sa_family) {
          case AF_INET: {
              struct sockaddr_in* in4 = (struct sockaddr_in*)addr;
              if (in4->sin_port != 0)
                  return false;
              return check_zero(&in4->sin_addr, sizeof(in4->sin_addr));
          }
          case AF_INET6: {
              struct sockaddr_in6* in6 = (struct sockaddr_in6*)addr;
              if (in6->sin6_port != 0)
                  return false;
              return check_zero(&in6->sin6_addr, sizeof(in6->sin6_addr));
          }
          default:
              return false;
      }
  }
  258. #endif
  259. static inline int sock_type(int type, int options) {
  260. if (options & PAL_OPTION_NONBLOCK)
  261. type |= SOCK_NONBLOCK;
  262. return type;
  263. }
  264. /* listen on a tcp socket */
  265. static int tcp_listen(PAL_HANDLE* handle, char* uri, int options) {
  266. struct sockaddr buffer;
  267. struct sockaddr* bind_addr = &buffer;
  268. unsigned int bind_addrlen;
  269. int ret;
  270. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen, NULL, NULL)) < 0)
  271. return ret;
  272. #if ALLOW_BIND_ANY == 0
  273. /* the socket need to have a binding address, a null address or an
  274. any address is not allowed */
  275. if (check_any_addr(bind_addr))
  276. return -PAL_ERROR_INVAL;
  277. #endif
  278. struct sockopt sock_options;
  279. memset(&sock_options, 0, sizeof(sock_options));
  280. sock_options.reuseaddr = 1; /* sockets are always set as reusable in Graphene */
  281. ret = ocall_listen(bind_addr->sa_family, sock_type(SOCK_STREAM, options), 0, bind_addr,
  282. &bind_addrlen, &sock_options);
  283. if (IS_ERR(ret))
  284. return unix_to_pal_error(ERRNO(ret));
  285. *handle = socket_create_handle(pal_type_tcpsrv, ret, options, bind_addr, bind_addrlen, NULL, 0,
  286. &sock_options);
  287. if (!(*handle)) {
  288. ocall_close(ret);
  289. return -PAL_ERROR_NOMEM;
  290. }
  291. return 0;
  292. }
  293. /* accept a tcp connection */
  294. static int tcp_accept(PAL_HANDLE handle, PAL_HANDLE* client) {
  295. if (!IS_HANDLE_TYPE(handle, tcpsrv) || !handle->sock.bind || handle->sock.conn)
  296. return -PAL_ERROR_NOTSERVER;
  297. if (handle->sock.fd == PAL_IDX_POISON)
  298. return -PAL_ERROR_BADHANDLE;
  299. struct sockaddr* bind_addr = (struct sockaddr*)handle->sock.bind;
  300. unsigned int bind_addrlen = addr_size(bind_addr);
  301. struct sockaddr dest_addr;
  302. unsigned int dest_addrlen = sizeof(struct sockaddr);
  303. int ret = 0;
  304. struct sockopt sock_options;
  305. memset(&sock_options, 0, sizeof(sock_options));
  306. sock_options.reuseaddr = 1; /* sockets are always set as reusable in Graphene */
  307. ret = ocall_accept(handle->sock.fd, &dest_addr, &dest_addrlen, &sock_options);
  308. if (IS_ERR(ret))
  309. return unix_to_pal_error(ERRNO(ret));
  310. *client = socket_create_handle(pal_type_tcp, ret, 0, bind_addr, bind_addrlen, &dest_addr,
  311. dest_addrlen, &sock_options);
  312. if (!(*client)) {
  313. ocall_close(ret);
  314. return -PAL_ERROR_NOMEM;
  315. }
  316. return 0;
  317. }
  318. /* connect on a tcp socket */
  319. static int tcp_connect(PAL_HANDLE* handle, char* uri, int options) {
  320. struct sockaddr buffer[2];
  321. struct sockaddr* bind_addr = buffer;
  322. struct sockaddr* dest_addr = buffer + 1;
  323. unsigned int bind_addrlen, dest_addrlen;
  324. int ret;
  325. /* accepting two kind of different uri:
  326. dest-ip:dest-port or bind-ip:bind-port:dest-ip:dest-port */
  327. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen, &dest_addr, &dest_addrlen)) < 0)
  328. return ret;
  329. if (!dest_addr)
  330. return -PAL_ERROR_INVAL;
  331. if (bind_addr && bind_addr->sa_family != dest_addr->sa_family)
  332. return -PAL_ERROR_INVAL;
  333. #if ALLOW_BIND_ANY == 0
  334. /* the socket need to have a binding address, a null address or an
  335. any address is not allowed */
  336. if (bind_addr && addr_check_any(bind_addr))
  337. return -PAL_ERROR_INVAL;
  338. #endif
  339. struct sockopt sock_options;
  340. memset(&sock_options, 0, sizeof(sock_options));
  341. sock_options.reuseaddr = 1; /* sockets are always set as reusable in Graphene */
  342. ret = ocall_connect(dest_addr->sa_family, sock_type(SOCK_STREAM, options), 0, dest_addr,
  343. dest_addrlen, bind_addr, &bind_addrlen, &sock_options);
  344. if (IS_ERR(ret))
  345. return unix_to_pal_error(ERRNO(ret));
  346. *handle = socket_create_handle(pal_type_tcp, ret, options, bind_addr, bind_addrlen, dest_addr,
  347. dest_addrlen, &sock_options);
  348. if (!(*handle)) {
  349. ocall_close(ret);
  350. return -PAL_ERROR_NOMEM;
  351. }
  352. return 0;
  353. }
  354. /* 'open' operation of tcp stream */
  355. static int tcp_open(PAL_HANDLE* handle, const char* type, const char* uri, int access, int share,
  356. int create, int options) {
  357. if (!WITHIN_MASK(access, PAL_ACCESS_MASK) || !WITHIN_MASK(share, PAL_SHARE_MASK) ||
  358. !WITHIN_MASK(create, PAL_CREATE_MASK) || !WITHIN_MASK(options, PAL_OPTION_MASK))
  359. return -PAL_ERROR_INVAL;
  360. int uri_len = strlen(uri) + 1;
  361. if (uri_len > PAL_SOCKADDR_SIZE)
  362. return -PAL_ERROR_TOOLONG;
  363. char uri_buf[PAL_SOCKADDR_SIZE];
  364. memcpy(uri_buf, uri, uri_len);
  365. if (!strcmp_static(type, URI_TYPE_TCP_SRV))
  366. return tcp_listen(handle, uri_buf, options);
  367. if (!strcmp_static(type, URI_TYPE_TCP))
  368. return tcp_connect(handle, uri_buf, options);
  369. return -PAL_ERROR_NOTSUPPORT;
  370. }
  371. /* 'read' operation of tcp stream */
  372. static int64_t tcp_read(PAL_HANDLE handle, uint64_t offset, uint64_t len, void* buf) {
  373. if (offset)
  374. return -PAL_ERROR_INVAL;
  375. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  376. return -PAL_ERROR_NOTCONNECTION;
  377. if (handle->sock.fd == PAL_IDX_POISON)
  378. return -PAL_ERROR_ENDOFSTREAM;
  379. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  380. return -PAL_ERROR_INVAL;
  381. int bytes = ocall_recv(handle->sock.fd, buf, len, NULL, NULL, NULL, NULL);
  382. if (IS_ERR(bytes))
  383. return unix_to_pal_error(ERRNO(bytes));
  384. if (!bytes)
  385. return -PAL_ERROR_ENDOFSTREAM;
  386. return bytes;
  387. }
  388. /* write' operation of tcp stream */
  389. static int64_t tcp_write(PAL_HANDLE handle, uint64_t offset, uint64_t len, const void* buf) {
  390. if (offset)
  391. return -PAL_ERROR_INVAL;
  392. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  393. return -PAL_ERROR_NOTCONNECTION;
  394. if (handle->sock.fd == PAL_IDX_POISON)
  395. return -PAL_ERROR_CONNFAILED;
  396. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  397. return -PAL_ERROR_INVAL;
  398. int bytes = ocall_send(handle->sock.fd, buf, len, NULL, 0, NULL, 0);
  399. if (IS_ERR(bytes))
  400. return unix_to_pal_error(ERRNO(bytes));
  401. return bytes;
  402. }
  403. /* used by 'open' operation of tcp stream for bound socket */
  404. static int udp_bind(PAL_HANDLE* handle, char* uri, int options) {
  405. struct sockaddr buffer;
  406. struct sockaddr* bind_addr = &buffer;
  407. unsigned int bind_addrlen;
  408. int ret = 0;
  409. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen, NULL, NULL)) < 0)
  410. return ret;
  411. assert(bind_addr);
  412. assert(bind_addrlen == addr_size(bind_addr));
  413. #if ALLOW_BIND_ANY == 0
  414. /* the socket need to have a binding address, a null address or an
  415. any address is not allowed */
  416. if (addr_check_any(bind_addr))
  417. return -PAL_ERROR_INVAL;
  418. #endif
  419. struct sockopt sock_options;
  420. memset(&sock_options, 0, sizeof(sock_options));
  421. sock_options.reuseaddr = 1; /* sockets are always set as reusable in Graphene */
  422. ret = ocall_listen(bind_addr->sa_family, sock_type(SOCK_DGRAM, options), 0, bind_addr,
  423. &bind_addrlen, &sock_options);
  424. if (IS_ERR(ret))
  425. return unix_to_pal_error(ERRNO(ret));
  426. *handle = socket_create_handle(pal_type_udpsrv, ret, options, bind_addr, bind_addrlen, NULL, 0,
  427. &sock_options);
  428. if (!(*handle)) {
  429. ocall_close(ret);
  430. return -PAL_ERROR_NOMEM;
  431. }
  432. return 0;
  433. }
  434. /* used by 'open' operation of tcp stream for connected socket */
  435. static int udp_connect(PAL_HANDLE* handle, char* uri, int options) {
  436. struct sockaddr buffer[2];
  437. struct sockaddr* bind_addr = buffer;
  438. struct sockaddr* dest_addr = buffer + 1;
  439. unsigned int bind_addrlen, dest_addrlen;
  440. int ret;
  441. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen, &dest_addr, &dest_addrlen)) < 0)
  442. return ret;
  443. #if ALLOW_BIND_ANY == 0
  444. /* the socket need to have a binding address, a null address or an
  445. any address is not allowed */
  446. if (bind_addr && addr_check_any(bind_addr))
  447. return -PAL_ERROR_INVAL;
  448. #endif
  449. struct sockopt sock_options;
  450. memset(&sock_options, 0, sizeof(sock_options));
  451. sock_options.reuseaddr = 1; /* sockets are always set as reusable in Graphene */
  452. ret = ocall_connect(dest_addr ? dest_addr->sa_family : AF_INET,
  453. sock_type(SOCK_DGRAM, options), 0, dest_addr, dest_addrlen, bind_addr,
  454. &bind_addrlen, &sock_options);
  455. if (IS_ERR(ret))
  456. return unix_to_pal_error(ERRNO(ret));
  457. *handle = socket_create_handle(dest_addr ? pal_type_udp : pal_type_udpsrv, ret, options,
  458. bind_addr, bind_addrlen, dest_addr, dest_addrlen, &sock_options);
  459. if (!(*handle)) {
  460. ocall_close(ret);
  461. return -PAL_ERROR_NOMEM;
  462. }
  463. return 0;
  464. }
  465. static int udp_open(PAL_HANDLE* hdl, const char* type, const char* uri, int access, int share,
  466. int create, int options) {
  467. if (!WITHIN_MASK(access, PAL_ACCESS_MASK) || !WITHIN_MASK(share, PAL_SHARE_MASK) ||
  468. !WITHIN_MASK(create, PAL_CREATE_MASK) || !WITHIN_MASK(options, PAL_OPTION_MASK))
  469. return -PAL_ERROR_INVAL;
  470. char buf[PAL_SOCKADDR_SIZE];
  471. int len = strlen(uri);
  472. if (len >= PAL_SOCKADDR_SIZE)
  473. return -PAL_ERROR_TOOLONG;
  474. memcpy(buf, uri, len + 1);
  475. if (!strcmp_static(type, URI_TYPE_UDP_SRV))
  476. return udp_bind(hdl, buf, options);
  477. if (!strcmp_static(type, URI_TYPE_UDP))
  478. return udp_connect(hdl, buf, options);
  479. return -PAL_ERROR_NOTSUPPORT;
  480. }
  481. static int64_t udp_receive(PAL_HANDLE handle, uint64_t offset, uint64_t len, void* buf) {
  482. if (offset)
  483. return -PAL_ERROR_INVAL;
  484. if (!IS_HANDLE_TYPE(handle, udp))
  485. return -PAL_ERROR_NOTCONNECTION;
  486. if (handle->sock.fd == PAL_IDX_POISON)
  487. return -PAL_ERROR_BADHANDLE;
  488. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  489. return -PAL_ERROR_INVAL;
  490. int ret = ocall_recv(handle->sock.fd, buf, len, NULL, NULL, NULL, NULL);
  491. return IS_ERR(ret) ? unix_to_pal_error(ERRNO(ret)) : ret;
  492. }
  493. static int64_t udp_receivebyaddr(PAL_HANDLE handle, uint64_t offset, uint64_t len, void* buf,
  494. char* addr, size_t addrlen) {
  495. if (offset)
  496. return -PAL_ERROR_INVAL;
  497. if (!IS_HANDLE_TYPE(handle, udpsrv))
  498. return -PAL_ERROR_NOTCONNECTION;
  499. if (handle->sock.fd == PAL_IDX_POISON)
  500. return -PAL_ERROR_BADHANDLE;
  501. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  502. return -PAL_ERROR_INVAL;
  503. struct sockaddr conn_addr;
  504. socklen_t conn_addrlen = sizeof(struct sockaddr);
  505. int bytes = ocall_recv(handle->sock.fd, buf, len, &conn_addr, &conn_addrlen, NULL, NULL);
  506. if (IS_ERR(bytes))
  507. return unix_to_pal_error(ERRNO(bytes));
  508. char* addr_uri = strcpy_static(addr, URI_PREFIX_UDP, addrlen);
  509. if (!addr_uri)
  510. return -PAL_ERROR_OVERFLOW;
  511. int ret = inet_create_uri(addr_uri, addr + addrlen - addr_uri, &conn_addr, conn_addrlen);
  512. if (ret < 0)
  513. return ret;
  514. return bytes;
  515. }
  516. static int64_t udp_send(PAL_HANDLE handle, uint64_t offset, uint64_t len, const void* buf) {
  517. if (offset)
  518. return -PAL_ERROR_INVAL;
  519. if (!IS_HANDLE_TYPE(handle, udp))
  520. return -PAL_ERROR_NOTCONNECTION;
  521. if (handle->sock.fd == PAL_IDX_POISON)
  522. return -PAL_ERROR_BADHANDLE;
  523. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  524. return -PAL_ERROR_INVAL;
  525. int bytes = ocall_send(handle->sock.fd, buf, len, NULL, 0, NULL, 0);
  526. if (IS_ERR(bytes))
  527. return unix_to_pal_error(ERRNO(bytes));
  528. return bytes;
  529. }
  530. static int64_t udp_sendbyaddr(PAL_HANDLE handle, uint64_t offset, uint64_t len, const void* buf,
  531. const char* addr, size_t addrlen) {
  532. if (offset)
  533. return -PAL_ERROR_INVAL;
  534. if (!IS_HANDLE_TYPE(handle, udpsrv))
  535. return -PAL_ERROR_NOTCONNECTION;
  536. if (handle->sock.fd == PAL_IDX_POISON)
  537. return -PAL_ERROR_BADHANDLE;
  538. if (!strstartswith_static(addr, URI_PREFIX_UDP))
  539. return -PAL_ERROR_INVAL;
  540. if (len >= (1ULL << (sizeof(unsigned int) * 8)))
  541. return -PAL_ERROR_INVAL;
  542. addr += static_strlen(URI_PREFIX_UDP);
  543. addrlen -= static_strlen(URI_PREFIX_UDP);
  544. char* addrbuf = __alloca(addrlen);
  545. memcpy(addrbuf, addr, addrlen);
  546. struct sockaddr conn_addr;
  547. unsigned int conn_addrlen = sizeof(struct sockaddr);
  548. int ret = inet_parse_uri(&addrbuf, &conn_addr, &conn_addrlen);
  549. if (ret < 0)
  550. return ret;
  551. int bytes = ocall_send(handle->sock.fd, buf, len, &conn_addr, conn_addrlen, NULL, 0);
  552. if (IS_ERR(bytes))
  553. return unix_to_pal_error(ERRNO(bytes));
  554. return bytes;
  555. }
  556. static int socket_delete(PAL_HANDLE handle, int access) {
  557. if (handle->sock.fd == PAL_IDX_POISON)
  558. return 0;
  559. if (!IS_HANDLE_TYPE(handle, tcp) && access)
  560. return -PAL_ERROR_INVAL;
  561. if (IS_HANDLE_TYPE(handle, tcp) || IS_HANDLE_TYPE(handle, tcpsrv)) {
  562. int shutdown;
  563. switch (access) {
  564. case 0:
  565. shutdown = SHUT_RDWR;
  566. break;
  567. case PAL_DELETE_RD:
  568. shutdown = SHUT_RD;
  569. break;
  570. case PAL_DELETE_WR:
  571. shutdown = SHUT_WR;
  572. break;
  573. default:
  574. return -PAL_ERROR_INVAL;
  575. }
  576. ocall_shutdown(handle->sock.fd, shutdown);
  577. }
  578. return 0;
  579. }
  580. static int socket_close(PAL_HANDLE handle) {
  581. if (handle->sock.fd != PAL_IDX_POISON) {
  582. ocall_close(handle->sock.fd);
  583. handle->sock.fd = PAL_IDX_POISON;
  584. }
  585. if (handle->sock.bind)
  586. handle->sock.bind = (PAL_PTR)NULL;
  587. if (handle->sock.conn)
  588. handle->sock.conn = (PAL_PTR)NULL;
  589. return 0;
  590. }
  591. static int socket_attrquerybyhdl(PAL_HANDLE handle, PAL_STREAM_ATTR* attr) {
  592. int ret;
  593. if (handle->sock.fd == PAL_IDX_POISON)
  594. return -PAL_ERROR_BADHANDLE;
  595. attr->handle_type = HANDLE_HDR(handle)->type;
  596. attr->nonblocking = handle->sock.nonblocking;
  597. attr->disconnected = HANDLE_HDR(handle)->flags & ERROR(0);
  598. attr->socket.linger = handle->sock.linger;
  599. attr->socket.receivebuf = handle->sock.receivebuf;
  600. attr->socket.sendbuf = handle->sock.sendbuf;
  601. attr->socket.receivetimeout = handle->sock.receivetimeout;
  602. attr->socket.sendtimeout = handle->sock.sendtimeout;
  603. attr->socket.tcp_cork = handle->sock.tcp_cork;
  604. attr->socket.tcp_keepalive = handle->sock.tcp_keepalive;
  605. attr->socket.tcp_nodelay = handle->sock.tcp_nodelay;
  606. /* get number of bytes available for reading (doesn't make sense for listening sockets) */
  607. attr->pending_size = 0;
  608. if (!IS_HANDLE_TYPE(handle, tcpsrv)) {
  609. ret = ocall_fionread(handle->sock.fd);
  610. if (IS_ERR(ret))
  611. return unix_to_pal_error(ERRNO(ret));
  612. attr->pending_size = ret;
  613. }
  614. /* query if there is data available for reading */
  615. struct pollfd pfd = {.fd = handle->sock.fd, .events = POLLIN | POLLOUT, .revents = 0};
  616. ret = ocall_poll(&pfd, 1, 0);
  617. if (IS_ERR(ret))
  618. return unix_to_pal_error(ERRNO(ret));
  619. attr->readable = ret == 1 && (pfd.revents & (POLLIN | POLLERR | POLLHUP)) == POLLIN;
  620. attr->writable = ret == 1 && (pfd.revents & (POLLOUT | POLLERR | POLLHUP)) == POLLOUT;
  621. return 0;
  622. }
  623. static int socket_attrsetbyhdl(PAL_HANDLE handle, PAL_STREAM_ATTR* attr) {
  624. if (handle->sock.fd == PAL_IDX_POISON)
  625. return -PAL_ERROR_BADHANDLE;
  626. int fd = handle->sock.fd, ret, val;
  627. if (attr->nonblocking != handle->sock.nonblocking) {
  628. ret = ocall_fsetnonblock(fd, attr->nonblocking);
  629. if (IS_ERR(ret))
  630. return unix_to_pal_error(ERRNO(ret));
  631. handle->sock.nonblocking = attr->nonblocking;
  632. }
  633. if (HANDLE_TYPE(handle) != pal_type_tcpsrv) {
  634. struct __kernel_linger {
  635. int l_onoff;
  636. int l_linger;
  637. };
  638. if (attr->socket.linger != handle->sock.linger) {
  639. struct __kernel_linger l;
  640. l.l_onoff = attr->socket.linger ? 1 : 0;
  641. l.l_linger = attr->socket.linger;
  642. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_LINGER, &l, sizeof(struct __kernel_linger));
  643. if (IS_ERR(ret))
  644. return unix_to_pal_error(ERRNO(ret));
  645. handle->sock.linger = attr->socket.linger;
  646. }
  647. if (attr->socket.receivebuf != handle->sock.receivebuf) {
  648. val = attr->socket.receivebuf;
  649. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &val, sizeof(int));
  650. if (IS_ERR(ret))
  651. return unix_to_pal_error(ERRNO(ret));
  652. handle->sock.receivebuf = attr->socket.receivebuf;
  653. }
  654. if (attr->socket.sendbuf != handle->sock.sendbuf) {
  655. val = attr->socket.sendbuf;
  656. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &val, sizeof(int));
  657. if (IS_ERR(ret))
  658. return unix_to_pal_error(ERRNO(ret));
  659. handle->sock.sendbuf = attr->socket.sendbuf;
  660. }
  661. if (attr->socket.receivetimeout != handle->sock.receivetimeout) {
  662. val = attr->socket.receivetimeout;
  663. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_RCVTIMEO, &val, sizeof(int));
  664. if (IS_ERR(ret))
  665. return unix_to_pal_error(ERRNO(ret));
  666. handle->sock.receivetimeout = attr->socket.receivetimeout;
  667. }
  668. if (attr->socket.sendtimeout != handle->sock.sendtimeout) {
  669. val = attr->socket.sendtimeout;
  670. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_SNDTIMEO, &val, sizeof(int));
  671. if (IS_ERR(ret))
  672. return unix_to_pal_error(ERRNO(ret));
  673. handle->sock.sendtimeout = attr->socket.sendtimeout;
  674. }
  675. }
  676. if (HANDLE_TYPE(handle) == pal_type_tcp || HANDLE_TYPE(handle) == pal_type_tcpsrv) {
  677. if (attr->socket.tcp_cork != handle->sock.tcp_cork) {
  678. val = attr->socket.tcp_cork ? 1 : 0;
  679. ret = ocall_setsockopt(fd, SOL_TCP, TCP_CORK, &val, sizeof(int));
  680. if (IS_ERR(ret))
  681. return unix_to_pal_error(ERRNO(ret));
  682. handle->sock.tcp_cork = attr->socket.tcp_cork;
  683. }
  684. if (attr->socket.tcp_keepalive != handle->sock.tcp_keepalive) {
  685. val = attr->socket.tcp_keepalive ? 1 : 0;
  686. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_KEEPALIVE, &val, sizeof(int));
  687. if (IS_ERR(ret))
  688. return unix_to_pal_error(ERRNO(ret));
  689. handle->sock.tcp_keepalive = attr->socket.tcp_keepalive;
  690. }
  691. if (attr->socket.tcp_nodelay != handle->sock.tcp_nodelay) {
  692. val = attr->socket.tcp_nodelay ? 1 : 0;
  693. ret = ocall_setsockopt(fd, SOL_TCP, TCP_NODELAY, &val, sizeof(int));
  694. if (IS_ERR(ret))
  695. return unix_to_pal_error(ERRNO(ret));
  696. handle->sock.tcp_nodelay = attr->socket.tcp_nodelay;
  697. }
  698. }
  699. return 0;
  700. }
  701. static int socket_getname(PAL_HANDLE handle, char* buffer, size_t count) {
  702. size_t orig_count = count;
  703. int ret;
  704. const char* prefix = NULL;
  705. size_t prefix_len = 0;
  706. struct sockaddr* bind_addr = NULL;
  707. struct sockaddr* dest_addr = NULL;
  708. switch (PAL_GET_TYPE(handle)) {
  709. case pal_type_tcpsrv:
  710. prefix_len = static_strlen(URI_PREFIX_TCP_SRV);
  711. prefix = URI_PREFIX_TCP_SRV;
  712. bind_addr = (struct sockaddr*)handle->sock.bind;
  713. break;
  714. case pal_type_tcp:
  715. prefix_len = static_strlen(URI_PREFIX_TCP);
  716. prefix = URI_PREFIX_TCP;
  717. bind_addr = (struct sockaddr*)handle->sock.bind;
  718. dest_addr = (struct sockaddr*)handle->sock.conn;
  719. break;
  720. case pal_type_udpsrv:
  721. prefix_len = static_strlen(URI_PREFIX_UDP_SRV);
  722. prefix = URI_PREFIX_UDP_SRV;
  723. bind_addr = (struct sockaddr*)handle->sock.bind;
  724. break;
  725. case pal_type_udp:
  726. prefix_len = static_strlen(URI_PREFIX_UDP);
  727. prefix = URI_PREFIX_UDP;
  728. bind_addr = (struct sockaddr*)handle->sock.bind;
  729. dest_addr = (struct sockaddr*)handle->sock.conn;
  730. break;
  731. default:
  732. return -PAL_ERROR_INVAL;
  733. }
  734. if (count < prefix_len + 1) {
  735. return -PAL_ERROR_OVERFLOW;
  736. }
  737. memcpy(buffer, prefix, prefix_len + 1);
  738. buffer += prefix_len;
  739. count -= prefix_len;
  740. if (bind_addr) {
  741. if ((ret = inet_create_uri(buffer, count, bind_addr, addr_size(bind_addr))) < 0) {
  742. return ret;
  743. }
  744. buffer += ret;
  745. count -= ret;
  746. }
  747. if (dest_addr) {
  748. if (bind_addr) {
  749. if (count < 2) {
  750. return -PAL_ERROR_OVERFLOW;
  751. }
  752. *buffer++ = ':';
  753. *buffer = '\0';
  754. count--;
  755. }
  756. if ((ret = inet_create_uri(buffer, count, dest_addr, addr_size(dest_addr))) < 0) {
  757. return ret;
  758. }
  759. buffer += ret;
  760. count -= ret;
  761. }
  762. return orig_count - count;
  763. }
  764. struct handle_ops tcp_ops = {
  765. .getname = &socket_getname,
  766. .open = &tcp_open,
  767. .waitforclient = &tcp_accept,
  768. .read = &tcp_read,
  769. .write = &tcp_write,
  770. .delete = &socket_delete,
  771. .close = &socket_close,
  772. .attrquerybyhdl = &socket_attrquerybyhdl,
  773. .attrsetbyhdl = &socket_attrsetbyhdl,
  774. };
  775. struct handle_ops udp_ops = {
  776. .getname = &socket_getname,
  777. .open = &udp_open,
  778. .read = &udp_receive,
  779. .write = &udp_send,
  780. .delete = &socket_delete,
  781. .close = &socket_close,
  782. .attrquerybyhdl = &socket_attrquerybyhdl,
  783. .attrsetbyhdl = &socket_attrsetbyhdl,
  784. };
  785. struct handle_ops udpsrv_ops = {
  786. .getname = &socket_getname,
  787. .open = &udp_open,
  788. .readbyaddr = &udp_receivebyaddr,
  789. .writebyaddr = &udp_sendbyaddr,
  790. .delete = &socket_delete,
  791. .close = &socket_close,
  792. .attrquerybyhdl = &socket_attrquerybyhdl,
  793. .attrsetbyhdl = &socket_attrsetbyhdl,
  794. };