db_sockets.c 31 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012
  1. /* Copyright (C) 2014 Stony Brook University
  2. This file is part of Graphene Library OS.
  3. Graphene Library OS is free software: you can redistribute it and/or
  4. modify it under the terms of the GNU Lesser General Public License
  5. as published by the Free Software Foundation, either version 3 of the
  6. License, or (at your option) any later version.
  7. Graphene Library OS is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU Lesser General Public License for more details.
  11. You should have received a copy of the GNU Lesser General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>. */
  13. /*
  14. * db_socket.c
  15. *
  16. * This file contains operands for streams with URIs that start with
  17. * "tcp:", "tcp.srv:", "udp:", "udp.srv:".
  18. */
  19. #include <linux/in.h>
  20. #include <linux/in6.h>
  21. #include <linux/poll.h>
  22. #include <linux/types.h>
  23. #include "api.h"
  24. #include "pal.h"
  25. #include "pal_debug.h"
  26. #include "pal_defs.h"
  27. #include "pal_error.h"
  28. #include "pal_internal.h"
  29. #include "pal_linux.h"
  30. #include "pal_linux_defs.h"
  31. #include "pal_linux_error.h"
  32. #include "pal_security.h"
  33. typedef __kernel_pid_t pid_t;
  34. #include <asm-generic/socket.h>
  35. #include <asm/fcntl.h>
  36. #ifndef SOL_TCP
  37. #define SOL_TCP 6
  38. #endif
  39. #ifndef TCP_NODELAY
  40. #define TCP_NODELAY 1
  41. #endif
  42. #ifndef TCP_CORK
  43. #define TCP_CORK 3
  44. #endif
  45. /* 96 bytes is the minimal size of buffer to store a IPv4/IPv6
  46. address */
  47. #define PAL_SOCKADDR_SIZE 96
  48. static size_t addr_size(const struct sockaddr* addr) {
  49. switch (addr->sa_family) {
  50. case AF_INET:
  51. return sizeof(struct sockaddr_in);
  52. case AF_INET6:
  53. return sizeof(struct sockaddr_in6);
  54. default:
  55. return 0;
  56. }
  57. }
  58. /* parsing the string of uri, and fill in the socket address structure.
  59. the latest pointer of uri, length of socket address are returned. */
  60. static int inet_parse_uri(char** uri, struct sockaddr* addr, unsigned int* addrlen) {
  61. char* tmp = *uri;
  62. char* end;
  63. char* addr_str = NULL;
  64. char* port_str;
  65. int af;
  66. void* addr_buf;
  67. int addr_len;
  68. __be16* port_buf;
  69. int slen;
  70. if (tmp[0] == '[') {
  71. /* for IPv6, the address will be in the form of
  72. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  73. struct sockaddr_in6* addr_in6 = (struct sockaddr_in6*)addr;
  74. slen = sizeof(struct sockaddr_in6);
  75. memset(addr, 0, slen);
  76. end = strchr(tmp + 1, ']');
  77. if (!end || *(end + 1) != ':')
  78. goto inval;
  79. addr_str = tmp + 1;
  80. addr_len = end - tmp - 1;
  81. port_str = end + 2;
  82. for (end = port_str; *end >= '0' && *end <= '9'; end++)
  83. ;
  84. addr_in6->sin6_family = af = AF_INET6;
  85. addr_buf = &addr_in6->sin6_addr.s6_addr;
  86. port_buf = &addr_in6->sin6_port;
  87. } else {
  88. /* for IP, the address will be in the form of "x.x.x.x:port". */
  89. struct sockaddr_in* addr_in = (struct sockaddr_in*)addr;
  90. slen = sizeof(struct sockaddr_in);
  91. memset(addr, 0, slen);
  92. end = strchr(tmp, ':');
  93. if (!end)
  94. goto inval;
  95. addr_str = tmp;
  96. addr_len = end - tmp;
  97. port_str = end + 1;
  98. for (end = port_str; *end >= '0' && *end <= '9'; end++)
  99. ;
  100. addr_in->sin_family = af = AF_INET;
  101. addr_buf = &addr_in->sin_addr.s_addr;
  102. port_buf = &addr_in->sin_port;
  103. }
  104. if (af == AF_INET) {
  105. if (!inet_pton4(addr_str, addr_len, addr_buf))
  106. goto inval;
  107. } else {
  108. if (!inet_pton6(addr_str, addr_len, addr_buf))
  109. goto inval;
  110. }
  111. *port_buf = __htons(atoi(port_str));
  112. *uri = *end ? end + 1 : NULL;
  113. if (addrlen)
  114. *addrlen = slen;
  115. return 0;
  116. inval:
  117. return -PAL_ERROR_INVAL;
  118. }
  119. /* create the string of uri from the given socket address */
  120. static int inet_create_uri(char* uri, int count, struct sockaddr* addr, int addrlen) {
  121. int len = 0;
  122. if (addr->sa_family == AF_INET) {
  123. if (addrlen != sizeof(struct sockaddr_in))
  124. return -PAL_ERROR_INVAL;
  125. struct sockaddr_in* addr_in = (struct sockaddr_in*)addr;
  126. char* addr = (char*)&addr_in->sin_addr.s_addr;
  127. /* for IP, the address will be in the form of "x.x.x.x:port". */
  128. len = snprintf(uri, count, "%u.%u.%u.%u:%u", (unsigned char)addr[0], (unsigned char)addr[1],
  129. (unsigned char)addr[2], (unsigned char)addr[3], __ntohs(addr_in->sin_port));
  130. } else if (addr->sa_family == AF_INET6) {
  131. if (addrlen != sizeof(struct sockaddr_in6))
  132. return -PAL_ERROR_INVAL;
  133. struct sockaddr_in6* addr_in6 = (struct sockaddr_in6*)addr;
  134. unsigned short* addr = (unsigned short*)&addr_in6->sin6_addr.s6_addr;
  135. /* for IPv6, the address will be in the form of
  136. "[xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx:xxxx]:port". */
  137. len = snprintf(uri, count, "[%04x:%04x:%04x:%04x:%04x:%04x:%04x:%04x]:%u", addr[0], addr[1],
  138. addr[2], addr[3], addr[4], addr[5], addr[6], addr[7],
  139. __ntohs(addr_in6->sin6_port));
  140. } else {
  141. return -PAL_ERROR_INVAL;
  142. }
  143. if (len >= count)
  144. return -PAL_ERROR_TOOLONG;
  145. return len;
  146. }
  147. /* parse the uri for a socket stream. The uri might have both binding
  148. address and connecting address, or connecting address only. The form
  149. of uri will be either "bind-addr:bind-port:connect-addr:connect-port"
  150. or "addr:port". */
  151. static int socket_parse_uri(char* uri, struct sockaddr** bind_addr, unsigned int* bind_addrlen,
  152. struct sockaddr** dest_addr, unsigned int* dest_addrlen) {
  153. int ret;
  154. if (!bind_addr && !dest_addr)
  155. return 0;
  156. if (!uri || !(*uri)) {
  157. if (bind_addr)
  158. *bind_addr = NULL;
  159. if (bind_addrlen)
  160. *bind_addrlen = 0;
  161. if (dest_addr)
  162. *dest_addr = NULL;
  163. if (dest_addrlen)
  164. *dest_addrlen = 0;
  165. return 0;
  166. }
  167. /* at least parse uri once */
  168. if ((ret = inet_parse_uri(&uri, bind_addr ? *bind_addr : *dest_addr,
  169. bind_addr ? bind_addrlen : dest_addrlen)) < 0)
  170. return ret;
  171. if (!(bind_addr && dest_addr))
  172. return 0;
  173. /* if you reach here, it can only be connection address */
  174. if (!uri || (ret = inet_parse_uri(&uri, *dest_addr, dest_addrlen)) < 0) {
  175. *dest_addr = *bind_addr;
  176. *dest_addrlen = *bind_addrlen;
  177. *bind_addr = NULL;
  178. *bind_addrlen = 0;
  179. }
  180. return 0;
  181. }
  182. /* fill in the PAL handle based on the file descriptors and address given. */
  183. static inline PAL_HANDLE socket_create_handle(int type, int fd, int options,
  184. struct sockaddr* bind_addr, unsigned int bind_addrlen,
  185. struct sockaddr* dest_addr, unsigned int dest_addrlen,
  186. struct sockopt* sock_options) {
  187. PAL_HANDLE hdl =
  188. malloc(HANDLE_SIZE(sock) + (bind_addr ? bind_addrlen : 0) + (dest_addr ? dest_addrlen : 0));
  189. if (!hdl)
  190. return NULL;
  191. memset(hdl, 0, sizeof(struct pal_handle));
  192. init_handle_hdr(HANDLE_HDR(hdl), type);
  193. HANDLE_HDR(hdl)->flags |= RFD(0) | (type != pal_type_tcpsrv ? WFD(0) : 0);
  194. hdl->sock.fd = fd;
  195. void* addr = (void*)hdl + HANDLE_SIZE(sock);
  196. if (bind_addr) {
  197. hdl->sock.bind = (PAL_PTR)addr;
  198. memcpy(addr, bind_addr, bind_addrlen);
  199. addr += bind_addrlen;
  200. } else {
  201. hdl->sock.bind = (PAL_PTR)NULL;
  202. }
  203. if (dest_addr) {
  204. hdl->sock.conn = (PAL_PTR)addr;
  205. memcpy(addr, dest_addr, dest_addrlen);
  206. addr += dest_addrlen;
  207. } else {
  208. hdl->sock.conn = (PAL_PTR)NULL;
  209. }
  210. hdl->sock.nonblocking = (options & PAL_OPTION_NONBLOCK) ? PAL_TRUE : PAL_FALSE;
  211. hdl->sock.linger = sock_options->linger;
  212. hdl->sock.receivebuf = sock_options->receivebuf;
  213. hdl->sock.sendbuf = sock_options->sendbuf;
  214. hdl->sock.receivetimeout = sock_options->receivetimeout;
  215. hdl->sock.sendtimeout = sock_options->sendtimeout;
  216. hdl->sock.tcp_cork = sock_options->tcp_cork;
  217. hdl->sock.tcp_keepalive = sock_options->tcp_keepalive;
  218. hdl->sock.tcp_nodelay = sock_options->tcp_nodelay;
  219. return hdl;
  220. }
  221. #if ALLOW_BIND_ANY == 0
  222. static bool check_zero(void* mem, size_t size) {
  223. void* p = mem;
  224. void* q = mem + size;
  225. while (p < q) {
  226. if (p <= q - sizeof(long)) {
  227. if (*(long*)p)
  228. return false;
  229. p += sizeof(long);
  230. } else if (p <= q - sizeof(int)) {
  231. if (*(int*)p)
  232. return false;
  233. p += sizeof(int);
  234. } else if (p <= q - sizeof(short)) {
  235. if (*(short*)p)
  236. return false;
  237. p += sizeof(short);
  238. } else {
  239. if (*(char*)p)
  240. return false;
  241. p++;
  242. }
  243. }
  244. return true;
  245. }
  246. /* check if an address is "Any" */
  247. static bool check_any_addr(struct sockaddr* addr) {
  248. if (addr->sa_family == AF_INET) {
  249. struct sockaddr_in* addr_in = (struct sockaddr_in*)addr;
  250. return addr_in->sin_port == 0 && check_zero(&addr_in->sin_addr, sizeof(addr_in->sin_addr));
  251. } else if (addr->sa_family == AF_INET6) {
  252. struct sockaddr_in6* addr_in6 = (struct sockaddr_in6*)addr;
  253. return addr_in6->sin6_port == 0 &&
  254. check_zero(&addr_in6->sin6_addr, sizeof(addr_in6->sin6_addr));
  255. }
  256. return false;
  257. }
  258. #endif
  259. static inline int sock_type(int type, int options) {
  260. if (options & PAL_OPTION_NONBLOCK)
  261. type |= SOCK_NONBLOCK;
  262. return type;
  263. }
  264. /* listen on a tcp socket */
  265. static int tcp_listen(PAL_HANDLE* handle, char* uri, int create, int options) {
  266. struct sockaddr buffer;
  267. struct sockaddr* bind_addr = &buffer;
  268. unsigned int bind_addrlen;
  269. int ret;
  270. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen, NULL, NULL)) < 0)
  271. return ret;
  272. #if ALLOW_BIND_ANY == 0
  273. /* the socket need to have a binding address, a null address or an
  274. any address is not allowed */
  275. if (check_any_addr(bind_addr))
  276. return -PAL_ERROR_INVAL;
  277. #endif
  278. struct sockopt sock_options;
  279. memset(&sock_options, 0, sizeof(sock_options));
  280. sock_options.reuseaddr = 1; /* sockets are always set as reusable in Graphene */
  281. int ipv6_v6only = create & PAL_CREATE_DUALSTACK ? 0 : 1;
  282. ret = ocall_listen(bind_addr->sa_family, sock_type(SOCK_STREAM, options), 0, ipv6_v6only,
  283. bind_addr, &bind_addrlen, &sock_options);
  284. if (IS_ERR(ret))
  285. return unix_to_pal_error(ERRNO(ret));
  286. *handle = socket_create_handle(pal_type_tcpsrv, ret, options, bind_addr, bind_addrlen, NULL, 0,
  287. &sock_options);
  288. if (!(*handle)) {
  289. ocall_close(ret);
  290. return -PAL_ERROR_NOMEM;
  291. }
  292. return 0;
  293. }
  294. /* accept a tcp connection */
  295. static int tcp_accept(PAL_HANDLE handle, PAL_HANDLE* client) {
  296. if (!IS_HANDLE_TYPE(handle, tcpsrv) || !handle->sock.bind || handle->sock.conn)
  297. return -PAL_ERROR_NOTSERVER;
  298. if (handle->sock.fd == PAL_IDX_POISON)
  299. return -PAL_ERROR_BADHANDLE;
  300. struct sockaddr* bind_addr = (struct sockaddr*)handle->sock.bind;
  301. unsigned int bind_addrlen = addr_size(bind_addr);
  302. struct sockaddr dest_addr;
  303. unsigned int dest_addrlen = sizeof(struct sockaddr);
  304. int ret = 0;
  305. struct sockopt sock_options;
  306. memset(&sock_options, 0, sizeof(sock_options));
  307. sock_options.reuseaddr = 1; /* sockets are always set as reusable in Graphene */
  308. ret = ocall_accept(handle->sock.fd, &dest_addr, &dest_addrlen, &sock_options);
  309. if (IS_ERR(ret))
  310. return unix_to_pal_error(ERRNO(ret));
  311. *client = socket_create_handle(pal_type_tcp, ret, 0, bind_addr, bind_addrlen, &dest_addr,
  312. dest_addrlen, &sock_options);
  313. if (!(*client)) {
  314. ocall_close(ret);
  315. return -PAL_ERROR_NOMEM;
  316. }
  317. return 0;
  318. }
  319. /* connect on a tcp socket */
  320. static int tcp_connect(PAL_HANDLE* handle, char* uri, int options) {
  321. struct sockaddr buffer[2];
  322. struct sockaddr* bind_addr = buffer;
  323. struct sockaddr* dest_addr = buffer + 1;
  324. unsigned int bind_addrlen, dest_addrlen;
  325. int ret;
  326. /* accepting two kind of different uri:
  327. dest-ip:dest-port or bind-ip:bind-port:dest-ip:dest-port */
  328. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen, &dest_addr, &dest_addrlen)) < 0)
  329. return ret;
  330. if (!dest_addr)
  331. return -PAL_ERROR_INVAL;
  332. if (bind_addr && bind_addr->sa_family != dest_addr->sa_family)
  333. return -PAL_ERROR_INVAL;
  334. #if ALLOW_BIND_ANY == 0
  335. /* the socket need to have a binding address, a null address or an
  336. any address is not allowed */
  337. if (bind_addr && addr_check_any(bind_addr))
  338. return -PAL_ERROR_INVAL;
  339. #endif
  340. struct sockopt sock_options;
  341. memset(&sock_options, 0, sizeof(sock_options));
  342. sock_options.reuseaddr = 1; /* sockets are always set as reusable in Graphene */
  343. ret = ocall_connect(dest_addr->sa_family, sock_type(SOCK_STREAM, options), 0, /*ipv6_v6only=*/0,
  344. dest_addr, dest_addrlen, bind_addr, &bind_addrlen, &sock_options);
  345. if (IS_ERR(ret))
  346. return unix_to_pal_error(ERRNO(ret));
  347. *handle = socket_create_handle(pal_type_tcp, ret, options, bind_addr, bind_addrlen, dest_addr,
  348. dest_addrlen, &sock_options);
  349. if (!(*handle)) {
  350. ocall_close(ret);
  351. return -PAL_ERROR_NOMEM;
  352. }
  353. return 0;
  354. }
  355. /* 'open' operation of tcp stream */
  356. static int tcp_open(PAL_HANDLE* handle, const char* type, const char* uri, int access, int share,
  357. int create, int options) {
  358. if (!WITHIN_MASK(access, PAL_ACCESS_MASK) || !WITHIN_MASK(share, PAL_SHARE_MASK) ||
  359. !WITHIN_MASK(create, PAL_CREATE_MASK) || !WITHIN_MASK(options, PAL_OPTION_MASK))
  360. return -PAL_ERROR_INVAL;
  361. int uri_len = strlen(uri) + 1;
  362. if (uri_len > PAL_SOCKADDR_SIZE)
  363. return -PAL_ERROR_TOOLONG;
  364. char uri_buf[PAL_SOCKADDR_SIZE];
  365. memcpy(uri_buf, uri, uri_len);
  366. if (!strcmp_static(type, URI_TYPE_TCP_SRV))
  367. return tcp_listen(handle, uri_buf, create, options);
  368. if (!strcmp_static(type, URI_TYPE_TCP))
  369. return tcp_connect(handle, uri_buf, options);
  370. return -PAL_ERROR_NOTSUPPORT;
  371. }
  372. /* 'read' operation of tcp stream */
  373. static int64_t tcp_read(PAL_HANDLE handle, uint64_t offset, uint64_t len, void* buf) {
  374. if (offset)
  375. return -PAL_ERROR_INVAL;
  376. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  377. return -PAL_ERROR_NOTCONNECTION;
  378. if (handle->sock.fd == PAL_IDX_POISON)
  379. return -PAL_ERROR_ENDOFSTREAM;
  380. if (len != (uint32_t)len)
  381. return -PAL_ERROR_INVAL;
  382. ssize_t bytes = ocall_recv(handle->sock.fd, buf, len, NULL, NULL, NULL, NULL);
  383. if (IS_ERR(bytes))
  384. return unix_to_pal_error(ERRNO(bytes));
  385. if (!bytes)
  386. return -PAL_ERROR_ENDOFSTREAM;
  387. return bytes;
  388. }
  389. /* write' operation of tcp stream */
  390. static int64_t tcp_write(PAL_HANDLE handle, uint64_t offset, uint64_t len, const void* buf) {
  391. if (offset)
  392. return -PAL_ERROR_INVAL;
  393. if (!IS_HANDLE_TYPE(handle, tcp) || !handle->sock.conn)
  394. return -PAL_ERROR_NOTCONNECTION;
  395. if (handle->sock.fd == PAL_IDX_POISON)
  396. return -PAL_ERROR_CONNFAILED;
  397. if (len != (uint32_t)len)
  398. return -PAL_ERROR_INVAL;
  399. ssize_t bytes = ocall_send(handle->sock.fd, buf, len, NULL, 0, NULL, 0);
  400. if (IS_ERR(bytes))
  401. return unix_to_pal_error(ERRNO(bytes));
  402. return bytes;
  403. }
  404. /* used by 'open' operation of tcp stream for bound socket */
  405. static int udp_bind(PAL_HANDLE* handle, char* uri, int create, int options) {
  406. struct sockaddr buffer;
  407. struct sockaddr* bind_addr = &buffer;
  408. unsigned int bind_addrlen;
  409. int ret = 0;
  410. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen, NULL, NULL)) < 0)
  411. return ret;
  412. assert(bind_addr);
  413. assert(bind_addrlen == addr_size(bind_addr));
  414. #if ALLOW_BIND_ANY == 0
  415. /* the socket need to have a binding address, a null address or an
  416. any address is not allowed */
  417. if (addr_check_any(bind_addr))
  418. return -PAL_ERROR_INVAL;
  419. #endif
  420. struct sockopt sock_options;
  421. memset(&sock_options, 0, sizeof(sock_options));
  422. sock_options.reuseaddr = 1; /* sockets are always set as reusable in Graphene */
  423. int ipv6_v6only = create & PAL_CREATE_DUALSTACK ? 0 : 1;
  424. ret = ocall_listen(bind_addr->sa_family, sock_type(SOCK_DGRAM, options), 0, ipv6_v6only,
  425. bind_addr, &bind_addrlen, &sock_options);
  426. if (IS_ERR(ret))
  427. return unix_to_pal_error(ERRNO(ret));
  428. *handle = socket_create_handle(pal_type_udpsrv, ret, options, bind_addr, bind_addrlen, NULL, 0,
  429. &sock_options);
  430. if (!(*handle)) {
  431. ocall_close(ret);
  432. return -PAL_ERROR_NOMEM;
  433. }
  434. return 0;
  435. }
  436. /* used by 'open' operation of tcp stream for connected socket */
  437. static int udp_connect(PAL_HANDLE* handle, char* uri, int create, int options) {
  438. struct sockaddr buffer[2];
  439. struct sockaddr* bind_addr = buffer;
  440. struct sockaddr* dest_addr = buffer + 1;
  441. unsigned int bind_addrlen, dest_addrlen;
  442. int ret;
  443. if ((ret = socket_parse_uri(uri, &bind_addr, &bind_addrlen, &dest_addr, &dest_addrlen)) < 0)
  444. return ret;
  445. #if ALLOW_BIND_ANY == 0
  446. /* the socket need to have a binding address, a null address or an
  447. any address is not allowed */
  448. if (bind_addr && addr_check_any(bind_addr))
  449. return -PAL_ERROR_INVAL;
  450. #endif
  451. struct sockopt sock_options;
  452. memset(&sock_options, 0, sizeof(sock_options));
  453. sock_options.reuseaddr = 1; /* sockets are always set as reusable in Graphene */
  454. int ipv6_v6only = create & PAL_CREATE_DUALSTACK ? 0 : 1;
  455. ret = ocall_connect(dest_addr ? dest_addr->sa_family : AF_INET, sock_type(SOCK_DGRAM, options),
  456. 0, ipv6_v6only, dest_addr, dest_addrlen, bind_addr, &bind_addrlen,
  457. &sock_options);
  458. if (IS_ERR(ret))
  459. return unix_to_pal_error(ERRNO(ret));
  460. *handle = socket_create_handle(dest_addr ? pal_type_udp : pal_type_udpsrv, ret, options,
  461. bind_addr, bind_addrlen, dest_addr, dest_addrlen, &sock_options);
  462. if (!(*handle)) {
  463. ocall_close(ret);
  464. return -PAL_ERROR_NOMEM;
  465. }
  466. return 0;
  467. }
  468. static int udp_open(PAL_HANDLE* hdl, const char* type, const char* uri, int access, int share,
  469. int create, int options) {
  470. if (!WITHIN_MASK(access, PAL_ACCESS_MASK) || !WITHIN_MASK(share, PAL_SHARE_MASK) ||
  471. !WITHIN_MASK(create, PAL_CREATE_MASK) || !WITHIN_MASK(options, PAL_OPTION_MASK))
  472. return -PAL_ERROR_INVAL;
  473. char buf[PAL_SOCKADDR_SIZE];
  474. int len = strlen(uri);
  475. if (len >= PAL_SOCKADDR_SIZE)
  476. return -PAL_ERROR_TOOLONG;
  477. memcpy(buf, uri, len + 1);
  478. if (!strcmp_static(type, URI_TYPE_UDP_SRV))
  479. return udp_bind(hdl, buf, create, options);
  480. if (!strcmp_static(type, URI_TYPE_UDP))
  481. return udp_connect(hdl, buf, create, options);
  482. return -PAL_ERROR_NOTSUPPORT;
  483. }
  484. static int64_t udp_receive(PAL_HANDLE handle, uint64_t offset, uint64_t len, void* buf) {
  485. if (offset)
  486. return -PAL_ERROR_INVAL;
  487. if (!IS_HANDLE_TYPE(handle, udp))
  488. return -PAL_ERROR_NOTCONNECTION;
  489. if (handle->sock.fd == PAL_IDX_POISON)
  490. return -PAL_ERROR_BADHANDLE;
  491. if (len != (uint32_t)len)
  492. return -PAL_ERROR_INVAL;
  493. ssize_t ret = ocall_recv(handle->sock.fd, buf, len, NULL, NULL, NULL, NULL);
  494. return IS_ERR(ret) ? unix_to_pal_error(ERRNO(ret)) : ret;
  495. }
  496. static int64_t udp_receivebyaddr(PAL_HANDLE handle, uint64_t offset, uint64_t len, void* buf,
  497. char* addr, size_t addrlen) {
  498. if (offset)
  499. return -PAL_ERROR_INVAL;
  500. if (!IS_HANDLE_TYPE(handle, udpsrv))
  501. return -PAL_ERROR_NOTCONNECTION;
  502. if (handle->sock.fd == PAL_IDX_POISON)
  503. return -PAL_ERROR_BADHANDLE;
  504. if (len != (uint32_t)len)
  505. return -PAL_ERROR_INVAL;
  506. struct sockaddr conn_addr;
  507. socklen_t conn_addrlen = sizeof(struct sockaddr);
  508. ssize_t bytes = ocall_recv(handle->sock.fd, buf, len, &conn_addr, &conn_addrlen, NULL, NULL);
  509. if (IS_ERR(bytes))
  510. return unix_to_pal_error(ERRNO(bytes));
  511. char* addr_uri = strcpy_static(addr, URI_PREFIX_UDP, addrlen);
  512. if (!addr_uri)
  513. return -PAL_ERROR_OVERFLOW;
  514. int ret = inet_create_uri(addr_uri, addr + addrlen - addr_uri, &conn_addr, conn_addrlen);
  515. if (ret < 0)
  516. return ret;
  517. return bytes;
  518. }
  519. static int64_t udp_send(PAL_HANDLE handle, uint64_t offset, uint64_t len, const void* buf) {
  520. if (offset)
  521. return -PAL_ERROR_INVAL;
  522. if (!IS_HANDLE_TYPE(handle, udp))
  523. return -PAL_ERROR_NOTCONNECTION;
  524. if (handle->sock.fd == PAL_IDX_POISON)
  525. return -PAL_ERROR_BADHANDLE;
  526. if (len != (uint32_t)len)
  527. return -PAL_ERROR_INVAL;
  528. ssize_t bytes = ocall_send(handle->sock.fd, buf, len, NULL, 0, NULL, 0);
  529. if (IS_ERR(bytes))
  530. return unix_to_pal_error(ERRNO(bytes));
  531. return bytes;
  532. }
  533. static int64_t udp_sendbyaddr(PAL_HANDLE handle, uint64_t offset, uint64_t len, const void* buf,
  534. const char* addr, size_t addrlen) {
  535. if (offset)
  536. return -PAL_ERROR_INVAL;
  537. if (!IS_HANDLE_TYPE(handle, udpsrv))
  538. return -PAL_ERROR_NOTCONNECTION;
  539. if (handle->sock.fd == PAL_IDX_POISON)
  540. return -PAL_ERROR_BADHANDLE;
  541. if (!strstartswith_static(addr, URI_PREFIX_UDP))
  542. return -PAL_ERROR_INVAL;
  543. if (len != (uint32_t)len)
  544. return -PAL_ERROR_INVAL;
  545. addr += static_strlen(URI_PREFIX_UDP);
  546. addrlen -= static_strlen(URI_PREFIX_UDP);
  547. char* addrbuf = __alloca(addrlen);
  548. memcpy(addrbuf, addr, addrlen);
  549. struct sockaddr conn_addr;
  550. unsigned int conn_addrlen = sizeof(struct sockaddr);
  551. int ret = inet_parse_uri(&addrbuf, &conn_addr, &conn_addrlen);
  552. if (ret < 0)
  553. return ret;
  554. ssize_t bytes = ocall_send(handle->sock.fd, buf, len, &conn_addr, conn_addrlen, NULL, 0);
  555. if (IS_ERR(bytes))
  556. return unix_to_pal_error(ERRNO(bytes));
  557. return bytes;
  558. }
  559. static int socket_delete(PAL_HANDLE handle, int access) {
  560. if (handle->sock.fd == PAL_IDX_POISON)
  561. return 0;
  562. if (!IS_HANDLE_TYPE(handle, tcp) && access)
  563. return -PAL_ERROR_INVAL;
  564. if (IS_HANDLE_TYPE(handle, tcp) || IS_HANDLE_TYPE(handle, tcpsrv)) {
  565. int shutdown;
  566. switch (access) {
  567. case 0:
  568. shutdown = SHUT_RDWR;
  569. break;
  570. case PAL_DELETE_RD:
  571. shutdown = SHUT_RD;
  572. break;
  573. case PAL_DELETE_WR:
  574. shutdown = SHUT_WR;
  575. break;
  576. default:
  577. return -PAL_ERROR_INVAL;
  578. }
  579. ocall_shutdown(handle->sock.fd, shutdown);
  580. }
  581. return 0;
  582. }
  583. static int socket_close(PAL_HANDLE handle) {
  584. if (handle->sock.fd != PAL_IDX_POISON) {
  585. ocall_close(handle->sock.fd);
  586. handle->sock.fd = PAL_IDX_POISON;
  587. }
  588. if (handle->sock.bind)
  589. handle->sock.bind = (PAL_PTR)NULL;
  590. if (handle->sock.conn)
  591. handle->sock.conn = (PAL_PTR)NULL;
  592. return 0;
  593. }
  594. static int socket_attrquerybyhdl(PAL_HANDLE handle, PAL_STREAM_ATTR* attr) {
  595. int ret;
  596. if (handle->sock.fd == PAL_IDX_POISON)
  597. return -PAL_ERROR_BADHANDLE;
  598. attr->handle_type = HANDLE_HDR(handle)->type;
  599. attr->nonblocking = handle->sock.nonblocking;
  600. attr->disconnected = HANDLE_HDR(handle)->flags & ERROR(0);
  601. attr->socket.linger = handle->sock.linger;
  602. attr->socket.receivebuf = handle->sock.receivebuf;
  603. attr->socket.sendbuf = handle->sock.sendbuf;
  604. attr->socket.receivetimeout = handle->sock.receivetimeout;
  605. attr->socket.sendtimeout = handle->sock.sendtimeout;
  606. attr->socket.tcp_cork = handle->sock.tcp_cork;
  607. attr->socket.tcp_keepalive = handle->sock.tcp_keepalive;
  608. attr->socket.tcp_nodelay = handle->sock.tcp_nodelay;
  609. /* get number of bytes available for reading (doesn't make sense for listening sockets) */
  610. attr->pending_size = 0;
  611. if (!IS_HANDLE_TYPE(handle, tcpsrv)) {
  612. ret = ocall_fionread(handle->sock.fd);
  613. if (IS_ERR(ret))
  614. return unix_to_pal_error(ERRNO(ret));
  615. attr->pending_size = ret;
  616. }
  617. /* query if there is data available for reading */
  618. struct pollfd pfd = {.fd = handle->sock.fd, .events = POLLIN | POLLOUT, .revents = 0};
  619. ret = ocall_poll(&pfd, 1, 0);
  620. if (IS_ERR(ret))
  621. return unix_to_pal_error(ERRNO(ret));
  622. attr->readable = ret == 1 && (pfd.revents & (POLLIN | POLLERR | POLLHUP)) == POLLIN;
  623. attr->writable = ret == 1 && (pfd.revents & (POLLOUT | POLLERR | POLLHUP)) == POLLOUT;
  624. return 0;
  625. }
  626. static int socket_attrsetbyhdl(PAL_HANDLE handle, PAL_STREAM_ATTR* attr) {
  627. if (handle->sock.fd == PAL_IDX_POISON)
  628. return -PAL_ERROR_BADHANDLE;
  629. int fd = handle->sock.fd, ret, val;
  630. if (attr->nonblocking != handle->sock.nonblocking) {
  631. ret = ocall_fsetnonblock(fd, attr->nonblocking);
  632. if (IS_ERR(ret))
  633. return unix_to_pal_error(ERRNO(ret));
  634. handle->sock.nonblocking = attr->nonblocking;
  635. }
  636. if (HANDLE_TYPE(handle) != pal_type_tcpsrv) {
  637. struct __kernel_linger {
  638. int l_onoff;
  639. int l_linger;
  640. };
  641. if (attr->socket.linger != handle->sock.linger) {
  642. struct __kernel_linger l;
  643. l.l_onoff = attr->socket.linger ? 1 : 0;
  644. l.l_linger = attr->socket.linger;
  645. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_LINGER, &l, sizeof(struct __kernel_linger));
  646. if (IS_ERR(ret))
  647. return unix_to_pal_error(ERRNO(ret));
  648. handle->sock.linger = attr->socket.linger;
  649. }
  650. if (attr->socket.receivebuf != handle->sock.receivebuf) {
  651. val = attr->socket.receivebuf;
  652. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &val, sizeof(int));
  653. if (IS_ERR(ret))
  654. return unix_to_pal_error(ERRNO(ret));
  655. handle->sock.receivebuf = attr->socket.receivebuf;
  656. }
  657. if (attr->socket.sendbuf != handle->sock.sendbuf) {
  658. val = attr->socket.sendbuf;
  659. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &val, sizeof(int));
  660. if (IS_ERR(ret))
  661. return unix_to_pal_error(ERRNO(ret));
  662. handle->sock.sendbuf = attr->socket.sendbuf;
  663. }
  664. if (attr->socket.receivetimeout != handle->sock.receivetimeout) {
  665. val = attr->socket.receivetimeout;
  666. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_RCVTIMEO, &val, sizeof(int));
  667. if (IS_ERR(ret))
  668. return unix_to_pal_error(ERRNO(ret));
  669. handle->sock.receivetimeout = attr->socket.receivetimeout;
  670. }
  671. if (attr->socket.sendtimeout != handle->sock.sendtimeout) {
  672. val = attr->socket.sendtimeout;
  673. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_SNDTIMEO, &val, sizeof(int));
  674. if (IS_ERR(ret))
  675. return unix_to_pal_error(ERRNO(ret));
  676. handle->sock.sendtimeout = attr->socket.sendtimeout;
  677. }
  678. }
  679. if (HANDLE_TYPE(handle) == pal_type_tcp || HANDLE_TYPE(handle) == pal_type_tcpsrv) {
  680. if (attr->socket.tcp_cork != handle->sock.tcp_cork) {
  681. val = attr->socket.tcp_cork ? 1 : 0;
  682. ret = ocall_setsockopt(fd, SOL_TCP, TCP_CORK, &val, sizeof(int));
  683. if (IS_ERR(ret))
  684. return unix_to_pal_error(ERRNO(ret));
  685. handle->sock.tcp_cork = attr->socket.tcp_cork;
  686. }
  687. if (attr->socket.tcp_keepalive != handle->sock.tcp_keepalive) {
  688. val = attr->socket.tcp_keepalive ? 1 : 0;
  689. ret = ocall_setsockopt(fd, SOL_SOCKET, SO_KEEPALIVE, &val, sizeof(int));
  690. if (IS_ERR(ret))
  691. return unix_to_pal_error(ERRNO(ret));
  692. handle->sock.tcp_keepalive = attr->socket.tcp_keepalive;
  693. }
  694. if (attr->socket.tcp_nodelay != handle->sock.tcp_nodelay) {
  695. val = attr->socket.tcp_nodelay ? 1 : 0;
  696. ret = ocall_setsockopt(fd, SOL_TCP, TCP_NODELAY, &val, sizeof(int));
  697. if (IS_ERR(ret))
  698. return unix_to_pal_error(ERRNO(ret));
  699. handle->sock.tcp_nodelay = attr->socket.tcp_nodelay;
  700. }
  701. }
  702. return 0;
  703. }
  704. static int socket_getname(PAL_HANDLE handle, char* buffer, size_t count) {
  705. size_t orig_count = count;
  706. int ret;
  707. const char* prefix = NULL;
  708. size_t prefix_len = 0;
  709. struct sockaddr* bind_addr = NULL;
  710. struct sockaddr* dest_addr = NULL;
  711. switch (PAL_GET_TYPE(handle)) {
  712. case pal_type_tcpsrv:
  713. prefix_len = static_strlen(URI_PREFIX_TCP_SRV);
  714. prefix = URI_PREFIX_TCP_SRV;
  715. bind_addr = (struct sockaddr*)handle->sock.bind;
  716. break;
  717. case pal_type_tcp:
  718. prefix_len = static_strlen(URI_PREFIX_TCP);
  719. prefix = URI_PREFIX_TCP;
  720. bind_addr = (struct sockaddr*)handle->sock.bind;
  721. dest_addr = (struct sockaddr*)handle->sock.conn;
  722. break;
  723. case pal_type_udpsrv:
  724. prefix_len = static_strlen(URI_PREFIX_UDP_SRV);
  725. prefix = URI_PREFIX_UDP_SRV;
  726. bind_addr = (struct sockaddr*)handle->sock.bind;
  727. break;
  728. case pal_type_udp:
  729. prefix_len = static_strlen(URI_PREFIX_UDP);
  730. prefix = URI_PREFIX_UDP;
  731. bind_addr = (struct sockaddr*)handle->sock.bind;
  732. dest_addr = (struct sockaddr*)handle->sock.conn;
  733. break;
  734. default:
  735. return -PAL_ERROR_INVAL;
  736. }
  737. if (count < prefix_len + 1) {
  738. return -PAL_ERROR_OVERFLOW;
  739. }
  740. memcpy(buffer, prefix, prefix_len + 1);
  741. buffer += prefix_len;
  742. count -= prefix_len;
  743. if (bind_addr) {
  744. if ((ret = inet_create_uri(buffer, count, bind_addr, addr_size(bind_addr))) < 0) {
  745. return ret;
  746. }
  747. buffer += ret;
  748. count -= ret;
  749. }
  750. if (dest_addr) {
  751. if (bind_addr) {
  752. if (count < 2) {
  753. return -PAL_ERROR_OVERFLOW;
  754. }
  755. *buffer++ = ':';
  756. *buffer = '\0';
  757. count--;
  758. }
  759. if ((ret = inet_create_uri(buffer, count, dest_addr, addr_size(dest_addr))) < 0) {
  760. return ret;
  761. }
  762. buffer += ret;
  763. count -= ret;
  764. }
  765. return orig_count - count;
  766. }
  767. struct handle_ops tcp_ops = {
  768. .getname = &socket_getname,
  769. .open = &tcp_open,
  770. .waitforclient = &tcp_accept,
  771. .read = &tcp_read,
  772. .write = &tcp_write,
  773. .delete = &socket_delete,
  774. .close = &socket_close,
  775. .attrquerybyhdl = &socket_attrquerybyhdl,
  776. .attrsetbyhdl = &socket_attrsetbyhdl,
  777. };
  778. struct handle_ops udp_ops = {
  779. .getname = &socket_getname,
  780. .open = &udp_open,
  781. .read = &udp_receive,
  782. .write = &udp_send,
  783. .delete = &socket_delete,
  784. .close = &socket_close,
  785. .attrquerybyhdl = &socket_attrquerybyhdl,
  786. .attrsetbyhdl = &socket_attrsetbyhdl,
  787. };
  788. struct handle_ops udpsrv_ops = {
  789. .getname = &socket_getname,
  790. .open = &udp_open,
  791. .readbyaddr = &udp_receivebyaddr,
  792. .writebyaddr = &udp_sendbyaddr,
  793. .delete = &socket_delete,
  794. .close = &socket_close,
  795. .attrquerybyhdl = &socket_attrquerybyhdl,
  796. .attrsetbyhdl = &socket_attrsetbyhdl,
  797. };