shim_socket.c 51 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778
  1. /* Copyright (C) 2014 Stony Brook University
  2. This file is part of Graphene Library OS.
  3. Graphene Library OS is free software: you can redistribute it and/or
  4. modify it under the terms of the GNU Lesser General Public License
  5. as published by the Free Software Foundation, either version 3 of the
  6. License, or (at your option) any later version.
  7. Graphene Library OS is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU Lesser General Public License for more details.
  11. You should have received a copy of the GNU Lesser General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>. */
  13. /*
  14. * shim_socket.c
  15. *
  16. * Implementation of system call "socket", "bind", "accept4", "listen",
  17. * "connect", "sendto", "recvfrom", "sendmsg", "recvmsg" and "shutdown" and
  18. * "getsockname", "getpeername".
  19. */
  20. #include <asm/socket.h>
  21. #include <errno.h>
  22. #include <linux/fcntl.h>
  23. #include <linux/in.h>
  24. #include <linux/in6.h>
  25. #include <pal.h>
  26. #include <pal_error.h>
  27. #include <shim_checkpoint.h>
  28. #include <shim_fs.h>
  29. #include <shim_handle.h>
  30. #include <shim_internal.h>
  31. #include <shim_table.h>
  32. #include <shim_utils.h>
  33. /*
  34. * User-settable options (used with setsockopt).
  35. */
  36. #define TCP_NODELAY 1 /* Don't delay send to coalesce packets */
  37. #define TCP_MAXSEG 2 /* Set maximum segment size */
  38. #define TCP_CORK 3 /* Control sending of partial frames */
  39. #define TCP_KEEPIDLE 4 /* Start keepalives after this period */
  40. #define TCP_KEEPINTVL 5 /* Interval between keepalives */
  41. #define TCP_KEEPCNT 6 /* Number of keepalives before death */
  42. #define TCP_SYNCNT 7 /* Number of SYN retransmits */
  43. #define TCP_LINGER2 8 /* Life time of orphaned FIN-WAIT-2 state */
  44. #define TCP_DEFER_ACCEPT 9 /* Wake up listener only when data arrive */
  45. #define TCP_WINDOW_CLAMP 10 /* Bound advertised window */
  46. #define TCP_INFO 11 /* Information about this connection. */
  47. #define TCP_QUICKACK 12 /* Block/reenable quick ACKs. */
  48. #define TCP_CONGESTION 13 /* Congestion control algorithm. */
  49. #define TCP_MD5SIG 14 /* TCP MD5 Signature (RFC2385) */
  50. #define AF_UNSPEC 0
  51. #define SOCK_URI_SIZE 108
  52. static int rebase_on_lo __attribute_migratable = -1;
  53. static size_t minimal_addrlen(int domain) {
  54. switch (domain) {
  55. case AF_INET:
  56. return sizeof(struct sockaddr_in);
  57. case AF_INET6:
  58. return sizeof(struct sockaddr_in6);
  59. default:
  60. return sizeof(struct sockaddr);
  61. }
  62. }
  63. static int init_port_rebase(void) {
  64. if (rebase_on_lo != -1)
  65. return 0;
  66. char cfg[CONFIG_MAX];
  67. int rebase = 0;
  68. if (!root_config || get_config(root_config, "net.port.rebase_on_lo", cfg, sizeof(cfg)) <= 0) {
  69. rebase_on_lo = 0;
  70. return 0;
  71. }
  72. for (const char* p = cfg; *p; p++) {
  73. if (*p < '0' || *p > '9' || rebase > 32767) {
  74. rebase_on_lo = 0;
  75. return 0;
  76. }
  77. rebase = rebase * 10 + (*p - '0');
  78. }
  79. rebase_on_lo = rebase;
  80. return 0;
  81. }
  82. static int inet_parse_addr(int domain, int type, const char* uri, struct addr_inet* bind,
  83. struct addr_inet* conn);
  84. static int __process_pending_options(struct shim_handle* hdl);
  85. int shim_do_socket(int family, int type, int protocol) {
  86. struct shim_handle* hdl = get_new_handle();
  87. if (!hdl)
  88. return -ENOMEM;
  89. struct shim_sock_handle* sock = &hdl->info.sock;
  90. hdl->type = TYPE_SOCK;
  91. set_handle_fs(hdl, &socket_builtin_fs);
  92. hdl->flags = type & SOCK_NONBLOCK ? O_NONBLOCK : 0;
  93. hdl->acc_mode = 0;
  94. sock->domain = family;
  95. sock->sock_type = type & ~(SOCK_NONBLOCK | SOCK_CLOEXEC);
  96. sock->protocol = protocol;
  97. int ret = -ENOSYS;
  98. switch (sock->domain) {
  99. case AF_UNIX: // Local communication
  100. case AF_INET: // IPv4 Internet protocols ip(7)
  101. case AF_INET6: // IPv6 Internet protocols
  102. break;
  103. default:
  104. debug("shim_socket: unknown socket domain %d\n", sock->domain);
  105. goto err;
  106. }
  107. switch (sock->sock_type) {
  108. case SOCK_STREAM: // TCP
  109. break;
  110. case SOCK_DGRAM: // UDP
  111. hdl->acc_mode = MAY_READ | MAY_WRITE;
  112. break;
  113. default:
  114. debug("shim_socket: unknown socket type %d\n", sock->sock_type);
  115. goto err;
  116. }
  117. sock->sock_state = SOCK_CREATED;
  118. ret = set_new_fd_handle(hdl, type & SOCK_CLOEXEC ? FD_CLOEXEC : 0, NULL);
  119. err:
  120. put_handle(hdl);
  121. return ret;
  122. }
  123. static int unix_create_uri(char* uri, int count, enum shim_sock_state state, unsigned int pipeid) {
  124. int bytes = 0;
  125. switch (state) {
  126. case SOCK_CREATED:
  127. case SOCK_BOUNDCONNECTED:
  128. case SOCK_SHUTDOWN:
  129. return -ENOTCONN;
  130. case SOCK_BOUND:
  131. case SOCK_LISTENED:
  132. case SOCK_ACCEPTED:
  133. bytes = snprintf(uri, count, URI_PREFIX_PIPE_SRV "%u", pipeid);
  134. break;
  135. case SOCK_CONNECTED:
  136. bytes = snprintf(uri, count, URI_PREFIX_PIPE "%u", pipeid);
  137. break;
  138. default:
  139. return -ENOTCONN;
  140. }
  141. return bytes == count ? -ENAMETOOLONG : bytes;
  142. }
  143. static void inet_rebase_port(bool reverse, int domain, struct addr_inet* addr, bool local) {
  144. init_port_rebase();
  145. if (rebase_on_lo) {
  146. if (domain == AF_INET) {
  147. unsigned char* ad = (unsigned char*)&addr->addr.v4.s_addr;
  148. if (!local && memcmp(ad, "\177\0\0\1", 4))
  149. return;
  150. }
  151. if (domain == AF_INET6) {
  152. unsigned short* ad = (void*)&addr->addr.v6.s6_addr;
  153. if (!local && memcmp(ad, "\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\1", 16))
  154. return;
  155. }
  156. }
  157. if (reverse)
  158. addr->port = addr->ext_port - rebase_on_lo;
  159. else
  160. addr->ext_port = addr->port + rebase_on_lo;
  161. }
  162. static ssize_t inet_translate_addr(int domain, char* uri, size_t count, struct addr_inet* addr) {
  163. if (domain == AF_INET) {
  164. unsigned char* ad = (unsigned char*)&addr->addr.v4.s_addr;
  165. return snprintf(uri, count, "%u.%u.%u.%u:%u", ad[0], ad[1], ad[2], ad[3], addr->ext_port);
  166. }
  167. if (domain == AF_INET6) {
  168. unsigned short* ad = (void*)&addr->addr.v6.s6_addr;
  169. return snprintf(uri, count, "[%04x:%04x:%x:%04x:%04x:%04x:%04x:%04x]:%u", __ntohs(ad[0]),
  170. __ntohs(ad[1]), __ntohs(ad[2]), __ntohs(ad[3]), __ntohs(ad[4]), __ntohs(ad[5]),
  171. __ntohs(ad[6]), __ntohs(ad[7]), addr->ext_port);
  172. }
  173. return -EPROTONOSUPPORT;
  174. }
  175. static ssize_t inet_create_uri(int domain, char* uri, size_t count, int sock_type,
  176. enum shim_sock_state state, struct addr_inet* bind,
  177. struct addr_inet* conn) {
  178. size_t bytes = 0;
  179. ssize_t ret;
  180. size_t prefix_len;
  181. if (sock_type == SOCK_STREAM) {
  182. switch (state) {
  183. case SOCK_CREATED:
  184. case SOCK_SHUTDOWN:
  185. return -ENOTCONN;
  186. case SOCK_BOUND:
  187. case SOCK_LISTENED:
  188. prefix_len = static_strlen(URI_PREFIX_TCP_SRV);
  189. if (count < prefix_len + 1)
  190. return -ENAMETOOLONG;
  191. memcpy(uri, URI_PREFIX_TCP_SRV, prefix_len + 1);
  192. ret = inet_translate_addr(domain, uri + prefix_len, count - prefix_len, bind);
  193. return ret < 0 ? ret : (ssize_t)(ret + prefix_len);
  194. case SOCK_BOUNDCONNECTED:
  195. prefix_len = static_strlen(URI_PREFIX_TCP);
  196. if (count < prefix_len + 1)
  197. return -ENAMETOOLONG;
  198. memcpy(uri, URI_PREFIX_TCP, prefix_len + 1);
  199. bytes = prefix_len;
  200. ret = inet_translate_addr(domain, uri + bytes, count - bytes, bind);
  201. if (ret < 0)
  202. return ret;
  203. uri[bytes + ret] = ':';
  204. bytes += ret + 1;
  205. ret = inet_translate_addr(domain, uri + bytes, count - bytes, conn);
  206. return ret < 0 ? ret : (ssize_t)(ret + bytes);
  207. case SOCK_CONNECTED:
  208. case SOCK_ACCEPTED:
  209. prefix_len = static_strlen(URI_PREFIX_TCP);
  210. if (count < prefix_len + 1)
  211. return -ENAMETOOLONG;
  212. memcpy(uri, URI_PREFIX_TCP, prefix_len + 1);
  213. ret = inet_translate_addr(domain, uri + prefix_len, count - prefix_len, conn);
  214. return ret < 0 ? ret : (ssize_t)(ret + prefix_len);
  215. }
  216. }
  217. if (sock_type == SOCK_DGRAM) {
  218. switch (state) {
  219. case SOCK_CREATED:
  220. case SOCK_SHUTDOWN:
  221. return -ENOTCONN;
  222. case SOCK_LISTENED:
  223. case SOCK_ACCEPTED:
  224. return -EOPNOTSUPP;
  225. case SOCK_BOUNDCONNECTED:
  226. prefix_len = static_strlen(URI_PREFIX_UDP_SRV);
  227. if (count < prefix_len + 1)
  228. return -ENAMETOOLONG;
  229. memcpy(uri, URI_PREFIX_UDP_SRV, prefix_len + 1);
  230. bytes = prefix_len;
  231. ret = inet_translate_addr(domain, uri + bytes, count - bytes, bind);
  232. if (ret < 0)
  233. return ret;
  234. uri[bytes + ret] = ':';
  235. bytes += ret + 1;
  236. ret = inet_translate_addr(domain, uri + bytes, count - bytes, conn);
  237. return ret < 0 ? ret : (ssize_t)(ret + bytes);
  238. case SOCK_BOUND:
  239. prefix_len = static_strlen(URI_PREFIX_UDP_SRV);
  240. if (count < prefix_len + 1)
  241. return -ENAMETOOLONG;
  242. memcpy(uri, URI_PREFIX_UDP_SRV, prefix_len + 1);
  243. ret = inet_translate_addr(domain, uri + prefix_len, count - prefix_len, bind);
  244. return ret < 0 ? ret : (ssize_t)(ret + prefix_len);
  245. case SOCK_CONNECTED:
  246. prefix_len = static_strlen(URI_PREFIX_UDP);
  247. if (count < prefix_len + 1)
  248. return -ENAMETOOLONG;
  249. memcpy(uri, URI_PREFIX_UDP, prefix_len + 1);
  250. ret = inet_translate_addr(domain, uri + prefix_len, count - prefix_len, conn);
  251. return ret < 0 ? ret : (ssize_t)(ret + prefix_len);
  252. }
  253. }
  254. return -EPROTONOSUPPORT;
  255. }
  256. static inline void unix_copy_addr(struct sockaddr* saddr, struct shim_dentry* dent) {
  257. struct sockaddr_un* un = (struct sockaddr_un*)saddr;
  258. un->sun_family = AF_UNIX;
  259. size_t size;
  260. const char* path = dentry_get_path(dent, true, &size);
  261. memcpy(un->sun_path, path, size + 1);
  262. }
  263. static int inet_check_addr(int domain, struct sockaddr* addr, socklen_t addrlen) {
  264. if (domain == AF_INET) {
  265. if (addr->sa_family != AF_INET)
  266. return -EAFNOSUPPORT;
  267. if (addrlen != sizeof(struct sockaddr_in))
  268. return -EINVAL;
  269. return 0;
  270. }
  271. if (domain == AF_INET6) {
  272. if (addr->sa_family != AF_INET && addr->sa_family != AF_INET6)
  273. return -EAFNOSUPPORT;
  274. if (addrlen != minimal_addrlen(addr->sa_family))
  275. return -EINVAL;
  276. return 0;
  277. }
  278. return -EINVAL;
  279. }
  280. static int inet_copy_addr(int domain, struct sockaddr* saddr, const struct addr_inet* addr) {
  281. if (domain == AF_INET) {
  282. struct sockaddr_in* in = (struct sockaddr_in*)saddr;
  283. in->sin_family = AF_INET;
  284. in->sin_port = __htons(addr->port);
  285. in->sin_addr = addr->addr.v4;
  286. return sizeof(struct sockaddr_in);
  287. }
  288. if (domain == AF_INET6) {
  289. struct sockaddr_in6* in6 = (struct sockaddr_in6*)saddr;
  290. in6->sin6_family = AF_INET6;
  291. in6->sin6_port = __htons(addr->port);
  292. in6->sin6_addr = addr->addr.v6;
  293. return sizeof(struct sockaddr_in6);
  294. }
  295. return sizeof(struct sockaddr);
  296. }
  297. static void inet_save_addr(int domain, struct addr_inet* addr, const struct sockaddr* saddr) {
  298. if (domain == AF_INET) {
  299. const struct sockaddr_in* in = (const struct sockaddr_in*)saddr;
  300. addr->port = __ntohs(in->sin_port);
  301. addr->addr.v4 = in->sin_addr;
  302. return;
  303. }
  304. if (domain == AF_INET6) {
  305. if (saddr->sa_family == AF_INET) {
  306. const struct sockaddr_in* in = (const struct sockaddr_in*)saddr;
  307. addr->port = __ntohs(in->sin_port);
  308. uint32_t s_addr[4] = {
  309. /* in->sin_addr.s_addr is already network byte order */
  310. __htonl(0), __htonl(0), __htonl(0x0000ffff), in->sin_addr.s_addr
  311. };
  312. memcpy(&addr->addr.v6.s6_addr, s_addr, sizeof(s_addr));
  313. } else {
  314. const struct sockaddr_in6* in6 = (const struct sockaddr_in6*)saddr;
  315. addr->port = __ntohs(in6->sin6_port);
  316. addr->addr.v6 = in6->sin6_addr;
  317. }
  318. return;
  319. }
  320. }
  321. static inline bool inet_comp_addr(int domain, const struct addr_inet* addr,
  322. const struct sockaddr* saddr) {
  323. if (domain == AF_INET) {
  324. const struct sockaddr_in* in = (const struct sockaddr_in*)saddr;
  325. return addr->port == __ntohs(in->sin_port) &&
  326. !memcmp(&addr->addr.v4, &in->sin_addr, sizeof(struct in_addr));
  327. }
  328. if (domain == AF_INET6) {
  329. const struct sockaddr_in6* in6 = (const struct sockaddr_in6*)saddr;
  330. return addr->port == __ntohs(in6->sin6_port) &&
  331. !memcmp(&addr->addr.v6, &in6->sin6_addr, sizeof(struct in6_addr));
  332. }
  333. return false;
  334. }
  335. static int create_socket_uri(struct shim_handle* hdl) {
  336. struct shim_sock_handle* sock = &hdl->info.sock;
  337. if (sock->domain == AF_UNIX) {
  338. char uri_buf[32];
  339. int bytes = unix_create_uri(uri_buf, 32, sock->sock_state, sock->addr.un.pipeid);
  340. if (bytes < 0)
  341. return bytes;
  342. qstrsetstr(&hdl->uri, uri_buf, bytes);
  343. return 0;
  344. }
  345. if (sock->domain == AF_INET || sock->domain == AF_INET6) {
  346. char uri_buf[SOCK_URI_SIZE];
  347. int bytes = inet_create_uri(sock->domain, uri_buf, SOCK_URI_SIZE, sock->sock_type,
  348. sock->sock_state, &sock->addr.in.bind, &sock->addr.in.conn);
  349. if (bytes < 0)
  350. return bytes;
  351. qstrsetstr(&hdl->uri, uri_buf, bytes);
  352. return 0;
  353. }
  354. return -EPROTONOSUPPORT;
  355. }
  356. int shim_do_bind(int sockfd, struct sockaddr* addr, socklen_t addrlen) {
  357. if (!addr || test_user_memory(addr, addrlen, false))
  358. return -EFAULT;
  359. struct shim_handle* hdl = get_fd_handle(sockfd, NULL, NULL);
  360. int ret = -EINVAL;
  361. if (!hdl)
  362. return -EBADF;
  363. if (hdl->type != TYPE_SOCK) {
  364. put_handle(hdl);
  365. return -ENOTSOCK;
  366. }
  367. struct shim_sock_handle* sock = &hdl->info.sock;
  368. lock(&hdl->lock);
  369. enum shim_sock_state state = sock->sock_state;
  370. if (state != SOCK_CREATED) {
  371. debug("shim_bind: bind on a bound socket\n");
  372. goto out;
  373. }
  374. if (sock->domain == AF_UNIX) {
  375. if (addrlen != sizeof(struct sockaddr_un))
  376. goto out;
  377. struct sockaddr_un* saddr = (struct sockaddr_un*)addr;
  378. char* spath = saddr->sun_path;
  379. struct shim_dentry* dent = NULL;
  380. if ((ret = path_lookupat(NULL, spath, LOOKUP_CREATE, &dent, NULL)) < 0) {
  381. // DEP 7/3/17: We actually want either 0 or -ENOENT, as the
  382. // expected case is that the name is free (and we get the dent to
  383. // populate the name)
  384. if (ret != -ENOENT || !dent)
  385. goto out;
  386. }
  387. if (dent->state & DENTRY_VALID && !(dent->state & DENTRY_NEGATIVE)) {
  388. ret = -EADDRINUSE;
  389. goto out;
  390. }
  391. struct shim_unix_data* data = malloc(sizeof(struct shim_unix_data));
  392. data->pipeid = hashtype_to_idtype(dent->rel_path.hash);
  393. sock->addr.un.pipeid = data->pipeid;
  394. sock->addr.un.data = data;
  395. sock->addr.un.dentry = dent;
  396. } else if (sock->domain == AF_INET || sock->domain == AF_INET6) {
  397. if ((ret = inet_check_addr(sock->domain, addr, addrlen)) < 0)
  398. goto out;
  399. inet_save_addr(sock->domain, &sock->addr.in.bind, addr);
  400. inet_rebase_port(false, sock->domain, &sock->addr.in.bind, true);
  401. }
  402. sock->sock_state = SOCK_BOUND;
  403. if ((ret = create_socket_uri(hdl)) < 0)
  404. goto out;
  405. PAL_HANDLE pal_hdl = DkStreamOpen(qstrgetstr(&hdl->uri), 0, 0, 0, hdl->flags & O_NONBLOCK);
  406. if (!pal_hdl) {
  407. ret = (PAL_NATIVE_ERRNO == PAL_ERROR_STREAMEXIST) ? -EADDRINUSE : -PAL_ERRNO;
  408. debug("bind: invalid handle returned\n");
  409. goto out;
  410. }
  411. if (sock->domain == AF_UNIX) {
  412. struct shim_dentry* dent = sock->addr.un.dentry;
  413. dent->state ^= DENTRY_NEGATIVE;
  414. dent->state |= DENTRY_VALID | DENTRY_RECENTLY;
  415. dent->fs = &socket_builtin_fs;
  416. dent->data = sock->addr.un.data;
  417. }
  418. if (sock->domain == AF_INET || sock->domain == AF_INET6) {
  419. char uri[SOCK_URI_SIZE];
  420. if (!DkStreamGetName(pal_hdl, uri, SOCK_URI_SIZE)) {
  421. ret = -PAL_ERRNO;
  422. goto out;
  423. }
  424. if ((ret = inet_parse_addr(sock->domain, sock->sock_type, uri, &sock->addr.in.bind, NULL)) <
  425. 0)
  426. goto out;
  427. inet_rebase_port(true, sock->domain, &sock->addr.in.bind, true);
  428. }
  429. hdl->pal_handle = pal_hdl;
  430. __process_pending_options(hdl);
  431. ret = 0;
  432. out:
  433. if (ret < 0) {
  434. sock->sock_state = state;
  435. sock->error = -ret;
  436. if (sock->domain == AF_UNIX) {
  437. if (sock->addr.un.dentry)
  438. put_dentry(sock->addr.un.dentry);
  439. if (sock->addr.un.data) {
  440. free(sock->addr.un.data);
  441. sock->addr.un.data = NULL;
  442. }
  443. }
  444. }
  445. unlock(&hdl->lock);
  446. put_handle(hdl);
  447. return ret;
  448. }
  449. static int inet_parse_addr(int domain, int type, const char* uri, struct addr_inet* bind,
  450. struct addr_inet* conn) {
  451. char* ip_str;
  452. char* port_str;
  453. char* next_str;
  454. int ip_len = 0;
  455. if (!(next_str = strchr(uri, ':')))
  456. return -EINVAL;
  457. next_str++;
  458. enum { UDP, UDPSRV, TCP, TCPSRV } prefix;
  459. if (strstartswith_static(uri, URI_PREFIX_UDP))
  460. prefix = UDP;
  461. else if (strstartswith_static(uri, URI_PREFIX_UDP_SRV))
  462. prefix = UDPSRV;
  463. else if (strstartswith_static(uri, URI_PREFIX_TCP))
  464. prefix = TCP;
  465. else if (strstartswith_static(uri, URI_PREFIX_TCP_SRV))
  466. prefix = TCPSRV;
  467. else
  468. return -EINVAL;
  469. if ((prefix == UDP || prefix == UDPSRV) && type != SOCK_DGRAM)
  470. return -EINVAL;
  471. if ((prefix == TCP || prefix == TCPSRV) && type != SOCK_STREAM)
  472. return -EINVAL;
  473. for (int round = 0; (ip_str = next_str); round++) {
  474. if (ip_str[0] == '[') {
  475. ip_str++;
  476. if (domain != AF_INET6)
  477. return -EINVAL;
  478. if (!(port_str = strchr(ip_str, ']')))
  479. return -EINVAL;
  480. ip_len = port_str - ip_str;
  481. port_str++;
  482. if (*port_str != ':')
  483. return -EINVAL;
  484. } else {
  485. if (domain != AF_INET)
  486. return -EINVAL;
  487. if (!(port_str = strchr(ip_str, ':')))
  488. return -EINVAL;
  489. ip_len = port_str - ip_str;
  490. }
  491. port_str++;
  492. next_str = strchr(port_str, ':');
  493. if (next_str)
  494. next_str++;
  495. struct addr_inet* addr = round ? conn : bind;
  496. if (domain == AF_INET) {
  497. inet_pton4(ip_str, ip_len, &addr->addr.v4);
  498. addr->ext_port = atoi(port_str);
  499. }
  500. if (domain == AF_INET6) {
  501. inet_pton6(ip_str, ip_len, &addr->addr.v6);
  502. addr->ext_port = atoi(port_str);
  503. }
  504. }
  505. return 0;
  506. }
  507. int shim_do_listen(int sockfd, int backlog) {
  508. if (backlog < 0)
  509. return -EINVAL;
  510. struct shim_handle* hdl = get_fd_handle(sockfd, NULL, NULL);
  511. if (!hdl)
  512. return -EBADF;
  513. if (hdl->type != TYPE_SOCK) {
  514. put_handle(hdl);
  515. return -ENOTSOCK;
  516. }
  517. struct shim_sock_handle* sock = &hdl->info.sock;
  518. if (sock->sock_type != SOCK_STREAM) {
  519. debug("shim_listen: not a stream socket\n");
  520. put_handle(hdl);
  521. return -EINVAL;
  522. }
  523. lock(&hdl->lock);
  524. enum shim_sock_state state = sock->sock_state;
  525. int ret = -EINVAL;
  526. if (state != SOCK_BOUND && state != SOCK_LISTENED) {
  527. debug("shim_listen: listen on unbound socket\n");
  528. goto out;
  529. }
  530. hdl->acc_mode = MAY_READ;
  531. sock->sock_state = SOCK_LISTENED;
  532. ret = 0;
  533. out:
  534. if (ret < 0)
  535. sock->sock_state = state;
  536. unlock(&hdl->lock);
  537. put_handle(hdl);
  538. return ret;
  539. }
  540. /* Connect with the TCP socket is always in the client.
  541. *
  542. * With UDP, the connection is made to the socket specific for a
  543. * destination. A process with a connected UDP socket can call
  544. * connect again for that socket for one of two reasons: 1. To
  545. * specify a new IP address and port 2. To unconnect the socket.
  546. */
  547. int shim_do_connect(int sockfd, struct sockaddr* addr, int addrlen) {
  548. if (!addr || test_user_memory(addr, addrlen, false))
  549. return -EFAULT;
  550. struct shim_handle* hdl = get_fd_handle(sockfd, NULL, NULL);
  551. if (!hdl)
  552. return -EBADF;
  553. if (hdl->type != TYPE_SOCK) {
  554. put_handle(hdl);
  555. return -ENOTSOCK;
  556. }
  557. struct shim_sock_handle* sock = &hdl->info.sock;
  558. lock(&hdl->lock);
  559. enum shim_sock_state state = sock->sock_state;
  560. int ret = -EINVAL;
  561. if (state == SOCK_CONNECTED) {
  562. if (addr->sa_family == AF_UNSPEC) {
  563. sock->sock_state = SOCK_CREATED;
  564. if (sock->sock_type == SOCK_STREAM && hdl->pal_handle) {
  565. DkStreamDelete(hdl->pal_handle, 0);
  566. DkObjectClose(hdl->pal_handle);
  567. hdl->pal_handle = NULL;
  568. }
  569. debug("shim_connect: reconnect on a stream socket\n");
  570. ret = 0;
  571. goto out;
  572. }
  573. debug("shim_connect: reconnect on a stream socket\n");
  574. ret = -EISCONN;
  575. goto out;
  576. }
  577. if (state != SOCK_BOUND && state != SOCK_CREATED) {
  578. debug("shim_connect: connect on invalid socket\n");
  579. goto out;
  580. }
  581. if (sock->domain == AF_UNIX) {
  582. if (addrlen != sizeof(struct sockaddr_un))
  583. goto out;
  584. struct sockaddr_un* saddr = (struct sockaddr_un*)addr;
  585. char* spath = saddr->sun_path;
  586. struct shim_dentry* dent;
  587. if ((ret = path_lookupat(NULL, spath, LOOKUP_CREATE, &dent, NULL)) < 0) {
  588. // DEP 7/3/17: We actually want either 0 or -ENOENT, as the
  589. // expected case is that the name is free (and we get the dent to
  590. // populate the name)
  591. if (ret != -ENOENT || !dent)
  592. goto out;
  593. }
  594. struct shim_unix_data* data = dent->data;
  595. if (!(dent->state & DENTRY_VALID) || dent->state & DENTRY_NEGATIVE) {
  596. data = malloc(sizeof(struct shim_unix_data));
  597. data->pipeid = hashtype_to_idtype(dent->rel_path.hash);
  598. } else if (dent->fs != &socket_builtin_fs) {
  599. ret = -ECONNREFUSED;
  600. goto out;
  601. }
  602. sock->addr.un.pipeid = data->pipeid;
  603. sock->addr.un.data = data;
  604. sock->addr.un.dentry = dent;
  605. get_dentry(dent);
  606. }
  607. if (state == SOCK_BOUND) {
  608. /* if the socket is bound, the stream needs to be shut and rebound. */
  609. assert(hdl->pal_handle);
  610. DkStreamDelete(hdl->pal_handle, 0);
  611. DkObjectClose(hdl->pal_handle);
  612. hdl->pal_handle = NULL;
  613. }
  614. if (sock->domain != AF_UNIX) {
  615. if ((ret = inet_check_addr(sock->domain, addr, addrlen)) < 0)
  616. goto out;
  617. inet_save_addr(sock->domain, &sock->addr.in.conn, addr);
  618. inet_rebase_port(false, sock->domain, &sock->addr.in.conn, false);
  619. }
  620. sock->sock_state = (state == SOCK_BOUND) ? SOCK_BOUNDCONNECTED : SOCK_CONNECTED;
  621. if ((ret = create_socket_uri(hdl)) < 0)
  622. goto out;
  623. PAL_HANDLE pal_hdl = DkStreamOpen(qstrgetstr(&hdl->uri), 0, 0, 0, hdl->flags & O_NONBLOCK);
  624. if (!pal_hdl) {
  625. ret = (PAL_NATIVE_ERRNO == PAL_ERROR_DENIED) ? -ECONNREFUSED : -PAL_ERRNO;
  626. goto out;
  627. }
  628. hdl->pal_handle = pal_hdl;
  629. if (sock->domain == AF_UNIX) {
  630. struct shim_dentry* dent = sock->addr.un.dentry;
  631. lock(&dent->lock);
  632. dent->state ^= DENTRY_NEGATIVE;
  633. dent->state |= DENTRY_VALID | DENTRY_RECENTLY;
  634. dent->fs = &socket_builtin_fs;
  635. dent->data = sock->addr.un.data;
  636. unlock(&dent->lock);
  637. }
  638. if (sock->domain == AF_INET || sock->domain == AF_INET6) {
  639. char uri[SOCK_URI_SIZE];
  640. if (!DkStreamGetName(pal_hdl, uri, SOCK_URI_SIZE)) {
  641. ret = -PAL_ERRNO;
  642. goto out;
  643. }
  644. if ((ret = inet_parse_addr(sock->domain, sock->sock_type, uri, &sock->addr.in.bind,
  645. &sock->addr.in.conn)) < 0)
  646. goto out;
  647. inet_rebase_port(true, sock->domain, &sock->addr.in.bind, true);
  648. inet_rebase_port(true, sock->domain, &sock->addr.in.conn, false);
  649. }
  650. hdl->acc_mode = MAY_READ | MAY_WRITE;
  651. __process_pending_options(hdl);
  652. ret = 0;
  653. out:
  654. if (ret < 0) {
  655. sock->sock_state = state;
  656. sock->error = -ret;
  657. if (sock->domain == AF_UNIX) {
  658. if (sock->addr.un.dentry)
  659. put_dentry(sock->addr.un.dentry);
  660. if (sock->addr.un.data) {
  661. free(sock->addr.un.data);
  662. sock->addr.un.data = NULL;
  663. }
  664. }
  665. }
  666. unlock(&hdl->lock);
  667. put_handle(hdl);
  668. return ret;
  669. }
  670. int __do_accept(struct shim_handle* hdl, int flags, struct sockaddr* addr, socklen_t* addrlen) {
  671. if (hdl->type != TYPE_SOCK)
  672. return -ENOTSOCK;
  673. struct shim_sock_handle* sock = &hdl->info.sock;
  674. int ret;
  675. PAL_HANDLE accepted = NULL;
  676. if (sock->sock_type != SOCK_STREAM) {
  677. debug("shim_accept: not a stream socket\n");
  678. return -EOPNOTSUPP;
  679. }
  680. if (addr) {
  681. if (!addrlen || test_user_memory(addrlen, sizeof(*addrlen), false))
  682. return -EINVAL;
  683. if (*addrlen < minimal_addrlen(sock->domain))
  684. return -EINVAL;
  685. if (test_user_memory(addr, *addrlen, true))
  686. return -EINVAL;
  687. }
  688. lock(&hdl->lock);
  689. if (sock->sock_state != SOCK_LISTENED) {
  690. debug("shim_accpet: invalid socket\n");
  691. ret = -EINVAL;
  692. goto out;
  693. }
  694. accepted = DkStreamWaitForClient(hdl->pal_handle);
  695. if (!accepted) {
  696. ret = -PAL_ERRNO;
  697. goto out;
  698. }
  699. if (flags & O_NONBLOCK) {
  700. PAL_STREAM_ATTR attr;
  701. if (!DkStreamAttributesQueryByHandle(accepted, &attr)) {
  702. ret = -PAL_ERRNO;
  703. goto out;
  704. }
  705. attr.nonblocking = PAL_TRUE;
  706. if (!DkStreamAttributesSetByHandle(accepted, &attr)) {
  707. ret = -PAL_ERRNO;
  708. goto out;
  709. }
  710. }
  711. struct shim_handle* cli = get_new_handle();
  712. if (!cli) {
  713. ret = -ENOMEM;
  714. goto out;
  715. }
  716. struct shim_sock_handle* cli_sock = &cli->info.sock;
  717. cli->type = TYPE_SOCK;
  718. set_handle_fs(cli, &socket_builtin_fs);
  719. cli->acc_mode = MAY_READ | MAY_WRITE;
  720. cli->flags = O_RDWR | flags;
  721. cli->pal_handle = accepted;
  722. accepted = NULL;
  723. cli_sock->domain = sock->domain;
  724. cli_sock->sock_type = sock->sock_type;
  725. cli_sock->protocol = sock->protocol;
  726. cli_sock->sock_state = SOCK_ACCEPTED;
  727. if (sock->domain == AF_UNIX) {
  728. cli_sock->addr.un.pipeid = sock->addr.un.pipeid;
  729. if (sock->addr.un.dentry) {
  730. get_dentry(sock->addr.un.dentry);
  731. cli_sock->addr.un.dentry = sock->addr.un.dentry;
  732. }
  733. qstrsetstr(&cli->uri, qstrgetstr(&hdl->uri), hdl->uri.len);
  734. if (addr) {
  735. unix_copy_addr(addr, sock->addr.un.dentry);
  736. if (addrlen)
  737. *addrlen = sizeof(struct sockaddr_un);
  738. }
  739. }
  740. if (sock->domain == AF_INET || sock->domain == AF_INET6) {
  741. char uri[SOCK_URI_SIZE];
  742. int uri_len;
  743. if (!(uri_len = DkStreamGetName(cli->pal_handle, uri, SOCK_URI_SIZE))) {
  744. ret = -PAL_ERRNO;
  745. goto out_cli;
  746. }
  747. if ((ret = inet_parse_addr(cli_sock->domain, cli_sock->sock_type, uri,
  748. &cli_sock->addr.in.bind, &cli_sock->addr.in.conn)) < 0)
  749. goto out_cli;
  750. qstrsetstr(&cli->uri, uri, uri_len);
  751. inet_rebase_port(true, cli_sock->domain, &cli_sock->addr.in.bind, true);
  752. inet_rebase_port(true, cli_sock->domain, &cli_sock->addr.in.conn, false);
  753. if (addr) {
  754. inet_copy_addr(sock->domain, addr, &sock->addr.in.conn);
  755. if (addrlen) {
  756. assert(sock->domain == AF_INET || sock->domain == AF_INET6);
  757. *addrlen = minimal_addrlen(sock->domain);
  758. }
  759. }
  760. }
  761. ret = set_new_fd_handle(cli, flags & O_CLOEXEC ? FD_CLOEXEC : 0, NULL);
  762. out_cli:
  763. put_handle(cli);
  764. out:
  765. if (ret < 0)
  766. sock->error = -ret;
  767. if (accepted)
  768. DkObjectClose(accepted);
  769. unlock(&hdl->lock);
  770. return ret;
  771. }
  772. int shim_do_accept(int fd, struct sockaddr* addr, socklen_t* addrlen) {
  773. int flags;
  774. struct shim_handle* hdl = get_fd_handle(fd, &flags, NULL);
  775. if (!hdl)
  776. return -EBADF;
  777. int ret = __do_accept(hdl, flags & O_CLOEXEC, addr, addrlen);
  778. put_handle(hdl);
  779. return ret;
  780. }
  781. int shim_do_accept4(int fd, struct sockaddr* addr, socklen_t* addrlen, int flags) {
  782. struct shim_handle* hdl = get_fd_handle(fd, NULL, NULL);
  783. if (!hdl)
  784. return -EBADF;
  785. int ret = __do_accept(
  786. hdl, (flags & SOCK_CLOEXEC ? O_CLOEXEC : 0) | (flags & SOCK_NONBLOCK ? O_NONBLOCK : 0),
  787. addr, addrlen);
  788. put_handle(hdl);
  789. return ret;
  790. }
  791. static ssize_t do_sendmsg(int fd, struct iovec* bufs, int nbufs, int flags,
  792. const struct sockaddr* addr, socklen_t addrlen) {
  793. // Issue #752 - https://github.com/oscarlab/graphene/issues/752
  794. __UNUSED(flags);
  795. struct shim_handle* hdl = get_fd_handle(fd, NULL, NULL);
  796. if (!hdl)
  797. return -EBADF;
  798. ssize_t ret = -ENOTSOCK;
  799. if (hdl->type != TYPE_SOCK)
  800. goto out;
  801. struct shim_sock_handle* sock = &hdl->info.sock;
  802. ret = -EFAULT;
  803. if (addr && test_user_memory((void*)addr, addrlen, false))
  804. goto out;
  805. if (!bufs || test_user_memory(bufs, sizeof(*bufs) * nbufs, false))
  806. goto out;
  807. for (int i = 0; i < nbufs; i++) {
  808. if (!bufs[i].iov_base || test_user_memory(bufs[i].iov_base, bufs[i].iov_len, false))
  809. goto out;
  810. }
  811. lock(&hdl->lock);
  812. PAL_HANDLE pal_hdl = hdl->pal_handle;
  813. char* uri = NULL;
  814. /* Data gram sock need not be conneted or bound at all */
  815. if (sock->sock_type == SOCK_STREAM && sock->sock_state != SOCK_CONNECTED &&
  816. sock->sock_state != SOCK_BOUNDCONNECTED && sock->sock_state != SOCK_ACCEPTED) {
  817. ret = -ENOTCONN;
  818. goto out_locked;
  819. }
  820. if (sock->sock_type == SOCK_DGRAM && sock->sock_state == SOCK_SHUTDOWN) {
  821. ret = -ENOTCONN;
  822. goto out_locked;
  823. }
  824. if (!(hdl->acc_mode & MAY_WRITE)) {
  825. ret = -ECONNRESET;
  826. goto out_locked;
  827. }
  828. if (sock->sock_type == SOCK_DGRAM && sock->sock_state != SOCK_BOUNDCONNECTED &&
  829. sock->sock_state != SOCK_CONNECTED) {
  830. if (!addr) {
  831. ret = -EDESTADDRREQ;
  832. goto out_locked;
  833. }
  834. if (sock->sock_state == SOCK_CREATED && !pal_hdl) {
  835. pal_hdl = DkStreamOpen(URI_PREFIX_UDP, 0, 0, 0, hdl->flags & O_NONBLOCK);
  836. if (!pal_hdl) {
  837. ret = -PAL_ERRNO;
  838. goto out_locked;
  839. }
  840. hdl->pal_handle = pal_hdl;
  841. }
  842. if (addr && addr->sa_family != sock->domain) {
  843. ret = -EINVAL;
  844. goto out_locked;
  845. }
  846. uri = __alloca(SOCK_URI_SIZE);
  847. }
  848. unlock(&hdl->lock);
  849. if (uri) {
  850. struct addr_inet addr_buf;
  851. inet_save_addr(sock->domain, &addr_buf, addr);
  852. inet_rebase_port(false, sock->domain, &addr_buf, false);
  853. size_t prefix_len = static_strlen(URI_PREFIX_UDP);
  854. memcpy(uri, URI_PREFIX_UDP, prefix_len + 1);
  855. if ((ret = inet_translate_addr(sock->domain,
  856. uri + prefix_len,
  857. SOCK_URI_SIZE - prefix_len,
  858. &addr_buf)) < 0) {
  859. lock(&hdl->lock);
  860. goto out_locked;
  861. }
  862. debug("next packet send to %s\n", uri);
  863. }
  864. int bytes = 0;
  865. ret = 0;
  866. for (int i = 0; i < nbufs; i++) {
  867. PAL_NUM pal_ret = DkStreamWrite(pal_hdl, 0, bufs[i].iov_len, bufs[i].iov_base, uri);
  868. if (pal_ret == PAL_STREAM_ERROR) {
  869. ret = (PAL_NATIVE_ERRNO == PAL_ERROR_STREAMEXIST) ? -ECONNABORTED : -PAL_ERRNO;
  870. break;
  871. }
  872. bytes += pal_ret;
  873. }
  874. if (bytes)
  875. ret = bytes;
  876. if (ret < 0) {
  877. lock(&hdl->lock);
  878. goto out_locked;
  879. }
  880. goto out;
  881. out_locked:
  882. if (ret < 0)
  883. sock->error = -ret;
  884. unlock(&hdl->lock);
  885. out:
  886. put_handle(hdl);
  887. return ret;
  888. }
  889. ssize_t shim_do_sendto(int sockfd, const void* buf, size_t len, int flags,
  890. const struct sockaddr* addr, socklen_t addrlen) {
  891. struct iovec iovbuf;
  892. iovbuf.iov_base = (void*)buf;
  893. iovbuf.iov_len = len;
  894. return do_sendmsg(sockfd, &iovbuf, 1, flags, addr, addrlen);
  895. }
  896. ssize_t shim_do_sendmsg(int sockfd, struct msghdr* msg, int flags) {
  897. return do_sendmsg(sockfd, msg->msg_iov, msg->msg_iovlen, flags, msg->msg_name,
  898. msg->msg_namelen);
  899. }
  900. ssize_t shim_do_sendmmsg(int sockfd, struct mmsghdr* msg, size_t vlen, int flags) {
  901. ssize_t total = 0;
  902. for (size_t i = 0; i * sizeof(struct mmsghdr) < vlen; i++) {
  903. struct msghdr* m = &msg[i].msg_hdr;
  904. ssize_t bytes =
  905. do_sendmsg(sockfd, m->msg_iov, m->msg_iovlen, flags, m->msg_name, m->msg_namelen);
  906. if (bytes < 0)
  907. return total > 0 ? total : bytes;
  908. msg[i].msg_len = bytes;
  909. total++;
  910. }
  911. return total;
  912. }
  913. static ssize_t do_recvmsg(int fd, struct iovec* bufs, int nbufs, int flags, struct sockaddr* addr,
  914. socklen_t* addrlen) {
  915. /* TODO handle flags properly. For now, explicitly return an error. */
  916. if (flags) {
  917. debug("recvmsg()/recvmmsg()/recvfrom(): flags parameter unsupported.\n");
  918. return -EOPNOTSUPP;
  919. }
  920. struct shim_handle* hdl = get_fd_handle(fd, NULL, NULL);
  921. if (!hdl)
  922. return -EBADF;
  923. int ret = -ENOTSOCK;
  924. if (hdl->type != TYPE_SOCK)
  925. goto out;
  926. struct shim_sock_handle* sock = &hdl->info.sock;
  927. if (addr) {
  928. ret = -EINVAL;
  929. if (!addrlen || test_user_memory(addrlen, sizeof(*addrlen), false))
  930. goto out;
  931. if (*addrlen < minimal_addrlen(sock->domain))
  932. goto out;
  933. if (test_user_memory(addr, *addrlen, true))
  934. goto out;
  935. }
  936. ret = -EFAULT;
  937. if (!bufs || test_user_memory(bufs, sizeof(*bufs) * nbufs, false))
  938. goto out;
  939. for (int i = 0; i < nbufs; i++) {
  940. if (!bufs[i].iov_base || test_user_memory(bufs[i].iov_base, bufs[i].iov_len, true))
  941. goto out;
  942. }
  943. lock(&hdl->lock);
  944. PAL_HANDLE pal_hdl = hdl->pal_handle;
  945. char* uri = NULL;
  946. if (sock->sock_type == SOCK_STREAM && sock->sock_state != SOCK_CONNECTED &&
  947. sock->sock_state != SOCK_BOUNDCONNECTED && sock->sock_state != SOCK_ACCEPTED) {
  948. ret = -ENOTCONN;
  949. goto out_locked;
  950. }
  951. if (!(hdl->acc_mode & MAY_READ)) {
  952. ret = 0;
  953. goto out_locked;
  954. }
  955. if (addr && sock->sock_type == SOCK_DGRAM && sock->sock_state != SOCK_CONNECTED &&
  956. sock->sock_state != SOCK_BOUNDCONNECTED) {
  957. if (sock->sock_state == SOCK_CREATED) {
  958. ret = -EINVAL;
  959. goto out_locked;
  960. }
  961. uri = __alloca(SOCK_URI_SIZE);
  962. }
  963. unlock(&hdl->lock);
  964. bool address_received = false;
  965. int bytes = 0;
  966. ret = 0;
  967. for (int i = 0; i < nbufs; i++) {
  968. PAL_NUM pal_ret = DkStreamRead(pal_hdl, 0, bufs[i].iov_len, bufs[i].iov_base, uri, uri ? SOCK_URI_SIZE : 0);
  969. if (pal_ret == PAL_STREAM_ERROR) {
  970. ret = (PAL_NATIVE_ERRNO == PAL_ERROR_STREAMNOTEXIST) ? -ECONNABORTED : -PAL_ERRNO;
  971. break;
  972. }
  973. bytes += pal_ret;
  974. if (addr && !address_received) {
  975. if (sock->domain == AF_UNIX) {
  976. unix_copy_addr(addr, sock->addr.un.dentry);
  977. *addrlen = sizeof(struct sockaddr_un);
  978. }
  979. if (sock->domain == AF_INET || sock->domain == AF_INET6) {
  980. if (uri) {
  981. struct addr_inet conn;
  982. if ((ret = inet_parse_addr(sock->domain, sock->sock_type, uri, &conn, NULL)) < 0) {
  983. lock(&hdl->lock);
  984. goto out_locked;
  985. }
  986. debug("last packet received from %s\n", uri);
  987. inet_rebase_port(true, sock->domain, &conn, false);
  988. inet_copy_addr(sock->domain, addr, &conn);
  989. } else {
  990. inet_copy_addr(sock->domain, addr, &sock->addr.in.conn);
  991. }
  992. *addrlen = (sock->domain == AF_INET) ? sizeof(struct sockaddr_in)
  993. : sizeof(struct sockaddr_in6);
  994. }
  995. address_received = true;
  996. }
  997. /* gap in iovecs is not allowed, return a partial read to user; it is the responsibility of
  998. * user application to deal with partial reads */
  999. if (pal_ret < bufs[i].iov_len)
  1000. break;
  1001. }
  1002. if (bytes)
  1003. ret = bytes;
  1004. if (ret < 0) {
  1005. lock(&hdl->lock);
  1006. goto out_locked;
  1007. }
  1008. goto out;
  1009. out_locked:
  1010. if (ret < 0)
  1011. sock->error = -ret;
  1012. unlock(&hdl->lock);
  1013. out:
  1014. put_handle(hdl);
  1015. return ret;
  1016. }
  1017. ssize_t shim_do_recvfrom(int sockfd, void* buf, size_t len, int flags, struct sockaddr* addr,
  1018. socklen_t* addrlen) {
  1019. struct iovec iovbuf;
  1020. iovbuf.iov_base = (void*)buf;
  1021. iovbuf.iov_len = len;
  1022. return do_recvmsg(sockfd, &iovbuf, 1, flags, addr, addrlen);
  1023. }
  1024. ssize_t shim_do_recvmsg(int sockfd, struct msghdr* msg, int flags) {
  1025. return do_recvmsg(sockfd, msg->msg_iov, msg->msg_iovlen, flags, msg->msg_name,
  1026. &msg->msg_namelen);
  1027. }
  1028. ssize_t shim_do_recvmmsg(int sockfd, struct mmsghdr* msg, size_t vlen, int flags,
  1029. struct __kernel_timespec* timeout) {
  1030. ssize_t total = 0;
  1031. // Issue # 753 - https://github.com/oscarlab/graphene/issues/753
  1032. /* TODO(donporter): timeout properly. For now, explicitly return an error. */
  1033. if (timeout) {
  1034. debug("recvmmsg(): timeout parameter unsupported.\n");
  1035. return -EOPNOTSUPP;
  1036. }
  1037. for (size_t i = 0; i * sizeof(struct mmsghdr) < vlen; i++) {
  1038. struct msghdr* m = &msg[i].msg_hdr;
  1039. ssize_t bytes =
  1040. do_recvmsg(sockfd, m->msg_iov, m->msg_iovlen, flags, m->msg_name, &m->msg_namelen);
  1041. if (bytes < 0)
  1042. return total > 0 ? total : bytes;
  1043. msg[i].msg_len = bytes;
  1044. total++;
  1045. }
  1046. return total;
  1047. }
  1048. #define SHUT_RD 0
  1049. #define SHUT_WR 1
  1050. #define SHUT_RDWR 2
  1051. int shim_do_shutdown(int sockfd, int how) {
  1052. struct shim_handle* hdl = get_fd_handle(sockfd, NULL, NULL);
  1053. if (!hdl)
  1054. return -EBADF;
  1055. int ret = 0;
  1056. struct shim_sock_handle* sock = &hdl->info.sock;
  1057. if (hdl->type != TYPE_SOCK) {
  1058. ret = -ENOTSOCK;
  1059. goto out;
  1060. }
  1061. lock(&hdl->lock);
  1062. if (sock->sock_state != SOCK_LISTENED && sock->sock_state != SOCK_ACCEPTED &&
  1063. sock->sock_state != SOCK_CONNECTED && sock->sock_state != SOCK_BOUNDCONNECTED) {
  1064. ret = -ENOTCONN;
  1065. goto out_locked;
  1066. }
  1067. switch (how) {
  1068. case SHUT_RD:
  1069. DkStreamDelete(hdl->pal_handle, PAL_DELETE_RD);
  1070. hdl->acc_mode &= ~MAY_READ;
  1071. break;
  1072. case SHUT_WR:
  1073. DkStreamDelete(hdl->pal_handle, PAL_DELETE_WR);
  1074. hdl->acc_mode &= ~MAY_WRITE;
  1075. break;
  1076. case SHUT_RDWR:
  1077. DkStreamDelete(hdl->pal_handle, 0);
  1078. hdl->acc_mode = 0;
  1079. sock->sock_state = SOCK_SHUTDOWN;
  1080. break;
  1081. }
  1082. ret = 0;
  1083. out_locked:
  1084. if (ret < 0)
  1085. sock->error = -ret;
  1086. unlock(&hdl->lock);
  1087. out:
  1088. put_handle(hdl);
  1089. return ret;
  1090. }
  1091. int shim_do_getsockname(int sockfd, struct sockaddr* addr, int* addrlen) {
  1092. if (!addr || !addrlen)
  1093. return -EFAULT;
  1094. if (*addrlen <= 0)
  1095. return -EINVAL;
  1096. if (test_user_memory(addr, *addrlen, true))
  1097. return -EFAULT;
  1098. struct shim_handle* hdl = get_fd_handle(sockfd, NULL, NULL);
  1099. if (!hdl)
  1100. return -EBADF;
  1101. int ret = -EINVAL;
  1102. if (hdl->type != TYPE_SOCK) {
  1103. ret = -ENOTSOCK;
  1104. goto out;
  1105. }
  1106. struct shim_sock_handle* sock = &hdl->info.sock;
  1107. lock(&hdl->lock);
  1108. struct sockaddr saddr;
  1109. int len = inet_copy_addr(sock->domain, &saddr, &sock->addr.in.bind);
  1110. if (len < *addrlen)
  1111. len = *addrlen;
  1112. memcpy(addr, &saddr, len);
  1113. *addrlen = len;
  1114. ret = 0;
  1115. unlock(&hdl->lock);
  1116. out:
  1117. put_handle(hdl);
  1118. return ret;
  1119. }
  1120. int shim_do_getpeername(int sockfd, struct sockaddr* addr, int* addrlen) {
  1121. if (!addr || !addrlen)
  1122. return -EFAULT;
  1123. if (*addrlen <= 0)
  1124. return -EINVAL;
  1125. if (test_user_memory(addr, *addrlen, true))
  1126. return -EFAULT;
  1127. struct shim_handle* hdl = get_fd_handle(sockfd, NULL, NULL);
  1128. if (!hdl)
  1129. return -EBADF;
  1130. int ret = -EINVAL;
  1131. if (hdl->type != TYPE_SOCK) {
  1132. ret = -ENOTSOCK;
  1133. goto out;
  1134. }
  1135. struct shim_sock_handle* sock = &hdl->info.sock;
  1136. lock(&hdl->lock);
  1137. /* Data gram sock need not be conneted or bound at all */
  1138. if (sock->sock_type == SOCK_STREAM && sock->sock_state != SOCK_CONNECTED &&
  1139. sock->sock_state != SOCK_BOUNDCONNECTED && sock->sock_state != SOCK_ACCEPTED) {
  1140. ret = -ENOTCONN;
  1141. goto out_locked;
  1142. }
  1143. if (sock->sock_type == SOCK_DGRAM && sock->sock_state != SOCK_CONNECTED &&
  1144. sock->sock_state != SOCK_BOUNDCONNECTED) {
  1145. ret = -ENOTCONN;
  1146. goto out_locked;
  1147. }
  1148. struct sockaddr saddr;
  1149. int len = inet_copy_addr(sock->domain, &saddr, &sock->addr.in.conn);
  1150. if (len < *addrlen)
  1151. len = *addrlen;
  1152. memcpy(addr, &saddr, len);
  1153. *addrlen = len;
  1154. ret = 0;
  1155. out_locked:
  1156. unlock(&hdl->lock);
  1157. out:
  1158. put_handle(hdl);
  1159. return ret;
  1160. }
  1161. struct __kernel_linger {
  1162. int l_onoff;
  1163. int l_linger;
  1164. };
  1165. static int __do_setsockopt(struct shim_handle* hdl, int level, int optname, char* optval,
  1166. int optlen, PAL_STREAM_ATTR* attr) {
  1167. // Issue 754 - https://github.com/oscarlab/graphene/issues/754
  1168. __UNUSED(optlen);
  1169. int intval = *((int*)optval);
  1170. PAL_BOL bolval = intval ? PAL_TRUE : PAL_FALSE;
  1171. if (level == SOL_SOCKET) {
  1172. switch (optname) {
  1173. case SO_ACCEPTCONN:
  1174. case SO_DOMAIN:
  1175. case SO_ERROR:
  1176. case SO_PROTOCOL:
  1177. case SO_TYPE:
  1178. return -EPERM;
  1179. case SO_KEEPALIVE:
  1180. case SO_LINGER:
  1181. case SO_RCVBUF:
  1182. case SO_SNDBUF:
  1183. case SO_RCVTIMEO:
  1184. case SO_SNDTIMEO:
  1185. case SO_REUSEADDR:
  1186. goto query;
  1187. default:
  1188. goto unknown;
  1189. }
  1190. }
  1191. if (level == SOL_TCP) {
  1192. switch (optname) {
  1193. case TCP_CORK:
  1194. case TCP_NODELAY:
  1195. goto query;
  1196. default:
  1197. goto unknown;
  1198. }
  1199. }
  1200. unknown:
  1201. return -ENOPROTOOPT;
  1202. query:
  1203. if (!attr) {
  1204. attr = __alloca(sizeof(PAL_STREAM_ATTR));
  1205. if (!DkStreamAttributesQueryByHandle(hdl->pal_handle, attr))
  1206. return -PAL_ERRNO;
  1207. }
  1208. if (level == SOL_SOCKET) {
  1209. switch (optname) {
  1210. case SO_KEEPALIVE:
  1211. if (bolval != attr->socket.tcp_keepalive) {
  1212. attr->socket.tcp_keepalive = bolval;
  1213. goto set;
  1214. }
  1215. break;
  1216. case SO_LINGER: {
  1217. struct __kernel_linger* l = (struct __kernel_linger*)optval;
  1218. int linger = l->l_onoff ? l->l_linger : 0;
  1219. if (linger != (int)attr->socket.linger) {
  1220. attr->socket.linger = linger;
  1221. goto set;
  1222. }
  1223. break;
  1224. }
  1225. case SO_RCVBUF:
  1226. if (intval != (int)attr->socket.receivebuf) {
  1227. attr->socket.receivebuf = intval;
  1228. goto set;
  1229. }
  1230. break;
  1231. case SO_SNDBUF:
  1232. if (intval != (int)attr->socket.sendbuf) {
  1233. attr->socket.sendbuf = intval;
  1234. goto set;
  1235. }
  1236. break;
  1237. case SO_RCVTIMEO:
  1238. if (intval != (int)attr->socket.receivetimeout) {
  1239. attr->socket.receivetimeout = intval;
  1240. goto set;
  1241. }
  1242. break;
  1243. case SO_SNDTIMEO:
  1244. if (intval != (int)attr->socket.sendtimeout) {
  1245. attr->socket.sendtimeout = intval;
  1246. goto set;
  1247. }
  1248. break;
  1249. case SO_REUSEADDR:
  1250. break;
  1251. }
  1252. }
  1253. if (level == SOL_TCP) {
  1254. switch (optname) {
  1255. case TCP_CORK:
  1256. if (bolval != attr->socket.tcp_cork) {
  1257. attr->socket.tcp_cork = bolval;
  1258. goto set;
  1259. }
  1260. break;
  1261. case TCP_NODELAY:
  1262. if (bolval != attr->socket.tcp_nodelay) {
  1263. attr->socket.tcp_nodelay = bolval;
  1264. goto set;
  1265. }
  1266. break;
  1267. }
  1268. }
  1269. return 0;
  1270. set:
  1271. if (!DkStreamAttributesSetByHandle(hdl->pal_handle, attr))
  1272. return -PAL_ERRNO;
  1273. return 0;
  1274. }
  1275. static int __process_pending_options(struct shim_handle* hdl) {
  1276. struct shim_sock_handle* sock = &hdl->info.sock;
  1277. if (!sock->pending_options)
  1278. return 0;
  1279. PAL_STREAM_ATTR attr;
  1280. if (!DkStreamAttributesQueryByHandle(hdl->pal_handle, &attr))
  1281. return -PAL_ERRNO;
  1282. struct shim_sock_option* o = sock->pending_options;
  1283. while (o) {
  1284. PAL_STREAM_ATTR tmp = attr;
  1285. int ret = __do_setsockopt(hdl, o->level, o->optname, o->optval, o->optlen, &tmp);
  1286. if (!ret)
  1287. attr = tmp;
  1288. struct shim_sock_option* next = o->next;
  1289. free(o);
  1290. o = next;
  1291. }
  1292. return 0;
  1293. }
  1294. int shim_do_setsockopt(int fd, int level, int optname, char* optval, int optlen) {
  1295. if (!optval)
  1296. return -EFAULT;
  1297. struct shim_handle* hdl = get_fd_handle(fd, NULL, NULL);
  1298. if (!hdl)
  1299. return -EBADF;
  1300. int ret = 0;
  1301. if (hdl->type != TYPE_SOCK) {
  1302. ret = -ENOTSOCK;
  1303. goto out;
  1304. }
  1305. struct shim_sock_handle* sock = &hdl->info.sock;
  1306. lock(&hdl->lock);
  1307. if (!hdl->pal_handle) {
  1308. struct shim_sock_option* o = malloc(sizeof(struct shim_sock_option) + optlen);
  1309. if (!o) {
  1310. ret = -ENOMEM;
  1311. goto out_locked;
  1312. }
  1313. struct shim_sock_option** next = &sock->pending_options;
  1314. while (*next) {
  1315. next = &(*next)->next;
  1316. }
  1317. o->next = NULL;
  1318. *next = o;
  1319. o->level = level;
  1320. o->optname = optname;
  1321. o->optlen = optlen;
  1322. memcpy(&o->optval, optval, optlen);
  1323. goto out_locked;
  1324. }
  1325. ret = __do_setsockopt(hdl, level, optname, optval, optlen, NULL);
  1326. out_locked:
  1327. unlock(&hdl->lock);
  1328. out:
  1329. put_handle(hdl);
  1330. return ret;
  1331. }
  1332. int shim_do_getsockopt(int fd, int level, int optname, char* optval, int* optlen) {
  1333. if (!optval || !optlen)
  1334. return -EFAULT;
  1335. struct shim_handle* hdl = get_fd_handle(fd, NULL, NULL);
  1336. if (!hdl)
  1337. return -EBADF;
  1338. int ret = 0;
  1339. if (hdl->type != TYPE_SOCK) {
  1340. ret = -ENOTSOCK;
  1341. goto out;
  1342. }
  1343. struct shim_sock_handle* sock = &hdl->info.sock;
  1344. lock(&hdl->lock);
  1345. int* intval = (int*)optval;
  1346. if (level == SOL_SOCKET) {
  1347. switch (optname) {
  1348. case SO_ACCEPTCONN:
  1349. *intval = (sock->sock_state == SOCK_LISTENED) ? 1 : 0;
  1350. goto out;
  1351. case SO_DOMAIN:
  1352. *intval = sock->domain;
  1353. goto out;
  1354. case SO_ERROR:
  1355. *intval = sock->error;
  1356. goto out;
  1357. case SO_PROTOCOL:
  1358. switch (sock->protocol) {
  1359. case SOCK_STREAM:
  1360. *intval = IPPROTO_SCTP;
  1361. break;
  1362. case SOCK_DGRAM:
  1363. *intval = IPPROTO_UDP;
  1364. break;
  1365. default:
  1366. goto unknown;
  1367. }
  1368. goto out;
  1369. case SO_TYPE:
  1370. *intval = sock->sock_type;
  1371. goto out;
  1372. case SO_KEEPALIVE:
  1373. case SO_LINGER:
  1374. case SO_RCVBUF:
  1375. case SO_SNDBUF:
  1376. case SO_RCVTIMEO:
  1377. case SO_SNDTIMEO:
  1378. case SO_REUSEADDR:
  1379. goto query;
  1380. default:
  1381. goto unknown;
  1382. }
  1383. }
  1384. if (level == SOL_TCP) {
  1385. switch (optname) {
  1386. case TCP_CORK:
  1387. case TCP_NODELAY:
  1388. goto query;
  1389. default:
  1390. goto unknown;
  1391. }
  1392. }
  1393. unknown:
  1394. ret = -ENOPROTOOPT;
  1395. goto out;
  1396. query:
  1397. {
  1398. PAL_STREAM_ATTR attr;
  1399. if (!DkStreamAttributesQueryByHandle(hdl->pal_handle, &attr)) {
  1400. ret = -PAL_ERRNO;
  1401. goto out;
  1402. }
  1403. if (level == SOL_SOCKET) {
  1404. switch (optname) {
  1405. case SO_KEEPALIVE:
  1406. *intval = attr.socket.tcp_keepalive ? 1 : 0;
  1407. break;
  1408. case SO_LINGER: {
  1409. struct __kernel_linger* l = (struct __kernel_linger*)optval;
  1410. l->l_onoff = attr.socket.linger ? 1 : 0;
  1411. l->l_linger = attr.socket.linger;
  1412. break;
  1413. }
  1414. case SO_RCVBUF:
  1415. *intval = attr.socket.receivebuf;
  1416. break;
  1417. case SO_SNDBUF:
  1418. *intval = attr.socket.sendbuf;
  1419. break;
  1420. case SO_RCVTIMEO:
  1421. *intval = attr.socket.receivetimeout;
  1422. break;
  1423. case SO_SNDTIMEO:
  1424. *intval = attr.socket.sendtimeout;
  1425. break;
  1426. case SO_REUSEADDR:
  1427. *intval = 1;
  1428. break;
  1429. }
  1430. }
  1431. if (level == SOL_TCP) {
  1432. switch (optname) {
  1433. case TCP_CORK:
  1434. *intval = attr.socket.tcp_cork ? 1 : 0;
  1435. break;
  1436. case TCP_NODELAY:
  1437. *intval = attr.socket.tcp_nodelay ? 1 : 0;
  1438. break;
  1439. }
  1440. }
  1441. }
  1442. out:
  1443. unlock(&hdl->lock);
  1444. put_handle(hdl);
  1445. return ret;
  1446. }