shim_ipc_sysv.c 31 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039
  1. /* Copyright (C) 2014 Stony Brook University
  2. This file is part of Graphene Library OS.
  3. Graphene Library OS is free software: you can redistribute it and/or
  4. modify it under the terms of the GNU Lesser General Public License
  5. as published by the Free Software Foundation, either version 3 of the
  6. License, or (at your option) any later version.
  7. Graphene Library OS is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU Lesser General Public License for more details.
  11. You should have received a copy of the GNU Lesser General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>. */
  13. /*
  14. * shim_ipc_sysv.c
  15. *
  16. * This file contains functions and callbacks to handle IPC of SYSV namespace.
  17. */
  18. #include <shim_internal.h>
  19. #include <shim_thread.h>
  20. #include <shim_ipc.h>
  21. #include <shim_checkpoint.h>
  22. #include <shim_sysv.h>
  23. #include <pal.h>
  24. #include <pal_error.h>
  25. #include <errno.h>
  26. #define SYSV_RANGE_SIZE 128
  27. #define SYSV_LEASE_TIME 1000
  28. #define KEY_HASH(k) ((k)->key)
  29. #define KEY_COMP(k1, k2) \
  30. ((k1)->key != (k2)->key || (k1)->type != (k2)->type)
  31. #define KEY_COPY(k1, k2) \
  32. do { (k1)->key = (k2)->key; (k1)->type = (k2)->type; } while (0)
  33. #define NS sysv
  34. #define NS_CAP SYSV
  35. #define NS_KEY struct sysv_key
  36. #define INCLUDE_IPC_NSIMPL
  37. #include "shim_ipc_nsimpl.h"
  38. int init_ns_sysv (void)
  39. {
  40. init_namespace();
  41. return 0;
  42. }
  43. DEFINE_PROFILE_INTERVAL(ipc_sysv_delres_send, ipc);
  44. DEFINE_PROFILE_INTERVAL(ipc_sysv_delres_callback, ipc);
  45. int ipc_sysv_delres_send (struct shim_ipc_port * port, IDTYPE dest,
  46. IDTYPE resid, enum sysv_type type)
  47. {
  48. BEGIN_PROFILE_INTERVAL();
  49. int ret = 0;
  50. bool owned = false;
  51. if (!port) {
  52. if ((ret = connect_owner(resid, &port, &dest)) < 0)
  53. goto out;
  54. owned = true;
  55. }
  56. if (!owned) {
  57. size_t total_msg_size = get_ipc_msg_size(sizeof(struct shim_ipc_sysv_delres));
  58. struct shim_ipc_msg* msg = __alloca(total_msg_size);
  59. init_ipc_msg(msg, IPC_SYSV_DELRES, total_msg_size, dest);
  60. struct shim_ipc_sysv_delres * msgin = (struct shim_ipc_sysv_delres *)
  61. &msg->msg;
  62. msgin->resid = resid;
  63. msgin->type = type;
  64. debug("ipc send to %u: IPC_SYSV_DELRES(%u, %s)\n", dest, resid,
  65. SYSV_TYPE_STR(type));
  66. ret = send_ipc_message(msg, port);
  67. goto out;
  68. }
  69. size_t total_msg_size = get_ipc_msg_duplex_size(sizeof(struct shim_ipc_sysv_delres));
  70. struct shim_ipc_msg_duplex* msg = __alloca(total_msg_size);
  71. init_ipc_msg_duplex(msg, IPC_SYSV_DELRES, total_msg_size, dest);
  72. struct shim_ipc_sysv_delres * msgin = (struct shim_ipc_sysv_delres *)
  73. &msg->msg.msg;
  74. msgin->resid = resid;
  75. msgin->type = type;
  76. debug("ipc send to %u: IPC_SYSV_DELRES(%u, %s)\n", dest, resid,
  77. SYSV_TYPE_STR(type));
  78. ret = send_ipc_message_duplex(msg, port, NULL, NULL);
  79. put_ipc_port(port);
  80. out:
  81. SAVE_PROFILE_INTERVAL(ipc_sysv_delres_send);
  82. return ret;
  83. }
  84. int ipc_sysv_delres_callback (IPC_CALLBACK_ARGS)
  85. {
  86. __UNUSED(port);
  87. BEGIN_PROFILE_INTERVAL();
  88. int ret = 0;
  89. struct shim_ipc_sysv_delres * msgin =
  90. (struct shim_ipc_sysv_delres *) &msg->msg;
  91. debug("ipc callback from %u: IPC_SYSV_DELRES(%u, %s)\n", msg->src,
  92. msgin->resid, SYSV_TYPE_STR(msgin->type));
  93. bool owned = false;
  94. ret = -ENOENT;
  95. switch(msgin->type) {
  96. case SYSV_MSGQ: {
  97. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->resid);
  98. if (!msgq)
  99. goto out;
  100. owned = msgq->owned;
  101. ret = del_msg_handle(msgq);
  102. break;
  103. }
  104. case SYSV_SEM: {
  105. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->resid);
  106. if (!sem)
  107. goto out;
  108. owned = sem->owned;
  109. ret = del_sem_handle(sem);
  110. break;
  111. }
  112. default:
  113. ret = -ENOSYS;
  114. break;
  115. }
  116. if (!ret)
  117. ret = owned ? RESPONSE_CALLBACK : 0;
  118. out:
  119. SAVE_PROFILE_INTERVAL(ipc_sysv_delres_callback);
  120. return ret;
  121. }
  122. DEFINE_PROFILE_INTERVAL(ipc_sysv_movres_send, ipc);
  123. DEFINE_PROFILE_INTERVAL(ipc_sysv_movres_callback, ipc);
  124. int ipc_sysv_movres_send (struct sysv_client * client, IDTYPE owner,
  125. const char * uri, LEASETYPE lease, IDTYPE resid,
  126. enum sysv_type type)
  127. {
  128. BEGIN_PROFILE_INTERVAL();
  129. int ret = 0;
  130. int len = strlen(uri);
  131. size_t total_msg_size = get_ipc_msg_size(sizeof(struct shim_ipc_sysv_movres) + len);
  132. struct shim_ipc_msg* msg = __alloca(total_msg_size);
  133. init_ipc_msg(msg, IPC_SYSV_MOVRES, total_msg_size, client->vmid);
  134. struct shim_ipc_sysv_movres * msgin = (struct shim_ipc_sysv_movres *)
  135. &msg->msg;
  136. msgin->resid = resid;
  137. msgin->type = type;
  138. msgin->owner = owner;
  139. msgin->lease = lease;
  140. memcpy(msgin->uri, uri, len + 1);
  141. msg->seq = client->seq;
  142. debug("ipc send to %u: IPC_SYSV_MOVRES(%u, %s, %u, %s)\n", client->vmid,
  143. resid, SYSV_TYPE_STR(type), owner, uri);
  144. ret = send_ipc_message(msg, client->port);
  145. SAVE_PROFILE_INTERVAL(ipc_sysv_movres_send);
  146. return ret;
  147. }
  148. int ipc_sysv_movres_callback (IPC_CALLBACK_ARGS)
  149. {
  150. BEGIN_PROFILE_INTERVAL();
  151. int ret = 0;
  152. struct shim_ipc_sysv_movres * msgin =
  153. (struct shim_ipc_sysv_movres *) &msg->msg;
  154. debug("ipc callback from %u: IPC_SYSV_MOVRES(%u, %s, %u, %s)\n", msg->src,
  155. msgin->resid, SYSV_TYPE_STR(msgin->type), msgin->owner, msgin->uri);
  156. struct shim_ipc_msg_duplex * obj = pop_ipc_msg_duplex(port, msg->seq);
  157. if (!obj)
  158. goto out;
  159. switch(msgin->type) {
  160. case SYSV_MSGQ:
  161. case SYSV_SEM:
  162. obj->retval = -EAGAIN;
  163. break;
  164. default:
  165. ret = -ENOSYS;
  166. goto out;
  167. }
  168. add_sysv_subrange(msgin->resid, msgin->owner, msgin->uri, &msgin->lease);
  169. if (obj->thread)
  170. thread_wakeup(obj->thread);
  171. out:
  172. SAVE_PROFILE_INTERVAL(ipc_sysv_movres_callback);
  173. return ret;
  174. }
  175. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgsnd_send, ipc);
  176. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgsnd_callback, ipc);
  177. int ipc_sysv_msgsnd_send (struct shim_ipc_port * port, IDTYPE dest,
  178. IDTYPE msgid, long msgtype,
  179. const void * buf, size_t size, unsigned long seq)
  180. {
  181. BEGIN_PROFILE_INTERVAL();
  182. int ret = 0;
  183. bool owned = true;
  184. if (!dest) {
  185. if ((ret = connect_owner(msgid, &port, &dest)) < 0)
  186. goto out;
  187. owned = false;
  188. }
  189. size_t total_msg_size = get_ipc_msg_size(sizeof(struct shim_ipc_sysv_msgsnd) + size);
  190. struct shim_ipc_msg* msg = __alloca(total_msg_size);
  191. init_ipc_msg(msg, IPC_SYSV_MSGSND, total_msg_size, dest);
  192. struct shim_ipc_sysv_msgsnd * msgin =
  193. (struct shim_ipc_sysv_msgsnd *) &msg->msg;
  194. msgin->msgid = msgid;
  195. msgin->msgtype = msgtype;
  196. memcpy(msgin->msg, buf, size);
  197. msg->seq = seq;
  198. debug("ipc send to %u: IPC_SYSV_MSGSND(%u, %ld)\n", dest,
  199. msgid, msgtype);
  200. ret = send_ipc_message(msg, port);
  201. if (!owned)
  202. put_ipc_port(port);
  203. out:
  204. SAVE_PROFILE_INTERVAL(ipc_sysv_msgsnd_send);
  205. return ret;
  206. }
  207. int ipc_sysv_msgsnd_callback (IPC_CALLBACK_ARGS)
  208. {
  209. BEGIN_PROFILE_INTERVAL();
  210. int ret = 0;
  211. struct shim_ipc_sysv_msgsnd * msgin =
  212. (struct shim_ipc_sysv_msgsnd *) &msg->msg;
  213. debug("ipc callback from %u: IPC_SYSV_MSGSND(%u, %ld)\n", msg->src,
  214. msgin->msgid, msgin->msgtype);
  215. size_t size = msg->size - sizeof(*msg) - sizeof(*msgin);
  216. if (msg->seq) {
  217. struct shim_ipc_msg_duplex * obj = pop_ipc_msg_duplex(port, msg->seq);
  218. void * priv = obj ? obj->private : NULL;
  219. if (priv) {
  220. struct shim_ipc_sysv_msgrcv * rcv =
  221. (struct shim_ipc_sysv_msgrcv *) obj->msg.msg;
  222. if (size > rcv->size)
  223. size = rcv->size;
  224. memcpy(priv, msgin->msg, size);
  225. obj->retval = size;
  226. if (obj->thread)
  227. thread_wakeup(obj->thread);
  228. goto out;
  229. }
  230. }
  231. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->msgid);
  232. if (!msgq) {
  233. ret = -ENOENT;
  234. goto out;
  235. }
  236. if (msg->seq) {
  237. ret = add_sysv_msg(msgq, msgin->msgtype, size, msgin->msg, NULL);
  238. } else {
  239. struct sysv_client src;
  240. src.port = port;
  241. src.vmid = msg->src;
  242. src.seq = msg->seq;
  243. ret = add_sysv_msg(msgq, msgin->msgtype, size, msgin->msg, &src);
  244. }
  245. out:
  246. SAVE_PROFILE_INTERVAL(ipc_sysv_msgsnd_callback);
  247. return ret;
  248. }
  249. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgrcv_send, ipc);
  250. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgrcv_callback, ipc);
  251. int ipc_sysv_msgrcv_send (IDTYPE msgid, long msgtype, int flags, void * buf,
  252. size_t size)
  253. {
  254. BEGIN_PROFILE_INTERVAL();
  255. IDTYPE owner;
  256. struct shim_ipc_port * port = NULL;
  257. int ret = 0;
  258. if ((ret = connect_owner(msgid, &port, &owner)) < 0)
  259. goto out;
  260. if (owner == cur_process.vmid) {
  261. ret = -EAGAIN;
  262. goto out;
  263. }
  264. assert(port);
  265. size_t total_msg_size = get_ipc_msg_duplex_size(sizeof(struct shim_ipc_sysv_msgrcv));
  266. struct shim_ipc_msg_duplex* msg = __alloca(total_msg_size);
  267. init_ipc_msg_duplex(msg, IPC_SYSV_MSGRCV, total_msg_size, owner);
  268. struct shim_ipc_sysv_msgrcv * msgin =
  269. (struct shim_ipc_sysv_msgrcv *) &msg->msg.msg;
  270. msgin->msgid = msgid;
  271. msgin->msgtype = msgtype;
  272. msgin->size = size;
  273. msgin->flags = flags;
  274. debug("ipc send to %u: IPC_SYSV_MSGRCV(%u, %ld)\n", owner,
  275. msgid, msgtype);
  276. ret = send_ipc_message_duplex(msg, port, NULL, buf);
  277. put_ipc_port(port);
  278. out:
  279. SAVE_PROFILE_INTERVAL(ipc_sysv_msgrcv_send);
  280. return ret;
  281. }
  282. int ipc_sysv_msgrcv_callback (IPC_CALLBACK_ARGS)
  283. {
  284. BEGIN_PROFILE_INTERVAL();
  285. int ret = 0;
  286. struct shim_ipc_sysv_msgrcv * msgin =
  287. (struct shim_ipc_sysv_msgrcv *) &msg->msg;
  288. debug("ipc callback from %u: IPC_SYSV_MSGRCV(%u, %ld)\n", msg->src,
  289. msgin->msgid, msgin->msgtype);
  290. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->msgid);
  291. if (!msgq) {
  292. ret = -ENOENT;
  293. goto out;
  294. }
  295. void * buf = __alloca(msgin->size);
  296. struct sysv_client src;
  297. src.port = port;
  298. src.vmid = msg->src;
  299. src.seq = msg->seq;
  300. ret = get_sysv_msg(msgq, msgin->msgtype, msgin->size, buf, msgin->flags,
  301. &src);
  302. if (ret > 0) {
  303. size_t size = ret;
  304. ret = ipc_sysv_msgsnd_send(port, msg->src, msgin->msgid, msgin->msgtype,
  305. buf, size, msg->seq);
  306. }
  307. put_msg_handle(msgq);
  308. out:
  309. SAVE_PROFILE_INTERVAL(ipc_sysv_msgrcv_callback);
  310. return ret;
  311. }
  312. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgmov_send, ipc);
  313. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgmov_callback, ipc);
  314. int ipc_sysv_msgmov_send (struct shim_ipc_port * port, IDTYPE dest,
  315. IDTYPE msgid, LEASETYPE lease,
  316. struct sysv_score * scores, int nscores)
  317. {
  318. BEGIN_PROFILE_INTERVAL();
  319. size_t total_msg_size = get_ipc_msg_size(sizeof(struct shim_ipc_sysv_msgmov) +
  320. sizeof(struct sysv_score) * nscores);
  321. struct shim_ipc_msg* msg = __alloca(total_msg_size);
  322. init_ipc_msg(msg, IPC_SYSV_MSGMOV, total_msg_size, dest);
  323. struct shim_ipc_sysv_msgmov * msgin =
  324. (struct shim_ipc_sysv_msgmov *) &msg->msg;
  325. msgin->msgid = msgid;
  326. msgin->lease = lease;
  327. msgin->nscores = nscores;
  328. if (nscores)
  329. memcpy(msgin->scores, scores, sizeof(struct sysv_score) * nscores);
  330. debug("ipc send to %u: IPC_SYSV_MSGMOV(%d)\n", dest, msgid);
  331. int ret = send_ipc_message(msg, port);
  332. SAVE_PROFILE_INTERVAL(ipc_sysv_msgmov_send);
  333. return ret;
  334. }
  335. int ipc_sysv_msgmov_callback (IPC_CALLBACK_ARGS)
  336. {
  337. __UNUSED(port);
  338. BEGIN_PROFILE_INTERVAL();
  339. int ret = 0;
  340. struct shim_ipc_sysv_msgmov * msgin =
  341. (struct shim_ipc_sysv_msgmov *) &msg->msg;
  342. debug("ipc callback from %u: IPC_SYSV_MSGMOV(%d)\n", msg->src,
  343. msgin->msgid);
  344. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->msgid);
  345. if (!msgq) {
  346. ret = -ENOENT;
  347. goto out;
  348. }
  349. struct shim_handle * hdl = container_of(msgq, struct shim_handle,
  350. info.msg);
  351. lock(&hdl->lock);
  352. int nscores = (msgin->nscores > MAX_SYSV_CLIENTS) ?
  353. MAX_SYSV_CLIENTS : msgin->nscores;
  354. if (nscores)
  355. memcpy(msgq->scores, msgin->scores, nscores);
  356. if (nscores < MAX_SYSV_CLIENTS)
  357. memset(msgq->scores + nscores, 0,
  358. sizeof(struct sysv_score) * (MAX_SYSV_CLIENTS - nscores));
  359. unlock(&hdl->lock);
  360. ret = recover_msg_ownership(msgq);
  361. struct shim_ipc_info * info;
  362. if (!get_ipc_info_cur_process(&info)) {
  363. add_sysv_subrange(msgin->msgid, info->vmid, qstrgetstr(&info->uri),
  364. &msgin->lease);
  365. put_ipc_info(info);
  366. }
  367. put_msg_handle(msgq);
  368. out:
  369. SAVE_PROFILE_INTERVAL(ipc_sysv_msgmov_callback);
  370. return ret;
  371. }
  372. DEFINE_PROFILE_INTERVAL(ipc_sysv_semop_send, ipc);
  373. DEFINE_PROFILE_INTERVAL(ipc_sysv_semop_callback, ipc);
  374. int ipc_sysv_semop_send (IDTYPE semid, struct sembuf * sops, int nsops,
  375. unsigned long timeout, unsigned long * seq)
  376. {
  377. BEGIN_PROFILE_INTERVAL();
  378. IDTYPE owner;
  379. struct shim_ipc_port * port = NULL;
  380. int ret = 0;
  381. bool waitforreply = false;
  382. for (int i = 0 ; i < nsops ; i++)
  383. if (sops[i].sem_op <= 0) {
  384. waitforreply = true;
  385. break;
  386. }
  387. if ((ret = connect_owner(semid, &port, &owner)) < 0)
  388. goto out;
  389. if (owner == cur_process.vmid) {
  390. ret = -EAGAIN;
  391. goto out;
  392. }
  393. assert(port);
  394. if (!waitforreply) {
  395. size_t total_msg_size = get_ipc_msg_size(sizeof(struct shim_ipc_sysv_semop) +
  396. sizeof(struct sembuf) * nsops);
  397. struct shim_ipc_msg* msg = __alloca(total_msg_size);
  398. init_ipc_msg(msg, IPC_SYSV_SEMOP, total_msg_size, owner);
  399. struct shim_ipc_sysv_semop * msgin =
  400. (struct shim_ipc_sysv_semop *) &msg->msg;
  401. msgin->semid = semid;
  402. msgin->timeout = timeout;
  403. msgin->nsops = nsops;
  404. memcpy(msgin->sops, sops, sizeof(struct sembuf) * nsops);
  405. msg->seq = *seq;
  406. debug("ipc send to %u: IPC_SYSV_SEMOP(%u, %ld, %u)\n", owner, semid,
  407. timeout, nsops);
  408. ret = send_ipc_message(msg, port);
  409. put_ipc_port(port);
  410. goto out;
  411. }
  412. size_t total_msg_size = get_ipc_msg_duplex_size(sizeof(struct shim_ipc_sysv_semop) +
  413. sizeof(struct sembuf) * nsops);
  414. struct shim_ipc_msg_duplex* msg = __alloca(total_msg_size);
  415. init_ipc_msg_duplex(msg, IPC_SYSV_SEMOP, total_msg_size, owner);
  416. struct shim_ipc_sysv_semop * msgin =
  417. (struct shim_ipc_sysv_semop *) &msg->msg.msg;
  418. msgin->semid = semid;
  419. msgin->timeout = timeout;
  420. msgin->nsops = nsops;
  421. memcpy(msgin->sops, sops, sizeof(struct sembuf) * nsops);
  422. msg->msg.seq = *seq;
  423. debug("ipc send to %u: IPC_SYSV_SEMOP(%u, %ld, %u)\n", owner, semid,
  424. timeout, nsops);
  425. ret = send_ipc_message_duplex(msg, port, seq, NULL);
  426. put_ipc_port(port);
  427. out:
  428. SAVE_PROFILE_INTERVAL(ipc_sysv_semop_send);
  429. return ret;
  430. }
  431. int ipc_sysv_semop_callback (IPC_CALLBACK_ARGS)
  432. {
  433. BEGIN_PROFILE_INTERVAL();
  434. int ret = 0;
  435. struct shim_ipc_sysv_semop * msgin =
  436. (struct shim_ipc_sysv_semop *) &msg->msg;
  437. debug("ipc callback from %u: IPC_SYSV_SEMOP(%u, %ld, %u)\n", msg->src,
  438. msgin->semid, msgin->timeout, msgin->nsops);
  439. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  440. if (!sem) {
  441. ret = -ENOENT;
  442. goto out;
  443. }
  444. struct sysv_client client;
  445. client.port = port;
  446. client.vmid = msg->src;
  447. client.seq = msg->seq;
  448. ret = submit_sysv_sem(sem, msgin->sops, msgin->nsops, msgin->timeout,
  449. &client);
  450. put_sem_handle(sem);
  451. out:
  452. SAVE_PROFILE_INTERVAL(ipc_sysv_semop_callback);
  453. return ret;
  454. }
  455. DEFINE_PROFILE_INTERVAL(ipc_sysv_semctl_send, ipc);
  456. DEFINE_PROFILE_INTERVAL(ipc_sysv_semctl_callback, ipc);
  457. int ipc_sysv_semctl_send (IDTYPE semid, int semnum, int cmd, void * vals,
  458. size_t valsize)
  459. {
  460. BEGIN_PROFILE_INTERVAL();
  461. IDTYPE owner;
  462. struct shim_ipc_port * port = NULL;
  463. int ret = 0;
  464. if ((ret = connect_owner(semid, &port, &owner)) < 0)
  465. goto out;
  466. int ctlvalsize = (cmd == SETALL || cmd == SETVAL) ? valsize : 0;
  467. size_t total_msg_size = get_ipc_msg_duplex_size(sizeof(struct shim_ipc_sysv_semctl) + ctlvalsize);
  468. struct shim_ipc_msg_duplex* msg = __alloca(total_msg_size);
  469. init_ipc_msg_duplex(msg, IPC_SYSV_SEMCTL, total_msg_size, owner);
  470. struct shim_ipc_sysv_semctl * msgin =
  471. (struct shim_ipc_sysv_semctl *) &msg->msg.msg;
  472. msgin->semid = semid;
  473. msgin->semnum = semnum;
  474. msgin->cmd = cmd;
  475. msgin->valsize = ctlvalsize;
  476. if (ctlvalsize)
  477. memcpy(msgin->vals, vals, ctlvalsize);
  478. debug("ipc send to %u: IPC_SYSV_SEMCTL(%u, %d, %d)\n", owner, semid,
  479. semnum, cmd);
  480. ret = send_ipc_message_duplex(msg, port, NULL, vals);
  481. put_ipc_port(port);
  482. out:
  483. SAVE_PROFILE_INTERVAL(ipc_sysv_semctl_send);
  484. return ret;
  485. }
  486. int ipc_sysv_semctl_callback (IPC_CALLBACK_ARGS)
  487. {
  488. BEGIN_PROFILE_INTERVAL();
  489. int ret = 0;
  490. struct shim_ipc_sysv_semctl * msgin =
  491. (struct shim_ipc_sysv_semctl *) &msg->msg;
  492. debug("ipc callback from %u: IPC_SYSV_SEMCTL(%u, %d, %d)\n", msg->src,
  493. msgin->semid, msgin->semnum, msgin->cmd);
  494. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  495. if (!sem) {
  496. ret = -ENOENT;
  497. goto out;
  498. }
  499. void * vals = NULL;
  500. size_t valsize;
  501. switch(msgin->cmd) {
  502. case GETALL: {
  503. unsigned short * allsems = __alloca(sizeof(unsigned short) *
  504. sem->nsems);
  505. for (int i = 0 ; i < sem->nsems ; i++)
  506. allsems[i] = sem->sems[i].val;
  507. vals = allsems;
  508. valsize = sizeof(unsigned short) * sem->nsems;
  509. goto semret;
  510. }
  511. case GETNCNT:
  512. vals = &sem->sems[msgin->semnum].ncnt;
  513. valsize = sizeof(unsigned short);
  514. goto semret;
  515. case GETPID:
  516. vals = &sem->sems[msgin->semnum].pid;
  517. valsize = sizeof(IDTYPE);
  518. goto semret;
  519. case GETVAL:
  520. vals = &sem->sems[msgin->semnum].val;
  521. valsize = sizeof(unsigned short);
  522. goto semret;
  523. case GETZCNT:
  524. vals = &sem->sems[msgin->semnum].zcnt;
  525. valsize = sizeof(unsigned short);
  526. break;
  527. case SETALL: {
  528. if (msgin->valsize != sizeof(unsigned short) * sem->nsems) {
  529. ret = -EINVAL;
  530. break;
  531. }
  532. unsigned short * vals = (void *) msgin->vals;
  533. for (int i = 0 ; i < sem->nsems ; i++)
  534. sem->sems[i].val = vals[i];
  535. ret = RESPONSE_CALLBACK;
  536. break;
  537. }
  538. case SETVAL: {
  539. ret = -EINVAL;
  540. if (msgin->valsize != sizeof(unsigned short))
  541. break;
  542. if (msgin->semnum >= sem->nsems)
  543. break;
  544. sem->sems[msgin->semnum].val = *((int *) msgin->vals);
  545. ret = RESPONSE_CALLBACK;
  546. break;
  547. }
  548. default:
  549. ret = -ENOSYS;
  550. break;
  551. }
  552. put_sem_handle(sem);
  553. goto out;
  554. semret:
  555. ret = ipc_sysv_semret_send(port, msg->src, vals, valsize,
  556. msg->seq);
  557. out:
  558. SAVE_PROFILE_INTERVAL(ipc_sysv_semctl_callback);
  559. return ret;
  560. }
  561. DEFINE_PROFILE_INTERVAL(ipc_sysv_semret_send, ipc);
  562. DEFINE_PROFILE_INTERVAL(ipc_sysv_semret_callback, ipc);
  563. int ipc_sysv_semret_send (struct shim_ipc_port * port, IDTYPE dest, void * vals,
  564. size_t valsize, unsigned long seq)
  565. {
  566. BEGIN_PROFILE_INTERVAL();
  567. int ret = 0;
  568. size_t total_msg_size = get_ipc_msg_size(sizeof(struct shim_ipc_sysv_semret) + valsize);
  569. struct shim_ipc_msg* msg = __alloca(total_msg_size);
  570. init_ipc_msg(msg, IPC_SYSV_SEMRET, total_msg_size, dest);
  571. struct shim_ipc_sysv_semret * msgin =
  572. (struct shim_ipc_sysv_semret *) &msg->msg;
  573. msgin->valsize = valsize;
  574. memcpy(msgin->vals, vals, valsize);
  575. msg->seq = seq;
  576. debug("ipc send to %u: IPC_SYSV_SEMRET\n", dest);
  577. ret = send_ipc_message(msg, port);
  578. SAVE_PROFILE_INTERVAL(ipc_sysv_semret_send);
  579. return ret;
  580. }
  581. int ipc_sysv_semret_callback (IPC_CALLBACK_ARGS)
  582. {
  583. BEGIN_PROFILE_INTERVAL();
  584. struct shim_ipc_sysv_semret * semret =
  585. (struct shim_ipc_sysv_semret *) &msg->msg;
  586. debug("ipc callback from %u: IPC_SYSV_SEMRET\n", msg->src);
  587. struct shim_ipc_msg_duplex * obj = pop_ipc_msg_duplex(port, msg->seq);
  588. if (obj) {
  589. struct shim_ipc_sysv_semctl * semctl =
  590. (struct shim_ipc_sysv_semctl *) &obj->msg.msg;
  591. void * vals = obj->private;
  592. if (vals) {
  593. switch(semctl->cmd) {
  594. case GETALL:
  595. case GETNCNT:
  596. case GETPID:
  597. case GETVAL:
  598. case GETZCNT: {
  599. size_t retvalsize = semret->valsize;
  600. if (retvalsize > semctl->valsize)
  601. retvalsize = semctl->valsize;
  602. memcpy(vals, semret->vals, retvalsize);
  603. break;
  604. }
  605. }
  606. }
  607. if (obj->thread)
  608. thread_wakeup(obj->thread);
  609. }
  610. SAVE_PROFILE_INTERVAL(ipc_sysv_semret_callback);
  611. return 0;
  612. }
  613. DEFINE_PROFILE_INTERVAL(ipc_sysv_semmov_send, ipc);
  614. DEFINE_PROFILE_INTERVAL(ipc_sysv_semmov_callback, ipc);
  615. int ipc_sysv_semmov_send (struct shim_ipc_port * port, IDTYPE dest,
  616. IDTYPE semid, LEASETYPE lease,
  617. struct sem_backup * sems, int nsems,
  618. struct sem_client_backup * srcs, int nsrcs,
  619. struct sysv_score * scores, int nscores)
  620. {
  621. BEGIN_PROFILE_INTERVAL();
  622. size_t total_msg_size = get_ipc_msg_size(sizeof(struct shim_ipc_sysv_semmov) +
  623. sizeof(struct sem_backup) * nsems +
  624. sizeof(struct sem_client_backup) * nsrcs +
  625. sizeof(struct sysv_score) * nscores);
  626. struct shim_ipc_msg* msg = __alloca(total_msg_size);
  627. init_ipc_msg(msg, IPC_SYSV_SEMMOV, total_msg_size, dest);
  628. struct shim_ipc_sysv_semmov * msgin =
  629. (struct shim_ipc_sysv_semmov *) &msg->msg;
  630. msgin->semid = semid;
  631. msgin->lease = lease;
  632. msgin->nsems = nsems;
  633. msgin->nsrcs = nsrcs;
  634. msgin->nscores = nscores;
  635. memcpy(&msgin->sems, sems, sizeof(struct sem_backup) * nsems);
  636. memcpy((void *) msgin->sems + sizeof(struct sem_backup) * nsems,
  637. srcs, sizeof(struct sem_client_backup) * nsrcs);
  638. memcpy((void *) msgin->sems + sizeof(struct sem_backup) * nsems +
  639. sizeof(struct sem_client_backup) * nsrcs,
  640. scores, sizeof(struct sysv_score) * nscores);
  641. debug("ipc send to : IPC_SYSV_SEMMOV(%d)\n", semid);
  642. int ret = send_ipc_message(msg, port);
  643. SAVE_PROFILE_INTERVAL(ipc_sysv_semmov_send);
  644. return ret;
  645. }
  646. int ipc_sysv_semmov_callback (IPC_CALLBACK_ARGS)
  647. {
  648. __UNUSED(port);
  649. BEGIN_PROFILE_INTERVAL();
  650. int ret = 0;
  651. struct shim_ipc_sysv_semmov * msgin =
  652. (struct shim_ipc_sysv_semmov *) &msg->msg;
  653. debug("ipc callback from %u: IPC_SYSV_SEMMOV(%d)\n", msg->src,
  654. msgin->semid);
  655. struct sem_backup * sems = msgin->sems;
  656. struct sem_client_backup * clients =
  657. (struct sem_client_backup *) (sems + msgin->nsems);
  658. struct sysv_score * scores =
  659. (struct sysv_score *) (clients + msgin->nsrcs);
  660. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  661. if (!sem) {
  662. ret = -ENOENT;
  663. goto out;
  664. }
  665. struct shim_handle * hdl = container_of(sem, struct shim_handle,
  666. info.sem);
  667. lock(&hdl->lock);
  668. int nscores = (msgin->nscores > MAX_SYSV_CLIENTS) ?
  669. MAX_SYSV_CLIENTS : msgin->nscores;
  670. if (nscores)
  671. memcpy(sem->scores, scores, nscores);
  672. if (nscores < MAX_SYSV_CLIENTS)
  673. memset(sem->scores + nscores, 0,
  674. sizeof(struct sysv_score) * (MAX_SYSV_CLIENTS - nscores));
  675. unlock(&hdl->lock);
  676. ret = recover_sem_ownership(sem, sems, msgin->nsems, clients,
  677. msgin->nsrcs);
  678. struct shim_ipc_info * info;
  679. if (!get_ipc_info_cur_process(&info)) {
  680. add_sysv_subrange(msgin->semid, info->vmid, qstrgetstr(&info->uri),
  681. &msgin->lease);
  682. put_ipc_info(info);
  683. }
  684. put_sem_handle(sem);
  685. out:
  686. SAVE_PROFILE_INTERVAL(ipc_sysv_semmov_callback);
  687. return ret;
  688. }
  689. #ifdef USE_SHARED_SEMAPHORE
  690. DEFINE_PROFILE_INTERVAL(ipc_sysv_semquery_send, ipc);
  691. DEFINE_PROFILE_INTERVAL(ipc_sysv_semquery_callback, ipc);
  692. int ipc_sysv_semquery_send (IDTYPE semid, int * nsems,
  693. PAL_NUM ** host_sem_ids)
  694. {
  695. BEGIN_PROFILE_INTERVAL();
  696. int ret = 0;
  697. IDTYPE dest;
  698. struct shim_ipc_port * port = NULL;
  699. if ((ret = connect_owner(semid, &port, &dest)) < 0)
  700. goto out;
  701. if (dest == cur_process.vmid) {
  702. ret = -EAGAIN;
  703. goto out;
  704. }
  705. assert(port);
  706. size_t total_msg_size = get_ipc_msg_duplex_size(sizeof(struct shim_ipc_sysv_semquery));
  707. struct shim_ipc_msg_duplex* msg = __alloca(total_msg_size);
  708. init_ipc_msg_duplex(msg, IPC_SYSV_SEMQUERY, total_msg_size, dest);
  709. struct shim_ipc_sysv_semquery * msgin =
  710. (struct shim_ipc_sysv_semquery *) &msg->msg.msg;
  711. msgin->semid = semid;
  712. debug("ipc send to %u: IPC_SYSV_SEMQUERY(%u)\n", dest, semid);
  713. ret = send_ipc_message_duplex(msg, port, NULL, host_sem_ids);
  714. put_ipc_port(port);
  715. if (ret >= 0) {
  716. *nsems = ret;
  717. ret = 0;
  718. }
  719. out:
  720. SAVE_PROFILE_INTERVAL(ipc_sysv_semquery_send);
  721. return ret;
  722. }
  723. int ipc_sysv_semquery_callback (IPC_CALLBACK_ARGS)
  724. {
  725. BEGIN_PROFILE_INTERVAL();
  726. int ret = 0;
  727. struct shim_ipc_sysv_semquery * msgin =
  728. (struct shim_ipc_sysv_semquery *) &msg->msg;
  729. debug("ipc callback from %u: IPC_SYSV_SEMQUERY(%u)\n", msg->src,
  730. msgin->semid);
  731. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  732. if (!sem) {
  733. ret = -ENOENT;
  734. goto out;
  735. }
  736. ret = send_sem_host_ids(sem, port, msg->src, msg->seq);
  737. put_sem_handle(sem);
  738. out:
  739. SAVE_PROFILE_INTERVAL(ipc_sysv_semreply_callback);
  740. return ret;
  741. }
  742. DEFINE_PROFILE_INTERVAL(ipc_sysv_semreply_send, ipc);
  743. DEFINE_PROFILE_INTERVAL(ipc_sysv_semreply_callback, ipc);
  744. int ipc_sysv_semreply_send (struct shim_ipc_port * port, IDTYPE dest,
  745. IDTYPE semid, int nsems, PAL_NUM * host_sem_ids,
  746. unsigned long seq)
  747. {
  748. BEGIN_PROFILE_INTERVAL();
  749. int ret = 0;
  750. size_t total_msg_size = get_ipc_msg_size(sizeof(struct shim_ipc_sysv_semreply) +
  751. sizeof(PAL_NUM) * nsems);
  752. struct shim_ipc_msg* msg = __alloca(total_msg_size);
  753. init_ipc_msg(msg, IPC_SYSV_SEMREPLY, total_msg_size, dest);
  754. struct shim_ipc_sysv_semreply * msgin =
  755. (struct shim_ipc_sysv_semreply *) &msg->msg;
  756. msgin->semid = semid;
  757. msgin->nsems = nsems;
  758. if (nsems)
  759. memcpy(msgin->host_sem_ids, host_sem_ids, sizeof(PAL_NUM) * nsems);
  760. msg->seq = seq;
  761. debug("ipc send to %u: IPC_SYSV_SEMREPLY(%u, %d)\n", dest, semid, nsems);
  762. ret = send_ipc_message(msg, port);
  763. SAVE_PROFILE_INTERVAL(ipc_sysv_semreply_send);
  764. return ret;
  765. }
  766. int ipc_sysv_semreply_callback (IPC_CALLBACK_ARGS)
  767. {
  768. BEGIN_PROFILE_INTERVAL();
  769. int ret = 0;
  770. struct shim_ipc_sysv_semreply * msgin =
  771. (struct shim_ipc_sysv_semreply *) &msg->msg;
  772. debug("ipc callback from %u: IPC_SYSV_SEMREPLY(%u, %d)\n", msg->src,
  773. msgin->semid, msgin->nsems);
  774. struct shim_ipc_msg_duplex * obj = pop_ipc_msg_duplex(port, msg->seq);
  775. if (!obj)
  776. goto out;
  777. PAL_NUM ** semids = obj->private;
  778. if (semids)
  779. *semids = malloc_copy(msgin->host_sem_ids,
  780. sizeof(PAL_NUM) * msgin->nsems);
  781. obj->retval = msgin->nsems;
  782. if (obj->thread)
  783. thread_wakeup(obj->thread);
  784. out:
  785. SAVE_PROFILE_INTERVAL(ipc_sysv_semreply_callback);
  786. return ret;
  787. }
  788. #endif /* USE_SHARED_SEMAPHORE */
  789. int __balance_sysv_score (struct sysv_balance_policy * policy,
  790. struct shim_handle * hdl,
  791. struct sysv_score * scores, int nscores,
  792. struct sysv_client * src, long score)
  793. {
  794. struct sysv_score * s = scores;
  795. struct sysv_score * last = scores + nscores;
  796. for ( ; s < last && !s->vmid ; s++);
  797. struct sysv_score * free = s > scores ? scores : NULL;
  798. struct sysv_score * highest = s < last ? s : NULL;
  799. struct sysv_score * lowest = highest;
  800. struct sysv_score * owner = NULL;
  801. struct sysv_score * chosen = NULL;
  802. for ( ; s < last ; s++) {
  803. if (!s->vmid) {
  804. if (!free)
  805. free = s;
  806. continue;
  807. }
  808. if (s->score >= highest->score)
  809. highest = s;
  810. if (s->score < lowest->score)
  811. lowest = s;
  812. if (src) {
  813. if (s->vmid == cur_process.vmid)
  814. owner = s;
  815. if (s->vmid == src->vmid) {
  816. chosen = s;
  817. continue;
  818. }
  819. } else {
  820. if (s->vmid == cur_process.vmid) {
  821. owner = chosen = s;
  822. continue;
  823. }
  824. }
  825. s->score = (s->score >= policy->score_decay) ?
  826. s->score - policy->score_decay : 0;
  827. debug("balance: %u => %ld\n", s->vmid, s->score);
  828. }
  829. if (!chosen) {
  830. chosen = free ? : lowest;
  831. chosen->vmid = src ? src->vmid : cur_process.vmid;
  832. chosen->score = 0;
  833. }
  834. chosen->score += score;
  835. if (chosen->score > policy->score_max)
  836. chosen->score = policy->score_max;
  837. debug("balance: %u => %ld\n", chosen->vmid, chosen->score);
  838. if (!src || chosen != highest ||
  839. chosen->score < (owner ? owner->score : 0) + policy->balance_threshold)
  840. return 0;
  841. return policy->migrate(hdl, src);
  842. }