shim_ipc_sysv.c 31 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046
  1. /* Copyright (C) 2014 Stony Brook University
  2. This file is part of Graphene Library OS.
  3. Graphene Library OS is free software: you can redistribute it and/or
  4. modify it under the terms of the GNU Lesser General Public License
  5. as published by the Free Software Foundation, either version 3 of the
  6. License, or (at your option) any later version.
  7. Graphene Library OS is distributed in the hope that it will be useful,
  8. but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. GNU Lesser General Public License for more details.
  11. You should have received a copy of the GNU Lesser General Public License
  12. along with this program. If not, see <http://www.gnu.org/licenses/>. */
/*
 * shim_ipc_sysv.c
 *
 * This file contains functions and callbacks to handle IPC of SYSV namespace.
 */
  18. #include <shim_internal.h>
  19. #include <shim_thread.h>
  20. #include <shim_ipc.h>
  21. #include <shim_checkpoint.h>
  22. #include <shim_sysv.h>
  23. #include <pal.h>
  24. #include <pal_error.h>
  25. #include <errno.h>
/*
 * Tunables and key helpers for the namespace template included below.
 * NOTE(review): presumably SYSV_RANGE_SIZE is the number of IDs per range
 * and SYSV_LEASE_TIME the lease duration; units are not visible here --
 * confirm against shim_ipc_nsimpl.h.
 */
#define SYSV_RANGE_SIZE 128
#define SYSV_LEASE_TIME 1000
/* Hash value of a key: its raw `key` field. */
#define KEY_HASH(k) ((k)->key)
/* Non-zero when the two keys DIFFER in `key` or `type`; zero when equal. */
#define KEY_COMP(k1, k2) \
    ((k1)->key != (k2)->key || (k1)->type != (k2)->type)
/* Copies `key` and `type` from k2 into k1. */
#define KEY_COPY(k1, k2) \
    do { (k1)->key = (k2)->key; (k1)->type = (k2)->type; } while (0)
/* Template parameters: these must be defined before the include below. */
#define NS sysv
#define NS_CAP SYSV
#define NS_KEY struct sysv_key
#define INCLUDE_IPC_NSIMPL
#include "shim_ipc_nsimpl.h"
  38. int init_ns_sysv (void)
  39. {
  40. init_namespace();
  41. return 0;
  42. }
  43. DEFINE_PROFILE_INTERVAL(ipc_sysv_delres_send, ipc);
  44. DEFINE_PROFILE_INTERVAL(ipc_sysv_delres_callback, ipc);
  45. int ipc_sysv_delres_send (struct shim_ipc_port * port, IDTYPE dest,
  46. IDTYPE resid, enum sysv_type type)
  47. {
  48. BEGIN_PROFILE_INTERVAL();
  49. int ret = 0;
  50. bool owned = false;
  51. if (!port) {
  52. if ((ret = connect_owner(resid, &port, &dest)) < 0)
  53. goto out;
  54. owned = true;
  55. }
  56. if (!owned) {
  57. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  58. IPC_SYSV_DELRES,
  59. sizeof(struct shim_ipc_sysv_delres),
  60. dest);
  61. struct shim_ipc_sysv_delres * msgin = (struct shim_ipc_sysv_delres *)
  62. &msg->msg;
  63. msgin->resid = resid;
  64. msgin->type = type;
  65. debug("ipc send to %u: IPC_SYSV_DELRES(%u, %s)\n", dest, resid,
  66. SYSV_TYPE_STR(type));
  67. ret = send_ipc_message(msg, port);
  68. goto out;
  69. }
  70. struct shim_ipc_msg_obj * msg = create_ipc_msg_duplex_on_stack(
  71. IPC_SYSV_DELRES,
  72. sizeof(struct shim_ipc_sysv_delres),
  73. dest);
  74. struct shim_ipc_sysv_delres * msgin = (struct shim_ipc_sysv_delres *)
  75. &msg->msg.msg;
  76. msgin->resid = resid;
  77. msgin->type = type;
  78. debug("ipc send to %u: IPC_SYSV_DELRES(%u, %s)\n", dest, resid,
  79. SYSV_TYPE_STR(type));
  80. ret = do_ipc_duplex(msg, port, NULL, NULL);
  81. put_ipc_port(port);
  82. out:
  83. SAVE_PROFILE_INTERVAL(ipc_sysv_delres_send);
  84. return ret;
  85. }
  86. int ipc_sysv_delres_callback (IPC_CALLBACK_ARGS)
  87. {
  88. __UNUSED(port);
  89. BEGIN_PROFILE_INTERVAL();
  90. int ret = 0;
  91. struct shim_ipc_sysv_delres * msgin =
  92. (struct shim_ipc_sysv_delres *) &msg->msg;
  93. debug("ipc callback from %u: IPC_SYSV_DELRES(%u, %s)\n", msg->src,
  94. msgin->resid, SYSV_TYPE_STR(msgin->type));
  95. bool owned = false;
  96. ret = -ENOENT;
  97. switch(msgin->type) {
  98. case SYSV_MSGQ: {
  99. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->resid);
  100. if (!msgq)
  101. goto out;
  102. owned = msgq->owned;
  103. ret = del_msg_handle(msgq);
  104. break;
  105. }
  106. case SYSV_SEM: {
  107. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->resid);
  108. if (!sem)
  109. goto out;
  110. owned = sem->owned;
  111. ret = del_sem_handle(sem);
  112. break;
  113. }
  114. default:
  115. ret = -ENOSYS;
  116. break;
  117. }
  118. if (!ret)
  119. ret = owned ? RESPONSE_CALLBACK : 0;
  120. out:
  121. SAVE_PROFILE_INTERVAL(ipc_sysv_delres_callback);
  122. return ret;
  123. }
  124. DEFINE_PROFILE_INTERVAL(ipc_sysv_movres_send, ipc);
  125. DEFINE_PROFILE_INTERVAL(ipc_sysv_movres_callback, ipc);
  126. int ipc_sysv_movres_send (struct sysv_client * client, IDTYPE owner,
  127. const char * uri, LEASETYPE lease, IDTYPE resid,
  128. enum sysv_type type)
  129. {
  130. BEGIN_PROFILE_INTERVAL();
  131. int ret = 0;
  132. int len = strlen(uri);
  133. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  134. IPC_SYSV_MOVRES,
  135. sizeof(struct shim_ipc_sysv_movres) +
  136. len, client->vmid);
  137. struct shim_ipc_sysv_movres * msgin = (struct shim_ipc_sysv_movres *)
  138. &msg->msg;
  139. msgin->resid = resid;
  140. msgin->type = type;
  141. msgin->owner = owner;
  142. msgin->lease = lease;
  143. memcpy(msgin->uri, uri, len + 1);
  144. msg->seq = client->seq;
  145. debug("ipc send to %u: IPC_SYSV_MOVRES(%u, %s, %u, %s)\n", client->vmid,
  146. resid, SYSV_TYPE_STR(type), owner, uri);
  147. ret = send_ipc_message(msg, client->port);
  148. SAVE_PROFILE_INTERVAL(ipc_sysv_movres_send);
  149. return ret;
  150. }
  151. int ipc_sysv_movres_callback (IPC_CALLBACK_ARGS)
  152. {
  153. BEGIN_PROFILE_INTERVAL();
  154. int ret = 0;
  155. struct shim_ipc_sysv_movres * msgin =
  156. (struct shim_ipc_sysv_movres *) &msg->msg;
  157. debug("ipc callback from %u: IPC_SYSV_MOVRES(%u, %s, %u, %s)\n", msg->src,
  158. msgin->resid, SYSV_TYPE_STR(msgin->type), msgin->owner, msgin->uri);
  159. struct shim_ipc_msg_obj * obj = find_ipc_msg_duplex(port, msg->seq);
  160. if (!obj)
  161. goto out;
  162. switch(msgin->type) {
  163. case SYSV_MSGQ:
  164. case SYSV_SEM:
  165. obj->retval = -EAGAIN;
  166. break;
  167. default:
  168. ret = -ENOSYS;
  169. goto out;
  170. }
  171. add_sysv_subrange(msgin->resid, msgin->owner, msgin->uri, &msgin->lease);
  172. if (obj->thread)
  173. thread_wakeup(obj->thread);
  174. out:
  175. SAVE_PROFILE_INTERVAL(ipc_sysv_movres_callback);
  176. return ret;
  177. }
  178. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgsnd_send, ipc);
  179. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgsnd_callback, ipc);
  180. int ipc_sysv_msgsnd_send (struct shim_ipc_port * port, IDTYPE dest,
  181. IDTYPE msgid, long msgtype,
  182. const void * buf, size_t size, unsigned long seq)
  183. {
  184. BEGIN_PROFILE_INTERVAL();
  185. int ret = 0;
  186. bool owned = true;
  187. if (!dest) {
  188. if ((ret = connect_owner(msgid, &port, &dest)) < 0)
  189. goto out;
  190. owned = false;
  191. }
  192. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  193. IPC_SYSV_MSGSND,
  194. sizeof(struct shim_ipc_sysv_msgsnd) +
  195. size, dest);
  196. struct shim_ipc_sysv_msgsnd * msgin =
  197. (struct shim_ipc_sysv_msgsnd *) &msg->msg;
  198. msgin->msgid = msgid;
  199. msgin->msgtype = msgtype;
  200. memcpy(msgin->msg, buf, size);
  201. msg->seq = seq;
  202. debug("ipc send to %u: IPC_SYSV_MSGSND(%u, %ld)\n", dest,
  203. msgid, msgtype);
  204. ret = send_ipc_message(msg, port);
  205. if (!owned)
  206. put_ipc_port(port);
  207. out:
  208. SAVE_PROFILE_INTERVAL(ipc_sysv_msgsnd_send);
  209. return ret;
  210. }
  211. int ipc_sysv_msgsnd_callback (IPC_CALLBACK_ARGS)
  212. {
  213. BEGIN_PROFILE_INTERVAL();
  214. int ret = 0;
  215. struct shim_ipc_sysv_msgsnd * msgin =
  216. (struct shim_ipc_sysv_msgsnd *) &msg->msg;
  217. debug("ipc callback from %u: IPC_SYSV_MSGSND(%u, %ld)\n", msg->src,
  218. msgin->msgid, msgin->msgtype);
  219. size_t size = msg->size - sizeof(*msg) - sizeof(*msgin);
  220. if (msg->seq) {
  221. struct shim_ipc_msg_obj * obj = find_ipc_msg_duplex(port, msg->seq);
  222. void * priv = obj ? obj->private : NULL;
  223. if (priv) {
  224. struct shim_ipc_sysv_msgrcv * rcv =
  225. (struct shim_ipc_sysv_msgrcv *) obj->msg.msg;
  226. if (size > rcv->size)
  227. size = rcv->size;
  228. memcpy(priv, msgin->msg, size);
  229. obj->retval = size;
  230. if (obj->thread)
  231. thread_wakeup(obj->thread);
  232. goto out;
  233. }
  234. }
  235. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->msgid);
  236. if (!msgq) {
  237. ret = -ENOENT;
  238. goto out;
  239. }
  240. if (msg->seq) {
  241. ret = add_sysv_msg(msgq, msgin->msgtype, size, msgin->msg, NULL);
  242. } else {
  243. struct sysv_client src;
  244. src.port = port;
  245. src.vmid = msg->src;
  246. src.seq = msg->seq;
  247. ret = add_sysv_msg(msgq, msgin->msgtype, size, msgin->msg, &src);
  248. }
  249. out:
  250. SAVE_PROFILE_INTERVAL(ipc_sysv_msgsnd_callback);
  251. return ret;
  252. }
  253. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgrcv_send, ipc);
  254. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgrcv_callback, ipc);
  255. int ipc_sysv_msgrcv_send (IDTYPE msgid, long msgtype, int flags, void * buf,
  256. size_t size)
  257. {
  258. BEGIN_PROFILE_INTERVAL();
  259. IDTYPE owner;
  260. struct shim_ipc_port * port = NULL;
  261. int ret = 0;
  262. if ((ret = connect_owner(msgid, &port, &owner)) < 0)
  263. goto out;
  264. if (owner == cur_process.vmid) {
  265. ret = -EAGAIN;
  266. goto out;
  267. }
  268. assert(port);
  269. struct shim_ipc_msg_obj * msg = create_ipc_msg_duplex_on_stack(
  270. IPC_SYSV_MSGRCV,
  271. sizeof(struct shim_ipc_sysv_msgrcv),
  272. true);
  273. struct shim_ipc_sysv_msgrcv * msgin =
  274. (struct shim_ipc_sysv_msgrcv *) &msg->msg.msg;
  275. msgin->msgid = msgid;
  276. msgin->msgtype = msgtype;
  277. msgin->size = size;
  278. msgin->flags = flags;
  279. debug("ipc send to %u: IPC_SYSV_MSGRCV(%u, %ld)\n", owner,
  280. msgid, msgtype);
  281. ret = do_ipc_duplex(msg, port, NULL, buf);
  282. put_ipc_port(port);
  283. out:
  284. SAVE_PROFILE_INTERVAL(ipc_sysv_msgrcv_send);
  285. return ret;
  286. }
  287. int ipc_sysv_msgrcv_callback (IPC_CALLBACK_ARGS)
  288. {
  289. BEGIN_PROFILE_INTERVAL();
  290. int ret = 0;
  291. struct shim_ipc_sysv_msgrcv * msgin =
  292. (struct shim_ipc_sysv_msgrcv *) &msg->msg;
  293. debug("ipc callback from %u: IPC_SYSV_MSGRCV(%u, %ld)\n", msg->src,
  294. msgin->msgid, msgin->msgtype);
  295. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->msgid);
  296. if (!msgq) {
  297. ret = -ENOENT;
  298. goto out;
  299. }
  300. void * buf = __alloca(msgin->size);
  301. struct sysv_client src;
  302. src.port = port;
  303. src.vmid = msg->src;
  304. src.seq = msg->seq;
  305. ret = get_sysv_msg(msgq, msgin->msgtype, msgin->size, buf, msgin->flags,
  306. &src);
  307. if (ret > 0) {
  308. size_t size = ret;
  309. ret = ipc_sysv_msgsnd_send(port, msg->src, msgin->msgid, msgin->msgtype,
  310. buf, size, msg->seq);
  311. }
  312. put_msg_handle(msgq);
  313. out:
  314. SAVE_PROFILE_INTERVAL(ipc_sysv_msgrcv_callback);
  315. return ret;
  316. }
  317. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgmov_send, ipc);
  318. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgmov_callback, ipc);
  319. int ipc_sysv_msgmov_send (struct shim_ipc_port * port, IDTYPE dest,
  320. IDTYPE msgid, LEASETYPE lease,
  321. struct sysv_score * scores, int nscores)
  322. {
  323. BEGIN_PROFILE_INTERVAL();
  324. struct shim_ipc_msg * msg =
  325. create_ipc_msg_on_stack(IPC_SYSV_MSGMOV,
  326. sizeof(struct shim_ipc_sysv_msgmov) +
  327. sizeof(struct sysv_score) * nscores,
  328. dest);
  329. struct shim_ipc_sysv_msgmov * msgin =
  330. (struct shim_ipc_sysv_msgmov *) &msg->msg;
  331. msgin->msgid = msgid;
  332. msgin->lease = lease;
  333. msgin->nscores = nscores;
  334. if (nscores)
  335. memcpy(msgin->scores, scores, sizeof(struct sysv_score) * nscores);
  336. debug("ipc send to %u: IPC_SYSV_MSGMOV(%d)\n", dest, msgid);
  337. int ret = send_ipc_message(msg, port);
  338. SAVE_PROFILE_INTERVAL(ipc_sysv_msgmov_send);
  339. return ret;
  340. }
  341. int ipc_sysv_msgmov_callback (IPC_CALLBACK_ARGS)
  342. {
  343. __UNUSED(port);
  344. BEGIN_PROFILE_INTERVAL();
  345. int ret = 0;
  346. struct shim_ipc_sysv_msgmov * msgin =
  347. (struct shim_ipc_sysv_msgmov *) &msg->msg;
  348. debug("ipc callback from %u: IPC_SYSV_MSGMOV(%d)\n", msg->src,
  349. msgin->msgid);
  350. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->msgid);
  351. if (!msgq) {
  352. ret = -ENOENT;
  353. goto out;
  354. }
  355. struct shim_handle * hdl = container_of(msgq, struct shim_handle,
  356. info.msg);
  357. lock(&hdl->lock);
  358. int nscores = (msgin->nscores > MAX_SYSV_CLIENTS) ?
  359. MAX_SYSV_CLIENTS : msgin->nscores;
  360. if (nscores)
  361. memcpy(msgq->scores, msgin->scores, nscores);
  362. if (nscores < MAX_SYSV_CLIENTS)
  363. memset(msgq->scores + nscores, 0,
  364. sizeof(struct sysv_score) * (MAX_SYSV_CLIENTS - nscores));
  365. unlock(&hdl->lock);
  366. ret = recover_msg_ownership(msgq);
  367. struct shim_ipc_info * info;
  368. if (!create_ipc_location(&info)) {
  369. add_sysv_subrange(msgin->msgid, info->vmid, qstrgetstr(&info->uri),
  370. &msgin->lease);
  371. put_ipc_info(info);
  372. }
  373. put_msg_handle(msgq);
  374. out:
  375. SAVE_PROFILE_INTERVAL(ipc_sysv_msgmov_callback);
  376. return ret;
  377. }
  378. DEFINE_PROFILE_INTERVAL(ipc_sysv_semop_send, ipc);
  379. DEFINE_PROFILE_INTERVAL(ipc_sysv_semop_callback, ipc);
  380. int ipc_sysv_semop_send (IDTYPE semid, struct sembuf * sops, int nsops,
  381. unsigned long timeout, unsigned long * seq)
  382. {
  383. BEGIN_PROFILE_INTERVAL();
  384. IDTYPE owner;
  385. struct shim_ipc_port * port = NULL;
  386. int ret = 0;
  387. bool waitforreply = false;
  388. for (int i = 0 ; i < nsops ; i++)
  389. if (sops[i].sem_op <= 0) {
  390. waitforreply = true;
  391. break;
  392. }
  393. if ((ret = connect_owner(semid, &port, &owner)) < 0)
  394. goto out;
  395. if (owner == cur_process.vmid) {
  396. ret = -EAGAIN;
  397. goto out;
  398. }
  399. assert(port);
  400. if (!waitforreply) {
  401. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  402. IPC_SYSV_SEMOP,
  403. sizeof(struct shim_ipc_sysv_semop) +
  404. sizeof(struct sembuf) * nsops,
  405. owner);
  406. struct shim_ipc_sysv_semop * msgin =
  407. (struct shim_ipc_sysv_semop *) &msg->msg;
  408. msgin->semid = semid;
  409. msgin->timeout = timeout;
  410. msgin->nsops = nsops;
  411. memcpy(msgin->sops, sops, sizeof(struct sembuf) * nsops);
  412. msg->seq = *seq;
  413. debug("ipc send to %u: IPC_SYSV_SEMOP(%u, %ld, %u)\n", owner, semid,
  414. timeout, nsops);
  415. ret = send_ipc_message(msg, port);
  416. put_ipc_port(port);
  417. goto out;
  418. }
  419. struct shim_ipc_msg_obj * msg = create_ipc_msg_duplex_on_stack(
  420. IPC_SYSV_SEMOP,
  421. sizeof(struct shim_ipc_sysv_semop) +
  422. sizeof(struct sembuf) * nsops,
  423. owner);
  424. struct shim_ipc_sysv_semop * msgin =
  425. (struct shim_ipc_sysv_semop *) &msg->msg.msg;
  426. msgin->semid = semid;
  427. msgin->timeout = timeout;
  428. msgin->nsops = nsops;
  429. memcpy(msgin->sops, sops, sizeof(struct sembuf) * nsops);
  430. msg->msg.seq = *seq;
  431. debug("ipc send to %u: IPC_SYSV_SEMOP(%u, %ld, %u)\n", owner, semid,
  432. timeout, nsops);
  433. ret = do_ipc_duplex(msg, port, seq, NULL);
  434. put_ipc_port(port);
  435. out:
  436. SAVE_PROFILE_INTERVAL(ipc_sysv_semop_send);
  437. return ret;
  438. }
  439. int ipc_sysv_semop_callback (IPC_CALLBACK_ARGS)
  440. {
  441. BEGIN_PROFILE_INTERVAL();
  442. int ret = 0;
  443. struct shim_ipc_sysv_semop * msgin =
  444. (struct shim_ipc_sysv_semop *) &msg->msg;
  445. debug("ipc callback from %u: IPC_SYSV_SEMOP(%u, %ld, %u)\n", msg->src,
  446. msgin->semid, msgin->timeout, msgin->nsops);
  447. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  448. if (!sem) {
  449. ret = -ENOENT;
  450. goto out;
  451. }
  452. struct sysv_client client;
  453. client.port = port;
  454. client.vmid = msg->src;
  455. client.seq = msg->seq;
  456. ret = submit_sysv_sem(sem, msgin->sops, msgin->nsops, msgin->timeout,
  457. &client);
  458. put_sem_handle(sem);
  459. out:
  460. SAVE_PROFILE_INTERVAL(ipc_sysv_semop_callback);
  461. return ret;
  462. }
  463. DEFINE_PROFILE_INTERVAL(ipc_sysv_semctl_send, ipc);
  464. DEFINE_PROFILE_INTERVAL(ipc_sysv_semctl_callback, ipc);
  465. int ipc_sysv_semctl_send (IDTYPE semid, int semnum, int cmd, void * vals,
  466. size_t valsize)
  467. {
  468. BEGIN_PROFILE_INTERVAL();
  469. IDTYPE owner;
  470. struct shim_ipc_port * port = NULL;
  471. int ret = 0;
  472. if ((ret = connect_owner(semid, &port, &owner)) < 0)
  473. goto out;
  474. int ctlvalsize = (cmd == SETALL || cmd == SETVAL) ? valsize : 0;
  475. struct shim_ipc_msg_obj * msg = create_ipc_msg_duplex_on_stack(
  476. IPC_SYSV_SEMCTL,
  477. sizeof(struct shim_ipc_sysv_semctl) +
  478. ctlvalsize,
  479. owner);
  480. struct shim_ipc_sysv_semctl * msgin =
  481. (struct shim_ipc_sysv_semctl *) &msg->msg.msg;
  482. msgin->semid = semid;
  483. msgin->semnum = semnum;
  484. msgin->cmd = cmd;
  485. msgin->valsize = ctlvalsize;
  486. if (ctlvalsize)
  487. memcpy(msgin->vals, vals, ctlvalsize);
  488. debug("ipc send to %u: IPC_SYSV_SEMCTL(%u, %d, %d)\n", owner, semid,
  489. semnum, cmd);
  490. ret = do_ipc_duplex(msg, port, NULL, vals);
  491. put_ipc_port(port);
  492. out:
  493. SAVE_PROFILE_INTERVAL(ipc_sysv_semctl_send);
  494. return ret;
  495. }
  496. int ipc_sysv_semctl_callback (IPC_CALLBACK_ARGS)
  497. {
  498. BEGIN_PROFILE_INTERVAL();
  499. int ret = 0;
  500. struct shim_ipc_sysv_semctl * msgin =
  501. (struct shim_ipc_sysv_semctl *) &msg->msg;
  502. debug("ipc callback from %u: IPC_SYSV_SEMCTL(%u, %d, %d)\n", msg->src,
  503. msgin->semid, msgin->semnum, msgin->cmd);
  504. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  505. if (!sem) {
  506. ret = -ENOENT;
  507. goto out;
  508. }
  509. void * vals = NULL;
  510. size_t valsize;
  511. switch(msgin->cmd) {
  512. case GETALL: {
  513. unsigned short * allsems = __alloca(sizeof(unsigned short) *
  514. sem->nsems);
  515. for (int i = 0 ; i < sem->nsems ; i++)
  516. allsems[i] = sem->sems[i].val;
  517. vals = allsems;
  518. valsize = sizeof(unsigned short) * sem->nsems;
  519. goto semret;
  520. }
  521. case GETNCNT:
  522. vals = &sem->sems[msgin->semnum].ncnt;
  523. valsize = sizeof(unsigned short);
  524. goto semret;
  525. case GETPID:
  526. vals = &sem->sems[msgin->semnum].pid;
  527. valsize = sizeof(IDTYPE);
  528. goto semret;
  529. case GETVAL:
  530. vals = &sem->sems[msgin->semnum].val;
  531. valsize = sizeof(unsigned short);
  532. goto semret;
  533. case GETZCNT:
  534. vals = &sem->sems[msgin->semnum].zcnt;
  535. valsize = sizeof(unsigned short);
  536. break;
  537. case SETALL: {
  538. if (msgin->valsize != sizeof(unsigned short) * sem->nsems) {
  539. ret = -EINVAL;
  540. break;
  541. }
  542. unsigned short * vals = (void *) msgin->vals;
  543. for (int i = 0 ; i < sem->nsems ; i++)
  544. sem->sems[i].val = vals[i];
  545. ret = RESPONSE_CALLBACK;
  546. break;
  547. }
  548. case SETVAL: {
  549. ret = -EINVAL;
  550. if (msgin->valsize != sizeof(unsigned short))
  551. break;
  552. if (msgin->semnum >= sem->nsems)
  553. break;
  554. sem->sems[msgin->semnum].val = *((int *) msgin->vals);
  555. ret = RESPONSE_CALLBACK;
  556. break;
  557. }
  558. default:
  559. ret = -ENOSYS;
  560. break;
  561. }
  562. put_sem_handle(sem);
  563. goto out;
  564. semret:
  565. ret = ipc_sysv_semret_send(port, msg->src, vals, valsize,
  566. msg->seq);
  567. out:
  568. SAVE_PROFILE_INTERVAL(ipc_sysv_semctl_callback);
  569. return ret;
  570. }
  571. DEFINE_PROFILE_INTERVAL(ipc_sysv_semret_send, ipc);
  572. DEFINE_PROFILE_INTERVAL(ipc_sysv_semret_callback, ipc);
  573. int ipc_sysv_semret_send (struct shim_ipc_port * port, IDTYPE dest, void * vals,
  574. size_t valsize, unsigned long seq)
  575. {
  576. BEGIN_PROFILE_INTERVAL();
  577. int ret = 0;
  578. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  579. IPC_SYSV_SEMRET,
  580. sizeof(struct shim_ipc_sysv_semret) +
  581. valsize,
  582. dest);
  583. struct shim_ipc_sysv_semret * msgin =
  584. (struct shim_ipc_sysv_semret *) &msg->msg;
  585. msgin->valsize = valsize;
  586. memcpy(msgin->vals, vals, valsize);
  587. msg->seq = seq;
  588. debug("ipc send to %u: IPC_SYSV_SEMRET\n", dest);
  589. ret = send_ipc_message(msg, port);
  590. SAVE_PROFILE_INTERVAL(ipc_sysv_semret_send);
  591. return ret;
  592. }
  593. int ipc_sysv_semret_callback (IPC_CALLBACK_ARGS)
  594. {
  595. BEGIN_PROFILE_INTERVAL();
  596. struct shim_ipc_sysv_semret * semret =
  597. (struct shim_ipc_sysv_semret *) &msg->msg;
  598. debug("ipc callback from %u: IPC_SYSV_SEMRET\n", msg->src);
  599. struct shim_ipc_msg_obj * obj = find_ipc_msg_duplex(port, msg->seq);
  600. if (obj) {
  601. struct shim_ipc_sysv_semctl * semctl =
  602. (struct shim_ipc_sysv_semctl *) &obj->msg.msg;
  603. void * vals = obj->private;
  604. if (vals) {
  605. switch(semctl->cmd) {
  606. case GETALL:
  607. case GETNCNT:
  608. case GETPID:
  609. case GETVAL:
  610. case GETZCNT: {
  611. size_t retvalsize = semret->valsize;
  612. if (retvalsize > semctl->valsize)
  613. retvalsize = semctl->valsize;
  614. memcpy(vals, semret->vals, retvalsize);
  615. break;
  616. }
  617. }
  618. }
  619. if (obj->thread)
  620. thread_wakeup(obj->thread);
  621. }
  622. SAVE_PROFILE_INTERVAL(ipc_sysv_semret_callback);
  623. return 0;
  624. }
  625. DEFINE_PROFILE_INTERVAL(ipc_sysv_semmov_send, ipc);
  626. DEFINE_PROFILE_INTERVAL(ipc_sysv_semmov_callback, ipc);
  627. int ipc_sysv_semmov_send (struct shim_ipc_port * port, IDTYPE dest,
  628. IDTYPE semid, LEASETYPE lease,
  629. struct sem_backup * sems, int nsems,
  630. struct sem_client_backup * srcs, int nsrcs,
  631. struct sysv_score * scores, int nscores)
  632. {
  633. BEGIN_PROFILE_INTERVAL();
  634. struct shim_ipc_msg * msg =
  635. create_ipc_msg_on_stack(IPC_SYSV_SEMMOV,
  636. sizeof(struct shim_ipc_sysv_semmov) +
  637. sizeof(struct sem_backup) * nsems +
  638. sizeof(struct sem_client_backup) * nsrcs +
  639. sizeof(struct sysv_score) * nscores,
  640. dest);
  641. struct shim_ipc_sysv_semmov * msgin =
  642. (struct shim_ipc_sysv_semmov *) &msg->msg;
  643. msgin->semid = semid;
  644. msgin->lease = lease;
  645. msgin->nsems = nsems;
  646. msgin->nsrcs = nsrcs;
  647. msgin->nscores = nscores;
  648. memcpy(&msgin->sems, sems, sizeof(struct sem_backup) * nsems);
  649. memcpy((void *) msgin->sems + sizeof(struct sem_backup) * nsems,
  650. srcs, sizeof(struct sem_client_backup) * nsrcs);
  651. memcpy((void *) msgin->sems + sizeof(struct sem_backup) * nsems +
  652. sizeof(struct sem_client_backup) * nsrcs,
  653. scores, sizeof(struct sysv_score) * nscores);
  654. debug("ipc send to : IPC_SYSV_SEMMOV(%d)\n", semid);
  655. int ret = send_ipc_message(msg, port);
  656. SAVE_PROFILE_INTERVAL(ipc_sysv_semmov_send);
  657. return ret;
  658. }
  659. int ipc_sysv_semmov_callback (IPC_CALLBACK_ARGS)
  660. {
  661. __UNUSED(port);
  662. BEGIN_PROFILE_INTERVAL();
  663. int ret = 0;
  664. struct shim_ipc_sysv_semmov * msgin =
  665. (struct shim_ipc_sysv_semmov *) &msg->msg;
  666. debug("ipc callback from %u: IPC_SYSV_SEMMOV(%d)\n", msg->src,
  667. msgin->semid);
  668. struct sem_backup * sems = msgin->sems;
  669. struct sem_client_backup * clients =
  670. (struct sem_client_backup *) (sems + msgin->nsems);
  671. struct sysv_score * scores =
  672. (struct sysv_score *) (clients + msgin->nsrcs);
  673. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  674. if (!sem) {
  675. ret = -ENOENT;
  676. goto out;
  677. }
  678. struct shim_handle * hdl = container_of(sem, struct shim_handle,
  679. info.sem);
  680. lock(&hdl->lock);
  681. int nscores = (msgin->nscores > MAX_SYSV_CLIENTS) ?
  682. MAX_SYSV_CLIENTS : msgin->nscores;
  683. if (nscores)
  684. memcpy(sem->scores, scores, nscores);
  685. if (nscores < MAX_SYSV_CLIENTS)
  686. memset(sem->scores + nscores, 0,
  687. sizeof(struct sysv_score) * (MAX_SYSV_CLIENTS - nscores));
  688. unlock(&hdl->lock);
  689. ret = recover_sem_ownership(sem, sems, msgin->nsems, clients,
  690. msgin->nsrcs);
  691. struct shim_ipc_info * info;
  692. if (!create_ipc_location(&info)) {
  693. add_sysv_subrange(msgin->semid, info->vmid, qstrgetstr(&info->uri),
  694. &msgin->lease);
  695. put_ipc_info(info);
  696. }
  697. put_sem_handle(sem);
  698. out:
  699. SAVE_PROFILE_INTERVAL(ipc_sysv_semmov_callback);
  700. return ret;
  701. }
  702. #ifdef USE_SHARED_SEMAPHORE
  703. DEFINE_PROFILE_INTERVAL(ipc_sysv_semquery_send, ipc);
  704. DEFINE_PROFILE_INTERVAL(ipc_sysv_semquery_callback, ipc);
  705. int ipc_sysv_semquery_send (IDTYPE semid, int * nsems,
  706. PAL_NUM ** host_sem_ids)
  707. {
  708. BEGIN_PROFILE_INTERVAL();
  709. int ret = 0;
  710. IDTYPE dest;
  711. struct shim_ipc_port * port = NULL;
  712. if ((ret = connect_owner(semid, &port, &dest)) < 0)
  713. goto out;
  714. if (dest == cur_process.vmid) {
  715. ret = -EAGAIN;
  716. goto out;
  717. }
  718. assert(port);
  719. struct shim_ipc_msg_obj * msg = create_ipc_msg_duplex_on_stack(
  720. IPC_SYSV_SEMQUERY,
  721. sizeof(struct shim_ipc_sysv_semquery),
  722. dest);
  723. struct shim_ipc_sysv_semquery * msgin =
  724. (struct shim_ipc_sysv_semquery *) &msg->msg.msg;
  725. msgin->semid = semid;
  726. debug("ipc send to %u: IPC_SYSV_SEMQUERY(%u)\n", dest, semid);
  727. ret = do_ipc_duplex(msg, port, NULL, host_sem_ids);
  728. put_ipc_port(port);
  729. if (ret >= 0) {
  730. *nsems = ret;
  731. ret = 0;
  732. }
  733. out:
  734. SAVE_PROFILE_INTERVAL(ipc_sysv_semquery_send);
  735. return ret;
  736. }
  737. int ipc_sysv_semquery_callback (IPC_CALLBACK_ARGS)
  738. {
  739. BEGIN_PROFILE_INTERVAL();
  740. int ret = 0;
  741. struct shim_ipc_sysv_semquery * msgin =
  742. (struct shim_ipc_sysv_semquery *) &msg->msg;
  743. debug("ipc callback from %u: IPC_SYSV_SEMQUERY(%u)\n", msg->src,
  744. msgin->semid);
  745. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  746. if (!sem) {
  747. ret = -ENOENT;
  748. goto out;
  749. }
  750. ret = send_sem_host_ids(sem, port, msg->src, msg->seq);
  751. put_sem_handle(sem);
  752. out:
  753. SAVE_PROFILE_INTERVAL(ipc_sysv_semreply_callback);
  754. return ret;
  755. }
  756. DEFINE_PROFILE_INTERVAL(ipc_sysv_semreply_send, ipc);
  757. DEFINE_PROFILE_INTERVAL(ipc_sysv_semreply_callback, ipc);
  758. int ipc_sysv_semreply_send (struct shim_ipc_port * port, IDTYPE dest,
  759. IDTYPE semid, int nsems, PAL_NUM * host_sem_ids,
  760. unsigned long seq)
  761. {
  762. BEGIN_PROFILE_INTERVAL();
  763. int ret = 0;
  764. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  765. IPC_SYSV_SEMREPLY,
  766. sizeof(struct shim_ipc_sysv_semreply)
  767. + sizeof(PAL_NUM) * nsems,
  768. dest);
  769. struct shim_ipc_sysv_semreply * msgin =
  770. (struct shim_ipc_sysv_semreply *) &msg->msg;
  771. msgin->semid = semid;
  772. msgin->nsems = nsems;
  773. if (nsems)
  774. memcpy(msgin->host_sem_ids, host_sem_ids, sizeof(PAL_NUM) * nsems);
  775. msg->seq = seq;
  776. debug("ipc send to %u: IPC_SYSV_SEMREPLY(%u, %d)\n", dest, semid, nsems);
  777. ret = send_ipc_message(msg, port);
  778. SAVE_PROFILE_INTERVAL(ipc_sysv_semreply_send);
  779. return ret;
  780. }
  781. int ipc_sysv_semreply_callback (IPC_CALLBACK_ARGS)
  782. {
  783. BEGIN_PROFILE_INTERVAL();
  784. int ret = 0;
  785. struct shim_ipc_sysv_semreply * msgin =
  786. (struct shim_ipc_sysv_semreply *) &msg->msg;
  787. debug("ipc callback from %u: IPC_SYSV_SEMREPLY(%u, %d)\n", msg->src,
  788. msgin->semid, msgin->nsems);
  789. struct shim_ipc_msg_obj * obj = find_ipc_msg_duplex(port, msg->seq);
  790. if (!obj)
  791. goto out;
  792. PAL_NUM ** semids = obj->private;
  793. if (semids)
  794. *semids = malloc_copy(msgin->host_sem_ids,
  795. sizeof(PAL_NUM) * msgin->nsems);
  796. obj->retval = msgin->nsems;
  797. if (obj->thread)
  798. thread_wakeup(obj->thread);
  799. out:
  800. SAVE_PROFILE_INTERVAL(ipc_sysv_semreply_callback);
  801. return ret;
  802. }
  803. #endif /* USE_SHARED_SEMAPHORE */
  804. int __balance_sysv_score (struct sysv_balance_policy * policy,
  805. struct shim_handle * hdl,
  806. struct sysv_score * scores, int nscores,
  807. struct sysv_client * src, long score)
  808. {
  809. struct sysv_score * s = scores;
  810. struct sysv_score * last = scores + nscores;
  811. for ( ; s < last && !s->vmid ; s++);
  812. struct sysv_score * free = s > scores ? scores : NULL;
  813. struct sysv_score * highest = s < last ? s : NULL;
  814. struct sysv_score * lowest = highest;
  815. struct sysv_score * owner = NULL;
  816. struct sysv_score * chosen = NULL;
  817. for ( ; s < last ; s++) {
  818. if (!s->vmid) {
  819. if (!free)
  820. free = s;
  821. continue;
  822. }
  823. if (s->score >= highest->score)
  824. highest = s;
  825. if (s->score < lowest->score)
  826. lowest = s;
  827. if (src) {
  828. if (s->vmid == cur_process.vmid)
  829. owner = s;
  830. if (s->vmid == src->vmid) {
  831. chosen = s;
  832. continue;
  833. }
  834. } else {
  835. if (s->vmid == cur_process.vmid) {
  836. owner = chosen = s;
  837. continue;
  838. }
  839. }
  840. s->score = (s->score >= policy->score_decay) ?
  841. s->score - policy->score_decay : 0;
  842. debug("balance: %u => %ld\n", s->vmid, s->score);
  843. }
  844. if (!chosen) {
  845. chosen = free ? : lowest;
  846. chosen->vmid = src ? src->vmid : cur_process.vmid;
  847. chosen->score = 0;
  848. }
  849. chosen->score += score;
  850. if (chosen->score > policy->score_max)
  851. chosen->score = policy->score_max;
  852. debug("balance: %u => %ld\n", chosen->vmid, chosen->score);
  853. if (!src || chosen != highest ||
  854. chosen->score < (owner ? owner->score : 0) + policy->balance_threshold)
  855. return 0;
  856. return policy->migrate(hdl, src);
  857. }