shim_ipc_sysv.c 31 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043
  1. /* -*- mode:c; c-file-style:"k&r"; c-basic-offset: 4; tab-width:4; indent-tabs-mode:nil; mode:auto-fill; fill-column:78; -*- */
  2. /* vim: set ts=4 sw=4 et tw=78 fo=cqt wm=0: */
  3. /* Copyright (C) 2014 Stony Brook University
  4. This file is part of Graphene Library OS.
  5. Graphene Library OS is free software: you can redistribute it and/or
  6. modify it under the terms of the GNU Lesser General Public License
  7. as published by the Free Software Foundation, either version 3 of the
  8. License, or (at your option) any later version.
  9. Graphene Library OS is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU Lesser General Public License for more details.
  13. You should have received a copy of the GNU Lesser General Public License
  14. along with this program. If not, see <http://www.gnu.org/licenses/>. */
  15. /*
  16. * shim_ipc_sysv.c
  17. *
  18. * This file contains functions and callbacks to handle IPC of SYSV namespace.
  19. */
  20. #include <shim_internal.h>
  21. #include <shim_thread.h>
  22. #include <shim_ipc.h>
  23. #include <shim_checkpoint.h>
  24. #include <shim_sysv.h>
  25. #include <pal.h>
  26. #include <pal_error.h>
  27. #include <errno.h>
  /* Numeric parameters of the SYSV namespace.
   * NOTE(review): presumably consumed by shim_ipc_nsimpl.h as the ID range
   * size and the lease duration - confirm against that header. */
  28. #define SYSV_RANGE_SIZE 128
  29. #define SYSV_LEASE_TIME 1000
  /* Key helpers: KEY_HASH yields the key field itself, KEY_COMP evaluates to
   * non-zero when either the key or the type differs, and KEY_COPY copies
   * both fields from k2 into k1. */
  30. #define KEY_HASH(k) ((k)->key)
  31. #define KEY_COMP(k1, k2) \
  32. ((k1)->key != (k2)->key || (k1)->type != (k2)->type)
  33. #define KEY_COPY(k1, k2) \
  34. do { (k1)->key = (k2)->key; (k1)->type = (k2)->type; } while (0)
  /* Namespace name, its upper-case form and the key type, defined right
   * before the implementation header is included.
   * NOTE(review): looks like a template instantiation of the generic
   * namespace code - confirm in shim_ipc_nsimpl.h. */
  35. #define NS sysv
  36. #define NS_CAP SYSV
  37. #define NS_KEY struct sysv_key
  38. #define INCLUDE_IPC_NSIMPL
  39. #include "shim_ipc_nsimpl.h"
  /*
   * Initialize the SYSV namespace by calling init_namespace().
   *
   * Returns 0 unconditionally.
   */
  int init_ns_sysv (void)
  {
      init_namespace();

      return 0;
  }
  45. DEFINE_PROFILE_INTERVAL(ipc_sysv_delres_send, ipc);
  46. DEFINE_PROFILE_INTERVAL(ipc_sysv_delres_callback, ipc);
  47. int ipc_sysv_delres_send (struct shim_ipc_port * port, IDTYPE dest,
  48. IDTYPE resid, enum sysv_type type)
  49. {
  50. BEGIN_PROFILE_INTERVAL();
  51. int ret = 0;
  52. bool owned = false;
  53. if (!port) {
  54. if ((ret = connect_owner(resid, &port, &dest)) < 0)
  55. goto out;
  56. owned = true;
  57. }
  58. if (!owned) {
  59. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  60. IPC_SYSV_DELRES,
  61. sizeof(struct shim_ipc_sysv_delres),
  62. dest);
  63. struct shim_ipc_sysv_delres * msgin = (struct shim_ipc_sysv_delres *)
  64. &msg->msg;
  65. msgin->resid = resid;
  66. msgin->type = type;
  67. debug("ipc send to %u: IPC_SYSV_DELRES(%u, %s)\n", dest, resid,
  68. SYSV_TYPE_STR(type));
  69. ret = send_ipc_message(msg, port);
  70. goto out;
  71. }
  72. struct shim_ipc_msg_obj * msg = create_ipc_msg_duplex_on_stack(
  73. IPC_SYSV_DELRES,
  74. sizeof(struct shim_ipc_sysv_delres),
  75. dest);
  76. struct shim_ipc_sysv_delres * msgin = (struct shim_ipc_sysv_delres *)
  77. &msg->msg.msg;
  78. msgin->resid = resid;
  79. msgin->type = type;
  80. debug("ipc send to %u: IPC_SYSV_DELRES(%u, %s)\n", dest, resid,
  81. SYSV_TYPE_STR(type));
  82. ret = do_ipc_duplex(msg, port, NULL, NULL);
  83. put_ipc_port(port);
  84. out:
  85. SAVE_PROFILE_INTERVAL(ipc_sysv_delres_send);
  86. return ret;
  87. }
  88. int ipc_sysv_delres_callback (IPC_CALLBACK_ARGS)
  89. {
  90. BEGIN_PROFILE_INTERVAL();
  91. int ret = 0;
  92. struct shim_ipc_sysv_delres * msgin =
  93. (struct shim_ipc_sysv_delres *) &msg->msg;
  94. debug("ipc callback from %u: IPC_SYSV_DELRES(%u, %s)\n", msg->src,
  95. msgin->resid, SYSV_TYPE_STR(msgin->type));
  96. bool owned = false;
  97. ret = -ENOENT;
  98. switch(msgin->type) {
  99. case SYSV_MSGQ: {
  100. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->resid);
  101. if (!msgq)
  102. goto out;
  103. owned = msgq->owned;
  104. ret = del_msg_handle(msgq);
  105. break;
  106. }
  107. case SYSV_SEM: {
  108. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->resid);
  109. if (!sem)
  110. goto out;
  111. owned = sem->owned;
  112. ret = del_sem_handle(sem);
  113. break;
  114. }
  115. default:
  116. ret = -ENOSYS;
  117. break;
  118. }
  119. if (!ret)
  120. ret = owned ? RESPONSE_CALLBACK : 0;
  121. out:
  122. SAVE_PROFILE_INTERVAL(ipc_sysv_delres_callback);
  123. return ret;
  124. }
  125. DEFINE_PROFILE_INTERVAL(ipc_sysv_movres_send, ipc);
  126. DEFINE_PROFILE_INTERVAL(ipc_sysv_movres_callback, ipc);
  127. int ipc_sysv_movres_send (struct sysv_client * client, IDTYPE owner,
  128. const char * uri, LEASETYPE lease, IDTYPE resid,
  129. enum sysv_type type)
  130. {
  131. BEGIN_PROFILE_INTERVAL();
  132. int ret = 0;
  133. int len = strlen(uri);
  134. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  135. IPC_SYSV_MOVRES,
  136. sizeof(struct shim_ipc_sysv_movres) +
  137. len, client->vmid);
  138. struct shim_ipc_sysv_movres * msgin = (struct shim_ipc_sysv_movres *)
  139. &msg->msg;
  140. msgin->resid = resid;
  141. msgin->type = type;
  142. msgin->owner = owner;
  143. msgin->lease = lease;
  144. memcpy(msgin->uri, uri, len + 1);
  145. msg->seq = client->seq;
  146. debug("ipc send to %u: IPC_SYSV_MOVRES(%u, %s, %u, %s)\n", client->vmid,
  147. resid, SYSV_TYPE_STR(type), owner, uri);
  148. ret = send_ipc_message(msg, client->port);
  149. SAVE_PROFILE_INTERVAL(ipc_sysv_movres_send);
  150. return ret;
  151. }
  152. int ipc_sysv_movres_callback (IPC_CALLBACK_ARGS)
  153. {
  154. BEGIN_PROFILE_INTERVAL();
  155. int ret = 0;
  156. struct shim_ipc_sysv_movres * msgin =
  157. (struct shim_ipc_sysv_movres *) &msg->msg;
  158. debug("ipc callback from %u: IPC_SYSV_MOVRES(%u, %s, %u, %s)\n", msg->src,
  159. msgin->resid, SYSV_TYPE_STR(msgin->type), msgin->owner, msgin->uri);
  160. struct shim_ipc_msg_obj * obj = find_ipc_msg_duplex(port, msg->seq);
  161. if (!obj)
  162. goto out;
  163. switch(msgin->type) {
  164. case SYSV_MSGQ:
  165. case SYSV_SEM:
  166. obj->retval = -EAGAIN;
  167. break;
  168. default:
  169. ret = -ENOSYS;
  170. goto out;
  171. }
  172. add_sysv_subrange(msgin->resid, msgin->owner, msgin->uri, &msgin->lease);
  173. if (obj->thread)
  174. thread_wakeup(obj->thread);
  175. out:
  176. SAVE_PROFILE_INTERVAL(ipc_sysv_movres_callback);
  177. return ret;
  178. }
  179. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgsnd_send, ipc);
  180. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgsnd_callback, ipc);
  181. int ipc_sysv_msgsnd_send (struct shim_ipc_port * port, IDTYPE dest,
  182. IDTYPE msgid, long msgtype,
  183. const void * buf, size_t size, unsigned long seq)
  184. {
  185. BEGIN_PROFILE_INTERVAL();
  186. int ret = 0;
  187. bool owned = true;
  188. if (!dest) {
  189. if ((ret = connect_owner(msgid, &port, &dest)) < 0)
  190. goto out;
  191. owned = false;
  192. }
  193. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  194. IPC_SYSV_MSGSND,
  195. sizeof(struct shim_ipc_sysv_msgsnd) +
  196. size, dest);
  197. struct shim_ipc_sysv_msgsnd * msgin =
  198. (struct shim_ipc_sysv_msgsnd *) &msg->msg;
  199. msgin->msgid = msgid;
  200. msgin->msgtype = msgtype;
  201. memcpy(msgin->msg, buf, size);
  202. msg->seq = seq;
  203. debug("ipc send to %u: IPC_SYSV_MSGSND(%u, %ld)\n", dest,
  204. msgid, msgtype);
  205. ret = send_ipc_message(msg, port);
  206. if (!owned)
  207. put_ipc_port(port);
  208. out:
  209. SAVE_PROFILE_INTERVAL(ipc_sysv_msgsnd_send);
  210. return ret;
  211. }
  212. int ipc_sysv_msgsnd_callback (IPC_CALLBACK_ARGS)
  213. {
  214. BEGIN_PROFILE_INTERVAL();
  215. int ret = 0;
  216. struct shim_ipc_sysv_msgsnd * msgin =
  217. (struct shim_ipc_sysv_msgsnd *) &msg->msg;
  218. debug("ipc callback from %u: IPC_SYSV_MSGSND(%u, %ld)\n", msg->src,
  219. msgin->msgid, msgin->msgtype);
  220. size_t size = msg->size - sizeof(*msg) - sizeof(*msgin);
  221. if (msg->seq) {
  222. struct shim_ipc_msg_obj * obj = find_ipc_msg_duplex(port, msg->seq);
  223. void * priv = obj ? obj->private : NULL;
  224. if (priv) {
  225. struct shim_ipc_sysv_msgrcv * rcv =
  226. (struct shim_ipc_sysv_msgrcv *) obj->msg.msg;
  227. if (size > rcv->size)
  228. size = rcv->size;
  229. memcpy(priv, msgin->msg, size);
  230. obj->retval = size;
  231. if (obj->thread)
  232. thread_wakeup(obj->thread);
  233. goto out;
  234. }
  235. }
  236. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->msgid);
  237. if (!msgq) {
  238. ret = -ENOENT;
  239. goto out;
  240. }
  241. if (msg->seq) {
  242. ret = add_sysv_msg(msgq, msgin->msgtype, size, msgin->msg, NULL);
  243. } else {
  244. struct sysv_client src;
  245. src.port = port;
  246. src.vmid = msg->src;
  247. src.seq = msg->seq;
  248. ret = add_sysv_msg(msgq, msgin->msgtype, size, msgin->msg, &src);
  249. }
  250. out:
  251. SAVE_PROFILE_INTERVAL(ipc_sysv_msgsnd_callback);
  252. return ret;
  253. }
  254. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgrcv_send, ipc);
  255. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgrcv_callback, ipc);
  256. int ipc_sysv_msgrcv_send (IDTYPE msgid, long msgtype, int flags, void * buf,
  257. size_t size)
  258. {
  259. BEGIN_PROFILE_INTERVAL();
  260. IDTYPE owner;
  261. struct shim_ipc_port * port = NULL;
  262. int ret = 0;
  263. if ((ret = connect_owner(msgid, &port, &owner)) < 0)
  264. goto out;
  265. if (owner == cur_process.vmid) {
  266. ret = -EAGAIN;
  267. goto out;
  268. }
  269. assert(port);
  270. struct shim_ipc_msg_obj * msg = create_ipc_msg_duplex_on_stack(
  271. IPC_SYSV_MSGRCV,
  272. sizeof(struct shim_ipc_sysv_msgrcv),
  273. true);
  274. struct shim_ipc_sysv_msgrcv * msgin =
  275. (struct shim_ipc_sysv_msgrcv *) &msg->msg.msg;
  276. msgin->msgid = msgid;
  277. msgin->msgtype = msgtype;
  278. msgin->size = size;
  279. msgin->flags = flags;
  280. debug("ipc send to %u: IPC_SYSV_MSGRCV(%u, %ld)\n", owner,
  281. msgid, msgtype);
  282. ret = do_ipc_duplex(msg, port, NULL, buf);
  283. put_ipc_port(port);
  284. out:
  285. SAVE_PROFILE_INTERVAL(ipc_sysv_msgrcv_send);
  286. return ret;
  287. }
  288. int ipc_sysv_msgrcv_callback (IPC_CALLBACK_ARGS)
  289. {
  290. BEGIN_PROFILE_INTERVAL();
  291. int ret = 0;
  292. struct shim_ipc_sysv_msgrcv * msgin =
  293. (struct shim_ipc_sysv_msgrcv *) &msg->msg;
  294. debug("ipc callback from %u: IPC_SYSV_MSGRCV(%u, %ld)\n", msg->src,
  295. msgin->msgid, msgin->msgtype);
  296. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->msgid);
  297. if (!msgq) {
  298. ret = -ENOENT;
  299. goto out;
  300. }
  301. void * buf = __alloca(msgin->size);
  302. struct sysv_client src;
  303. src.port = port;
  304. src.vmid = msg->src;
  305. src.seq = msg->seq;
  306. ret = get_sysv_msg(msgq, msgin->msgtype, msgin->size, buf, msgin->flags,
  307. &src);
  308. if (ret > 0) {
  309. size_t size = ret;
  310. ret = ipc_sysv_msgsnd_send(port, msg->src, msgin->msgid, msgin->msgtype,
  311. buf, size, msg->seq);
  312. }
  313. put_msg_handle(msgq);
  314. out:
  315. SAVE_PROFILE_INTERVAL(ipc_sysv_msgrcv_callback);
  316. return ret;
  317. }
  318. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgmov_send, ipc);
  319. DEFINE_PROFILE_INTERVAL(ipc_sysv_msgmov_callback, ipc);
  320. int ipc_sysv_msgmov_send (struct shim_ipc_port * port, IDTYPE dest,
  321. IDTYPE msgid, LEASETYPE lease,
  322. struct sysv_score * scores, int nscores)
  323. {
  324. BEGIN_PROFILE_INTERVAL();
  325. struct shim_ipc_msg * msg =
  326. create_ipc_msg_on_stack(IPC_SYSV_MSGMOV,
  327. sizeof(struct shim_ipc_sysv_msgmov) +
  328. sizeof(struct sysv_score) * nscores,
  329. dest);
  330. struct shim_ipc_sysv_msgmov * msgin =
  331. (struct shim_ipc_sysv_msgmov *) &msg->msg;
  332. msgin->msgid = msgid;
  333. msgin->lease = lease;
  334. msgin->nscores = nscores;
  335. if (nscores)
  336. memcpy(msgin->scores, scores, sizeof(struct sysv_score) * nscores);
  337. debug("ipc send to %u: IPC_SYSV_MSGMOV(%ld)\n", dest, msgid);
  338. int ret = send_ipc_message(msg, port);
  339. SAVE_PROFILE_INTERVAL(ipc_sysv_msgmov_send);
  340. return ret;
  341. }
  342. int ipc_sysv_msgmov_callback (IPC_CALLBACK_ARGS)
  343. {
  344. BEGIN_PROFILE_INTERVAL();
  345. int ret = 0;
  346. struct shim_ipc_sysv_msgmov * msgin =
  347. (struct shim_ipc_sysv_msgmov *) &msg->msg;
  348. debug("ipc callback from %u: IPC_SYSV_MSGMOV(%ld)\n", msg->src,
  349. msgin->msgid);
  350. struct shim_msg_handle * msgq = get_msg_handle_by_id(msgin->msgid);
  351. if (!msgq) {
  352. ret = -ENOENT;
  353. goto out;
  354. }
  355. struct shim_handle * hdl = container_of(msgq, struct shim_handle,
  356. info.msg);
  357. lock(hdl->lock);
  358. int nscores = (msgin->nscores > MAX_SYSV_CLIENTS) ?
  359. MAX_SYSV_CLIENTS : msgin->nscores;
  360. if (nscores)
  361. memcpy(msgq->scores, msgin->scores, nscores);
  362. if (nscores < MAX_SYSV_CLIENTS)
  363. memset(msgq->scores + nscores, 0,
  364. sizeof(struct sysv_score) * (MAX_SYSV_CLIENTS - nscores));
  365. unlock(hdl->lock);
  366. ret = recover_msg_ownership(msgq);
  367. struct shim_ipc_info * info;
  368. if (!create_ipc_location(&info)) {
  369. add_sysv_subrange(msgin->msgid, info->vmid, qstrgetstr(&info->uri),
  370. &msgin->lease);
  371. put_ipc_info(info);
  372. }
  373. put_msg_handle(msgq);
  374. out:
  375. SAVE_PROFILE_INTERVAL(ipc_sysv_msgmov_callback);
  376. return ret;
  377. }
  378. DEFINE_PROFILE_INTERVAL(ipc_sysv_semop_send, ipc);
  379. DEFINE_PROFILE_INTERVAL(ipc_sysv_semop_callback, ipc);
  380. int ipc_sysv_semop_send (IDTYPE semid, struct sembuf * sops, int nsops,
  381. unsigned long timeout, unsigned long * seq)
  382. {
  383. BEGIN_PROFILE_INTERVAL();
  384. IDTYPE owner;
  385. struct shim_ipc_port * port = NULL;
  386. int ret = 0;
  387. bool waitforreply = false;
  388. for (int i = 0 ; i < nsops ; i++)
  389. if (sops[i].sem_op <= 0) {
  390. waitforreply = true;
  391. break;
  392. }
  393. if ((ret = connect_owner(semid, &port, &owner)) < 0)
  394. goto out;
  395. if (owner == cur_process.vmid) {
  396. ret = -EAGAIN;
  397. goto out;
  398. }
  399. assert(port);
  400. if (!waitforreply) {
  401. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  402. IPC_SYSV_SEMOP,
  403. sizeof(struct shim_ipc_sysv_semop) +
  404. sizeof(struct sembuf) * nsops,
  405. owner);
  406. struct shim_ipc_sysv_semop * msgin =
  407. (struct shim_ipc_sysv_semop *) &msg->msg;
  408. msgin->semid = semid;
  409. msgin->timeout = timeout;
  410. msgin->nsops = nsops;
  411. memcpy(msgin->sops, sops, sizeof(struct sembuf) * nsops);
  412. msg->seq = *seq;
  413. debug("ipc send to %u: IPC_SYSV_SEMOP(%u, %ld, %u)\n", owner, semid,
  414. timeout, nsops);
  415. ret = send_ipc_message(msg, port);
  416. put_ipc_port(port);
  417. goto out;
  418. }
  419. struct shim_ipc_msg_obj * msg = create_ipc_msg_duplex_on_stack(
  420. IPC_SYSV_SEMOP,
  421. sizeof(struct shim_ipc_sysv_semop) +
  422. sizeof(struct sembuf) * nsops,
  423. owner);
  424. struct shim_ipc_sysv_semop * msgin =
  425. (struct shim_ipc_sysv_semop *) &msg->msg.msg;
  426. msgin->semid = semid;
  427. msgin->timeout = timeout;
  428. msgin->nsops = nsops;
  429. memcpy(msgin->sops, sops, sizeof(struct sembuf) * nsops);
  430. msg->msg.seq = *seq;
  431. debug("ipc send to %u: IPC_SYSV_SEMOP(%u, %ld, %u)\n", owner, semid,
  432. timeout, nsops);
  433. ret = do_ipc_duplex(msg, port, seq, NULL);
  434. put_ipc_port(port);
  435. out:
  436. SAVE_PROFILE_INTERVAL(ipc_sysv_semop_send);
  437. return ret;
  438. }
  439. int ipc_sysv_semop_callback (IPC_CALLBACK_ARGS)
  440. {
  441. BEGIN_PROFILE_INTERVAL();
  442. int ret = 0;
  443. struct shim_ipc_sysv_semop * msgin =
  444. (struct shim_ipc_sysv_semop *) &msg->msg;
  445. debug("ipc callback from %u: IPC_SYSV_SEMOP(%u, %ld, %u)\n", msg->src,
  446. msgin->semid, msgin->timeout, msgin->nsops);
  447. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  448. if (!sem) {
  449. ret = -ENOENT;
  450. goto out;
  451. }
  452. struct sysv_client client;
  453. client.port = port;
  454. client.vmid = msg->src;
  455. client.seq = msg->seq;
  456. ret = submit_sysv_sem(sem, msgin->sops, msgin->nsops, msgin->timeout,
  457. &client);
  458. put_sem_handle(sem);
  459. out:
  460. SAVE_PROFILE_INTERVAL(ipc_sysv_semop_callback);
  461. return ret;
  462. }
  463. DEFINE_PROFILE_INTERVAL(ipc_sysv_semctl_send, ipc);
  464. DEFINE_PROFILE_INTERVAL(ipc_sysv_semctl_callback, ipc);
  465. int ipc_sysv_semctl_send (IDTYPE semid, int semnum, int cmd, void * vals,
  466. int valsize)
  467. {
  468. BEGIN_PROFILE_INTERVAL();
  469. IDTYPE owner;
  470. struct shim_ipc_port * port = NULL;
  471. int ret = 0;
  472. if ((ret = connect_owner(semid, &port, &owner)) < 0)
  473. goto out;
  474. int ctlvalsize = (cmd == SETALL || cmd == SETVAL) ? valsize : 0;
  475. struct shim_ipc_msg_obj * msg = create_ipc_msg_duplex_on_stack(
  476. IPC_SYSV_SEMCTL,
  477. sizeof(struct shim_ipc_sysv_semctl) +
  478. ctlvalsize,
  479. owner);
  480. struct shim_ipc_sysv_semctl * msgin =
  481. (struct shim_ipc_sysv_semctl *) &msg->msg.msg;
  482. msgin->semid = semid;
  483. msgin->semnum = semnum;
  484. msgin->cmd = cmd;
  485. msgin->valsize = ctlvalsize;
  486. if (ctlvalsize)
  487. memcpy(msgin->vals, vals, ctlvalsize);
  488. debug("ipc send to %u: IPC_SYSV_SEMCTL(%u, %d, %d)\n", owner, semid,
  489. semnum, cmd);
  490. ret = do_ipc_duplex(msg, port, NULL, vals);
  491. put_ipc_port(port);
  492. out:
  493. SAVE_PROFILE_INTERVAL(ipc_sysv_semctl_send);
  494. return ret;
  495. }
  496. int ipc_sysv_semctl_callback (IPC_CALLBACK_ARGS)
  497. {
  498. BEGIN_PROFILE_INTERVAL();
  499. int ret = 0;
  500. struct shim_ipc_sysv_semctl * msgin =
  501. (struct shim_ipc_sysv_semctl *) &msg->msg;
  502. debug("ipc callback from %u: IPC_SYSV_SEMCTL(%u, %d, %d)\n", msg->src,
  503. msgin->semid, msgin->semnum, msgin->cmd);
  504. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  505. if (!sem) {
  506. ret = -ENOENT;
  507. goto out;
  508. }
  509. void * vals = NULL;
  510. int valsize;
  511. switch(msgin->cmd) {
  512. case GETALL: {
  513. unsigned short * allsems = __alloca(sizeof(unsigned short) *
  514. sem->nsems);
  515. for (int i = 0 ; i < sem->nsems ; i++)
  516. allsems[i] = sem->sems[i].val;
  517. vals = allsems;
  518. valsize = sizeof(unsigned short) * sem->nsems;
  519. goto semret;
  520. }
  521. case GETNCNT:
  522. vals = &sem->sems[msgin->semnum].ncnt;
  523. valsize = sizeof(unsigned short);
  524. goto semret;
  525. case GETPID:
  526. vals = &sem->sems[msgin->semnum].pid;
  527. valsize = sizeof(IDTYPE);
  528. goto semret;
  529. case GETVAL:
  530. vals = &sem->sems[msgin->semnum].val;
  531. valsize = sizeof(unsigned short);
  532. goto semret;
  533. case GETZCNT:
  534. vals = &sem->sems[msgin->semnum].zcnt;
  535. valsize = sizeof(unsigned short);
  536. break;
  537. case SETALL: {
  538. if (msgin->valsize != sizeof(unsigned short) * sem->nsems) {
  539. ret = -EINVAL;
  540. break;
  541. }
  542. unsigned short * vals = (void *) msgin->vals;
  543. for (int i = 0 ; i < sem->nsems ; i++)
  544. sem->sems[i].val = vals[i];
  545. ret = RESPONSE_CALLBACK;
  546. break;
  547. }
  548. case SETVAL: {
  549. ret = -EINVAL;
  550. if (msgin->valsize != sizeof(unsigned short))
  551. break;
  552. if (msgin->semnum >= sem->nsems)
  553. break;
  554. sem->sems[msgin->semnum].val = *((int *) msgin->vals);
  555. ret = RESPONSE_CALLBACK;
  556. break;
  557. }
  558. default:
  559. ret = -ENOSYS;
  560. break;
  561. }
  562. put_sem_handle(sem);
  563. goto out;
  564. semret:
  565. ret = ipc_sysv_semret_send(port, msg->src, vals, valsize,
  566. msg->seq);
  567. out:
  568. SAVE_PROFILE_INTERVAL(ipc_sysv_semctl_callback);
  569. return ret;
  570. }
  571. DEFINE_PROFILE_INTERVAL(ipc_sysv_semret_send, ipc);
  572. DEFINE_PROFILE_INTERVAL(ipc_sysv_semret_callback, ipc);
  573. int ipc_sysv_semret_send (struct shim_ipc_port * port, IDTYPE dest, void * vals,
  574. int valsize, unsigned long seq)
  575. {
  576. BEGIN_PROFILE_INTERVAL();
  577. int ret = 0;
  578. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  579. IPC_SYSV_SEMRET,
  580. sizeof(struct shim_ipc_sysv_semret) +
  581. valsize,
  582. dest);
  583. struct shim_ipc_sysv_semret * msgin =
  584. (struct shim_ipc_sysv_semret *) &msg->msg;
  585. msgin->valsize = valsize;
  586. memcpy(msgin->vals, vals, valsize);
  587. msg->seq = seq;
  588. debug("ipc send to %u: IPC_SYSV_SEMRET\n", dest);
  589. ret = send_ipc_message(msg, port);
  590. SAVE_PROFILE_INTERVAL(ipc_sysv_semret_send);
  591. return ret;
  592. }
  593. int ipc_sysv_semret_callback (IPC_CALLBACK_ARGS)
  594. {
  595. BEGIN_PROFILE_INTERVAL();
  596. struct shim_ipc_sysv_semret * semret =
  597. (struct shim_ipc_sysv_semret *) &msg->msg;
  598. debug("ipc callback from %u: IPC_SYSV_SEMRET\n", msg->src);
  599. struct shim_ipc_msg_obj * obj = find_ipc_msg_duplex(port, msg->seq);
  600. if (obj) {
  601. struct shim_ipc_sysv_semctl * semctl =
  602. (struct shim_ipc_sysv_semctl *) &obj->msg.msg;
  603. void * vals = obj->private;
  604. if (vals) {
  605. switch(semctl->cmd) {
  606. case GETALL:
  607. case GETNCNT:
  608. case GETPID:
  609. case GETVAL:
  610. case GETZCNT: {
  611. int retvalsize = semret->valsize;
  612. if (retvalsize > semctl->valsize)
  613. retvalsize = semctl->valsize;
  614. memcpy(vals, semret->vals, retvalsize);
  615. break;
  616. }
  617. }
  618. }
  619. if (obj->thread)
  620. thread_wakeup(obj->thread);
  621. }
  622. SAVE_PROFILE_INTERVAL(ipc_sysv_semret_callback);
  623. return 0;
  624. }
  625. DEFINE_PROFILE_INTERVAL(ipc_sysv_semmov_send, ipc);
  626. DEFINE_PROFILE_INTERVAL(ipc_sysv_semmov_callback, ipc);
  627. int ipc_sysv_semmov_send (struct shim_ipc_port * port, IDTYPE dest,
  628. IDTYPE semid, LEASETYPE lease,
  629. struct sem_backup * sems, int nsems,
  630. struct sem_client_backup * srcs, int nsrcs,
  631. struct sysv_score * scores, int nscores)
  632. {
  633. BEGIN_PROFILE_INTERVAL();
  634. struct shim_ipc_msg * msg =
  635. create_ipc_msg_on_stack(IPC_SYSV_SEMMOV,
  636. sizeof(struct shim_ipc_sysv_semmov) +
  637. sizeof(struct sem_backup) * nsems +
  638. sizeof(struct sem_client_backup) * nsrcs +
  639. sizeof(struct sysv_score) * nscores,
  640. dest);
  641. struct shim_ipc_sysv_semmov * msgin =
  642. (struct shim_ipc_sysv_semmov *) &msg->msg;
  643. msgin->semid = semid;
  644. msgin->lease = lease;
  645. msgin->nsems = nsems;
  646. msgin->nsrcs = nsrcs;
  647. msgin->nscores = nscores;
  648. memcpy(&msgin->sems, sems, sizeof(struct sem_backup) * nsems);
  649. memcpy((void *) msgin->sems + sizeof(struct sem_backup) * nsems,
  650. srcs, sizeof(struct sem_client_backup) * nsrcs);
  651. memcpy((void *) msgin->sems + sizeof(struct sem_backup) * nsems +
  652. sizeof(struct sem_client_backup) * nsrcs,
  653. scores, sizeof(struct sysv_score) * nscores);
  654. debug("ipc send to %u: IPC_SYSV_SEMMOV(%ld)\n", semid);
  655. int ret = send_ipc_message(msg, port);
  656. SAVE_PROFILE_INTERVAL(ipc_sysv_semmov_send);
  657. return ret;
  658. }
  659. int ipc_sysv_semmov_callback (IPC_CALLBACK_ARGS)
  660. {
  661. BEGIN_PROFILE_INTERVAL();
  662. int ret = 0;
  663. struct shim_ipc_sysv_semmov * msgin =
  664. (struct shim_ipc_sysv_semmov *) &msg->msg;
  665. debug("ipc callback from %u: IPC_SYSV_SEMMOV(%ld)\n", msg->src,
  666. msgin->semid);
  667. struct sem_backup * sems = msgin->sems;
  668. struct sem_client_backup * clients =
  669. (struct sem_client_backup *) (sems + msgin->nsems);
  670. struct sysv_score * scores =
  671. (struct sysv_score *) (clients + msgin->nsrcs);
  672. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  673. if (!sem) {
  674. ret = -ENOENT;
  675. goto out;
  676. }
  677. struct shim_handle * hdl = container_of(sem, struct shim_handle,
  678. info.sem);
  679. lock(hdl->lock);
  680. int nscores = (msgin->nscores > MAX_SYSV_CLIENTS) ?
  681. MAX_SYSV_CLIENTS : msgin->nscores;
  682. if (nscores)
  683. memcpy(sem->scores, scores, nscores);
  684. if (nscores < MAX_SYSV_CLIENTS)
  685. memset(sem->scores + nscores, 0,
  686. sizeof(struct sysv_score) * (MAX_SYSV_CLIENTS - nscores));
  687. unlock(hdl->lock);
  688. ret = recover_sem_ownership(sem, sems, msgin->nsems, clients,
  689. msgin->nsrcs);
  690. struct shim_ipc_info * info;
  691. if (!create_ipc_location(&info)) {
  692. add_sysv_subrange(msgin->semid, info->vmid, qstrgetstr(&info->uri),
  693. &msgin->lease);
  694. put_ipc_info(info);
  695. }
  696. put_sem_handle(sem);
  697. out:
  698. SAVE_PROFILE_INTERVAL(ipc_sysv_semmov_callback);
  699. return ret;
  700. }
  701. #ifdef USE_SHARED_SEMAPHORE
  702. DEFINE_PROFILE_INTERVAL(ipc_sysv_semquery_send, ipc);
  703. DEFINE_PROFILE_INTERVAL(ipc_sysv_semquery_callback, ipc);
  704. int ipc_sysv_semquery_send (IDTYPE semid, int * nsems,
  705. PAL_NUM ** host_sem_ids)
  706. {
  707. BEGIN_PROFILE_INTERVAL();
  708. int ret = 0;
  709. IDTYPE dest;
  710. struct shim_ipc_port * port = NULL;
  711. if ((ret = connect_owner(semid, &port, &dest)) < 0)
  712. goto out;
  713. if (dest == cur_process.vmid) {
  714. ret = -EAGAIN;
  715. goto out;
  716. }
  717. assert(port);
  718. struct shim_ipc_msg_obj * msg = create_ipc_msg_duplex_on_stack(
  719. IPC_SYSV_SEMQUERY,
  720. sizeof(struct shim_ipc_sysv_semquery),
  721. dest);
  722. struct shim_ipc_sysv_semquery * msgin =
  723. (struct shim_ipc_sysv_semquery *) &msg->msg.msg;
  724. msgin->semid = semid;
  725. debug("ipc send to %u: IPC_SYSV_SEMQUERY(%u)\n", dest, semid);
  726. ret = do_ipc_duplex(msg, port, NULL, host_sem_ids);
  727. put_ipc_port(port);
  728. if (ret >= 0) {
  729. *nsems = ret;
  730. ret = 0;
  731. }
  732. out:
  733. SAVE_PROFILE_INTERVAL(ipc_sysv_semquery_send);
  734. return ret;
  735. }
  736. int ipc_sysv_semquery_callback (IPC_CALLBACK_ARGS)
  737. {
  738. BEGIN_PROFILE_INTERVAL();
  739. int ret = 0;
  740. struct shim_ipc_sysv_semquery * msgin =
  741. (struct shim_ipc_sysv_semquery *) &msg->msg;
  742. debug("ipc callback from %u: IPC_SYSV_SEMQUERY(%u)\n", msg->src,
  743. msgin->semid);
  744. struct shim_sem_handle * sem = get_sem_handle_by_id(msgin->semid);
  745. if (!sem) {
  746. ret = -ENOENT;
  747. goto out;
  748. }
  749. ret = send_sem_host_ids(sem, port, msg->src, msg->seq);
  750. put_sem_handle(sem);
  751. out:
  752. SAVE_PROFILE_INTERVAL(ipc_sysv_semreply_callback);
  753. return ret;
  754. }
  755. DEFINE_PROFILE_INTERVAL(ipc_sysv_semreply_send, ipc);
  756. DEFINE_PROFILE_INTERVAL(ipc_sysv_semreply_callback, ipc);
  757. int ipc_sysv_semreply_send (struct shim_ipc_port * port, IDTYPE dest,
  758. IDTYPE semid, int nsems, PAL_NUM * host_sem_ids,
  759. unsigned long seq)
  760. {
  761. BEGIN_PROFILE_INTERVAL();
  762. int ret = 0;
  763. struct shim_ipc_msg * msg = create_ipc_msg_on_stack(
  764. IPC_SYSV_SEMREPLY,
  765. sizeof(struct shim_ipc_sysv_semreply)
  766. + sizeof(PAL_NUM) * nsems,
  767. dest);
  768. struct shim_ipc_sysv_semreply * msgin =
  769. (struct shim_ipc_sysv_semreply *) &msg->msg;
  770. msgin->semid = semid;
  771. msgin->nsems = nsems;
  772. if (nsems)
  773. memcpy(msgin->host_sem_ids, host_sem_ids, sizeof(PAL_NUM) * nsems);
  774. msg->seq = seq;
  775. debug("ipc send to %u: IPC_SYSV_SEMREPLY(%u, %d)\n", dest, semid, nsems);
  776. ret = send_ipc_message(msg, port);
  777. SAVE_PROFILE_INTERVAL(ipc_sysv_semreply_send);
  778. return ret;
  779. }
  780. int ipc_sysv_semreply_callback (IPC_CALLBACK_ARGS)
  781. {
  782. BEGIN_PROFILE_INTERVAL();
  783. int ret = 0;
  784. struct shim_ipc_sysv_semreply * msgin =
  785. (struct shim_ipc_sysv_semreply *) &msg->msg;
  786. debug("ipc callback from %u: IPC_SYSV_SEMREPLY(%u, %d)\n", msg->src,
  787. msgin->semid, msgin->nsems);
  788. struct shim_ipc_msg_obj * obj = find_ipc_msg_duplex(port, msg->seq);
  789. if (!obj)
  790. goto out;
  791. PAL_NUM ** semids = obj->private;
  792. if (semids)
  793. *semids = malloc_copy(msgin->host_sem_ids,
  794. sizeof(PAL_NUM) * msgin->nsems);
  795. obj->retval = msgin->nsems;
  796. if (obj->thread)
  797. thread_wakeup(obj->thread);
  798. out:
  799. SAVE_PROFILE_INTERVAL(ipc_sysv_semreply_callback);
  800. return ret;
  801. }
  802. #endif /* USE_SHARED_SEMAPHORE */
  803. int __balance_sysv_score (struct sysv_balance_policy * policy,
  804. struct shim_handle * hdl,
  805. struct sysv_score * scores, int nscores,
  806. struct sysv_client * src, long score)
  807. {
  808. struct sysv_score * s = scores;
  809. struct sysv_score * last = scores + nscores;
  810. for ( ; s < last && !s->vmid ; s++);
  811. struct sysv_score * free = s > scores ? scores : NULL;
  812. struct sysv_score * highest = s < last ? s : NULL;
  813. struct sysv_score * lowest = highest;
  814. struct sysv_score * owner = NULL;
  815. struct sysv_score * chosen = NULL;
  816. for ( ; s < last ; s++) {
  817. if (!s->vmid) {
  818. if (!free)
  819. free = s;
  820. continue;
  821. }
  822. if (s->score >= highest->score)
  823. highest = s;
  824. if (s->score < lowest->score)
  825. lowest = s;
  826. if (src) {
  827. if (s->vmid == cur_process.vmid)
  828. owner = s;
  829. if (s->vmid == src->vmid) {
  830. chosen = s;
  831. continue;
  832. }
  833. } else {
  834. if (s->vmid == cur_process.vmid) {
  835. owner = chosen = s;
  836. continue;
  837. }
  838. }
  839. s->score = (s->score >= policy->score_decay) ?
  840. s->score - policy->score_decay : 0;
  841. debug("balance: %u => %d\n", s->vmid, s->score);
  842. }
  843. if (!chosen) {
  844. chosen = free ? : lowest;
  845. chosen->vmid = src ? src->vmid : cur_process.vmid;
  846. chosen->score = 0;
  847. }
  848. chosen->score += score;
  849. if (chosen->score > policy->score_max)
  850. chosen->score = policy->score_max;
  851. debug("balance: %u => %d\n", chosen->vmid, chosen->score);
  852. if (!src || chosen != highest ||
  853. chosen->score < (owner ? owner->score : 0) + policy->balance_threshold)
  854. return 0;
  855. return policy->migrate(hdl, src);
  856. }