/* Copyright (c) 2013-2017, The Tor Project, Inc. */
/* See LICENSE for licensing information */

#include "or.h"
#include "config.h"
#include "compat_libevent.h"
#define SCHEDULER_PRIVATE_
#define SCHEDULER_KIST_PRIVATE
#include "scheduler.h"
#include "main.h"
#include "buffers.h"
#define TOR_CHANNEL_INTERNAL_
#include "channeltls.h"

#include <event2/event.h>

/**
 * \file scheduler.c
 * \brief Channel scheduling system: decides which channels should send and
 *   receive when.
 *
 * This module is the global/common parts of the scheduling system. This system
 * is what decides what channels get to send cells on their circuits and when.
 *
 * Terms:
 * - "Scheduling system": the collection of scheduler*.{h,c} files and their
 *   aggregate behavior.
 * - "Scheduler implementation": a scheduler_t. The scheduling system has one
 *   active scheduling implementation at a time.
 *
 * In this file you will find state that any scheduler implementation can have
 * access to as well as the functions the rest of Tor uses to interact with the
 * scheduling system.
 *
 * The earliest versions of Tor approximated a kind of round-robin system
 * among active connections, but only approximated it. It would only consider
 * one connection (roughly equal to a channel in today's terms) at a time, and
 * thus could only prioritize circuits against others on the same connection.
 *
 * Then in response to the KIST paper[0], Tor implemented a global
 * circuit scheduler. It was supposed to prioritize circuits across many
 * channels, but wasn't effective. It is preserved in scheduler_vanilla.c.
 *
 * [0]: http://www.robgjansen.com/publications/kist-sec2014.pdf
 *
 * Then we actually got around to implementing KIST for real. We decided to
 * modularize the scheduler so new ones can be implemented. You can find KIST
 * in scheduler_kist.c.
 *
 * Channels have one of four scheduling states based on whether or not they
 * have cells to send and whether or not they are able to send.
 *
 * <ol>
 * <li>
 *   Not open for writes, no cells to send.
 *   <ul><li> Not much to do here, and the channel will have scheduler_state
 *       == SCHED_CHAN_IDLE
 *     <li> Transitions from:
 *       <ul>
 *       <li>Open for writes/has cells by simultaneously draining all circuit
 *         queues and filling the output buffer.
 *       </ul>
 *     <li> Transitions to:
 *       <ul>
 *       <li> Not open for writes/has cells by arrival of cells on an attached
 *         circuit (this would be driven from append_cell_to_circuit_queue())
 *       <li> Open for writes/no cells by a channel type specific path;
 *         driven from connection_or_flushed_some() for channel_tls_t.
 *       </ul>
 *   </ul>
 *
 * <li> Open for writes, no cells to send
 *   <ul>
 *     <li>Not much here either; this will be the state an idle but open
 *       channel can be expected to settle in. It will have scheduler_state
 *       == SCHED_CHAN_WAITING_FOR_CELLS
 *     <li> Transitions from:
 *       <ul>
 *       <li>Not open for writes/no cells by flushing some of the output
 *         buffer.
 *       <li>Open for writes/has cells by the scheduler moving cells from
 *         circuit queues to channel output queue, but not having enough
 *         to fill the output queue.
 *       </ul>
 *     <li> Transitions to:
 *       <ul>
 *       <li>Open for writes/has cells by arrival of new cells on an attached
 *         circuit, in append_cell_to_circuit_queue()
 *       </ul>
 *   </ul>
 *
 * <li>Not open for writes, cells to send
 *   <ul>
 *     <li>This is the state of a busy circuit limited by output bandwidth;
 *       cells have piled up in the circuit queues waiting to be relayed.
 *       The channel will have scheduler_state == SCHED_CHAN_WAITING_TO_WRITE.
 *     <li> Transitions from:
 *       <ul>
 *       <li>Not open for writes/no cells by arrival of cells on an attached
 *         circuit
 *       <li>Open for writes/has cells by filling an output buffer without
 *         draining all cells from attached circuits
 *       </ul>
 *     <li> Transitions to:
 *       <ul>
 *       <li>Open for writes/has cells by draining some of the output buffer
 *         via the connection_or_flushed_some() path (for channel_tls_t).
 *       </ul>
 *   </ul>
 *
 * <li>Open for writes, cells to send
 *   <ul>
 *     <li>This connection is ready to relay some cells and waiting for
 *       the scheduler to choose it. The channel will have scheduler_state ==
 *       SCHED_CHAN_PENDING.
 *     <li>Transitions from:
 *       <ul>
 *       <li>Not open for writes/has cells by the connection_or_flushed_some()
 *         path
 *       <li>Open for writes/no cells by the append_cell_to_circuit_queue()
 *         path
 *       </ul>
 *     <li> Transitions to:
 *       <ul>
 *       <li>Not open for writes/no cells by draining all circuit queues and
 *         simultaneously filling the output buffer.
 *       <li>Not open for writes/has cells by writing enough cells to fill the
 *         output buffer
 *       <li>Open for writes/no cells by draining all attached circuit queues
 *         without also filling the output buffer
 *       </ul>
 *   </ul>
 * </ol>
 *
 * Other event-driven parts of the code move channels between these scheduling
 * states by calling scheduler functions. The scheduling system builds up a
 * list of channels in the SCHED_CHAN_PENDING state that the scheduler
 * implementation should then use when it runs. Scheduling implementations need
 * to properly update channel states during their scheduler_t->run() function
 * as that is the only opportunity for channels to move from SCHED_CHAN_PENDING
 * to any other state.
 *
 * The remainder of this file is a small amount of state that any scheduler
 * implementation should have access to, and the functions the rest of Tor uses
 * to interact with the scheduling system.
 */
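
/*
 * Illustrative walkthrough (a sketch, not part of the build): how the call
 * sites named in the comment above are expected to drive the state machine
 * for a single channel_t, using only functions defined later in this file.
 * The surrounding code at those call sites may of course differ.
 *
 *   channel_t *chan = ...;   // starts out as SCHED_CHAN_IDLE
 *
 *   // A cell arrives on an attached circuit
 *   // (the append_cell_to_circuit_queue() path):
 *   scheduler_channel_has_waiting_cells(chan);
 *   // chan is now SCHED_CHAN_WAITING_TO_WRITE: it has cells, but the
 *   // outgoing connection is not yet writeable.
 *
 *   // The output buffer drains (the connection_or_flushed_some() path):
 *   scheduler_channel_wants_writes(chan);
 *   // chan is now SCHED_CHAN_PENDING and sits in channels_pending until
 *   // the_scheduler->run() picks it and flushes cells from it.
 *
 *   // If the output buffer fills up again before the circuit queues are
 *   // drained:
 *   scheduler_channel_doesnt_want_writes(chan);
 *   // chan goes back to SCHED_CHAN_WAITING_TO_WRITE.
 */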

/*****************************************************************************
 * Scheduling system state
 *
 * State that can be accessed from any scheduler implementation (but not
 * outside the scheduling system)
 *****************************************************************************/

/** The currently active scheduler implementation, as selected from the
 * configuration by set_scheduler(). */
STATIC const scheduler_t *the_scheduler;

/**
 * We keep a list of channels that are pending - i.e., that have cells to
 * write and are currently able to send them. The enum scheduler_state in
 * channel_t is reserved for our use.
 *
 * Priority queue of channels that can write and have cells (pending work)
 */
STATIC smartlist_t *channels_pending = NULL;

/**
 * This event runs the scheduler from its callback, and is manually
 * activated whenever a channel enters open for writes/cells to send.
 */
STATIC struct event *run_sched_ev = NULL;

/*****************************************************************************
 * Scheduling system static function definitions
 *
 * Functions that can only be accessed from this file.
 *****************************************************************************/

/** Return a human readable string for the given scheduler type. */
static const char *
get_scheduler_type_string(scheduler_types_t type)
{
  switch (type) {
  case SCHEDULER_VANILLA:
    return "Vanilla";
  case SCHEDULER_KIST:
    return "KIST";
  case SCHEDULER_KIST_LITE:
    return "KISTLite";
  case SCHEDULER_NONE:
    /* fallthrough */
  default:
    tor_assert_unreached();
    return "(N/A)";
  }
}

/**
 * Scheduler event callback; this should get triggered once per event loop
 * if any scheduling work was created during the event loop.
 */
static void
scheduler_evt_callback(evutil_socket_t fd, short events, void *arg)
{
  (void) fd;
  (void) events;
  (void) arg;

  log_debug(LD_SCHED, "Scheduler event callback called");

  /* Run the scheduler. This is a mandatory function. */

  /* We might as well assert on this. If this function doesn't exist, no cells
   * are getting scheduled. Things are very broken. scheduler_t says the run()
   * function is mandatory. */
  tor_assert(the_scheduler->run);
  the_scheduler->run();

  /* Schedule itself back in if it has more work. */

  /* Again, might as well assert on this mandatory scheduler_t function. If it
   * doesn't exist, there's no way to tell libevent to run the scheduler again
   * in the future. */
  tor_assert(the_scheduler->schedule);
  the_scheduler->schedule();
}
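
/*
 * Illustrative sketch (not compiled here) of the shape of a scheduler
 * implementation as this file uses it. The field names are exactly the ones
 * dereferenced in this file (run, schedule, init, free_all, on_new_options,
 * on_new_consensus, on_channel_free, type); see scheduler.h for the
 * authoritative definition of scheduler_t.
 *
 *   static void example_run(void)
 *   {
 *     // Flush cells from the channels in get_channels_pending(), moving
 *     // each channel out of SCHED_CHAN_PENDING as appropriate.
 *   }
 *
 *   static void example_schedule(void)
 *   {
 *     // Ask libevent to fire run_sched_ev again, e.g. via
 *     // scheduler_ev_active() or scheduler_ev_add().
 *   }
 *
 *   static scheduler_t example_scheduler = {
 *     .type = SCHEDULER_VANILLA,
 *     .run = example_run,
 *     .schedule = example_schedule,
 *     // The remaining callbacks are optional: this file NULL-checks them
 *     // before calling, while run() and schedule() are asserted to exist.
 *   };
 */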

/** Using the global options, select the scheduler we should be using. */
static void
select_scheduler(void)
{
  scheduler_t *new_scheduler = NULL;

#ifdef TOR_UNIT_TESTS
  /* This is hella annoying to set in the options for every test that passes
   * through the scheduler and there are many so if we don't explicitly have
   * a list of types set, just put the vanilla one. */
  if (get_options()->SchedulerTypes_ == NULL) {
    the_scheduler = get_vanilla_scheduler();
    return;
  }
#endif /* defined(TOR_UNIT_TESTS) */

  /* This list is ordered by priority: the first entry has the highest
   * priority. Thus, as soon as we find a scheduler type that we can use, we
   * use it and stop. */
  SMARTLIST_FOREACH_BEGIN(get_options()->SchedulerTypes_, int *, type) {
    switch (*type) {
    case SCHEDULER_VANILLA:
      new_scheduler = get_vanilla_scheduler();
      goto end;
    case SCHEDULER_KIST:
      if (!scheduler_can_use_kist()) {
#ifdef HAVE_KIST_SUPPORT
        log_notice(LD_SCHED, "Scheduler type KIST has been disabled by "
                             "the consensus or lacks kernel support.");
#else /* !(defined(HAVE_KIST_SUPPORT)) */
        log_info(LD_SCHED, "Scheduler type KIST not built in");
#endif /* defined(HAVE_KIST_SUPPORT) */
        continue;
      }
      new_scheduler = get_kist_scheduler();
      scheduler_kist_set_full_mode();
      goto end;
    case SCHEDULER_KIST_LITE:
      new_scheduler = get_kist_scheduler();
      scheduler_kist_set_lite_mode();
      goto end;
    case SCHEDULER_NONE:
      /* fallthrough */
    default:
      /* Our option validation should have caught this. */
      tor_assert_unreached();
    }
  } SMARTLIST_FOREACH_END(type);

 end:
  if (new_scheduler == NULL) {
    log_err(LD_SCHED, "Tor was unable to select a scheduler type. Please "
                      "make sure Schedulers is correctly configured with "
                      "types that this Tor supports.");
    /* We weren't able to choose a scheduler, which means that none of the
     * types set in Schedulers are supported or usable. We respect the user's
     * configuration rather than silently falling back to something else.
     * Because this can change at runtime, we have to stop Tor right now. */
    exit(1);
  }

  /* Set the chosen scheduler. */
  the_scheduler = new_scheduler;
}
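
/*
 * Illustrative configuration (an assumption about the exact torrc syntax;
 * the option name "Schedulers" comes from the log message above, and the
 * type names from get_scheduler_type_string()): list scheduler types in
 * priority order, and select_scheduler() picks the first usable one.
 *
 *   Schedulers KIST,KISTLite,Vanilla
 *
 * With a line like that, KIST is used when the kernel and consensus allow
 * it, otherwise KISTLite, otherwise the vanilla scheduler.
 */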

/**
 * Helper function called from a few different places. It changes the
 * scheduler implementation, if necessary. And if it did, it then tells the
 * old one to free its state and the new one to initialize.
 */
static void
set_scheduler(void)
{
  const scheduler_t *old_scheduler = the_scheduler;
  scheduler_types_t old_scheduler_type = SCHEDULER_NONE;

  /* We keep track of the type in order to log only if the type switched. We
   * can't just use the scheduler pointers because KIST and KISTLite share the
   * same object. */
  if (the_scheduler) {
    old_scheduler_type = the_scheduler->type;
  }

  /* From the options, select the scheduler type to set. */
  select_scheduler();
  tor_assert(the_scheduler);

  /* We look at the pointer difference in case the old sched and new sched
   * share the same scheduler object, as is the case with KIST and KISTLite. */
  if (old_scheduler != the_scheduler) {
    /* Allow the old scheduler to clean up, if needed. */
    if (old_scheduler && old_scheduler->free_all) {
      old_scheduler->free_all();
    }

    /* Initialize the new scheduler. */
    if (the_scheduler->init) {
      the_scheduler->init();
    }
  }

  /* Finally, log a notice if we switched scheduler types. We compare types in
   * case two schedulers share a scheduler object. */
  if (old_scheduler_type != the_scheduler->type) {
    log_notice(LD_CONFIG, "Scheduler type %s has been enabled.",
               get_scheduler_type_string(the_scheduler->type));
  }
}

/*****************************************************************************
 * Scheduling system private function definitions
 *
 * Functions that can only be accessed from scheduler*.c
 *****************************************************************************/

/** Return the pending channel list. */
smartlist_t *
get_channels_pending(void)
{
  return channels_pending;
}

/** Comparison function to use when sorting pending channels. */
MOCK_IMPL(int,
scheduler_compare_channels, (const void *c1_v, const void *c2_v))
{
  const channel_t *c1 = NULL, *c2 = NULL;
  /* These are a workaround for -Wbad-function-cast throwing a fit */
  const circuitmux_policy_t *p1, *p2;
  uintptr_t p1_i, p2_i;

  tor_assert(c1_v);
  tor_assert(c2_v);

  c1 = (const channel_t *)(c1_v);
  c2 = (const channel_t *)(c2_v);

  if (c1 != c2) {
    if (circuitmux_get_policy(c1->cmux) ==
        circuitmux_get_policy(c2->cmux)) {
      /* Same cmux policy, so use the mux comparison */
      return circuitmux_compare_muxes(c1->cmux, c2->cmux);
    } else {
      /*
       * Different policies; not important to get this edge case perfect
       * because the current code never actually gives different channels
       * different cmux policies anyway. Just use this arbitrary but
       * definite choice.
       */
      p1 = circuitmux_get_policy(c1->cmux);
      p2 = circuitmux_get_policy(c2->cmux);
      p1_i = (uintptr_t)p1;
      p2_i = (uintptr_t)p2;

      return (p1_i < p2_i) ? -1 : 1;
    }
  } else {
    /* c1 == c2, so always equal */
    return 0;
  }
}
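
/*
 * Illustrative sketch (not compiled here): how a scheduler implementation's
 * run() function might drain the priority queue kept in channels_pending,
 * using the same comparator and heap-index offset as the other
 * smartlist_pqueue_*() calls in this file. smartlist_pqueue_pop() is assumed
 * to be available alongside the add/remove helpers used below.
 *
 *   smartlist_t *pending = get_channels_pending();
 *   while (smartlist_len(pending) > 0) {
 *     channel_t *chan = smartlist_pqueue_pop(pending,
 *                                            scheduler_compare_channels,
 *                                            offsetof(channel_t,
 *                                                     sched_heap_idx));
 *     // ... flush some cells from chan, then either re-add it (still
 *     // pending) or set the appropriate SCHED_CHAN_* state on it. ...
 *   }
 */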

/*****************************************************************************
 * Scheduling system global functions
 *
 * Functions that can be accessed from anywhere in Tor.
 *****************************************************************************/

/**
 * This is how the scheduling system is notified of Tor's configuration
 * changing. For example: a SIGHUP was issued.
 */
void
scheduler_conf_changed(void)
{
  /* Let the scheduler decide what it should do. */
  set_scheduler();

  /* Then tell the (possibly new) scheduler that we have new options. */
  if (the_scheduler->on_new_options) {
    the_scheduler->on_new_options();
  }
}

/**
 * Whenever we get a new consensus, this function is called.
 */
void
scheduler_notify_networkstatus_changed(const networkstatus_t *old_c,
                                       const networkstatus_t *new_c)
{
  /* Maybe the consensus param made us change the scheduler. */
  set_scheduler();

  /* Then tell the (possibly new) scheduler that we have a new consensus */
  if (the_scheduler->on_new_consensus) {
    the_scheduler->on_new_consensus(old_c, new_c);
  }
}

/**
 * Free everything scheduling-related from main.c. Note this is only called
 * when Tor is shutting down, while scheduler_t->free_all() is called both when
 * Tor is shutting down and when we are switching schedulers.
 */
void
scheduler_free_all(void)
{
  log_debug(LD_SCHED, "Shutting down scheduler");

  if (run_sched_ev) {
    if (event_del(run_sched_ev) < 0) {
      log_warn(LD_BUG, "Problem deleting run_sched_ev");
    }
    tor_event_free(run_sched_ev);
    run_sched_ev = NULL;
  }

  if (channels_pending) {
    /* We don't have ownership of the objects in this list. */
    smartlist_free(channels_pending);
    channels_pending = NULL;
  }

  if (the_scheduler && the_scheduler->free_all) {
    the_scheduler->free_all();
  }
  the_scheduler = NULL;
}

/** Mark a channel as no longer ready to accept writes. */
MOCK_IMPL(void,
scheduler_channel_doesnt_want_writes,(channel_t *chan))
{
  IF_BUG_ONCE(!chan) {
    return;
  }
  IF_BUG_ONCE(!channels_pending) {
    return;
  }

  /* If it's already in pending, we can put it in waiting_to_write */
  if (chan->scheduler_state == SCHED_CHAN_PENDING) {
    /*
     * It's in channels_pending, so it shouldn't be in any of
     * the other lists. It can't write any more, so it goes to
     * channels_waiting_to_write.
     */
    smartlist_pqueue_remove(channels_pending,
                            scheduler_compare_channels,
                            offsetof(channel_t, sched_heap_idx),
                            chan);
    chan->scheduler_state = SCHED_CHAN_WAITING_TO_WRITE;
    log_debug(LD_SCHED,
              "Channel " U64_FORMAT " at %p went from pending "
              "to waiting_to_write",
              U64_PRINTF_ARG(chan->global_identifier), chan);
  } else {
    /*
     * It's not in pending, so it can't become waiting_to_write; it's
     * either not in any of the lists (nothing to do) or it's already in
     * waiting_for_cells (remove it, can't write any more).
     */
    if (chan->scheduler_state == SCHED_CHAN_WAITING_FOR_CELLS) {
      chan->scheduler_state = SCHED_CHAN_IDLE;
      log_debug(LD_SCHED,
                "Channel " U64_FORMAT " at %p left waiting_for_cells",
                U64_PRINTF_ARG(chan->global_identifier), chan);
    }
  }
}

/** Mark a channel as having waiting cells. */
MOCK_IMPL(void,
scheduler_channel_has_waiting_cells,(channel_t *chan))
{
  IF_BUG_ONCE(!chan) {
    return;
  }
  IF_BUG_ONCE(!channels_pending) {
    return;
  }

  /* First, check if it's also writeable */
  if (chan->scheduler_state == SCHED_CHAN_WAITING_FOR_CELLS) {
    /*
     * It's in channels_waiting_for_cells, so it shouldn't be in any of
     * the other lists. It has waiting cells now, so it goes to
     * channels_pending.
     */
    chan->scheduler_state = SCHED_CHAN_PENDING;
    smartlist_pqueue_add(channels_pending,
                         scheduler_compare_channels,
                         offsetof(channel_t, sched_heap_idx),
                         chan);
    log_debug(LD_SCHED,
              "Channel " U64_FORMAT " at %p went from waiting_for_cells "
              "to pending",
              U64_PRINTF_ARG(chan->global_identifier), chan);
    /* If we made a channel pending, we potentially have scheduling work to
     * do. */
    the_scheduler->schedule();
  } else {
    /*
     * It's not in waiting_for_cells, so it can't become pending; it's
     * either not in any of the lists (we add it to waiting_to_write)
     * or it's already in waiting_to_write or pending (we do nothing)
     */
    if (!(chan->scheduler_state == SCHED_CHAN_WAITING_TO_WRITE ||
          chan->scheduler_state == SCHED_CHAN_PENDING)) {
      chan->scheduler_state = SCHED_CHAN_WAITING_TO_WRITE;
      log_debug(LD_SCHED,
                "Channel " U64_FORMAT " at %p entered waiting_to_write",
                U64_PRINTF_ARG(chan->global_identifier), chan);
    }
  }
}

/** Add the scheduler event to the set of pending events with next_run being
 * the longest time libevent should wait before triggering the event. */
void
scheduler_ev_add(const struct timeval *next_run)
{
  tor_assert(run_sched_ev);
  tor_assert(next_run);
  if (BUG(event_add(run_sched_ev, next_run) < 0)) {
    log_warn(LD_SCHED, "Adding to libevent failed. Next run time was set to: "
             "%ld.%06ld", (long)next_run->tv_sec, (long)next_run->tv_usec);
    return;
  }
}

/** Make the scheduler event active with the given flags. */
void
scheduler_ev_active(int flags)
{
  tor_assert(run_sched_ev);
  event_active(run_sched_ev, flags, 1);
}
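
/*
 * Illustrative sketch (not compiled here): how a scheduler implementation's
 * schedule() callback might use the two helpers above. The condition and the
 * 10 msec delay are placeholders, not values this file prescribes.
 *
 *   static void example_schedule(void)
 *   {
 *     int run_asap = 1;  // placeholder condition
 *     if (run_asap) {
 *       // Fire the scheduler event on the next event-loop iteration.
 *       scheduler_ev_active(EV_TIMEOUT);
 *     } else {
 *       // Fire the scheduler event at most 10 msec from now.
 *       struct timeval next_run = { 0, 10 * 1000 };
 *       scheduler_ev_add(&next_run);
 *     }
 *   }
 */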

/**
 * Initialize everything scheduling-related from config.c. Note this is only
 * called when Tor is starting up, while scheduler_t->init() is called both
 * when Tor is starting up and when we are switching schedulers.
 */
void
scheduler_init(void)
{
  log_debug(LD_SCHED, "Initting scheduler");

  // Two '!' because we really do want to check if the pointer is non-NULL
  IF_BUG_ONCE(!!run_sched_ev) {
    log_warn(LD_SCHED, "We should not already have a libevent scheduler "
             "event. I'll clean the old one up, but this is odd.");
    tor_event_free(run_sched_ev);
    run_sched_ev = NULL;
  }
  run_sched_ev = tor_event_new(tor_libevent_get_base(), -1,
                               0, scheduler_evt_callback, NULL);
  channels_pending = smartlist_new();

  set_scheduler();
}

/**
 * If a channel is going away, this is how the scheduling system is informed
 * so it can do any freeing necessary. This ultimately calls
 * scheduler_t->on_channel_free() so the current scheduler can release any
 * state specific to this channel.
 */
MOCK_IMPL(void,
scheduler_release_channel,(channel_t *chan))
{
  IF_BUG_ONCE(!chan) {
    return;
  }
  IF_BUG_ONCE(!channels_pending) {
    return;
  }

  if (chan->scheduler_state == SCHED_CHAN_PENDING) {
    if (SCHED_BUG(smartlist_pos(channels_pending, chan) == -1, chan)) {
      log_warn(LD_SCHED, "Scheduler asked to release channel %" PRIu64 " "
                         "but it wasn't in channels_pending",
               chan->global_identifier);
    } else {
      smartlist_pqueue_remove(channels_pending,
                              scheduler_compare_channels,
                              offsetof(channel_t, sched_heap_idx),
                              chan);
    }
  }

  if (the_scheduler->on_channel_free) {
    the_scheduler->on_channel_free(chan);
  }
  chan->scheduler_state = SCHED_CHAN_IDLE;
}

/** Mark a channel as ready to accept writes */
void
scheduler_channel_wants_writes(channel_t *chan)
{
  IF_BUG_ONCE(!chan) {
    return;
  }
  IF_BUG_ONCE(!channels_pending) {
    return;
  }

  /* If it's already in waiting_to_write, we can put it in pending */
  if (chan->scheduler_state == SCHED_CHAN_WAITING_TO_WRITE) {
    /*
     * It can write now, so it goes to channels_pending.
     */
    log_debug(LD_SCHED, "chan=%" PRIu64 " became pending",
              chan->global_identifier);
    smartlist_pqueue_add(channels_pending,
                         scheduler_compare_channels,
                         offsetof(channel_t, sched_heap_idx),
                         chan);
    chan->scheduler_state = SCHED_CHAN_PENDING;
    log_debug(LD_SCHED,
              "Channel " U64_FORMAT " at %p went from waiting_to_write "
              "to pending",
              U64_PRINTF_ARG(chan->global_identifier), chan);
    /* We just made a channel pending, we have scheduling work to do. */
    the_scheduler->schedule();
  } else {
    /*
     * It's not in SCHED_CHAN_WAITING_TO_WRITE, so it can't become pending;
     * it's either idle and goes to WAITING_FOR_CELLS, or it's a no-op.
     */
    if (!(chan->scheduler_state == SCHED_CHAN_WAITING_FOR_CELLS ||
          chan->scheduler_state == SCHED_CHAN_PENDING)) {
      chan->scheduler_state = SCHED_CHAN_WAITING_FOR_CELLS;
      log_debug(LD_SCHED,
                "Channel " U64_FORMAT " at %p entered waiting_for_cells",
                U64_PRINTF_ARG(chan->global_identifier), chan);
    }
  }
}

/** Log a warning about the given channel, plus extra scheduler context. This
 * is used by SCHED_BUG() in order to extract as much information as we can
 * when we hit a bug. Channel chan can be NULL. */
void
scheduler_bug_occurred(const channel_t *chan)
{
  char buf[128];

  if (chan != NULL) {
    const size_t outbuf_len =
      buf_datalen(TO_CONN(BASE_CHAN_TO_TLS((channel_t *) chan)->conn)->outbuf);
    tor_snprintf(buf, sizeof(buf),
                 "Channel %" PRIu64 " in state %s and scheduler state %d."
                 " Num cells on cmux: %d. Connection outbuf len: %lu.",
                 chan->global_identifier,
                 channel_state_to_string(chan->state),
                 chan->scheduler_state, circuitmux_num_cells(chan->cmux),
                 (unsigned long)outbuf_len);
  }

  {
    char *msg;
    /* Rate limit every 60 seconds. If we start seeing this every 60 sec, we
     * know something is stuck/wrong. It *should* be loud but not too much. */
    static ratelim_t rlimit = RATELIM_INIT(60);
    if ((msg = rate_limit_log(&rlimit, approx_time()))) {
      log_warn(LD_BUG, "%s Num pending channels: %d. "
               "Channel in pending list: %s.%s",
               (chan != NULL) ? buf : "No channel in bug context.",
               smartlist_len(channels_pending),
               (smartlist_pos(channels_pending, chan) == -1) ? "no" : "yes",
               msg);
      tor_free(msg);
    }
  }
}

#ifdef TOR_UNIT_TESTS

/**
 * Notify scheduler that a channel's queue position may have changed.
 */
void
scheduler_touch_channel(channel_t *chan)
{
  IF_BUG_ONCE(!chan) {
    return;
  }

  if (chan->scheduler_state == SCHED_CHAN_PENDING) {
    /* Remove and re-add it */
    smartlist_pqueue_remove(channels_pending,
                            scheduler_compare_channels,
                            offsetof(channel_t, sched_heap_idx),
                            chan);
    smartlist_pqueue_add(channels_pending,
                         scheduler_compare_channels,
                         offsetof(channel_t, sched_heap_idx),
                         chan);
  }
  /* else no-op, since it isn't in the queue */
}

#endif /* defined(TOR_UNIT_TESTS) */