hibernate.c 34 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017
  1. /* Copyright (c) 2004-2006, Roger Dingledine, Nick Mathewson.
  2. * Copyright (c) 2007-2011, The Tor Project, Inc. */
  3. /* See LICENSE for licensing information */
  4. /**
  5. * \file hibernate.c
  6. * \brief Functions to close listeners, stop allowing new circuits,
  7. * etc in preparation for closing down or going dormant; and to track
  8. * bandwidth and time intervals to know when to hibernate and when to
  9. * stop hibernating.
  10. **/
  11. /*
  12. hibernating, phase 1:
  13. - send destroy in response to create cells
  14. - send end (policy failed) in response to begin cells
  15. - close an OR conn when it has no circuits
  16. hibernating, phase 2:
  17. (entered when bandwidth hard limit reached)
  18. - close all OR/AP/exit conns)
  19. */
  20. #define HIBERNATE_PRIVATE
  21. #include "or.h"
  22. #include "config.h"
  23. #include "connection.h"
  24. #include "connection_edge.h"
  25. #include "hibernate.h"
  26. #include "main.h"
  27. #include "router.h"
  28. extern long stats_n_seconds_working; /* published uptime */
  29. /** Are we currently awake, asleep, running out of bandwidth, or shutting
  30. * down? */
  31. static hibernate_state_t hibernate_state = HIBERNATE_STATE_INITIAL;
  32. /** If are hibernating, when do we plan to wake up? Set to 0 if we
  33. * aren't hibernating. */
  34. static time_t hibernate_end_time = 0;
  35. /** If we are shutting down, when do we plan finally exit? Set to 0 if
  36. * we aren't shutting down. */
  37. static time_t shutdown_time = 0;
  38. /** Possible accounting periods. */
  39. typedef enum {
  40. UNIT_MONTH=1, UNIT_WEEK=2, UNIT_DAY=3,
  41. } time_unit_t;
  42. /* Fields for accounting logic. Accounting overview:
  43. *
  44. * Accounting is designed to ensure that no more than N bytes are sent in
  45. * either direction over a given interval (currently, one month, one week, or
  46. * one day) We could
  47. * try to do this by choking our bandwidth to a trickle, but that
  48. * would make our streams useless. Instead, we estimate what our
  49. * bandwidth usage will be, and guess how long we'll be able to
  50. * provide that much bandwidth before hitting our limit. We then
  51. * choose a random time within the accounting interval to come up (so
  52. * that we don't get 50 Tors running on the 1st of the month and none
  53. * on the 30th).
  54. *
  55. * Each interval runs as follows:
  56. *
  57. * 1. We guess our bandwidth usage, based on how much we used
  58. * last time. We choose a "wakeup time" within the interval to come up.
  59. * 2. Until the chosen wakeup time, we hibernate.
  60. * 3. We come up at the wakeup time, and provide bandwidth until we are
  61. * "very close" to running out.
  62. * 4. Then we go into low-bandwidth mode, and stop accepting new
  63. * connections, but provide bandwidth until we run out.
  64. * 5. Then we hibernate until the end of the interval.
  65. *
  66. * If the interval ends before we run out of bandwidth, we go back to
  67. * step one.
  68. */
  69. /** How many bytes have we read in this accounting interval? */
  70. static uint64_t n_bytes_read_in_interval = 0;
  71. /** How many bytes have we written in this accounting interval? */
  72. static uint64_t n_bytes_written_in_interval = 0;
  73. /** How many seconds have we been running this interval? */
  74. static uint32_t n_seconds_active_in_interval = 0;
  75. /** How many seconds were we active in this interval before we hit our soft
  76. * limit? */
  77. static int n_seconds_to_hit_soft_limit = 0;
  78. /** When in this interval was the soft limit hit. */
  79. static time_t soft_limit_hit_at = 0;
  80. /** How many bytes had we read/written when we hit the soft limit? */
  81. static uint64_t n_bytes_at_soft_limit = 0;
  82. /** When did this accounting interval start? */
  83. static time_t interval_start_time = 0;
  84. /** When will this accounting interval end? */
  85. static time_t interval_end_time = 0;
  86. /** How far into the accounting interval should we hibernate? */
  87. static time_t interval_wakeup_time = 0;
  88. /** How much bandwidth do we 'expect' to use per minute? (0 if we have no
  89. * info from the last period.) */
  90. static uint64_t expected_bandwidth_usage = 0;
  91. /** What unit are we using for our accounting? */
  92. static time_unit_t cfg_unit = UNIT_MONTH;
  93. /** How many days,hours,minutes into each unit does our accounting interval
  94. * start? */
  95. static int cfg_start_day = 0,
  96. cfg_start_hour = 0,
  97. cfg_start_min = 0;
  98. static void reset_accounting(time_t now);
  99. static int read_bandwidth_usage(void);
  100. static time_t start_of_accounting_period_after(time_t now);
  101. static time_t start_of_accounting_period_containing(time_t now);
  102. static void accounting_set_wakeup_time(void);
  103. /* ************
  104. * Functions for bandwidth accounting.
  105. * ************/
  106. /** Configure accounting start/end time settings based on
  107. * options->AccountingStart. Return 0 on success, -1 on failure. If
  108. * <b>validate_only</b> is true, do not change the current settings. */
  109. int
  110. accounting_parse_options(const or_options_t *options, int validate_only)
  111. {
  112. time_unit_t unit;
  113. int ok, idx;
  114. long d,h,m;
  115. smartlist_t *items;
  116. const char *v = options->AccountingStart;
  117. const char *s;
  118. char *cp;
  119. if (!v) {
  120. if (!validate_only) {
  121. cfg_unit = UNIT_MONTH;
  122. cfg_start_day = 1;
  123. cfg_start_hour = 0;
  124. cfg_start_min = 0;
  125. }
  126. return 0;
  127. }
  128. items = smartlist_create();
  129. smartlist_split_string(items, v, NULL,
  130. SPLIT_SKIP_SPACE|SPLIT_IGNORE_BLANK,0);
  131. if (smartlist_len(items)<2) {
  132. log_warn(LD_CONFIG, "Too few arguments to AccountingStart");
  133. goto err;
  134. }
  135. s = smartlist_get(items,0);
  136. if (0==strcasecmp(s, "month")) {
  137. unit = UNIT_MONTH;
  138. } else if (0==strcasecmp(s, "week")) {
  139. unit = UNIT_WEEK;
  140. } else if (0==strcasecmp(s, "day")) {
  141. unit = UNIT_DAY;
  142. } else {
  143. log_warn(LD_CONFIG,
  144. "Unrecognized accounting unit '%s': only 'month', 'week',"
  145. " and 'day' are supported.", s);
  146. goto err;
  147. }
  148. switch (unit) {
  149. case UNIT_WEEK:
  150. d = tor_parse_long(smartlist_get(items,1), 10, 1, 7, &ok, NULL);
  151. if (!ok) {
  152. log_warn(LD_CONFIG, "Weekly accounting must begin on a day between "
  153. "1 (Monday) and 7 (Sunday)");
  154. goto err;
  155. }
  156. break;
  157. case UNIT_MONTH:
  158. d = tor_parse_long(smartlist_get(items,1), 10, 1, 28, &ok, NULL);
  159. if (!ok) {
  160. log_warn(LD_CONFIG, "Monthly accounting must begin on a day between "
  161. "1 and 28");
  162. goto err;
  163. }
  164. break;
  165. case UNIT_DAY:
  166. d = 0;
  167. break;
  168. /* Coverity dislikes unreachable default cases; some compilers warn on
  169. * switch statements missing a case. Tell Coverity not to worry. */
  170. /* coverity[dead_error_begin] */
  171. default:
  172. tor_assert(0);
  173. }
  174. idx = unit==UNIT_DAY?1:2;
  175. if (smartlist_len(items) != (idx+1)) {
  176. log_warn(LD_CONFIG,"Accounting unit '%s' requires %d argument%s.",
  177. s, idx, (idx>1)?"s":"");
  178. goto err;
  179. }
  180. s = smartlist_get(items, idx);
  181. h = tor_parse_long(s, 10, 0, 23, &ok, &cp);
  182. if (!ok) {
  183. log_warn(LD_CONFIG,"Accounting start time not parseable: bad hour.");
  184. goto err;
  185. }
  186. if (!cp || *cp!=':') {
  187. log_warn(LD_CONFIG,
  188. "Accounting start time not parseable: not in HH:MM format");
  189. goto err;
  190. }
  191. m = tor_parse_long(cp+1, 10, 0, 59, &ok, &cp);
  192. if (!ok) {
  193. log_warn(LD_CONFIG, "Accounting start time not parseable: bad minute");
  194. goto err;
  195. }
  196. if (!cp || *cp!='\0') {
  197. log_warn(LD_CONFIG,
  198. "Accounting start time not parseable: not in HH:MM format");
  199. goto err;
  200. }
  201. if (!validate_only) {
  202. cfg_unit = unit;
  203. cfg_start_day = (int)d;
  204. cfg_start_hour = (int)h;
  205. cfg_start_min = (int)m;
  206. }
  207. SMARTLIST_FOREACH(items, char *, item, tor_free(item));
  208. smartlist_free(items);
  209. return 0;
  210. err:
  211. SMARTLIST_FOREACH(items, char *, item, tor_free(item));
  212. smartlist_free(items);
  213. return -1;
  214. }
  215. /** If we want to manage the accounting system and potentially
  216. * hibernate, return 1, else return 0.
  217. */
  218. int
  219. accounting_is_enabled(const or_options_t *options)
  220. {
  221. if (options->AccountingMax)
  222. return 1;
  223. return 0;
  224. }
  225. /** If accounting is enabled, return how long (in seconds) this
  226. * interval lasts. */
  227. int
  228. accounting_get_interval_length(void)
  229. {
  230. return (int)(interval_end_time - interval_start_time);
  231. }
  232. /** Called from main.c to tell us that <b>seconds</b> seconds have
  233. * passed, <b>n_read</b> bytes have been read, and <b>n_written</b>
  234. * bytes have been written. */
  235. void
  236. accounting_add_bytes(size_t n_read, size_t n_written, int seconds)
  237. {
  238. n_bytes_read_in_interval += n_read;
  239. n_bytes_written_in_interval += n_written;
  240. /* If we haven't been called in 10 seconds, we're probably jumping
  241. * around in time. */
  242. n_seconds_active_in_interval += (seconds < 10) ? seconds : 0;
  243. }
  244. /** If get_end, return the end of the accounting period that contains
  245. * the time <b>now</b>. Else, return the start of the accounting
  246. * period that contains the time <b>now</b> */
  247. static time_t
  248. edge_of_accounting_period_containing(time_t now, int get_end)
  249. {
  250. int before;
  251. struct tm tm;
  252. tor_localtime_r(&now, &tm);
  253. /* Set 'before' to true iff the current time is before the hh:mm
  254. * changeover time for today. */
  255. before = tm.tm_hour < cfg_start_hour ||
  256. (tm.tm_hour == cfg_start_hour && tm.tm_min < cfg_start_min);
  257. /* Dispatch by unit. First, find the start day of the given period;
  258. * then, if get_end is true, increment to the end day. */
  259. switch (cfg_unit)
  260. {
  261. case UNIT_MONTH: {
  262. /* If this is before the Nth, we want the Nth of last month. */
  263. if (tm.tm_mday < cfg_start_day ||
  264. (tm.tm_mday < cfg_start_day && before)) {
  265. --tm.tm_mon;
  266. }
  267. /* Otherwise, the month is correct. */
  268. tm.tm_mday = cfg_start_day;
  269. if (get_end)
  270. ++tm.tm_mon;
  271. break;
  272. }
  273. case UNIT_WEEK: {
  274. /* What is the 'target' day of the week in struct tm format? (We
  275. say Sunday==7; struct tm says Sunday==0.) */
  276. int wday = cfg_start_day % 7;
  277. /* How many days do we subtract from today to get to the right day? */
  278. int delta = (7+tm.tm_wday-wday)%7;
  279. /* If we are on the right day, but the changeover hasn't happened yet,
  280. * then subtract a whole week. */
  281. if (delta == 0 && before)
  282. delta = 7;
  283. tm.tm_mday -= delta;
  284. if (get_end)
  285. tm.tm_mday += 7;
  286. break;
  287. }
  288. case UNIT_DAY:
  289. if (before)
  290. --tm.tm_mday;
  291. if (get_end)
  292. ++tm.tm_mday;
  293. break;
  294. default:
  295. tor_assert(0);
  296. }
  297. tm.tm_hour = cfg_start_hour;
  298. tm.tm_min = cfg_start_min;
  299. tm.tm_sec = 0;
  300. tm.tm_isdst = -1; /* Autodetect DST */
  301. return mktime(&tm);
  302. }
  303. /** Return the start of the accounting period containing the time
  304. * <b>now</b>. */
  305. static time_t
  306. start_of_accounting_period_containing(time_t now)
  307. {
  308. return edge_of_accounting_period_containing(now, 0);
  309. }
  310. /** Return the start of the accounting period that comes after the one
  311. * containing the time <b>now</b>. */
  312. static time_t
  313. start_of_accounting_period_after(time_t now)
  314. {
  315. return edge_of_accounting_period_containing(now, 1);
  316. }
  317. /** Return the length of the accounting period containing the time
  318. * <b>now</b>. */
  319. static long
  320. length_of_accounting_period_containing(time_t now)
  321. {
  322. return edge_of_accounting_period_containing(now, 1) -
  323. edge_of_accounting_period_containing(now, 0);
  324. }
  325. /** Initialize the accounting subsystem. */
  326. void
  327. configure_accounting(time_t now)
  328. {
  329. time_t s_now;
  330. /* Try to remember our recorded usage. */
  331. if (!interval_start_time)
  332. read_bandwidth_usage(); /* If we fail, we'll leave values at zero, and
  333. * reset below.*/
  334. s_now = start_of_accounting_period_containing(now);
  335. if (!interval_start_time) {
  336. /* We didn't have recorded usage; Start a new interval. */
  337. log_info(LD_ACCT, "Starting new accounting interval.");
  338. reset_accounting(now);
  339. } else if (s_now == interval_start_time) {
  340. log_info(LD_ACCT, "Continuing accounting interval.");
  341. /* We are in the interval we thought we were in. Do nothing.*/
  342. interval_end_time = start_of_accounting_period_after(interval_start_time);
  343. } else {
  344. long duration =
  345. length_of_accounting_period_containing(interval_start_time);
  346. double delta = ((double)(s_now - interval_start_time)) / duration;
  347. if (-0.50 <= delta && delta <= 0.50) {
  348. /* The start of the period is now a little later or earlier than we
  349. * remembered. That's fine; we might lose some bytes we could otherwise
  350. * have written, but better to err on the side of obeying people's
  351. * accounting settings. */
  352. log_info(LD_ACCT, "Accounting interval moved by %.02f%%; "
  353. "that's fine.", delta*100);
  354. interval_end_time = start_of_accounting_period_after(now);
  355. } else if (delta >= 0.99) {
  356. /* This is the regular time-moved-forward case; don't be too noisy
  357. * about it or people will complain */
  358. log_info(LD_ACCT, "Accounting interval elapsed; starting a new one");
  359. reset_accounting(now);
  360. } else {
  361. log_warn(LD_ACCT,
  362. "Mismatched accounting interval: moved by %.02f%%. "
  363. "Starting a fresh one.", delta*100);
  364. reset_accounting(now);
  365. }
  366. }
  367. accounting_set_wakeup_time();
  368. }
  369. /** Set expected_bandwidth_usage based on how much we sent/received
  370. * per minute last interval (if we were up for at least 30 minutes),
  371. * or based on our declared bandwidth otherwise. */
  372. static void
  373. update_expected_bandwidth(void)
  374. {
  375. uint64_t expected;
  376. const or_options_t *options= get_options();
  377. uint64_t max_configured = (options->RelayBandwidthRate > 0 ?
  378. options->RelayBandwidthRate :
  379. options->BandwidthRate) * 60;
  380. #define MIN_TIME_FOR_MEASUREMENT (1800)
  381. if (soft_limit_hit_at > interval_start_time && n_bytes_at_soft_limit &&
  382. (soft_limit_hit_at - interval_start_time) > MIN_TIME_FOR_MEASUREMENT) {
  383. /* If we hit our soft limit last time, only count the bytes up to that
  384. * time. This is a better predictor of our actual bandwidth than
  385. * considering the entirety of the last interval, since we likely started
  386. * using bytes very slowly once we hit our soft limit. */
  387. expected = n_bytes_at_soft_limit /
  388. (soft_limit_hit_at - interval_start_time);
  389. expected /= 60;
  390. } else if (n_seconds_active_in_interval >= MIN_TIME_FOR_MEASUREMENT) {
  391. /* Otherwise, we either measured enough time in the last interval but
  392. * never hit our soft limit, or we're using a state file from a Tor that
  393. * doesn't know to store soft-limit info. Just take rate at which
  394. * we were reading/writing in the last interval as our expected rate.
  395. */
  396. uint64_t used = MAX(n_bytes_written_in_interval,
  397. n_bytes_read_in_interval);
  398. expected = used / (n_seconds_active_in_interval / 60);
  399. } else {
  400. /* If we haven't gotten enough data last interval, set 'expected'
  401. * to 0. This will set our wakeup to the start of the interval.
  402. * Next interval, we'll choose our starting time based on how much
  403. * we sent this interval.
  404. */
  405. expected = 0;
  406. }
  407. if (expected > max_configured)
  408. expected = max_configured;
  409. expected_bandwidth_usage = expected;
  410. }
  411. /** Called at the start of a new accounting interval: reset our
  412. * expected bandwidth usage based on what happened last time, set up
  413. * the start and end of the interval, and clear byte/time totals.
  414. */
  415. static void
  416. reset_accounting(time_t now)
  417. {
  418. log_info(LD_ACCT, "Starting new accounting interval.");
  419. update_expected_bandwidth();
  420. interval_start_time = start_of_accounting_period_containing(now);
  421. interval_end_time = start_of_accounting_period_after(interval_start_time);
  422. n_bytes_read_in_interval = 0;
  423. n_bytes_written_in_interval = 0;
  424. n_seconds_active_in_interval = 0;
  425. n_bytes_at_soft_limit = 0;
  426. soft_limit_hit_at = 0;
  427. n_seconds_to_hit_soft_limit = 0;
  428. }
  429. /** Return true iff we should save our bandwidth usage to disk. */
  430. static INLINE int
  431. time_to_record_bandwidth_usage(time_t now)
  432. {
  433. /* Note every 600 sec */
  434. #define NOTE_INTERVAL (600)
  435. /* Or every 20 megabytes */
  436. #define NOTE_BYTES 20*(1024*1024)
  437. static uint64_t last_read_bytes_noted = 0;
  438. static uint64_t last_written_bytes_noted = 0;
  439. static time_t last_time_noted = 0;
  440. if (last_time_noted + NOTE_INTERVAL <= now ||
  441. last_read_bytes_noted + NOTE_BYTES <= n_bytes_read_in_interval ||
  442. last_written_bytes_noted + NOTE_BYTES <= n_bytes_written_in_interval ||
  443. (interval_end_time && interval_end_time <= now)) {
  444. last_time_noted = now;
  445. last_read_bytes_noted = n_bytes_read_in_interval;
  446. last_written_bytes_noted = n_bytes_written_in_interval;
  447. return 1;
  448. }
  449. return 0;
  450. }
  451. /** Invoked once per second. Checks whether it is time to hibernate,
  452. * record bandwidth used, etc. */
  453. void
  454. accounting_run_housekeeping(time_t now)
  455. {
  456. if (now >= interval_end_time) {
  457. configure_accounting(now);
  458. }
  459. if (time_to_record_bandwidth_usage(now)) {
  460. if (accounting_record_bandwidth_usage(now, get_or_state())) {
  461. log_warn(LD_FS, "Couldn't record bandwidth usage to disk.");
  462. }
  463. }
  464. }
  465. /** When we have no idea how fast we are, how long do we assume it will take
  466. * us to exhaust our bandwidth? */
  467. #define GUESS_TIME_TO_USE_BANDWIDTH (24*60*60)
  468. /** Based on our interval and our estimated bandwidth, choose a
  469. * deterministic (but random-ish) time to wake up. */
  470. static void
  471. accounting_set_wakeup_time(void)
  472. {
  473. char digest[DIGEST_LEN];
  474. crypto_digest_env_t *d_env;
  475. uint64_t time_to_exhaust_bw;
  476. int time_to_consider;
  477. if (! server_identity_key_is_set()) {
  478. if (init_keys() < 0) {
  479. log_err(LD_BUG, "Error initializing keys");
  480. tor_assert(0);
  481. }
  482. }
  483. if (server_identity_key_is_set()) {
  484. char buf[ISO_TIME_LEN+1];
  485. format_iso_time(buf, interval_start_time);
  486. crypto_pk_get_digest(get_server_identity_key(), digest);
  487. d_env = crypto_new_digest_env();
  488. crypto_digest_add_bytes(d_env, buf, ISO_TIME_LEN);
  489. crypto_digest_add_bytes(d_env, digest, DIGEST_LEN);
  490. crypto_digest_get_digest(d_env, digest, DIGEST_LEN);
  491. crypto_free_digest_env(d_env);
  492. } else {
  493. crypto_rand(digest, DIGEST_LEN);
  494. }
  495. if (!expected_bandwidth_usage) {
  496. char buf1[ISO_TIME_LEN+1];
  497. char buf2[ISO_TIME_LEN+1];
  498. format_local_iso_time(buf1, interval_start_time);
  499. format_local_iso_time(buf2, interval_end_time);
  500. interval_wakeup_time = interval_start_time;
  501. log_notice(LD_ACCT,
  502. "Configured hibernation. This interval begins at %s "
  503. "and ends at %s. We have no prior estimate for bandwidth, so "
  504. "we will start out awake and hibernate when we exhaust our quota.",
  505. buf1, buf2);
  506. return;
  507. }
  508. time_to_exhaust_bw =
  509. (get_options()->AccountingMax/expected_bandwidth_usage)*60;
  510. if (time_to_exhaust_bw > INT_MAX) {
  511. time_to_exhaust_bw = INT_MAX;
  512. time_to_consider = 0;
  513. } else {
  514. time_to_consider = accounting_get_interval_length() -
  515. (int)time_to_exhaust_bw;
  516. }
  517. if (time_to_consider<=0) {
  518. interval_wakeup_time = interval_start_time;
  519. } else {
  520. /* XXX can we simplify this just by picking a random (non-deterministic)
  521. * time to be up? If we go down and come up, then we pick a new one. Is
  522. * that good enough? -RD */
  523. /* This is not a perfectly unbiased conversion, but it is good enough:
  524. * in the worst case, the first half of the day is 0.06 percent likelier
  525. * to be chosen than the last half. */
  526. interval_wakeup_time = interval_start_time +
  527. (get_uint32(digest) % time_to_consider);
  528. }
  529. {
  530. char buf1[ISO_TIME_LEN+1];
  531. char buf2[ISO_TIME_LEN+1];
  532. char buf3[ISO_TIME_LEN+1];
  533. char buf4[ISO_TIME_LEN+1];
  534. time_t down_time;
  535. if (interval_wakeup_time+time_to_exhaust_bw > TIME_MAX)
  536. down_time = TIME_MAX;
  537. else
  538. down_time = (time_t)(interval_wakeup_time+time_to_exhaust_bw);
  539. if (down_time>interval_end_time)
  540. down_time = interval_end_time;
  541. format_local_iso_time(buf1, interval_start_time);
  542. format_local_iso_time(buf2, interval_wakeup_time);
  543. format_local_iso_time(buf3, down_time);
  544. format_local_iso_time(buf4, interval_end_time);
  545. log_notice(LD_ACCT,
  546. "Configured hibernation. This interval began at %s; "
  547. "the scheduled wake-up time %s %s; "
  548. "we expect%s to exhaust our quota for this interval around %s; "
  549. "the next interval begins at %s (all times local)",
  550. buf1,
  551. time(NULL)<interval_wakeup_time?"is":"was", buf2,
  552. time(NULL)<down_time?"":"ed", buf3,
  553. buf4);
  554. }
  555. }
  556. /* This rounds 0 up to 1000, but that's actually a feature. */
  557. #define ROUND_UP(x) (((x) + 0x3ff) & ~0x3ff)
  558. /** Save all our bandwidth tracking information to disk. Return 0 on
  559. * success, -1 on failure. */
  560. int
  561. accounting_record_bandwidth_usage(time_t now, or_state_t *state)
  562. {
  563. /* Just update the state */
  564. state->AccountingIntervalStart = interval_start_time;
  565. state->AccountingBytesReadInInterval = ROUND_UP(n_bytes_read_in_interval);
  566. state->AccountingBytesWrittenInInterval =
  567. ROUND_UP(n_bytes_written_in_interval);
  568. state->AccountingSecondsActive = n_seconds_active_in_interval;
  569. state->AccountingExpectedUsage = expected_bandwidth_usage;
  570. state->AccountingSecondsToReachSoftLimit = n_seconds_to_hit_soft_limit;
  571. state->AccountingSoftLimitHitAt = soft_limit_hit_at;
  572. state->AccountingBytesAtSoftLimit = n_bytes_at_soft_limit;
  573. or_state_mark_dirty(state,
  574. now+(get_options()->AvoidDiskWrites ? 7200 : 60));
  575. return 0;
  576. }
  577. #undef ROUND_UP
  578. /** Read stored accounting information from disk. Return 0 on success;
  579. * return -1 and change nothing on failure. */
  580. static int
  581. read_bandwidth_usage(void)
  582. {
  583. or_state_t *state = get_or_state();
  584. {
  585. char *fname = get_datadir_fname("bw_accounting");
  586. unlink(fname);
  587. tor_free(fname);
  588. }
  589. if (!state)
  590. return -1;
  591. log_info(LD_ACCT, "Reading bandwidth accounting data from state file");
  592. n_bytes_read_in_interval = state->AccountingBytesReadInInterval;
  593. n_bytes_written_in_interval = state->AccountingBytesWrittenInInterval;
  594. n_seconds_active_in_interval = state->AccountingSecondsActive;
  595. interval_start_time = state->AccountingIntervalStart;
  596. expected_bandwidth_usage = state->AccountingExpectedUsage;
  597. /* Older versions of Tor (before 0.2.2.17-alpha or so) didn't generate these
  598. * fields. If you switch back and forth, you might get an
  599. * AccountingSoftLimitHitAt value from long before the most recent
  600. * interval_start_time. If that's so, then ignore the softlimit-related
  601. * values. */
  602. if (state->AccountingSoftLimitHitAt > interval_start_time) {
  603. soft_limit_hit_at = state->AccountingSoftLimitHitAt;
  604. n_bytes_at_soft_limit = state->AccountingBytesAtSoftLimit;
  605. n_seconds_to_hit_soft_limit = state->AccountingSecondsToReachSoftLimit;
  606. } else {
  607. soft_limit_hit_at = 0;
  608. n_bytes_at_soft_limit = 0;
  609. n_seconds_to_hit_soft_limit = 0;
  610. }
  611. {
  612. char tbuf1[ISO_TIME_LEN+1];
  613. char tbuf2[ISO_TIME_LEN+1];
  614. format_iso_time(tbuf1, state->LastWritten);
  615. format_iso_time(tbuf2, state->AccountingIntervalStart);
  616. log_info(LD_ACCT,
  617. "Successfully read bandwidth accounting info from state written at %s "
  618. "for interval starting at %s. We have been active for %lu seconds in "
  619. "this interval. At the start of the interval, we expected to use "
  620. "about %lu KB per second. ("U64_FORMAT" bytes read so far, "
  621. U64_FORMAT" bytes written so far)",
  622. tbuf1, tbuf2,
  623. (unsigned long)n_seconds_active_in_interval,
  624. (unsigned long)(expected_bandwidth_usage*1024/60),
  625. U64_PRINTF_ARG(n_bytes_read_in_interval),
  626. U64_PRINTF_ARG(n_bytes_written_in_interval));
  627. }
  628. return 0;
  629. }
  630. /** Return true iff we have sent/received all the bytes we are willing
  631. * to send/receive this interval. */
  632. static int
  633. hibernate_hard_limit_reached(void)
  634. {
  635. uint64_t hard_limit = get_options()->AccountingMax;
  636. if (!hard_limit)
  637. return 0;
  638. return n_bytes_read_in_interval >= hard_limit
  639. || n_bytes_written_in_interval >= hard_limit;
  640. }
  641. /** Return true iff we have sent/received almost all the bytes we are willing
  642. * to send/receive this interval. */
  643. static int
  644. hibernate_soft_limit_reached(void)
  645. {
  646. const uint64_t acct_max = get_options()->AccountingMax;
  647. #define SOFT_LIM_PCT (.95)
  648. #define SOFT_LIM_BYTES (500*1024*1024)
  649. #define SOFT_LIM_MINUTES (3*60)
  650. /* The 'soft limit' is a fair bit more complicated now than once it was.
  651. * We want to stop accepting connections when ALL of the following are true:
  652. * - We expect to use up the remaining bytes in under 3 hours
  653. * - We have used up 95% of our bytes.
  654. * - We have less than 500MB of bytes left.
  655. */
  656. uint64_t soft_limit = DBL_TO_U64(U64_TO_DBL(acct_max) * SOFT_LIM_PCT);
  657. if (acct_max > SOFT_LIM_BYTES && acct_max - SOFT_LIM_BYTES > soft_limit) {
  658. soft_limit = acct_max - SOFT_LIM_BYTES;
  659. }
  660. if (expected_bandwidth_usage) {
  661. const uint64_t expected_usage =
  662. expected_bandwidth_usage * SOFT_LIM_MINUTES;
  663. if (acct_max > expected_usage && acct_max - expected_usage > soft_limit)
  664. soft_limit = acct_max - expected_usage;
  665. }
  666. if (!soft_limit)
  667. return 0;
  668. return n_bytes_read_in_interval >= soft_limit
  669. || n_bytes_written_in_interval >= soft_limit;
  670. }
  671. /** Called when we get a SIGINT, or when bandwidth soft limit is
  672. * reached. Puts us into "loose hibernation": we don't accept new
  673. * connections, but we continue handling old ones. */
  674. static void
  675. hibernate_begin(hibernate_state_t new_state, time_t now)
  676. {
  677. const or_options_t *options = get_options();
  678. if (new_state == HIBERNATE_STATE_EXITING &&
  679. hibernate_state != HIBERNATE_STATE_LIVE) {
  680. log_notice(LD_GENERAL,"SIGINT received %s; exiting now.",
  681. hibernate_state == HIBERNATE_STATE_EXITING ?
  682. "a second time" : "while hibernating");
  683. tor_cleanup();
  684. exit(0);
  685. }
  686. if (new_state == HIBERNATE_STATE_LOWBANDWIDTH &&
  687. hibernate_state == HIBERNATE_STATE_LIVE) {
  688. soft_limit_hit_at = now;
  689. n_seconds_to_hit_soft_limit = n_seconds_active_in_interval;
  690. n_bytes_at_soft_limit = MAX(n_bytes_read_in_interval,
  691. n_bytes_written_in_interval);
  692. }
  693. /* close listeners. leave control listener(s). */
  694. connection_mark_all_noncontrol_listeners();
  695. /* XXX kill intro point circs */
  696. /* XXX upload rendezvous service descriptors with no intro points */
  697. if (new_state == HIBERNATE_STATE_EXITING) {
  698. log_notice(LD_GENERAL,"Interrupt: we have stopped accepting new "
  699. "connections, and will shut down in %d seconds. Interrupt "
  700. "again to exit now.", options->ShutdownWaitLength);
  701. shutdown_time = time(NULL) + options->ShutdownWaitLength;
  702. } else { /* soft limit reached */
  703. hibernate_end_time = interval_end_time;
  704. }
  705. hibernate_state = new_state;
  706. accounting_record_bandwidth_usage(now, get_or_state());
  707. or_state_mark_dirty(get_or_state(),
  708. get_options()->AvoidDiskWrites ? now+600 : 0);
  709. }
  710. /** Called when we've been hibernating and our timeout is reached. */
  711. static void
  712. hibernate_end(hibernate_state_t new_state)
  713. {
  714. tor_assert(hibernate_state == HIBERNATE_STATE_LOWBANDWIDTH ||
  715. hibernate_state == HIBERNATE_STATE_DORMANT ||
  716. hibernate_state == HIBERNATE_STATE_INITIAL);
  717. /* listeners will be relaunched in run_scheduled_events() in main.c */
  718. if (hibernate_state != HIBERNATE_STATE_INITIAL)
  719. log_notice(LD_ACCT,"Hibernation period ended. Resuming normal activity.");
  720. hibernate_state = new_state;
  721. hibernate_end_time = 0; /* no longer hibernating */
  722. stats_n_seconds_working = 0; /* reset published uptime */
  723. }
  724. /** A wrapper around hibernate_begin, for when we get SIGINT. */
  725. void
  726. hibernate_begin_shutdown(void)
  727. {
  728. hibernate_begin(HIBERNATE_STATE_EXITING, time(NULL));
  729. }
  730. /** Return true iff we are currently hibernating. */
  731. int
  732. we_are_hibernating(void)
  733. {
  734. return hibernate_state != HIBERNATE_STATE_LIVE;
  735. }
  736. /** If we aren't currently dormant, close all connections and become
  737. * dormant. */
  738. static void
  739. hibernate_go_dormant(time_t now)
  740. {
  741. connection_t *conn;
  742. if (hibernate_state == HIBERNATE_STATE_DORMANT)
  743. return;
  744. else if (hibernate_state == HIBERNATE_STATE_LOWBANDWIDTH)
  745. hibernate_state = HIBERNATE_STATE_DORMANT;
  746. else
  747. hibernate_begin(HIBERNATE_STATE_DORMANT, now);
  748. log_notice(LD_ACCT,"Going dormant. Blowing away remaining connections.");
  749. /* Close all OR/AP/exit conns. Leave dir conns because we still want
  750. * to be able to upload server descriptors so people know we're still
  751. * running, and download directories so we can detect if we're obsolete.
  752. * Leave control conns because we still want to be controllable.
  753. */
  754. while ((conn = connection_get_by_type(CONN_TYPE_OR)) ||
  755. (conn = connection_get_by_type(CONN_TYPE_AP)) ||
  756. (conn = connection_get_by_type(CONN_TYPE_EXIT))) {
  757. if (CONN_IS_EDGE(conn))
  758. connection_edge_end(TO_EDGE_CONN(conn), END_STREAM_REASON_HIBERNATING);
  759. log_info(LD_NET,"Closing conn type %d", conn->type);
  760. if (conn->type == CONN_TYPE_AP) /* send socks failure if needed */
  761. connection_mark_unattached_ap(TO_ENTRY_CONN(conn),
  762. END_STREAM_REASON_HIBERNATING);
  763. else
  764. connection_mark_for_close(conn);
  765. }
  766. if (now < interval_wakeup_time)
  767. hibernate_end_time = interval_wakeup_time;
  768. else
  769. hibernate_end_time = interval_end_time;
  770. accounting_record_bandwidth_usage(now, get_or_state());
  771. or_state_mark_dirty(get_or_state(),
  772. get_options()->AvoidDiskWrites ? now+600 : 0);
  773. }
  774. /** Called when hibernate_end_time has arrived. */
  775. static void
  776. hibernate_end_time_elapsed(time_t now)
  777. {
  778. char buf[ISO_TIME_LEN+1];
  779. /* The interval has ended, or it is wakeup time. Find out which. */
  780. accounting_run_housekeeping(now);
  781. if (interval_wakeup_time <= now) {
  782. /* The interval hasn't changed, but interval_wakeup_time has passed.
  783. * It's time to wake up and start being a server. */
  784. hibernate_end(HIBERNATE_STATE_LIVE);
  785. return;
  786. } else {
  787. /* The interval has changed, and it isn't time to wake up yet. */
  788. hibernate_end_time = interval_wakeup_time;
  789. format_iso_time(buf,interval_wakeup_time);
  790. if (hibernate_state != HIBERNATE_STATE_DORMANT) {
  791. /* We weren't sleeping before; we should sleep now. */
  792. log_notice(LD_ACCT,
  793. "Accounting period ended. Commencing hibernation until "
  794. "%s GMT", buf);
  795. hibernate_go_dormant(now);
  796. } else {
  797. log_notice(LD_ACCT,
  798. "Accounting period ended. This period, we will hibernate"
  799. " until %s GMT",buf);
  800. }
  801. }
  802. }
  803. /** Consider our environment and decide if it's time
  804. * to start/stop hibernating.
  805. */
  806. void
  807. consider_hibernation(time_t now)
  808. {
  809. int accounting_enabled = get_options()->AccountingMax != 0;
  810. char buf[ISO_TIME_LEN+1];
  811. /* If we're in 'exiting' mode, then we just shut down after the interval
  812. * elapses. */
  813. if (hibernate_state == HIBERNATE_STATE_EXITING) {
  814. tor_assert(shutdown_time);
  815. if (shutdown_time <= now) {
  816. log_notice(LD_GENERAL, "Clean shutdown finished. Exiting.");
  817. tor_cleanup();
  818. exit(0);
  819. }
  820. return; /* if exiting soon, don't worry about bandwidth limits */
  821. }
  822. if (hibernate_state == HIBERNATE_STATE_DORMANT) {
  823. /* We've been hibernating because of bandwidth accounting. */
  824. tor_assert(hibernate_end_time);
  825. if (hibernate_end_time > now && accounting_enabled) {
  826. /* If we're hibernating, don't wake up until it's time, regardless of
  827. * whether we're in a new interval. */
  828. return ;
  829. } else {
  830. hibernate_end_time_elapsed(now);
  831. }
  832. }
  833. /* Else, we aren't hibernating. See if it's time to start hibernating, or to
  834. * go dormant. */
  835. if (hibernate_state == HIBERNATE_STATE_LIVE ||
  836. hibernate_state == HIBERNATE_STATE_INITIAL) {
  837. if (hibernate_soft_limit_reached()) {
  838. log_notice(LD_ACCT,
  839. "Bandwidth soft limit reached; commencing hibernation. "
  840. "No new connections will be accepted");
  841. hibernate_begin(HIBERNATE_STATE_LOWBANDWIDTH, now);
  842. } else if (accounting_enabled && now < interval_wakeup_time) {
  843. format_local_iso_time(buf,interval_wakeup_time);
  844. log_notice(LD_ACCT,
  845. "Commencing hibernation. We will wake up at %s local time.",
  846. buf);
  847. hibernate_go_dormant(now);
  848. } else if (hibernate_state == HIBERNATE_STATE_INITIAL) {
  849. hibernate_end(HIBERNATE_STATE_LIVE);
  850. }
  851. }
  852. if (hibernate_state == HIBERNATE_STATE_LOWBANDWIDTH) {
  853. if (!accounting_enabled) {
  854. hibernate_end_time_elapsed(now);
  855. } else if (hibernate_hard_limit_reached()) {
  856. hibernate_go_dormant(now);
  857. } else if (hibernate_end_time <= now) {
  858. /* The hibernation period ended while we were still in lowbandwidth.*/
  859. hibernate_end_time_elapsed(now);
  860. }
  861. }
  862. }
  863. /** Helper function: called when we get a GETINFO request for an
  864. * accounting-related key on the control connection <b>conn</b>. If we can
  865. * answer the request for <b>question</b>, then set *<b>answer</b> to a newly
  866. * allocated string holding the result. Otherwise, set *<b>answer</b> to
  867. * NULL. */
  868. int
  869. getinfo_helper_accounting(control_connection_t *conn,
  870. const char *question, char **answer,
  871. const char **errmsg)
  872. {
  873. (void) conn;
  874. (void) errmsg;
  875. if (!strcmp(question, "accounting/enabled")) {
  876. *answer = tor_strdup(accounting_is_enabled(get_options()) ? "1" : "0");
  877. } else if (!strcmp(question, "accounting/hibernating")) {
  878. if (hibernate_state == HIBERNATE_STATE_DORMANT)
  879. *answer = tor_strdup("hard");
  880. else if (hibernate_state == HIBERNATE_STATE_LOWBANDWIDTH)
  881. *answer = tor_strdup("soft");
  882. else
  883. *answer = tor_strdup("awake");
  884. } else if (!strcmp(question, "accounting/bytes")) {
  885. *answer = tor_malloc(32);
  886. tor_snprintf(*answer, 32, U64_FORMAT" "U64_FORMAT,
  887. U64_PRINTF_ARG(n_bytes_read_in_interval),
  888. U64_PRINTF_ARG(n_bytes_written_in_interval));
  889. } else if (!strcmp(question, "accounting/bytes-left")) {
  890. uint64_t limit = get_options()->AccountingMax;
  891. uint64_t read_left = 0, write_left = 0;
  892. if (n_bytes_read_in_interval < limit)
  893. read_left = limit - n_bytes_read_in_interval;
  894. if (n_bytes_written_in_interval < limit)
  895. write_left = limit - n_bytes_written_in_interval;
  896. *answer = tor_malloc(64);
  897. tor_snprintf(*answer, 64, U64_FORMAT" "U64_FORMAT,
  898. U64_PRINTF_ARG(read_left), U64_PRINTF_ARG(write_left));
  899. } else if (!strcmp(question, "accounting/interval-start")) {
  900. *answer = tor_malloc(ISO_TIME_LEN+1);
  901. format_iso_time(*answer, interval_start_time);
  902. } else if (!strcmp(question, "accounting/interval-wake")) {
  903. *answer = tor_malloc(ISO_TIME_LEN+1);
  904. format_iso_time(*answer, interval_wakeup_time);
  905. } else if (!strcmp(question, "accounting/interval-end")) {
  906. *answer = tor_malloc(ISO_TIME_LEN+1);
  907. format_iso_time(*answer, interval_end_time);
  908. } else {
  909. *answer = NULL;
  910. }
  911. return 0;
  912. }
  913. /**
  914. * Manually change the hibernation state. Private; used only by the unit
  915. * tests.
  916. */
  917. void
  918. hibernate_set_state_for_testing_(hibernate_state_t newstate)
  919. {
  920. hibernate_state = newstate;
  921. }