routerset.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415
  /* Copyright (c) 2001 Matej Pfajfar.
   * Copyright (c) 2001-2004, Roger Dingledine.
   * Copyright (c) 2004-2006, Roger Dingledine, Nick Mathewson.
   * Copyright (c) 2007-2015, The Tor Project, Inc. */
  /* See LICENSE for licensing information */
  6. #define ROUTERSET_PRIVATE
  7. #include "or.h"
  8. #include "geoip.h"
  9. #include "nodelist.h"
  10. #include "policies.h"
  11. #include "router.h"
  12. #include "routerparse.h"
  13. #include "routerset.h"
  14. /** Return a new empty routerset. */
  15. routerset_t *
  16. routerset_new(void)
  17. {
  18. routerset_t *result = tor_malloc_zero(sizeof(routerset_t));
  19. result->list = smartlist_new();
  20. result->names = strmap_new();
  21. result->digests = digestmap_new();
  22. result->policies = smartlist_new();
  23. result->country_names = smartlist_new();
  24. return result;
  25. }
  26. /** If <b>c</b> is a country code in the form {cc}, return a newly allocated
  27. * string holding the "cc" part. Else, return NULL. */
  28. STATIC char *
  29. routerset_get_countryname(const char *c)
  30. {
  31. char *country;
  32. if (strlen(c) < 4 || c[0] !='{' || c[3] !='}')
  33. return NULL;
  34. country = tor_strndup(c+1, 2);
  35. tor_strlower(country);
  36. return country;
  37. }
  38. /** Update the routerset's <b>countries</b> bitarray_t. Called whenever
  39. * the GeoIP IPv4 database is reloaded.
  40. */
  41. void
  42. routerset_refresh_countries(routerset_t *target)
  43. {
  44. int cc;
  45. bitarray_free(target->countries);
  46. if (!geoip_is_loaded(AF_INET)) {
  47. target->countries = NULL;
  48. target->n_countries = 0;
  49. return;
  50. }
  51. target->n_countries = geoip_get_n_countries();
  52. target->countries = bitarray_init_zero(target->n_countries);
  53. SMARTLIST_FOREACH_BEGIN(target->country_names, const char *, country) {
  54. cc = geoip_get_country(country);
  55. if (cc >= 0) {
  56. tor_assert(cc < target->n_countries);
  57. bitarray_set(target->countries, cc);
  58. } else {
  59. log_warn(LD_CONFIG, "Country code '%s' is not recognized.",
  60. country);
  61. }
  62. } SMARTLIST_FOREACH_END(country);
  63. }
  64. /** Parse the string <b>s</b> to create a set of routerset entries, and add
  65. * them to <b>target</b>. In log messages, refer to the string as
  66. * <b>description</b>. Return 0 on success, -1 on failure.
  67. *
  68. * Three kinds of elements are allowed in routersets: nicknames, IP address
  69. * patterns, and fingerprints. They may be surrounded by optional space, and
  70. * must be separated by commas.
  71. */
  72. int
  73. routerset_parse(routerset_t *target, const char *s, const char *description)
  74. {
  75. int r = 0;
  76. int added_countries = 0;
  77. char *countryname;
  78. smartlist_t *list = smartlist_new();
  79. smartlist_split_string(list, s, ",",
  80. SPLIT_SKIP_SPACE | SPLIT_IGNORE_BLANK, 0);
  81. SMARTLIST_FOREACH_BEGIN(list, char *, nick) {
  82. addr_policy_t *p;
  83. if (is_legal_hexdigest(nick)) {
  84. char d[DIGEST_LEN];
  85. if (*nick == '$')
  86. ++nick;
  87. log_debug(LD_CONFIG, "Adding identity %s to %s", nick, description);
  88. base16_decode(d, sizeof(d), nick, HEX_DIGEST_LEN);
  89. digestmap_set(target->digests, d, (void*)1);
  90. } else if (is_legal_nickname(nick)) {
  91. log_debug(LD_CONFIG, "Adding nickname %s to %s", nick, description);
  92. strmap_set_lc(target->names, nick, (void*)1);
  93. } else if ((countryname = routerset_get_countryname(nick)) != NULL) {
  94. log_debug(LD_CONFIG, "Adding country %s to %s", nick,
  95. description);
  96. smartlist_add(target->country_names, countryname);
  97. added_countries = 1;
  98. } else if ((strchr(nick,'.') || strchr(nick, ':') || strchr(nick, '*'))
  99. && (p = router_parse_addr_policy_item_from_string(
  100. nick, ADDR_POLICY_REJECT))) {
  101. /* IPv4 addresses contain '.', IPv6 addresses contain ':',
  102. * and wildcard addresses contain '*'. */
  103. log_debug(LD_CONFIG, "Adding address %s to %s", nick, description);
  104. smartlist_add(target->policies, p);
  105. } else {
  106. log_warn(LD_CONFIG, "Entry '%s' in %s is malformed.", nick,
  107. description);
  108. r = -1;
  109. tor_free(nick);
  110. SMARTLIST_DEL_CURRENT(list, nick);
  111. }
  112. } SMARTLIST_FOREACH_END(nick);
  113. policy_expand_unspec(&target->policies);
  114. smartlist_add_all(target->list, list);
  115. smartlist_free(list);
  116. if (added_countries)
  117. routerset_refresh_countries(target);
  118. return r;
  119. }
  120. /** Add all members of the set <b>source</b> to <b>target</b>. */
  121. void
  122. routerset_union(routerset_t *target, const routerset_t *source)
  123. {
  124. char *s;
  125. tor_assert(target);
  126. if (!source || !source->list)
  127. return;
  128. s = routerset_to_string(source);
  129. routerset_parse(target, s, "other routerset");
  130. tor_free(s);
  131. }
  132. /** Return true iff <b>set</b> lists only nicknames and digests, and includes
  133. * no IP ranges or countries. */
  134. int
  135. routerset_is_list(const routerset_t *set)
  136. {
  137. return smartlist_len(set->country_names) == 0 &&
  138. smartlist_len(set->policies) == 0;
  139. }
  140. /** Return true iff we need a GeoIP IP-to-country database to make sense of
  141. * <b>set</b>. */
  142. int
  143. routerset_needs_geoip(const routerset_t *set)
  144. {
  145. return set && smartlist_len(set->country_names);
  146. }
  147. /** Return true iff there are no entries in <b>set</b>. */
  148. int
  149. routerset_is_empty(const routerset_t *set)
  150. {
  151. return !set || smartlist_len(set->list) == 0;
  152. }
  153. /** Return the number of entries in <b>set</b>. This does NOT return a
  154. * negative value. */
  155. int
  156. routerset_len(const routerset_t *set)
  157. {
  158. if (!set) {
  159. return 0;
  160. }
  161. return smartlist_len(set->list);
  162. }
  163. /** Helper. Return true iff <b>set</b> contains a router based on the other
  164. * provided fields. Return higher values for more specific subentries: a
  165. * single router is more specific than an address range of routers, which is
  166. * more specific in turn than a country code.
  167. *
  168. * (If country is -1, then we take the country
  169. * from addr.) */
  170. STATIC int
  171. routerset_contains(const routerset_t *set, const tor_addr_t *addr,
  172. uint16_t orport,
  173. const char *nickname, const char *id_digest,
  174. country_t country)
  175. {
  176. if (!set || !set->list)
  177. return 0;
  178. if (nickname && strmap_get_lc(set->names, nickname))
  179. return 4;
  180. if (id_digest && digestmap_get(set->digests, id_digest))
  181. return 4;
  182. if (addr && compare_tor_addr_to_addr_policy(addr, orport, set->policies)
  183. == ADDR_POLICY_REJECTED)
  184. return 3;
  185. if (set->countries) {
  186. if (country < 0 && addr)
  187. country = geoip_get_country_by_addr(addr);
  188. if (country >= 0 && country < set->n_countries &&
  189. bitarray_is_set(set->countries, country))
  190. return 2;
  191. }
  192. return 0;
  193. }
  194. /** If *<b>setp</b> includes at least one country code, or if
  195. * <b>only_some_cc_set</b> is 0, add the ?? and A1 country codes to
  196. * *<b>setp</b>, creating it as needed. Return true iff *<b>setp</b> changed.
  197. */
  198. int
  199. routerset_add_unknown_ccs(routerset_t **setp, int only_if_some_cc_set)
  200. {
  201. routerset_t *set;
  202. int add_unknown, add_a1;
  203. if (only_if_some_cc_set) {
  204. if (!*setp || smartlist_len((*setp)->country_names) == 0)
  205. return 0;
  206. }
  207. if (!*setp)
  208. *setp = routerset_new();
  209. set = *setp;
  210. add_unknown = ! smartlist_contains_string_case(set->country_names, "??") &&
  211. geoip_get_country("??") >= 0;
  212. add_a1 = ! smartlist_contains_string_case(set->country_names, "a1") &&
  213. geoip_get_country("A1") >= 0;
  214. if (add_unknown) {
  215. smartlist_add(set->country_names, tor_strdup("??"));
  216. smartlist_add(set->list, tor_strdup("{??}"));
  217. }
  218. if (add_a1) {
  219. smartlist_add(set->country_names, tor_strdup("a1"));
  220. smartlist_add(set->list, tor_strdup("{a1}"));
  221. }
  222. if (add_unknown || add_a1) {
  223. routerset_refresh_countries(set);
  224. return 1;
  225. }
  226. return 0;
  227. }
  228. /** Return true iff we can tell that <b>ei</b> is a member of <b>set</b>. */
  229. int
  230. routerset_contains_extendinfo(const routerset_t *set, const extend_info_t *ei)
  231. {
  232. return routerset_contains(set,
  233. &ei->addr,
  234. ei->port,
  235. ei->nickname,
  236. ei->identity_digest,
  237. -1 /*country*/);
  238. }
  239. /** Return true iff <b>ri</b> is in <b>set</b>. If country is <b>-1</b>, we
  240. * look up the country. */
  241. int
  242. routerset_contains_router(const routerset_t *set, const routerinfo_t *ri,
  243. country_t country)
  244. {
  245. tor_addr_t addr;
  246. tor_addr_from_ipv4h(&addr, ri->addr);
  247. return routerset_contains(set,
  248. &addr,
  249. ri->or_port,
  250. ri->nickname,
  251. ri->cache_info.identity_digest,
  252. country);
  253. }
  254. /** Return true iff <b>rs</b> is in <b>set</b>. If country is <b>-1</b>, we
  255. * look up the country. */
  256. int
  257. routerset_contains_routerstatus(const routerset_t *set,
  258. const routerstatus_t *rs,
  259. country_t country)
  260. {
  261. tor_addr_t addr;
  262. tor_addr_from_ipv4h(&addr, rs->addr);
  263. return routerset_contains(set,
  264. &addr,
  265. rs->or_port,
  266. rs->nickname,
  267. rs->identity_digest,
  268. country);
  269. }
  270. /** Return true iff <b>node</b> is in <b>set</b>. */
  271. int
  272. routerset_contains_node(const routerset_t *set, const node_t *node)
  273. {
  274. if (node->rs)
  275. return routerset_contains_routerstatus(set, node->rs, node->country);
  276. else if (node->ri)
  277. return routerset_contains_router(set, node->ri, node->country);
  278. else
  279. return 0;
  280. }
  281. /** Add every known node_t that is a member of <b>routerset</b> to
  282. * <b>out</b>, but never add any that are part of <b>excludeset</b>.
  283. * If <b>running_only</b>, only add the running ones. */
  284. void
  285. routerset_get_all_nodes(smartlist_t *out, const routerset_t *routerset,
  286. const routerset_t *excludeset, int running_only)
  287. {
  288. tor_assert(out);
  289. if (!routerset || !routerset->list)
  290. return;
  291. if (routerset_is_list(routerset)) {
  292. /* No routers are specified by type; all are given by name or digest.
  293. * we can do a lookup in O(len(routerset)). */
  294. SMARTLIST_FOREACH(routerset->list, const char *, name, {
  295. const node_t *node = node_get_by_nickname(name, 1);
  296. if (node) {
  297. if (!running_only || node->is_running)
  298. if (!routerset_contains_node(excludeset, node))
  299. smartlist_add(out, (void*)node);
  300. }
  301. });
  302. } else {
  303. /* We need to iterate over the routerlist to get all the ones of the
  304. * right kind. */
  305. smartlist_t *nodes = nodelist_get_list();
  306. SMARTLIST_FOREACH(nodes, const node_t *, node, {
  307. if (running_only && !node->is_running)
  308. continue;
  309. if (routerset_contains_node(routerset, node) &&
  310. !routerset_contains_node(excludeset, node))
  311. smartlist_add(out, (void*)node);
  312. });
  313. }
  314. }
  315. /** Remove every node_t from <b>lst</b> that is in <b>routerset</b>. */
  316. void
  317. routerset_subtract_nodes(smartlist_t *lst, const routerset_t *routerset)
  318. {
  319. tor_assert(lst);
  320. if (!routerset)
  321. return;
  322. SMARTLIST_FOREACH(lst, const node_t *, node, {
  323. if (routerset_contains_node(routerset, node)) {
  324. //log_debug(LD_DIR, "Subtracting %s",r->nickname);
  325. SMARTLIST_DEL_CURRENT(lst, node);
  326. }
  327. });
  328. }
  329. /** Return a new string that when parsed by routerset_parse_string() will
  330. * yield <b>set</b>. */
  331. char *
  332. routerset_to_string(const routerset_t *set)
  333. {
  334. if (!set || !set->list)
  335. return tor_strdup("");
  336. return smartlist_join_strings(set->list, ",", 0, NULL);
  337. }
  338. /** Helper: return true iff old and new are both NULL, or both non-NULL
  339. * equal routersets. */
  340. int
  341. routerset_equal(const routerset_t *old, const routerset_t *new)
  342. {
  343. if (routerset_is_empty(old) && routerset_is_empty(new)) {
  344. /* Two empty sets are equal */
  345. return 1;
  346. } else if (routerset_is_empty(old) || routerset_is_empty(new)) {
  347. /* An empty set is equal to nothing else. */
  348. return 0;
  349. }
  350. tor_assert(old != NULL);
  351. tor_assert(new != NULL);
  352. if (smartlist_len(old->list) != smartlist_len(new->list))
  353. return 0;
  354. SMARTLIST_FOREACH(old->list, const char *, cp1, {
  355. const char *cp2 = smartlist_get(new->list, cp1_sl_idx);
  356. if (strcmp(cp1, cp2))
  357. return 0;
  358. });
  359. return 1;
  360. }
  361. /** Free all storage held in <b>routerset</b>. */
  362. void
  363. routerset_free(routerset_t *routerset)
  364. {
  365. if (!routerset)
  366. return;
  367. SMARTLIST_FOREACH(routerset->list, char *, cp, tor_free(cp));
  368. smartlist_free(routerset->list);
  369. SMARTLIST_FOREACH(routerset->policies, addr_policy_t *, p,
  370. addr_policy_free(p));
  371. smartlist_free(routerset->policies);
  372. SMARTLIST_FOREACH(routerset->country_names, char *, cp, tor_free(cp));
  373. smartlist_free(routerset->country_names);
  374. strmap_free(routerset->names, NULL);
  375. digestmap_free(routerset->digests, NULL);
  376. bitarray_free(routerset->countries);
  377. tor_free(routerset);
  378. }