util.c 73 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817
  1. /* Copyright (c) 2003, Roger Dingledine
  2. * Copyright (c) 2004-2006, Roger Dingledine, Nick Mathewson.
  3. * Copyright (c) 2007-2011, The Tor Project, Inc. */
  4. /* See LICENSE for licensing information */
  5. /**
  6. * \file util.c
  7. * \brief Common functions for strings, IO, network, data structures,
  8. * process control.
  9. **/
  10. /* This is required on rh7 to make strptime not complain.
  11. */
  12. #define _GNU_SOURCE
  13. #include "orconfig.h"
  14. #include "util.h"
  15. #include "torlog.h"
  16. #undef log
  17. #include "crypto.h"
  18. #include "torint.h"
  19. #include "container.h"
  20. #include "address.h"
  21. #ifdef MS_WINDOWS
  22. #include <io.h>
  23. #include <direct.h>
  24. #include <process.h>
  25. #include <tchar.h>
  26. #else
  27. #include <dirent.h>
  28. #include <pwd.h>
  29. #endif
  30. /* math.h needs this on Linux */
  31. #ifndef __USE_ISOC99
  32. #define __USE_ISOC99 1
  33. #endif
  34. #include <math.h>
  35. #include <stdlib.h>
  36. #include <stdio.h>
  37. #include <string.h>
  38. #include <assert.h>
  39. #ifdef HAVE_NETINET_IN_H
  40. #include <netinet/in.h>
  41. #endif
  42. #ifdef HAVE_ARPA_INET_H
  43. #include <arpa/inet.h>
  44. #endif
  45. #ifdef HAVE_ERRNO_H
  46. #include <errno.h>
  47. #endif
  48. #ifdef HAVE_SYS_SOCKET_H
  49. #include <sys/socket.h>
  50. #endif
  51. #ifdef HAVE_SYS_TIME_H
  52. #include <sys/time.h>
  53. #endif
  54. #ifdef HAVE_UNISTD_H
  55. #include <unistd.h>
  56. #endif
  57. #ifdef HAVE_SYS_STAT_H
  58. #include <sys/stat.h>
  59. #endif
  60. #ifdef HAVE_SYS_FCNTL_H
  61. #include <sys/fcntl.h>
  62. #endif
  63. #ifdef HAVE_FCNTL_H
  64. #include <fcntl.h>
  65. #endif
  66. #ifdef HAVE_TIME_H
  67. #include <time.h>
  68. #endif
  69. #ifdef HAVE_MALLOC_MALLOC_H
  70. #include <malloc/malloc.h>
  71. #endif
  72. #ifdef HAVE_MALLOC_H
  73. #ifndef OPENBSD
  74. /* OpenBSD has a malloc.h, but for our purposes, it only exists in order to
  75. * scold us for being so stupid as to autodetect its presence. To be fair,
  76. * they've done this since 1996, when autoconf was only 5 years old. */
  77. #include <malloc.h>
  78. #endif
  79. #endif
  80. #ifdef HAVE_MALLOC_NP_H
  81. #include <malloc_np.h>
  82. #endif
  83. /* =====
  84. * Memory management
  85. * ===== */
/* Build-time selection of the dmalloc debugging allocator.  When USE_DMALLOC
 * is defined, the allocation wrappers in this file forward two extra
 * arguments named "file" and "line" to the dmalloc entry points. */
#ifdef USE_DMALLOC
#undef strndup
#include <dmalloc.h>
/* Expands to the extra ", file, line" arguments so that one wrapper can pass
 * its dmalloc arguments on to another wrapper. */
#define DMALLOC_FN_ARGS , file, line
#if defined(HAVE_DMALLOC_STRDUP)
/* dmalloc already provides dmalloc_strdup(); use it as defined. */
#elif defined(HAVE_DMALLOC_STRNDUP)
/* No dmalloc_strdup(): emulate it by calling dmalloc_strndup() with a
 * length argument of -1. */
#define dmalloc_strdup(file, line, string, xalloc_b) \
dmalloc_strndup(file, line, (string), -1, xalloc_b)
#else
#error "No dmalloc_strdup or equivalent"
#endif
#else /* not using dmalloc: there are no extra arguments to forward */
#define DMALLOC_FN_ARGS
#endif
  102. /** Allocate a chunk of <b>size</b> bytes of memory, and return a pointer to
  103. * result. On error, log and terminate the process. (Same as malloc(size),
  104. * but never returns NULL.)
  105. *
  106. * <b>file</b> and <b>line</b> are used if dmalloc is enabled, and
  107. * ignored otherwise.
  108. */
  109. void *
  110. _tor_malloc(size_t size DMALLOC_PARAMS)
  111. {
  112. void *result;
  113. tor_assert(size < SIZE_T_CEILING);
  114. #ifndef MALLOC_ZERO_WORKS
  115. /* Some libc mallocs don't work when size==0. Override them. */
  116. if (size==0) {
  117. size=1;
  118. }
  119. #endif
  120. #ifdef USE_DMALLOC
  121. result = dmalloc_malloc(file, line, size, DMALLOC_FUNC_MALLOC, 0, 0);
  122. #else
  123. result = malloc(size);
  124. #endif
  125. if (PREDICT_UNLIKELY(result == NULL)) {
  126. log_err(LD_MM,"Out of memory on malloc(). Dying.");
  127. /* If these functions die within a worker process, they won't call
  128. * spawn_exit, but that's ok, since the parent will run out of memory soon
  129. * anyway. */
  130. exit(1);
  131. }
  132. return result;
  133. }
  134. /** Allocate a chunk of <b>size</b> bytes of memory, fill the memory with
  135. * zero bytes, and return a pointer to the result. Log and terminate
  136. * the process on error. (Same as calloc(size,1), but never returns NULL.)
  137. */
  138. void *
  139. _tor_malloc_zero(size_t size DMALLOC_PARAMS)
  140. {
  141. /* You may ask yourself, "wouldn't it be smart to use calloc instead of
  142. * malloc+memset? Perhaps libc's calloc knows some nifty optimization trick
  143. * we don't!" Indeed it does, but its optimizations are only a big win when
  144. * we're allocating something very big (it knows if it just got the memory
  145. * from the OS in a pre-zeroed state). We don't want to use tor_malloc_zero
  146. * for big stuff, so we don't bother with calloc. */
  147. void *result = _tor_malloc(size DMALLOC_FN_ARGS);
  148. memset(result, 0, size);
  149. return result;
  150. }
  151. /** Change the size of the memory block pointed to by <b>ptr</b> to <b>size</b>
  152. * bytes long; return the new memory block. On error, log and
  153. * terminate. (Like realloc(ptr,size), but never returns NULL.)
  154. */
  155. void *
  156. _tor_realloc(void *ptr, size_t size DMALLOC_PARAMS)
  157. {
  158. void *result;
  159. tor_assert(size < SIZE_T_CEILING);
  160. #ifdef USE_DMALLOC
  161. result = dmalloc_realloc(file, line, ptr, size, DMALLOC_FUNC_REALLOC, 0);
  162. #else
  163. result = realloc(ptr, size);
  164. #endif
  165. if (PREDICT_UNLIKELY(result == NULL)) {
  166. log_err(LD_MM,"Out of memory on realloc(). Dying.");
  167. exit(1);
  168. }
  169. return result;
  170. }
  171. /** Return a newly allocated copy of the NUL-terminated string s. On
  172. * error, log and terminate. (Like strdup(s), but never returns
  173. * NULL.)
  174. */
  175. char *
  176. _tor_strdup(const char *s DMALLOC_PARAMS)
  177. {
  178. char *dup;
  179. tor_assert(s);
  180. #ifdef USE_DMALLOC
  181. dup = dmalloc_strdup(file, line, s, 0);
  182. #else
  183. dup = strdup(s);
  184. #endif
  185. if (PREDICT_UNLIKELY(dup == NULL)) {
  186. log_err(LD_MM,"Out of memory on strdup(). Dying.");
  187. exit(1);
  188. }
  189. return dup;
  190. }
  191. /** Allocate and return a new string containing the first <b>n</b>
  192. * characters of <b>s</b>. If <b>s</b> is longer than <b>n</b>
  193. * characters, only the first <b>n</b> are copied. The result is
  194. * always NUL-terminated. (Like strndup(s,n), but never returns
  195. * NULL.)
  196. */
  197. char *
  198. _tor_strndup(const char *s, size_t n DMALLOC_PARAMS)
  199. {
  200. char *dup;
  201. tor_assert(s);
  202. tor_assert(n < SIZE_T_CEILING);
  203. dup = _tor_malloc((n+1) DMALLOC_FN_ARGS);
  204. /* Performance note: Ordinarily we prefer strlcpy to strncpy. But
  205. * this function gets called a whole lot, and platform strncpy is
  206. * much faster than strlcpy when strlen(s) is much longer than n.
  207. */
  208. strncpy(dup, s, n);
  209. dup[n]='\0';
  210. return dup;
  211. }
  212. /** Allocate a chunk of <b>len</b> bytes, with the same contents as the
  213. * <b>len</b> bytes starting at <b>mem</b>. */
  214. void *
  215. _tor_memdup(const void *mem, size_t len DMALLOC_PARAMS)
  216. {
  217. char *dup;
  218. tor_assert(len < SIZE_T_CEILING);
  219. tor_assert(mem);
  220. dup = _tor_malloc(len DMALLOC_FN_ARGS);
  221. memcpy(dup, mem, len);
  222. return dup;
  223. }
/** Function-call form of tor_free(), for callers that need a function
 * pointer with the signature of free().  Simply applies tor_free() to
 * <b>mem</b>.
 *
 * NOTE(review): tor_free is not defined in this file (presumably a macro
 * from util.h); any effect it has on its argument beyond freeing it only
 * touches this function's local copy of <b>mem</b>. */
void
_tor_free(void *mem)
{
tor_free(mem);
}
#if defined(HAVE_MALLOC_GOOD_SIZE) && !defined(HAVE_MALLOC_GOOD_SIZE_PROTOTYPE)
/* Some versions of Mac OS X have malloc_good_size() in their libc, but do
 * not declare it in malloc/malloc.h.  When the build configuration reports
 * that the function exists without a prototype, declare it ourselves.
 */
extern size_t malloc_good_size(size_t size);
#endif
/** Allocate and return a chunk of memory of size at least *<b>sizep</b>,
 * using the same resources we would use to malloc *<b>sizep</b>.  Set
 * *<b>sizep</b> to the number of usable bytes in the chunk of memory.
 *
 * When HAVE_MALLOC_GOOD_SIZE is defined, *<b>sizep</b> is first replaced by
 * malloc_good_size(*sizep) and that many bytes are allocated.  Otherwise
 * exactly *<b>sizep</b> bytes are requested and *<b>sizep</b> is left
 * unchanged.  Allocation goes through _tor_malloc().
 */
void *
_tor_malloc_roundup(size_t *sizep DMALLOC_PARAMS)
{
#ifdef HAVE_MALLOC_GOOD_SIZE
tor_assert(*sizep < SIZE_T_CEILING);
*sizep = malloc_good_size(*sizep);
return _tor_malloc(*sizep DMALLOC_FN_ARGS);
#elif 0 && defined(HAVE_MALLOC_USABLE_SIZE) && !defined(USE_DMALLOC)
/* This branch is deliberately disabled by the "0 &&" above.
 * Never use malloc_usable_size(); it makes valgrind really unhappy,
 * and doesn't win much in terms of usable space where it exists. */
void *result;
tor_assert(*sizep < SIZE_T_CEILING);
result = _tor_malloc(*sizep DMALLOC_FN_ARGS);
*sizep = malloc_usable_size(result);
return result;
#else
/* No size-rounding facility: plain allocation, *sizep untouched. */
return _tor_malloc(*sizep DMALLOC_FN_ARGS);
#endif
}
  260. /** Call the platform malloc info function, and dump the results to the log at
  261. * level <b>severity</b>. If no such function exists, do nothing. */
  262. void
  263. tor_log_mallinfo(int severity)
  264. {
  265. #ifdef HAVE_MALLINFO
  266. struct mallinfo mi;
  267. memset(&mi, 0, sizeof(mi));
  268. mi = mallinfo();
  269. tor_log(severity, LD_MM,
  270. "mallinfo() said: arena=%d, ordblks=%d, smblks=%d, hblks=%d, "
  271. "hblkhd=%d, usmblks=%d, fsmblks=%d, uordblks=%d, fordblks=%d, "
  272. "keepcost=%d",
  273. mi.arena, mi.ordblks, mi.smblks, mi.hblks,
  274. mi.hblkhd, mi.usmblks, mi.fsmblks, mi.uordblks, mi.fordblks,
  275. mi.keepcost);
  276. #else
  277. (void)severity;
  278. #endif
  279. #ifdef USE_DMALLOC
  280. dmalloc_log_changed(0, /* Since the program started. */
  281. 1, /* Log info about non-freed pointers. */
  282. 0, /* Do not log info about freed pointers. */
  283. 0 /* Do not log individual pointers. */
  284. );
  285. #endif
  286. }
  287. /* =====
  288. * Math
  289. * ===== */
/**
 * Return the natural (base-e) logarithm of <b>d</b>, as computed by the
 * math library's log().  We define this wrapper here so that callers do
 * not conflict with Tor's log() macro, which this file undefines before
 * including math.h.
 */
double
tor_mathlog(double d)
{
return log(d);
}
/** Return the long integer closest to <b>d</b>, as computed by lround().
 * We define this wrapper here so that not all users of math.h need to use
 * the right incantations to get the C99 functions. */
long
tor_lround(double d)
{
return lround(d);
}
  307. /** Returns floor(log2(u64)). If u64 is 0, (incorrectly) returns 0. */
  308. int
  309. tor_log2(uint64_t u64)
  310. {
  311. int r = 0;
  312. if (u64 >= (U64_LITERAL(1)<<32)) {
  313. u64 >>= 32;
  314. r = 32;
  315. }
  316. if (u64 >= (U64_LITERAL(1)<<16)) {
  317. u64 >>= 16;
  318. r += 16;
  319. }
  320. if (u64 >= (U64_LITERAL(1)<<8)) {
  321. u64 >>= 8;
  322. r += 8;
  323. }
  324. if (u64 >= (U64_LITERAL(1)<<4)) {
  325. u64 >>= 4;
  326. r += 4;
  327. }
  328. if (u64 >= (U64_LITERAL(1)<<2)) {
  329. u64 >>= 2;
  330. r += 2;
  331. }
  332. if (u64 >= (U64_LITERAL(1)<<1)) {
  333. u64 >>= 1;
  334. r += 1;
  335. }
  336. return r;
  337. }
  338. /** Return the power of 2 closest to <b>u64</b>. */
  339. uint64_t
  340. round_to_power_of_2(uint64_t u64)
  341. {
  342. int lg2 = tor_log2(u64);
  343. uint64_t low = U64_LITERAL(1) << lg2, high = U64_LITERAL(1) << (lg2+1);
  344. if (high - u64 < u64 - low)
  345. return high;
  346. else
  347. return low;
  348. }
  349. /** Return the lowest x such that x is at least <b>number</b>, and x modulo
  350. * <b>divisor</b> == 0. */
  351. unsigned
  352. round_to_next_multiple_of(unsigned number, unsigned divisor)
  353. {
  354. number += divisor - 1;
  355. number -= number % divisor;
  356. return number;
  357. }
  358. /** Return the lowest x such that x is at least <b>number</b>, and x modulo
  359. * <b>divisor</b> == 0. */
  360. uint32_t
  361. round_uint32_to_next_multiple_of(uint32_t number, uint32_t divisor)
  362. {
  363. number += divisor - 1;
  364. number -= number % divisor;
  365. return number;
  366. }
  367. /** Return the lowest x such that x is at least <b>number</b>, and x modulo
  368. * <b>divisor</b> == 0. */
  369. uint64_t
  370. round_uint64_to_next_multiple_of(uint64_t number, uint64_t divisor)
  371. {
  372. number += divisor - 1;
  373. number -= number % divisor;
  374. return number;
  375. }
  376. /* =====
  377. * String manipulation
  378. * ===== */
  379. /** Remove from the string <b>s</b> every character which appears in
  380. * <b>strip</b>. */
  381. void
  382. tor_strstrip(char *s, const char *strip)
  383. {
  384. char *read = s;
  385. while (*read) {
  386. if (strchr(strip, *read)) {
  387. ++read;
  388. } else {
  389. *s++ = *read++;
  390. }
  391. }
  392. *s = '\0';
  393. }
  394. /** Return a pointer to a NUL-terminated hexadecimal string encoding
  395. * the first <b>fromlen</b> bytes of <b>from</b>. (fromlen must be \<= 32.) The
  396. * result does not need to be deallocated, but repeated calls to
  397. * hex_str will trash old results.
  398. */
  399. const char *
  400. hex_str(const char *from, size_t fromlen)
  401. {
  402. static char buf[65];
  403. if (fromlen>(sizeof(buf)-1)/2)
  404. fromlen = (sizeof(buf)-1)/2;
  405. base16_encode(buf,sizeof(buf),from,fromlen);
  406. return buf;
  407. }
  408. /** Convert all alphabetic characters in the nul-terminated string <b>s</b> to
  409. * lowercase. */
  410. void
  411. tor_strlower(char *s)
  412. {
  413. while (*s) {
  414. *s = TOR_TOLOWER(*s);
  415. ++s;
  416. }
  417. }
  418. /** Convert all alphabetic characters in the nul-terminated string <b>s</b> to
  419. * lowercase. */
  420. void
  421. tor_strupper(char *s)
  422. {
  423. while (*s) {
  424. *s = TOR_TOUPPER(*s);
  425. ++s;
  426. }
  427. }
  428. /** Return 1 if every character in <b>s</b> is printable, else return 0.
  429. */
  430. int
  431. tor_strisprint(const char *s)
  432. {
  433. while (*s) {
  434. if (!TOR_ISPRINT(*s))
  435. return 0;
  436. s++;
  437. }
  438. return 1;
  439. }
  440. /** Return 1 if no character in <b>s</b> is uppercase, else return 0.
  441. */
  442. int
  443. tor_strisnonupper(const char *s)
  444. {
  445. while (*s) {
  446. if (TOR_ISUPPER(*s))
  447. return 0;
  448. s++;
  449. }
  450. return 1;
  451. }
  452. /** Compares the first strlen(s2) characters of s1 with s2. Returns as for
  453. * strcmp.
  454. */
  455. int
  456. strcmpstart(const char *s1, const char *s2)
  457. {
  458. size_t n = strlen(s2);
  459. return strncmp(s1, s2, n);
  460. }
  461. /** Compare the s1_len-byte string <b>s1</b> with <b>s2</b>,
  462. * without depending on a terminating nul in s1. Sorting order is first by
  463. * length, then lexically; return values are as for strcmp.
  464. */
  465. int
  466. strcmp_len(const char *s1, const char *s2, size_t s1_len)
  467. {
  468. size_t s2_len = strlen(s2);
  469. if (s1_len < s2_len)
  470. return -1;
  471. if (s1_len > s2_len)
  472. return 1;
  473. return fast_memcmp(s1, s2, s2_len);
  474. }
  475. /** Compares the first strlen(s2) characters of s1 with s2. Returns as for
  476. * strcasecmp.
  477. */
  478. int
  479. strcasecmpstart(const char *s1, const char *s2)
  480. {
  481. size_t n = strlen(s2);
  482. return strncasecmp(s1, s2, n);
  483. }
  484. /** Compares the last strlen(s2) characters of s1 with s2. Returns as for
  485. * strcmp.
  486. */
  487. int
  488. strcmpend(const char *s1, const char *s2)
  489. {
  490. size_t n1 = strlen(s1), n2 = strlen(s2);
  491. if (n2>n1)
  492. return strcmp(s1,s2);
  493. else
  494. return strncmp(s1+(n1-n2), s2, n2);
  495. }
  496. /** Compares the last strlen(s2) characters of s1 with s2. Returns as for
  497. * strcasecmp.
  498. */
  499. int
  500. strcasecmpend(const char *s1, const char *s2)
  501. {
  502. size_t n1 = strlen(s1), n2 = strlen(s2);
  503. if (n2>n1) /* then they can't be the same; figure out which is bigger */
  504. return strcasecmp(s1,s2);
  505. else
  506. return strncasecmp(s1+(n1-n2), s2, n2);
  507. }
  508. /** Compare the value of the string <b>prefix</b> with the start of the
  509. * <b>memlen</b>-byte memory chunk at <b>mem</b>. Return as for strcmp.
  510. *
  511. * [As fast_memcmp(mem, prefix, strlen(prefix)) but returns -1 if memlen is
  512. * less than strlen(prefix).]
  513. */
  514. int
  515. fast_memcmpstart(const void *mem, size_t memlen,
  516. const char *prefix)
  517. {
  518. size_t plen = strlen(prefix);
  519. if (memlen < plen)
  520. return -1;
  521. return fast_memcmp(mem, prefix, plen);
  522. }
  523. /** Return a pointer to the first char of s that is not whitespace and
  524. * not a comment, or to the terminating NUL if no such character exists.
  525. */
  526. const char *
  527. eat_whitespace(const char *s)
  528. {
  529. tor_assert(s);
  530. while (1) {
  531. switch (*s) {
  532. case '\0':
  533. default:
  534. return s;
  535. case ' ':
  536. case '\t':
  537. case '\n':
  538. case '\r':
  539. ++s;
  540. break;
  541. case '#':
  542. ++s;
  543. while (*s && *s != '\n')
  544. ++s;
  545. }
  546. }
  547. }
  548. /** Return a pointer to the first char of s that is not whitespace and
  549. * not a comment, or to the terminating NUL if no such character exists.
  550. */
  551. const char *
  552. eat_whitespace_eos(const char *s, const char *eos)
  553. {
  554. tor_assert(s);
  555. tor_assert(eos && s <= eos);
  556. while (s < eos) {
  557. switch (*s) {
  558. case '\0':
  559. default:
  560. return s;
  561. case ' ':
  562. case '\t':
  563. case '\n':
  564. case '\r':
  565. ++s;
  566. break;
  567. case '#':
  568. ++s;
  569. while (s < eos && *s && *s != '\n')
  570. ++s;
  571. }
  572. }
  573. return s;
  574. }
  575. /** Return a pointer to the first char of s that is not a space or a tab
  576. * or a \\r, or to the terminating NUL if no such character exists. */
  577. const char *
  578. eat_whitespace_no_nl(const char *s)
  579. {
  580. while (*s == ' ' || *s == '\t' || *s == '\r')
  581. ++s;
  582. return s;
  583. }
  584. /** As eat_whitespace_no_nl, but stop at <b>eos</b> whether we have
  585. * found a non-whitespace character or not. */
  586. const char *
  587. eat_whitespace_eos_no_nl(const char *s, const char *eos)
  588. {
  589. while (s < eos && (*s == ' ' || *s == '\t' || *s == '\r'))
  590. ++s;
  591. return s;
  592. }
  593. /** Return a pointer to the first char of s that is whitespace or <b>#</b>,
  594. * or to the terminating NUL if no such character exists.
  595. */
  596. const char *
  597. find_whitespace(const char *s)
  598. {
  599. /* tor_assert(s); */
  600. while (1) {
  601. switch (*s)
  602. {
  603. case '\0':
  604. case '#':
  605. case ' ':
  606. case '\r':
  607. case '\n':
  608. case '\t':
  609. return s;
  610. default:
  611. ++s;
  612. }
  613. }
  614. }
  615. /** As find_whitespace, but stop at <b>eos</b> whether we have found a
  616. * whitespace or not. */
  617. const char *
  618. find_whitespace_eos(const char *s, const char *eos)
  619. {
  620. /* tor_assert(s); */
  621. while (s < eos) {
  622. switch (*s)
  623. {
  624. case '\0':
  625. case '#':
  626. case ' ':
  627. case '\r':
  628. case '\n':
  629. case '\t':
  630. return s;
  631. default:
  632. ++s;
  633. }
  634. }
  635. return s;
  636. }
  637. /** Return the first occurrence of <b>needle</b> in <b>haystack</b> that
  638. * occurs at the start of a line (that is, at the beginning of <b>haystack</b>
  639. * or immediately after a newline). Return NULL if no such string is found.
  640. */
  641. const char *
  642. find_str_at_start_of_line(const char *haystack, const char *needle)
  643. {
  644. size_t needle_len = strlen(needle);
  645. do {
  646. if (!strncmp(haystack, needle, needle_len))
  647. return haystack;
  648. haystack = strchr(haystack, '\n');
  649. if (!haystack)
  650. return NULL;
  651. else
  652. ++haystack;
  653. } while (*haystack);
  654. return NULL;
  655. }
  656. /** Return true iff the 'len' bytes at 'mem' are all zero. */
  657. int
  658. tor_mem_is_zero(const char *mem, size_t len)
  659. {
  660. static const char ZERO[] = {
  661. 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
  662. };
  663. while (len >= sizeof(ZERO)) {
  664. /* It's safe to use fast_memcmp here, since the very worst thing an
  665. * attacker could learn is how many initial bytes of a secret were zero */
  666. if (fast_memcmp(mem, ZERO, sizeof(ZERO)))
  667. return 0;
  668. len -= sizeof(ZERO);
  669. mem += sizeof(ZERO);
  670. }
  671. /* Deal with leftover bytes. */
  672. if (len)
  673. return fast_memeq(mem, ZERO, len);
  674. return 1;
  675. }
/** Return true iff the DIGEST_LEN bytes in <b>digest</b> are all zero.
 *
 * The comparison against a static all-zero buffer is done with
 * tor_memeq().  NOTE(review): the zero buffer below holds 20 bytes, so
 * this relies on DIGEST_LEN (defined elsewhere) being at most 20 --
 * confirm. */
int
tor_digest_is_zero(const char *digest)
{
static const uint8_t ZERO_DIGEST[] = {
0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0
};
return tor_memeq(digest, ZERO_DIGEST, DIGEST_LEN);
}
/** Return true iff the DIGEST256_LEN bytes in <b>digest</b> are all zero.
 * Implemented as a call to tor_mem_is_zero(). */
int
tor_digest256_is_zero(const char *digest)
{
return tor_mem_is_zero(digest, DIGEST256_LEN);
}
/* Helper: common code to check whether the result of a strtol or strtoul or
 * strtoll is correct.
 *
 * This macro is meant to be the final statement of a parsing function.  It
 * expects these names to be in scope: <b>s</b> (the input string),
 * <b>endptr</b> (as set by the strtoX call), <b>r</b> (the converted value),
 * <b>min</b> and <b>max</b> (the accepted range), and the optional output
 * pointers <b>ok</b> and <b>next</b>.
 *
 * On success it sets *ok to 1 and *next to endptr (when provided) and
 * returns r.  On failure it jumps to the label "err", which it defines
 * itself, sets *ok to 0 and *next to endptr (when provided), and returns 0.
 *
 * Note that the macro only inspects endptr and the range; it does not look
 * at errno, so it cannot by itself detect an overflow reported by the
 * conversion function. */
#define CHECK_STRTOX_RESULT() \
/* Was at least one character converted? */ \
if (endptr == s) \
goto err; \
/* Were there unexpected unconverted characters? */ \
if (!next && *endptr) \
goto err; \
/* Is r within limits? */ \
if (r < min || r > max) \
goto err; \
if (ok) *ok = 1; \
if (next) *next = endptr; \
return r; \
err: \
if (ok) *ok = 0; \
if (next) *next = endptr; \
return 0
  710. /** Extract a long from the start of s, in the given numeric base. If
  711. * there is unconverted data and next is provided, set *next to the
  712. * first unconverted character. An error has occurred if no characters
  713. * are converted; or if there are unconverted characters and next is NULL; or
  714. * if the parsed value is not between min and max. When no error occurs,
  715. * return the parsed value and set *ok (if provided) to 1. When an error
  716. * occurs, return 0 and set *ok (if provided) to 0.
  717. */
  718. long
  719. tor_parse_long(const char *s, int base, long min, long max,
  720. int *ok, char **next)
  721. {
  722. char *endptr;
  723. long r;
  724. r = strtol(s, &endptr, base);
  725. CHECK_STRTOX_RESULT();
  726. }
  727. /** As tor_parse_long(), but return an unsigned long. */
  728. unsigned long
  729. tor_parse_ulong(const char *s, int base, unsigned long min,
  730. unsigned long max, int *ok, char **next)
  731. {
  732. char *endptr;
  733. unsigned long r;
  734. r = strtoul(s, &endptr, base);
  735. CHECK_STRTOX_RESULT();
  736. }
  737. /** As tor_parse_long(), but return a double. */
  738. double
  739. tor_parse_double(const char *s, double min, double max, int *ok, char **next)
  740. {
  741. char *endptr;
  742. double r;
  743. r = strtod(s, &endptr);
  744. CHECK_STRTOX_RESULT();
  745. }
  746. /** As tor_parse_long, but return a uint64_t. Only base 10 is guaranteed to
  747. * work for now. */
  748. uint64_t
  749. tor_parse_uint64(const char *s, int base, uint64_t min,
  750. uint64_t max, int *ok, char **next)
  751. {
  752. char *endptr;
  753. uint64_t r;
  754. #ifdef HAVE_STRTOULL
  755. r = (uint64_t)strtoull(s, &endptr, base);
  756. #elif defined(MS_WINDOWS)
  757. #if defined(_MSC_VER) && _MSC_VER < 1300
  758. tor_assert(base <= 10);
  759. r = (uint64_t)_atoi64(s);
  760. endptr = (char*)s;
  761. while (TOR_ISSPACE(*endptr)) endptr++;
  762. while (TOR_ISDIGIT(*endptr)) endptr++;
  763. #else
  764. r = (uint64_t)_strtoui64(s, &endptr, base);
  765. #endif
  766. #elif SIZEOF_LONG == 8
  767. r = (uint64_t)strtoul(s, &endptr, base);
  768. #else
  769. #error "I don't know how to parse 64-bit numbers."
  770. #endif
  771. CHECK_STRTOX_RESULT();
  772. }
  773. /** Encode the <b>srclen</b> bytes at <b>src</b> in a NUL-terminated,
  774. * uppercase hexadecimal string; store it in the <b>destlen</b>-byte buffer
  775. * <b>dest</b>.
  776. */
  777. void
  778. base16_encode(char *dest, size_t destlen, const char *src, size_t srclen)
  779. {
  780. const char *end;
  781. char *cp;
  782. tor_assert(destlen >= srclen*2+1);
  783. tor_assert(destlen < SIZE_T_CEILING);
  784. cp = dest;
  785. end = src+srclen;
  786. while (src<end) {
  787. *cp++ = "0123456789ABCDEF"[ (*(const uint8_t*)src) >> 4 ];
  788. *cp++ = "0123456789ABCDEF"[ (*(const uint8_t*)src) & 0xf ];
  789. ++src;
  790. }
  791. *cp = '\0';
  792. }
  793. /** Helper: given a hex digit, return its value, or -1 if it isn't hex. */
  794. static INLINE int
  795. _hex_decode_digit(char c)
  796. {
  797. switch (c) {
  798. case '0': return 0;
  799. case '1': return 1;
  800. case '2': return 2;
  801. case '3': return 3;
  802. case '4': return 4;
  803. case '5': return 5;
  804. case '6': return 6;
  805. case '7': return 7;
  806. case '8': return 8;
  807. case '9': return 9;
  808. case 'A': case 'a': return 10;
  809. case 'B': case 'b': return 11;
  810. case 'C': case 'c': return 12;
  811. case 'D': case 'd': return 13;
  812. case 'E': case 'e': return 14;
  813. case 'F': case 'f': return 15;
  814. default:
  815. return -1;
  816. }
  817. }
  818. /** Helper: given a hex digit, return its value, or -1 if it isn't hex. */
  819. int
  820. hex_decode_digit(char c)
  821. {
  822. return _hex_decode_digit(c);
  823. }
  824. /** Given a hexadecimal string of <b>srclen</b> bytes in <b>src</b>, decode it
  825. * and store the result in the <b>destlen</b>-byte buffer at <b>dest</b>.
  826. * Return 0 on success, -1 on failure. */
  827. int
  828. base16_decode(char *dest, size_t destlen, const char *src, size_t srclen)
  829. {
  830. const char *end;
  831. int v1,v2;
  832. if ((srclen % 2) != 0)
  833. return -1;
  834. if (destlen < srclen/2 || destlen > SIZE_T_CEILING)
  835. return -1;
  836. end = src+srclen;
  837. while (src<end) {
  838. v1 = _hex_decode_digit(*src);
  839. v2 = _hex_decode_digit(*(src+1));
  840. if (v1<0||v2<0)
  841. return -1;
  842. *(uint8_t*)dest = (v1<<4)|v2;
  843. ++dest;
  844. src+=2;
  845. }
  846. return 0;
  847. }
  848. /** Allocate and return a new string representing the contents of <b>s</b>,
  849. * surrounded by quotes and using standard C escapes.
  850. *
  851. * Generally, we use this for logging values that come in over the network to
  852. * keep them from tricking users, and for sending certain values to the
  853. * controller.
  854. *
  855. * We trust values from the resolver, OS, configuration file, and command line
  856. * to not be maliciously ill-formed. We validate incoming routerdescs and
  857. * SOCKS requests and addresses from BEGIN cells as they're parsed;
  858. * afterwards, we trust them as non-malicious.
  859. */
  860. char *
  861. esc_for_log(const char *s)
  862. {
  863. const char *cp;
  864. char *result, *outp;
  865. size_t len = 3;
  866. if (!s) {
  867. return tor_strdup("");
  868. }
  869. for (cp = s; *cp; ++cp) {
  870. switch (*cp) {
  871. case '\\':
  872. case '\"':
  873. case '\'':
  874. case '\r':
  875. case '\n':
  876. case '\t':
  877. len += 2;
  878. break;
  879. default:
  880. if (TOR_ISPRINT(*cp) && ((uint8_t)*cp)<127)
  881. ++len;
  882. else
  883. len += 4;
  884. break;
  885. }
  886. }
  887. result = outp = tor_malloc(len);
  888. *outp++ = '\"';
  889. for (cp = s; *cp; ++cp) {
  890. switch (*cp) {
  891. case '\\':
  892. case '\"':
  893. case '\'':
  894. *outp++ = '\\';
  895. *outp++ = *cp;
  896. break;
  897. case '\n':
  898. *outp++ = '\\';
  899. *outp++ = 'n';
  900. break;
  901. case '\t':
  902. *outp++ = '\\';
  903. *outp++ = 't';
  904. break;
  905. case '\r':
  906. *outp++ = '\\';
  907. *outp++ = 'r';
  908. break;
  909. default:
  910. if (TOR_ISPRINT(*cp) && ((uint8_t)*cp)<127) {
  911. *outp++ = *cp;
  912. } else {
  913. tor_snprintf(outp, 5, "\\%03o", (int)(uint8_t) *cp);
  914. outp += 4;
  915. }
  916. break;
  917. }
  918. }
  919. *outp++ = '\"';
  920. *outp++ = 0;
  921. return result;
  922. }
  923. /** Allocate and return a new string representing the contents of <b>s</b>,
  924. * surrounded by quotes and using standard C escapes.
  925. *
  926. * THIS FUNCTION IS NOT REENTRANT. Don't call it from outside the main
  927. * thread. Also, each call invalidates the last-returned value, so don't
  928. * try log_warn(LD_GENERAL, "%s %s", escaped(a), escaped(b));
  929. */
  930. const char *
  931. escaped(const char *s)
  932. {
  933. static char *_escaped_val = NULL;
  934. tor_free(_escaped_val);
  935. if (s)
  936. _escaped_val = esc_for_log(s);
  937. else
  938. _escaped_val = NULL;
  939. return _escaped_val;
  940. }
  941. /** Rudimentary string wrapping code: given a un-wrapped <b>string</b> (no
  942. * newlines!), break the string into newline-terminated lines of no more than
  943. * <b>width</b> characters long (not counting newline) and insert them into
  944. * <b>out</b> in order. Precede the first line with prefix0, and subsequent
  945. * lines with prefixRest.
  946. */
  947. /* This uses a stupid greedy wrapping algorithm right now:
  948. * - For each line:
  949. * - Try to fit as much stuff as possible, but break on a space.
  950. * - If the first "word" of the line will extend beyond the allowable
  951. * width, break the word at the end of the width.
  952. */
  953. void
  954. wrap_string(smartlist_t *out, const char *string, size_t width,
  955. const char *prefix0, const char *prefixRest)
  956. {
  957. size_t p0Len, pRestLen, pCurLen;
  958. const char *eos, *prefixCur;
  959. tor_assert(out);
  960. tor_assert(string);
  961. tor_assert(width);
  962. if (!prefix0)
  963. prefix0 = "";
  964. if (!prefixRest)
  965. prefixRest = "";
  966. p0Len = strlen(prefix0);
  967. pRestLen = strlen(prefixRest);
  968. tor_assert(width > p0Len && width > pRestLen);
  969. eos = strchr(string, '\0');
  970. tor_assert(eos);
  971. pCurLen = p0Len;
  972. prefixCur = prefix0;
  973. while ((eos-string)+pCurLen > width) {
  974. const char *eol = string + width - pCurLen;
  975. while (eol > string && *eol != ' ')
  976. --eol;
  977. /* eol is now the last space that can fit, or the start of the string. */
  978. if (eol > string) {
  979. size_t line_len = (eol-string) + pCurLen + 2;
  980. char *line = tor_malloc(line_len);
  981. memcpy(line, prefixCur, pCurLen);
  982. memcpy(line+pCurLen, string, eol-string);
  983. line[line_len-2] = '\n';
  984. line[line_len-1] = '\0';
  985. smartlist_add(out, line);
  986. string = eol + 1;
  987. } else {
  988. size_t line_len = width + 2;
  989. char *line = tor_malloc(line_len);
  990. memcpy(line, prefixCur, pCurLen);
  991. memcpy(line+pCurLen, string, width - pCurLen);
  992. line[line_len-2] = '\n';
  993. line[line_len-1] = '\0';
  994. smartlist_add(out, line);
  995. string += width-pCurLen;
  996. }
  997. prefixCur = prefixRest;
  998. pCurLen = pRestLen;
  999. }
  1000. if (string < eos) {
  1001. size_t line_len = (eos-string) + pCurLen + 2;
  1002. char *line = tor_malloc(line_len);
  1003. memcpy(line, prefixCur, pCurLen);
  1004. memcpy(line+pCurLen, string, eos-string);
  1005. line[line_len-2] = '\n';
  1006. line[line_len-1] = '\0';
  1007. smartlist_add(out, line);
  1008. }
  1009. }
  1010. /* =====
  1011. * Time
  1012. * ===== */
  1013. /**
  1014. * Converts struct timeval to a double value.
  1015. * Preserves microsecond precision, but just barely.
  1016. * Error is approx +/- 0.1 usec when dealing with epoch values.
  1017. */
  1018. double
  1019. tv_to_double(const struct timeval *tv)
  1020. {
  1021. double conv = tv->tv_sec;
  1022. conv += tv->tv_usec/1000000.0;
  1023. return conv;
  1024. }
  1025. /**
  1026. * Converts timeval to milliseconds.
  1027. */
  1028. int64_t
  1029. tv_to_msec(const struct timeval *tv)
  1030. {
  1031. int64_t conv = ((int64_t)tv->tv_sec)*1000L;
  1032. /* Round ghetto-style */
  1033. conv += ((int64_t)tv->tv_usec+500)/1000L;
  1034. return conv;
  1035. }
  1036. /**
  1037. * Converts timeval to microseconds.
  1038. */
  1039. int64_t
  1040. tv_to_usec(const struct timeval *tv)
  1041. {
  1042. int64_t conv = ((int64_t)tv->tv_sec)*1000000L;
  1043. conv += tv->tv_usec;
  1044. return conv;
  1045. }
  1046. /** Return the number of microseconds elapsed between *start and *end.
  1047. */
  1048. long
  1049. tv_udiff(const struct timeval *start, const struct timeval *end)
  1050. {
  1051. long udiff;
  1052. long secdiff = end->tv_sec - start->tv_sec;
  1053. if (labs(secdiff+1) > LONG_MAX/1000000) {
  1054. log_warn(LD_GENERAL, "comparing times on microsecond detail too far "
  1055. "apart: %ld seconds", secdiff);
  1056. return LONG_MAX;
  1057. }
  1058. udiff = secdiff*1000000L + (end->tv_usec - start->tv_usec);
  1059. return udiff;
  1060. }
  1061. /** Return the number of milliseconds elapsed between *start and *end.
  1062. */
  1063. long
  1064. tv_mdiff(const struct timeval *start, const struct timeval *end)
  1065. {
  1066. long mdiff;
  1067. long secdiff = end->tv_sec - start->tv_sec;
  1068. if (labs(secdiff+1) > LONG_MAX/1000) {
  1069. log_warn(LD_GENERAL, "comparing times on millisecond detail too far "
  1070. "apart: %ld seconds", secdiff);
  1071. return LONG_MAX;
  1072. }
  1073. /* Subtract and round */
  1074. mdiff = secdiff*1000L +
  1075. ((long)end->tv_usec - (long)start->tv_usec + 500L) / 1000L;
  1076. return mdiff;
  1077. }
  1078. /** Yield true iff <b>y</b> is a leap-year. */
  1079. #define IS_LEAPYEAR(y) (!(y % 4) && ((y % 100) || !(y % 400)))
  1080. /** Helper: Return the number of leap-days between Jan 1, y1 and Jan 1, y2. */
  1081. static int
  1082. n_leapdays(int y1, int y2)
  1083. {
  1084. --y1;
  1085. --y2;
  1086. return (y2/4 - y1/4) - (y2/100 - y1/100) + (y2/400 - y1/400);
  1087. }
  1088. /** Number of days per month in non-leap year; used by tor_timegm. */
  1089. static const int days_per_month[] =
  1090. { 31, 28, 31, 30, 31, 30, 31, 31, 30, 31, 30, 31};
  1091. /** Return a time_t given a struct tm. The result is given in GMT, and
  1092. * does not account for leap seconds.
  1093. */
  1094. time_t
  1095. tor_timegm(struct tm *tm)
  1096. {
  1097. /* This is a pretty ironclad timegm implementation, snarfed from Python2.2.
  1098. * It's way more brute-force than fiddling with tzset().
  1099. */
  1100. time_t year, days, hours, minutes, seconds;
  1101. int i;
  1102. year = tm->tm_year + 1900;
  1103. if (year < 1970 || tm->tm_mon < 0 || tm->tm_mon > 11) {
  1104. log_warn(LD_BUG, "Out-of-range argument to tor_timegm");
  1105. return -1;
  1106. }
  1107. tor_assert(year < INT_MAX);
  1108. days = 365 * (year-1970) + n_leapdays(1970,(int)year);
  1109. for (i = 0; i < tm->tm_mon; ++i)
  1110. days += days_per_month[i];
  1111. if (tm->tm_mon > 1 && IS_LEAPYEAR(year))
  1112. ++days;
  1113. days += tm->tm_mday - 1;
  1114. hours = days*24 + tm->tm_hour;
  1115. minutes = hours*60 + tm->tm_min;
  1116. seconds = minutes*60 + tm->tm_sec;
  1117. return seconds;
  1118. }
  1119. /* strftime is locale-specific, so we need to replace those parts */
  1120. /** A c-locale array of 3-letter names of weekdays, starting with Sun. */
  1121. static const char *WEEKDAY_NAMES[] =
  1122. { "Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat" };
  1123. /** A c-locale array of 3-letter names of months, starting with Jan. */
  1124. static const char *MONTH_NAMES[] =
  1125. { "Jan", "Feb", "Mar", "Apr", "May", "Jun",
  1126. "Jul", "Aug", "Sep", "Oct", "Nov", "Dec" };
  1127. /** Set <b>buf</b> to the RFC1123 encoding of the GMT value of <b>t</b>.
  1128. * The buffer must be at least RFC1123_TIME_LEN+1 bytes long.
  1129. *
  1130. * (RFC1123 format is Fri, 29 Sep 2006 15:54:20 GMT)
  1131. */
  1132. void
  1133. format_rfc1123_time(char *buf, time_t t)
  1134. {
  1135. struct tm tm;
  1136. tor_gmtime_r(&t, &tm);
  1137. strftime(buf, RFC1123_TIME_LEN+1, "___, %d ___ %Y %H:%M:%S GMT", &tm);
  1138. tor_assert(tm.tm_wday >= 0);
  1139. tor_assert(tm.tm_wday <= 6);
  1140. memcpy(buf, WEEKDAY_NAMES[tm.tm_wday], 3);
  1141. tor_assert(tm.tm_wday >= 0);
  1142. tor_assert(tm.tm_mon <= 11);
  1143. memcpy(buf+8, MONTH_NAMES[tm.tm_mon], 3);
  1144. }
  1145. /** Parse the RFC1123 encoding of some time (in GMT) from <b>buf</b>,
  1146. * and store the result in *<b>t</b>.
  1147. *
  1148. * Return 0 on success, -1 on failure.
  1149. */
  1150. int
  1151. parse_rfc1123_time(const char *buf, time_t *t)
  1152. {
  1153. struct tm tm;
  1154. char month[4];
  1155. char weekday[4];
  1156. int i, m;
  1157. unsigned tm_mday, tm_year, tm_hour, tm_min, tm_sec;
  1158. if (strlen(buf) != RFC1123_TIME_LEN)
  1159. return -1;
  1160. memset(&tm, 0, sizeof(tm));
  1161. if (tor_sscanf(buf, "%3s, %2u %3s %u %2u:%2u:%2u GMT", weekday,
  1162. &tm_mday, month, &tm_year, &tm_hour,
  1163. &tm_min, &tm_sec) < 7) {
  1164. char *esc = esc_for_log(buf);
  1165. log_warn(LD_GENERAL, "Got invalid RFC1123 time %s", esc);
  1166. tor_free(esc);
  1167. return -1;
  1168. }
  1169. if (tm_mday > 31 || tm_hour > 23 || tm_min > 59 || tm_sec > 61) {
  1170. char *esc = esc_for_log(buf);
  1171. log_warn(LD_GENERAL, "Got invalid RFC1123 time %s", esc);
  1172. tor_free(esc);
  1173. return -1;
  1174. }
  1175. tm.tm_mday = (int)tm_mday;
  1176. tm.tm_year = (int)tm_year;
  1177. tm.tm_hour = (int)tm_hour;
  1178. tm.tm_min = (int)tm_min;
  1179. tm.tm_sec = (int)tm_sec;
  1180. m = -1;
  1181. for (i = 0; i < 12; ++i) {
  1182. if (!strcmp(month, MONTH_NAMES[i])) {
  1183. m = i;
  1184. break;
  1185. }
  1186. }
  1187. if (m<0) {
  1188. char *esc = esc_for_log(buf);
  1189. log_warn(LD_GENERAL, "Got invalid RFC1123 time %s: No such month", esc);
  1190. tor_free(esc);
  1191. return -1;
  1192. }
  1193. tm.tm_mon = m;
  1194. if (tm.tm_year < 1970) {
  1195. char *esc = esc_for_log(buf);
  1196. log_warn(LD_GENERAL,
  1197. "Got invalid RFC1123 time %s. (Before 1970)", esc);
  1198. tor_free(esc);
  1199. return -1;
  1200. }
  1201. tm.tm_year -= 1900;
  1202. *t = tor_timegm(&tm);
  1203. return 0;
  1204. }
  1205. /** Set <b>buf</b> to the ISO8601 encoding of the local value of <b>t</b>.
  1206. * The buffer must be at least ISO_TIME_LEN+1 bytes long.
  1207. *
  1208. * (ISO8601 format is 2006-10-29 10:57:20)
  1209. */
  1210. void
  1211. format_local_iso_time(char *buf, time_t t)
  1212. {
  1213. struct tm tm;
  1214. strftime(buf, ISO_TIME_LEN+1, "%Y-%m-%d %H:%M:%S", tor_localtime_r(&t, &tm));
  1215. }
  1216. /** Set <b>buf</b> to the ISO8601 encoding of the GMT value of <b>t</b>.
  1217. * The buffer must be at least ISO_TIME_LEN+1 bytes long.
  1218. */
  1219. void
  1220. format_iso_time(char *buf, time_t t)
  1221. {
  1222. struct tm tm;
  1223. strftime(buf, ISO_TIME_LEN+1, "%Y-%m-%d %H:%M:%S", tor_gmtime_r(&t, &tm));
  1224. }
  1225. /** Given an ISO-formatted UTC time value (after the epoch) in <b>cp</b>,
  1226. * parse it and store its value in *<b>t</b>. Return 0 on success, -1 on
  1227. * failure. Ignore extraneous stuff in <b>cp</b> separated by whitespace from
  1228. * the end of the time string. */
  1229. int
  1230. parse_iso_time(const char *cp, time_t *t)
  1231. {
  1232. struct tm st_tm;
  1233. unsigned int year=0, month=0, day=0, hour=100, minute=100, second=100;
  1234. if (tor_sscanf(cp, "%u-%2u-%2u %2u:%2u:%2u", &year, &month,
  1235. &day, &hour, &minute, &second) < 6) {
  1236. char *esc = esc_for_log(cp);
  1237. log_warn(LD_GENERAL, "ISO time %s was unparseable", esc);
  1238. tor_free(esc);
  1239. return -1;
  1240. }
  1241. if (year < 1970 || month < 1 || month > 12 || day < 1 || day > 31 ||
  1242. hour > 23 || minute > 59 || second > 61) {
  1243. char *esc = esc_for_log(cp);
  1244. log_warn(LD_GENERAL, "ISO time %s was nonsensical", esc);
  1245. tor_free(esc);
  1246. return -1;
  1247. }
  1248. st_tm.tm_year = year-1900;
  1249. st_tm.tm_mon = month-1;
  1250. st_tm.tm_mday = day;
  1251. st_tm.tm_hour = hour;
  1252. st_tm.tm_min = minute;
  1253. st_tm.tm_sec = second;
  1254. if (st_tm.tm_year < 70) {
  1255. char *esc = esc_for_log(cp);
  1256. log_warn(LD_GENERAL, "Got invalid ISO time %s. (Before 1970)", esc);
  1257. tor_free(esc);
  1258. return -1;
  1259. }
  1260. *t = tor_timegm(&st_tm);
  1261. return 0;
  1262. }
  1263. /** Given a <b>date</b> in one of the three formats allowed by HTTP (ugh),
  1264. * parse it into <b>tm</b>. Return 0 on success, negative on failure. */
  1265. int
  1266. parse_http_time(const char *date, struct tm *tm)
  1267. {
  1268. const char *cp;
  1269. char month[4];
  1270. char wkday[4];
  1271. int i;
  1272. unsigned tm_mday, tm_year, tm_hour, tm_min, tm_sec;
  1273. tor_assert(tm);
  1274. memset(tm, 0, sizeof(*tm));
  1275. /* First, try RFC1123 or RFC850 format: skip the weekday. */
  1276. if ((cp = strchr(date, ','))) {
  1277. ++cp;
  1278. if (tor_sscanf(date, "%2u %3s %4u %2u:%2u:%2u GMT",
  1279. &tm_mday, month, &tm_year,
  1280. &tm_hour, &tm_min, &tm_sec) == 6) {
  1281. /* rfc1123-date */
  1282. tm_year -= 1900;
  1283. } else if (tor_sscanf(date, "%2u-%3s-%2u %2u:%2u:%2u GMT",
  1284. &tm_mday, month, &tm_year,
  1285. &tm_hour, &tm_min, &tm_sec) == 6) {
  1286. /* rfc850-date */
  1287. } else {
  1288. return -1;
  1289. }
  1290. } else {
  1291. /* No comma; possibly asctime() format. */
  1292. if (tor_sscanf(date, "%3s %3s %2u %2u:%2u:%2u %4u",
  1293. wkday, month, &tm_mday,
  1294. &tm_hour, &tm_min, &tm_sec, &tm_year) == 7) {
  1295. tm_year -= 1900;
  1296. } else {
  1297. return -1;
  1298. }
  1299. }
  1300. tm->tm_mday = (int)tm_mday;
  1301. tm->tm_year = (int)tm_year;
  1302. tm->tm_hour = (int)tm_hour;
  1303. tm->tm_min = (int)tm_min;
  1304. tm->tm_sec = (int)tm_sec;
  1305. month[3] = '\0';
  1306. /* Okay, now decode the month. */
  1307. for (i = 0; i < 12; ++i) {
  1308. if (!strcasecmp(MONTH_NAMES[i], month)) {
  1309. tm->tm_mon = i+1;
  1310. }
  1311. }
  1312. if (tm->tm_year < 0 ||
  1313. tm->tm_mon < 1 || tm->tm_mon > 12 ||
  1314. tm->tm_mday < 0 || tm->tm_mday > 31 ||
  1315. tm->tm_hour < 0 || tm->tm_hour > 23 ||
  1316. tm->tm_min < 0 || tm->tm_min > 59 ||
  1317. tm->tm_sec < 0 || tm->tm_sec > 61)
  1318. return -1; /* Out of range, or bad month. */
  1319. return 0;
  1320. }
  1321. /** Given an <b>interval</b> in seconds, try to write it to the
  1322. * <b>out_len</b>-byte buffer in <b>out</b> in a human-readable form.
  1323. * Return 0 on success, -1 on failure.
  1324. */
  1325. int
  1326. format_time_interval(char *out, size_t out_len, long interval)
  1327. {
  1328. /* We only report seconds if there's no hours. */
  1329. long sec = 0, min = 0, hour = 0, day = 0;
  1330. if (interval < 0)
  1331. interval = -interval;
  1332. if (interval >= 86400) {
  1333. day = interval / 86400;
  1334. interval %= 86400;
  1335. }
  1336. if (interval >= 3600) {
  1337. hour = interval / 3600;
  1338. interval %= 3600;
  1339. }
  1340. if (interval >= 60) {
  1341. min = interval / 60;
  1342. interval %= 60;
  1343. }
  1344. sec = interval;
  1345. if (day) {
  1346. return tor_snprintf(out, out_len, "%ld days, %ld hours, %ld minutes",
  1347. day, hour, min);
  1348. } else if (hour) {
  1349. return tor_snprintf(out, out_len, "%ld hours, %ld minutes", hour, min);
  1350. } else if (min) {
  1351. return tor_snprintf(out, out_len, "%ld minutes, %ld seconds", min, sec);
  1352. } else {
  1353. return tor_snprintf(out, out_len, "%ld seconds", sec);
  1354. }
  1355. }
  1356. /* =====
  1357. * Cached time
  1358. * ===== */
  1359. #ifndef TIME_IS_FAST
  1360. /** Cached estimate of the current time. Updated around once per second;
  1361. * may be a few seconds off if we are really busy. This is a hack to avoid
  1362. * calling time(NULL) (which not everybody has optimized) on critical paths.
  1363. */
  1364. static time_t cached_approx_time = 0;
  1365. /** Return a cached estimate of the current time from when
  1366. * update_approx_time() was last called. This is a hack to avoid calling
  1367. * time(NULL) on critical paths: please do not even think of calling it
  1368. * anywhere else. */
  1369. time_t
  1370. approx_time(void)
  1371. {
  1372. return cached_approx_time;
  1373. }
  1374. /** Update the cached estimate of the current time. This function SHOULD be
  1375. * called once per second, and MUST be called before the first call to
  1376. * get_approx_time. */
  1377. void
  1378. update_approx_time(time_t now)
  1379. {
  1380. cached_approx_time = now;
  1381. }
  1382. #endif
  1383. /* =====
  1384. * Rate limiting
  1385. * ===== */
  1386. /** If the rate-limiter <b>lim</b> is ready at <b>now</b>, return the number
  1387. * of calls to rate_limit_is_ready (including this one!) since the last time
  1388. * rate_limit_is_ready returned nonzero. Otherwise return 0. */
  1389. static int
  1390. rate_limit_is_ready(ratelim_t *lim, time_t now)
  1391. {
  1392. if (lim->rate + lim->last_allowed <= now) {
  1393. int res = lim->n_calls_since_last_time + 1;
  1394. lim->last_allowed = now;
  1395. lim->n_calls_since_last_time = 0;
  1396. return res;
  1397. } else {
  1398. ++lim->n_calls_since_last_time;
  1399. return 0;
  1400. }
  1401. }
  1402. /** If the rate-limiter <b>lim</b> is ready at <b>now</b>, return a newly
  1403. * allocated string indicating how many messages were suppressed, suitable to
  1404. * append to a log message. Otherwise return NULL. */
  1405. char *
  1406. rate_limit_log(ratelim_t *lim, time_t now)
  1407. {
  1408. int n;
  1409. if ((n = rate_limit_is_ready(lim, now))) {
  1410. if (n == 1) {
  1411. return tor_strdup("");
  1412. } else {
  1413. char *cp=NULL;
  1414. tor_asprintf(&cp,
  1415. " [%d similar message(s) suppressed in last %d seconds]",
  1416. n-1, lim->rate);
  1417. return cp;
  1418. }
  1419. } else {
  1420. return NULL;
  1421. }
  1422. }
  1423. /* =====
  1424. * File helpers
  1425. * ===== */
  1426. /** Write <b>count</b> bytes from <b>buf</b> to <b>fd</b>. <b>isSocket</b>
  1427. * must be 1 if fd was returned by socket() or accept(), and 0 if fd
  1428. * was returned by open(). Return the number of bytes written, or -1
  1429. * on error. Only use if fd is a blocking fd. */
  1430. ssize_t
  1431. write_all(int fd, const char *buf, size_t count, int isSocket)
  1432. {
  1433. size_t written = 0;
  1434. ssize_t result;
  1435. tor_assert(count < SSIZE_T_MAX);
  1436. while (written != count) {
  1437. if (isSocket)
  1438. result = tor_socket_send(fd, buf+written, count-written, 0);
  1439. else
  1440. result = write(fd, buf+written, count-written);
  1441. if (result<0)
  1442. return -1;
  1443. written += result;
  1444. }
  1445. return (ssize_t)count;
  1446. }
  1447. /** Read from <b>fd</b> to <b>buf</b>, until we get <b>count</b> bytes
  1448. * or reach the end of the file. <b>isSocket</b> must be 1 if fd
  1449. * was returned by socket() or accept(), and 0 if fd was returned by
  1450. * open(). Return the number of bytes read, or -1 on error. Only use
  1451. * if fd is a blocking fd. */
  1452. ssize_t
  1453. read_all(int fd, char *buf, size_t count, int isSocket)
  1454. {
  1455. size_t numread = 0;
  1456. ssize_t result;
  1457. if (count > SIZE_T_CEILING || count > SSIZE_T_MAX)
  1458. return -1;
  1459. while (numread != count) {
  1460. if (isSocket)
  1461. result = tor_socket_recv(fd, buf+numread, count-numread, 0);
  1462. else
  1463. result = read(fd, buf+numread, count-numread);
  1464. if (result<0)
  1465. return -1;
  1466. else if (result == 0)
  1467. break;
  1468. numread += result;
  1469. }
  1470. return (ssize_t)numread;
  1471. }
  1472. /*
  1473. * Filesystem operations.
  1474. */
  1475. /** Clean up <b>name</b> so that we can use it in a call to "stat". On Unix,
  1476. * we do nothing. On Windows, we remove a trailing slash, unless the path is
  1477. * the root of a disk. */
  1478. static void
  1479. clean_name_for_stat(char *name)
  1480. {
  1481. #ifdef MS_WINDOWS
  1482. size_t len = strlen(name);
  1483. if (!len)
  1484. return;
  1485. if (name[len-1]=='\\' || name[len-1]=='/') {
  1486. if (len == 1 || (len==3 && name[1]==':'))
  1487. return;
  1488. name[len-1]='\0';
  1489. }
  1490. #else
  1491. (void)name;
  1492. #endif
  1493. }
  1494. /** Return FN_ERROR if filename can't be read, FN_NOENT if it doesn't
  1495. * exist, FN_FILE if it is a regular file, or FN_DIR if it's a
  1496. * directory. On FN_ERROR, sets errno. */
  1497. file_status_t
  1498. file_status(const char *fname)
  1499. {
  1500. struct stat st;
  1501. char *f;
  1502. int r;
  1503. f = tor_strdup(fname);
  1504. clean_name_for_stat(f);
  1505. r = stat(f, &st);
  1506. tor_free(f);
  1507. if (r) {
  1508. if (errno == ENOENT) {
  1509. return FN_NOENT;
  1510. }
  1511. return FN_ERROR;
  1512. }
  1513. if (st.st_mode & S_IFDIR)
  1514. return FN_DIR;
  1515. else if (st.st_mode & S_IFREG)
  1516. return FN_FILE;
  1517. else
  1518. return FN_ERROR;
  1519. }
  1520. /** Check whether dirname exists and is private. If yes return 0. If
  1521. * it does not exist, and check==CPD_CREATE is set, try to create it
  1522. * and return 0 on success. If it does not exist, and
  1523. * check==CPD_CHECK, and we think we can create it, return 0. Else
  1524. * return -1. */
  1525. int
  1526. check_private_dir(const char *dirname, cpd_check_t check)
  1527. {
  1528. int r;
  1529. struct stat st;
  1530. char *f;
  1531. tor_assert(dirname);
  1532. f = tor_strdup(dirname);
  1533. clean_name_for_stat(f);
  1534. r = stat(f, &st);
  1535. tor_free(f);
  1536. if (r) {
  1537. if (errno != ENOENT) {
  1538. log_warn(LD_FS, "Directory %s cannot be read: %s", dirname,
  1539. strerror(errno));
  1540. return -1;
  1541. }
  1542. if (check == CPD_NONE) {
  1543. log_warn(LD_FS, "Directory %s does not exist.", dirname);
  1544. return -1;
  1545. } else if (check == CPD_CREATE) {
  1546. log_info(LD_GENERAL, "Creating directory %s", dirname);
  1547. #if defined (MS_WINDOWS) && !defined (WINCE)
  1548. r = mkdir(dirname);
  1549. #else
  1550. r = mkdir(dirname, 0700);
  1551. #endif
  1552. if (r) {
  1553. log_warn(LD_FS, "Error creating directory %s: %s", dirname,
  1554. strerror(errno));
  1555. return -1;
  1556. }
  1557. }
  1558. /* XXXX In the case where check==CPD_CHECK, we should look at the
  1559. * parent directory a little harder. */
  1560. return 0;
  1561. }
  1562. if (!(st.st_mode & S_IFDIR)) {
  1563. log_warn(LD_FS, "%s is not a directory", dirname);
  1564. return -1;
  1565. }
  1566. #ifndef MS_WINDOWS
  1567. if (st.st_uid != getuid()) {
  1568. struct passwd *pw = NULL;
  1569. char *process_ownername = NULL;
  1570. pw = getpwuid(getuid());
  1571. process_ownername = pw ? tor_strdup(pw->pw_name) : tor_strdup("<unknown>");
  1572. pw = getpwuid(st.st_uid);
  1573. log_warn(LD_FS, "%s is not owned by this user (%s, %d) but by "
  1574. "%s (%d). Perhaps you are running Tor as the wrong user?",
  1575. dirname, process_ownername, (int)getuid(),
  1576. pw ? pw->pw_name : "<unknown>", (int)st.st_uid);
  1577. tor_free(process_ownername);
  1578. return -1;
  1579. }
  1580. if (st.st_mode & 0077) {
  1581. log_warn(LD_FS, "Fixing permissions on directory %s", dirname);
  1582. if (chmod(dirname, 0700)) {
  1583. log_warn(LD_FS, "Could not chmod directory %s: %s", dirname,
  1584. strerror(errno));
  1585. return -1;
  1586. } else {
  1587. return 0;
  1588. }
  1589. }
  1590. #endif
  1591. return 0;
  1592. }
  1593. /** Create a file named <b>fname</b> with the contents <b>str</b>. Overwrite
  1594. * the previous <b>fname</b> if possible. Return 0 on success, -1 on failure.
  1595. *
  1596. * This function replaces the old file atomically, if possible. This
  1597. * function, and all other functions in util.c that create files, create them
  1598. * with mode 0600.
  1599. */
  1600. int
  1601. write_str_to_file(const char *fname, const char *str, int bin)
  1602. {
  1603. #ifdef MS_WINDOWS
  1604. if (!bin && strchr(str, '\r')) {
  1605. log_warn(LD_BUG,
  1606. "We're writing a text string that already contains a CR.");
  1607. }
  1608. #endif
  1609. return write_bytes_to_file(fname, str, strlen(str), bin);
  1610. }
/** Represents a file that we're writing to, with support for atomic commit:
 * we can write into a temporary file, and either remove the file on
 * failure, or replace the original file on success.
 *
 * Instances are set up by start_writing_to_file(). */
struct open_file_t {
  char *tempname; /**< Name of the temporary file; left NULL when appending
                   * directly to the original file. */
  char *filename; /**< Name of the original file. */
  unsigned rename_on_close:1; /**< Are we using the temporary file or not? */
  unsigned binary:1; /**< Did we open in binary mode? */
  int fd; /**< fd for the open file; -1 until the file has been opened. */
  FILE *stdio_file; /**< stdio wrapper for <b>fd</b>. */
};
  1622. /** Try to start writing to the file in <b>fname</b>, passing the flags
  1623. * <b>open_flags</b> to the open() syscall, creating the file (if needed) with
  1624. * access value <b>mode</b>. If the O_APPEND flag is set, we append to the
  1625. * original file. Otherwise, we open a new temporary file in the same
  1626. * directory, and either replace the original or remove the temporary file
  1627. * when we're done.
  1628. *
  1629. * Return the fd for the newly opened file, and store working data in
  1630. * *<b>data_out</b>. The caller should not close the fd manually:
  1631. * instead, call finish_writing_to_file() or abort_writing_to_file().
  1632. * Returns -1 on failure.
  1633. *
  1634. * NOTE: When not appending, the flags O_CREAT and O_TRUNC are treated
  1635. * as true and the flag O_EXCL is treated as false.
  1636. *
  1637. * NOTE: Ordinarily, O_APPEND means "seek to the end of the file before each
  1638. * write()". We don't do that.
  1639. */
  1640. int
  1641. start_writing_to_file(const char *fname, int open_flags, int mode,
  1642. open_file_t **data_out)
  1643. {
  1644. size_t tempname_len = strlen(fname)+16;
  1645. open_file_t *new_file = tor_malloc_zero(sizeof(open_file_t));
  1646. const char *open_name;
  1647. int append = 0;
  1648. tor_assert(fname);
  1649. tor_assert(data_out);
  1650. #if (O_BINARY != 0 && O_TEXT != 0)
  1651. tor_assert((open_flags & (O_BINARY|O_TEXT)) != 0);
  1652. #endif
  1653. new_file->fd = -1;
  1654. tor_assert(tempname_len > strlen(fname)); /*check for overflow*/
  1655. new_file->filename = tor_strdup(fname);
  1656. if (open_flags & O_APPEND) {
  1657. open_name = fname;
  1658. new_file->rename_on_close = 0;
  1659. append = 1;
  1660. open_flags &= ~O_APPEND;
  1661. } else {
  1662. open_name = new_file->tempname = tor_malloc(tempname_len);
  1663. if (tor_snprintf(new_file->tempname, tempname_len, "%s.tmp", fname)<0) {
  1664. log_warn(LD_GENERAL, "Failed to generate filename");
  1665. goto err;
  1666. }
  1667. /* We always replace an existing temporary file if there is one. */
  1668. open_flags |= O_CREAT|O_TRUNC;
  1669. open_flags &= ~O_EXCL;
  1670. new_file->rename_on_close = 1;
  1671. }
  1672. if (open_flags & O_BINARY)
  1673. new_file->binary = 1;
  1674. new_file->fd = open(open_name, open_flags, mode);
  1675. if (new_file->fd < 0) {
  1676. log_warn(LD_FS, "Couldn't open \"%s\" (%s) for writing: %s",
  1677. open_name, fname, strerror(errno));
  1678. goto err;
  1679. }
  1680. if (append) {
  1681. if (tor_fd_seekend(new_file->fd) < 0) {
  1682. log_warn(LD_FS, "Couldn't seek to end of file \"%s\": %s", open_name,
  1683. strerror(errno));
  1684. goto err;
  1685. }
  1686. }
  1687. *data_out = new_file;
  1688. return new_file->fd;
  1689. err:
  1690. if (new_file->fd >= 0)
  1691. close(new_file->fd);
  1692. *data_out = NULL;
  1693. tor_free(new_file->filename);
  1694. tor_free(new_file->tempname);
  1695. tor_free(new_file);
  1696. return -1;
  1697. }
  1698. /** Given <b>file_data</b> from start_writing_to_file(), return a stdio FILE*
  1699. * that can be used to write to the same file. The caller should not mix
  1700. * stdio calls with non-stdio calls. */
  1701. FILE *
  1702. fdopen_file(open_file_t *file_data)
  1703. {
  1704. tor_assert(file_data);
  1705. if (file_data->stdio_file)
  1706. return file_data->stdio_file;
  1707. tor_assert(file_data->fd >= 0);
  1708. if (!(file_data->stdio_file = fdopen(file_data->fd,
  1709. file_data->binary?"ab":"a"))) {
  1710. log_warn(LD_FS, "Couldn't fdopen \"%s\" [%d]: %s", file_data->filename,
  1711. file_data->fd, strerror(errno));
  1712. }
  1713. return file_data->stdio_file;
  1714. }
  1715. /** Combines start_writing_to_file with fdopen_file(): arguments are as
  1716. * for start_writing_to_file, but */
  1717. FILE *
  1718. start_writing_to_stdio_file(const char *fname, int open_flags, int mode,
  1719. open_file_t **data_out)
  1720. {
  1721. FILE *res;
  1722. if (start_writing_to_file(fname, open_flags, mode, data_out)<0)
  1723. return NULL;
  1724. if (!(res = fdopen_file(*data_out))) {
  1725. abort_writing_to_file(*data_out);
  1726. *data_out = NULL;
  1727. }
  1728. return res;
  1729. }
  1730. /** Helper function: close and free the underlying file and memory in
  1731. * <b>file_data</b>. If we were writing into a temporary file, then delete
  1732. * that file (if abort_write is true) or replaces the target file with
  1733. * the temporary file (if abort_write is false). */
  1734. static int
  1735. finish_writing_to_file_impl(open_file_t *file_data, int abort_write)
  1736. {
  1737. int r = 0;
  1738. tor_assert(file_data && file_data->filename);
  1739. if (file_data->stdio_file) {
  1740. if (fclose(file_data->stdio_file)) {
  1741. log_warn(LD_FS, "Error closing \"%s\": %s", file_data->filename,
  1742. strerror(errno));
  1743. abort_write = r = -1;
  1744. }
  1745. } else if (file_data->fd >= 0 && close(file_data->fd) < 0) {
  1746. log_warn(LD_FS, "Error flushing \"%s\": %s", file_data->filename,
  1747. strerror(errno));
  1748. abort_write = r = -1;
  1749. }
  1750. if (file_data->rename_on_close) {
  1751. tor_assert(file_data->tempname && file_data->filename);
  1752. if (abort_write) {
  1753. unlink(file_data->tempname);
  1754. } else {
  1755. tor_assert(strcmp(file_data->filename, file_data->tempname));
  1756. if (replace_file(file_data->tempname, file_data->filename)) {
  1757. log_warn(LD_FS, "Error replacing \"%s\": %s", file_data->filename,
  1758. strerror(errno));
  1759. r = -1;
  1760. }
  1761. }
  1762. }
  1763. tor_free(file_data->filename);
  1764. tor_free(file_data->tempname);
  1765. tor_free(file_data);
  1766. return r;
  1767. }
  1768. /** Finish writing to <b>file_data</b>: close the file handle, free memory as
  1769. * needed, and if using a temporary file, replace the original file with
  1770. * the temporary file. */
  1771. int
  1772. finish_writing_to_file(open_file_t *file_data)
  1773. {
  1774. return finish_writing_to_file_impl(file_data, 0);
  1775. }
  1776. /** Finish writing to <b>file_data</b>: close the file handle, free memory as
  1777. * needed, and if using a temporary file, delete it. */
  1778. int
  1779. abort_writing_to_file(open_file_t *file_data)
  1780. {
  1781. return finish_writing_to_file_impl(file_data, 1);
  1782. }
  1783. /** Helper: given a set of flags as passed to open(2), open the file
  1784. * <b>fname</b> and write all the sized_chunk_t structs in <b>chunks</b> to
  1785. * the file. Do so as atomically as possible e.g. by opening temp files and
  1786. * renaming. */
  1787. static int
  1788. write_chunks_to_file_impl(const char *fname, const smartlist_t *chunks,
  1789. int open_flags)
  1790. {
  1791. open_file_t *file = NULL;
  1792. int fd;
  1793. ssize_t result;
  1794. fd = start_writing_to_file(fname, open_flags, 0600, &file);
  1795. if (fd<0)
  1796. return -1;
  1797. SMARTLIST_FOREACH(chunks, sized_chunk_t *, chunk,
  1798. {
  1799. result = write_all(fd, chunk->bytes, chunk->len, 0);
  1800. if (result < 0) {
  1801. log_warn(LD_FS, "Error writing to \"%s\": %s", fname,
  1802. strerror(errno));
  1803. goto err;
  1804. }
  1805. tor_assert((size_t)result == chunk->len);
  1806. });
  1807. return finish_writing_to_file(file);
  1808. err:
  1809. abort_writing_to_file(file);
  1810. return -1;
  1811. }
  1812. /** Given a smartlist of sized_chunk_t, write them atomically to a file
  1813. * <b>fname</b>, overwriting or creating the file as necessary. */
  1814. int
  1815. write_chunks_to_file(const char *fname, const smartlist_t *chunks, int bin)
  1816. {
  1817. int flags = OPEN_FLAGS_REPLACE|(bin?O_BINARY:O_TEXT);
  1818. return write_chunks_to_file_impl(fname, chunks, flags);
  1819. }
  1820. /** As write_str_to_file, but does not assume a NUL-terminated
  1821. * string. Instead, we write <b>len</b> bytes, starting at <b>str</b>. */
  1822. int
  1823. write_bytes_to_file(const char *fname, const char *str, size_t len,
  1824. int bin)
  1825. {
  1826. int flags = OPEN_FLAGS_REPLACE|(bin?O_BINARY:O_TEXT);
  1827. int r;
  1828. sized_chunk_t c = { str, len };
  1829. smartlist_t *chunks = smartlist_create();
  1830. smartlist_add(chunks, &c);
  1831. r = write_chunks_to_file_impl(fname, chunks, flags);
  1832. smartlist_free(chunks);
  1833. return r;
  1834. }
  1835. /** As write_bytes_to_file, but if the file already exists, append the bytes
  1836. * to the end of the file instead of overwriting it. */
  1837. int
  1838. append_bytes_to_file(const char *fname, const char *str, size_t len,
  1839. int bin)
  1840. {
  1841. int flags = OPEN_FLAGS_APPEND|(bin?O_BINARY:O_TEXT);
  1842. int r;
  1843. sized_chunk_t c = { str, len };
  1844. smartlist_t *chunks = smartlist_create();
  1845. smartlist_add(chunks, &c);
  1846. r = write_chunks_to_file_impl(fname, chunks, flags);
  1847. smartlist_free(chunks);
  1848. return r;
  1849. }
  1850. /** Read the contents of <b>filename</b> into a newly allocated
  1851. * string; return the string on success or NULL on failure.
  1852. *
  1853. * If <b>stat_out</b> is provided, store the result of stat()ing the
  1854. * file into <b>stat_out</b>.
  1855. *
  1856. * If <b>flags</b> &amp; RFTS_BIN, open the file in binary mode.
  1857. * If <b>flags</b> &amp; RFTS_IGNORE_MISSING, don't warn if the file
  1858. * doesn't exist.
  1859. */
  1860. /*
  1861. * This function <em>may</em> return an erroneous result if the file
  1862. * is modified while it is running, but must not crash or overflow.
  1863. * Right now, the error case occurs when the file length grows between
  1864. * the call to stat and the call to read_all: the resulting string will
  1865. * be truncated.
  1866. */
  1867. char *
  1868. read_file_to_str(const char *filename, int flags, struct stat *stat_out)
  1869. {
  1870. int fd; /* router file */
  1871. struct stat statbuf;
  1872. char *string;
  1873. ssize_t r;
  1874. int bin = flags & RFTS_BIN;
  1875. tor_assert(filename);
  1876. fd = open(filename,O_RDONLY|(bin?O_BINARY:O_TEXT),0);
  1877. if (fd<0) {
  1878. int severity = LOG_WARN;
  1879. int save_errno = errno;
  1880. if (errno == ENOENT && (flags & RFTS_IGNORE_MISSING))
  1881. severity = LOG_INFO;
  1882. log_fn(severity, LD_FS,"Could not open \"%s\": %s ",filename,
  1883. strerror(errno));
  1884. errno = save_errno;
  1885. return NULL;
  1886. }
  1887. if (fstat(fd, &statbuf)<0) {
  1888. int save_errno = errno;
  1889. close(fd);
  1890. log_warn(LD_FS,"Could not fstat \"%s\".",filename);
  1891. errno = save_errno;
  1892. return NULL;
  1893. }
  1894. if ((uint64_t)(statbuf.st_size)+1 >= SIZE_T_CEILING)
  1895. return NULL;
  1896. string = tor_malloc((size_t)(statbuf.st_size+1));
  1897. r = read_all(fd,string,(size_t)statbuf.st_size,0);
  1898. if (r<0) {
  1899. int save_errno = errno;
  1900. log_warn(LD_FS,"Error reading from file \"%s\": %s", filename,
  1901. strerror(errno));
  1902. tor_free(string);
  1903. close(fd);
  1904. errno = save_errno;
  1905. return NULL;
  1906. }
  1907. string[r] = '\0'; /* NUL-terminate the result. */
  1908. #ifdef MS_WINDOWS
  1909. if (!bin && strchr(string, '\r')) {
  1910. log_debug(LD_FS, "We didn't convert CRLF to LF as well as we hoped "
  1911. "when reading %s. Coping.",
  1912. filename);
  1913. tor_strstrip(string, "\r");
  1914. r = strlen(string);
  1915. }
  1916. if (!bin) {
  1917. statbuf.st_size = (size_t) r;
  1918. } else
  1919. #endif
  1920. if (r != statbuf.st_size) {
  1921. /* Unless we're using text mode on win32, we'd better have an exact
  1922. * match for size. */
  1923. int save_errno = errno;
  1924. log_warn(LD_FS,"Could read only %d of %ld bytes of file \"%s\".",
  1925. (int)r, (long)statbuf.st_size,filename);
  1926. tor_free(string);
  1927. close(fd);
  1928. errno = save_errno;
  1929. return NULL;
  1930. }
  1931. close(fd);
  1932. if (stat_out) {
  1933. memcpy(stat_out, &statbuf, sizeof(struct stat));
  1934. }
  1935. return string;
  1936. }
  /** True iff the character <b>c</b> is an octal digit ('0' through '7').
   * Note that <b>c</b> is evaluated twice. */
  #define TOR_ISODIGIT(c) ((c) >= '0' && (c) <= '7')
  /** Given a c-style double-quoted escaped string in <b>s</b>, extract and
   * decode its contents into a newly allocated string.  On success, assign
   * this string to *<b>result</b>, assign its length to <b>size_out</b> (if
   * provided), and return a pointer to the position in <b>s</b> immediately
   * after the closing quote.  On failure, return NULL.
   *
   * Recognized escapes are \n, \r, \t, \', \", \\, \?, one to three octal
   * digits (value at most 255), and \x or \X followed by exactly two hex
   * digits.  Any other escape, an unescaped newline, or a missing closing
   * quote is an error.
   */
  static const char *
  unescape_string(const char *s, char **result, size_t *size_out)
  {
    const char *cp;
    char *out;
    if (s[0] != '\"')
      return NULL;

    /* Pass 1: find the closing quote, checking along the way that every
     * escape sequence is complete.  The decoded text is never longer than
     * the encoded text, so this also bounds the output size. */
    cp = s+1;
    while (1) {
      switch (*cp) {
        case '\0':
        case '\n':
          return NULL;
        case '\"':
          goto end_of_loop;
        case '\\':
          if (cp[1] == 'x' || cp[1] == 'X') {
            /* A hex escape needs two hex digits.  Reject anything else here:
             * otherwise pass 2 would skip four characters and could step
             * over the closing quote and the terminating NUL.  (The checks
             * short-circuit, so we never read past a NUL.) */
            if (!TOR_ISXDIGIT(cp[2]) || !TOR_ISXDIGIT(cp[3]))
              return NULL;
            cp += 4;
          } else if (TOR_ISODIGIT(cp[1])) {
            cp += 2;
            if (TOR_ISODIGIT(*cp)) ++cp;
            if (TOR_ISODIGIT(*cp)) ++cp;
          } else if (cp[1]) {
            cp += 2;
          } else {
            return NULL;
          }
          break;
        default:
          ++cp;
          break;
      }
    }
   end_of_loop:
    out = *result = tor_malloc(cp-s + 1);

    /* Pass 2: decode into the freshly allocated buffer. */
    cp = s+1;
    while (1) {
      switch (*cp)
        {
        case '\"':
          *out = '\0';
          if (size_out) *size_out = out - *result;
          return cp+1;
        case '\0':
          /* Pass 1 found a closing quote, so this should be unreachable. */
          tor_fragile_assert();
          tor_free(*result);
          return NULL;
        case '\\':
          switch (cp[1])
            {
            case 'n': *out++ = '\n'; cp += 2; break;
            case 'r': *out++ = '\r'; cp += 2; break;
            case 't': *out++ = '\t'; cp += 2; break;
            case 'x': case 'X':
              /* Already validated in pass 1; checked again so that this
               * loop is safe on its own. */
              if (!TOR_ISXDIGIT(cp[2]) || !TOR_ISXDIGIT(cp[3])) {
                tor_free(*result);
                return NULL;
              }
              *out++ = (char)((hex_decode_digit(cp[2])<<4) +
                              hex_decode_digit(cp[3]));
              cp += 4;
              break;
            case '0': case '1': case '2': case '3': case '4': case '5':
            case '6': case '7':
              {
                int n = cp[1]-'0';
                cp += 2;
                if (TOR_ISODIGIT(*cp)) { n = n*8 + *cp-'0'; cp++; }
                if (TOR_ISODIGIT(*cp)) { n = n*8 + *cp-'0'; cp++; }
                /* Three octal digits can encode up to 511. */
                if (n > 255) { tor_free(*result); return NULL; }
                *out++ = (char)n;
              }
              break;
            case '\'':
            case '\"':
            case '\\':
            case '\?':
              *out++ = cp[1];
              cp += 2;
              break;
            default:
              /* Unknown escape character. */
              tor_free(*result); return NULL;
            }
          break;
        default:
          *out++ = *cp++;
        }
    }
  }
  /** Parse one "key value" line out of <b>line</b>, which holds part of a
   * configuration file or a similar format.  Leading whitespace, blank lines
   * and comment lines are skipped first.
   *
   * On success, store a newly allocated copy of the key in *<b>key_out</b>
   * and a newly allocated copy of the value in *<b>value_out</b>, and return
   * a pointer to the start of the next line.  If there is no data left, set
   * both outputs to NULL and return a pointer to the end of the string.  On
   * error (a malformed quoted value), return NULL; *<b>key_out</b> may
   * already have been allocated in that case.
   */
  const char *
  parse_config_line_from_str(const char *line, char **key_out, char **value_out)
  {
    /* I believe the file format here is supposed to be:
       FILE = (EMPTYLINE | LINE)* (EMPTYLASTLINE | LASTLINE)?

       EMPTYLASTLINE = SPACE* | COMMENT
       EMPTYLINE = EMPTYLASTLINE NL
       SPACE = ' ' | '\r' | '\t'
       COMMENT = '#' NOT-NL*
       NOT-NL = Any character except '\n'
       NL = '\n'

       LASTLINE = SPACE* KEY SPACE* VALUES
       LINE = LASTLINE NL
       KEY = KEYCHAR+
       KEYCHAR = Any character except ' ', '\r', '\n', '\t', '#', "\"

       VALUES = QUOTEDVALUE | NORMALVALUE
       QUOTEDVALUE = QUOTE QVITEM* QUOTE EOLSPACE?
       QUOTE = '"'
       QVCHAR = KEYCHAR | ESC ('n' | 't' | 'r' | '"' | ESC |'\'' | OCTAL | HEX)
       ESC = "\\"
       OCTAL = ODIGIT (ODIGIT ODIGIT?)?
       HEX = ('x' | 'X') HEXDIGIT HEXDIGIT
       ODIGIT = '0' .. '7'
       HEXDIGIT = '0'..'9' | 'a' .. 'f' | 'A' .. 'F'
       EOLSPACE = SPACE* COMMENT?

       NORMALVALUE = (VALCHAR | ESC ESC_IGNORE | CONTINUATION)* EOLSPACE?
       VALCHAR = Any character except ESC, '#', and '\n'
       ESC_IGNORE = Any character except '#' or '\n'
       CONTINUATION = ESC NL ( COMMENT NL )*
     */

    const char *key, *val, *cp;
    int saw_continuation = 0;

    tor_assert(key_out);
    tor_assert(value_out);

    *key_out = NULL;
    *value_out = NULL;

    /* Step over whitespace (newlines included) and whole-line comments
     * until something else turns up. */
    for (;;) {
      while (TOR_ISSPACE(*line))
        ++line;
      if (*line != '#')
        break;
      while (*line && *line != '\n')
        ++line;
    }

    if (*line == '\0') {
      /* Nothing but whitespace and comments was left. */
      *key_out = *value_out = NULL;
      return line;
    }

    /* The key runs up to the next space, '#', or backslash-newline. */
    key = line;
    for (; *line; ++line) {
      if (TOR_ISSPACE(*line) || *line == '#')
        break;
      if (line[0] == '\\' && line[1] == '\n')
        break;
    }
    *key_out = tor_strndup(key, line-key);

    /* Blanks between the key and the value. */
    while (*line == ' ' || *line == '\t')
      ++line;

    val = line;

    if (*line == '\"') { // XXX No continuation handling is done here
      /* Quoted value: decode it, then allow only blanks and an optional
       * comment before the end of the line. */
      line = unescape_string(line, value_out, NULL);
      if (!line)
        return NULL;
      while (*line == ' ' || *line == '\t')
        ++line;
      if (*line && *line != '#' && *line != '\n')
        return NULL;
    } else {
      /* Plain value: scan to the end of the logical line.  A '#' ends the
       * scan only while no continuation has been seen; after one, a comment
       * is skipped together with its newline and scanning goes on. */
      while (*line && *line != '\n' && (*line != '#' || saw_continuation)) {
        if (line[0] == '\\' && line[1] == '\n') {
          saw_continuation = 1;
          line += 2;
        } else if (*line == '#') {
          ++line;
          while (*line && *line != '\n')
            ++line;
          if (*line == '\n')
            ++line;
        } else {
          ++line;
        }
      }

      /* cp marks the end of the raw value; line moves past the newline. */
      cp = line;
      if (*line == '\n')
        ++line;

      /* Trim trailing whitespace from the raw value. */
      while (cp>val && TOR_ISSPACE(*(cp-1)))
        --cp;

      tor_assert(cp >= val);

      *value_out = tor_strndup(val, cp-val);
      if (saw_continuation) {
        /* Compact the copy in place, dropping backslash-newline pairs and
         * embedded comments (through their newline). */
        char *dst = *value_out;
        const char *src = *value_out;
        while (*src) {
          if (*src == '#') {
            ++src;
            while (*src && *src != '\n')
              ++src;
            if (*src == '\n')
              ++src;
          } else if (src[0] == '\\' && src[1] == '\n') {
            src += 2;
          } else {
            *dst++ = *src++;
          }
        }
        *dst = '\0';
      }
    }

    /* Discard a trailing comment, then any whitespace before the next
     * line's content. */
    if (*line == '#') {
      ++line;
      while (*line && *line != '\n')
        ++line;
    }
    while (TOR_ISSPACE(*line))
      ++line;

    return line;
  }
  2161. /** Expand any homedir prefix on <b>filename</b>; return a newly allocated
  2162. * string. */
  2163. char *
  2164. expand_filename(const char *filename)
  2165. {
  2166. tor_assert(filename);
  2167. #ifdef MS_WINDOWS
  2168. return tor_strdup(filename);
  2169. #else
  2170. if (*filename == '~') {
  2171. char *home, *result=NULL;
  2172. const char *rest;
  2173. if (filename[1] == '/' || filename[1] == '\0') {
  2174. home = getenv("HOME");
  2175. if (!home) {
  2176. log_warn(LD_CONFIG, "Couldn't find $HOME environment variable while "
  2177. "expanding \"%s\"; defaulting to \"\".", filename);
  2178. home = tor_strdup("");
  2179. } else {
  2180. home = tor_strdup(home);
  2181. }
  2182. rest = strlen(filename)>=2?(filename+2):"";
  2183. } else {
  2184. #ifdef HAVE_PWD_H
  2185. char *username, *slash;
  2186. slash = strchr(filename, '/');
  2187. if (slash)
  2188. username = tor_strndup(filename+1,slash-filename-1);
  2189. else
  2190. username = tor_strdup(filename+1);
  2191. if (!(home = get_user_homedir(username))) {
  2192. log_warn(LD_CONFIG,"Couldn't get homedir for \"%s\"",username);
  2193. tor_free(username);
  2194. return NULL;
  2195. }
  2196. tor_free(username);
  2197. rest = slash ? (slash+1) : "";
  2198. #else
  2199. log_warn(LD_CONFIG, "Couldn't expend homedir on system without pwd.h");
  2200. return tor_strdup(filename);
  2201. #endif
  2202. }
  2203. tor_assert(home);
  2204. /* Remove trailing slash. */
  2205. if (strlen(home)>1 && !strcmpend(home,PATH_SEPARATOR)) {
  2206. home[strlen(home)-1] = '\0';
  2207. }
  2208. tor_asprintf(&result,"%s"PATH_SEPARATOR"%s",home,rest);
  2209. tor_free(home);
  2210. return result;
  2211. } else {
  2212. return tor_strdup(filename);
  2213. }
  2214. #endif
  2215. }
  /** Largest field width that the scanf helpers below accept in a pattern;
   * it is also the width used for a conversion that gives none. */
  #define MAX_SCANF_WIDTH 9999
  /** Helper: return the numeric value (0 through 9) of the ASCII decimal
   * digit <b>d</b>.
   * NOTE: the input must really be a digit; anything else trips an
   * assertion. */
  static int
  digit_to_num(char d)
  {
    int num = (int)(d - '0');
    tor_assert(num <= 9 && num >= 0);
    return num;
  }
  2226. /** Helper: Read an unsigned int from *<b>bufp</b> of up to <b>width</b>
  2227. * characters. (Handle arbitrary width if <b>width</b> is less than 0.) On
  2228. * success, store the result in <b>out</b>, advance bufp to the next
  2229. * character, and return 0. On failure, return -1. */
  2230. static int
  2231. scan_unsigned(const char **bufp, unsigned *out, int width)
  2232. {
  2233. unsigned result = 0;
  2234. int scanned_so_far = 0;
  2235. if (!bufp || !*bufp || !out)
  2236. return -1;
  2237. if (width<0)
  2238. width=MAX_SCANF_WIDTH;
  2239. while (**bufp && TOR_ISDIGIT(**bufp) && scanned_so_far < width) {
  2240. int digit = digit_to_num(*(*bufp)++);
  2241. unsigned new_result = result * 10 + digit;
  2242. if (new_result > UINT32_MAX || new_result < result)
  2243. return -1; /* over/underflow. */
  2244. result = new_result;
  2245. ++scanned_so_far;
  2246. }
  2247. if (!scanned_so_far) /* No actual digits scanned */
  2248. return -1;
  2249. *out = result;
  2250. return 0;
  2251. }
  /** Helper: copy up to <b>width</b> non-space characters from *<b>bufp</b>
   * to <b>out</b>, and NUL-terminate <b>out</b> (which therefore needs room
   * for <b>width</b>+1 bytes).  *<b>bufp</b> is left at the first character
   * that was not copied: a space, the end of the string, or the character
   * after the <b>width</b>'th one.  Return 0 on success (even if nothing was
   * copied), or -1 if an argument is NULL or <b>width</b> is negative. */
  static int
  scan_string(const char **bufp, char *out, int width)
  {
    int n_copied;

    if (!bufp || !out || width < 0)
      return -1;

    for (n_copied = 0; n_copied < width; ++n_copied) {
      const char ch = **bufp;
      if (ch == '\0' || TOR_ISSPACE(ch))
        break;
      *out++ = ch;
      ++*bufp;
    }
    *out = '\0';
    return 0;
  }
  2268. /** Locale-independent, minimal, no-surprises scanf variant, accepting only a
  2269. * restricted pattern format. For more info on what it supports, see
  2270. * tor_sscanf() documentation. */
  2271. int
  2272. tor_vsscanf(const char *buf, const char *pattern, va_list ap)
  2273. {
  2274. int n_matched = 0;
  2275. while (*pattern) {
  2276. if (*pattern != '%') {
  2277. if (*buf == *pattern) {
  2278. ++buf;
  2279. ++pattern;
  2280. continue;
  2281. } else {
  2282. return n_matched;
  2283. }
  2284. } else {
  2285. int width = -1;
  2286. ++pattern;
  2287. if (TOR_ISDIGIT(*pattern)) {
  2288. width = digit_to_num(*pattern++);
  2289. while (TOR_ISDIGIT(*pattern)) {
  2290. width *= 10;
  2291. width += digit_to_num(*pattern++);
  2292. if (width > MAX_SCANF_WIDTH)
  2293. return -1;
  2294. }
  2295. if (!width) /* No zero-width things. */
  2296. return -1;
  2297. }
  2298. if (*pattern == 'u') {
  2299. unsigned *u = va_arg(ap, unsigned *);
  2300. if (!*buf)
  2301. return n_matched;
  2302. if (scan_unsigned(&buf, u, width)<0)
  2303. return n_matched;
  2304. ++pattern;
  2305. ++n_matched;
  2306. } else if (*pattern == 's') {
  2307. char *s = va_arg(ap, char *);
  2308. if (width < 0)
  2309. return -1;
  2310. if (scan_string(&buf, s, width)<0)
  2311. return n_matched;
  2312. ++pattern;
  2313. ++n_matched;
  2314. } else if (*pattern == 'c') {
  2315. char *ch = va_arg(ap, char *);
  2316. if (width != -1)
  2317. return -1;
  2318. if (!*buf)
  2319. return n_matched;
  2320. *ch = *buf++;
  2321. ++pattern;
  2322. ++n_matched;
  2323. } else if (*pattern == '%') {
  2324. if (*buf != '%')
  2325. return -1;
  2326. ++buf;
  2327. ++pattern;
  2328. } else {
  2329. return -1; /* Unrecognized pattern component. */
  2330. }
  2331. }
  2332. }
  2333. return n_matched;
  2334. }
  /** Minimal sscanf replacement: parse <b>buf</b> according to
   * <b>pattern</b> and store the results in the corresponding argument
   * fields.  Differs from sscanf in that it: Only handles %u, %Ns, %c and
   * %%.  Does not handle arbitrarily long widths.  %u does not consume any
   * space.  Is locale-independent.  Returns the number of fields matched, or
   * -1 on malformed patterns.
   *
   * (As with other locale-independent functions, we need this to parse data
   * that is in ASCII without worrying that the C library's locale-handling
   * will make miscellaneous characters look like numbers, spaces, and so
   * on.)
   */
  int
  tor_sscanf(const char *buf, const char *pattern, ...)
  {
    va_list args;
    int n_matched;

    va_start(args, pattern);
    n_matched = tor_vsscanf(buf, pattern, args);
    va_end(args);
    return n_matched;
  }
  2355. /** Return a new list containing the filenames in the directory <b>dirname</b>.
  2356. * Return NULL on error or if <b>dirname</b> is not a directory.
  2357. */
  2358. smartlist_t *
  2359. tor_listdir(const char *dirname)
  2360. {
  2361. smartlist_t *result;
  2362. #ifdef MS_WINDOWS
  2363. char *pattern;
  2364. TCHAR tpattern[MAX_PATH] = {0};
  2365. char name[MAX_PATH] = {0};
  2366. HANDLE handle;
  2367. WIN32_FIND_DATA findData;
  2368. size_t pattern_len = strlen(dirname)+16;
  2369. pattern = tor_malloc(pattern_len);
  2370. tor_snprintf(pattern, pattern_len, "%s\\*", dirname);
  2371. #ifdef UNICODE
  2372. mbstowcs(tpattern,pattern,MAX_PATH);
  2373. #else
  2374. strlcpy(tpattern, pattern, MAX_PATH);
  2375. #endif
  2376. if (INVALID_HANDLE_VALUE == (handle = FindFirstFile(tpattern, &findData))) {
  2377. tor_free(pattern);
  2378. return NULL;
  2379. }
  2380. result = smartlist_create();
  2381. while (1) {
  2382. #ifdef UNICODE
  2383. wcstombs(name,findData.cFileName,MAX_PATH);
  2384. #else
  2385. strlcpy(name,findData.cFileName,sizeof(name));
  2386. #endif
  2387. if (strcmp(name, ".") &&
  2388. strcmp(name, "..")) {
  2389. smartlist_add(result, tor_strdup(name));
  2390. }
  2391. if (!FindNextFile(handle, &findData)) {
  2392. DWORD err;
  2393. if ((err = GetLastError()) != ERROR_NO_MORE_FILES) {
  2394. char *errstr = format_win32_error(err);
  2395. log_warn(LD_FS, "Error reading directory '%s': %s", dirname, errstr);
  2396. tor_free(errstr);
  2397. }
  2398. break;
  2399. }
  2400. }
  2401. FindClose(handle);
  2402. tor_free(pattern);
  2403. #else
  2404. DIR *d;
  2405. struct dirent *de;
  2406. if (!(d = opendir(dirname)))
  2407. return NULL;
  2408. result = smartlist_create();
  2409. while ((de = readdir(d))) {
  2410. if (!strcmp(de->d_name, ".") ||
  2411. !strcmp(de->d_name, ".."))
  2412. continue;
  2413. smartlist_add(result, tor_strdup(de->d_name));
  2414. }
  2415. closedir(d);
  2416. #endif
  2417. return result;
  2418. }
  /** Return true iff <b>filename</b> is a relative path.  A NULL
   * <b>filename</b> counts as relative.  A path starting with '/' is
   * absolute everywhere; on Windows, so is a path starting with a backslash
   * or with a drive letter followed by ":\" (including a bare drive root
   * such as "C:\"). */
  int
  path_is_relative(const char *filename)
  {
    if (!filename)
      return 1;
    if (filename[0] == '/')
      return 0;
  #ifdef MS_WINDOWS
    if (filename[0] == '\\')
      return 0;
    /* Drive-qualified absolute path.  No length check is needed: each
     * comparison fails at a NUL, so && never reads past the end of the
     * string, and a three-character root like "C:\" is accepted too. */
    if (TOR_ISALPHA(filename[0]) && filename[1] == ':' &&
        filename[2] == '\\')
      return 0;
  #endif
    return 1;
  }
  2435. /* =====
  2436. * Process helpers
  2437. * ===== */
  2438. #ifndef MS_WINDOWS
  2439. /* Based on code contributed by christian grothoff */
  /** Set to 1 once start_daemon() has run. */
  static int start_daemon_called = 0;
  /** Set to 1 once finish_daemon() has run. */
  static int finish_daemon_called = 0;
  /** Pipe (created with pipe()) over which the daemonized child reports back
   * to the waiting parent process: [0] is the read end, [1] the write end. */
  static int daemon_filedes[2];
  2447. /** Start putting the process into daemon mode: fork and drop all resources
  2448. * except standard fds. The parent process never returns, but stays around
  2449. * until finish_daemon is called. (Note: it's safe to call this more
  2450. * than once: calls after the first are ignored.)
  2451. */
  2452. void
  2453. start_daemon(void)
  2454. {
  2455. pid_t pid;
  2456. if (start_daemon_called)
  2457. return;
  2458. start_daemon_called = 1;
  2459. if (pipe(daemon_filedes)) {
  2460. log_err(LD_GENERAL,"pipe failed; exiting. Error was %s", strerror(errno));
  2461. exit(1);
  2462. }
  2463. pid = fork();
  2464. if (pid < 0) {
  2465. log_err(LD_GENERAL,"fork failed. Exiting.");
  2466. exit(1);
  2467. }
  2468. if (pid) { /* Parent */
  2469. int ok;
  2470. char c;
  2471. close(daemon_filedes[1]); /* we only read */
  2472. ok = -1;
  2473. while (0 < read(daemon_filedes[0], &c, sizeof(char))) {
  2474. if (c == '.')
  2475. ok = 1;
  2476. }
  2477. fflush(stdout);
  2478. if (ok == 1)
  2479. exit(0);
  2480. else
  2481. exit(1); /* child reported error */
  2482. } else { /* Child */
  2483. close(daemon_filedes[0]); /* we only write */
  2484. pid = setsid(); /* Detach from controlling terminal */
  2485. /*
  2486. * Fork one more time, so the parent (the session group leader) can exit.
  2487. * This means that we, as a non-session group leader, can never regain a
  2488. * controlling terminal. This part is recommended by Stevens's
  2489. * _Advanced Programming in the Unix Environment_.
  2490. */
  2491. if (fork() != 0) {
  2492. exit(0);
  2493. }
  2494. set_main_thread(); /* We are now the main thread. */
  2495. return;
  2496. }
  2497. }
  2498. /** Finish putting the process into daemon mode: drop standard fds, and tell
  2499. * the parent process to exit. (Note: it's safe to call this more than once:
  2500. * calls after the first are ignored. Calls start_daemon first if it hasn't
  2501. * been called already.)
  2502. */
  2503. void
  2504. finish_daemon(const char *desired_cwd)
  2505. {
  2506. int nullfd;
  2507. char c = '.';
  2508. if (finish_daemon_called)
  2509. return;
  2510. if (!start_daemon_called)
  2511. start_daemon();
  2512. finish_daemon_called = 1;
  2513. if (!desired_cwd)
  2514. desired_cwd = "/";
  2515. /* Don't hold the wrong FS mounted */
  2516. if (chdir(desired_cwd) < 0) {
  2517. log_err(LD_GENERAL,"chdir to \"%s\" failed. Exiting.",desired_cwd);
  2518. exit(1);
  2519. }
  2520. nullfd = open("/dev/null", O_RDWR);
  2521. if (nullfd < 0) {
  2522. log_err(LD_GENERAL,"/dev/null can't be opened. Exiting.");
  2523. exit(1);
  2524. }
  2525. /* close fds linking to invoking terminal, but
  2526. * close usual incoming fds, but redirect them somewhere
  2527. * useful so the fds don't get reallocated elsewhere.
  2528. */
  2529. if (dup2(nullfd,0) < 0 ||
  2530. dup2(nullfd,1) < 0 ||
  2531. dup2(nullfd,2) < 0) {
  2532. log_err(LD_GENERAL,"dup2 failed. Exiting.");
  2533. exit(1);
  2534. }
  2535. if (nullfd > 2)
  2536. close(nullfd);
  2537. /* signal success */
  2538. if (write(daemon_filedes[1], &c, sizeof(char)) != sizeof(char)) {
  2539. log_err(LD_GENERAL,"write failed. Exiting.");
  2540. }
  2541. close(daemon_filedes[1]);
  2542. }
  2543. #else
  2544. /* defined(MS_WINDOWS) */
  /** Windows build: there is nothing to do here, so this is a no-op. */
  void
  start_daemon(void)
  {
    /* Intentionally empty. */
  }
  /** Windows build: a no-op; the directory argument <b>cp</b> is ignored. */
  void
  finish_daemon(const char *cp)
  {
    (void)cp; /* unused */
  }
  2554. #endif
  2555. /** Write the current process ID, followed by NL, into <b>filename</b>.
  2556. */
  2557. void
  2558. write_pidfile(char *filename)
  2559. {
  2560. FILE *pidfile;
  2561. if ((pidfile = fopen(filename, "w")) == NULL) {
  2562. log_warn(LD_FS, "Unable to open \"%s\" for writing: %s", filename,
  2563. strerror(errno));
  2564. } else {
  2565. #ifdef MS_WINDOWS
  2566. fprintf(pidfile, "%d\n", (int)_getpid());
  2567. #else
  2568. fprintf(pidfile, "%d\n", (int)getpid());
  2569. #endif
  2570. fclose(pidfile);
  2571. }
  2572. }
  #ifdef MS_WINDOWS
  /** Load the library named <b>library_name</b> from the Windows system
   * directory: the full path "<system directory>\<library_name>" is built
   * and passed to LoadLibrary(), rather than the bare name.  Return the
   * handle that LoadLibrary() gives back, or 0 if the system directory
   * cannot be determined or the full path would not fit in MAX_PATH. */
  HANDLE
  load_windows_system_library(const TCHAR *library_name)
  {
    TCHAR path[MAX_PATH];
    const unsigned dir_len = GetSystemDirectory(path, MAX_PATH);

    if (dir_len == 0)
      return 0;
    /* Leave room for the separator and the terminating NUL. */
    if (dir_len + _tcslen(library_name) + 2 >= MAX_PATH)
      return 0;

    _tcscat(path, TEXT("\\"));
    _tcscat(path, library_name);
    return LoadLibrary(path);
  }
  #endif