/* misc.h 18 KB */
  /*
   * Header for miscellaneous helper functions, mostly defined in the
   * utils subdirectory.
   */
  #ifndef PUTTY_MISC_H
  #define PUTTY_MISC_H

  #include "defs.h"
  #include "puttymem.h"
  #include "marshal.h"

  #include <stdio.h>                     /* for FILE * */
  #include <stdarg.h>                    /* for va_list */
  #include <stdlib.h>                    /* for abort */
  #include <string.h>                    /* for strlen */
  #include <time.h>                      /* for struct tm */
  #include <limits.h>                    /* for INT_MAX/MIN */
  #include <assert.h>                    /* for assert (obviously) */
  16. unsigned long parse_blocksize(const char *bs);
  17. char ctrlparse(char *s, char **next);
  18. size_t host_strcspn(const char *s, const char *set);
  19. char *host_strchr(const char *s, int c);
  20. char *host_strrchr(const char *s, int c);
  21. char *host_strduptrim(const char *s);
  22. char *dupstr(const char *s);
  23. char *dupcat_fn(const char *s1, ...);
  24. #define dupcat(...) dupcat_fn(__VA_ARGS__, (const char *)NULL)
  25. char *dupprintf(const char *fmt, ...) PRINTF_LIKE(1, 2);
  26. char *dupvprintf(const char *fmt, va_list ap);
  27. void burnstr(char *string);
  28. /*
  29. * The visible part of a strbuf structure. There's a surrounding
  30. * implementation struct in strbuf.c, which isn't exposed to client
  31. * code.
  32. */
  33. struct strbuf {
  34. char *s;
  35. unsigned char *u;
  36. size_t len;
  37. BinarySink_IMPLEMENTATION;
  38. };
  39. /* strbuf constructors: strbuf_new_nm and strbuf_new differ in that a
  40. * strbuf constructed using the _nm version will resize itself by
  41. * alloc/copy/smemclr/free instead of realloc. Use that version for
  42. * data sensitive enough that it's worth costing performance to
  43. * avoid copies of it lingering in process memory. */
  44. strbuf *strbuf_new(void);
  45. strbuf *strbuf_new_nm(void);
  46. void strbuf_free(strbuf *buf);
  47. void *strbuf_append(strbuf *buf, size_t len);
  48. void strbuf_shrink_to(strbuf *buf, size_t new_len);
  49. void strbuf_shrink_by(strbuf *buf, size_t amount_to_remove);
  50. char *strbuf_to_str(strbuf *buf); /* does free buf, but you must free result */
  51. static inline void strbuf_clear(strbuf *buf) { strbuf_shrink_to(buf, 0); }
  52. bool strbuf_chomp(strbuf *buf, char char_to_remove);
  53. strbuf *strbuf_new_for_agent_query(void);
  54. void strbuf_finalise_agent_query(strbuf *buf);
  55. /* String-to-Unicode converters that auto-allocate the destination and
  56. * work around the rather deficient interface of mb_to_wc. */
  57. wchar_t *dup_mb_to_wc_c(int codepage, int flags, const char *string, int len);
  58. wchar_t *dup_mb_to_wc(int codepage, int flags, const char *string);
  59. char *dup_wc_to_mb_c(int codepage, int flags, const wchar_t *string, int len,
  60. const char *defchr, struct unicode_data *ucsdata);
  61. char *dup_wc_to_mb(int codepage, int flags, const wchar_t *string,
  62. const char *defchr, struct unicode_data *ucsdata);
  /*
   * Convert an unsigned to an int, without running into the
   * undefined behaviour which happens by the strict C standard if
   * the value overflows. You'd hope that sensible compilers would
   * do the sensible thing in response to a cast, but actually I
   * don't trust modern compilers not to do silly things like
   * assuming that _obviously_ you wouldn't have caused an overflow
   * and so they can elide an 'if (i < 0)' test immediately after
   * the cast.
   *
   * Sensible compilers ought of course to optimise this entire
   * function into 'just return the input value', and since it's
   * also declared inline, elide it completely in their output.
   *
   * Values up to INT_MAX map to themselves; values from
   * (unsigned)INT_MIN upwards map to the negative int with the same
   * offset from INT_MIN.
   */
  static inline int toint(unsigned u)
  {
      if (u <= (unsigned)INT_MAX) {
          return (int)u;
      } else if (u >= (unsigned)INT_MIN) {
          /* wrap in cast _to_ unsigned is OK */
          return INT_MIN + (int)(u - (unsigned)INT_MIN);
      } else {
          /* fallback; should never occur on binary machines */
          return INT_MIN;
      }
  }
  86. char *fgetline(FILE *fp);
  87. bool read_file_into(BinarySink *bs, FILE *fp);
  88. char *chomp(char *str);
  89. bool strstartswith(const char *s, const char *t);
  90. bool strendswith(const char *s, const char *t);
  91. void base64_encode_atom(const unsigned char *data, int n, char *out);
  92. int base64_decode_atom(const char *atom, unsigned char *out);
  93. struct bufchain_granule;
  94. struct bufchain_tag {
  95. struct bufchain_granule *head, *tail;
  96. size_t buffersize; /* current amount of buffered data */
  97. void (*queue_idempotent_callback)(IdempotentCallback *ic);
  98. IdempotentCallback *ic;
  99. };
  100. void bufchain_init(bufchain *ch);
  101. void bufchain_clear(bufchain *ch);
  102. size_t bufchain_size(bufchain *ch);
  103. void bufchain_add(bufchain *ch, const void *data, size_t len);
  104. ptrlen bufchain_prefix(bufchain *ch);
  105. void bufchain_consume(bufchain *ch, size_t len);
  106. void bufchain_fetch(bufchain *ch, void *data, size_t len);
  107. void bufchain_fetch_consume(bufchain *ch, void *data, size_t len);
  108. bool bufchain_try_consume(bufchain *ch, size_t len);
  109. bool bufchain_try_fetch(bufchain *ch, void *data, size_t len);
  110. bool bufchain_try_fetch_consume(bufchain *ch, void *data, size_t len);
  111. size_t bufchain_fetch_consume_up_to(bufchain *ch, void *data, size_t len);
  112. void bufchain_set_callback_inner(
  113. bufchain *ch, IdempotentCallback *ic,
  114. void (*queue_idempotent_callback)(IdempotentCallback *ic));
  115. static inline void bufchain_set_callback(bufchain *ch, IdempotentCallback *ic)
  116. {
  117. extern void queue_idempotent_callback(struct IdempotentCallback *ic);
  118. /* Wrapper that puts in the standard queue_idempotent_callback
  119. * function. Lives here rather than in bufchain.c so that
  120. * standalone programs can use the bufchain facility without this
  121. * optional callback feature and not need to provide a stub of
  122. * queue_idempotent_callback. */
  123. bufchain_set_callback_inner(ch, ic, queue_idempotent_callback);
  124. }
  bool validate_manual_hostkey(char *key);

  /* Returns a struct tm by value.
   * NOTE(review): presumably the current local time -- confirm. */
  struct tm ltime(void);

  /*
   * Special form of strcmp which can cope with NULL inputs. NULL is
   * defined to sort before even the empty string.
   */
  int nullstrcmp(const char *a, const char *b);
  132. static inline ptrlen make_ptrlen(const void *ptr, size_t len)
  133. {
  134. ptrlen pl;
  135. pl.ptr = ptr;
  136. pl.len = len;
  137. return pl;
  138. }
  139. static inline ptrlen ptrlen_from_asciz(const char *str)
  140. {
  141. return make_ptrlen(str, strlen(str));
  142. }
  143. static inline ptrlen ptrlen_from_strbuf(strbuf *sb)
  144. {
  145. return make_ptrlen(sb->u, sb->len);
  146. }
  147. bool ptrlen_eq_string(ptrlen pl, const char *str);
  148. bool ptrlen_eq_ptrlen(ptrlen pl1, ptrlen pl2);
  149. int ptrlen_strcmp(ptrlen pl1, ptrlen pl2);
  150. /* ptrlen_startswith and ptrlen_endswith write through their 'tail'
  151. * argument if and only if it is non-NULL and they return true. Hence
  152. * you can write ptrlen_startswith(thing, prefix, &thing), writing
  153. * back to the same ptrlen it read from, to remove a prefix if present
  154. * and say whether it did so. */
  155. bool ptrlen_startswith(ptrlen whole, ptrlen prefix, ptrlen *tail);
  156. bool ptrlen_endswith(ptrlen whole, ptrlen suffix, ptrlen *tail);
  157. ptrlen ptrlen_get_word(ptrlen *input, const char *separators);
  158. char *mkstr(ptrlen pl);
  159. int string_length_for_printf(size_t);
  /* Derive two printf arguments from a ptrlen, suitable for "%.*s" */
  #define PTRLEN_PRINTF(pl) \
      string_length_for_printf((pl).len), (const char *)(pl).ptr

  /* Make a ptrlen out of a compile-time string literal. We try to
   * enforce that it _is_ a string literal by token-pasting "" on to it,
   * which should provoke a compile error if it's any other kind of
   * string. */
  #define PTRLEN_LITERAL(stringlit) \
      TYPECHECK("" stringlit "", make_ptrlen(stringlit, sizeof(stringlit)-1))

  /* Make a ptrlen out of a compile-time string literal in a way that
   * allows you to declare the ptrlen itself as a compile-time initialiser. */
  #define PTRLEN_DECL_LITERAL(stringlit) \
      { TYPECHECK("" stringlit "", stringlit), sizeof(stringlit)-1 }

  /* Make a ptrlen out of a constant byte array. The length is
   * sizeof(a), so 'a' must be a real array, not a pointer. */
  #define PTRLEN_FROM_CONST_BYTES(a) make_ptrlen(a, sizeof(a))
  175. /* Wipe sensitive data out of memory that's about to be freed. Simpler
  176. * than memset because we don't need the fill char parameter; also
  177. * attempts (by fiddly use of volatile) to inhibit the compiler from
  178. * over-cleverly trying to optimise the memset away because it knows
  179. * the variable is going out of scope. */
  180. void smemclr(void *b, size_t len);
  181. /* Compare two fixed-length chunks of memory for equality, without
  182. * data-dependent control flow (so an attacker with a very accurate
  183. * stopwatch can't try to guess where the first mismatching byte was).
  184. * Returns false for mismatch or true for equality (unlike memcmp),
  185. * hinted at by the 'eq' in the name. */
  186. bool smemeq(const void *av, const void *bv, size_t len);
  187. /* Encode a single UTF-8 character. Assumes that illegal characters
  188. * (such as things in the surrogate range, or > 0x10FFFF) have already
  189. * been removed. */
  190. size_t encode_utf8(void *output, unsigned long ch);
  191. /* Encode a wide-character string into UTF-8. Tolerates surrogates if
  192. * sizeof(wchar_t) == 2, assuming that in that case the wide string is
  193. * encoded in UTF-16. */
  194. char *encode_wide_string_as_utf8(const wchar_t *wstr);
  195. /* Decode a single UTF-8 character. Returns U+FFFD for any of the
  196. * illegal cases. */
  197. unsigned long decode_utf8(const char **utf8);
  198. /* Decode a single UTF-8 character to an output buffer of the
  199. * platform's wchar_t. May write a pair of surrogates if
  200. * sizeof(wchar_t) == 2, assuming that in that case the wide string is
  201. * encoded in UTF-16. Otherwise, writes one character. Returns the
  202. * number written. */
  203. size_t decode_utf8_to_wchar(const char **utf8, wchar_t *out);
  204. /* Write a string out in C string-literal format. */
  205. void write_c_string_literal(FILE *fp, ptrlen str);
  206. char *buildinfo(const char *newline);
  207. /*
  208. * A function you can put at points in the code where execution should
  209. * never reach in the first place. Better than assert(false), or even
  210. * assert(false && "some explanatory message"), because some compilers
  211. * don't interpret assert(false) as a declaration of unreachability,
  212. * so they may still warn about pointless things like some variable
  213. * not being initialised on the unreachable code path.
  214. *
  215. * I follow the assertion with a call to abort() just in case someone
  216. * compiles with -DNDEBUG, and I wrap that abort inside my own
  217. * function labelled NORETURN just in case some unusual kind of system
  218. * header wasn't foresighted enough to label abort() itself that way.
  219. */
  220. static inline NORETURN void unreachable_internal(void) {
  221. #ifndef WINSCP_VS
  222. // Not to try to link to VS abort
  223. abort();
  224. #endif
  225. }
  226. #define unreachable(msg) (assert(false && msg), unreachable_internal())
  /*
   * Debugging functions.
   *
   * Output goes to debug.log
   *
   * debug() is like printf().
   *
   * dmemdump() and dmemdumpl() both do memory dumps. The difference
   * is that dmemdumpl() is more suited for when the memory address is
   * important (say because you'll be recording pointer values later
   * on). dmemdump() is more concise.
   *
   * Without DEBUG defined, all three macros expand to ((void)0), so
   * their arguments are not evaluated.
   */
  #ifdef DEBUG
  void debug_printf(const char *fmt, ...) PRINTF_LIKE(1, 2);
  void debug_memdump(const void *buf, int len, bool L);
  #define debug(...) (debug_printf(__VA_ARGS__))
  #define dmemdump(buf,len) (debug_memdump(buf, len, false))
  #define dmemdumpl(buf,len) (debug_memdump(buf, len, true))
  #else
  #define debug(...) ((void)0)
  #define dmemdump(buf,len) ((void)0)
  #define dmemdumpl(buf,len) ((void)0)
  #endif
  /* Number of elements in an array. Only meaningful for a real array:
   * applied to a pointer it divides the pointer's size instead. */
  #ifndef lenof
  #define lenof(x) ( (sizeof((x))) / (sizeof(*(x))))
  #endif

  /* Smaller / larger of two values. Each argument is expanded twice, so
   * do not pass expressions with side effects (e.g. min(i++, j)). */
  #ifndef min
  #define min(x,y) ( (x) < (y) ? (x) : (y) )
  #endif
  #ifndef max
  #define max(x,y) ( (x) > (y) ? (x) : (y) )
  #endif
  /* Read a 64-bit unsigned integer stored least-significant byte first
   * in the 8 bytes at 'vp'. Access is bytewise, so 'vp' need not be
   * aligned. */
  static inline uint64_t GET_64BIT_LSB_FIRST(const void *vp)
  {
      const uint8_t *p = (const uint8_t *)vp;

      return (((uint64_t)p[0]      ) | ((uint64_t)p[1] <<  8) |
              ((uint64_t)p[2] << 16) | ((uint64_t)p[3] << 24) |
              ((uint64_t)p[4] << 32) | ((uint64_t)p[5] << 40) |
              ((uint64_t)p[6] << 48) | ((uint64_t)p[7] << 56));
  }
  /* Store 'value' as 8 bytes at 'vp', least-significant byte first.
   * Access is bytewise, so 'vp' need not be aligned. */
  static inline void PUT_64BIT_LSB_FIRST(void *vp, uint64_t value)
  {
      uint8_t *p = (uint8_t *)vp;

      p[0] = (uint8_t)(value);
      p[1] = (uint8_t)(value >> 8);
      p[2] = (uint8_t)(value >> 16);
      p[3] = (uint8_t)(value >> 24);
      p[4] = (uint8_t)(value >> 32);
      p[5] = (uint8_t)(value >> 40);
      p[6] = (uint8_t)(value >> 48);
      p[7] = (uint8_t)(value >> 56);
  }
  /* Read a 32-bit unsigned integer stored least-significant byte first
   * in the 4 bytes at 'vp'. Access is bytewise, so 'vp' need not be
   * aligned. */
  static inline uint32_t GET_32BIT_LSB_FIRST(const void *vp)
  {
      const uint8_t *p = (const uint8_t *)vp;

      return (((uint32_t)p[0]      ) | ((uint32_t)p[1] <<  8) |
              ((uint32_t)p[2] << 16) | ((uint32_t)p[3] << 24));
  }
  /* Store 'value' as 4 bytes at 'vp', least-significant byte first.
   * Access is bytewise, so 'vp' need not be aligned. */
  static inline void PUT_32BIT_LSB_FIRST(void *vp, uint32_t value)
  {
      uint8_t *p = (uint8_t *)vp;

      p[0] = (uint8_t)(value);
      p[1] = (uint8_t)(value >> 8);
      p[2] = (uint8_t)(value >> 16);
      p[3] = (uint8_t)(value >> 24);
  }
  /* Read a 16-bit unsigned integer stored least-significant byte first
   * in the 2 bytes at 'vp'. Access is bytewise, so 'vp' need not be
   * aligned. */
  static inline uint16_t GET_16BIT_LSB_FIRST(const void *vp)
  {
      const uint8_t *p = (const uint8_t *)vp;

      return (((uint16_t)p[0]      ) | ((uint16_t)p[1] <<  8));
  }
  /* Store 'value' as 2 bytes at 'vp', least-significant byte first.
   * Access is bytewise, so 'vp' need not be aligned. */
  static inline void PUT_16BIT_LSB_FIRST(void *vp, uint16_t value)
  {
      uint8_t *p = (uint8_t *)vp;

      p[0] = (uint8_t)(value);
      p[1] = (uint8_t)(value >> 8);
  }
  /* Read a 64-bit unsigned integer stored most-significant byte first
   * in the 8 bytes at 'vp'. Access is bytewise, so 'vp' need not be
   * aligned. */
  static inline uint64_t GET_64BIT_MSB_FIRST(const void *vp)
  {
      const uint8_t *p = (const uint8_t *)vp;

      return (((uint64_t)p[7]      ) | ((uint64_t)p[6] <<  8) |
              ((uint64_t)p[5] << 16) | ((uint64_t)p[4] << 24) |
              ((uint64_t)p[3] << 32) | ((uint64_t)p[2] << 40) |
              ((uint64_t)p[1] << 48) | ((uint64_t)p[0] << 56));
  }
  /* Store 'value' as 8 bytes at 'vp', most-significant byte first.
   * Access is bytewise, so 'vp' need not be aligned. */
  static inline void PUT_64BIT_MSB_FIRST(void *vp, uint64_t value)
  {
      uint8_t *p = (uint8_t *)vp;

      p[7] = (uint8_t)(value);
      p[6] = (uint8_t)(value >> 8);
      p[5] = (uint8_t)(value >> 16);
      p[4] = (uint8_t)(value >> 24);
      p[3] = (uint8_t)(value >> 32);
      p[2] = (uint8_t)(value >> 40);
      p[1] = (uint8_t)(value >> 48);
      p[0] = (uint8_t)(value >> 56);
  }
  /* Read a 32-bit unsigned integer stored most-significant byte first
   * in the 4 bytes at 'vp'. Access is bytewise, so 'vp' need not be
   * aligned. */
  static inline uint32_t GET_32BIT_MSB_FIRST(const void *vp)
  {
      const uint8_t *p = (const uint8_t *)vp;

      return (((uint32_t)p[3]      ) | ((uint32_t)p[2] <<  8) |
              ((uint32_t)p[1] << 16) | ((uint32_t)p[0] << 24));
  }
  /* Store 'value' as 4 bytes at 'vp', most-significant byte first.
   * Access is bytewise, so 'vp' need not be aligned. */
  static inline void PUT_32BIT_MSB_FIRST(void *vp, uint32_t value)
  {
      uint8_t *p = (uint8_t *)vp;

      p[3] = (uint8_t)(value);
      p[2] = (uint8_t)(value >> 8);
      p[1] = (uint8_t)(value >> 16);
      p[0] = (uint8_t)(value >> 24);
  }
  /* Read a 16-bit unsigned integer stored most-significant byte first
   * in the 2 bytes at 'vp'. Access is bytewise, so 'vp' need not be
   * aligned. */
  static inline uint16_t GET_16BIT_MSB_FIRST(const void *vp)
  {
      const uint8_t *p = (const uint8_t *)vp;

      return (((uint16_t)p[1]      ) | ((uint16_t)p[0] <<  8));
  }
  /* Store 'value' as 2 bytes at 'vp', most-significant byte first.
   * Access is bytewise, so 'vp' need not be aligned. */
  static inline void PUT_16BIT_MSB_FIRST(void *vp, uint16_t value)
  {
      uint8_t *p = (uint8_t *)vp;

      p[1] = (uint8_t)(value);
      p[0] = (uint8_t)(value >> 8);
  }
  /* For use in X11-related applications, an endianness-variable form of
   * {GET,PUT}_16BIT which expects 'endian' to be either 'B' or 'l'.
   *
   * 'B' selects MSB-first; any other value (not only 'l') is treated as
   * LSB-first. */
  static inline uint16_t GET_16BIT_X11(char endian, const void *p)
  {
      return endian == 'B' ? GET_16BIT_MSB_FIRST(p) : GET_16BIT_LSB_FIRST(p);
  }
  /* Store a 16-bit value at 'p' in the byte order selected by 'endian':
   * 'B' selects MSB-first; any other value is treated as LSB-first. */
  static inline void PUT_16BIT_X11(char endian, void *p, uint16_t value)
  {
      if (endian == 'B') {
          PUT_16BIT_MSB_FIRST(p, value);
      } else {
          PUT_16BIT_LSB_FIRST(p, value);
      }
  }
  /* Replace NULL with the empty string, permitting an idiom in which we
   * get a string (pointer,length) pair that might be NULL,0 and can
   * then safely say things like printf("%.*s", length, NULLTOEMPTY(ptr)).
   *
   * A non-NULL 's' is returned unchanged (same pointer, no copy). */
  static inline const char *NULLTOEMPTY(const char *s)
  {
      return s ? s : "";
  }
  369. /* StripCtrlChars, defined in stripctrl.c: an adapter you can put on
  370. * the front of one BinarySink and which functions as one in turn.
  371. * Interprets its input as a stream of multibyte characters in the
  372. * system locale, and removes any that are not either printable
  373. * characters or newlines. */
  374. struct StripCtrlChars {
  375. BinarySink_IMPLEMENTATION;
  376. /* and this is contained in a larger structure */
  377. };
  378. StripCtrlChars *stripctrl_new(
  379. BinarySink *bs_out, bool permit_cr, wchar_t substitution);
  380. StripCtrlChars *stripctrl_new_term_fn(
  381. BinarySink *bs_out, bool permit_cr, wchar_t substitution,
  382. Terminal *term, unsigned long (*translate)(
  383. Terminal *, term_utf8_decode *, unsigned char));
  384. #define stripctrl_new_term(bs, cr, sub, term) \
  385. stripctrl_new_term_fn(bs, cr, sub, term, term_translate)
  386. void stripctrl_retarget(StripCtrlChars *sccpub, BinarySink *new_bs_out);
  387. void stripctrl_reset(StripCtrlChars *sccpub);
  388. void stripctrl_free(StripCtrlChars *sanpub);
  389. void stripctrl_enable_line_limiting(StripCtrlChars *sccpub);
  390. #ifndef WINSCP
  391. char *stripctrl_string_ptrlen(StripCtrlChars *sccpub, ptrlen str);
  392. static inline char *stripctrl_string(StripCtrlChars *sccpub, const char *str)
  393. {
  394. return stripctrl_string_ptrlen(sccpub, ptrlen_from_asciz(str));
  395. }
  396. #endif
  #ifdef MPEXT
  /* Recent PuTTY code is written to the C99 standard, which allows
   * statements to appear before declarations, and those statements are
   * frequently assertions. pinitassert() is an assertion written as a
   * declaration, so it can sit among the declarations at the top of a
   * block.
   *
   * It declares a const int initialised to 1/((int)(P)), so a false P
   * becomes a division by zero. The variable name is fixed, so the macro
   * can be used at most once per scope. */
  #define pinitassert(P) const int __assert_dummy = 1/((int)(P))
  #endif
  402. /*
  403. * A mechanism for loading a file from disk into a memory buffer where
  404. * it can be picked apart as a BinarySource.
  405. */
  406. struct LoadedFile {
  407. char *data;
  408. size_t len, max_size;
  409. BinarySource_IMPLEMENTATION;
  410. };
  /* Result codes returned by lf_load_fp() and lf_load(). */
  typedef enum {
      LF_OK,      /* file loaded successfully */
      LF_TOO_BIG, /* file didn't fit in buffer */
      LF_ERROR,   /* error from stdio layer */
  } LoadFileStatus;
  416. LoadedFile *lf_new(size_t max_size);
  417. void lf_free(LoadedFile *lf);
  418. LoadFileStatus lf_load_fp(LoadedFile *lf, FILE *fp);
  419. LoadFileStatus lf_load(LoadedFile *lf, const Filename *filename);
  420. static inline ptrlen ptrlen_from_lf(LoadedFile *lf)
  421. { return make_ptrlen(lf->data, lf->len); }
  422. /* Set the memory block of 'size' bytes at 'out' to the bitwise XOR of
  423. * the two blocks of the same size at 'in1' and 'in2'.
  424. *
  425. * 'out' may point to exactly the same address as one of the inputs,
  426. * but if the input and output blocks overlap in any other way, the
  427. * result of this function is not guaranteed. No memmove-style effort
  428. * is made to handle difficult overlap cases. */
  429. void memxor(uint8_t *out, const uint8_t *in1, const uint8_t *in2, size_t size);
  430. #endif