archive_read_support_format_cab.c 83 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607260826092610261126122613261426152616261726182619262026212622262326242625262626272628262926302631263226332634263526362637263826392640264126422643264426452646264726482649265026512652265326542655265626572658265926602661266226632664266526662667266826692670267126722673267426752676267726782679268026812682268326842685268626872688268926902691269226932694269526962697269826992700270127022703270427052706270727082709271027112712271327142715271627172718271927202721272227232724272527262727272827292730273127322733273427352736273727382739274027412742274327442745274627472748274927502751275227532754275527562757275827592760276127622763276427652766276727682769277027712772277327742775277627772778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228
  1. /*-
  2. * Copyright (c) 2010-2012 Michihiro NAKAJIMA
  3. * All rights reserved.
  4. *
  5. * Redistribution and use in source and binary forms, with or without
  6. * modification, are permitted provided that the following conditions
  7. * are met:
  8. * 1. Redistributions of source code must retain the above copyright
  9. * notice, this list of conditions and the following disclaimer.
  10. * 2. Redistributions in binary form must reproduce the above copyright
  11. * notice, this list of conditions and the following disclaimer in the
  12. * documentation and/or other materials provided with the distribution.
  13. *
  14. * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR
  15. * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  16. * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
  17. * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT,
  18. * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  19. * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  20. * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  21. * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  22. * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
  23. * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  24. */
  25. #include "archive_platform.h"
  26. #ifdef HAVE_ERRNO_H
  27. #include <errno.h>
  28. #endif
  29. #ifdef HAVE_LIMITS_H
  30. #include <limits.h>
  31. #endif
  32. #ifdef HAVE_STDLIB_H
  33. #include <stdlib.h>
  34. #endif
  35. #ifdef HAVE_STRING_H
  36. #include <string.h>
  37. #endif
  38. #ifdef HAVE_ZLIB_H
  39. #include <cm3p/zlib.h>
  40. #endif
  41. #include "archive.h"
  42. #include "archive_entry.h"
  43. #include "archive_entry_locale.h"
  44. #include "archive_private.h"
  45. #include "archive_read_private.h"
  46. #include "archive_endian.h"
  47. struct lzx_dec {
  48. /* Decoding status. */
  49. int state;
  50. /*
  51. * Window to see last decoded data, from 32KBi to 2MBi.
  52. */
  53. int w_size;
  54. int w_mask;
  55. /* Window buffer, which is a loop buffer. */
  56. unsigned char *w_buff;
  57. /* The insert position to the window. */
  58. int w_pos;
  59. /* The position where we can copy decoded code from the window. */
  60. int copy_pos;
  61. /* The length how many bytes we can copy decoded code from
  62. * the window. */
  63. int copy_len;
  64. /* Translation reversal for x86 processor CALL byte sequence(E8).
  65. * This is used for LZX only. */
  66. uint32_t translation_size;
  67. char translation;
  68. char block_type;
  69. #define VERBATIM_BLOCK 1
  70. #define ALIGNED_OFFSET_BLOCK 2
  71. #define UNCOMPRESSED_BLOCK 3
  72. size_t block_size;
  73. size_t block_bytes_avail;
  74. /* Repeated offset. */
  75. int r0, r1, r2;
  76. unsigned char rbytes[4];
  77. int rbytes_avail;
  78. int length_header;
  79. int position_slot;
  80. int offset_bits;
  81. struct lzx_pos_tbl {
  82. int base;
  83. int footer_bits;
  84. } *pos_tbl;
  85. /*
  86. * Bit stream reader.
  87. */
  88. struct lzx_br {
  89. #define CACHE_TYPE uint64_t
  90. #define CACHE_BITS (8 * sizeof(CACHE_TYPE))
  91. /* Cache buffer. */
  92. CACHE_TYPE cache_buffer;
  93. /* Indicates how many bits avail in cache_buffer. */
  94. int cache_avail;
  95. unsigned char odd;
  96. char have_odd;
  97. } br;
  98. /*
  99. * Huffman coding.
  100. */
  101. struct huffman {
  102. int len_size;
  103. int freq[17];
  104. unsigned char *bitlen;
  105. /*
  106. * Use a index table. It's faster than searching a huffman
  107. * coding tree, which is a binary tree. But a use of a large
  108. * index table causes L1 cache read miss many times.
  109. */
  110. int max_bits;
  111. int tbl_bits;
  112. int tree_used;
  113. /* Direct access table. */
  114. uint16_t *tbl;
  115. } at, lt, mt, pt;
  116. int loop;
  117. int error;
  118. };
  119. static const int slots[] = {
  120. 30, 32, 34, 36, 38, 42, 50, 66, 98, 162, 290
  121. };
  122. #define SLOT_BASE 15
  123. #define SLOT_MAX 21/*->25*/
  124. struct lzx_stream {
  125. const unsigned char *next_in;
  126. int64_t avail_in;
  127. int64_t total_in;
  128. unsigned char *next_out;
  129. int64_t avail_out;
  130. int64_t total_out;
  131. struct lzx_dec *ds;
  132. };
  133. /*
  134. * Cabinet file definitions.
  135. */
  136. /* CFHEADER offset */
  137. #define CFHEADER_signature 0
  138. #define CFHEADER_cbCabinet 8
  139. #define CFHEADER_coffFiles 16
  140. #define CFHEADER_versionMinor 24
  141. #define CFHEADER_versionMajor 25
  142. #define CFHEADER_cFolders 26
  143. #define CFHEADER_cFiles 28
  144. #define CFHEADER_flags 30
  145. #define CFHEADER_setID 32
  146. #define CFHEADER_iCabinet 34
  147. #define CFHEADER_cbCFHeader 36
  148. #define CFHEADER_cbCFFolder 38
  149. #define CFHEADER_cbCFData 39
  150. /* CFFOLDER offset */
  151. #define CFFOLDER_coffCabStart 0
  152. #define CFFOLDER_cCFData 4
  153. #define CFFOLDER_typeCompress 6
  154. #define CFFOLDER_abReserve 8
  155. /* CFFILE offset */
  156. #define CFFILE_cbFile 0
  157. #define CFFILE_uoffFolderStart 4
  158. #define CFFILE_iFolder 8
  159. #define CFFILE_date_time 10
  160. #define CFFILE_attribs 14
  161. /* CFDATA offset */
  162. #define CFDATA_csum 0
  163. #define CFDATA_cbData 4
  164. #define CFDATA_cbUncomp 6
  165. static const char * const compression_name[] = {
  166. "NONE",
  167. "MSZIP",
  168. "Quantum",
  169. "LZX",
  170. };
  171. struct cfdata {
  172. /* Sum value of this CFDATA. */
  173. uint32_t sum;
  174. uint16_t compressed_size;
  175. uint16_t compressed_bytes_remaining;
  176. uint16_t uncompressed_size;
  177. uint16_t uncompressed_bytes_remaining;
  178. /* To know how many bytes we have decompressed. */
  179. uint16_t uncompressed_avail;
  180. /* Offset from the beginning of compressed data of this CFDATA */
  181. uint16_t read_offset;
  182. int64_t unconsumed;
  183. /* To keep memory image of this CFDATA to compute the sum. */
  184. size_t memimage_size;
  185. unsigned char *memimage;
  186. /* Result of calculation of sum. */
  187. uint32_t sum_calculated;
  188. unsigned char sum_extra[4];
  189. int sum_extra_avail;
  190. const void *sum_ptr;
  191. };
  192. struct cffolder {
  193. uint32_t cfdata_offset_in_cab;
  194. uint16_t cfdata_count;
  195. uint16_t comptype;
  196. #define COMPTYPE_NONE 0x0000
  197. #define COMPTYPE_MSZIP 0x0001
  198. #define COMPTYPE_QUANTUM 0x0002
  199. #define COMPTYPE_LZX 0x0003
  200. uint16_t compdata;
  201. const char *compname;
  202. /* At the time reading CFDATA */
  203. struct cfdata cfdata;
  204. int cfdata_index;
  205. /* Flags to mark progress of decompression. */
  206. char decompress_init;
  207. };
  208. struct cffile {
  209. uint32_t uncompressed_size;
  210. uint32_t offset;
  211. time_t mtime;
  212. uint16_t folder;
  213. #define iFoldCONTINUED_FROM_PREV 0xFFFD
  214. #define iFoldCONTINUED_TO_NEXT 0xFFFE
  215. #define iFoldCONTINUED_PREV_AND_NEXT 0xFFFF
  216. unsigned char attr;
  217. #define ATTR_RDONLY 0x01
  218. #define ATTR_NAME_IS_UTF 0x80
  219. struct archive_string pathname;
  220. };
  221. struct cfheader {
  222. /* Total bytes of all file size in a Cabinet. */
  223. uint32_t total_bytes;
  224. uint32_t files_offset;
  225. uint16_t folder_count;
  226. uint16_t file_count;
  227. uint16_t flags;
  228. #define PREV_CABINET 0x0001
  229. #define NEXT_CABINET 0x0002
  230. #define RESERVE_PRESENT 0x0004
  231. uint16_t setid;
  232. uint16_t cabinet;
  233. /* Version number. */
  234. unsigned char major;
  235. unsigned char minor;
  236. unsigned char cffolder;
  237. unsigned char cfdata;
  238. /* All folders in a cabinet. */
  239. struct cffolder *folder_array;
  240. /* All files in a cabinet. */
  241. struct cffile *file_array;
  242. int file_index;
  243. };
  244. struct cab {
  245. /* entry_bytes_remaining is the number of bytes we expect. */
  246. int64_t entry_offset;
  247. int64_t entry_bytes_remaining;
  248. int64_t entry_unconsumed;
  249. int64_t entry_compressed_bytes_read;
  250. int64_t entry_uncompressed_bytes_read;
  251. struct cffolder *entry_cffolder;
  252. struct cffile *entry_cffile;
  253. struct cfdata *entry_cfdata;
  254. /* Offset from beginning of a cabinet file. */
  255. int64_t cab_offset;
  256. struct cfheader cfheader;
  257. struct archive_wstring ws;
  258. /* Flag to mark progress that an archive was read their first header.*/
  259. char found_header;
  260. char end_of_archive;
  261. char end_of_entry;
  262. char end_of_entry_cleanup;
  263. char read_data_invoked;
  264. int64_t bytes_skipped;
  265. unsigned char *uncompressed_buffer;
  266. size_t uncompressed_buffer_size;
  267. int init_default_conversion;
  268. struct archive_string_conv *sconv;
  269. struct archive_string_conv *sconv_default;
  270. struct archive_string_conv *sconv_utf8;
  271. char format_name[64];
  272. #ifdef HAVE_ZLIB_H
  273. z_stream stream;
  274. char stream_valid;
  275. #endif
  276. struct lzx_stream xstrm;
  277. };
  278. static int archive_read_format_cab_bid(struct archive_read *, int);
  279. static int archive_read_format_cab_options(struct archive_read *,
  280. const char *, const char *);
  281. static int archive_read_format_cab_read_header(struct archive_read *,
  282. struct archive_entry *);
  283. static int archive_read_format_cab_read_data(struct archive_read *,
  284. const void **, size_t *, int64_t *);
  285. static int archive_read_format_cab_read_data_skip(struct archive_read *);
  286. static int archive_read_format_cab_cleanup(struct archive_read *);
  287. static int cab_skip_sfx(struct archive_read *);
  288. static time_t cab_dos_time(const unsigned char *);
  289. static int cab_read_data(struct archive_read *, const void **,
  290. size_t *, int64_t *);
  291. static int cab_read_header(struct archive_read *);
  292. static uint32_t cab_checksum_cfdata_4(const void *, size_t bytes, uint32_t);
  293. static uint32_t cab_checksum_cfdata(const void *, size_t bytes, uint32_t);
  294. static void cab_checksum_update(struct archive_read *, size_t);
  295. static int cab_checksum_finish(struct archive_read *);
  296. static int cab_next_cfdata(struct archive_read *);
  297. static const void *cab_read_ahead_cfdata(struct archive_read *, ssize_t *);
  298. static const void *cab_read_ahead_cfdata_none(struct archive_read *, ssize_t *);
  299. static const void *cab_read_ahead_cfdata_deflate(struct archive_read *,
  300. ssize_t *);
  301. static const void *cab_read_ahead_cfdata_lzx(struct archive_read *,
  302. ssize_t *);
  303. static int64_t cab_consume_cfdata(struct archive_read *, int64_t);
  304. static int64_t cab_minimum_consume_cfdata(struct archive_read *, int64_t);
  305. static int lzx_decode_init(struct lzx_stream *, int);
  306. static int lzx_read_blocks(struct lzx_stream *, int);
  307. static int lzx_decode_blocks(struct lzx_stream *, int);
  308. static void lzx_decode_free(struct lzx_stream *);
  309. static void lzx_translation(struct lzx_stream *, void *, size_t, uint32_t);
  310. static void lzx_cleanup_bitstream(struct lzx_stream *);
  311. static int lzx_decode(struct lzx_stream *, int);
  312. static int lzx_read_pre_tree(struct lzx_stream *);
  313. static int lzx_read_bitlen(struct lzx_stream *, struct huffman *, int);
  314. static int lzx_huffman_init(struct huffman *, size_t, int);
  315. static void lzx_huffman_free(struct huffman *);
  316. static int lzx_make_huffman_table(struct huffman *);
  317. static inline int lzx_decode_huffman(struct huffman *, unsigned);
  318. int
  319. archive_read_support_format_cab(struct archive *_a)
  320. {
  321. struct archive_read *a = (struct archive_read *)_a;
  322. struct cab *cab;
  323. int r;
  324. archive_check_magic(_a, ARCHIVE_READ_MAGIC,
  325. ARCHIVE_STATE_NEW, "archive_read_support_format_cab");
  326. cab = (struct cab *)calloc(1, sizeof(*cab));
  327. if (cab == NULL) {
  328. archive_set_error(&a->archive, ENOMEM,
  329. "Can't allocate CAB data");
  330. return (ARCHIVE_FATAL);
  331. }
  332. archive_string_init(&cab->ws);
  333. archive_wstring_ensure(&cab->ws, 256);
  334. r = __archive_read_register_format(a,
  335. cab,
  336. "cab",
  337. archive_read_format_cab_bid,
  338. archive_read_format_cab_options,
  339. archive_read_format_cab_read_header,
  340. archive_read_format_cab_read_data,
  341. archive_read_format_cab_read_data_skip,
  342. NULL,
  343. archive_read_format_cab_cleanup,
  344. NULL,
  345. NULL);
  346. if (r != ARCHIVE_OK)
  347. free(cab);
  348. return (ARCHIVE_OK);
  349. }
  350. static int
  351. find_cab_magic(const char *p)
  352. {
  353. switch (p[4]) {
  354. case 0:
  355. /*
  356. * Note: Self-Extraction program has 'MSCF' string in their
  357. * program. If we were finding 'MSCF' string only, we got
  358. * wrong place for Cabinet header, thus, we have to check
  359. * following four bytes which are reserved and must be set
  360. * to zero.
  361. */
  362. if (memcmp(p, "MSCF\0\0\0\0", 8) == 0)
  363. return 0;
  364. return 5;
  365. case 'F': return 1;
  366. case 'C': return 2;
  367. case 'S': return 3;
  368. case 'M': return 4;
  369. default: return 5;
  370. }
  371. }
  372. static int
  373. archive_read_format_cab_bid(struct archive_read *a, int best_bid)
  374. {
  375. const char *p;
  376. ssize_t bytes_avail, offset, window;
  377. /* If there's already a better bid than we can ever
  378. make, don't bother testing. */
  379. if (best_bid > 64)
  380. return (-1);
  381. if ((p = __archive_read_ahead(a, 8, NULL)) == NULL)
  382. return (-1);
  383. if (memcmp(p, "MSCF\0\0\0\0", 8) == 0)
  384. return (64);
  385. /*
  386. * Attempt to handle self-extracting archives
  387. * by noting a PE header and searching forward
  388. * up to 128k for a 'MSCF' marker.
  389. */
  390. if (p[0] == 'M' && p[1] == 'Z') {
  391. offset = 0;
  392. window = 4096;
  393. while (offset < (1024 * 128)) {
  394. const char *h = __archive_read_ahead(a, offset + window,
  395. &bytes_avail);
  396. if (h == NULL) {
  397. /* Remaining bytes are less than window. */
  398. window >>= 1;
  399. if (window < 128)
  400. return (0);
  401. continue;
  402. }
  403. p = h + offset;
  404. while (p + 8 < h + bytes_avail) {
  405. int next;
  406. if ((next = find_cab_magic(p)) == 0)
  407. return (64);
  408. p += next;
  409. }
  410. offset = p - h;
  411. }
  412. }
  413. return (0);
  414. }
  415. static int
  416. archive_read_format_cab_options(struct archive_read *a,
  417. const char *key, const char *val)
  418. {
  419. struct cab *cab;
  420. int ret = ARCHIVE_FAILED;
  421. cab = (struct cab *)(a->format->data);
  422. if (strcmp(key, "hdrcharset") == 0) {
  423. if (val == NULL || val[0] == 0)
  424. archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
  425. "cab: hdrcharset option needs a character-set name");
  426. else {
  427. cab->sconv = archive_string_conversion_from_charset(
  428. &a->archive, val, 0);
  429. if (cab->sconv != NULL)
  430. ret = ARCHIVE_OK;
  431. else
  432. ret = ARCHIVE_FATAL;
  433. }
  434. return (ret);
  435. }
  436. /* Note: The "warn" return is just to inform the options
  437. * supervisor that we didn't handle it. It will generate
  438. * a suitable error if no one used this option. */
  439. return (ARCHIVE_WARN);
  440. }
  441. static int
  442. cab_skip_sfx(struct archive_read *a)
  443. {
  444. const char *p, *q;
  445. size_t skip;
  446. ssize_t bytes, window;
  447. window = 4096;
  448. for (;;) {
  449. const char *h = __archive_read_ahead(a, window, &bytes);
  450. if (h == NULL) {
  451. /* Remaining size are less than window. */
  452. window >>= 1;
  453. if (window < 128) {
  454. archive_set_error(&a->archive,
  455. ARCHIVE_ERRNO_FILE_FORMAT,
  456. "Couldn't find out CAB header");
  457. return (ARCHIVE_FATAL);
  458. }
  459. continue;
  460. }
  461. p = h;
  462. q = p + bytes;
  463. /*
  464. * Scan ahead until we find something that looks
  465. * like the cab header.
  466. */
  467. while (p + 8 < q) {
  468. int next;
  469. if ((next = find_cab_magic(p)) == 0) {
  470. skip = p - h;
  471. __archive_read_consume(a, skip);
  472. return (ARCHIVE_OK);
  473. }
  474. p += next;
  475. }
  476. skip = p - h;
  477. __archive_read_consume(a, skip);
  478. }
  479. }
  480. static int
  481. truncated_error(struct archive_read *a)
  482. {
  483. archive_set_error(&a->archive, ARCHIVE_ERRNO_FILE_FORMAT,
  484. "Truncated CAB header");
  485. return (ARCHIVE_FATAL);
  486. }
  487. static ssize_t
  488. cab_strnlen(const unsigned char *p, size_t maxlen)
  489. {
  490. size_t i;
  491. for (i = 0; i <= maxlen; i++) {
  492. if (p[i] == 0)
  493. break;
  494. }
  495. if (i > maxlen)
  496. return (-1);/* invalid */
  497. return ((ssize_t)i);
  498. }
  499. /* Read bytes as much as remaining. */
  500. static const void *
  501. cab_read_ahead_remaining(struct archive_read *a, size_t min, ssize_t *avail)
  502. {
  503. const void *p;
  504. while (min > 0) {
  505. p = __archive_read_ahead(a, min, avail);
  506. if (p != NULL)
  507. return (p);
  508. min--;
  509. }
  510. return (NULL);
  511. }
  512. /* Convert a path separator '\' -> '/' */
  513. static int
  514. cab_convert_path_separator_1(struct archive_string *fn, unsigned char attr)
  515. {
  516. size_t i;
  517. int mb;
  518. /* Easy check if we have '\' in multi-byte string. */
  519. mb = 0;
  520. for (i = 0; i < archive_strlen(fn); i++) {
  521. if (fn->s[i] == '\\') {
  522. if (mb) {
  523. /* This may be second byte of multi-byte
  524. * character. */
  525. break;
  526. }
  527. fn->s[i] = '/';
  528. mb = 0;
  529. } else if ((fn->s[i] & 0x80) && !(attr & ATTR_NAME_IS_UTF))
  530. mb = 1;
  531. else
  532. mb = 0;
  533. }
  534. if (i == archive_strlen(fn))
  535. return (0);
  536. return (-1);
  537. }
  538. /*
  539. * Replace a character '\' with '/' in wide character.
  540. */
  541. static void
  542. cab_convert_path_separator_2(struct cab *cab, struct archive_entry *entry)
  543. {
  544. const wchar_t *wp;
  545. size_t i;
  546. /* If a conversion to wide character failed, force the replacement. */
  547. if ((wp = archive_entry_pathname_w(entry)) != NULL) {
  548. archive_wstrcpy(&(cab->ws), wp);
  549. for (i = 0; i < archive_strlen(&(cab->ws)); i++) {
  550. if (cab->ws.s[i] == L'\\')
  551. cab->ws.s[i] = L'/';
  552. }
  553. archive_entry_copy_pathname_w(entry, cab->ws.s);
  554. }
  555. }
  556. /*
  557. * Read CFHEADER, CFFOLDER and CFFILE.
  558. */
  559. static int
  560. cab_read_header(struct archive_read *a)
  561. {
  562. const unsigned char *p;
  563. struct cab *cab;
  564. struct cfheader *hd;
  565. size_t bytes, used;
  566. ssize_t len;
  567. int64_t skip;
  568. int err, i;
  569. int cur_folder, prev_folder;
  570. uint32_t offset32;
  571. a->archive.archive_format = ARCHIVE_FORMAT_CAB;
  572. if (a->archive.archive_format_name == NULL)
  573. a->archive.archive_format_name = "CAB";
  574. if ((p = __archive_read_ahead(a, 42, NULL)) == NULL)
  575. return (truncated_error(a));
  576. cab = (struct cab *)(a->format->data);
  577. if (cab->found_header == 0 &&
  578. p[0] == 'M' && p[1] == 'Z') {
  579. /* This is an executable? Must be self-extracting... */
  580. err = cab_skip_sfx(a);
  581. if (err < ARCHIVE_WARN)
  582. return (err);
  583. /* Re-read header after processing the SFX. */
  584. if ((p = __archive_read_ahead(a, 42, NULL)) == NULL)
  585. return (truncated_error(a));
  586. }
  587. cab->cab_offset = 0;
  588. /*
  589. * Read CFHEADER.
  590. */
  591. hd = &cab->cfheader;
  592. if (p[CFHEADER_signature+0] != 'M' || p[CFHEADER_signature+1] != 'S' ||
  593. p[CFHEADER_signature+2] != 'C' || p[CFHEADER_signature+3] != 'F') {
  594. archive_set_error(&a->archive, ARCHIVE_ERRNO_FILE_FORMAT,
  595. "Couldn't find out CAB header");
  596. return (ARCHIVE_FATAL);
  597. }
  598. hd->total_bytes = archive_le32dec(p + CFHEADER_cbCabinet);
  599. hd->files_offset = archive_le32dec(p + CFHEADER_coffFiles);
  600. hd->minor = p[CFHEADER_versionMinor];
  601. hd->major = p[CFHEADER_versionMajor];
  602. hd->folder_count = archive_le16dec(p + CFHEADER_cFolders);
  603. if (hd->folder_count == 0)
  604. goto invalid;
  605. hd->file_count = archive_le16dec(p + CFHEADER_cFiles);
  606. if (hd->file_count == 0)
  607. goto invalid;
  608. hd->flags = archive_le16dec(p + CFHEADER_flags);
  609. hd->setid = archive_le16dec(p + CFHEADER_setID);
  610. hd->cabinet = archive_le16dec(p + CFHEADER_iCabinet);
  611. used = CFHEADER_iCabinet + 2;
  612. if (hd->flags & RESERVE_PRESENT) {
  613. uint16_t cfheader;
  614. cfheader = archive_le16dec(p + CFHEADER_cbCFHeader);
  615. if (cfheader > 60000U)
  616. goto invalid;
  617. hd->cffolder = p[CFHEADER_cbCFFolder];
  618. hd->cfdata = p[CFHEADER_cbCFData];
  619. used += 4;/* cbCFHeader, cbCFFolder and cbCFData */
  620. used += cfheader;/* abReserve */
  621. } else
  622. hd->cffolder = 0;/* Avoid compiling warning. */
  623. if (hd->flags & PREV_CABINET) {
  624. /* How many bytes are used for szCabinetPrev. */
  625. if ((p = __archive_read_ahead(a, used+256, NULL)) == NULL)
  626. return (truncated_error(a));
  627. if ((len = cab_strnlen(p + used, 255)) <= 0)
  628. goto invalid;
  629. used += len + 1;
  630. /* How many bytes are used for szDiskPrev. */
  631. if ((p = __archive_read_ahead(a, used+256, NULL)) == NULL)
  632. return (truncated_error(a));
  633. if ((len = cab_strnlen(p + used, 255)) <= 0)
  634. goto invalid;
  635. used += len + 1;
  636. }
  637. if (hd->flags & NEXT_CABINET) {
  638. /* How many bytes are used for szCabinetNext. */
  639. if ((p = __archive_read_ahead(a, used+256, NULL)) == NULL)
  640. return (truncated_error(a));
  641. if ((len = cab_strnlen(p + used, 255)) <= 0)
  642. goto invalid;
  643. used += len + 1;
  644. /* How many bytes are used for szDiskNext. */
  645. if ((p = __archive_read_ahead(a, used+256, NULL)) == NULL)
  646. return (truncated_error(a));
  647. if ((len = cab_strnlen(p + used, 255)) <= 0)
  648. goto invalid;
  649. used += len + 1;
  650. }
  651. __archive_read_consume(a, used);
  652. cab->cab_offset += used;
  653. used = 0;
  654. /*
  655. * Read CFFOLDER.
  656. */
  657. hd->folder_array = (struct cffolder *)calloc(
  658. hd->folder_count, sizeof(struct cffolder));
  659. if (hd->folder_array == NULL)
  660. goto nomem;
  661. bytes = 8;
  662. if (hd->flags & RESERVE_PRESENT)
  663. bytes += hd->cffolder;
  664. bytes *= hd->folder_count;
  665. if ((p = __archive_read_ahead(a, bytes, NULL)) == NULL)
  666. return (truncated_error(a));
  667. offset32 = 0;
  668. for (i = 0; i < hd->folder_count; i++) {
  669. struct cffolder *folder = &(hd->folder_array[i]);
  670. folder->cfdata_offset_in_cab =
  671. archive_le32dec(p + CFFOLDER_coffCabStart);
  672. folder->cfdata_count = archive_le16dec(p+CFFOLDER_cCFData);
  673. folder->comptype =
  674. archive_le16dec(p+CFFOLDER_typeCompress) & 0x0F;
  675. folder->compdata =
  676. archive_le16dec(p+CFFOLDER_typeCompress) >> 8;
  677. /* Get a compression name. */
  678. if (folder->comptype <
  679. sizeof(compression_name) / sizeof(compression_name[0]))
  680. folder->compname = compression_name[folder->comptype];
  681. else
  682. folder->compname = "UNKNOWN";
  683. p += 8;
  684. used += 8;
  685. if (hd->flags & RESERVE_PRESENT) {
  686. p += hd->cffolder;/* abReserve */
  687. used += hd->cffolder;
  688. }
  689. /*
  690. * Sanity check if each data is acceptable.
  691. */
  692. if (offset32 >= folder->cfdata_offset_in_cab)
  693. goto invalid;
  694. offset32 = folder->cfdata_offset_in_cab;
  695. /* Set a request to initialize zlib for the CFDATA of
  696. * this folder. */
  697. folder->decompress_init = 0;
  698. }
  699. __archive_read_consume(a, used);
  700. cab->cab_offset += used;
  701. /*
  702. * Read CFFILE.
  703. */
  704. /* Seek read pointer to the offset of CFFILE if needed. */
  705. skip = (int64_t)hd->files_offset - cab->cab_offset;
  706. if (skip < 0) {
  707. archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
  708. "Invalid offset of CFFILE %jd < %jd",
  709. (intmax_t)hd->files_offset, (intmax_t)cab->cab_offset);
  710. return (ARCHIVE_FATAL);
  711. }
  712. if (skip) {
  713. __archive_read_consume(a, skip);
  714. cab->cab_offset += skip;
  715. }
  716. /* Allocate memory for CFDATA */
  717. hd->file_array = (struct cffile *)calloc(
  718. hd->file_count, sizeof(struct cffile));
  719. if (hd->file_array == NULL)
  720. goto nomem;
  721. prev_folder = -1;
  722. for (i = 0; i < hd->file_count; i++) {
  723. struct cffile *file = &(hd->file_array[i]);
  724. ssize_t avail;
  725. if ((p = __archive_read_ahead(a, 16, NULL)) == NULL)
  726. return (truncated_error(a));
  727. file->uncompressed_size = archive_le32dec(p + CFFILE_cbFile);
  728. file->offset = archive_le32dec(p + CFFILE_uoffFolderStart);
  729. file->folder = archive_le16dec(p + CFFILE_iFolder);
  730. file->mtime = cab_dos_time(p + CFFILE_date_time);
  731. file->attr = (uint8_t)archive_le16dec(p + CFFILE_attribs);
  732. __archive_read_consume(a, 16);
  733. cab->cab_offset += 16;
  734. if ((p = cab_read_ahead_remaining(a, 256, &avail)) == NULL)
  735. return (truncated_error(a));
  736. if ((len = cab_strnlen(p, avail-1)) <= 0)
  737. goto invalid;
  738. /* Copy a pathname. */
  739. archive_string_init(&(file->pathname));
  740. archive_strncpy(&(file->pathname), p, len);
  741. __archive_read_consume(a, len + 1);
  742. cab->cab_offset += len + 1;
  743. /*
  744. * Sanity check if each data is acceptable.
  745. */
  746. if (file->uncompressed_size > 0x7FFF8000)
  747. goto invalid;/* Too large */
  748. if ((int64_t)file->offset + (int64_t)file->uncompressed_size
  749. > ARCHIVE_LITERAL_LL(0x7FFF8000))
  750. goto invalid;/* Too large */
  751. switch (file->folder) {
  752. case iFoldCONTINUED_TO_NEXT:
  753. /* This must be last file in a folder. */
  754. if (i != hd->file_count -1)
  755. goto invalid;
  756. cur_folder = hd->folder_count -1;
  757. break;
  758. case iFoldCONTINUED_PREV_AND_NEXT:
  759. /* This must be only one file in a folder. */
  760. if (hd->file_count != 1)
  761. goto invalid;
  762. /* FALL THROUGH */
  763. case iFoldCONTINUED_FROM_PREV:
  764. /* This must be first file in a folder. */
  765. if (i != 0)
  766. goto invalid;
  767. prev_folder = cur_folder = 0;
  768. offset32 = file->offset;
  769. break;
  770. default:
  771. if (file->folder >= hd->folder_count)
  772. goto invalid;
  773. cur_folder = file->folder;
  774. break;
  775. }
  776. /* Dot not back track. */
  777. if (cur_folder < prev_folder)
  778. goto invalid;
  779. if (cur_folder != prev_folder)
  780. offset32 = 0;
  781. prev_folder = cur_folder;
  782. /* Make sure there are not any blanks from last file
  783. * contents. */
  784. if (offset32 != file->offset)
  785. goto invalid;
  786. offset32 += file->uncompressed_size;
  787. /* CFDATA is available for file contents. */
  788. if (file->uncompressed_size > 0 &&
  789. hd->folder_array[cur_folder].cfdata_count == 0)
  790. goto invalid;
  791. }
  792. if (hd->cabinet != 0 || hd->flags & (PREV_CABINET | NEXT_CABINET)) {
  793. archive_set_error(&a->archive, ARCHIVE_ERRNO_FILE_FORMAT,
  794. "Multivolume cabinet file is unsupported");
  795. return (ARCHIVE_WARN);
  796. }
  797. return (ARCHIVE_OK);
  798. invalid:
  799. archive_set_error(&a->archive, ARCHIVE_ERRNO_FILE_FORMAT,
  800. "Invalid CAB header");
  801. return (ARCHIVE_FATAL);
  802. nomem:
  803. archive_set_error(&a->archive, ENOMEM,
  804. "Can't allocate memory for CAB data");
  805. return (ARCHIVE_FATAL);
  806. }
  807. static int
  808. archive_read_format_cab_read_header(struct archive_read *a,
  809. struct archive_entry *entry)
  810. {
  811. struct cab *cab;
  812. struct cfheader *hd;
  813. struct cffolder *prev_folder;
  814. struct cffile *file;
  815. struct archive_string_conv *sconv;
  816. int err = ARCHIVE_OK, r;
  817. cab = (struct cab *)(a->format->data);
  818. if (cab->found_header == 0) {
  819. err = cab_read_header(a);
  820. if (err < ARCHIVE_WARN)
  821. return (err);
  822. /* We've found the header. */
  823. cab->found_header = 1;
  824. }
  825. hd = &cab->cfheader;
  826. if (hd->file_index >= hd->file_count) {
  827. cab->end_of_archive = 1;
  828. return (ARCHIVE_EOF);
  829. }
  830. file = &hd->file_array[hd->file_index++];
  831. cab->end_of_entry = 0;
  832. cab->end_of_entry_cleanup = 0;
  833. cab->entry_compressed_bytes_read = 0;
  834. cab->entry_uncompressed_bytes_read = 0;
  835. cab->entry_unconsumed = 0;
  836. cab->entry_cffile = file;
  837. /*
  838. * Choose a proper folder.
  839. */
  840. prev_folder = cab->entry_cffolder;
  841. switch (file->folder) {
  842. case iFoldCONTINUED_FROM_PREV:
  843. case iFoldCONTINUED_PREV_AND_NEXT:
  844. cab->entry_cffolder = &hd->folder_array[0];
  845. break;
  846. case iFoldCONTINUED_TO_NEXT:
  847. cab->entry_cffolder = &hd->folder_array[hd->folder_count-1];
  848. break;
  849. default:
  850. cab->entry_cffolder = &hd->folder_array[file->folder];
  851. break;
  852. }
  853. /* If a cffolder of this file is changed, reset a cfdata to read
  854. * file contents from next cfdata. */
  855. if (prev_folder != cab->entry_cffolder)
  856. cab->entry_cfdata = NULL;
  857. /* If a pathname is UTF-8, prepare a string conversion object
  858. * for UTF-8 and use it. */
  859. if (file->attr & ATTR_NAME_IS_UTF) {
  860. if (cab->sconv_utf8 == NULL) {
  861. cab->sconv_utf8 =
  862. archive_string_conversion_from_charset(
  863. &(a->archive), "UTF-8", 1);
  864. if (cab->sconv_utf8 == NULL)
  865. return (ARCHIVE_FATAL);
  866. }
  867. sconv = cab->sconv_utf8;
  868. } else if (cab->sconv != NULL) {
  869. /* Choose the conversion specified by the option. */
  870. sconv = cab->sconv;
  871. } else {
  872. /* Choose the default conversion. */
  873. if (!cab->init_default_conversion) {
  874. cab->sconv_default =
  875. archive_string_default_conversion_for_read(
  876. &(a->archive));
  877. cab->init_default_conversion = 1;
  878. }
  879. sconv = cab->sconv_default;
  880. }
  881. /*
  882. * Set a default value and common data
  883. */
  884. r = cab_convert_path_separator_1(&(file->pathname), file->attr);
  885. if (archive_entry_copy_pathname_l(entry, file->pathname.s,
  886. archive_strlen(&(file->pathname)), sconv) != 0) {
  887. if (errno == ENOMEM) {
  888. archive_set_error(&a->archive, ENOMEM,
  889. "Can't allocate memory for Pathname");
  890. return (ARCHIVE_FATAL);
  891. }
  892. archive_set_error(&a->archive,
  893. ARCHIVE_ERRNO_FILE_FORMAT,
  894. "Pathname cannot be converted "
  895. "from %s to current locale.",
  896. archive_string_conversion_charset_name(sconv));
  897. err = ARCHIVE_WARN;
  898. }
  899. if (r < 0) {
  900. /* Convert a path separator '\' -> '/' */
  901. cab_convert_path_separator_2(cab, entry);
  902. }
  903. archive_entry_set_size(entry, file->uncompressed_size);
  904. if (file->attr & ATTR_RDONLY)
  905. archive_entry_set_mode(entry, AE_IFREG | 0555);
  906. else
  907. archive_entry_set_mode(entry, AE_IFREG | 0666);
  908. archive_entry_set_mtime(entry, file->mtime, 0);
  909. cab->entry_bytes_remaining = file->uncompressed_size;
  910. cab->entry_offset = 0;
  911. /* We don't need compress data. */
  912. if (file->uncompressed_size == 0)
  913. cab->end_of_entry_cleanup = cab->end_of_entry = 1;
  914. /* Set up a more descriptive format name. */
  915. snprintf(cab->format_name, sizeof(cab->format_name), "CAB %d.%d (%s)",
  916. hd->major, hd->minor, cab->entry_cffolder->compname);
  917. a->archive.archive_format_name = cab->format_name;
  918. return (err);
  919. }
  920. static int
  921. archive_read_format_cab_read_data(struct archive_read *a,
  922. const void **buff, size_t *size, int64_t *offset)
  923. {
  924. struct cab *cab = (struct cab *)(a->format->data);
  925. int r;
  926. switch (cab->entry_cffile->folder) {
  927. case iFoldCONTINUED_FROM_PREV:
  928. case iFoldCONTINUED_TO_NEXT:
  929. case iFoldCONTINUED_PREV_AND_NEXT:
  930. *buff = NULL;
  931. *size = 0;
  932. *offset = 0;
  933. archive_clear_error(&a->archive);
  934. archive_set_error(&a->archive, ARCHIVE_ERRNO_FILE_FORMAT,
  935. "Cannot restore this file split in multivolume.");
  936. return (ARCHIVE_FAILED);
  937. default:
  938. break;
  939. }
  940. if (cab->read_data_invoked == 0) {
  941. if (cab->bytes_skipped) {
  942. if (cab->entry_cfdata == NULL) {
  943. r = cab_next_cfdata(a);
  944. if (r < 0)
  945. return (r);
  946. }
  947. if (cab_consume_cfdata(a, cab->bytes_skipped) < 0)
  948. return (ARCHIVE_FATAL);
  949. cab->bytes_skipped = 0;
  950. }
  951. cab->read_data_invoked = 1;
  952. }
  953. if (cab->entry_unconsumed) {
  954. /* Consume as much as the compressor actually used. */
  955. r = (int)cab_consume_cfdata(a, cab->entry_unconsumed);
  956. cab->entry_unconsumed = 0;
  957. if (r < 0)
  958. return (r);
  959. }
  960. if (cab->end_of_archive || cab->end_of_entry) {
  961. if (!cab->end_of_entry_cleanup) {
  962. /* End-of-entry cleanup done. */
  963. cab->end_of_entry_cleanup = 1;
  964. }
  965. *offset = cab->entry_offset;
  966. *size = 0;
  967. *buff = NULL;
  968. return (ARCHIVE_EOF);
  969. }
  970. return (cab_read_data(a, buff, size, offset));
  971. }
  972. static uint32_t
  973. cab_checksum_cfdata_4(const void *p, size_t bytes, uint32_t seed)
  974. {
  975. const unsigned char *b;
  976. unsigned u32num;
  977. uint32_t sum;
  978. u32num = (unsigned)bytes / 4;
  979. sum = seed;
  980. b = p;
  981. for (;u32num > 0; --u32num) {
  982. sum ^= archive_le32dec(b);
  983. b += 4;
  984. }
  985. return (sum);
  986. }
  987. static uint32_t
  988. cab_checksum_cfdata(const void *p, size_t bytes, uint32_t seed)
  989. {
  990. const unsigned char *b;
  991. uint32_t sum;
  992. uint32_t t;
  993. sum = cab_checksum_cfdata_4(p, bytes, seed);
  994. b = p;
  995. b += bytes & ~3;
  996. t = 0;
  997. switch (bytes & 3) {
  998. case 3:
  999. t |= ((uint32_t)(*b++)) << 16;
  1000. /* FALL THROUGH */
  1001. case 2:
  1002. t |= ((uint32_t)(*b++)) << 8;
  1003. /* FALL THROUGH */
  1004. case 1:
  1005. t |= *b;
  1006. /* FALL THROUGH */
  1007. default:
  1008. break;
  1009. }
  1010. sum ^= t;
  1011. return (sum);
  1012. }
  1013. static void
  1014. cab_checksum_update(struct archive_read *a, size_t bytes)
  1015. {
  1016. struct cab *cab = (struct cab *)(a->format->data);
  1017. struct cfdata *cfdata = cab->entry_cfdata;
  1018. const unsigned char *p;
  1019. size_t sumbytes;
  1020. if (cfdata->sum == 0 || cfdata->sum_ptr == NULL)
  1021. return;
  1022. /*
  1023. * Calculate the sum of this CFDATA.
  1024. * Make sure CFDATA must be calculated in four bytes.
  1025. */
  1026. p = cfdata->sum_ptr;
  1027. sumbytes = bytes;
  1028. if (cfdata->sum_extra_avail) {
  1029. while (cfdata->sum_extra_avail < 4 && sumbytes > 0) {
  1030. cfdata->sum_extra[
  1031. cfdata->sum_extra_avail++] = *p++;
  1032. sumbytes--;
  1033. }
  1034. if (cfdata->sum_extra_avail == 4) {
  1035. cfdata->sum_calculated = cab_checksum_cfdata_4(
  1036. cfdata->sum_extra, 4, cfdata->sum_calculated);
  1037. cfdata->sum_extra_avail = 0;
  1038. }
  1039. }
  1040. if (sumbytes) {
  1041. int odd = sumbytes & 3;
  1042. if ((int)(sumbytes - odd) > 0)
  1043. cfdata->sum_calculated = cab_checksum_cfdata_4(
  1044. p, sumbytes - odd, cfdata->sum_calculated);
  1045. if (odd)
  1046. memcpy(cfdata->sum_extra, p + sumbytes - odd, odd);
  1047. cfdata->sum_extra_avail = odd;
  1048. }
  1049. cfdata->sum_ptr = NULL;
  1050. }
  1051. static int
  1052. cab_checksum_finish(struct archive_read *a)
  1053. {
  1054. struct cab *cab = (struct cab *)(a->format->data);
  1055. struct cfdata *cfdata = cab->entry_cfdata;
  1056. int l;
  1057. /* Do not need to compute a sum. */
  1058. if (cfdata->sum == 0)
  1059. return (ARCHIVE_OK);
  1060. /*
  1061. * Calculate the sum of remaining CFDATA.
  1062. */
  1063. if (cfdata->sum_extra_avail) {
  1064. cfdata->sum_calculated =
  1065. cab_checksum_cfdata(cfdata->sum_extra,
  1066. cfdata->sum_extra_avail, cfdata->sum_calculated);
  1067. cfdata->sum_extra_avail = 0;
  1068. }
  1069. l = 4;
  1070. if (cab->cfheader.flags & RESERVE_PRESENT)
  1071. l += cab->cfheader.cfdata;
  1072. cfdata->sum_calculated = cab_checksum_cfdata(
  1073. cfdata->memimage + CFDATA_cbData, l, cfdata->sum_calculated);
  1074. if (cfdata->sum_calculated != cfdata->sum) {
  1075. #ifndef DONT_FAIL_ON_CRC_ERROR
  1076. archive_set_error(&a->archive, ARCHIVE_ERRNO_FILE_FORMAT,
  1077. "Checksum error CFDATA[%d] %" PRIx32 ":%" PRIx32 " in %d bytes",
  1078. cab->entry_cffolder->cfdata_index -1,
  1079. cfdata->sum, cfdata->sum_calculated,
  1080. cfdata->compressed_size);
  1081. return (ARCHIVE_FAILED);
  1082. #endif
  1083. }
  1084. return (ARCHIVE_OK);
  1085. }
  1086. /*
  1087. * Read CFDATA if needed.
  1088. */
  1089. static int
  1090. cab_next_cfdata(struct archive_read *a)
  1091. {
  1092. struct cab *cab = (struct cab *)(a->format->data);
  1093. struct cfdata *cfdata = cab->entry_cfdata;
  1094. /* There are remaining bytes in current CFDATA, use it first. */
  1095. if (cfdata != NULL && cfdata->uncompressed_bytes_remaining > 0)
  1096. return (ARCHIVE_OK);
  1097. if (cfdata == NULL) {
  1098. int64_t skip;
  1099. cab->entry_cffolder->cfdata_index = 0;
  1100. /* Seek read pointer to the offset of CFDATA if needed. */
  1101. skip = cab->entry_cffolder->cfdata_offset_in_cab
  1102. - cab->cab_offset;
  1103. if (skip < 0) {
  1104. int folder_index;
  1105. switch (cab->entry_cffile->folder) {
  1106. case iFoldCONTINUED_FROM_PREV:
  1107. case iFoldCONTINUED_PREV_AND_NEXT:
  1108. folder_index = 0;
  1109. break;
  1110. case iFoldCONTINUED_TO_NEXT:
  1111. folder_index = cab->cfheader.folder_count-1;
  1112. break;
  1113. default:
  1114. folder_index = cab->entry_cffile->folder;
  1115. break;
  1116. }
  1117. archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
  1118. "Invalid offset of CFDATA in folder(%d) %jd < %jd",
  1119. folder_index,
  1120. (intmax_t)cab->entry_cffolder->cfdata_offset_in_cab,
  1121. (intmax_t)cab->cab_offset);
  1122. return (ARCHIVE_FATAL);
  1123. }
  1124. if (skip > 0) {
  1125. if (__archive_read_consume(a, skip) < 0)
  1126. return (ARCHIVE_FATAL);
  1127. cab->cab_offset =
  1128. cab->entry_cffolder->cfdata_offset_in_cab;
  1129. }
  1130. }
  1131. /*
  1132. * Read a CFDATA.
  1133. */
  1134. if (cab->entry_cffolder->cfdata_index <
  1135. cab->entry_cffolder->cfdata_count) {
  1136. const unsigned char *p;
  1137. int l;
  1138. cfdata = &(cab->entry_cffolder->cfdata);
  1139. cab->entry_cffolder->cfdata_index++;
  1140. cab->entry_cfdata = cfdata;
  1141. cfdata->sum_calculated = 0;
  1142. cfdata->sum_extra_avail = 0;
  1143. cfdata->sum_ptr = NULL;
  1144. l = 8;
  1145. if (cab->cfheader.flags & RESERVE_PRESENT)
  1146. l += cab->cfheader.cfdata;
  1147. if ((p = __archive_read_ahead(a, l, NULL)) == NULL)
  1148. return (truncated_error(a));
  1149. cfdata->sum = archive_le32dec(p + CFDATA_csum);
  1150. cfdata->compressed_size = archive_le16dec(p + CFDATA_cbData);
  1151. cfdata->compressed_bytes_remaining = cfdata->compressed_size;
  1152. cfdata->uncompressed_size =
  1153. archive_le16dec(p + CFDATA_cbUncomp);
  1154. cfdata->uncompressed_bytes_remaining =
  1155. cfdata->uncompressed_size;
  1156. cfdata->uncompressed_avail = 0;
  1157. cfdata->read_offset = 0;
  1158. cfdata->unconsumed = 0;
  1159. /*
  1160. * Sanity check if data size is acceptable.
  1161. */
  1162. if (cfdata->compressed_size == 0 ||
  1163. cfdata->compressed_size > (0x8000+6144))
  1164. goto invalid;
  1165. if (cfdata->uncompressed_size > 0x8000)
  1166. goto invalid;
  1167. if (cfdata->uncompressed_size == 0) {
  1168. switch (cab->entry_cffile->folder) {
  1169. case iFoldCONTINUED_PREV_AND_NEXT:
  1170. case iFoldCONTINUED_TO_NEXT:
  1171. break;
  1172. case iFoldCONTINUED_FROM_PREV:
  1173. default:
  1174. goto invalid;
  1175. }
  1176. }
  1177. /* If CFDATA is not last in a folder, an uncompressed
  1178. * size must be 0x8000(32KBi) */
  1179. if ((cab->entry_cffolder->cfdata_index <
  1180. cab->entry_cffolder->cfdata_count) &&
  1181. cfdata->uncompressed_size != 0x8000)
  1182. goto invalid;
  1183. /* A compressed data size and an uncompressed data size must
  1184. * be the same in no compression mode. */
  1185. if (cab->entry_cffolder->comptype == COMPTYPE_NONE &&
  1186. cfdata->compressed_size != cfdata->uncompressed_size)
  1187. goto invalid;
  1188. /*
  1189. * Save CFDATA image for sum check.
  1190. */
  1191. if (cfdata->memimage_size < (size_t)l) {
  1192. free(cfdata->memimage);
  1193. cfdata->memimage = malloc(l);
  1194. if (cfdata->memimage == NULL) {
  1195. archive_set_error(&a->archive, ENOMEM,
  1196. "Can't allocate memory for CAB data");
  1197. return (ARCHIVE_FATAL);
  1198. }
  1199. cfdata->memimage_size = l;
  1200. }
  1201. memcpy(cfdata->memimage, p, l);
  1202. /* Consume bytes as much as we used. */
  1203. __archive_read_consume(a, l);
  1204. cab->cab_offset += l;
  1205. } else if (cab->entry_cffolder->cfdata_count > 0) {
  1206. /* Run out of all CFDATA in a folder. */
  1207. cfdata->compressed_size = 0;
  1208. cfdata->uncompressed_size = 0;
  1209. cfdata->compressed_bytes_remaining = 0;
  1210. cfdata->uncompressed_bytes_remaining = 0;
  1211. } else {
  1212. /* Current folder does not have any CFDATA. */
  1213. cfdata = &(cab->entry_cffolder->cfdata);
  1214. cab->entry_cfdata = cfdata;
  1215. memset(cfdata, 0, sizeof(*cfdata));
  1216. }
  1217. return (ARCHIVE_OK);
  1218. invalid:
  1219. archive_set_error(&a->archive, ARCHIVE_ERRNO_FILE_FORMAT,
  1220. "Invalid CFDATA");
  1221. return (ARCHIVE_FATAL);
  1222. }
  1223. /*
  1224. * Read ahead CFDATA.
  1225. */
  1226. static const void *
  1227. cab_read_ahead_cfdata(struct archive_read *a, ssize_t *avail)
  1228. {
  1229. struct cab *cab = (struct cab *)(a->format->data);
  1230. int err;
  1231. err = cab_next_cfdata(a);
  1232. if (err < ARCHIVE_OK) {
  1233. *avail = err;
  1234. return (NULL);
  1235. }
  1236. switch (cab->entry_cffolder->comptype) {
  1237. case COMPTYPE_NONE:
  1238. return (cab_read_ahead_cfdata_none(a, avail));
  1239. case COMPTYPE_MSZIP:
  1240. return (cab_read_ahead_cfdata_deflate(a, avail));
  1241. case COMPTYPE_LZX:
  1242. return (cab_read_ahead_cfdata_lzx(a, avail));
  1243. default: /* Unsupported compression. */
  1244. archive_set_error(&a->archive, ARCHIVE_ERRNO_FILE_FORMAT,
  1245. "Unsupported CAB compression : %s",
  1246. cab->entry_cffolder->compname);
  1247. *avail = ARCHIVE_FAILED;
  1248. return (NULL);
  1249. }
  1250. }
  1251. /*
  1252. * Read ahead CFDATA as uncompressed data.
  1253. */
  1254. static const void *
  1255. cab_read_ahead_cfdata_none(struct archive_read *a, ssize_t *avail)
  1256. {
  1257. struct cab *cab = (struct cab *)(a->format->data);
  1258. struct cfdata *cfdata;
  1259. const void *d;
  1260. cfdata = cab->entry_cfdata;
  1261. /*
  1262. * Note: '1' here is a performance optimization.
  1263. * Recall that the decompression layer returns a count of
  1264. * available bytes; asking for more than that forces the
  1265. * decompressor to combine reads by copying data.
  1266. */
  1267. d = __archive_read_ahead(a, 1, avail);
  1268. if (*avail <= 0) {
  1269. *avail = truncated_error(a);
  1270. return (NULL);
  1271. }
  1272. if (*avail > cfdata->uncompressed_bytes_remaining)
  1273. *avail = cfdata->uncompressed_bytes_remaining;
  1274. cfdata->uncompressed_avail = cfdata->uncompressed_size;
  1275. cfdata->unconsumed = *avail;
  1276. cfdata->sum_ptr = d;
  1277. return (d);
  1278. }
  1279. /*
  1280. * Read ahead CFDATA as deflate data.
  1281. */
  1282. #ifdef HAVE_ZLIB_H
  1283. static const void *
  1284. cab_read_ahead_cfdata_deflate(struct archive_read *a, ssize_t *avail)
  1285. {
  1286. struct cab *cab = (struct cab *)(a->format->data);
  1287. struct cfdata *cfdata;
  1288. const void *d;
  1289. int r, mszip;
  1290. uint16_t uavail;
  1291. char eod = 0;
  1292. cfdata = cab->entry_cfdata;
  1293. /* If the buffer hasn't been allocated, allocate it now. */
  1294. if (cab->uncompressed_buffer == NULL) {
  1295. cab->uncompressed_buffer_size = 0x8000;
  1296. cab->uncompressed_buffer
  1297. = (unsigned char *)malloc(cab->uncompressed_buffer_size);
  1298. if (cab->uncompressed_buffer == NULL) {
  1299. archive_set_error(&a->archive, ENOMEM,
  1300. "No memory for CAB reader");
  1301. *avail = ARCHIVE_FATAL;
  1302. return (NULL);
  1303. }
  1304. }
  1305. uavail = cfdata->uncompressed_avail;
  1306. if (uavail == cfdata->uncompressed_size) {
  1307. d = cab->uncompressed_buffer + cfdata->read_offset;
  1308. *avail = uavail - cfdata->read_offset;
  1309. return (d);
  1310. }
  1311. if (!cab->entry_cffolder->decompress_init) {
  1312. cab->stream.next_in = NULL;
  1313. cab->stream.avail_in = 0;
  1314. cab->stream.total_in = 0;
  1315. cab->stream.next_out = NULL;
  1316. cab->stream.avail_out = 0;
  1317. cab->stream.total_out = 0;
  1318. if (cab->stream_valid)
  1319. r = inflateReset(&cab->stream);
  1320. else
  1321. r = inflateInit2(&cab->stream,
  1322. -15 /* Don't check for zlib header */);
  1323. if (r != Z_OK) {
  1324. archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
  1325. "Can't initialize deflate decompression.");
  1326. *avail = ARCHIVE_FATAL;
  1327. return (NULL);
  1328. }
  1329. /* Stream structure has been set up. */
  1330. cab->stream_valid = 1;
  1331. /* We've initialized decompression for this stream. */
  1332. cab->entry_cffolder->decompress_init = 1;
  1333. }
  1334. if (cfdata->compressed_bytes_remaining == cfdata->compressed_size)
  1335. mszip = 2;
  1336. else
  1337. mszip = 0;
  1338. eod = 0;
  1339. cab->stream.total_out = uavail;
  1340. /*
  1341. * We always uncompress all data in current CFDATA.
  1342. */
  1343. while (!eod && cab->stream.total_out < cfdata->uncompressed_size) {
  1344. ssize_t bytes_avail;
  1345. cab->stream.next_out =
  1346. cab->uncompressed_buffer + cab->stream.total_out;
  1347. cab->stream.avail_out =
  1348. cfdata->uncompressed_size - cab->stream.total_out;
  1349. d = __archive_read_ahead(a, 1, &bytes_avail);
  1350. if (bytes_avail <= 0) {
  1351. *avail = truncated_error(a);
  1352. return (NULL);
  1353. }
  1354. if (bytes_avail > cfdata->compressed_bytes_remaining)
  1355. bytes_avail = cfdata->compressed_bytes_remaining;
  1356. /*
  1357. * A bug in zlib.h: stream.next_in should be marked 'const'
  1358. * but isn't (the library never alters data through the
  1359. * next_in pointer, only reads it). The result: this ugly
  1360. * cast to remove 'const'.
  1361. */
  1362. cab->stream.next_in = (Bytef *)(uintptr_t)d;
  1363. cab->stream.avail_in = (uInt)bytes_avail;
  1364. cab->stream.total_in = 0;
  1365. /* Cut out a tow-byte MSZIP signature(0x43, 0x4b). */
  1366. if (mszip > 0) {
  1367. if (bytes_avail <= 0)
  1368. goto nomszip;
  1369. if (bytes_avail <= mszip) {
  1370. if (mszip == 2) {
  1371. if (cab->stream.next_in[0] != 0x43)
  1372. goto nomszip;
  1373. if (bytes_avail > 1 &&
  1374. cab->stream.next_in[1] != 0x4b)
  1375. goto nomszip;
  1376. } else if (cab->stream.next_in[0] != 0x4b)
  1377. goto nomszip;
  1378. cfdata->unconsumed = bytes_avail;
  1379. cfdata->sum_ptr = d;
  1380. if (cab_minimum_consume_cfdata(
  1381. a, cfdata->unconsumed) < 0) {
  1382. *avail = ARCHIVE_FATAL;
  1383. return (NULL);
  1384. }
  1385. mszip -= (int)bytes_avail;
  1386. continue;
  1387. }
  1388. if (mszip == 1 && cab->stream.next_in[0] != 0x4b)
  1389. goto nomszip;
  1390. else if (mszip == 2 && (cab->stream.next_in[0] != 0x43 ||
  1391. cab->stream.next_in[1] != 0x4b))
  1392. goto nomszip;
  1393. cab->stream.next_in += mszip;
  1394. cab->stream.avail_in -= mszip;
  1395. cab->stream.total_in += mszip;
  1396. mszip = 0;
  1397. }
  1398. r = inflate(&cab->stream, 0);
  1399. switch (r) {
  1400. case Z_OK:
  1401. break;
  1402. case Z_STREAM_END:
  1403. eod = 1;
  1404. break;
  1405. default:
  1406. goto zlibfailed;
  1407. }
  1408. cfdata->unconsumed = cab->stream.total_in;
  1409. cfdata->sum_ptr = d;
  1410. if (cab_minimum_consume_cfdata(a, cfdata->unconsumed) < 0) {
  1411. *avail = ARCHIVE_FATAL;
  1412. return (NULL);
  1413. }
  1414. }
  1415. uavail = (uint16_t)cab->stream.total_out;
  1416. if (uavail < cfdata->uncompressed_size) {
  1417. archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
  1418. "Invalid uncompressed size (%d < %d)",
  1419. uavail, cfdata->uncompressed_size);
  1420. *avail = ARCHIVE_FATAL;
  1421. return (NULL);
  1422. }
  1423. /*
  1424. * Note: I suspect there is a bug in makecab.exe because, in rare
  1425. * case, compressed bytes are still remaining regardless we have
  1426. * gotten all uncompressed bytes, which size is recorded in CFDATA,
  1427. * as much as we need, and we have to use the garbage so as to
  1428. * correctly compute the sum of CFDATA accordingly.
  1429. */
  1430. if (cfdata->compressed_bytes_remaining > 0) {
  1431. ssize_t bytes_avail;
  1432. d = __archive_read_ahead(a, cfdata->compressed_bytes_remaining,
  1433. &bytes_avail);
  1434. if (bytes_avail <= 0) {
  1435. *avail = truncated_error(a);
  1436. return (NULL);
  1437. }
  1438. cfdata->unconsumed = cfdata->compressed_bytes_remaining;
  1439. cfdata->sum_ptr = d;
  1440. if (cab_minimum_consume_cfdata(a, cfdata->unconsumed) < 0) {
  1441. *avail = ARCHIVE_FATAL;
  1442. return (NULL);
  1443. }
  1444. }
  1445. /*
  1446. * Set dictionary data for decompressing of next CFDATA, which
  1447. * in the same folder. This is why we always do decompress CFDATA
  1448. * even if beginning CFDATA or some of CFDATA are not used in
  1449. * skipping file data.
  1450. */
  1451. if (cab->entry_cffolder->cfdata_index <
  1452. cab->entry_cffolder->cfdata_count) {
  1453. r = inflateReset(&cab->stream);
  1454. if (r != Z_OK)
  1455. goto zlibfailed;
  1456. r = inflateSetDictionary(&cab->stream,
  1457. cab->uncompressed_buffer, cfdata->uncompressed_size);
  1458. if (r != Z_OK)
  1459. goto zlibfailed;
  1460. }
  1461. d = cab->uncompressed_buffer + cfdata->read_offset;
  1462. *avail = uavail - cfdata->read_offset;
  1463. cfdata->uncompressed_avail = uavail;
  1464. return (d);
  1465. zlibfailed:
  1466. switch (r) {
  1467. case Z_MEM_ERROR:
  1468. archive_set_error(&a->archive, ENOMEM,
  1469. "Out of memory for deflate decompression");
  1470. break;
  1471. default:
  1472. archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
  1473. "Deflate decompression failed (%d)", r);
  1474. break;
  1475. }
  1476. *avail = ARCHIVE_FATAL;
  1477. return (NULL);
  1478. nomszip:
  1479. archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
  1480. "CFDATA incorrect(no MSZIP signature)");
  1481. *avail = ARCHIVE_FATAL;
  1482. return (NULL);
  1483. }
  1484. #else /* HAVE_ZLIB_H */
  1485. static const void *
  1486. cab_read_ahead_cfdata_deflate(struct archive_read *a, ssize_t *avail)
  1487. {
  1488. *avail = ARCHIVE_FATAL;
  1489. archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
  1490. "libarchive compiled without deflate support (no libz)");
  1491. return (NULL);
  1492. }
  1493. #endif /* HAVE_ZLIB_H */
  1494. static const void *
  1495. cab_read_ahead_cfdata_lzx(struct archive_read *a, ssize_t *avail)
  1496. {
  1497. struct cab *cab = (struct cab *)(a->format->data);
  1498. struct cfdata *cfdata;
  1499. const void *d;
  1500. int r;
  1501. uint16_t uavail;
  1502. cfdata = cab->entry_cfdata;
  1503. /* If the buffer hasn't been allocated, allocate it now. */
  1504. if (cab->uncompressed_buffer == NULL) {
  1505. cab->uncompressed_buffer_size = 0x8000;
  1506. cab->uncompressed_buffer
  1507. = (unsigned char *)malloc(cab->uncompressed_buffer_size);
  1508. if (cab->uncompressed_buffer == NULL) {
  1509. archive_set_error(&a->archive, ENOMEM,
  1510. "No memory for CAB reader");
  1511. *avail = ARCHIVE_FATAL;
  1512. return (NULL);
  1513. }
  1514. }
  1515. uavail = cfdata->uncompressed_avail;
  1516. if (uavail == cfdata->uncompressed_size) {
  1517. d = cab->uncompressed_buffer + cfdata->read_offset;
  1518. *avail = uavail - cfdata->read_offset;
  1519. return (d);
  1520. }
  1521. if (!cab->entry_cffolder->decompress_init) {
  1522. r = lzx_decode_init(&cab->xstrm,
  1523. cab->entry_cffolder->compdata);
  1524. if (r != ARCHIVE_OK) {
  1525. archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
  1526. "Can't initialize LZX decompression.");
  1527. *avail = ARCHIVE_FATAL;
  1528. return (NULL);
  1529. }
  1530. /* We've initialized decompression for this stream. */
  1531. cab->entry_cffolder->decompress_init = 1;
  1532. }
  1533. /* Clean up remaining bits of previous CFDATA. */
  1534. lzx_cleanup_bitstream(&cab->xstrm);
  1535. cab->xstrm.total_out = uavail;
  1536. while (cab->xstrm.total_out < cfdata->uncompressed_size) {
  1537. ssize_t bytes_avail;
  1538. cab->xstrm.next_out =
  1539. cab->uncompressed_buffer + cab->xstrm.total_out;
  1540. cab->xstrm.avail_out =
  1541. cfdata->uncompressed_size - cab->xstrm.total_out;
  1542. d = __archive_read_ahead(a, 1, &bytes_avail);
  1543. if (d == NULL) {
  1544. archive_set_error(&a->archive,
  1545. ARCHIVE_ERRNO_FILE_FORMAT,
  1546. "Truncated CAB file data");
  1547. *avail = ARCHIVE_FATAL;
  1548. return (NULL);
  1549. }
  1550. if (bytes_avail > cfdata->compressed_bytes_remaining)
  1551. bytes_avail = cfdata->compressed_bytes_remaining;
  1552. cab->xstrm.next_in = d;
  1553. cab->xstrm.avail_in = bytes_avail;
  1554. cab->xstrm.total_in = 0;
  1555. r = lzx_decode(&cab->xstrm,
  1556. cfdata->compressed_bytes_remaining == bytes_avail);
  1557. switch (r) {
  1558. case ARCHIVE_OK:
  1559. case ARCHIVE_EOF:
  1560. break;
  1561. default:
  1562. archive_set_error(&a->archive, ARCHIVE_ERRNO_MISC,
  1563. "LZX decompression failed (%d)", r);
  1564. *avail = ARCHIVE_FATAL;
  1565. return (NULL);
  1566. }
  1567. cfdata->unconsumed = cab->xstrm.total_in;
  1568. cfdata->sum_ptr = d;
  1569. if (cab_minimum_consume_cfdata(a, cfdata->unconsumed) < 0) {
  1570. *avail = ARCHIVE_FATAL;
  1571. return (NULL);
  1572. }
  1573. }
  1574. uavail = (uint16_t)cab->xstrm.total_out;
  1575. /*
  1576. * Make sure a read pointer advances to next CFDATA.
  1577. */
  1578. if (cfdata->compressed_bytes_remaining > 0) {
  1579. ssize_t bytes_avail;
  1580. d = __archive_read_ahead(a, cfdata->compressed_bytes_remaining,
  1581. &bytes_avail);
  1582. if (bytes_avail <= 0) {
  1583. *avail = truncated_error(a);
  1584. return (NULL);
  1585. }
  1586. cfdata->unconsumed = cfdata->compressed_bytes_remaining;
  1587. cfdata->sum_ptr = d;
  1588. if (cab_minimum_consume_cfdata(a, cfdata->unconsumed) < 0) {
  1589. *avail = ARCHIVE_FATAL;
  1590. return (NULL);
  1591. }
  1592. }
  1593. /*
  1594. * Translation reversal of x86 processor CALL byte sequence(E8).
  1595. */
  1596. lzx_translation(&cab->xstrm, cab->uncompressed_buffer,
  1597. cfdata->uncompressed_size,
  1598. (cab->entry_cffolder->cfdata_index-1) * 0x8000);
  1599. d = cab->uncompressed_buffer + cfdata->read_offset;
  1600. *avail = uavail - cfdata->read_offset;
  1601. cfdata->uncompressed_avail = uavail;
  1602. return (d);
  1603. }
  1604. /*
  1605. * Consume CFDATA.
  1606. * We always decompress CFDATA to consume CFDATA as much as we need
  1607. * in uncompressed bytes because all CFDATA in a folder are related
  1608. * so we do not skip any CFDATA without decompressing.
  1609. * Note: If the folder of a CFFILE is iFoldCONTINUED_PREV_AND_NEXT or
  1610. * iFoldCONTINUED_FROM_PREV, we won't decompress because a CFDATA for
  1611. * the CFFILE is remaining bytes of previous Multivolume CAB file.
  1612. */
  1613. static int64_t
  1614. cab_consume_cfdata(struct archive_read *a, int64_t consumed_bytes)
  1615. {
  1616. struct cab *cab = (struct cab *)(a->format->data);
  1617. struct cfdata *cfdata;
  1618. int64_t cbytes, rbytes;
  1619. int err;
  1620. rbytes = cab_minimum_consume_cfdata(a, consumed_bytes);
  1621. if (rbytes < 0)
  1622. return (ARCHIVE_FATAL);
  1623. cfdata = cab->entry_cfdata;
  1624. while (rbytes > 0) {
  1625. ssize_t avail;
  1626. if (cfdata->compressed_size == 0) {
  1627. archive_set_error(&a->archive,
  1628. ARCHIVE_ERRNO_FILE_FORMAT,
  1629. "Invalid CFDATA");
  1630. return (ARCHIVE_FATAL);
  1631. }
  1632. cbytes = cfdata->uncompressed_bytes_remaining;
  1633. if (cbytes > rbytes)
  1634. cbytes = rbytes;
  1635. rbytes -= cbytes;
  1636. if (cfdata->uncompressed_avail == 0 &&
  1637. (cab->entry_cffile->folder == iFoldCONTINUED_PREV_AND_NEXT ||
  1638. cab->entry_cffile->folder == iFoldCONTINUED_FROM_PREV)) {
  1639. /* We have not read any data yet. */
  1640. if (cbytes == cfdata->uncompressed_bytes_remaining) {
  1641. /* Skip whole current CFDATA. */
  1642. __archive_read_consume(a,
  1643. cfdata->compressed_size);
  1644. cab->cab_offset += cfdata->compressed_size;
  1645. cfdata->compressed_bytes_remaining = 0;
  1646. cfdata->uncompressed_bytes_remaining = 0;
  1647. err = cab_next_cfdata(a);
  1648. if (err < 0)
  1649. return (err);
  1650. cfdata = cab->entry_cfdata;
  1651. if (cfdata->uncompressed_size == 0) {
  1652. switch (cab->entry_cffile->folder) {
  1653. case iFoldCONTINUED_PREV_AND_NEXT:
  1654. case iFoldCONTINUED_TO_NEXT:
  1655. case iFoldCONTINUED_FROM_PREV:
  1656. rbytes = 0;
  1657. break;
  1658. default:
  1659. break;
  1660. }
  1661. }
  1662. continue;
  1663. }
  1664. cfdata->read_offset += (uint16_t)cbytes;
  1665. cfdata->uncompressed_bytes_remaining -= (uint16_t)cbytes;
  1666. break;
  1667. } else if (cbytes == 0) {
  1668. err = cab_next_cfdata(a);
  1669. if (err < 0)
  1670. return (err);
  1671. cfdata = cab->entry_cfdata;
  1672. if (cfdata->uncompressed_size == 0) {
  1673. switch (cab->entry_cffile->folder) {
  1674. case iFoldCONTINUED_PREV_AND_NEXT:
  1675. case iFoldCONTINUED_TO_NEXT:
  1676. case iFoldCONTINUED_FROM_PREV:
  1677. return (ARCHIVE_FATAL);
  1678. default:
  1679. break;
  1680. }
  1681. }
  1682. continue;
  1683. }
  1684. while (cbytes > 0) {
  1685. (void)cab_read_ahead_cfdata(a, &avail);
  1686. if (avail <= 0)
  1687. return (ARCHIVE_FATAL);
  1688. if (avail > cbytes)
  1689. avail = (ssize_t)cbytes;
  1690. if (cab_minimum_consume_cfdata(a, avail) < 0)
  1691. return (ARCHIVE_FATAL);
  1692. cbytes -= avail;
  1693. }
  1694. }
  1695. return (consumed_bytes);
  1696. }
  1697. /*
  1698. * Consume CFDATA as much as we have already gotten and
  1699. * compute the sum of CFDATA.
  1700. */
  1701. static int64_t
  1702. cab_minimum_consume_cfdata(struct archive_read *a, int64_t consumed_bytes)
  1703. {
  1704. struct cab *cab = (struct cab *)(a->format->data);
  1705. struct cfdata *cfdata;
  1706. int64_t cbytes, rbytes;
  1707. int err;
  1708. cfdata = cab->entry_cfdata;
  1709. rbytes = consumed_bytes;
  1710. if (cab->entry_cffolder->comptype == COMPTYPE_NONE) {
  1711. if (consumed_bytes < cfdata->unconsumed)
  1712. cbytes = consumed_bytes;
  1713. else
  1714. cbytes = cfdata->unconsumed;
  1715. rbytes -= cbytes;
  1716. cfdata->read_offset += (uint16_t)cbytes;
  1717. cfdata->uncompressed_bytes_remaining -= (uint16_t)cbytes;
  1718. cfdata->unconsumed -= cbytes;
  1719. } else {
  1720. cbytes = cfdata->uncompressed_avail - cfdata->read_offset;
  1721. if (cbytes > 0) {
  1722. if (consumed_bytes < cbytes)
  1723. cbytes = consumed_bytes;
  1724. rbytes -= cbytes;
  1725. cfdata->read_offset += (uint16_t)cbytes;
  1726. cfdata->uncompressed_bytes_remaining -= (uint16_t)cbytes;
  1727. }
  1728. if (cfdata->unconsumed) {
  1729. cbytes = cfdata->unconsumed;
  1730. cfdata->unconsumed = 0;
  1731. } else
  1732. cbytes = 0;
  1733. }
  1734. if (cbytes) {
  1735. /* Compute the sum. */
  1736. cab_checksum_update(a, (size_t)cbytes);
  1737. /* Consume as much as the compressor actually used. */
  1738. __archive_read_consume(a, cbytes);
  1739. cab->cab_offset += cbytes;
  1740. cfdata->compressed_bytes_remaining -= (uint16_t)cbytes;
  1741. if (cfdata->compressed_bytes_remaining == 0) {
  1742. err = cab_checksum_finish(a);
  1743. if (err < 0)
  1744. return (err);
  1745. }
  1746. }
  1747. return (rbytes);
  1748. }
  1749. /*
  1750. * Returns ARCHIVE_OK if successful, ARCHIVE_FATAL otherwise, sets
  1751. * cab->end_of_entry if it consumes all of the data.
  1752. */
  1753. static int
  1754. cab_read_data(struct archive_read *a, const void **buff,
  1755. size_t *size, int64_t *offset)
  1756. {
  1757. struct cab *cab = (struct cab *)(a->format->data);
  1758. ssize_t bytes_avail;
  1759. if (cab->entry_bytes_remaining == 0) {
  1760. *buff = NULL;
  1761. *size = 0;
  1762. *offset = cab->entry_offset;
  1763. cab->end_of_entry = 1;
  1764. return (ARCHIVE_OK);
  1765. }
  1766. *buff = cab_read_ahead_cfdata(a, &bytes_avail);
  1767. if (bytes_avail <= 0) {
  1768. *buff = NULL;
  1769. *size = 0;
  1770. *offset = 0;
  1771. if (bytes_avail == 0 &&
  1772. cab->entry_cfdata->uncompressed_size == 0) {
  1773. /* All of CFDATA in a folder has been handled. */
  1774. archive_set_error(&a->archive,
  1775. ARCHIVE_ERRNO_FILE_FORMAT, "Invalid CFDATA");
  1776. return (ARCHIVE_FATAL);
  1777. } else
  1778. return ((int)bytes_avail);
  1779. }
  1780. if (bytes_avail > cab->entry_bytes_remaining)
  1781. bytes_avail = (ssize_t)cab->entry_bytes_remaining;
  1782. *size = bytes_avail;
  1783. *offset = cab->entry_offset;
  1784. cab->entry_offset += bytes_avail;
  1785. cab->entry_bytes_remaining -= bytes_avail;
  1786. if (cab->entry_bytes_remaining == 0)
  1787. cab->end_of_entry = 1;
  1788. cab->entry_unconsumed = bytes_avail;
  1789. if (cab->entry_cffolder->comptype == COMPTYPE_NONE) {
  1790. /* Don't consume more than current entry used. */
  1791. if (cab->entry_cfdata->unconsumed > cab->entry_unconsumed)
  1792. cab->entry_cfdata->unconsumed = cab->entry_unconsumed;
  1793. }
  1794. return (ARCHIVE_OK);
  1795. }
  1796. static int
  1797. archive_read_format_cab_read_data_skip(struct archive_read *a)
  1798. {
  1799. struct cab *cab;
  1800. int64_t bytes_skipped;
  1801. int r;
  1802. cab = (struct cab *)(a->format->data);
  1803. if (cab->end_of_archive)
  1804. return (ARCHIVE_EOF);
  1805. if (!cab->read_data_invoked) {
  1806. cab->bytes_skipped += cab->entry_bytes_remaining;
  1807. cab->entry_bytes_remaining = 0;
  1808. /* This entry is finished and done. */
  1809. cab->end_of_entry_cleanup = cab->end_of_entry = 1;
  1810. return (ARCHIVE_OK);
  1811. }
  1812. if (cab->entry_unconsumed) {
  1813. /* Consume as much as the compressor actually used. */
  1814. r = (int)cab_consume_cfdata(a, cab->entry_unconsumed);
  1815. cab->entry_unconsumed = 0;
  1816. if (r < 0)
  1817. return (r);
  1818. } else if (cab->entry_cfdata == NULL) {
  1819. r = cab_next_cfdata(a);
  1820. if (r < 0)
  1821. return (r);
  1822. }
  1823. /* if we've already read to end of data, we're done. */
  1824. if (cab->end_of_entry_cleanup)
  1825. return (ARCHIVE_OK);
  1826. /*
  1827. * If the length is at the beginning, we can skip the
  1828. * compressed data much more quickly.
  1829. */
  1830. bytes_skipped = cab_consume_cfdata(a, cab->entry_bytes_remaining);
  1831. if (bytes_skipped < 0)
  1832. return (ARCHIVE_FATAL);
  1833. /* If the compression type is none(uncompressed), we've already
  1834. * consumed data as much as the current entry size. */
  1835. if (cab->entry_cffolder->comptype == COMPTYPE_NONE &&
  1836. cab->entry_cfdata != NULL)
  1837. cab->entry_cfdata->unconsumed = 0;
  1838. /* This entry is finished and done. */
  1839. cab->end_of_entry_cleanup = cab->end_of_entry = 1;
  1840. return (ARCHIVE_OK);
  1841. }
  1842. static int
  1843. archive_read_format_cab_cleanup(struct archive_read *a)
  1844. {
  1845. struct cab *cab = (struct cab *)(a->format->data);
  1846. struct cfheader *hd = &cab->cfheader;
  1847. int i;
  1848. if (hd->folder_array != NULL) {
  1849. for (i = 0; i < hd->folder_count; i++)
  1850. free(hd->folder_array[i].cfdata.memimage);
  1851. free(hd->folder_array);
  1852. }
  1853. if (hd->file_array != NULL) {
  1854. for (i = 0; i < cab->cfheader.file_count; i++)
  1855. archive_string_free(&(hd->file_array[i].pathname));
  1856. free(hd->file_array);
  1857. }
  1858. #ifdef HAVE_ZLIB_H
  1859. if (cab->stream_valid)
  1860. inflateEnd(&cab->stream);
  1861. #endif
  1862. lzx_decode_free(&cab->xstrm);
  1863. archive_wstring_free(&cab->ws);
  1864. free(cab->uncompressed_buffer);
  1865. free(cab);
  1866. (a->format->data) = NULL;
  1867. return (ARCHIVE_OK);
  1868. }
  1869. /* Convert an MSDOS-style date/time into Unix-style time. */
  1870. static time_t
  1871. cab_dos_time(const unsigned char *p)
  1872. {
  1873. int msTime, msDate;
  1874. struct tm ts;
  1875. msDate = archive_le16dec(p);
  1876. msTime = archive_le16dec(p+2);
  1877. memset(&ts, 0, sizeof(ts));
  1878. ts.tm_year = ((msDate >> 9) & 0x7f) + 80; /* Years since 1900. */
  1879. ts.tm_mon = ((msDate >> 5) & 0x0f) - 1; /* Month number. */
  1880. ts.tm_mday = msDate & 0x1f; /* Day of month. */
  1881. ts.tm_hour = (msTime >> 11) & 0x1f;
  1882. ts.tm_min = (msTime >> 5) & 0x3f;
  1883. ts.tm_sec = (msTime << 1) & 0x3e;
  1884. ts.tm_isdst = -1;
  1885. return (mktime(&ts));
  1886. }
  1887. /*****************************************************************
  1888. *
  1889. * LZX decompression code.
  1890. *
  1891. *****************************************************************/
  1892. /*
  1893. * Initialize LZX decoder.
  1894. *
  1895. * Returns ARCHIVE_OK if initialization was successful.
  1896. * Returns ARCHIVE_FAILED if w_bits has unsupported value.
  1897. * Returns ARCHIVE_FATAL if initialization failed; memory allocation
  1898. * error occurred.
  1899. */
  1900. static int
  1901. lzx_decode_init(struct lzx_stream *strm, int w_bits)
  1902. {
  1903. struct lzx_dec *ds;
  1904. int slot, w_size, w_slot;
  1905. int base, footer;
  1906. int base_inc[18];
  1907. if (strm->ds == NULL) {
  1908. strm->ds = calloc(1, sizeof(*strm->ds));
  1909. if (strm->ds == NULL)
  1910. return (ARCHIVE_FATAL);
  1911. }
  1912. ds = strm->ds;
  1913. ds->error = ARCHIVE_FAILED;
  1914. /* Allow bits from 15(32KBi) up to 21(2MBi) */
  1915. if (w_bits < SLOT_BASE || w_bits > SLOT_MAX)
  1916. return (ARCHIVE_FAILED);
  1917. ds->error = ARCHIVE_FATAL;
  1918. /*
  1919. * Alloc window
  1920. */
  1921. w_size = ds->w_size;
  1922. w_slot = slots[w_bits - SLOT_BASE];
  1923. ds->w_size = 1U << w_bits;
  1924. ds->w_mask = ds->w_size -1;
  1925. if (ds->w_buff == NULL || w_size != ds->w_size) {
  1926. free(ds->w_buff);
  1927. ds->w_buff = malloc(ds->w_size);
  1928. if (ds->w_buff == NULL)
  1929. return (ARCHIVE_FATAL);
  1930. free(ds->pos_tbl);
  1931. ds->pos_tbl = malloc(sizeof(ds->pos_tbl[0]) * w_slot);
  1932. if (ds->pos_tbl == NULL)
  1933. return (ARCHIVE_FATAL);
  1934. }
  1935. for (footer = 0; footer < 18; footer++)
  1936. base_inc[footer] = 1 << footer;
  1937. base = footer = 0;
  1938. for (slot = 0; slot < w_slot; slot++) {
  1939. int n;
  1940. if (footer == 0)
  1941. base = slot;
  1942. else
  1943. base += base_inc[footer];
  1944. if (footer < 17) {
  1945. footer = -2;
  1946. for (n = base; n; n >>= 1)
  1947. footer++;
  1948. if (footer <= 0)
  1949. footer = 0;
  1950. }
  1951. ds->pos_tbl[slot].base = base;
  1952. ds->pos_tbl[slot].footer_bits = footer;
  1953. }
  1954. ds->w_pos = 0;
  1955. ds->state = 0;
  1956. ds->br.cache_buffer = 0;
  1957. ds->br.cache_avail = 0;
  1958. ds->r0 = ds->r1 = ds->r2 = 1;
  1959. /* Initialize aligned offset tree. */
  1960. if (lzx_huffman_init(&(ds->at), 8, 8) != ARCHIVE_OK)
  1961. return (ARCHIVE_FATAL);
  1962. /* Initialize pre-tree. */
  1963. if (lzx_huffman_init(&(ds->pt), 20, 10) != ARCHIVE_OK)
  1964. return (ARCHIVE_FATAL);
  1965. /* Initialize Main tree. */
  1966. if (lzx_huffman_init(&(ds->mt), 256+(w_slot<<3), 16)
  1967. != ARCHIVE_OK)
  1968. return (ARCHIVE_FATAL);
  1969. /* Initialize Length tree. */
  1970. if (lzx_huffman_init(&(ds->lt), 249, 16) != ARCHIVE_OK)
  1971. return (ARCHIVE_FATAL);
  1972. ds->error = 0;
  1973. return (ARCHIVE_OK);
  1974. }
  1975. /*
  1976. * Release LZX decoder.
  1977. */
  1978. static void
  1979. lzx_decode_free(struct lzx_stream *strm)
  1980. {
  1981. if (strm->ds == NULL)
  1982. return;
  1983. free(strm->ds->w_buff);
  1984. free(strm->ds->pos_tbl);
  1985. lzx_huffman_free(&(strm->ds->at));
  1986. lzx_huffman_free(&(strm->ds->pt));
  1987. lzx_huffman_free(&(strm->ds->mt));
  1988. lzx_huffman_free(&(strm->ds->lt));
  1989. free(strm->ds);
  1990. strm->ds = NULL;
  1991. }
  1992. /*
  1993. * E8 Call Translation reversal.
  1994. */
  1995. static void
  1996. lzx_translation(struct lzx_stream *strm, void *p, size_t size, uint32_t offset)
  1997. {
  1998. struct lzx_dec *ds = strm->ds;
  1999. unsigned char *b, *end;
  2000. if (!ds->translation || size <= 10)
  2001. return;
  2002. b = p;
  2003. end = b + size - 10;
  2004. while (b < end && (b = memchr(b, 0xE8, end - b)) != NULL) {
  2005. size_t i = b - (unsigned char *)p;
  2006. int32_t cp, displacement, value;
  2007. cp = (int32_t)(offset + (uint32_t)i);
  2008. value = archive_le32dec(&b[1]);
  2009. if (value >= -cp && value < (int32_t)ds->translation_size) {
  2010. if (value >= 0)
  2011. displacement = value - cp;
  2012. else
  2013. displacement = value + ds->translation_size;
  2014. archive_le32enc(&b[1], (uint32_t)displacement);
  2015. }
  2016. b += 5;
  2017. }
  2018. }
  2019. /*
  2020. * Bit stream reader.
  2021. */
  2022. /* Check that the cache buffer has enough bits. */
  2023. #define lzx_br_has(br, n) ((br)->cache_avail >= n)
  2024. /* Get compressed data by bit. */
  2025. #define lzx_br_bits(br, n) \
  2026. (((uint32_t)((br)->cache_buffer >> \
  2027. ((br)->cache_avail - (n)))) & cache_masks[n])
  2028. #define lzx_br_bits_forced(br, n) \
  2029. (((uint32_t)((br)->cache_buffer << \
  2030. ((n) - (br)->cache_avail))) & cache_masks[n])
  2031. /* Read ahead to make sure the cache buffer has enough compressed data we
  2032. * will use.
  2033. * True : completed, there is enough data in the cache buffer.
  2034. * False : we met that strm->next_in is empty, we have to get following
  2035. * bytes. */
  2036. #define lzx_br_read_ahead_0(strm, br, n) \
  2037. (lzx_br_has((br), (n)) || lzx_br_fillup(strm, br))
  2038. /* True : the cache buffer has some bits as much as we need.
  2039. * False : there are no enough bits in the cache buffer to be used,
  2040. * we have to get following bytes if we could. */
  2041. #define lzx_br_read_ahead(strm, br, n) \
  2042. (lzx_br_read_ahead_0((strm), (br), (n)) || lzx_br_has((br), (n)))
  2043. /* Notify how many bits we consumed. */
  2044. #define lzx_br_consume(br, n) ((br)->cache_avail -= (n))
  2045. #define lzx_br_consume_unaligned_bits(br) ((br)->cache_avail &= ~0x0f)
  2046. #define lzx_br_is_unaligned(br) ((br)->cache_avail & 0x0f)
  2047. static const uint32_t cache_masks[] = {
  2048. 0x00000000, 0x00000001, 0x00000003, 0x00000007,
  2049. 0x0000000F, 0x0000001F, 0x0000003F, 0x0000007F,
  2050. 0x000000FF, 0x000001FF, 0x000003FF, 0x000007FF,
  2051. 0x00000FFF, 0x00001FFF, 0x00003FFF, 0x00007FFF,
  2052. 0x0000FFFF, 0x0001FFFF, 0x0003FFFF, 0x0007FFFF,
  2053. 0x000FFFFF, 0x001FFFFF, 0x003FFFFF, 0x007FFFFF,
  2054. 0x00FFFFFF, 0x01FFFFFF, 0x03FFFFFF, 0x07FFFFFF,
  2055. 0x0FFFFFFF, 0x1FFFFFFF, 0x3FFFFFFF, 0x7FFFFFFF,
  2056. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF
  2057. };
  2058. /*
  2059. * Shift away used bits in the cache data and fill it up with following bits.
  2060. * Call this when cache buffer does not have enough bits you need.
  2061. *
  2062. * Returns 1 if the cache buffer is full.
  2063. * Returns 0 if the cache buffer is not full; input buffer is empty.
  2064. */
  2065. static int
  2066. lzx_br_fillup(struct lzx_stream *strm, struct lzx_br *br)
  2067. {
  2068. /*
  2069. * x86 processor family can read misaligned data without an access error.
  2070. */
  2071. int n = CACHE_BITS - br->cache_avail;
  2072. for (;;) {
  2073. switch (n >> 4) {
  2074. case 4:
  2075. if (strm->avail_in >= 8) {
  2076. br->cache_buffer =
  2077. ((uint64_t)strm->next_in[1]) << 56 |
  2078. ((uint64_t)strm->next_in[0]) << 48 |
  2079. ((uint64_t)strm->next_in[3]) << 40 |
  2080. ((uint64_t)strm->next_in[2]) << 32 |
  2081. ((uint32_t)strm->next_in[5]) << 24 |
  2082. ((uint32_t)strm->next_in[4]) << 16 |
  2083. ((uint32_t)strm->next_in[7]) << 8 |
  2084. (uint32_t)strm->next_in[6];
  2085. strm->next_in += 8;
  2086. strm->avail_in -= 8;
  2087. br->cache_avail += 8 * 8;
  2088. return (1);
  2089. }
  2090. break;
  2091. case 3:
  2092. if (strm->avail_in >= 6) {
  2093. br->cache_buffer =
  2094. (br->cache_buffer << 48) |
  2095. ((uint64_t)strm->next_in[1]) << 40 |
  2096. ((uint64_t)strm->next_in[0]) << 32 |
  2097. ((uint64_t)strm->next_in[3]) << 24 |
  2098. ((uint64_t)strm->next_in[2]) << 16 |
  2099. ((uint64_t)strm->next_in[5]) << 8 |
  2100. (uint64_t)strm->next_in[4];
  2101. strm->next_in += 6;
  2102. strm->avail_in -= 6;
  2103. br->cache_avail += 6 * 8;
  2104. return (1);
  2105. }
  2106. break;
  2107. case 0:
  2108. /* We have enough compressed data in
  2109. * the cache buffer.*/
  2110. return (1);
  2111. default:
  2112. break;
  2113. }
  2114. if (strm->avail_in < 2) {
  2115. /* There is not enough compressed data to
  2116. * fill up the cache buffer. */
  2117. if (strm->avail_in == 1) {
  2118. br->odd = *strm->next_in++;
  2119. strm->avail_in--;
  2120. br->have_odd = 1;
  2121. }
  2122. return (0);
  2123. }
  2124. br->cache_buffer =
  2125. (br->cache_buffer << 16) |
  2126. archive_le16dec(strm->next_in);
  2127. strm->next_in += 2;
  2128. strm->avail_in -= 2;
  2129. br->cache_avail += 16;
  2130. n -= 16;
  2131. }
  2132. }
  2133. static void
  2134. lzx_br_fixup(struct lzx_stream *strm, struct lzx_br *br)
  2135. {
  2136. int n = CACHE_BITS - br->cache_avail;
  2137. if (br->have_odd && n >= 16 && strm->avail_in > 0) {
  2138. br->cache_buffer =
  2139. (br->cache_buffer << 16) |
  2140. ((uint16_t)(*strm->next_in)) << 8 | br->odd;
  2141. strm->next_in++;
  2142. strm->avail_in--;
  2143. br->cache_avail += 16;
  2144. br->have_odd = 0;
  2145. }
  2146. }
  2147. static void
  2148. lzx_cleanup_bitstream(struct lzx_stream *strm)
  2149. {
  2150. strm->ds->br.cache_avail = 0;
  2151. strm->ds->br.have_odd = 0;
  2152. }
  2153. /*
  2154. * Decode LZX.
  2155. *
  2156. * 1. Returns ARCHIVE_OK if output buffer or input buffer are empty.
  2157. * Please set available buffer and call this function again.
  2158. * 2. Returns ARCHIVE_EOF if decompression has been completed.
  2159. * 3. Returns ARCHIVE_FAILED if an error occurred; compressed data
  2160. * is broken or you do not set 'last' flag properly.
  2161. */
  2162. #define ST_RD_TRANSLATION 0
  2163. #define ST_RD_TRANSLATION_SIZE 1
  2164. #define ST_RD_BLOCK_TYPE 2
  2165. #define ST_RD_BLOCK_SIZE 3
  2166. #define ST_RD_ALIGNMENT 4
  2167. #define ST_RD_R0 5
  2168. #define ST_RD_R1 6
  2169. #define ST_RD_R2 7
  2170. #define ST_COPY_UNCOMP1 8
  2171. #define ST_COPY_UNCOMP2 9
  2172. #define ST_RD_ALIGNED_OFFSET 10
  2173. #define ST_RD_VERBATIM 11
  2174. #define ST_RD_PRE_MAIN_TREE_256 12
  2175. #define ST_MAIN_TREE_256 13
  2176. #define ST_RD_PRE_MAIN_TREE_REM 14
  2177. #define ST_MAIN_TREE_REM 15
  2178. #define ST_RD_PRE_LENGTH_TREE 16
  2179. #define ST_LENGTH_TREE 17
  2180. #define ST_MAIN 18
  2181. #define ST_LENGTH 19
  2182. #define ST_OFFSET 20
  2183. #define ST_REAL_POS 21
  2184. #define ST_COPY 22
  2185. static int
  2186. lzx_decode(struct lzx_stream *strm, int last)
  2187. {
  2188. struct lzx_dec *ds = strm->ds;
  2189. int64_t avail_in;
  2190. int r;
  2191. if (ds->error)
  2192. return (ds->error);
  2193. avail_in = strm->avail_in;
  2194. lzx_br_fixup(strm, &(ds->br));
  2195. do {
  2196. if (ds->state < ST_MAIN)
  2197. r = lzx_read_blocks(strm, last);
  2198. else {
  2199. int64_t bytes_written = strm->avail_out;
  2200. r = lzx_decode_blocks(strm, last);
  2201. bytes_written -= strm->avail_out;
  2202. strm->next_out += bytes_written;
  2203. strm->total_out += bytes_written;
  2204. }
  2205. } while (r == 100);
  2206. strm->total_in += avail_in - strm->avail_in;
  2207. return (r);
  2208. }
  2209. static int
  2210. lzx_read_blocks(struct lzx_stream *strm, int last)
  2211. {
  2212. struct lzx_dec *ds = strm->ds;
  2213. struct lzx_br *br = &(ds->br);
  2214. int i, r;
  2215. for (;;) {
  2216. switch (ds->state) {
  2217. case ST_RD_TRANSLATION:
  2218. if (!lzx_br_read_ahead(strm, br, 1)) {
  2219. ds->state = ST_RD_TRANSLATION;
  2220. if (last)
  2221. goto failed;
  2222. return (ARCHIVE_OK);
  2223. }
  2224. ds->translation = lzx_br_bits(br, 1);
  2225. lzx_br_consume(br, 1);
  2226. /* FALL THROUGH */
  2227. case ST_RD_TRANSLATION_SIZE:
  2228. if (ds->translation) {
  2229. if (!lzx_br_read_ahead(strm, br, 32)) {
  2230. ds->state = ST_RD_TRANSLATION_SIZE;
  2231. if (last)
  2232. goto failed;
  2233. return (ARCHIVE_OK);
  2234. }
  2235. ds->translation_size = lzx_br_bits(br, 16);
  2236. lzx_br_consume(br, 16);
  2237. ds->translation_size <<= 16;
  2238. ds->translation_size |= lzx_br_bits(br, 16);
  2239. lzx_br_consume(br, 16);
  2240. }
  2241. /* FALL THROUGH */
  2242. case ST_RD_BLOCK_TYPE:
  2243. if (!lzx_br_read_ahead(strm, br, 3)) {
  2244. ds->state = ST_RD_BLOCK_TYPE;
  2245. if (last)
  2246. goto failed;
  2247. return (ARCHIVE_OK);
  2248. }
  2249. ds->block_type = lzx_br_bits(br, 3);
  2250. lzx_br_consume(br, 3);
  2251. /* Check a block type. */
  2252. switch (ds->block_type) {
  2253. case VERBATIM_BLOCK:
  2254. case ALIGNED_OFFSET_BLOCK:
  2255. case UNCOMPRESSED_BLOCK:
  2256. break;
  2257. default:
  2258. goto failed;/* Invalid */
  2259. }
  2260. /* FALL THROUGH */
  2261. case ST_RD_BLOCK_SIZE:
  2262. if (!lzx_br_read_ahead(strm, br, 24)) {
  2263. ds->state = ST_RD_BLOCK_SIZE;
  2264. if (last)
  2265. goto failed;
  2266. return (ARCHIVE_OK);
  2267. }
  2268. ds->block_size = lzx_br_bits(br, 8);
  2269. lzx_br_consume(br, 8);
  2270. ds->block_size <<= 16;
  2271. ds->block_size |= lzx_br_bits(br, 16);
  2272. lzx_br_consume(br, 16);
  2273. if (ds->block_size == 0)
  2274. goto failed;
  2275. ds->block_bytes_avail = ds->block_size;
  2276. if (ds->block_type != UNCOMPRESSED_BLOCK) {
  2277. if (ds->block_type == VERBATIM_BLOCK)
  2278. ds->state = ST_RD_VERBATIM;
  2279. else
  2280. ds->state = ST_RD_ALIGNED_OFFSET;
  2281. break;
  2282. }
  2283. /* FALL THROUGH */
  2284. case ST_RD_ALIGNMENT:
  2285. /*
  2286. * Handle an Uncompressed Block.
  2287. */
  2288. /* Skip padding to align following field on
  2289. * 16-bit boundary. */
  2290. if (lzx_br_is_unaligned(br))
  2291. lzx_br_consume_unaligned_bits(br);
  2292. else {
  2293. if (lzx_br_read_ahead(strm, br, 16))
  2294. lzx_br_consume(br, 16);
  2295. else {
  2296. ds->state = ST_RD_ALIGNMENT;
  2297. if (last)
  2298. goto failed;
  2299. return (ARCHIVE_OK);
  2300. }
  2301. }
  2302. /* Preparation to read repeated offsets R0,R1 and R2. */
  2303. ds->rbytes_avail = 0;
  2304. ds->state = ST_RD_R0;
  2305. /* FALL THROUGH */
  2306. case ST_RD_R0:
  2307. case ST_RD_R1:
  2308. case ST_RD_R2:
  2309. do {
  2310. uint16_t u16;
  2311. /* Drain bits in the cache buffer of
  2312. * bit-stream. */
  2313. if (lzx_br_has(br, 32)) {
  2314. u16 = lzx_br_bits(br, 16);
  2315. lzx_br_consume(br, 16);
  2316. archive_le16enc(ds->rbytes, u16);
  2317. u16 = lzx_br_bits(br, 16);
  2318. lzx_br_consume(br, 16);
  2319. archive_le16enc(ds->rbytes+2, u16);
  2320. ds->rbytes_avail = 4;
  2321. } else if (lzx_br_has(br, 16)) {
  2322. u16 = lzx_br_bits(br, 16);
  2323. lzx_br_consume(br, 16);
  2324. archive_le16enc(ds->rbytes, u16);
  2325. ds->rbytes_avail = 2;
  2326. }
  2327. if (ds->rbytes_avail < 4 && ds->br.have_odd) {
  2328. ds->rbytes[ds->rbytes_avail++] =
  2329. ds->br.odd;
  2330. ds->br.have_odd = 0;
  2331. }
  2332. while (ds->rbytes_avail < 4) {
  2333. if (strm->avail_in <= 0) {
  2334. if (last)
  2335. goto failed;
  2336. return (ARCHIVE_OK);
  2337. }
  2338. ds->rbytes[ds->rbytes_avail++] =
  2339. *strm->next_in++;
  2340. strm->avail_in--;
  2341. }
  2342. ds->rbytes_avail = 0;
  2343. if (ds->state == ST_RD_R0) {
  2344. ds->r0 = archive_le32dec(ds->rbytes);
  2345. if (ds->r0 < 0)
  2346. goto failed;
  2347. ds->state = ST_RD_R1;
  2348. } else if (ds->state == ST_RD_R1) {
  2349. ds->r1 = archive_le32dec(ds->rbytes);
  2350. if (ds->r1 < 0)
  2351. goto failed;
  2352. ds->state = ST_RD_R2;
  2353. } else if (ds->state == ST_RD_R2) {
  2354. ds->r2 = archive_le32dec(ds->rbytes);
  2355. if (ds->r2 < 0)
  2356. goto failed;
  2357. /* We've gotten all repeated offsets. */
  2358. ds->state = ST_COPY_UNCOMP1;
  2359. }
  2360. } while (ds->state != ST_COPY_UNCOMP1);
  2361. /* FALL THROUGH */
  2362. case ST_COPY_UNCOMP1:
  2363. /*
  2364. * Copy bytes form next_in to next_out directly.
  2365. */
  2366. while (ds->block_bytes_avail) {
  2367. int l;
  2368. if (strm->avail_out <= 0)
  2369. /* Output buffer is empty. */
  2370. return (ARCHIVE_OK);
  2371. if (strm->avail_in <= 0) {
  2372. /* Input buffer is empty. */
  2373. if (last)
  2374. goto failed;
  2375. return (ARCHIVE_OK);
  2376. }
  2377. l = (int)ds->block_bytes_avail;
  2378. if (l > ds->w_size - ds->w_pos)
  2379. l = ds->w_size - ds->w_pos;
  2380. if (l > strm->avail_out)
  2381. l = (int)strm->avail_out;
  2382. if (l > strm->avail_in)
  2383. l = (int)strm->avail_in;
  2384. memcpy(strm->next_out, strm->next_in, l);
  2385. memcpy(&(ds->w_buff[ds->w_pos]),
  2386. strm->next_in, l);
  2387. strm->next_in += l;
  2388. strm->avail_in -= l;
  2389. strm->next_out += l;
  2390. strm->avail_out -= l;
  2391. strm->total_out += l;
  2392. ds->w_pos = (ds->w_pos + l) & ds->w_mask;
  2393. ds->block_bytes_avail -= l;
  2394. }
  2395. /* FALL THROUGH */
  2396. case ST_COPY_UNCOMP2:
  2397. /* Re-align; skip padding byte. */
  2398. if (ds->block_size & 1) {
  2399. if (strm->avail_in <= 0) {
  2400. /* Input buffer is empty. */
  2401. ds->state = ST_COPY_UNCOMP2;
  2402. if (last)
  2403. goto failed;
  2404. return (ARCHIVE_OK);
  2405. }
  2406. strm->next_in++;
  2407. strm->avail_in --;
  2408. }
  2409. /* This block ended. */
  2410. ds->state = ST_RD_BLOCK_TYPE;
  2411. return (ARCHIVE_EOF);
  2412. /********************/
  2413. case ST_RD_ALIGNED_OFFSET:
  2414. /*
  2415. * Read Aligned offset tree.
  2416. */
  2417. if (!lzx_br_read_ahead(strm, br, 3 * ds->at.len_size)) {
  2418. ds->state = ST_RD_ALIGNED_OFFSET;
  2419. if (last)
  2420. goto failed;
  2421. return (ARCHIVE_OK);
  2422. }
  2423. memset(ds->at.freq, 0, sizeof(ds->at.freq));
  2424. for (i = 0; i < ds->at.len_size; i++) {
  2425. ds->at.bitlen[i] = lzx_br_bits(br, 3);
  2426. ds->at.freq[ds->at.bitlen[i]]++;
  2427. lzx_br_consume(br, 3);
  2428. }
  2429. if (!lzx_make_huffman_table(&ds->at))
  2430. goto failed;
  2431. /* FALL THROUGH */
  2432. case ST_RD_VERBATIM:
  2433. ds->loop = 0;
  2434. /* FALL THROUGH */
  2435. case ST_RD_PRE_MAIN_TREE_256:
  2436. /*
  2437. * Read Pre-tree for first 256 elements of main tree.
  2438. */
  2439. if (!lzx_read_pre_tree(strm)) {
  2440. ds->state = ST_RD_PRE_MAIN_TREE_256;
  2441. if (last)
  2442. goto failed;
  2443. return (ARCHIVE_OK);
  2444. }
  2445. if (!lzx_make_huffman_table(&ds->pt))
  2446. goto failed;
  2447. ds->loop = 0;
  2448. /* FALL THROUGH */
  2449. case ST_MAIN_TREE_256:
  2450. /*
  2451. * Get path lengths of first 256 elements of main tree.
  2452. */
  2453. r = lzx_read_bitlen(strm, &ds->mt, 256);
  2454. if (r < 0)
  2455. goto failed;
  2456. else if (!r) {
  2457. ds->state = ST_MAIN_TREE_256;
  2458. if (last)
  2459. goto failed;
  2460. return (ARCHIVE_OK);
  2461. }
  2462. ds->loop = 0;
  2463. /* FALL THROUGH */
  2464. case ST_RD_PRE_MAIN_TREE_REM:
  2465. /*
  2466. * Read Pre-tree for remaining elements of main tree.
  2467. */
  2468. if (!lzx_read_pre_tree(strm)) {
  2469. ds->state = ST_RD_PRE_MAIN_TREE_REM;
  2470. if (last)
  2471. goto failed;
  2472. return (ARCHIVE_OK);
  2473. }
  2474. if (!lzx_make_huffman_table(&ds->pt))
  2475. goto failed;
  2476. ds->loop = 256;
  2477. /* FALL THROUGH */
  2478. case ST_MAIN_TREE_REM:
  2479. /*
  2480. * Get path lengths of remaining elements of main tree.
  2481. */
  2482. r = lzx_read_bitlen(strm, &ds->mt, -1);
  2483. if (r < 0)
  2484. goto failed;
  2485. else if (!r) {
  2486. ds->state = ST_MAIN_TREE_REM;
  2487. if (last)
  2488. goto failed;
  2489. return (ARCHIVE_OK);
  2490. }
  2491. if (!lzx_make_huffman_table(&ds->mt))
  2492. goto failed;
  2493. ds->loop = 0;
  2494. /* FALL THROUGH */
  2495. case ST_RD_PRE_LENGTH_TREE:
  2496. /*
  2497. * Read Pre-tree for remaining elements of main tree.
  2498. */
  2499. if (!lzx_read_pre_tree(strm)) {
  2500. ds->state = ST_RD_PRE_LENGTH_TREE;
  2501. if (last)
  2502. goto failed;
  2503. return (ARCHIVE_OK);
  2504. }
  2505. if (!lzx_make_huffman_table(&ds->pt))
  2506. goto failed;
  2507. ds->loop = 0;
  2508. /* FALL THROUGH */
  2509. case ST_LENGTH_TREE:
  2510. /*
  2511. * Get path lengths of remaining elements of main tree.
  2512. */
  2513. r = lzx_read_bitlen(strm, &ds->lt, -1);
  2514. if (r < 0)
  2515. goto failed;
  2516. else if (!r) {
  2517. ds->state = ST_LENGTH_TREE;
  2518. if (last)
  2519. goto failed;
  2520. return (ARCHIVE_OK);
  2521. }
  2522. if (!lzx_make_huffman_table(&ds->lt))
  2523. goto failed;
  2524. ds->state = ST_MAIN;
  2525. return (100);
  2526. }
  2527. }
  2528. failed:
  2529. return (ds->error = ARCHIVE_FAILED);
  2530. }
  2531. static int
  2532. lzx_decode_blocks(struct lzx_stream *strm, int last)
  2533. {
  2534. struct lzx_dec *ds = strm->ds;
  2535. struct lzx_br bre = ds->br;
  2536. struct huffman *at = &(ds->at), *lt = &(ds->lt), *mt = &(ds->mt);
  2537. const struct lzx_pos_tbl *pos_tbl = ds->pos_tbl;
  2538. unsigned char *noutp = strm->next_out;
  2539. unsigned char *endp = noutp + strm->avail_out;
  2540. unsigned char *w_buff = ds->w_buff;
  2541. unsigned char *at_bitlen = at->bitlen;
  2542. unsigned char *lt_bitlen = lt->bitlen;
  2543. unsigned char *mt_bitlen = mt->bitlen;
  2544. size_t block_bytes_avail = ds->block_bytes_avail;
  2545. int at_max_bits = at->max_bits;
  2546. int lt_max_bits = lt->max_bits;
  2547. int mt_max_bits = mt->max_bits;
  2548. int c, copy_len = ds->copy_len, copy_pos = ds->copy_pos;
  2549. int w_pos = ds->w_pos, w_mask = ds->w_mask, w_size = ds->w_size;
  2550. int length_header = ds->length_header;
  2551. int offset_bits = ds->offset_bits;
  2552. int position_slot = ds->position_slot;
  2553. int r0 = ds->r0, r1 = ds->r1, r2 = ds->r2;
  2554. int state = ds->state;
  2555. char block_type = ds->block_type;
  2556. for (;;) {
  2557. switch (state) {
  2558. case ST_MAIN:
  2559. for (;;) {
  2560. if (block_bytes_avail == 0) {
  2561. /* This block ended. */
  2562. ds->state = ST_RD_BLOCK_TYPE;
  2563. ds->br = bre;
  2564. ds->block_bytes_avail =
  2565. block_bytes_avail;
  2566. ds->copy_len = copy_len;
  2567. ds->copy_pos = copy_pos;
  2568. ds->length_header = length_header;
  2569. ds->position_slot = position_slot;
  2570. ds->r0 = r0; ds->r1 = r1; ds->r2 = r2;
  2571. ds->w_pos = w_pos;
  2572. strm->avail_out = endp - noutp;
  2573. return (ARCHIVE_EOF);
  2574. }
  2575. if (noutp >= endp)
  2576. /* Output buffer is empty. */
  2577. goto next_data;
  2578. if (!lzx_br_read_ahead(strm, &bre,
  2579. mt_max_bits)) {
  2580. if (!last)
  2581. goto next_data;
  2582. /* Remaining bits are less than
  2583. * maximum bits(mt.max_bits) but maybe
  2584. * it still remains as much as we need,
  2585. * so we should try to use it with
  2586. * dummy bits. */
  2587. c = lzx_decode_huffman(mt,
  2588. lzx_br_bits_forced(
  2589. &bre, mt_max_bits));
  2590. lzx_br_consume(&bre, mt_bitlen[c]);
  2591. if (!lzx_br_has(&bre, 0))
  2592. goto failed;/* Over read. */
  2593. } else {
  2594. c = lzx_decode_huffman(mt,
  2595. lzx_br_bits(&bre, mt_max_bits));
  2596. lzx_br_consume(&bre, mt_bitlen[c]);
  2597. }
  2598. if (c > UCHAR_MAX)
  2599. break;
  2600. /*
  2601. * 'c' is exactly literal code.
  2602. */
  2603. /* Save a decoded code to reference it
  2604. * afterward. */
  2605. w_buff[w_pos] = c;
  2606. w_pos = (w_pos + 1) & w_mask;
  2607. /* Store the decoded code to output buffer. */
  2608. *noutp++ = c;
  2609. block_bytes_avail--;
  2610. }
  2611. /*
  2612. * Get a match code, its length and offset.
  2613. */
  2614. c -= UCHAR_MAX + 1;
  2615. length_header = c & 7;
  2616. position_slot = c >> 3;
  2617. /* FALL THROUGH */
  2618. case ST_LENGTH:
  2619. /*
  2620. * Get a length.
  2621. */
  2622. if (length_header == 7) {
  2623. if (!lzx_br_read_ahead(strm, &bre,
  2624. lt_max_bits)) {
  2625. if (!last) {
  2626. state = ST_LENGTH;
  2627. goto next_data;
  2628. }
  2629. c = lzx_decode_huffman(lt,
  2630. lzx_br_bits_forced(
  2631. &bre, lt_max_bits));
  2632. lzx_br_consume(&bre, lt_bitlen[c]);
  2633. if (!lzx_br_has(&bre, 0))
  2634. goto failed;/* Over read. */
  2635. } else {
  2636. c = lzx_decode_huffman(lt,
  2637. lzx_br_bits(&bre, lt_max_bits));
  2638. lzx_br_consume(&bre, lt_bitlen[c]);
  2639. }
  2640. copy_len = c + 7 + 2;
  2641. } else
  2642. copy_len = length_header + 2;
  2643. if ((size_t)copy_len > block_bytes_avail)
  2644. goto failed;
  2645. /*
  2646. * Get an offset.
  2647. */
  2648. switch (position_slot) {
  2649. case 0: /* Use repeated offset 0. */
  2650. copy_pos = r0;
  2651. state = ST_REAL_POS;
  2652. continue;
  2653. case 1: /* Use repeated offset 1. */
  2654. copy_pos = r1;
  2655. /* Swap repeated offset. */
  2656. r1 = r0;
  2657. r0 = copy_pos;
  2658. state = ST_REAL_POS;
  2659. continue;
  2660. case 2: /* Use repeated offset 2. */
  2661. copy_pos = r2;
  2662. /* Swap repeated offset. */
  2663. r2 = r0;
  2664. r0 = copy_pos;
  2665. state = ST_REAL_POS;
  2666. continue;
  2667. default:
  2668. offset_bits =
  2669. pos_tbl[position_slot].footer_bits;
  2670. break;
  2671. }
  2672. /* FALL THROUGH */
  2673. case ST_OFFSET:
  2674. /*
  2675. * Get the offset, which is a distance from
  2676. * current window position.
  2677. */
  2678. if (block_type == ALIGNED_OFFSET_BLOCK &&
  2679. offset_bits >= 3) {
  2680. int offbits = offset_bits - 3;
  2681. if (!lzx_br_read_ahead(strm, &bre, offbits)) {
  2682. state = ST_OFFSET;
  2683. if (last)
  2684. goto failed;
  2685. goto next_data;
  2686. }
  2687. copy_pos = lzx_br_bits(&bre, offbits) << 3;
  2688. /* Get an aligned number. */
  2689. if (!lzx_br_read_ahead(strm, &bre,
  2690. offbits + at_max_bits)) {
  2691. if (!last) {
  2692. state = ST_OFFSET;
  2693. goto next_data;
  2694. }
  2695. lzx_br_consume(&bre, offbits);
  2696. c = lzx_decode_huffman(at,
  2697. lzx_br_bits_forced(&bre,
  2698. at_max_bits));
  2699. lzx_br_consume(&bre, at_bitlen[c]);
  2700. if (!lzx_br_has(&bre, 0))
  2701. goto failed;/* Over read. */
  2702. } else {
  2703. lzx_br_consume(&bre, offbits);
  2704. c = lzx_decode_huffman(at,
  2705. lzx_br_bits(&bre, at_max_bits));
  2706. lzx_br_consume(&bre, at_bitlen[c]);
  2707. }
  2708. /* Add an aligned number. */
  2709. copy_pos += c;
  2710. } else {
  2711. if (!lzx_br_read_ahead(strm, &bre,
  2712. offset_bits)) {
  2713. state = ST_OFFSET;
  2714. if (last)
  2715. goto failed;
  2716. goto next_data;
  2717. }
  2718. copy_pos = lzx_br_bits(&bre, offset_bits);
  2719. lzx_br_consume(&bre, offset_bits);
  2720. }
  2721. copy_pos += pos_tbl[position_slot].base -2;
  2722. /* Update repeated offset LRU queue. */
  2723. r2 = r1;
  2724. r1 = r0;
  2725. r0 = copy_pos;
  2726. /* FALL THROUGH */
  2727. case ST_REAL_POS:
  2728. /*
  2729. * Compute a real position in window.
  2730. */
  2731. copy_pos = (w_pos - copy_pos) & w_mask;
  2732. /* FALL THROUGH */
  2733. case ST_COPY:
  2734. /*
  2735. * Copy several bytes as extracted data from the window
  2736. * into the output buffer.
  2737. */
  2738. for (;;) {
  2739. const unsigned char *s;
  2740. int l;
  2741. l = copy_len;
  2742. if (copy_pos > w_pos) {
  2743. if (l > w_size - copy_pos)
  2744. l = w_size - copy_pos;
  2745. } else {
  2746. if (l > w_size - w_pos)
  2747. l = w_size - w_pos;
  2748. }
  2749. if (noutp + l >= endp)
  2750. l = (int)(endp - noutp);
  2751. s = w_buff + copy_pos;
  2752. if (l >= 8 && ((copy_pos + l < w_pos)
  2753. || (w_pos + l < copy_pos))) {
  2754. memcpy(w_buff + w_pos, s, l);
  2755. memcpy(noutp, s, l);
  2756. } else {
  2757. unsigned char *d;
  2758. int li;
  2759. d = w_buff + w_pos;
  2760. for (li = 0; li < l; li++)
  2761. noutp[li] = d[li] = s[li];
  2762. }
  2763. noutp += l;
  2764. copy_pos = (copy_pos + l) & w_mask;
  2765. w_pos = (w_pos + l) & w_mask;
  2766. block_bytes_avail -= l;
  2767. if (copy_len <= l)
  2768. /* A copy of current pattern ended. */
  2769. break;
  2770. copy_len -= l;
  2771. if (noutp >= endp) {
  2772. /* Output buffer is empty. */
  2773. state = ST_COPY;
  2774. goto next_data;
  2775. }
  2776. }
  2777. state = ST_MAIN;
  2778. break;
  2779. }
  2780. }
  2781. failed:
  2782. return (ds->error = ARCHIVE_FAILED);
  2783. next_data:
  2784. ds->br = bre;
  2785. ds->block_bytes_avail = block_bytes_avail;
  2786. ds->copy_len = copy_len;
  2787. ds->copy_pos = copy_pos;
  2788. ds->length_header = length_header;
  2789. ds->offset_bits = offset_bits;
  2790. ds->position_slot = position_slot;
  2791. ds->r0 = r0; ds->r1 = r1; ds->r2 = r2;
  2792. ds->state = state;
  2793. ds->w_pos = w_pos;
  2794. strm->avail_out = endp - noutp;
  2795. return (ARCHIVE_OK);
  2796. }
  2797. static int
  2798. lzx_read_pre_tree(struct lzx_stream *strm)
  2799. {
  2800. struct lzx_dec *ds = strm->ds;
  2801. struct lzx_br *br = &(ds->br);
  2802. int i;
  2803. if (ds->loop == 0)
  2804. memset(ds->pt.freq, 0, sizeof(ds->pt.freq));
  2805. for (i = ds->loop; i < ds->pt.len_size; i++) {
  2806. if (!lzx_br_read_ahead(strm, br, 4)) {
  2807. ds->loop = i;
  2808. return (0);
  2809. }
  2810. ds->pt.bitlen[i] = lzx_br_bits(br, 4);
  2811. ds->pt.freq[ds->pt.bitlen[i]]++;
  2812. lzx_br_consume(br, 4);
  2813. }
  2814. ds->loop = i;
  2815. return (1);
  2816. }
  2817. /*
  2818. * Read a bunch of bit-lengths from pre-tree.
  2819. */
  2820. static int
  2821. lzx_read_bitlen(struct lzx_stream *strm, struct huffman *d, int end)
  2822. {
  2823. struct lzx_dec *ds = strm->ds;
  2824. struct lzx_br *br = &(ds->br);
  2825. int c, i, j, ret, same;
  2826. unsigned rbits;
  2827. i = ds->loop;
  2828. if (i == 0)
  2829. memset(d->freq, 0, sizeof(d->freq));
  2830. ret = 0;
  2831. if (end < 0)
  2832. end = d->len_size;
  2833. while (i < end) {
  2834. ds->loop = i;
  2835. if (!lzx_br_read_ahead(strm, br, ds->pt.max_bits))
  2836. goto getdata;
  2837. rbits = lzx_br_bits(br, ds->pt.max_bits);
  2838. c = lzx_decode_huffman(&(ds->pt), rbits);
  2839. switch (c) {
  2840. case 17:/* several zero lengths, from 4 to 19. */
  2841. if (!lzx_br_read_ahead(strm, br, ds->pt.bitlen[c]+4))
  2842. goto getdata;
  2843. lzx_br_consume(br, ds->pt.bitlen[c]);
  2844. same = lzx_br_bits(br, 4) + 4;
  2845. if (i + same > end)
  2846. return (-1);/* Invalid */
  2847. lzx_br_consume(br, 4);
  2848. for (j = 0; j < same; j++)
  2849. d->bitlen[i++] = 0;
  2850. break;
  2851. case 18:/* many zero lengths, from 20 to 51. */
  2852. if (!lzx_br_read_ahead(strm, br, ds->pt.bitlen[c]+5))
  2853. goto getdata;
  2854. lzx_br_consume(br, ds->pt.bitlen[c]);
  2855. same = lzx_br_bits(br, 5) + 20;
  2856. if (i + same > end)
  2857. return (-1);/* Invalid */
  2858. lzx_br_consume(br, 5);
  2859. memset(d->bitlen + i, 0, same);
  2860. i += same;
  2861. break;
  2862. case 19:/* a few same lengths. */
  2863. if (!lzx_br_read_ahead(strm, br,
  2864. ds->pt.bitlen[c]+1+ds->pt.max_bits))
  2865. goto getdata;
  2866. lzx_br_consume(br, ds->pt.bitlen[c]);
  2867. same = lzx_br_bits(br, 1) + 4;
  2868. if (i + same > end)
  2869. return (-1);
  2870. lzx_br_consume(br, 1);
  2871. rbits = lzx_br_bits(br, ds->pt.max_bits);
  2872. c = lzx_decode_huffman(&(ds->pt), rbits);
  2873. lzx_br_consume(br, ds->pt.bitlen[c]);
  2874. c = (d->bitlen[i] - c + 17) % 17;
  2875. if (c < 0)
  2876. return (-1);/* Invalid */
  2877. for (j = 0; j < same; j++)
  2878. d->bitlen[i++] = c;
  2879. d->freq[c] += same;
  2880. break;
  2881. default:
  2882. lzx_br_consume(br, ds->pt.bitlen[c]);
  2883. c = (d->bitlen[i] - c + 17) % 17;
  2884. if (c < 0)
  2885. return (-1);/* Invalid */
  2886. d->freq[c]++;
  2887. d->bitlen[i++] = c;
  2888. break;
  2889. }
  2890. }
  2891. ret = 1;
  2892. getdata:
  2893. ds->loop = i;
  2894. return (ret);
  2895. }
  2896. static int
  2897. lzx_huffman_init(struct huffman *hf, size_t len_size, int tbl_bits)
  2898. {
  2899. if (hf->bitlen == NULL || hf->len_size != (int)len_size) {
  2900. free(hf->bitlen);
  2901. hf->bitlen = calloc(len_size, sizeof(hf->bitlen[0]));
  2902. if (hf->bitlen == NULL)
  2903. return (ARCHIVE_FATAL);
  2904. hf->len_size = (int)len_size;
  2905. } else
  2906. memset(hf->bitlen, 0, len_size * sizeof(hf->bitlen[0]));
  2907. if (hf->tbl == NULL) {
  2908. hf->tbl = malloc(((size_t)1 << tbl_bits) * sizeof(hf->tbl[0]));
  2909. if (hf->tbl == NULL)
  2910. return (ARCHIVE_FATAL);
  2911. hf->tbl_bits = tbl_bits;
  2912. }
  2913. return (ARCHIVE_OK);
  2914. }
  2915. static void
  2916. lzx_huffman_free(struct huffman *hf)
  2917. {
  2918. free(hf->bitlen);
  2919. free(hf->tbl);
  2920. }
  2921. /*
  2922. * Make a huffman coding table.
  2923. */
  2924. static int
  2925. lzx_make_huffman_table(struct huffman *hf)
  2926. {
  2927. uint16_t *tbl;
  2928. const unsigned char *bitlen;
  2929. int bitptn[17], weight[17];
  2930. int i, maxbits = 0, ptn, tbl_size, w;
  2931. int len_avail;
  2932. /*
  2933. * Initialize bit patterns.
  2934. */
  2935. ptn = 0;
  2936. for (i = 1, w = 1 << 15; i <= 16; i++, w >>= 1) {
  2937. bitptn[i] = ptn;
  2938. weight[i] = w;
  2939. if (hf->freq[i]) {
  2940. ptn += hf->freq[i] * w;
  2941. maxbits = i;
  2942. }
  2943. }
  2944. if ((ptn & 0xffff) != 0 || maxbits > hf->tbl_bits)
  2945. return (0);/* Invalid */
  2946. hf->max_bits = maxbits;
  2947. /*
  2948. * Cut out extra bits which we won't house in the table.
  2949. * This preparation reduces the same calculation in the for-loop
  2950. * making the table.
  2951. */
  2952. if (maxbits < 16) {
  2953. int ebits = 16 - maxbits;
  2954. for (i = 1; i <= maxbits; i++) {
  2955. bitptn[i] >>= ebits;
  2956. weight[i] >>= ebits;
  2957. }
  2958. }
  2959. /*
  2960. * Make the table.
  2961. */
  2962. tbl_size = 1 << hf->tbl_bits;
  2963. tbl = hf->tbl;
  2964. bitlen = hf->bitlen;
  2965. len_avail = hf->len_size;
  2966. hf->tree_used = 0;
  2967. for (i = 0; i < len_avail; i++) {
  2968. uint16_t *p;
  2969. int len, cnt;
  2970. if (bitlen[i] == 0)
  2971. continue;
  2972. /* Get a bit pattern */
  2973. len = bitlen[i];
  2974. if (len > tbl_size)
  2975. return (0);
  2976. ptn = bitptn[len];
  2977. cnt = weight[len];
  2978. /* Calculate next bit pattern */
  2979. if ((bitptn[len] = ptn + cnt) > tbl_size)
  2980. return (0);/* Invalid */
  2981. /* Update the table */
  2982. p = &(tbl[ptn]);
  2983. while (--cnt >= 0)
  2984. p[cnt] = (uint16_t)i;
  2985. }
  2986. return (1);
  2987. }
  2988. static inline int
  2989. lzx_decode_huffman(struct huffman *hf, unsigned rbits)
  2990. {
  2991. int c;
  2992. c = hf->tbl[rbits];
  2993. if (c < hf->len_size)
  2994. return (c);
  2995. return (0);
  2996. }