1 /* 7zMain.c - Test application for 7z Decoder
2 2018-08-04 : Igor Pavlov : Public domain */
3 
4 #include "Precomp.h"
5 
6 #include <stdio.h>
7 #include <string.h>
8 
9 #include "../../CpuArch.h"
10 
11 #include "../../7z.h"
12 #include "../../7zAlloc.h"
13 #include "../../7zBuf.h"
14 #include "../../7zCrc.h"
15 #include "../../7zFile.h"
16 #include "../../7zVersion.h"
17 
18 #ifndef USE_WINDOWS_FILE
19 /* for mkdir */
20 #ifdef _WIN32
21 #include <direct.h>
22 #else
23 #include <sys/stat.h>
24 #include <errno.h>
25 #endif
26 #endif
27 
28 
/* Size in bytes (1 << 18 = 256 KiB) of the look-ahead input buffer that main()
   allocates for the archive stream. */
#define kInputBufSize ((size_t)1 << 18)

/* Allocator built from SzAlloc/SzFree. It is used directly for CBuf management
   in this file and is copied into main()'s allocImp / allocTempImp. */
static const ISzAlloc g_Alloc = { SzAlloc, SzFree };
32 
33 
/* Writes the NUL-terminated string s to stdout as-is; no newline is appended
   and the result of the write is not checked. */
static void Print(const char *s)
{
  (void)fputs(s, stdout);
}
38 
39 
/*
  Makes sure dest can hold at least `size` bytes.

  A buffer that is already large enough is left untouched. Otherwise the old
  buffer is released first and a fresh one is created through g_Alloc, so the
  previous contents are not carried over.

  Returns 1 when the existing buffer suffices, otherwise the result of
  Buf_Create (callers in this file treat zero as allocation failure).
*/
static int Buf_EnsureSize(CBuf *dest, size_t size)
{
  if (size > dest->size)
  {
    Buf_Free(dest, &g_Alloc);
    return Buf_Create(dest, size, &g_Alloc);
  }
  return 1;
}
47 
/* On non-Windows builds, UTF-16 names are converted with the UTF-8 encoder
   defined in this file instead of going through WideCharToMultiByte. */
#ifndef _WIN32
#define _USE_UTF8
#endif

/* Manual override: enable the next line to select the UTF-8 path on every platform. */
/* #define _USE_UTF8 */
53 
54 #ifdef _USE_UTF8
55 
/* Lead-byte marker for a UTF-8 sequence with n continuation bytes:
   n = 1 -> 0xC0, n = 2 -> 0xE0, n = 3 -> 0xF0. */
#define _UTF8_START(n) (0x100 - (1 << (7 - (n))))

/* Smallest value that does NOT fit in a sequence with n continuation bytes
   (n = 1 -> 0x800). */
#define _UTF8_RANGE(n) (((UInt32)1) << ((n) * 5 + 6))

/* Lead byte of an (n + 1)-byte sequence encoding val.
   val is fully parenthesized so that expression arguments (e.g. `a | b`)
   are shifted as a whole rather than being split by operator precedence. */
#define _UTF8_HEAD(n, val) ((Byte)(_UTF8_START(n) + ((val) >> (6 * (n)))))

/* Continuation byte carrying bits [6n, 6n + 5] of val. */
#define _UTF8_CHAR(n, val) ((Byte)(0x80 + (((val) >> (6 * (n))) & 0x3F)))
62 
Utf16_To_Utf8_Calc(const UInt16 * src,const UInt16 * srcLim)63 static size_t Utf16_To_Utf8_Calc(const UInt16 *src, const UInt16 *srcLim)
64 {
65   size_t size = 0;
66   for (;;)
67   {
68     UInt32 val;
69     if (src == srcLim)
70       return size;
71 
72     size++;
73     val = *src++;
74 
75     if (val < 0x80)
76       continue;
77 
78     if (val < _UTF8_RANGE(1))
79     {
80       size++;
81       continue;
82     }
83 
84     if (val >= 0xD800 && val < 0xDC00 && src != srcLim)
85     {
86       UInt32 c2 = *src;
87       if (c2 >= 0xDC00 && c2 < 0xE000)
88       {
89         src++;
90         size += 3;
91         continue;
92       }
93     }
94 
95     size += 2;
96   }
97 }
98 
/*
  Encodes the UTF-16 range [src, srcLim) as UTF-8 into dest and returns the
  position just past the last byte written. No terminator is written.

  dest must have room for the byte count reported by Utf16_To_Utf8_Calc for
  the same range. A high surrogate followed by a low surrogate is combined
  into one 4-byte sequence; an unpaired surrogate is written as a 3-byte
  sequence like any other code unit >= _UTF8_RANGE(1).
*/
static Byte *Utf16_To_Utf8(Byte *dest, const UInt16 *src, const UInt16 *srcLim)
{
  while (src != srcLim)
  {
    UInt32 c = *src++;

    if (c < 0x80)
    {
      *dest++ = (Byte)c;
    }
    else if (c < _UTF8_RANGE(1))
    {
      *dest++ = _UTF8_HEAD(1, c);
      *dest++ = _UTF8_CHAR(0, c);
    }
    else
    {
      if (c >= 0xD800 && c < 0xDC00 && src != srcLim)
      {
        const UInt32 low = *src;
        if (low >= 0xDC00 && low < 0xE000)
        {
          src++;
          /* rebuild the supplementary-plane code point from the pair */
          c = (((c - 0xD800) << 10) | (low - 0xDC00)) + 0x10000;
          *dest++ = _UTF8_HEAD(3, c);
          *dest++ = _UTF8_CHAR(2, c);
          *dest++ = _UTF8_CHAR(1, c);
          *dest++ = _UTF8_CHAR(0, c);
          continue;
        }
      }

      *dest++ = _UTF8_HEAD(2, c);
      *dest++ = _UTF8_CHAR(1, c);
      *dest++ = _UTF8_CHAR(0, c);
    }
  }

  return dest;
}
145 
Utf16_To_Utf8Buf(CBuf * dest,const UInt16 * src,size_t srcLen)146 static SRes Utf16_To_Utf8Buf(CBuf *dest, const UInt16 *src, size_t srcLen)
147 {
148   size_t destLen = Utf16_To_Utf8_Calc(src, src + srcLen);
149   destLen += 1;
150   if (!Buf_EnsureSize(dest, destLen))
151     return SZ_ERROR_MEM;
152   *Utf16_To_Utf8(dest->data, src, src + srcLen) = 0;
153   return SZ_OK;
154 }
155 
156 #endif
157 
Utf16_To_Char(CBuf * buf,const UInt16 * s,UINT codePage)158 static SRes Utf16_To_Char(CBuf *buf, const UInt16 *s
159     #ifndef _USE_UTF8
160     , UINT codePage
161     #endif
162     )
163 {
164   unsigned len = 0;
165   for (len = 0; s[len] != 0; len++);
166 
167   #ifndef _USE_UTF8
168   {
169     unsigned size = len * 3 + 100;
170     if (!Buf_EnsureSize(buf, size))
171       return SZ_ERROR_MEM;
172     {
173       buf->data[0] = 0;
174       if (len != 0)
175       {
176         char defaultChar = '_';
177         BOOL defUsed;
178         unsigned numChars = 0;
179         numChars = WideCharToMultiByte(codePage, 0, s, len, (char *)buf->data, size, &defaultChar, &defUsed);
180         if (numChars == 0 || numChars >= size)
181           return SZ_ERROR_FAIL;
182         buf->data[numChars] = 0;
183       }
184       return SZ_OK;
185     }
186   }
187   #else
188   return Utf16_To_Utf8Buf(buf, s, len);
189   #endif
190 }
191 
/*
  MY_FILE_CODE_PAGE_PARAM is appended to Utf16_To_Char calls that convert
  file-system names. On _WIN32 it expands to ", g_FileCodePage" to fill the
  codePage parameter; elsewhere it expands to nothing, matching the
  _USE_UTF8 form of Utf16_To_Char that has no such parameter.

  g_FileCodePage only exists when the C runtime file API is used
  (USE_WINDOWS_FILE not defined). It starts as CP_ACP and is reassigned in
  main() from AreFileApisANSI().
*/
#ifdef _WIN32
  #ifndef USE_WINDOWS_FILE
    static UINT g_FileCodePage = CP_ACP;
  #endif
  #define MY_FILE_CODE_PAGE_PARAM ,g_FileCodePage
#else
  #define MY_FILE_CODE_PAGE_PARAM
#endif
200 
MyCreateDir(const UInt16 * name)201 static WRes MyCreateDir(const UInt16 *name)
202 {
203   #ifdef USE_WINDOWS_FILE
204 
205   return CreateDirectoryW(name, NULL) ? 0 : GetLastError();
206 
207   #else
208 
209   CBuf buf;
210   WRes res;
211   Buf_Init(&buf);
212   RINOK(Utf16_To_Char(&buf, name MY_FILE_CODE_PAGE_PARAM));
213 
214   res =
215   #ifdef _WIN32
216   _mkdir((const char *)buf.data)
217   #else
218   mkdir((const char *)buf.data, 0777)
219   #endif
220   == 0 ? 0 : errno;
221   Buf_Free(&buf, &g_Alloc);
222   return res;
223 
224   #endif
225 }
226 
OutFile_OpenUtf16(CSzFile * p,const UInt16 * name)227 static WRes OutFile_OpenUtf16(CSzFile *p, const UInt16 *name)
228 {
229   #ifdef USE_WINDOWS_FILE
230   return OutFile_OpenW(p, name);
231   #else
232   CBuf buf;
233   WRes res;
234   Buf_Init(&buf);
235   RINOK(Utf16_To_Char(&buf, name MY_FILE_CODE_PAGE_PARAM));
236   res = OutFile_Open(p, (const char *)buf.data);
237   Buf_Free(&buf, &g_Alloc);
238   return res;
239   #endif
240 }
241 
242 
PrintString(const UInt16 * s)243 static SRes PrintString(const UInt16 *s)
244 {
245   CBuf buf;
246   SRes res;
247   Buf_Init(&buf);
248   res = Utf16_To_Char(&buf, s
249       #ifndef _USE_UTF8
250       , CP_OEMCP
251       #endif
252       );
253   if (res == SZ_OK)
254     Print((const char *)buf.data);
255   Buf_Free(&buf, &g_Alloc);
256   return res;
257 }
258 
/*
  Writes value in decimal to s, right-aligned with leading spaces to a minimum
  width of numDigits, followed by a NUL terminator.

  Longer numbers are never truncated. s must have room for
  max(numDigits, number of digits) + 1 characters.
*/
static void UInt64ToStr(UInt64 value, char *s, int numDigits)
{
  char digits[32];
  int count = 0;
  int pad;

  /* collect digits least-significant first; always at least one digit */
  for (;;)
  {
    digits[count++] = (char)('0' + (unsigned)(value % 10));
    value /= 10;
    if (value == 0)
      break;
  }

  for (pad = numDigits - count; pad > 0; pad--)
    *s++ = ' ';

  while (count > 0)
    *s++ = digits[--count];
  *s = '\0';
}
278 
/*
  Writes value in decimal to s, left-padded with '0' to a minimum width of
  numDigits, followed by a NUL terminator.

  Longer numbers are never truncated. Returns a pointer to the terminator so
  the caller can keep appending.
*/
static char *UIntToStr(char *s, unsigned value, int numDigits)
{
  char digits[16];
  int count = 0;
  int pad;

  /* collect digits least-significant first; always at least one digit */
  for (;;)
  {
    digits[count++] = (char)('0' + (value % 10));
    value /= 10;
    if (value == 0)
      break;
  }

  for (pad = numDigits - count; pad > 0; pad--)
    *s++ = '0';

  while (count > 0)
    *s++ = digits[--count];

  *s = '\0';
  return s;
}
296 
/*
  Writes value as exactly two decimal digits into s[0] and s[1].
  No terminator is written. The result is only meaningful for value < 100.
*/
static void UIntToStr_2(char *s, unsigned value)
{
  const unsigned tens = value / 10;
  const unsigned ones = value % 10;

  s[0] = (char)('0' + tens);
  s[1] = (char)('0' + ones);
}
302 
303 #define PERIOD_4 (4 * 365 + 1)
304 #define PERIOD_100 (PERIOD_4 * 25 - 1)
305 #define PERIOD_400 (PERIOD_100 * 4 + 1)
306 
ConvertFileTimeToString(const CNtfsFileTime * nt,char * s)307 static void ConvertFileTimeToString(const CNtfsFileTime *nt, char *s)
308 {
309   unsigned year, mon, hour, min, sec;
310   Byte ms[] = { 31, 28, 31, 30, 31, 30, 31, 31, 30, 31, 30, 31 };
311   unsigned t;
312   UInt32 v;
313   UInt64 v64 = nt->Low | ((UInt64)nt->High << 32);
314   v64 /= 10000000;
315   sec = (unsigned)(v64 % 60); v64 /= 60;
316   min = (unsigned)(v64 % 60); v64 /= 60;
317   hour = (unsigned)(v64 % 24); v64 /= 24;
318 
319   v = (UInt32)v64;
320 
321   year = (unsigned)(1601 + v / PERIOD_400 * 400);
322   v %= PERIOD_400;
323 
324   t = v / PERIOD_100; if (t ==  4) t =  3; year += t * 100; v -= t * PERIOD_100;
325   t = v / PERIOD_4;   if (t == 25) t = 24; year += t * 4;   v -= t * PERIOD_4;
326   t = v / 365;        if (t ==  4) t =  3; year += t;       v -= t * 365;
327 
328   if (year % 4 == 0 && (year % 100 != 0 || year % 400 == 0))
329     ms[1] = 29;
330   for (mon = 0;; mon++)
331   {
332     unsigned d = ms[mon];
333     if (v < d)
334       break;
335     v -= d;
336   }
337   s = UIntToStr(s, year, 4); *s++ = '-';
338   UIntToStr_2(s, mon + 1); s[2] = '-'; s += 3;
339   UIntToStr_2(s, (unsigned)v + 1); s[2] = ' '; s += 3;
340   UIntToStr_2(s, hour); s[2] = ':'; s += 3;
341   UIntToStr_2(s, min); s[2] = ':'; s += 3;
342   UIntToStr_2(s, sec); s[2] = 0;
343 }
344 
/* Prints a single newline to stdout.
   Declared with (void) so the definition is a real prototype and calls with
   stray arguments are rejected by the compiler. */
static void PrintLF(void)
{
  Print("\n");
}
349 
/* Prints "\nERROR: " followed by the message s and a newline to stdout.
   s is only read, so it is const-qualified; every caller in this file passes
   a string literal or a local buffer. */
static void PrintError(const char *s)
{
  Print("\nERROR: ");
  Print(s);
  PrintLF();
}
356 
/*
  Builds the attribute column shown by the list command.

  With USE_WINDOWS_FILE, s receives five flag characters ("DRHSA", each
  replaced by '.' when the flag is clear) plus a NUL. Otherwise only the
  directory flag is reported: one character plus a NUL.

  The directory flag is set when isDir is nonzero or when the directory bit
  of wa is set (FILE_ATTRIBUTE_DIRECTORY, or bit 4 in the non-Windows branch).
*/
static void GetAttribString(UInt32 wa, BoolInt isDir, char *s)
{
  #ifdef USE_WINDOWS_FILE
  char *p = s;
  *p++ = (char)((isDir || (wa & FILE_ATTRIBUTE_DIRECTORY) != 0) ? 'D' : '.');
  *p++ = (char)(((wa & FILE_ATTRIBUTE_READONLY) != 0) ? 'R' : '.');
  *p++ = (char)(((wa & FILE_ATTRIBUTE_HIDDEN) != 0) ? 'H' : '.');
  *p++ = (char)(((wa & FILE_ATTRIBUTE_SYSTEM) != 0) ? 'S' : '.');
  *p++ = (char)(((wa & FILE_ATTRIBUTE_ARCHIVE) != 0) ? 'A' : '.');
  *p = 0;
  #else
  const int dirFlag = (isDir || (wa & (1 << 4)) != 0);
  s[0] = (char)(dirFlag ? 'D' : '.');
  s[1] = 0;
  #endif
}
371 
372 
373 // #define NUM_PARENTS_MAX 128
374 
main(int numargs,char * args[])375 int MY_CDECL main(int numargs, char *args[])
376 {
377   ISzAlloc allocImp;
378   ISzAlloc allocTempImp;
379 
380   CFileInStream archiveStream;
381   CLookToRead2 lookStream;
382   CSzArEx db;
383   SRes res;
384   UInt16 *temp = NULL;
385   size_t tempSize = 0;
386   // UInt32 parents[NUM_PARENTS_MAX];
387 
388   Print("\n7z Decoder " MY_VERSION_CPU " : " MY_COPYRIGHT_DATE "\n\n");
389 
390   if (numargs == 1)
391   {
392     Print(
393       "Usage: 7zDec <command> <archive_name>\n\n"
394       "<Commands>\n"
395       "  e: Extract files from archive (without using directory names)\n"
396       "  l: List contents of archive\n"
397       "  t: Test integrity of archive\n"
398       "  x: eXtract files with full paths\n");
399     return 0;
400   }
401 
402   if (numargs < 3)
403   {
404     PrintError("incorrect command");
405     return 1;
406   }
407 
408   #if defined(_WIN32) && !defined(USE_WINDOWS_FILE) && !defined(UNDER_CE)
409   g_FileCodePage = AreFileApisANSI() ? CP_ACP : CP_OEMCP;
410   #endif
411 
412 
413   allocImp = g_Alloc;
414   allocTempImp = g_Alloc;
415 
416   #ifdef UNDER_CE
417   if (InFile_OpenW(&archiveStream.file, L"\test.7z"))
418   #else
419   if (InFile_Open(&archiveStream.file, args[2]))
420   #endif
421   {
422     PrintError("can not open input file");
423     return 1;
424   }
425 
426   FileInStream_CreateVTable(&archiveStream);
427   LookToRead2_CreateVTable(&lookStream, False);
428   lookStream.buf = NULL;
429 
430   res = SZ_OK;
431 
432   {
433     lookStream.buf = ISzAlloc_Alloc(&allocImp, kInputBufSize);
434     if (!lookStream.buf)
435       res = SZ_ERROR_MEM;
436     else
437     {
438       lookStream.bufSize = kInputBufSize;
439       lookStream.realStream = &archiveStream.vt;
440       LookToRead2_Init(&lookStream);
441     }
442   }
443 
444   CrcGenerateTable();
445 
446   SzArEx_Init(&db);
447 
448   if (res == SZ_OK)
449   {
450     res = SzArEx_Open(&db, &lookStream.vt, &allocImp, &allocTempImp);
451   }
452 
453   if (res == SZ_OK)
454   {
455     char *command = args[1];
456     int listCommand = 0, testCommand = 0, fullPaths = 0;
457 
458     if (strcmp(command, "l") == 0) listCommand = 1;
459     else if (strcmp(command, "t") == 0) testCommand = 1;
460     else if (strcmp(command, "e") == 0) { }
461     else if (strcmp(command, "x") == 0) { fullPaths = 1; }
462     else
463     {
464       PrintError("incorrect command");
465       res = SZ_ERROR_FAIL;
466     }
467 
468     if (res == SZ_OK)
469     {
470       UInt32 i;
471 
472       /*
473       if you need cache, use these 3 variables.
474       if you use external function, you can make these variable as static.
475       */
476       UInt32 blockIndex = 0xFFFFFFFF; /* it can have any value before first call (if outBuffer = 0) */
477       Byte *outBuffer = 0; /* it must be 0 before first call for each new archive. */
478       size_t outBufferSize = 0;  /* it can have any value before first call (if outBuffer = 0) */
479 
480       for (i = 0; i < db.NumFiles; i++)
481       {
482         size_t offset = 0;
483         size_t outSizeProcessed = 0;
484         // const CSzFileItem *f = db.Files + i;
485         size_t len;
486         unsigned isDir = SzArEx_IsDir(&db, i);
487         if (listCommand == 0 && isDir && !fullPaths)
488           continue;
489         len = SzArEx_GetFileNameUtf16(&db, i, NULL);
490         // len = SzArEx_GetFullNameLen(&db, i);
491 
492         if (len > tempSize)
493         {
494           SzFree(NULL, temp);
495           tempSize = len;
496           temp = (UInt16 *)SzAlloc(NULL, tempSize * sizeof(temp[0]));
497           if (!temp)
498           {
499             res = SZ_ERROR_MEM;
500             break;
501           }
502         }
503 
504         SzArEx_GetFileNameUtf16(&db, i, temp);
505         /*
506         if (SzArEx_GetFullNameUtf16_Back(&db, i, temp + len) != temp)
507         {
508           res = SZ_ERROR_FAIL;
509           break;
510         }
511         */
512 
513         if (listCommand)
514         {
515           char attr[8], s[32], t[32];
516           UInt64 fileSize;
517 
518           GetAttribString(SzBitWithVals_Check(&db.Attribs, i) ? db.Attribs.Vals[i] : 0, isDir, attr);
519 
520           fileSize = SzArEx_GetFileSize(&db, i);
521           UInt64ToStr(fileSize, s, 10);
522 
523           if (SzBitWithVals_Check(&db.MTime, i))
524             ConvertFileTimeToString(&db.MTime.Vals[i], t);
525           else
526           {
527             size_t j;
528             for (j = 0; j < 19; j++)
529               t[j] = ' ';
530             t[j] = '\0';
531           }
532 
533           Print(t);
534           Print(" ");
535           Print(attr);
536           Print(" ");
537           Print(s);
538           Print("  ");
539           res = PrintString(temp);
540           if (res != SZ_OK)
541             break;
542           if (isDir)
543             Print("/");
544           PrintLF();
545           continue;
546         }
547 
548         Print(testCommand ?
549             "Testing    ":
550             "Extracting ");
551         res = PrintString(temp);
552         if (res != SZ_OK)
553           break;
554 
555         if (isDir)
556           Print("/");
557         else
558         {
559           res = SzArEx_Extract(&db, &lookStream.vt, i,
560               &blockIndex, &outBuffer, &outBufferSize,
561               &offset, &outSizeProcessed,
562               &allocImp, &allocTempImp);
563           if (res != SZ_OK)
564             break;
565         }
566 
567         if (!testCommand)
568         {
569           CSzFile outFile;
570           size_t processedSize;
571           size_t j;
572           UInt16 *name = (UInt16 *)temp;
573           const UInt16 *destPath = (const UInt16 *)name;
574 
575           for (j = 0; name[j] != 0; j++)
576             if (name[j] == '/')
577             {
578               if (fullPaths)
579               {
580                 name[j] = 0;
581                 MyCreateDir(name);
582                 name[j] = CHAR_PATH_SEPARATOR;
583               }
584               else
585                 destPath = name + j + 1;
586             }
587 
588           if (isDir)
589           {
590             MyCreateDir(destPath);
591             PrintLF();
592             continue;
593           }
594           else if (OutFile_OpenUtf16(&outFile, destPath))
595           {
596             PrintError("can not open output file");
597             res = SZ_ERROR_FAIL;
598             break;
599           }
600 
601           processedSize = outSizeProcessed;
602 
603           if (File_Write(&outFile, outBuffer + offset, &processedSize) != 0 || processedSize != outSizeProcessed)
604           {
605             PrintError("can not write output file");
606             res = SZ_ERROR_FAIL;
607             break;
608           }
609 
610           #ifdef USE_WINDOWS_FILE
611           {
612             FILETIME mtime, ctime;
613             FILETIME *mtimePtr = NULL;
614             FILETIME *ctimePtr = NULL;
615 
616             if (SzBitWithVals_Check(&db.MTime, i))
617             {
618               const CNtfsFileTime *t = &db.MTime.Vals[i];
619               mtime.dwLowDateTime = (DWORD)(t->Low);
620               mtime.dwHighDateTime = (DWORD)(t->High);
621               mtimePtr = &mtime;
622             }
623             if (SzBitWithVals_Check(&db.CTime, i))
624             {
625               const CNtfsFileTime *t = &db.CTime.Vals[i];
626               ctime.dwLowDateTime = (DWORD)(t->Low);
627               ctime.dwHighDateTime = (DWORD)(t->High);
628               ctimePtr = &ctime;
629             }
630             if (mtimePtr || ctimePtr)
631               SetFileTime(outFile.handle, ctimePtr, NULL, mtimePtr);
632           }
633           #endif
634 
635           if (File_Close(&outFile))
636           {
637             PrintError("can not close output file");
638             res = SZ_ERROR_FAIL;
639             break;
640           }
641 
642           #ifdef USE_WINDOWS_FILE
643           if (SzBitWithVals_Check(&db.Attribs, i))
644           {
645             UInt32 attrib = db.Attribs.Vals[i];
646             /* p7zip stores posix attributes in high 16 bits and adds 0x8000 as marker.
647                We remove posix bits, if we detect posix mode field */
648             if ((attrib & 0xF0000000) != 0)
649               attrib &= 0x7FFF;
650             SetFileAttributesW(destPath, attrib);
651           }
652           #endif
653         }
654         PrintLF();
655       }
656       ISzAlloc_Free(&allocImp, outBuffer);
657     }
658   }
659 
660   SzFree(NULL, temp);
661   SzArEx_Free(&db, &allocImp);
662   ISzAlloc_Free(&allocImp, lookStream.buf);
663 
664   File_Close(&archiveStream.file);
665 
666   if (res == SZ_OK)
667   {
668     Print("\nEverything is Ok\n");
669     return 0;
670   }
671 
672   if (res == SZ_ERROR_UNSUPPORTED)
673     PrintError("decoder doesn't support this archive");
674   else if (res == SZ_ERROR_MEM)
675     PrintError("can not allocate memory");
676   else if (res == SZ_ERROR_CRC)
677     PrintError("CRC error");
678   else
679   {
680     char s[32];
681     UInt64ToStr(res, s, 0);
682     PrintError(s);
683   }
684 
685   return 1;
686 }
687