2016-09-06 17:44:27 +00:00
|
|
|
/**
|
2016-09-11 20:20:15 +00:00
|
|
|
* Author......: See docs/credits.txt
|
2016-09-06 17:44:27 +00:00
|
|
|
* License.....: MIT
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "common.h"
|
2016-09-16 15:01:18 +00:00
|
|
|
#include "types.h"
|
2022-07-20 21:30:33 +00:00
|
|
|
#include "limits.h"
|
2016-09-06 17:44:27 +00:00
|
|
|
#include "memory.h"
|
2017-07-06 08:35:25 +00:00
|
|
|
#include "shared.h"
|
2016-09-06 17:44:27 +00:00
|
|
|
#include "filehandling.h"
|
|
|
|
|
2021-08-25 13:56:55 +00:00
|
|
|
#include <Alloc.h>
|
2021-08-27 08:09:37 +00:00
|
|
|
#include <7zCrc.h>
|
2021-08-25 13:56:55 +00:00
|
|
|
#include <7zFile.h>
|
2021-08-28 17:05:59 +00:00
|
|
|
#include <Xz.h>
|
2021-08-28 22:31:56 +00:00
|
|
|
#include <XzCrc64.h>
|
2021-08-25 13:56:55 +00:00
|
|
|
|
|
|
|
/* Maybe _LZMA_NO_SYSTEM_SIZE_T defined? */
|
|
|
|
#if defined (__clang__) || defined (__GNUC__)
|
|
|
|
#include <assert.h>
|
2021-08-30 13:28:54 +00:00
|
|
|
_Static_assert(sizeof (size_t) == sizeof (SizeT), "Check why sizeof(size_t) != sizeof(SizeT)");
|
2021-08-25 13:56:55 +00:00
|
|
|
#endif
|
|
|
|
|
2021-09-02 09:00:46 +00:00
|
|
|
/*
 * Size in bytes of the read buffers used for gzip and xz input.
 * Parenthesized so the macro expands safely inside larger expressions.
 */
#ifndef HCFILE_BUFFER_SIZE
#define HCFILE_BUFFER_SIZE (256 * 1024)
#endif

/*
 * Largest single fread()/fwrite() request issued on Windows builds; larger
 * transfers are split into chunks of this size.
 */
#ifndef HCFILE_CHUNK_SIZE
#define HCFILE_CHUNK_SIZE (4 * 1024 * 1024)
#endif
|
|
|
|
|
2021-08-25 13:56:55 +00:00
|
|
|
static bool xz_initialized = false;
|
|
|
|
|
|
|
|
static const ISzAlloc xz_alloc = { hc_lzma_alloc, hc_lzma_free };
|
|
|
|
|
|
|
|
struct xzfile
|
2021-10-08 15:38:54 +00:00
|
|
|
{
|
2021-08-25 13:56:55 +00:00
|
|
|
CAlignOffsetAlloc alloc;
|
2021-08-26 13:41:17 +00:00
|
|
|
UInt64 inBlocks;
|
2021-08-25 13:56:55 +00:00
|
|
|
Byte *inBuf;
|
|
|
|
bool inEof;
|
|
|
|
SizeT inLen;
|
|
|
|
SizeT inPos;
|
|
|
|
Int64 inProcessed;
|
2021-08-26 13:41:17 +00:00
|
|
|
CFileInStream inStream;
|
2021-08-25 13:56:55 +00:00
|
|
|
Int64 outProcessed;
|
2021-08-26 13:41:17 +00:00
|
|
|
UInt64 outSize;
|
2021-08-25 13:56:55 +00:00
|
|
|
CXzUnpacker state;
|
2021-08-26 13:41:17 +00:00
|
|
|
CXzs streams;
|
2021-08-25 13:56:55 +00:00
|
|
|
};
|
|
|
|
|
2019-07-12 22:20:41 +00:00
|
|
|
#if defined (__CYGWIN__)
/*
 * Workaround for zlib with cygwin build: provides _wopen() on top of open().
 *
 * path  : file to open
 * oflag : open(2) flags
 * ...   : creation mode, only read when O_CREAT is set in oflag
 *
 * Returns the descriptor from open(), or -1 on error.
 */
int _wopen (const char *path, int oflag, ...)
{
  int mode = 0;

  /* the optional argument is the mode; forward its value, not the va_list object */
  if (oflag & O_CREAT)
  {
    va_list ap;

    va_start (ap, oflag);

    mode = va_arg (ap, int);

    va_end (ap);
  }

  return open (path, oflag, mode);
}
#endif
|
2016-09-06 17:44:27 +00:00
|
|
|
|
2021-07-18 19:27:21 +00:00
|
|
|
bool hc_fopen (HCFILE *fp, const char *path, const char *mode)
|
2019-07-12 22:20:41 +00:00
|
|
|
{
|
2021-08-18 16:28:00 +00:00
|
|
|
if (fp == NULL || path == NULL || mode == NULL) return false;
|
|
|
|
|
|
|
|
/* cleanup */
|
|
|
|
fp->fd = -1;
|
|
|
|
fp->pfp = NULL;
|
|
|
|
fp->gfp = NULL;
|
|
|
|
fp->ufp = NULL;
|
2021-08-25 13:56:55 +00:00
|
|
|
fp->xfp = NULL;
|
2021-08-18 16:28:00 +00:00
|
|
|
fp->bom_size = 0;
|
|
|
|
fp->path = NULL;
|
|
|
|
fp->mode = NULL;
|
2016-09-06 17:44:27 +00:00
|
|
|
|
2019-07-12 22:20:41 +00:00
|
|
|
int oflag = -1;
|
2016-09-06 17:44:27 +00:00
|
|
|
|
2019-07-12 22:20:41 +00:00
|
|
|
int fmode = S_IRUSR|S_IWUSR;
|
|
|
|
|
2023-01-31 07:07:55 +00:00
|
|
|
if (strncmp (mode, "a", 1) == 0)
|
2016-09-06 17:44:27 +00:00
|
|
|
{
|
2019-07-12 22:20:41 +00:00
|
|
|
oflag = O_WRONLY | O_CREAT | O_APPEND;
|
2016-09-06 17:44:27 +00:00
|
|
|
|
2019-07-12 22:20:41 +00:00
|
|
|
#if defined(MSDOS) || defined(OS2) || defined(WIN32) || defined(_WIN32) || defined(__CYGWIN__)
|
|
|
|
if (strncmp (mode, "ab", 2) == 0) oflag |= O_BINARY;
|
|
|
|
#endif
|
|
|
|
}
|
2023-01-31 07:07:55 +00:00
|
|
|
else if (strncmp (mode, "r", 1) == 0)
|
2019-07-12 22:20:41 +00:00
|
|
|
{
|
|
|
|
oflag = O_RDONLY;
|
|
|
|
fmode = -1;
|
2016-09-06 17:44:27 +00:00
|
|
|
|
2019-07-12 22:20:41 +00:00
|
|
|
#if defined(MSDOS) || defined(OS2) || defined(WIN32) || defined(_WIN32) || defined(__CYGWIN__)
|
|
|
|
if (strncmp (mode, "rb", 2) == 0) oflag |= O_BINARY;
|
|
|
|
#endif
|
|
|
|
}
|
2023-01-31 07:07:55 +00:00
|
|
|
else if (strncmp (mode, "w", 1) == 0)
|
2019-07-12 22:20:41 +00:00
|
|
|
{
|
|
|
|
oflag = O_WRONLY | O_CREAT | O_TRUNC;
|
2016-09-06 17:44:27 +00:00
|
|
|
|
2019-07-12 22:20:41 +00:00
|
|
|
#if defined(MSDOS) || defined(OS2) || defined(WIN32) || defined(_WIN32) || defined(__CYGWIN__)
|
|
|
|
if (strncmp (mode, "wb", 2) == 0) oflag |= O_BINARY;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
// ADD more strncmp to handle more "mode"
|
|
|
|
return false;
|
|
|
|
}
|
2016-09-06 17:44:27 +00:00
|
|
|
|
2021-06-29 18:42:22 +00:00
|
|
|
unsigned char check[8] = { 0 };
|
2019-07-12 22:20:41 +00:00
|
|
|
|
2021-08-18 16:28:00 +00:00
|
|
|
bool is_gzip = false;
|
|
|
|
bool is_zip = false;
|
2021-08-25 13:56:55 +00:00
|
|
|
bool is_xz = false;
|
2023-01-31 07:02:26 +00:00
|
|
|
bool is_fifo = hc_path_is_fifo (path);
|
2021-08-18 16:28:00 +00:00
|
|
|
|
2023-01-31 07:02:26 +00:00
|
|
|
if (is_fifo == false)
|
2019-07-12 22:20:41 +00:00
|
|
|
{
|
2023-01-31 07:02:26 +00:00
|
|
|
int fd_tmp = open (path, O_RDONLY);
|
2019-07-12 22:20:41 +00:00
|
|
|
|
2023-01-31 07:02:26 +00:00
|
|
|
if (fd_tmp != -1)
|
2019-07-12 22:20:41 +00:00
|
|
|
{
|
2023-01-31 07:02:26 +00:00
|
|
|
lseek (fd_tmp, 0, SEEK_SET);
|
2021-06-29 18:42:22 +00:00
|
|
|
|
2023-01-31 07:02:26 +00:00
|
|
|
if (read (fd_tmp, check, sizeof (check)) > 0)
|
2021-06-29 18:42:22 +00:00
|
|
|
{
|
2023-01-31 07:02:26 +00:00
|
|
|
if (check[0] == 0x1f && check[1] == 0x8b && check[2] == 0x08) is_gzip = true;
|
|
|
|
if (check[0] == 0x50 && check[1] == 0x4b && check[2] == 0x03 && check[3] == 0x04) is_zip = true;
|
|
|
|
if (memcmp (check, XZ_SIG, XZ_SIG_SIZE) == 0) is_xz = true;
|
|
|
|
|
|
|
|
// compressed files with BOM will be undetected!
|
|
|
|
|
|
|
|
if (is_gzip == false && is_zip == false && is_xz == false)
|
|
|
|
{
|
|
|
|
fp->bom_size = hc_string_bom_size (check);
|
|
|
|
}
|
2021-06-29 18:42:22 +00:00
|
|
|
}
|
2019-07-12 22:20:41 +00:00
|
|
|
|
2023-01-31 07:02:26 +00:00
|
|
|
close (fd_tmp);
|
|
|
|
}
|
2019-07-12 22:20:41 +00:00
|
|
|
}
|
|
|
|
|
2021-08-21 11:29:10 +00:00
|
|
|
if (fmode == -1)
|
2019-07-12 22:20:41 +00:00
|
|
|
{
|
2021-08-21 11:29:10 +00:00
|
|
|
fp->fd = open (path, oflag);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
fp->fd = open (path, oflag, fmode);
|
|
|
|
}
|
2019-07-12 22:20:41 +00:00
|
|
|
|
2021-08-21 11:29:10 +00:00
|
|
|
if (fp->fd == -1) return false;
|
2019-07-12 22:20:41 +00:00
|
|
|
|
2021-08-25 13:56:55 +00:00
|
|
|
if (is_gzip)
|
|
|
|
{
|
|
|
|
if ((fp->gfp = gzdopen (fp->fd, mode)) == NULL) return false;
|
2021-09-02 09:08:36 +00:00
|
|
|
|
|
|
|
gzbuffer (fp->gfp, HCFILE_BUFFER_SIZE);
|
2021-08-25 13:56:55 +00:00
|
|
|
}
|
|
|
|
else if (is_zip)
|
|
|
|
{
|
|
|
|
if ((fp->ufp = unzOpen64 (path)) == NULL) return false;
|
|
|
|
|
|
|
|
if (unzOpenCurrentFile (fp->ufp) != UNZ_OK) return false;
|
|
|
|
}
|
|
|
|
else if (is_xz)
|
2021-08-21 11:29:10 +00:00
|
|
|
{
|
2021-08-28 22:31:56 +00:00
|
|
|
/* thread safe on little endian */
|
2021-08-25 13:56:55 +00:00
|
|
|
if (xz_initialized == false)
|
2021-08-18 16:28:00 +00:00
|
|
|
{
|
2021-08-25 13:56:55 +00:00
|
|
|
CrcGenerateTable ();
|
2021-08-28 22:31:56 +00:00
|
|
|
Crc64GenerateTable ();
|
2021-08-26 10:01:25 +00:00
|
|
|
Sha256Prepare ();
|
2021-08-25 13:56:55 +00:00
|
|
|
xz_initialized = true;
|
2021-08-18 16:28:00 +00:00
|
|
|
}
|
2021-08-25 13:56:55 +00:00
|
|
|
|
2021-08-30 13:28:54 +00:00
|
|
|
xzfile_t *xfp = (xzfile_t *) hccalloc (1, sizeof (*xfp));
|
2021-08-25 13:56:55 +00:00
|
|
|
if (xfp == NULL) return false;
|
|
|
|
|
|
|
|
/* prepare cache line aligned memory allocator */
|
|
|
|
AlignOffsetAlloc_CreateVTable (&xfp->alloc);
|
|
|
|
xfp->alloc.numAlignBits = 7;
|
|
|
|
xfp->alloc.baseAlloc = &xz_alloc;
|
|
|
|
ISzAllocPtr alloc = &xfp->alloc.vt;
|
2021-09-02 09:00:46 +00:00
|
|
|
xfp->inBuf = (Byte *) ISzAlloc_Alloc (alloc, HCFILE_BUFFER_SIZE);
|
2021-08-25 13:56:55 +00:00
|
|
|
if (xfp->inBuf == NULL)
|
2021-08-18 16:28:00 +00:00
|
|
|
{
|
2021-08-25 13:56:55 +00:00
|
|
|
hcfree (xfp);
|
|
|
|
close (fp->fd);
|
|
|
|
return false;
|
|
|
|
}
|
2019-07-29 16:42:50 +00:00
|
|
|
|
2021-08-26 13:41:17 +00:00
|
|
|
/* open the file */
|
|
|
|
CFileInStream *inStream = &xfp->inStream;
|
|
|
|
FileInStream_CreateVTable (inStream);
|
2021-08-25 13:56:55 +00:00
|
|
|
CSzFile *file = &inStream->file;
|
|
|
|
File_Construct (file);
|
|
|
|
WRes wres = InFile_Open (file, path);
|
|
|
|
if (wres != SZ_OK)
|
|
|
|
{
|
|
|
|
ISzAlloc_Free (alloc, xfp->inBuf);
|
|
|
|
hcfree (xfp);
|
|
|
|
close (fp->fd);
|
|
|
|
return false;
|
|
|
|
}
|
2021-08-18 16:28:00 +00:00
|
|
|
|
2021-08-26 13:41:17 +00:00
|
|
|
/* scan the file */
|
|
|
|
CLookToRead2 lookStream;
|
|
|
|
LookToRead2_CreateVTable (&lookStream, false);
|
|
|
|
lookStream.buf = xfp->inBuf;
|
2021-09-02 09:00:46 +00:00
|
|
|
lookStream.bufSize = HCFILE_BUFFER_SIZE;
|
2021-08-26 13:41:17 +00:00
|
|
|
lookStream.realStream = &inStream->vt;
|
|
|
|
LookToRead2_Init (&lookStream);
|
|
|
|
Xzs_Construct (&xfp->streams);
|
|
|
|
Int64 offset = 0;
|
|
|
|
SRes res = Xzs_ReadBackward (&xfp->streams, &lookStream.vt, &offset, NULL, alloc);
|
|
|
|
if (res != SZ_OK || offset != 0)
|
|
|
|
{
|
|
|
|
Xzs_Free (&xfp->streams, alloc);
|
|
|
|
File_Close (file);
|
|
|
|
ISzAlloc_Free (alloc, xfp->inBuf);
|
|
|
|
hcfree (xfp);
|
|
|
|
close (fp->fd);
|
|
|
|
return false;
|
|
|
|
}
|
2021-08-18 16:28:00 +00:00
|
|
|
|
2021-08-26 13:41:17 +00:00
|
|
|
xfp->inBlocks = Xzs_GetNumBlocks (&xfp->streams);
|
|
|
|
xfp->outSize = Xzs_GetUnpackSize (&xfp->streams);
|
2021-08-18 16:28:00 +00:00
|
|
|
|
2021-08-26 13:41:17 +00:00
|
|
|
/* seek to start of the file and fill the buffer */
|
2021-09-02 09:00:46 +00:00
|
|
|
SizeT inLen = HCFILE_BUFFER_SIZE;
|
2021-08-26 13:41:17 +00:00
|
|
|
res = ISeekInStream_Seek (&inStream->vt, &offset, SZ_SEEK_SET);
|
|
|
|
if (res == SZ_OK)
|
|
|
|
{
|
|
|
|
res = ISeekInStream_Read (&inStream->vt, xfp->inBuf, &inLen);
|
2021-08-18 16:28:00 +00:00
|
|
|
}
|
2021-08-25 13:56:55 +00:00
|
|
|
if (res != SZ_OK || inLen == 0)
|
|
|
|
{
|
2021-08-26 13:41:17 +00:00
|
|
|
Xzs_Free (&xfp->streams, alloc);
|
2021-08-25 13:56:55 +00:00
|
|
|
File_Close (file);
|
|
|
|
ISzAlloc_Free (alloc, xfp->inBuf);
|
|
|
|
hcfree (xfp);
|
|
|
|
close (fp->fd);
|
|
|
|
return false;
|
|
|
|
}
|
2021-08-18 16:28:00 +00:00
|
|
|
|
2021-08-25 13:56:55 +00:00
|
|
|
xfp->inLen = inLen;
|
|
|
|
|
|
|
|
/* read headers */
|
|
|
|
SizeT outLen = 0;
|
|
|
|
ECoderStatus status;
|
|
|
|
CXzUnpacker *state = &xfp->state;
|
|
|
|
XzUnpacker_Construct (state, alloc);
|
|
|
|
res = XzUnpacker_Code (state, NULL, &outLen, xfp->inBuf, &inLen, false, CODER_FINISH_ANY, &status);
|
|
|
|
if (res != SZ_OK)
|
|
|
|
{
|
|
|
|
XzUnpacker_Free (state);
|
2021-08-26 13:41:17 +00:00
|
|
|
Xzs_Free (&xfp->streams, alloc);
|
2021-08-25 13:56:55 +00:00
|
|
|
File_Close (file);
|
|
|
|
ISzAlloc_Free (alloc, xfp->inBuf);
|
|
|
|
hcfree (xfp);
|
|
|
|
close (fp->fd);
|
|
|
|
return false;
|
2021-08-18 16:28:00 +00:00
|
|
|
}
|
2021-08-25 13:56:55 +00:00
|
|
|
|
|
|
|
xfp->inPos = inLen;
|
|
|
|
xfp->inProcessed = inLen;
|
|
|
|
fp->xfp = xfp;
|
2019-07-29 16:42:50 +00:00
|
|
|
}
|
2019-07-12 22:20:41 +00:00
|
|
|
else
|
|
|
|
{
|
2021-08-25 13:56:55 +00:00
|
|
|
if ((fp->pfp = fdopen (fp->fd, mode)) == NULL) return false;
|
2021-06-29 18:42:22 +00:00
|
|
|
|
2021-08-25 13:56:55 +00:00
|
|
|
if (fp->bom_size)
|
|
|
|
{
|
|
|
|
// atm just skip bom
|
|
|
|
|
|
|
|
const int nread = fread (check, sizeof (char), fp->bom_size, fp->pfp);
|
|
|
|
|
|
|
|
if (nread != fp->bom_size) return false;
|
|
|
|
}
|
2019-07-12 22:20:41 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
fp->path = path;
|
|
|
|
fp->mode = mode;
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2021-07-18 19:27:21 +00:00
|
|
|
/*
 * Opens path as a plain stdio stream, without any compression detection or
 * BOM handling.
 *
 * fp   : handle to initialise; every field is reset first
 * path : file to open; the pointer itself is stored in fp->path, not a copy
 * mode : must start with 'a', 'r' or 'w'; stored in fp->mode the same way
 *
 * Returns true on success, false otherwise. On failure no descriptor is left
 * open and fp->fd is -1.
 */
bool hc_fopen_raw (HCFILE *fp, const char *path, const char *mode)
{
  if (fp == NULL || path == NULL || mode == NULL) return false;

  /* cleanup */
  fp->fd       = -1;
  fp->pfp      = NULL;
  fp->gfp      = NULL;
  fp->ufp      = NULL;
  fp->xfp      = NULL;
  fp->bom_size = 0;
  fp->path     = NULL;
  fp->mode     = NULL;

  int oflag = -1;

  int fmode = S_IRUSR|S_IWUSR;

  /* matching the first character already covers the "ab"/"rb"/"wb" variants */
  if (strncmp (mode, "a", 1) == 0)
  {
    oflag = O_WRONLY | O_CREAT | O_APPEND;

    #if defined(MSDOS) || defined(OS2) || defined(WIN32) || defined(_WIN32) || defined(__CYGWIN__)
    if (strncmp (mode, "ab", 2) == 0) oflag |= O_BINARY;
    #endif
  }
  else if (strncmp (mode, "r", 1) == 0)
  {
    oflag = O_RDONLY;
    fmode = -1; /* no creation mode is passed to open() for read-only access */

    #if defined(MSDOS) || defined(OS2) || defined(WIN32) || defined(_WIN32) || defined(__CYGWIN__)
    if (strncmp (mode, "rb", 2) == 0) oflag |= O_BINARY;
    #endif
  }
  else if (strncmp (mode, "w", 1) == 0)
  {
    oflag = O_WRONLY | O_CREAT | O_TRUNC;

    #if defined(MSDOS) || defined(OS2) || defined(WIN32) || defined(_WIN32) || defined(__CYGWIN__)
    if (strncmp (mode, "wb", 2) == 0) oflag |= O_BINARY;
    #endif
  }
  else
  {
    // ADD more strncmp to handle more "mode"
    return false;
  }

  if (fmode == -1)
  {
    fp->fd = open (path, oflag);
  }
  else
  {
    fp->fd = open (path, oflag, fmode);
  }

  if (fp->fd == -1) return false;

  fp->pfp = fdopen (fp->fd, mode);

  if (fp->pfp == NULL)
  {
    /* fdopen() failed, so the descriptor is still ours to close */
    close (fp->fd);

    fp->fd = -1;

    return false;
  }

  fp->path = path;
  fp->mode = mode;

  return true;
}
|
|
|
|
|
2019-07-12 22:20:41 +00:00
|
|
|
/*
 * fread() counterpart for HCFILE: reads up to nmemb items of size bytes into
 * ptr from whichever backend (stdio, gzip, zip, xz) is attached to fp.
 *
 * Returns the number of complete items read, which is smaller than nmemb on a
 * partial read, 0 when size or nmemb is 0, and (size_t) -1 on invalid
 * arguments, on a decoder/read error, or when fp has no backend attached.
 */
size_t hc_fread (void *ptr, size_t size, size_t nmemb, HCFILE *fp)
{
  const size_t failed = (size_t) -1;

  if (ptr == NULL || fp == NULL) return failed;

  if (size == 0 || nmemb == 0) return 0;

  size_t items = failed;

  if (fp->pfp)
  {
    #ifdef _WIN
    const u64 total = (u64) size * nmemb;

    #ifndef _WIN64
    /* check 2 GB limit with 32 bit build */
    if (total >= INT32_MAX) return failed;
    #endif

    if (total <= HCFILE_CHUNK_SIZE)
    {
      items = fread (ptr, size, nmemb, fp->pfp);
    }
    else
    {
      unsigned char *dst = (unsigned char *) ptr;

      size_t remaining = (size_t) total;
      size_t done      = 0;

      /* assume success */
      items = nmemb;

      for (;;)
      {
        const size_t want = (remaining > HCFILE_CHUNK_SIZE) ? HCFILE_CHUNK_SIZE : remaining;
        const size_t got  = fread (dst + done, 1, want, fp->pfp);

        done      += got;
        remaining -= got;

        if (got != want)
        {
          /* partial read */
          items = done / size;

          break;
        }

        if (remaining == 0) break;
      }
    }
    #else
    items = fread (ptr, size, nmemb, fp->pfp);
    #endif
  }
  else if (fp->gfp)
  {
    items = gzfread (ptr, size, nmemb, fp->gfp);
  }
  else if (fp->ufp)
  {
    unsigned char *dst = (unsigned char *) ptr;

    u64 remaining = (u64) size * nmemb;
    u64 done      = 0;

    #if defined(_WIN) && !defined(_WIN64)
    /* check 2 GB limit with 32 bit build */
    if (remaining >= INT32_MAX) return failed;
    #endif

    /* assume success */
    items = nmemb;

    for (;;)
    {
      /* a single request is capped at INT_MAX bytes */
      const unsigned want = (remaining > INT_MAX) ? INT_MAX : (unsigned) remaining;

      const int got = unzReadCurrentFile (fp->ufp, dst + done, want);

      if (got < 0) return failed;

      done      += (u64) got;
      remaining -= (u64) got;

      if (want != (unsigned) got)
      {
        /* partial read */
        items = done / size;

        break;
      }

      if (remaining == 0) break;
    }
  }
  else if (fp->xfp)
  {
    xzfile_t *xfp = fp->xfp;

    Byte *dst = (Byte *) ptr;

    const SizeT wanted = (SizeT) size * nmemb;

    SizeT produced = 0;

    #if defined(_WIN) && !defined(_WIN64)
    /* check 2 GB limit with 32 bit build */
    if (wanted >= INT32_MAX) return failed;
    #endif

    /* assume success */
    items = nmemb;

    for (;;)
    {
      /* fill buffer if needed */
      if (xfp->inLen == xfp->inPos && !xfp->inEof)
      {
        xfp->inPos = 0;
        xfp->inLen = HCFILE_BUFFER_SIZE;

        const SRes rd = ISeekInStream_Read (&xfp->inStream.vt, xfp->inBuf, &xfp->inLen);

        if (rd != SZ_OK || xfp->inLen == 0) xfp->inEof = true;
      }

      /* decode; both counters are in/out: available on entry, consumed/produced on return */
      ECoderStatus status;

      SizeT srcLen = xfp->inLen - xfp->inPos;
      SizeT dstLen = wanted - produced;

      const SRes res = XzUnpacker_Code (&xfp->state, dst + produced, &dstLen, xfp->inBuf + xfp->inPos, &srcLen, srcLen == 0, CODER_FINISH_ANY, &status);

      xfp->inPos       += srcLen;
      xfp->inProcessed += srcLen;

      if (res != SZ_OK) return failed;

      if (srcLen == 0 && dstLen == 0)
      {
        /* partial read */
        items = produced / size;

        break;
      }

      produced          += dstLen;
      xfp->outProcessed += dstLen;

      if (produced >= wanted) break;
    }
  }

  return items;
}
|
|
|
|
|
2019-09-12 01:05:01 +00:00
|
|
|
/*
 * fwrite() counterpart for HCFILE: writes nmemb items of size bytes from ptr
 * to a stdio or gzip backed fp.
 *
 * Returns the item count reported by the backend, 0 when size or nmemb is 0,
 * and (size_t) -1 on invalid arguments, on a short chunked write, or when fp
 * has neither a stdio nor a gzip backend (zip and xz are not written).
 */
size_t hc_fwrite (const void *ptr, size_t size, size_t nmemb, HCFILE *fp)
{
  const size_t failed = (size_t) -1;

  if (ptr == NULL || fp == NULL) return failed;

  if (size == 0 || nmemb == 0) return 0;

  size_t items = failed;

  if (fp->pfp)
  {
    #ifdef _WIN
    const u64 total = (u64) size * nmemb;

    #ifndef _WIN64
    /* check 2 GB limit with 32 bit build */
    if (total >= INT32_MAX) return failed;
    #endif

    if (total <= HCFILE_CHUNK_SIZE)
    {
      items = fwrite (ptr, size, nmemb, fp->pfp);
    }
    else
    {
      const unsigned char *src = (const unsigned char *) ptr;

      size_t remaining = (size_t) total;
      size_t done      = 0;

      /* assume success */
      items = nmemb;

      for (;;)
      {
        const size_t want = (remaining > HCFILE_CHUNK_SIZE) ? HCFILE_CHUNK_SIZE : remaining;
        const size_t put  = fwrite (src + done, 1, want, fp->pfp);

        done      += put;
        remaining -= put;

        /* a short chunk is reported as a failure of the whole request */
        if (put != want) return failed;

        if (remaining == 0) break;
      }
    }
    #else
    items = fwrite (ptr, size, nmemb, fp->pfp);
    #endif
  }
  else if (fp->gfp)
  {
    items = gzfwrite (ptr, size, nmemb, fp->gfp);
  }

  return items;
}
|
|
|
|
|
|
|
|
/*
 * fseek() counterpart for HCFILE.
 *
 * Returns 0 on success and -1 on failure for both supported backends
 * (stdio and gzip). Seeking inside zip and xz files is not implemented
 * and always yields -1, as does a NULL fp.
 */
int hc_fseek (HCFILE *fp, off_t offset, int whence)
{
  int r = -1;

  if (fp == NULL) return r;

  if (fp->pfp)
  {
    r = fseeko (fp->pfp, offset, whence);
  }
  else if (fp->gfp)
  {
    /*
     * gzseek() returns the resulting offset rather than 0, and -1 on error.
     * Map that to fseek() semantics so large offsets are not truncated to int
     * and success is reported the same way as for plain files.
     */
    r = (gzseek (fp->gfp, offset, whence) == -1) ? -1 : 0;
  }
  else if (fp->ufp)
  {
    /* TODO: not implemented for zip (not used in wordlist engine) */
  }
  else if (fp->xfp)
  {
    /* TODO */
  }

  return r;
}
|
|
|
|
|
|
|
|
/*
 * rewind() counterpart for HCFILE: repositions fp at the start of its
 * (uncompressed) data. Does nothing when fp is NULL. Failures cannot be
 * reported because the function returns void.
 */
void hc_rewind (HCFILE *fp)
{
  if (fp == NULL) return;

  if (fp->pfp)
  {
    rewind (fp->pfp);
  }
  else if (fp->gfp)
  {
    gzrewind (fp->gfp);
  }
  else if (fp->ufp)
  {
    /*
     * Selecting the first entry does not reset the read position of the entry
     * that is currently open; reopening it does, so reads restart at offset 0.
     */
    if (unzGoToFirstFile (fp->ufp) == UNZ_OK)
    {
      unzOpenCurrentFile (fp->ufp);
    }
  }
  else if (fp->xfp)
  {
    xzfile_t *xfp = fp->xfp;

    /* cleanup */
    xfp->inEof        = false;
    xfp->inLen        = 0;
    xfp->inPos        = 0;
    xfp->inProcessed  = 0;
    xfp->outProcessed = 0;

    /* reset */
    Int64 offset = 0;

    CFileInStream *inStream = &xfp->inStream;

    SRes res = ISeekInStream_Seek (&inStream->vt, &offset, SZ_SEEK_SET);

    if (res != SZ_OK) return;

    CXzUnpacker *state = &xfp->state;

    XzUnpacker_Init (state);

    /* fill the buffer */
    SizeT inLen = HCFILE_BUFFER_SIZE;

    res = ISeekInStream_Read (&inStream->vt, xfp->inBuf, &inLen);

    if (res != SZ_OK || inLen == 0) return;

    xfp->inLen = inLen;

    /* read headers; inLen is updated to the number of bytes consumed */
    SizeT outLen = 0;

    ECoderStatus status;

    XzUnpacker_Code (state, NULL, &outLen, xfp->inBuf, &inLen, false, CODER_FINISH_ANY, &status);

    xfp->inPos       = inLen;
    xfp->inProcessed = inLen;
  }
}
|
|
|
|
|
2021-08-21 11:29:10 +00:00
|
|
|
/*
 * fstat() counterpart for HCFILE: fills buf from fp's descriptor.
 *
 * For xz files st_size is replaced by the uncompressed size when it is known.
 * Returns the fstat() result, or -1 when an argument is NULL or fp has no
 * open descriptor.
 */
int hc_fstat (HCFILE *fp, struct stat *buf)
{
  if (fp == NULL || buf == NULL || fp->fd == -1) return -1;

  const int rc = fstat (fp->fd, buf);

  if (rc != 0) return rc;

  /* TODO: For gzip and zip files hc_ftell() reports uncompressed bytes, but hc_fstat() reports compressed bytes */

  if (fp->gfp == NULL && fp->ufp == NULL && fp->xfp != NULL)
  {
    const xzfile_t *xfp = fp->xfp;

    /* check that the uncompressed size is known */
    const UInt64 unknown_size = (UInt64) ((Int64) -1);

    if (xfp->outSize != unknown_size)
    {
      buf->st_size = (off_t) xfp->outSize;
    }
  }

  return rc;
}
|
|
|
|
|
2019-07-12 22:20:41 +00:00
|
|
|
/*
 * ftell() counterpart for HCFILE.
 *
 * Returns the current position as reported by the attached backend; for xz
 * this is the number of uncompressed bytes delivered so far. Returns -1 when
 * fp is NULL and 0 when fp has no backend attached.
 */
off_t hc_ftell (HCFILE *fp)
{
  if (fp == NULL) return -1;

  if (fp->pfp != NULL) return ftello (fp->pfp);

  if (fp->gfp != NULL) return (off_t) gztell (fp->gfp);

  if (fp->ufp != NULL) return unztell (fp->ufp);

  if (fp->xfp != NULL)
  {
    /* uncompressed bytes */
    const xzfile_t *xfp = fp->xfp;

    return (off_t) xfp->outProcessed;
  }

  return 0;
}
|
|
|
|
|
|
|
|
/*
 * fputc() counterpart for HCFILE: writes c to a stdio or gzip backed fp.
 *
 * Returns the backend's result, or -1 when fp is NULL or has neither a stdio
 * nor a gzip backend.
 */
int hc_fputc (int c, HCFILE *fp)
{
  if (fp == NULL) return -1;

  if (fp->pfp != NULL) return fputc (c, fp->pfp);

  if (fp->gfp != NULL) return gzputc (fp->gfp, c);

  return -1;
}
|
|
|
|
|
|
|
|
/*
 * fgetc() counterpart for HCFILE: reads one byte from whichever backend is
 * attached to fp.
 *
 * Returns the byte as a non-negative int, or EOF at end of data, on error,
 * or when fp is NULL or has no backend attached.
 */
int hc_fgetc (HCFILE *fp)
{
  int r = EOF;

  if (fp == NULL) return r;

  if (fp->pfp)
  {
    r = fgetc (fp->pfp);
  }
  else if (fp->gfp)
  {
    r = gzgetc (fp->gfp);
  }
  else if (fp->ufp)
  {
    unsigned char c = 0;

    if (unzReadCurrentFile (fp->ufp, &c, 1) == 1) r = (int) c;
  }
  else if (fp->xfp)
  {
    xzfile_t *xfp = fp->xfp;

    /*
     * The decoder may consume input without emitting a byte, so keep going
     * until a byte is produced, an error occurs, or no progress is possible.
     */
    for (;;)
    {
      /* fill buffer if needed */
      if (xfp->inLen == xfp->inPos && !xfp->inEof)
      {
        xfp->inPos = 0;
        xfp->inLen = HCFILE_BUFFER_SIZE;

        const SRes rd = ISeekInStream_Read (&xfp->inStream.vt, xfp->inBuf, &xfp->inLen);

        if (rd != SZ_OK || xfp->inLen == 0) xfp->inEof = true;
      }

      /* decode single byte; both counters are in/out */
      Byte out = 0;

      ECoderStatus status;

      SizeT inLeft  = xfp->inLen - xfp->inPos;
      SizeT outLeft = 1;

      const SRes res = XzUnpacker_Code (&xfp->state, &out, &outLeft, xfp->inBuf + xfp->inPos, &inLeft, inLeft == 0, CODER_FINISH_ANY, &status);

      xfp->inPos       += inLeft;
      xfp->inProcessed += inLeft;

      if (res != SZ_OK) break;

      if (outLeft == 1)
      {
        xfp->outProcessed++;

        r = (int) out;

        break;
      }

      /* nothing consumed and nothing produced: end of data */
      if (inLeft == 0) break;
    }
  }

  return r;
}
|
|
|
|
|
|
|
|
/*
 * fgets() counterpart for HCFILE: reads at most len - 1 bytes into buf,
 * stopping after a newline, and NUL-terminates the result.
 *
 * Returns buf when at least one byte was stored, otherwise NULL. NULL is
 * also returned on invalid arguments, on a zip/xz read error, and when fp
 * has no backend attached. The stdio and gzip backends return whatever
 * fgets() / gzgets() return.
 */
char *hc_fgets (char *buf, int len, HCFILE *fp)
{
  char *r = NULL;

  if (fp == NULL || buf == NULL || len <= 0) return r;

  if (fp->pfp)
  {
    r = fgets (buf, len, fp->pfp);
  }
  else if (fp->gfp)
  {
    r = gzgets (fp->gfp, buf, len);
  }
  else if (fp->ufp)
  {
    /* minizip has no line reader: pull single bytes until newline, EOF or a full buffer */
    int  count  = 0;
    bool failed = false;

    while (count < len - 1)
    {
      char c = 0;

      const int rc = unzReadCurrentFile (fp->ufp, &c, 1);

      if (rc != 1)
      {
        if (rc < 0) failed = true;

        break;
      }

      buf[count++] = c;

      if (c == '\n') break;
    }

    /* always NUL terminate */
    buf[count] = 0;

    if (count > 0 && failed == false) r = buf;
  }
  else if (fp->xfp)
  {
    Byte *outBuf = (Byte *) buf;

    SizeT outLen = (SizeT) len - 1;

    xzfile_t *xfp = fp->xfp;

    while (outLen > 0)
    {
      /* fill buffer if needed */
      if (xfp->inLen == xfp->inPos && !xfp->inEof)
      {
        xfp->inPos = 0;
        xfp->inLen = HCFILE_BUFFER_SIZE;

        const SRes rd = ISeekInStream_Read (&xfp->inStream.vt, xfp->inBuf, &xfp->inLen);

        if (rd != SZ_OK || xfp->inLen == 0) xfp->inEof = true;
      }

      /* decode single byte; both counters are in/out */
      ECoderStatus status;

      SizeT inLeft  = xfp->inLen - xfp->inPos;
      SizeT outLeft = 1;

      const SRes res = XzUnpacker_Code (&xfp->state, outBuf, &outLeft, xfp->inBuf + xfp->inPos, &inLeft, inLeft == 0, CODER_FINISH_ANY, &status);

      xfp->inPos       += inLeft;
      xfp->inProcessed += inLeft;

      if (res != SZ_OK)
      {
        /* decoder error: report failure even if some bytes were stored */
        r = NULL;

        break;
      }

      if (outLeft == 0)
      {
        /* nothing consumed and nothing produced: end of data */
        if (inLeft == 0) break;

        /* input was consumed without output; decode again before touching outBuf */
        continue;
      }

      xfp->outProcessed++;

      /* at least one byte stored, so the call succeeds like fgets() */
      r = buf;

      outLen--;

      if (*outBuf++ == '\n') break;
    }

    /* always NUL terminate */
    *outBuf = 0;
  }

  return r;
}
|
|
|
|
|
|
|
|
/*
 * vfprintf() counterpart for HCFILE: formats into a stdio or gzip backed fp.
 *
 * Returns the backend's result, or -1 when fp is NULL or has neither a stdio
 * nor a gzip backend.
 */
int hc_vfprintf (HCFILE *fp, const char *format, va_list ap)
{
  if (fp == NULL) return -1;

  if (fp->pfp != NULL) return vfprintf (fp->pfp, format, ap);

  if (fp->gfp != NULL) return gzvprintf (fp->gfp, format, ap);

  return -1;
}
|
|
|
|
|
|
|
|
/*
 * fprintf() counterpart for HCFILE: formats into a stdio or gzip backed fp.
 *
 * Returns the backend's result, or -1 when fp is NULL or has neither a stdio
 * nor a gzip backend.
 */
int hc_fprintf (HCFILE *fp, const char *format, ...)
{
  if (fp == NULL) return -1;

  int written = -1;

  va_list args;

  va_start (args, format);

  if (fp->pfp != NULL)
  {
    written = vfprintf (fp->pfp, format, args);
  }
  else if (fp->gfp != NULL)
  {
    written = gzvprintf (fp->gfp, format, args);
  }

  va_end (args);

  return written;
}
|
|
|
|
|
|
|
|
/*
 * Restricted fscanf() counterpart for HCFILE: reads one line with hc_fgets()
 * and applies format to it with a single output argument.
 *
 * format must contain exactly one conversion that stores into ptr.
 *
 * Returns the sscanf() result (1 when the conversion succeeded, 0 or EOF
 * when the line did not match), or -1 when fp is NULL or no line could be
 * read.
 */
int hc_fscanf (HCFILE *fp, const char *format, void *ptr)
{
  if (fp == NULL) return -1;

  char buf[HCBUFSIZ_TINY];

  char *b = hc_fgets (buf, HCBUFSIZ_TINY - 1, fp);

  if (b == NULL)
  {
    return -1;
  }

  /* report the real conversion count instead of claiming success unconditionally */
  return sscanf (b, format, ptr);
}
|
|
|
|
|
|
|
|
/*
 * End-of-file test for an HCFILE.
 *
 * The first handle that is set, in the order pfp, gfp, ufp, xfp, decides which
 * backend is queried: feof (), gzeof (), unzeof (), or for xz the condition
 * "input marked as EOF and the whole input buffer consumed".
 *
 * Returns the backend's answer, or -1 when fp is NULL or no handle is set.
 */
int hc_feof (HCFILE *fp)
{
  if (fp == NULL) return -1;

  if (fp->pfp) return feof (fp->pfp);

  if (fp->gfp) return gzeof (fp->gfp);

  if (fp->ufp) return unzeof (fp->ufp);

  if (fp->xfp)
  {
    const xzfile_t *xz = fp->xfp;

    return (xz->inEof && xz->inPos == xz->inLen);
  }

  return -1;
}
|
|
|
|
|
|
|
|
/*
 * Flush pending output of an HCFILE.
 *
 * Calls fflush () when the stdio handle (pfp) is set, otherwise
 * gzflush (..., Z_SYNC_FLUSH) when the gzip handle (gfp) is set.
 * Does nothing when fp is NULL or neither handle is set.
 */
void hc_fflush (HCFILE *fp)
{
  if (fp == NULL) return;

  if (fp->pfp)
  {
    fflush (fp->pfp);

    return;
  }

  if (fp->gfp)
  {
    gzflush (fp->gfp, Z_SYNC_FLUSH);
  }
}
|
|
|
|
|
2021-08-21 11:29:10 +00:00
|
|
|
/*
 * Ask the operating system to commit the file behind fp->fd to storage.
 *
 * Only acts when the stdio handle (pfp) is set: FlushFileBuffers () on the
 * OS handle of fp->fd on Windows builds, fsync () on fp->fd everywhere else.
 * Does nothing when fp is NULL or pfp is not set.
 */
void hc_fsync (HCFILE *fp)
{
  if (fp == NULL) return;

  if (!fp->pfp) return;

  #if defined (_WIN)
  HANDLE os_handle = (HANDLE) _get_osfhandle (fp->fd);

  FlushFileBuffers (os_handle);
  #else
  fsync (fp->fd);
  #endif
}
|
|
|
|
|
2019-07-12 22:20:41 +00:00
|
|
|
/*
 * Close an HCFILE and reset all of its fields.
 *
 * Exactly one backend is torn down, chosen by the first handle that is set in
 * the order pfp, gfp, ufp, xfp. The zip and xz branches additionally close
 * fp->fd themselves. Afterwards every handle, the descriptor, path and mode
 * are cleared. Does nothing when fp is NULL.
 */
void hc_fclose (HCFILE *fp)
{
  if (fp == NULL) return;

  if (fp->pfp)
  {
    fclose (fp->pfp);
  }
  else if (fp->gfp)
  {
    gzclose (fp->gfp);
  }
  else if (fp->ufp)
  {
    /* close the entry inside the archive first, then the archive itself */

    unzCloseCurrentFile (fp->ufp);

    unzClose (fp->ufp);

    close (fp->fd);
  }
  else if (fp->xfp)
  {
    xzfile_t *xz = fp->xfp;

    /* the allocator lives inside *xz, so it must be used before xz is freed */

    ISzAllocPtr vt = &xz->alloc.vt;

    XzUnpacker_Free (&xz->state);

    Xzs_Free (&xz->streams, vt);

    File_Close (&xz->inStream.file);

    ISzAlloc_Free (vt, xz->inBuf);

    hcfree (xz);

    close (fp->fd);
  }

  /* leave the structure in a well-defined "closed" state */

  fp->pfp = NULL;
  fp->gfp = NULL;
  fp->ufp = NULL;
  fp->xfp = NULL;

  fp->fd = -1;

  fp->path = NULL;
  fp->mode = NULL;
}
|
|
|
|
|
2019-08-06 10:22:24 +00:00
|
|
|
/*
 * Read one line from fp into line_buf, without the line terminator.
 *
 * fp       : file to read from, one character at a time via hc_fgetc ()
 * line_buf : destination buffer
 * line_sz  : size of line_buf in bytes, including room for the trailing NUL
 *
 * Reading stops at '\n' or EOF. At most line_sz - 1 characters are stored;
 * any further characters of the line are consumed, counted and reported on
 * stderr. Trailing '\r' characters are stripped only when the line was not
 * truncated. The result is NUL terminated whenever line_sz > 0.
 *
 * Returns the number of characters stored in line_buf (excluding the NUL).
 *
 * Previously up to line_sz characters were stored and the terminator was then
 * written to line_buf[line_sz], one byte past a buffer of line_sz bytes.
 */
size_t fgetl (HCFILE *fp, char *line_buf, const size_t line_sz)
{
  /* one byte of line_buf is always reserved for the terminating NUL */

  const size_t line_max = (line_sz > 0) ? line_sz - 1 : 0;

  size_t line_len = 0;

  size_t line_truncated = 0;

  int c;

  while ((c = hc_fgetc (fp)) != EOF)
  {
    if (c == '\n') break;

    if (line_len == line_max)
    {
      /* buffer is full: keep consuming the line, but only count the bytes */

      line_truncated++;
    }
    else
    {
      line_buf[line_len] = (char) c;

      line_len++;
    }
  }

  if (line_truncated > 0)
  {
    fprintf (stderr, "\nOversized line detected! Truncated %" PRIu64 " bytes\n", (u64) line_truncated);
  }
  else
  {
    /* the stored data ends at the real end of line, so drop any CR before LF */

    while (line_len > 0 && line_buf[line_len - 1] == '\r')
    {
      line_len--;
    }
  }

  if (line_sz > 0)
  {
    line_buf[line_len] = 0;
  }

  return line_len;
}
|
|
|
|
|
2019-07-12 22:20:41 +00:00
|
|
|
/*
 * Count the lines in fp, reading from its current position to the end.
 *
 * A line is counted for every byte that follows a '\n' (or that is the very
 * first byte read), so a final line without a trailing newline is counted
 * and an empty input yields 0.
 *
 * Reading stops at end of file, and also as soon as hc_fread () delivers no
 * data. The old code retried in that case, which never terminated when a
 * read failed without hc_feof () becoming true.
 *
 * Returns the number of lines seen.
 */
u64 count_lines (HCFILE *fp)
{
  u64 cnt = 0;

  char *buf = (char *) hcmalloc (HCBUFSIZ_LARGE + 1);

  char prev = '\n';

  while (!hc_feof (fp))
  {
    const size_t nread = hc_fread (buf, sizeof (char), HCBUFSIZ_LARGE, fp);

    /* nothing read: either EOF or a read error, in both cases we are done */

    if (nread < 1) break;

    for (size_t i = 0; i < nread; i++)
    {
      if (prev == '\n') cnt++;

      prev = buf[i];
    }
  }

  hcfree (buf);

  return cnt;
}
|
|
|
|
|
2018-02-08 18:13:29 +00:00
|
|
|
/*
 * Strip every trailing '\n' and '\r' from the NUL terminated string buf.
 *
 * Each removed character is overwritten with 0 in place.
 *
 * Returns the length of the string after stripping.
 */
size_t in_superchop (char *buf)
{
  size_t remaining = strlen (buf);

  while (remaining > 0)
  {
    const char tail = buf[remaining - 1];

    if (tail != '\n' && tail != '\r') break;

    remaining--;

    buf[remaining] = 0;
  }

  return remaining;
}
|
2019-07-12 22:20:41 +00:00
|
|
|
|
|
|
|
/*
 * Strip every trailing '\n' and '\r' from the first len bytes of buf.
 *
 * Works like in_superchop () but takes the current length from the caller
 * instead of calling strlen (). Each removed character is overwritten with 0
 * in place; bytes at index len and beyond are not touched.
 *
 * Returns the length after stripping.
 */
size_t superchop_with_length (char *buf, const size_t len)
{
  size_t new_len;

  for (new_len = len; new_len > 0; new_len--)
  {
    const char tail = buf[new_len - 1];

    if (tail != '\n' && tail != '\r') break;

    buf[new_len - 1] = 0;
  }

  return new_len;
}
|