2021-08-13 17:21:30 +03:00
|
|
|
// SPDX-License-Identifier: GPL-2.0
|
|
|
|
/*
|
|
|
|
*
|
|
|
|
* Copyright (C) 2019-2021 Paragon Software GmbH, All rights reserved.
|
|
|
|
*
|
|
|
|
*/
|
2021-08-03 14:57:09 +03:00
|
|
|
|
2021-08-13 17:21:30 +03:00
|
|
|
#include <linux/blkdev.h>
|
|
|
|
#include <linux/buffer_head.h>
|
|
|
|
#include <linux/fs.h>
|
|
|
|
#include <linux/nls.h>
|
|
|
|
|
|
|
|
#include "debug.h"
|
|
|
|
#include "ntfs.h"
|
|
|
|
#include "ntfs_fs.h"
|
|
|
|
|
|
|
|
// clang-format off
/* compress_chunk() result: no non-zero literal byte was emitted for the chunk. */
#define LZNT_ERROR_ALL_ZEROS	1
/* Number of uncompressed bytes covered by a single LZNT chunk. */
#define LZNT_CHUNK_SIZE		0x1000
// clang-format on
|
|
|
|
|
|
|
|
struct lznt_hash {
|
|
|
|
const u8 *p1;
|
|
|
|
const u8 *p2;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct lznt {
|
|
|
|
const u8 *unc;
|
|
|
|
const u8 *unc_end;
|
|
|
|
const u8 *best_match;
|
|
|
|
size_t max_len;
|
|
|
|
bool std;
|
|
|
|
|
|
|
|
struct lznt_hash hash[LZNT_CHUNK_SIZE];
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * get_match_len - Count how many leading bytes of @ptr and @prev are equal.
 *
 * Comparison stops at the first mismatch, when @ptr would reach @end, or
 * once @max_len bytes have matched. The length limit is tested only after a
 * byte has been counted, so a @max_len of 0 can still yield 1.
 */
static inline size_t get_match_len(const u8 *ptr, const u8 *end, const u8 *prev,
				   size_t max_len)
{
	size_t n = 0;

	for (;;) {
		if (ptr + n >= end)
			break;
		if (ptr[n] != prev[n])
			break;
		n++;
		if (n >= max_len)
			break;
	}

	return n;
}
|
|
|
|
|
|
|
|
static size_t longest_match_std(const u8 *src, struct lznt *ctx)
|
|
|
|
{
|
|
|
|
size_t hash_index;
|
|
|
|
size_t len1 = 0, len2 = 0;
|
|
|
|
const u8 **hash;
|
|
|
|
|
|
|
|
hash_index =
|
|
|
|
((40543U * ((((src[0] << 4) ^ src[1]) << 4) ^ src[2])) >> 4) &
|
|
|
|
(LZNT_CHUNK_SIZE - 1);
|
|
|
|
|
|
|
|
hash = &(ctx->hash[hash_index].p1);
|
|
|
|
|
|
|
|
if (hash[0] >= ctx->unc && hash[0] < src && hash[0][0] == src[0] &&
|
|
|
|
hash[0][1] == src[1] && hash[0][2] == src[2]) {
|
|
|
|
len1 = 3;
|
|
|
|
if (ctx->max_len > 3)
|
|
|
|
len1 += get_match_len(src + 3, ctx->unc_end,
|
|
|
|
hash[0] + 3, ctx->max_len - 3);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (hash[1] >= ctx->unc && hash[1] < src && hash[1][0] == src[0] &&
|
|
|
|
hash[1][1] == src[1] && hash[1][2] == src[2]) {
|
|
|
|
len2 = 3;
|
|
|
|
if (ctx->max_len > 3)
|
|
|
|
len2 += get_match_len(src + 3, ctx->unc_end,
|
|
|
|
hash[1] + 3, ctx->max_len - 3);
|
|
|
|
}
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Compare two matches and select the best one. */
|
2021-08-13 17:21:30 +03:00
|
|
|
if (len1 < len2) {
|
|
|
|
ctx->best_match = hash[1];
|
|
|
|
len1 = len2;
|
|
|
|
} else {
|
|
|
|
ctx->best_match = hash[0];
|
|
|
|
}
|
|
|
|
|
|
|
|
hash[1] = hash[0];
|
|
|
|
hash[0] = src;
|
|
|
|
return len1;
|
|
|
|
}
|
|
|
|
|
|
|
|
static size_t longest_match_best(const u8 *src, struct lznt *ctx)
|
|
|
|
{
|
|
|
|
size_t max_len;
|
|
|
|
const u8 *ptr;
|
|
|
|
|
|
|
|
if (ctx->unc >= src || !ctx->max_len)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
max_len = 0;
|
|
|
|
for (ptr = ctx->unc; ptr < src; ++ptr) {
|
|
|
|
size_t len =
|
|
|
|
get_match_len(src, ctx->unc_end, ptr, ctx->max_len);
|
|
|
|
if (len >= max_len) {
|
|
|
|
max_len = len;
|
|
|
|
ctx->best_match = ptr;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return max_len >= 3 ? max_len : 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Longest match length encodable for each pair index: the length field has
 * (12 - index) bits and stores (length - 3).
 */
static const size_t s_max_len[] = {
	0x1002, /* index 0 */
	0x802,  /* index 1 */
	0x402,  /* index 2 */
	0x202,  /* index 3 */
	0x102,  /* index 4 */
	0x82,   /* index 5 */
	0x42,   /* index 6 */
	0x22,   /* index 7 */
	0x12,   /* index 8 */
};
|
|
|
|
|
|
|
|
/*
 * Largest distance from the chunk start that each pair index covers; once the
 * current position passes s_max_off[index], the next index is used.
 */
static const size_t s_max_off[] = {
	0x10,   /* index 0 */
	0x20,   /* index 1 */
	0x40,   /* index 2 */
	0x80,   /* index 3 */
	0x100,  /* index 4 */
	0x200,  /* index 5 */
	0x400,  /* index 6 */
	0x800,  /* index 7 */
	0x1000, /* index 8 */
};
|
|
|
|
|
|
|
|
/*
 * make_pair - Pack a match into a 16-bit (offset, length) pair.
 *
 * The low (12 - @index) bits hold (@len - 3); the bits above them hold
 * (@offset - 1).
 */
static inline u16 make_pair(size_t offset, size_t len, size_t index)
{
	const size_t len_bits = 12 - index;
	const size_t len_mask = ((size_t)1 << len_bits) - 1;
	const size_t packed_off = (offset - 1) << len_bits;
	const size_t packed_len = (len - 3) & len_mask;

	return packed_off | packed_len;
}
|
|
|
|
|
|
|
|
/*
 * parse_pair - Unpack a 16-bit pair produced by make_pair().
 *
 * Stores the back-reference distance in @offset.
 *
 * Return: match length.
 */
static inline size_t parse_pair(u16 pair, size_t *offset, size_t index)
{
	const size_t len_bits = 12 - index;
	const size_t len_field = pair & ((1 << len_bits) - 1);
	const size_t off_field = pair >> len_bits;

	*offset = off_field + 1;

	return len_field + 3;
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* compress_chunk
|
|
|
|
*
|
2021-08-03 14:57:09 +03:00
|
|
|
* Return:
|
|
|
|
* * 0 - Ok, @cmpr contains @cmpr_chunk_size bytes of compressed data.
|
|
|
|
* * 1 - Input buffer is full zero.
|
|
|
|
* * -2 - The compressed buffer is too small to hold the compressed data.
|
2021-08-13 17:21:30 +03:00
|
|
|
*/
|
|
|
|
static inline int compress_chunk(size_t (*match)(const u8 *, struct lznt *),
|
|
|
|
const u8 *unc, const u8 *unc_end, u8 *cmpr,
|
|
|
|
u8 *cmpr_end, size_t *cmpr_chunk_size,
|
|
|
|
struct lznt *ctx)
|
|
|
|
{
|
|
|
|
size_t cnt = 0;
|
|
|
|
size_t idx = 0;
|
|
|
|
const u8 *up = unc;
|
|
|
|
u8 *cp = cmpr + 3;
|
|
|
|
u8 *cp2 = cmpr + 2;
|
|
|
|
u8 not_zero = 0;
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Control byte of 8-bit values: ( 0 - means byte as is, 1 - short pair ). */
|
2021-08-13 17:21:30 +03:00
|
|
|
u8 ohdr = 0;
|
|
|
|
u8 *last;
|
|
|
|
u16 t16;
|
|
|
|
|
|
|
|
if (unc + LZNT_CHUNK_SIZE < unc_end)
|
|
|
|
unc_end = unc + LZNT_CHUNK_SIZE;
|
|
|
|
|
|
|
|
last = min(cmpr + LZNT_CHUNK_SIZE + sizeof(short), cmpr_end);
|
|
|
|
|
|
|
|
ctx->unc = unc;
|
|
|
|
ctx->unc_end = unc_end;
|
|
|
|
ctx->max_len = s_max_len[0];
|
|
|
|
|
|
|
|
while (up < unc_end) {
|
|
|
|
size_t max_len;
|
|
|
|
|
|
|
|
while (unc + s_max_off[idx] < up)
|
|
|
|
ctx->max_len = s_max_len[++idx];
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Find match. */
|
2021-08-13 17:21:30 +03:00
|
|
|
max_len = up + 3 <= unc_end ? (*match)(up, ctx) : 0;
|
|
|
|
|
|
|
|
if (!max_len) {
|
|
|
|
if (cp >= last)
|
|
|
|
goto NotCompressed;
|
|
|
|
not_zero |= *cp++ = *up++;
|
|
|
|
} else if (cp + 1 >= last) {
|
|
|
|
goto NotCompressed;
|
|
|
|
} else {
|
|
|
|
t16 = make_pair(up - ctx->best_match, max_len, idx);
|
|
|
|
*cp++ = t16;
|
|
|
|
*cp++ = t16 >> 8;
|
|
|
|
|
|
|
|
ohdr |= 1 << cnt;
|
|
|
|
up += max_len;
|
|
|
|
}
|
|
|
|
|
|
|
|
cnt = (cnt + 1) & 7;
|
|
|
|
if (!cnt) {
|
|
|
|
*cp2 = ohdr;
|
|
|
|
ohdr = 0;
|
|
|
|
cp2 = cp;
|
|
|
|
cp += 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (cp2 < last)
|
|
|
|
*cp2 = ohdr;
|
|
|
|
else
|
|
|
|
cp -= 1;
|
|
|
|
|
|
|
|
*cmpr_chunk_size = cp - cmpr;
|
|
|
|
|
|
|
|
t16 = (*cmpr_chunk_size - 3) | 0xB000;
|
|
|
|
cmpr[0] = t16;
|
|
|
|
cmpr[1] = t16 >> 8;
|
|
|
|
|
|
|
|
return not_zero ? 0 : LZNT_ERROR_ALL_ZEROS;
|
|
|
|
|
|
|
|
NotCompressed:
|
|
|
|
|
|
|
|
if ((cmpr + LZNT_CHUNK_SIZE + sizeof(short)) > last)
|
|
|
|
return -2;
|
|
|
|
|
|
|
|
/*
|
2021-08-03 14:57:09 +03:00
|
|
|
* Copy non cmpr data.
|
2021-08-13 17:21:30 +03:00
|
|
|
* 0x3FFF == ((LZNT_CHUNK_SIZE + 2 - 3) | 0x3000)
|
|
|
|
*/
|
|
|
|
cmpr[0] = 0xff;
|
|
|
|
cmpr[1] = 0x3f;
|
|
|
|
|
|
|
|
memcpy(cmpr + sizeof(short), unc, LZNT_CHUNK_SIZE);
|
|
|
|
*cmpr_chunk_size = LZNT_CHUNK_SIZE + sizeof(short);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * decompress_chunk - Decompress the payload of one compressed LZNT chunk.
 *
 * @unc, @unc_end:   Output buffer. @unc_end may lie more than one chunk
 *                   beyond @unc, so the chunk limit is enforced here.
 * @cmpr, @cmpr_end: Chunk payload (control bytes, literals and pairs),
 *                   without the 2-byte chunk header.
 *
 * Return: number of bytes written to @unc, or -EINVAL if the stream is
 * malformed.
 */
static inline ssize_t decompress_chunk(u8 *unc, u8 *unc_end, const u8 *cmpr,
				       const u8 *cmpr_end)
{
	u8 *up = unc;
	u8 ch;
	size_t bit = 0;
	size_t index = 0;
	u16 pair;
	size_t offset, length;

	/* Nothing to decode: do not read the first control byte. */
	if (cmpr >= cmpr_end)
		return 0;

	ch = *cmpr++;

	/* Do decompression until pointers are inside range. */
	while (up < unc_end && cmpr < cmpr_end) {
		/*
		 * A chunk never expands to more than LZNT_CHUNK_SIZE bytes.
		 * Rejecting longer output also keeps 'index' inside
		 * s_max_off[], whose last entry is LZNT_CHUNK_SIZE.
		 */
		if (up - unc > LZNT_CHUNK_SIZE)
			return -EINVAL;

		/* Correct index */
		while (unc + s_max_off[index] < up)
			index += 1;

		/* Check the current flag for zero. */
		if (!(ch & (1 << bit))) {
			/* Just copy byte. */
			*up++ = *cmpr++;
			goto next;
		}

		/* Check for boundary. */
		if (cmpr + 1 >= cmpr_end)
			return -EINVAL;

		/* Read a short from little endian stream. */
		pair = cmpr[1];
		pair <<= 8;
		pair |= cmpr[0];

		cmpr += 2;

		/* Translate packed information into offset and length. */
		length = parse_pair(pair, &offset, index);

		/* Check offset for boundary. */
		if (unc + offset > up)
			return -EINVAL;

		/* Truncate the length if necessary. */
		if (up + length >= unc_end)
			length = unc_end - up;

		/*
		 * Now we copy bytes. This is the heart of LZ algorithm.
		 * Source and destination may overlap, so copy byte by byte.
		 */
		for (; length > 0; length--, up++)
			*up = *(up - offset);

next:
		/* Advance flag bit value. */
		bit = (bit + 1) & 7;

		if (!bit) {
			if (cmpr >= cmpr_end)
				break;

			ch = *cmpr++;
		}
	}

	/* Return the size of uncompressed data. */
	return up - unc;
}
|
|
|
|
|
|
|
|
/*
|
2021-08-03 14:57:09 +03:00
|
|
|
* get_lznt_ctx
|
|
|
|
* @level: 0 - Standard compression.
|
|
|
|
* !0 - Best compression, requires a lot of cpu.
|
2021-08-13 17:21:30 +03:00
|
|
|
*/
|
|
|
|
struct lznt *get_lznt_ctx(int level)
|
|
|
|
{
|
2021-08-31 16:57:40 +03:00
|
|
|
struct lznt *r = kzalloc(level ? offsetof(struct lznt, hash)
|
|
|
|
: sizeof(struct lznt),
|
|
|
|
GFP_NOFS);
|
2021-08-13 17:21:30 +03:00
|
|
|
|
|
|
|
if (r)
|
|
|
|
r->std = !level;
|
|
|
|
return r;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2021-08-03 14:57:09 +03:00
|
|
|
* compress_lznt - Compresses @unc into @cmpr
|
2021-08-13 17:21:30 +03:00
|
|
|
*
|
2021-08-03 14:57:09 +03:00
|
|
|
* Return:
|
|
|
|
* * +x - Ok, @cmpr contains 'final_compressed_size' bytes of compressed data.
|
|
|
|
* * 0 - Input buffer is full zero.
|
2021-08-13 17:21:30 +03:00
|
|
|
*/
|
|
|
|
size_t compress_lznt(const void *unc, size_t unc_size, void *cmpr,
|
|
|
|
size_t cmpr_size, struct lznt *ctx)
|
|
|
|
{
|
|
|
|
int err;
|
|
|
|
size_t (*match)(const u8 *src, struct lznt *ctx);
|
|
|
|
u8 *p = cmpr;
|
|
|
|
u8 *end = p + cmpr_size;
|
|
|
|
const u8 *unc_chunk = unc;
|
|
|
|
const u8 *unc_end = unc_chunk + unc_size;
|
|
|
|
bool is_zero = true;
|
|
|
|
|
|
|
|
if (ctx->std) {
|
|
|
|
match = &longest_match_std;
|
|
|
|
memset(ctx->hash, 0, sizeof(ctx->hash));
|
|
|
|
} else {
|
|
|
|
match = &longest_match_best;
|
|
|
|
}
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Compression cycle. */
|
2021-08-13 17:21:30 +03:00
|
|
|
for (; unc_chunk < unc_end; unc_chunk += LZNT_CHUNK_SIZE) {
|
|
|
|
cmpr_size = 0;
|
|
|
|
err = compress_chunk(match, unc_chunk, unc_end, p, end,
|
|
|
|
&cmpr_size, ctx);
|
|
|
|
if (err < 0)
|
|
|
|
return unc_size;
|
|
|
|
|
|
|
|
if (is_zero && err != LZNT_ERROR_ALL_ZEROS)
|
|
|
|
is_zero = false;
|
|
|
|
|
|
|
|
p += cmpr_size;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (p <= end - 2)
|
|
|
|
p[0] = p[1] = 0;
|
|
|
|
|
|
|
|
return is_zero ? 0 : PtrOffset(cmpr, p);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2021-08-03 14:57:09 +03:00
|
|
|
* decompress_lznt - Decompress @cmpr into @unc.
|
2021-08-13 17:21:30 +03:00
|
|
|
*/
|
|
|
|
ssize_t decompress_lznt(const void *cmpr, size_t cmpr_size, void *unc,
|
|
|
|
size_t unc_size)
|
|
|
|
{
|
|
|
|
const u8 *cmpr_chunk = cmpr;
|
|
|
|
const u8 *cmpr_end = cmpr_chunk + cmpr_size;
|
|
|
|
u8 *unc_chunk = unc;
|
|
|
|
u8 *unc_end = unc_chunk + unc_size;
|
|
|
|
u16 chunk_hdr;
|
|
|
|
|
|
|
|
if (cmpr_size < sizeof(short))
|
|
|
|
return -EINVAL;
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Read chunk header. */
|
2021-08-13 17:21:30 +03:00
|
|
|
chunk_hdr = cmpr_chunk[1];
|
|
|
|
chunk_hdr <<= 8;
|
|
|
|
chunk_hdr |= cmpr_chunk[0];
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Loop through decompressing chunks. */
|
2021-08-13 17:21:30 +03:00
|
|
|
for (;;) {
|
|
|
|
size_t chunk_size_saved;
|
|
|
|
size_t unc_use;
|
|
|
|
size_t cmpr_use = 3 + (chunk_hdr & (LZNT_CHUNK_SIZE - 1));
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Check that the chunk actually fits the supplied buffer. */
|
2021-08-13 17:21:30 +03:00
|
|
|
if (cmpr_chunk + cmpr_use > cmpr_end)
|
|
|
|
return -EINVAL;
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* First make sure the chunk contains compressed data. */
|
2021-08-13 17:21:30 +03:00
|
|
|
if (chunk_hdr & 0x8000) {
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Decompress a chunk and return if we get an error. */
|
2021-08-13 17:21:30 +03:00
|
|
|
ssize_t err =
|
|
|
|
decompress_chunk(unc_chunk, unc_end,
|
|
|
|
cmpr_chunk + sizeof(chunk_hdr),
|
|
|
|
cmpr_chunk + cmpr_use);
|
|
|
|
if (err < 0)
|
|
|
|
return err;
|
|
|
|
unc_use = err;
|
|
|
|
} else {
|
2021-08-03 14:57:09 +03:00
|
|
|
/* This chunk does not contain compressed data. */
|
2021-08-13 17:21:30 +03:00
|
|
|
unc_use = unc_chunk + LZNT_CHUNK_SIZE > unc_end
|
|
|
|
? unc_end - unc_chunk
|
|
|
|
: LZNT_CHUNK_SIZE;
|
|
|
|
|
|
|
|
if (cmpr_chunk + sizeof(chunk_hdr) + unc_use >
|
|
|
|
cmpr_end) {
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
memcpy(unc_chunk, cmpr_chunk + sizeof(chunk_hdr),
|
|
|
|
unc_use);
|
|
|
|
}
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Advance pointers. */
|
2021-08-13 17:21:30 +03:00
|
|
|
cmpr_chunk += cmpr_use;
|
|
|
|
unc_chunk += unc_use;
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Check for the end of unc buffer. */
|
2021-08-13 17:21:30 +03:00
|
|
|
if (unc_chunk >= unc_end)
|
|
|
|
break;
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Proceed the next chunk. */
|
2021-08-13 17:21:30 +03:00
|
|
|
if (cmpr_chunk > cmpr_end - 2)
|
|
|
|
break;
|
|
|
|
|
|
|
|
chunk_size_saved = LZNT_CHUNK_SIZE;
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Read chunk header. */
|
2021-08-13 17:21:30 +03:00
|
|
|
chunk_hdr = cmpr_chunk[1];
|
|
|
|
chunk_hdr <<= 8;
|
|
|
|
chunk_hdr |= cmpr_chunk[0];
|
|
|
|
|
|
|
|
if (!chunk_hdr)
|
|
|
|
break;
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Check the size of unc buffer. */
|
2021-08-13 17:21:30 +03:00
|
|
|
if (unc_use < chunk_size_saved) {
|
|
|
|
size_t t1 = chunk_size_saved - unc_use;
|
|
|
|
u8 *t2 = unc_chunk + t1;
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* 'Zero' memory. */
|
2021-08-13 17:21:30 +03:00
|
|
|
if (t2 >= unc_end)
|
|
|
|
break;
|
|
|
|
|
|
|
|
memset(unc_chunk, 0, t1);
|
|
|
|
unc_chunk = t2;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-08-03 14:57:09 +03:00
|
|
|
/* Check compression boundary. */
|
2021-08-13 17:21:30 +03:00
|
|
|
if (cmpr_chunk > cmpr_end)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* The unc size is just a difference between current
|
2021-08-03 14:57:09 +03:00
|
|
|
* pointer and original one.
|
2021-08-13 17:21:30 +03:00
|
|
|
*/
|
|
|
|
return PtrOffset(unc, unc_chunk);
|
|
|
|
}
|