forked from pool/brotli
1376 lines
69 KiB
Diff
1376 lines
69 KiB
Diff
|
From d0ffe60b87aa5ec302fcb031c8ebf726c1a1692a Mon Sep 17 00:00:00 2001
|
||
|
From: Eugene Kliuchnikov <eustas@google.com>
|
||
|
Date: Wed, 24 Oct 2018 16:06:09 +0200
|
||
|
Subject: [PATCH] Verbose CLI + start pulling "Shared-Brotli" (#722)
|
||
|
|
||
|
* Verbose CLI + start pulling "Shared-Brotli"
|
||
|
|
||
|
* verbose CLI output; fix #666
|
||
|
* pull `SHIFT` transforms; currently this is semantically dead code;
|
||
|
later it will be used by "Shared-Brotli"
|
||
|
---
|
||
|
c/common/transform.c | 56 +++
|
||
|
c/common/transform.h | 5 +
|
||
|
c/enc/backward_references.h | 6 +-
|
||
|
c/enc/backward_references_hq.c | 11 +-
|
||
|
c/enc/backward_references_hq.h | 10 +-
|
||
|
c/enc/backward_references_inc.h | 6 +-
|
||
|
c/enc/encode.c | 2 -
|
||
|
c/enc/encoder_dict.c | 1 -
|
||
|
c/tools/brotli.c | 54 ++-
|
||
|
java/org/brotli/dec/BrotliInputStream.java | 12 +-
|
||
|
java/org/brotli/dec/Decode.java | 63 ++-
|
||
|
java/org/brotli/dec/SynthTest.java | 513 ++++++++++++++++++++-
|
||
|
java/org/brotli/dec/Transform.java | 183 ++++++--
|
||
|
java/org/brotli/dec/TransformTest.java | 14 +-
|
||
|
14 files changed, 848 insertions(+), 88 deletions(-)
|
||
|
|
||
|
diff --git a/c/common/transform.c b/c/common/transform.c
|
||
|
index 426e635f..c182053d 100755
|
||
|
--- a/c/common/transform.c
|
||
|
+++ b/c/common/transform.c
|
||
|
@@ -166,6 +166,7 @@ static BrotliTransforms kBrotliTransforms = {
|
||
|
kPrefixSuffixMap,
|
||
|
sizeof(kTransformsData) / (3 * sizeof(kTransformsData[0])),
|
||
|
kTransformsData,
|
||
|
+ NULL, /* no extra parameters */
|
||
|
{0, 12, 27, 23, 42, 63, 56, 48, 59, 64}
|
||
|
};
|
||
|
|
||
|
@@ -190,6 +191,48 @@ static int ToUpperCase(uint8_t* p) {
|
||
|
return 3;
|
||
|
}
|
||
|
|
||
|
+static int Shift(uint8_t* word, int word_len, uint16_t parameter) {
|
||
|
+ /* Limited sign extension: scalar < (1 << 24). */
|
||
|
+ uint32_t scalar =
|
||
|
+ (parameter & 0x7FFFu) + (0x1000000u - (parameter & 0x8000u));
|
||
|
+ if (word[0] < 0x80) {
|
||
|
+ /* 1-byte rune / 0sssssss / 7 bit scalar (ASCII). */
|
||
|
+ scalar += (uint32_t)word[0];
|
||
|
+ word[0] = (uint8_t)(scalar & 0x7Fu);
|
||
|
+ return 1;
|
||
|
+ } else if (word[0] < 0xC0) {
|
||
|
+ /* Continuation / 10AAAAAA. */
|
||
|
+ return 1;
|
||
|
+ } else if (word[0] < 0xE0) {
|
||
|
+ /* 2-byte rune / 110sssss AAssssss / 11 bit scalar. */
|
||
|
+ if (word_len < 2) return 1;
|
||
|
+ scalar += (uint32_t)((word[1] & 0x3Fu) | ((word[0] & 0x1Fu) << 6u));
|
||
|
+ word[0] = (uint8_t)(0xC0 | ((scalar >> 6u) & 0x1F));
|
||
|
+ word[1] = (uint8_t)((word[1] & 0xC0) | (scalar & 0x3F));
|
||
|
+ return 2;
|
||
|
+ } else if (word[0] < 0xF0) {
|
||
|
+ /* 3-byte rune / 1110ssss AAssssss BBssssss / 16 bit scalar. */
|
||
|
+ if (word_len < 3) return word_len;
|
||
|
+ scalar += (uint32_t)((word[2] & 0x3Fu) | ((word[1] & 0x3Fu) << 6u) |
|
||
|
+ ((word[0] & 0x0Fu) << 12u));
|
||
|
+ word[0] = (uint8_t)(0xE0 | ((scalar >> 12u) & 0x0F));
|
||
|
+ word[1] = (uint8_t)((word[1] & 0xC0) | ((scalar >> 6u) & 0x3F));
|
||
|
+ word[2] = (uint8_t)((word[2] & 0xC0) | (scalar & 0x3F));
|
||
|
+ return 3;
|
||
|
+ } else if (word[0] < 0xF8) {
|
||
|
+ /* 4-byte rune / 11110sss AAssssss BBssssss CCssssss / 21 bit scalar. */
|
||
|
+ if (word_len < 4) return word_len;
|
||
|
+ scalar += (uint32_t)((word[3] & 0x3Fu) | ((word[2] & 0x3Fu) << 6u) |
|
||
|
+ ((word[1] & 0x3Fu) << 12u) | ((word[0] & 0x07u) << 18u));
|
||
|
+ word[0] = (uint8_t)(0xF0 | ((scalar >> 18u) & 0x07));
|
||
|
+ word[1] = (uint8_t)((word[1] & 0xC0) | ((scalar >> 12u) & 0x3F));
|
||
|
+ word[2] = (uint8_t)((word[2] & 0xC0) | ((scalar >> 6u) & 0x3F));
|
||
|
+ word[3] = (uint8_t)((word[3] & 0xC0) | (scalar & 0x3F));
|
||
|
+ return 4;
|
||
|
+ }
|
||
|
+ return 1;
|
||
|
+}
|
||
|
+
|
||
|
int BrotliTransformDictionaryWord(uint8_t* dst, const uint8_t* word, int len,
|
||
|
const BrotliTransforms* transforms, int transform_idx) {
|
||
|
int idx = 0;
|
||
|
@@ -221,6 +264,19 @@ int BrotliTransformDictionaryWord(uint8_t* dst, const uint8_t* word, int len,
|
||
|
uppercase += step;
|
||
|
len -= step;
|
||
|
}
|
||
|
+ } else if (t == BROTLI_TRANSFORM_SHIFT_FIRST) {
|
||
|
+ uint16_t param = (uint16_t)(transforms->params[transform_idx * 2]
|
||
|
+ + (transforms->params[transform_idx * 2 + 1] << 8u));
|
||
|
+ Shift(&dst[idx - len], len, param);
|
||
|
+ } else if (t == BROTLI_TRANSFORM_SHIFT_ALL) {
|
||
|
+ uint16_t param = (uint16_t)(transforms->params[transform_idx * 2]
|
||
|
+ + (transforms->params[transform_idx * 2 + 1] << 8u));
|
||
|
+ uint8_t* shift = &dst[idx - len];
|
||
|
+ while (len > 0) {
|
||
|
+ int step = Shift(shift, len, param);
|
||
|
+ shift += step;
|
||
|
+ len -= step;
|
||
|
+ }
|
||
|
}
|
||
|
}
|
||
|
{
|
||
|
diff --git a/c/common/transform.h b/c/common/transform.h
|
||
|
index 456c12db..b6f86cc7 100755
|
||
|
--- a/c/common/transform.h
|
||
|
+++ b/c/common/transform.h
|
||
|
@@ -37,6 +37,8 @@ enum BrotliWordTransformType {
|
||
|
BROTLI_TRANSFORM_OMIT_FIRST_7 = 18,
|
||
|
BROTLI_TRANSFORM_OMIT_FIRST_8 = 19,
|
||
|
BROTLI_TRANSFORM_OMIT_FIRST_9 = 20,
|
||
|
+ BROTLI_TRANSFORM_SHIFT_FIRST = 21,
|
||
|
+ BROTLI_TRANSFORM_SHIFT_ALL = 22,
|
||
|
BROTLI_NUM_TRANSFORM_TYPES /* Counts transforms, not a transform itself. */
|
||
|
};
|
||
|
|
||
|
@@ -50,6 +52,9 @@ typedef struct BrotliTransforms {
|
||
|
uint32_t num_transforms;
|
||
|
/* Each entry is a [prefix_id, transform, suffix_id] triplet. */
|
||
|
const uint8_t* transforms;
|
||
|
+ /* Shift for BROTLI_TRANSFORM_SHIFT_FIRST and BROTLI_TRANSFORM_SHIFT_ALL,
|
||
|
+ must be NULL if and only if no such transforms are present. */
|
||
|
+ const uint8_t* params;
|
||
|
/* Indices of transforms like ["", BROTLI_TRANSFORM_OMIT_LAST_#, ""].
|
||
|
0-th element corresponds to ["", BROTLI_TRANSFORM_IDENTITY, ""].
|
||
|
-1, if cut-off transform does not exist. */
|
||
|
diff --git a/c/enc/backward_references.h b/c/enc/backward_references.h
|
||
|
index 3a414664..f82a80da 100644
|
||
|
--- a/c/enc/backward_references.h
|
||
|
+++ b/c/enc/backward_references.h
|
||
|
@@ -25,9 +25,9 @@ extern "C" {
|
||
|
initially the total amount of commands output by previous
|
||
|
CreateBackwardReferences calls, and must be incremented by the amount written
|
||
|
by this call. */
|
||
|
-BROTLI_INTERNAL void BrotliCreateBackwardReferences(
|
||
|
- size_t num_bytes, size_t position, const uint8_t* ringbuffer,
|
||
|
- size_t ringbuffer_mask, const BrotliEncoderParams* params,
|
||
|
+BROTLI_INTERNAL void BrotliCreateBackwardReferences(size_t num_bytes,
|
||
|
+ size_t position, const uint8_t* ringbuffer, size_t ringbuffer_mask,
|
||
|
+ const BrotliEncoderParams* params,
|
||
|
HasherHandle hasher, int* dist_cache, size_t* last_insert_len,
|
||
|
Command* commands, size_t* num_commands, size_t* num_literals);
|
||
|
|
||
|
diff --git a/c/enc/backward_references_hq.c b/c/enc/backward_references_hq.c
|
||
|
index 96b0e708..5737f752 100644
|
||
|
--- a/c/enc/backward_references_hq.c
|
||
|
+++ b/c/enc/backward_references_hq.c
|
||
|
@@ -419,8 +419,8 @@ static size_t UpdateNodes(
|
||
|
size_t k;
|
||
|
size_t gap = 0;
|
||
|
|
||
|
- EvaluateNode(block_start, pos, max_backward_limit, gap, starting_dist_cache,
|
||
|
- model, queue, nodes);
|
||
|
+ EvaluateNode(block_start, pos, max_backward_limit, gap,
|
||
|
+ starting_dist_cache, model, queue, nodes);
|
||
|
|
||
|
{
|
||
|
const PosData* posdata = StartPosQueueAt(queue, 0);
|
||
|
@@ -587,9 +587,10 @@ void BrotliZopfliCreateCommands(const size_t num_bytes,
|
||
|
{
|
||
|
size_t distance = ZopfliNodeCopyDistance(next);
|
||
|
size_t len_code = ZopfliNodeLengthCode(next);
|
||
|
- size_t max_distance =
|
||
|
- BROTLI_MIN(size_t, block_start + pos, max_backward_limit);
|
||
|
- BROTLI_BOOL is_dictionary = TO_BROTLI_BOOL(distance > max_distance + gap);
|
||
|
+ size_t max_distance = BROTLI_MIN(size_t,
|
||
|
+ block_start + pos, max_backward_limit);
|
||
|
+ BROTLI_BOOL is_dictionary =
|
||
|
+ TO_BROTLI_BOOL(distance > max_distance + gap);
|
||
|
size_t dist_code = ZopfliNodeDistanceCode(next);
|
||
|
InitCommand(&commands[i], &params->dist, insert_length,
|
||
|
copy_length, (int)len_code - (int)copy_length, dist_code);
|
||
|
diff --git a/c/enc/backward_references_hq.h b/c/enc/backward_references_hq.h
|
||
|
index 1e4275d4..fb1ff3fa 100644
|
||
|
--- a/c/enc/backward_references_hq.h
|
||
|
+++ b/c/enc/backward_references_hq.h
|
||
|
@@ -23,14 +23,16 @@ extern "C" {
|
||
|
#endif
|
||
|
|
||
|
BROTLI_INTERNAL void BrotliCreateZopfliBackwardReferences(MemoryManager* m,
|
||
|
- size_t num_bytes, size_t position, const uint8_t* ringbuffer,
|
||
|
- size_t ringbuffer_mask, const BrotliEncoderParams* params,
|
||
|
+ size_t num_bytes,
|
||
|
+ size_t position, const uint8_t* ringbuffer, size_t ringbuffer_mask,
|
||
|
+ const BrotliEncoderParams* params,
|
||
|
HasherHandle hasher, int* dist_cache, size_t* last_insert_len,
|
||
|
Command* commands, size_t* num_commands, size_t* num_literals);
|
||
|
|
||
|
BROTLI_INTERNAL void BrotliCreateHqZopfliBackwardReferences(MemoryManager* m,
|
||
|
- size_t num_bytes, size_t position, const uint8_t* ringbuffer,
|
||
|
- size_t ringbuffer_mask, const BrotliEncoderParams* params,
|
||
|
+ size_t num_bytes,
|
||
|
+ size_t position, const uint8_t* ringbuffer, size_t ringbuffer_mask,
|
||
|
+ const BrotliEncoderParams* params,
|
||
|
HasherHandle hasher, int* dist_cache, size_t* last_insert_len,
|
||
|
Command* commands, size_t* num_commands, size_t* num_literals);
|
||
|
|
||
|
diff --git a/c/enc/backward_references_inc.h b/c/enc/backward_references_inc.h
|
||
|
index c18cdb00..e29daf33 100644
|
||
|
--- a/c/enc/backward_references_inc.h
|
||
|
+++ b/c/enc/backward_references_inc.h
|
||
|
@@ -60,7 +60,8 @@ static BROTLI_NOINLINE void EXPORT_FN(CreateBackwardReferences)(
|
||
|
FN(FindLongestMatch)(hasher,
|
||
|
&params->dictionary,
|
||
|
ringbuffer, ringbuffer_mask, dist_cache, position + 1, max_length,
|
||
|
- max_distance, gap, params->dist.max_distance, &sr2);
|
||
|
+ max_distance, gap, params->dist.max_distance,
|
||
|
+ &sr2);
|
||
|
if (sr2.score >= sr.score + cost_diff_lazy) {
|
||
|
/* Ok, let's just write one byte for now and start a match from the
|
||
|
next byte. */
|
||
|
@@ -76,7 +77,8 @@ static BROTLI_NOINLINE void EXPORT_FN(CreateBackwardReferences)(
|
||
|
}
|
||
|
apply_random_heuristics =
|
||
|
position + 2 * sr.len + random_heuristics_window_size;
|
||
|
- max_distance = BROTLI_MIN(size_t, position, max_backward_limit);
|
||
|
+ max_distance = BROTLI_MIN(size_t,
|
||
|
+ position, max_backward_limit);
|
||
|
{
|
||
|
/* The first 16 codes are special short-codes,
|
||
|
and the minimum offset is 1. */
|
||
|
diff --git a/c/enc/encode.c b/c/enc/encode.c
|
||
|
index 141e70aa..c82f2d3f 100644
|
||
|
--- a/c/enc/encode.c
|
||
|
+++ b/c/enc/encode.c
|
||
|
@@ -114,8 +114,6 @@ typedef struct BrotliEncoderStateStruct {
|
||
|
BROTLI_BOOL is_initialized_;
|
||
|
} BrotliEncoderStateStruct;
|
||
|
|
||
|
-static BROTLI_BOOL EnsureInitialized(BrotliEncoderState* s);
|
||
|
-
|
||
|
static size_t InputBlockSize(BrotliEncoderState* s) {
|
||
|
return (size_t)1 << s->params.lgblock;
|
||
|
}
|
||
|
diff --git a/c/enc/encoder_dict.c b/c/enc/encoder_dict.c
|
||
|
index 8b2f6ad4..e58ca670 100755
|
||
|
--- a/c/enc/encoder_dict.c
|
||
|
+++ b/c/enc/encoder_dict.c
|
||
|
@@ -24,7 +24,6 @@ void BrotliInitEncoderDictionary(BrotliEncoderDictionary* dict) {
|
||
|
|
||
|
dict->cutoffTransformsCount = kCutoffTransformsCount;
|
||
|
dict->cutoffTransforms = kCutoffTransforms;
|
||
|
-
|
||
|
}
|
||
|
|
||
|
#if defined(__cplusplus) || defined(c_plusplus)
|
||
|
diff --git a/c/tools/brotli.c b/c/tools/brotli.c
|
||
|
index ce05b641..838539ad 100644
|
||
|
--- a/c/tools/brotli.c
|
||
|
+++ b/c/tools/brotli.c
|
||
|
@@ -86,10 +86,10 @@ typedef struct {
|
||
|
/* Parameters */
|
||
|
int quality;
|
||
|
int lgwin;
|
||
|
+ int verbosity;
|
||
|
BROTLI_BOOL force_overwrite;
|
||
|
BROTLI_BOOL junk_source;
|
||
|
BROTLI_BOOL copy_stat;
|
||
|
- BROTLI_BOOL verbose;
|
||
|
BROTLI_BOOL write_to_stdout;
|
||
|
BROTLI_BOOL test_integrity;
|
||
|
BROTLI_BOOL decompress;
|
||
|
@@ -121,6 +121,12 @@ typedef struct {
|
||
|
const uint8_t* next_in;
|
||
|
size_t available_out;
|
||
|
uint8_t* next_out;
|
||
|
+
|
||
|
+ /* Reporting */
|
||
|
+ /* size_t would be large enough,
|
||
|
+ until 4GiB+ files are compressed / decompressed on 32-bit CPUs. */
|
||
|
+ size_t total_in;
|
||
|
+ size_t total_out;
|
||
|
} Context;
|
||
|
|
||
|
/* Parse up to 5 decimal digits. */
|
||
|
@@ -279,11 +285,11 @@ static Command ParseParams(Context* params) {
|
||
|
command = COMMAND_TEST_INTEGRITY;
|
||
|
continue;
|
||
|
} else if (c == 'v') {
|
||
|
- if (params->verbose) {
|
||
|
+ if (params->verbosity > 0) {
|
||
|
fprintf(stderr, "argument --verbose / -v already set\n");
|
||
|
return COMMAND_INVALID;
|
||
|
}
|
||
|
- params->verbose = BROTLI_TRUE;
|
||
|
+ params->verbosity = 1;
|
||
|
continue;
|
||
|
} else if (c == 'V') {
|
||
|
/* Don't parse further. */
|
||
|
@@ -415,11 +421,11 @@ static Command ParseParams(Context* params) {
|
||
|
command_set = BROTLI_TRUE;
|
||
|
command = COMMAND_TEST_INTEGRITY;
|
||
|
} else if (strcmp("verbose", arg) == 0) {
|
||
|
- if (params->verbose) {
|
||
|
+ if (params->verbosity > 0) {
|
||
|
fprintf(stderr, "argument --verbose / -v already set\n");
|
||
|
return COMMAND_INVALID;
|
||
|
}
|
||
|
- params->verbose = BROTLI_TRUE;
|
||
|
+ params->verbosity = 1;
|
||
|
} else if (strcmp("version", arg) == 0) {
|
||
|
/* Don't parse further. */
|
||
|
return COMMAND_VERSION;
|
||
|
@@ -787,6 +793,8 @@ static void InitializeBuffers(Context* context) {
|
||
|
context->next_in = NULL;
|
||
|
context->available_out = kFileBufferSize;
|
||
|
context->next_out = context->output;
|
||
|
+ context->total_in = 0;
|
||
|
+ context->total_out = 0;
|
||
|
}
|
||
|
|
||
|
static BROTLI_BOOL HasMoreInput(Context* context) {
|
||
|
@@ -796,6 +804,7 @@ static BROTLI_BOOL HasMoreInput(Context* context) {
|
||
|
static BROTLI_BOOL ProvideInput(Context* context) {
|
||
|
context->available_in =
|
||
|
fread(context->input, 1, kFileBufferSize, context->fin);
|
||
|
+ context->total_in += context->available_in;
|
||
|
context->next_in = context->input;
|
||
|
if (ferror(context->fin)) {
|
||
|
fprintf(stderr, "failed to read input [%s]: %s\n",
|
||
|
@@ -808,6 +817,7 @@ static BROTLI_BOOL ProvideInput(Context* context) {
|
||
|
/* Internal: should be used only in Provide-/Flush-Output. */
|
||
|
static BROTLI_BOOL WriteOutput(Context* context) {
|
||
|
size_t out_size = (size_t)(context->next_out - context->output);
|
||
|
+ context->total_out += out_size;
|
||
|
if (out_size == 0) return BROTLI_TRUE;
|
||
|
if (context->test_integrity) return BROTLI_TRUE;
|
||
|
|
||
|
@@ -833,6 +843,25 @@ static BROTLI_BOOL FlushOutput(Context* context) {
|
||
|
return BROTLI_TRUE;
|
||
|
}
|
||
|
|
||
|
+static void PrintBytes(size_t value) {
|
||
|
+ if (value < 1024) {
|
||
|
+ fprintf(stderr, "%d B", (int)value);
|
||
|
+ } else if (value < 1048576) {
|
||
|
+ fprintf(stderr, "%0.3f KiB", (double)value / 1024.0);
|
||
|
+ } else if (value < 1073741824) {
|
||
|
+ fprintf(stderr, "%0.3f MiB", (double)value / 1048576.0);
|
||
|
+ } else {
|
||
|
+ fprintf(stderr, "%0.3f GiB", (double)value / 1073741824.0);
|
||
|
+ }
|
||
|
+}
|
||
|
+
|
||
|
+static void PrintFileProcessingProgress(Context* context) {
|
||
|
+ fprintf(stderr, "[%s]: ", PrintablePath(context->current_input_path));
|
||
|
+ PrintBytes(context->total_in);
|
||
|
+ fprintf(stderr, " -> ");
|
||
|
+ PrintBytes(context->total_out);
|
||
|
+}
|
||
|
+
|
||
|
static BROTLI_BOOL DecompressFile(Context* context, BrotliDecoderState* s) {
|
||
|
BrotliDecoderResult result = BROTLI_DECODER_RESULT_NEEDS_MORE_INPUT;
|
||
|
InitializeBuffers(context);
|
||
|
@@ -853,6 +882,11 @@ static BROTLI_BOOL DecompressFile(Context* context, BrotliDecoderState* s) {
|
||
|
PrintablePath(context->current_input_path));
|
||
|
return BROTLI_FALSE;
|
||
|
}
|
||
|
+ if (context->verbosity > 0) {
|
||
|
+ fprintf(stderr, "Decompressed ");
|
||
|
+ PrintFileProcessingProgress(context);
|
||
|
+ fprintf(stderr, "\n");
|
||
|
+ }
|
||
|
return BROTLI_TRUE;
|
||
|
} else {
|
||
|
fprintf(stderr, "corrupt input [%s]\n",
|
||
|
@@ -915,7 +949,13 @@ static BROTLI_BOOL CompressFile(Context* context, BrotliEncoderState* s) {
|
||
|
}
|
||
|
|
||
|
if (BrotliEncoderIsFinished(s)) {
|
||
|
- return FlushOutput(context);
|
||
|
+ if (!FlushOutput(context)) return BROTLI_FALSE;
|
||
|
+ if (context->verbosity > 0) {
|
||
|
+ fprintf(stderr, "Compressed ");
|
||
|
+ PrintFileProcessingProgress(context);
|
||
|
+ fprintf(stderr, "\n");
|
||
|
+ }
|
||
|
+ return BROTLI_TRUE;
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
@@ -979,11 +1019,11 @@ int main(int argc, char** argv) {
|
||
|
|
||
|
context.quality = 11;
|
||
|
context.lgwin = -1;
|
||
|
+ context.verbosity = 0;
|
||
|
context.force_overwrite = BROTLI_FALSE;
|
||
|
context.junk_source = BROTLI_FALSE;
|
||
|
context.copy_stat = BROTLI_TRUE;
|
||
|
context.test_integrity = BROTLI_FALSE;
|
||
|
- context.verbose = BROTLI_FALSE;
|
||
|
context.write_to_stdout = BROTLI_FALSE;
|
||
|
context.decompress = BROTLI_FALSE;
|
||
|
context.large_window = BROTLI_FALSE;
|
||
|
diff --git a/java/org/brotli/dec/BrotliInputStream.java b/java/org/brotli/dec/BrotliInputStream.java
|
||
|
index a27e9284..5cc2e284 100644
|
||
|
--- a/java/org/brotli/dec/BrotliInputStream.java
|
||
|
+++ b/java/org/brotli/dec/BrotliInputStream.java
|
||
|
@@ -85,7 +85,17 @@ public BrotliInputStream(InputStream source, int byteReadBufferSize) throws IOEx
|
||
|
}
|
||
|
|
||
|
public void setEager(boolean eager) {
|
||
|
- state.isEager = eager ? 1 : 0;
|
||
|
+ boolean isEager = (state.isEager != 0);
|
||
|
+ if (eager == isEager) {
|
||
|
+ /* Shortcut for no-op change. */
|
||
|
+ return;
|
||
|
+ }
|
||
|
+ if (eager) {
|
||
|
+ Decode.setEager(state);
|
||
|
+ } else {
|
||
|
+ /* Once decoder is "eager", there is no way back. */
|
||
|
+ throw new IllegalStateException("Brotli decoder has been already switched to eager mode");
|
||
|
+ }
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
diff --git a/java/org/brotli/dec/Decode.java b/java/org/brotli/dec/Decode.java
|
||
|
index 9e3d43b0..60bf9c61 100644
|
||
|
--- a/java/org/brotli/dec/Decode.java
|
||
|
+++ b/java/org/brotli/dec/Decode.java
|
||
|
@@ -18,18 +18,19 @@
|
||
|
// RunningState
|
||
|
//----------------------------------------------------------------------------
|
||
|
private static final int UNINITIALIZED = 0;
|
||
|
- private static final int BLOCK_START = 1;
|
||
|
- private static final int COMPRESSED_BLOCK_START = 2;
|
||
|
- private static final int MAIN_LOOP = 3;
|
||
|
- private static final int READ_METADATA = 4;
|
||
|
- private static final int COPY_UNCOMPRESSED = 5;
|
||
|
- private static final int INSERT_LOOP = 6;
|
||
|
- private static final int COPY_LOOP = 7;
|
||
|
- private static final int TRANSFORM = 8;
|
||
|
- private static final int FINISHED = 9;
|
||
|
- private static final int CLOSED = 10;
|
||
|
- private static final int INIT_WRITE = 11;
|
||
|
- private static final int WRITE = 12;
|
||
|
+ private static final int INITIALIZED = 1;
|
||
|
+ private static final int BLOCK_START = 2;
|
||
|
+ private static final int COMPRESSED_BLOCK_START = 3;
|
||
|
+ private static final int MAIN_LOOP = 4;
|
||
|
+ private static final int READ_METADATA = 5;
|
||
|
+ private static final int COPY_UNCOMPRESSED = 6;
|
||
|
+ private static final int INSERT_LOOP = 7;
|
||
|
+ private static final int COPY_LOOP = 8;
|
||
|
+ private static final int TRANSFORM = 9;
|
||
|
+ private static final int FINISHED = 10;
|
||
|
+ private static final int CLOSED = 11;
|
||
|
+ private static final int INIT_WRITE = 12;
|
||
|
+ private static final int WRITE = 13;
|
||
|
|
||
|
private static final int DEFAULT_CODE_LENGTH = 8;
|
||
|
private static final int CODE_LENGTH_REPEAT_CODE = 16;
|
||
|
@@ -139,6 +140,20 @@ private static int decodeWindowBits(State s) {
|
||
|
return 17;
|
||
|
}
|
||
|
|
||
|
+ /**
|
||
|
+ * Switch decoder to "eager" mode.
|
||
|
+ *
|
||
|
+ * In "eager" mode decoder returns as soon as there is enough data to fill output buffer.
|
||
|
+ *
|
||
|
+ * @param s initialized state, before any read is performed.
|
||
|
+ */
|
||
|
+ static void setEager(State s) {
|
||
|
+ if (s.runningState != INITIALIZED) {
|
||
|
+ throw new IllegalStateException("State MUST be freshly initialized");
|
||
|
+ }
|
||
|
+ s.isEager = 1;
|
||
|
+ }
|
||
|
+
|
||
|
/**
|
||
|
* Associate input with decoder state.
|
||
|
*
|
||
|
@@ -152,13 +167,7 @@ static void initState(State s, InputStream input) {
|
||
|
s.blockTrees = new int[6 * HUFFMAN_TABLE_SIZE];
|
||
|
s.input = input;
|
||
|
BitReader.initBitReader(s);
|
||
|
- int windowBits = decodeWindowBits(s);
|
||
|
- if (windowBits == 9) { /* Reserved case for future expansion. */
|
||
|
- throw new BrotliRuntimeException("Invalid 'windowBits' code");
|
||
|
- }
|
||
|
- s.maxRingBufferSize = 1 << windowBits;
|
||
|
- s.maxBackwardDistance = s.maxRingBufferSize - 16;
|
||
|
- s.runningState = BLOCK_START;
|
||
|
+ s.runningState = INITIALIZED;
|
||
|
}
|
||
|
|
||
|
static void close(State s) throws IOException {
|
||
|
@@ -727,6 +736,16 @@ static void decompress(State s) {
|
||
|
if (s.runningState == CLOSED) {
|
||
|
throw new IllegalStateException("Can't decompress after close");
|
||
|
}
|
||
|
+ if (s.runningState == INITIALIZED) {
|
||
|
+ int windowBits = decodeWindowBits(s);
|
||
|
+ if (windowBits == 9) { /* Reserved case for future expansion. */
|
||
|
+ throw new BrotliRuntimeException("Invalid 'windowBits' code");
|
||
|
+ }
|
||
|
+ s.maxRingBufferSize = 1 << windowBits;
|
||
|
+ s.maxBackwardDistance = s.maxRingBufferSize - 16;
|
||
|
+ s.runningState = BLOCK_START;
|
||
|
+ }
|
||
|
+
|
||
|
int fence = calculateFence(s);
|
||
|
int ringBufferMask = s.ringBufferSize - 1;
|
||
|
byte[] ringBuffer = s.ringBuffer;
|
||
|
@@ -935,9 +954,9 @@ static void decompress(State s) {
|
||
|
int wordIdx = wordId & mask;
|
||
|
int transformIdx = wordId >>> shift;
|
||
|
offset += wordIdx * s.copyLength;
|
||
|
- if (transformIdx < Transform.NUM_TRANSFORMS) {
|
||
|
- int len = Transform.transformDictionaryWord(ringBuffer, s.pos,
|
||
|
- Dictionary.getData(), offset, s.copyLength, transformIdx);
|
||
|
+ if (transformIdx < Transform.NUM_RFC_TRANSFORMS) {
|
||
|
+ int len = Transform.transformDictionaryWord(ringBuffer, s.pos, Dictionary.getData(),
|
||
|
+ offset, s.copyLength, Transform.RFC_TRANSFORMS, transformIdx);
|
||
|
s.pos += len;
|
||
|
s.metaBlockLength -= len;
|
||
|
if (s.pos >= fence) {
|
||
|
diff --git a/java/org/brotli/dec/SynthTest.java b/java/org/brotli/dec/SynthTest.java
|
||
|
index c95a3c90..de91c377 100644
|
||
|
--- a/java/org/brotli/dec/SynthTest.java
|
||
|
+++ b/java/org/brotli/dec/SynthTest.java
|
||
|
@@ -64,6 +64,474 @@ private void checkSynth(byte[] compressed, boolean expectSuccess,
|
||
|
|
||
|
/* GENERATED CODE START */
|
||
|
|
||
|
+ @Test
|
||
|
+ public void testAllTransforms10() {
|
||
|
+ byte[] compressed = {
|
||
|
+ (byte) 0x1b, (byte) 0xfc, (byte) 0x05, (byte) 0x00, (byte) 0x00, (byte) 0x00, (byte) 0x80,
|
||
|
+ (byte) 0xe3, (byte) 0xb4, (byte) 0x0d, (byte) 0x00, (byte) 0x00, (byte) 0x07, (byte) 0x5b,
|
||
|
+ (byte) 0x26, (byte) 0x31, (byte) 0x40, (byte) 0x02, (byte) 0x00, (byte) 0xe0, (byte) 0x4e,
|
||
|
+ (byte) 0x1b, (byte) 0x13, (byte) 0x7c, (byte) 0x84, (byte) 0x26, (byte) 0xf8, (byte) 0x04,
|
||
|
+ (byte) 0x10, (byte) 0x4c, (byte) 0xf0, (byte) 0x89, (byte) 0x38, (byte) 0x30, (byte) 0xc1,
|
||
|
+ (byte) 0x27, (byte) 0x4e, (byte) 0xc1, (byte) 0x04, (byte) 0x9f, (byte) 0x64, (byte) 0x06,
|
||
|
+ (byte) 0x26, (byte) 0xf8, (byte) 0x24, (byte) 0x3f, (byte) 0x34, (byte) 0xc1, (byte) 0x27,
|
||
|
+ (byte) 0x7d, (byte) 0x82, (byte) 0x09, (byte) 0x3e, (byte) 0xe9, (byte) 0x16, (byte) 0x4d,
|
||
|
+ (byte) 0xf0, (byte) 0xc9, (byte) 0xd2, (byte) 0xc0, (byte) 0x04, (byte) 0x9f, (byte) 0x0c,
|
||
|
+ (byte) 0x8f, (byte) 0x4c, (byte) 0xf0, (byte) 0xc9, (byte) 0x06, (byte) 0xd1, (byte) 0x04,
|
||
|
+ (byte) 0x9f, (byte) 0x6c, (byte) 0x92, (byte) 0x4d, (byte) 0xf0, (byte) 0xc9, (byte) 0x39,
|
||
|
+ (byte) 0xc1, (byte) 0x04, (byte) 0x9f, (byte) 0xdc, (byte) 0x94, (byte) 0x4c, (byte) 0xf0,
|
||
|
+ (byte) 0xc9, (byte) 0x69, (byte) 0xd1, (byte) 0x04, (byte) 0x9f, (byte) 0x3c, (byte) 0x98,
|
||
|
+ (byte) 0x4d, (byte) 0xf0, (byte) 0x29, (byte) 0x9c, (byte) 0x81, (byte) 0x09, (byte) 0x3e,
|
||
|
+ (byte) 0x45, (byte) 0x37, (byte) 0x31, (byte) 0xc1, (byte) 0xa7, (byte) 0x60, (byte) 0x47,
|
||
|
+ (byte) 0x26, (byte) 0xf8, (byte) 0x14, (byte) 0xfa, (byte) 0xcc, (byte) 0x04, (byte) 0x9f,
|
||
|
+ (byte) 0xc2, (byte) 0x20, (byte) 0x9a, (byte) 0xe0, (byte) 0x53, (byte) 0x48, (byte) 0x54,
|
||
|
+ (byte) 0x13, (byte) 0x7c, (byte) 0x8a, (byte) 0x8f, (byte) 0x6c, (byte) 0x82, (byte) 0x4f,
|
||
|
+ (byte) 0xb1, (byte) 0xd2, (byte) 0x4d, (byte) 0xf0, (byte) 0x29, (byte) 0x67, (byte) 0x82,
|
||
|
+ (byte) 0x09, (byte) 0x3e, (byte) 0xe5, (byte) 0x4f, (byte) 0x31, (byte) 0xc1, (byte) 0xa7,
|
||
|
+ (byte) 0x7c, (byte) 0x4a, (byte) 0x26, (byte) 0xf8, (byte) 0x94, (byte) 0x57, (byte) 0xcd,
|
||
|
+ (byte) 0x04, (byte) 0x9f, (byte) 0x12, (byte) 0x2c, (byte) 0x9a, (byte) 0xe0, (byte) 0x53,
|
||
|
+ (byte) 0xba, (byte) 0x55, (byte) 0x13, (byte) 0x7c, (byte) 0xca, (byte) 0xbf, (byte) 0x6c,
|
||
|
+ (byte) 0x82, (byte) 0x4f, (byte) 0xb9, (byte) 0xd8, (byte) 0x4d, (byte) 0xf0, (byte) 0xa9,
|
||
|
+ (byte) 0x30, (byte) 0x03, (byte) 0x13, (byte) 0x7c, (byte) 0x2a, (byte) 0xd2, (byte) 0xc2,
|
||
|
+ (byte) 0x04, (byte) 0x9f, (byte) 0x4a, (byte) 0x36, (byte) 0x31, (byte) 0xc1, (byte) 0xa7,
|
||
|
+ (byte) 0xca, (byte) 0x6d, (byte) 0x4c, (byte) 0xf0, (byte) 0xa9, (byte) 0x94, (byte) 0x23,
|
||
|
+ (byte) 0x13, (byte) 0x7c, (byte) 0x2a, (byte) 0xeb, (byte) 0xca, (byte) 0x04, (byte) 0x9f,
|
||
|
+ (byte) 0xea, (byte) 0x3c, (byte) 0x33, (byte) 0xc1, (byte) 0xa7, (byte) 0xb2, (byte) 0xef,
|
||
|
+ (byte) 0x4c, (byte) 0xf0, (byte) 0xa9, (byte) 0xf8, (byte) 0x43, (byte) 0x13, (byte) 0x7c,
|
||
|
+ (byte) 0xaa, (byte) 0x00, (byte) 0xd3, (byte) 0x04, (byte) 0x9f, (byte) 0x2a, (byte) 0x42,
|
||
|
+ (byte) 0x35, (byte) 0xc1, (byte) 0xa7, (byte) 0xc2, (byte) 0x70, (byte) 0x4d, (byte) 0xf0,
|
||
|
+ (byte) 0xa9, (byte) 0x52, (byte) 0x64, (byte) 0x13, (byte) 0x7c, (byte) 0x2a, (byte) 0x1a,
|
||
|
+ (byte) 0xdb, (byte) 0x04, (byte) 0x9f, (byte) 0x6a, (byte) 0x48, (byte) 0x37, (byte) 0xc1,
|
||
|
+ (byte) 0xa7, (byte) 0x92, (byte) 0xf2, (byte) 0x4d, (byte) 0xf0, (byte) 0xa9, (byte) 0xc3,
|
||
|
+ (byte) 0x04, (byte) 0x13, (byte) 0x7c, (byte) 0xea, (byte) 0x32, (byte) 0xc3, (byte) 0x04,
|
||
|
+ (byte) 0x9f, (byte) 0x7a, (byte) 0x4e, (byte) 0x31, (byte) 0xc1, (byte) 0xa7, (byte) 0x06,
|
||
|
+ (byte) 0x74, (byte) 0x4c, (byte) 0xf0, (byte) 0xa9, (byte) 0x19, (byte) 0x25, (byte) 0x13,
|
||
|
+ (byte) 0x7c, (byte) 0x6a, (byte) 0x4d, (byte) 0xcb, (byte) 0x04, (byte) 0x9f, (byte) 0x1a,
|
||
|
+ (byte) 0x55, (byte) 0x33, (byte) 0xc1, (byte) 0xa7, (byte) 0x56, (byte) 0xf5, (byte) 0x4c,
|
||
|
+ (byte) 0xf0, (byte) 0xa9, (byte) 0x5d, (byte) 0x45, (byte) 0x13, (byte) 0x7c, (byte) 0xea,
|
||
|
+ (byte) 0x59, (byte) 0xd3, (byte) 0x04, (byte) 0x9f, (byte) 0xfa, (byte) 0x57, (byte) 0x35,
|
||
|
+ (byte) 0xc1, (byte) 0xa7, (byte) 0x66, (byte) 0x76, (byte) 0x4d, (byte) 0xf0, (byte) 0xa9,
|
||
|
+ (byte) 0x9f, (byte) 0x65, (byte) 0x13, (byte) 0x7c, (byte) 0x6a, (byte) 0x6f, (byte) 0xdb,
|
||
|
+ (byte) 0x04, (byte) 0x9f, (byte) 0x9a, (byte) 0x5d, (byte) 0x37, (byte) 0xc1, (byte) 0xa7,
|
||
|
+ (byte) 0x06, (byte) 0xf8, (byte) 0x4d, (byte) 0xf0, (byte) 0x69, (byte) 0x0c, (byte) 0x06,
|
||
|
+ (byte) 0x26, (byte) 0xf8, (byte) 0x34, (byte) 0x08, (byte) 0x07, (byte) 0x13, (byte) 0x7c,
|
||
|
+ (byte) 0x1a, (byte) 0x8b, (byte) 0x85, (byte) 0x09, (byte) 0x3e, (byte) 0x8d, (byte) 0xc8,
|
||
|
+ (byte) 0xc3, (byte) 0x04, (byte) 0x9f, (byte) 0xe6, (byte) 0x65, (byte) 0x62, (byte) 0x82,
|
||
|
+ (byte) 0x4f, (byte) 0xb3, (byte) 0x73, (byte) 0x31, (byte) 0xc1, (byte) 0xa7, (byte) 0x41,
|
||
|
+ (byte) 0xda, (byte) 0x98, (byte) 0xe0, (byte) 0xd3, (byte) 0x54, (byte) 0x7d, (byte) 0x4c,
|
||
|
+ (byte) 0xf0, (byte) 0x69, (byte) 0xc4, (byte) 0x46, (byte) 0x26, (byte) 0xf8, (byte) 0x34,
|
||
|
+ (byte) 0x72, (byte) 0x27, (byte) 0x13, (byte) 0x7c, (byte) 0x1a, (byte) 0xc5, (byte) 0x95,
|
||
|
+ (byte) 0x09, (byte) 0x3e, (byte) 0x8d, (byte) 0xe5, (byte) 0xcb, (byte) 0x04, (byte) 0x9f,
|
||
|
+ (byte) 0x06, (byte) 0x75, (byte) 0x66, (byte) 0x82, (byte) 0x4f, (byte) 0x43, (byte) 0x7b,
|
||
|
+ (byte) 0x33, (byte) 0xc1, (byte) 0xa7, (byte) 0x09, (byte) 0xde, (byte) 0x99, (byte) 0xe0,
|
||
|
+ (byte) 0xd3, (byte) 0x34, (byte) 0xff, (byte) 0x4c, (byte) 0xf0, (byte) 0x69, (byte) 0xb2,
|
||
|
+ (byte) 0x87, (byte) 0x26, (byte) 0xf8, (byte) 0x34, (byte) 0xe9, (byte) 0x47, (byte) 0x13,
|
||
|
+ (byte) 0x7c, (byte) 0x9a, (byte) 0xfb, (byte) 0xa5, (byte) 0x09, (byte) 0x3e, (byte) 0x4d,
|
||
|
+ (byte) 0x01, (byte) 0xd4, (byte) 0x04, (byte) 0x9f, (byte) 0x46, (byte) 0x82, (byte) 0x6a,
|
||
|
+ (byte) 0x82, (byte) 0x4f, (byte) 0x03, (byte) 0x82, (byte) 0x35, (byte) 0xc1, (byte) 0xa7,
|
||
|
+ (byte) 0x61, (byte) 0xe1, (byte) 0x9a, (byte) 0xe0, (byte) 0xd3, (byte) 0xe4, (byte) 0x80,
|
||
|
+ (byte) 0x4d, (byte) 0xf0, (byte) 0x69, (byte) 0x8a, (byte) 0xc8, (byte) 0x26, (byte) 0xf8,
|
||
|
+ (byte) 0x34, (byte) 0x52, (byte) 0x68, (byte) 0x13, (byte) 0x7c, (byte) 0x9a, (byte) 0x2f,
|
||
|
+ (byte) 0xb6, (byte) 0x09, (byte) 0x3e, (byte) 0x8d, (byte) 0x1b, (byte) 0xdc, (byte) 0x04,
|
||
|
+ (byte) 0x9f, (byte) 0x86, (byte) 0x8f, (byte) 0x6e, (byte) 0x82, (byte) 0x4f, (byte) 0xb3,
|
||
|
+ (byte) 0x88, (byte) 0x37, (byte) 0xc1, (byte) 0xa7, (byte) 0xd9, (byte) 0xe4, (byte) 0x9b,
|
||
|
+ (byte) 0xe0, (byte) 0xd3, (byte) 0x9e, (byte) 0x02, (byte) 0x4c, (byte) 0xf0, (byte) 0x69,
|
||
|
+ (byte) 0x6d, (byte) 0x09, (byte) 0x26, (byte) 0xf8, (byte) 0xb4, (byte) 0xc3, (byte) 0x08,
|
||
|
+ (byte) 0x13, (byte) 0x7c, (byte) 0x5a, (byte) 0x68, (byte) 0x86, (byte) 0x09, (byte) 0x3e,
|
||
|
+ (byte) 0xad, (byte) 0x37, (byte) 0xc4, (byte) 0x04, (byte) 0x9f, (byte) 0x56, (byte) 0x9d,
|
||
|
+ (byte) 0x62, (byte) 0x82, (byte) 0x4f, (byte) 0x9b, (byte) 0x8f, (byte) 0x31, (byte) 0xc1,
|
||
|
+ (byte) 0xa7, (byte) 0x2d, (byte) 0xe8, (byte) 0x98, (byte) 0xe0, (byte) 0xd3, (byte) 0x4a,
|
||
|
+ (byte) 0x84, (byte) 0x4c, (byte) 0xf0, (byte) 0x69, (byte) 0x3f, (byte) 0x4a, (byte) 0x26,
|
||
|
+ (byte) 0xf8, (byte) 0xb4, (byte) 0x2c, (byte) 0x29, (byte) 0x13, (byte) 0x7c, (byte) 0xda,
|
||
|
+ (byte) 0x9c, (byte) 0x96, (byte) 0x09, (byte) 0x3e, (byte) 0x2d, (byte) 0x52, (byte) 0xcc,
|
||
|
+ (byte) 0x04, (byte) 0x9f, (byte) 0xb6, (byte) 0xaa, (byte) 0x66, (byte) 0x82, (byte) 0x4f,
|
||
|
+ (byte) 0x2b, (byte) 0x96, (byte) 0x33, (byte) 0xc1, (byte) 0xa7, (byte) 0x7d, (byte) 0xeb,
|
||
|
+ (byte) 0x99, (byte) 0xe0, (byte) 0xd3, (byte) 0xf6, (byte) 0x05, (byte) 0x4d, (byte) 0xf0,
|
||
|
+ (byte) 0x69, (byte) 0x17, (byte) 0x8b, (byte) 0x26, (byte) 0xf8, (byte) 0xb4, (byte) 0x97,
|
||
|
+ (byte) 0x49, (byte) 0x13, (byte) 0x7c, (byte) 0xda, (byte) 0xd1, (byte) 0xa6, (byte) 0x09,
|
||
|
+ (byte) 0x3e, (byte) 0x2d, (byte) 0x6c, (byte) 0xd4, (byte) 0x04, (byte) 0x9f, (byte) 0xb6,
|
||
|
+ (byte) 0xb7, (byte) 0x6a, (byte) 0x82, (byte) 0x4f, (byte) 0xab, (byte) 0x9c, (byte) 0x35,
|
||
|
+ (byte) 0xc1, (byte) 0xa7, (byte) 0xc5, (byte) 0xee, (byte) 0x9a, (byte) 0xe0, (byte) 0xd3,
|
||
|
+ (byte) 0x9a, (byte) 0x87, (byte) 0x4d, (byte) 0xf0, (byte) 0x69, (byte) 0xe9, (byte) 0xcb
|
||
|
+ };
|
||
|
+ checkSynth(
|
||
|
+ /*
|
||
|
+ * // The stream consists of word "categories" with all possible transforms.
|
||
|
+ * main_header
|
||
|
+ * metablock_header_easy: 1533, 1
|
||
|
+ * command_easy: 10, "|", 2 // = 0 << 10 + 1 + 1
|
||
|
+ * command_easy: 10, "|", 1037 // = 1 << 10 + 1 + 12
|
||
|
+ * command_easy: 10, "|", 2073 // = 2 << 10 + 1 + 24
|
||
|
+ * command_easy: 10, "|", 3110 // = 3 << 10 + 1 + 37
|
||
|
+ * command_easy: 10, "|", 4144 // = 4 << 10 + 1 + 47
|
||
|
+ * command_easy: 10, "|", 5180 // = 5 << 10 + 1 + 59
|
||
|
+ * command_easy: 10, "|", 6220 // = 6 << 10 + 1 + 75
|
||
|
+ * command_easy: 10, "|", 7256 // = 7 << 10 + 1 + 87
|
||
|
+ * command_easy: 10, "|", 8294 // = 8 << 10 + 1 + 101
|
||
|
+ * command_easy: 10, "|", 9333 // = 9 << 10 + 1 + 116
|
||
|
+ * command_easy: 10, "|", 10368 // = 10 << 10 + 1 + 127
|
||
|
+ * command_easy: 10, "|", 11408 // = 11 << 10 + 1 + 143
|
||
|
+ * command_easy: 10, "|", 12441 // = 12 << 10 + 1 + 152
|
||
|
+ * command_easy: 10, "|", 13475 // = 13 << 10 + 1 + 162
|
||
|
+ * command_easy: 10, "|", 14513 // = 14 << 10 + 1 + 176
|
||
|
+ * command_easy: 10, "|", 15550 // = 15 << 10 + 1 + 189
|
||
|
+ * command_easy: 10, "|", 16587 // = 16 << 10 + 1 + 202
|
||
|
+ * command_easy: 10, "|", 17626 // = 17 << 10 + 1 + 217
|
||
|
+ * command_easy: 10, "|", 18665 // = 18 << 10 + 1 + 232
|
||
|
+ * command_easy: 10, "|", 19703 // = 19 << 10 + 1 + 246
|
||
|
+ * command_easy: 10, "|", 20739 // = 20 << 10 + 1 + 258
|
||
|
+ * command_easy: 10, "|", 21775 // = 21 << 10 + 1 + 270
|
||
|
+ * command_easy: 10, "|", 22812 // = 22 << 10 + 1 + 283
|
||
|
+ * command_easy: 10, "|", 23848 // = 23 << 10 + 1 + 295
|
||
|
+ * command_easy: 10, "|", 24880 // = 24 << 10 + 1 + 303
|
||
|
+ * command_easy: 10, "|", 25916 // = 25 << 10 + 1 + 315
|
||
|
+ * command_easy: 10, "|", 26956 // = 26 << 10 + 1 + 331
|
||
|
+ * command_easy: 10, "|", 27988 // = 27 << 10 + 1 + 339
|
||
|
+ * command_easy: 10, "|", 29021 // = 28 << 10 + 1 + 348
|
||
|
+ * command_easy: 10, "|", 30059 // = 29 << 10 + 1 + 362
|
||
|
+ * command_easy: 10, "|", 31100 // = 30 << 10 + 1 + 379
|
||
|
+ * command_easy: 10, "|", 32136 // = 31 << 10 + 1 + 391
|
||
|
+ * command_easy: 10, "|", 33173 // = 32 << 10 + 1 + 404
|
||
|
+ * command_easy: 10, "|", 34209 // = 33 << 10 + 1 + 416
|
||
|
+ * command_easy: 10, "|", 35247 // = 34 << 10 + 1 + 430
|
||
|
+ * command_easy: 10, "|", 36278 // = 35 << 10 + 1 + 437
|
||
|
+ * command_easy: 10, "|", 37319 // = 36 << 10 + 1 + 454
|
||
|
+ * command_easy: 10, "|", 38355 // = 37 << 10 + 1 + 466
|
||
|
+ * command_easy: 10, "|", 39396 // = 38 << 10 + 1 + 483
|
||
|
+ * command_easy: 10, "|", 40435 // = 39 << 10 + 1 + 498
|
||
|
+ * command_easy: 10, "|", 41465 // = 40 << 10 + 1 + 504
|
||
|
+ * command_easy: 10, "|", 42494 // = 41 << 10 + 1 + 509
|
||
|
+ * command_easy: 10, "|", 43534 // = 42 << 10 + 1 + 525
|
||
|
+ * command_easy: 10, "|", 44565 // = 43 << 10 + 1 + 532
|
||
|
+ * command_easy: 10, "|", 45606 // = 44 << 10 + 1 + 549
|
||
|
+ * command_easy: 10, "|", 46641 // = 45 << 10 + 1 + 560
|
||
|
+ * command_easy: 10, "|", 47680 // = 46 << 10 + 1 + 575
|
||
|
+ * command_easy: 10, "|", 48719 // = 47 << 10 + 1 + 590
|
||
|
+ * command_easy: 10, "|", 49758 // = 48 << 10 + 1 + 605
|
||
|
+ * command_easy: 10, "|", 50786 // = 49 << 10 + 1 + 609
|
||
|
+ * command_easy: 10, "|", 51824 // = 50 << 10 + 1 + 623
|
||
|
+ * command_easy: 10, "|", 52861 // = 51 << 10 + 1 + 636
|
||
|
+ * command_easy: 10, "|", 53897 // = 52 << 10 + 1 + 648
|
||
|
+ * command_easy: 10, "|", 54935 // = 53 << 10 + 1 + 662
|
||
|
+ * command_easy: 10, "|", 55973 // = 54 << 10 + 1 + 676
|
||
|
+ * command_easy: 10, "|", 56999 // = 55 << 10 + 1 + 678
|
||
|
+ * command_easy: 10, "|", 58027 // = 56 << 10 + 1 + 682
|
||
|
+ * command_easy: 10, "|", 59056 // = 57 << 10 + 1 + 687
|
||
|
+ * command_easy: 10, "|", 60092 // = 58 << 10 + 1 + 699
|
||
|
+ * command_easy: 10, "|", 61129 // = 59 << 10 + 1 + 712
|
||
|
+ * command_easy: 10, "|", 62156 // = 60 << 10 + 1 + 715
|
||
|
+ * command_easy: 10, "|", 63195 // = 61 << 10 + 1 + 730
|
||
|
+ * command_easy: 10, "|", 64233 // = 62 << 10 + 1 + 744
|
||
|
+ * command_easy: 10, "|", 65277 // = 63 << 10 + 1 + 764
|
||
|
+ * command_easy: 10, "|", 66307 // = 64 << 10 + 1 + 770
|
||
|
+ * command_easy: 10, "|", 67333 // = 65 << 10 + 1 + 772
|
||
|
+ * command_easy: 10, "|", 68371 // = 66 << 10 + 1 + 786
|
||
|
+ * command_easy: 10, "|", 69407 // = 67 << 10 + 1 + 798
|
||
|
+ * command_easy: 10, "|", 70444 // = 68 << 10 + 1 + 811
|
||
|
+ * command_easy: 10, "|", 71480 // = 69 << 10 + 1 + 823
|
||
|
+ * command_easy: 10, "|", 72517 // = 70 << 10 + 1 + 836
|
||
|
+ * command_easy: 10, "|", 73554 // = 71 << 10 + 1 + 849
|
||
|
+ * command_easy: 10, "|", 74591 // = 72 << 10 + 1 + 862
|
||
|
+ * command_easy: 10, "|", 75631 // = 73 << 10 + 1 + 878
|
||
|
+ * command_easy: 10, "|", 76679 // = 74 << 10 + 1 + 902
|
||
|
+ * command_easy: 10, "|", 77715 // = 75 << 10 + 1 + 914
|
||
|
+ * command_easy: 10, "|", 78757 // = 76 << 10 + 1 + 932
|
||
|
+ * command_easy: 10, "|", 79793 // = 77 << 10 + 1 + 944
|
||
|
+ * command_easy: 10, "|", 80830 // = 78 << 10 + 1 + 957
|
||
|
+ * command_easy: 10, "|", 81866 // = 79 << 10 + 1 + 969
|
||
|
+ * command_easy: 10, "|", 82902 // = 80 << 10 + 1 + 981
|
||
|
+ * command_easy: 10, "|", 83942 // = 81 << 10 + 1 + 997
|
||
|
+ * command_easy: 10, "|", 84980 // = 82 << 10 + 1 + 1011
|
||
|
+ * command_easy: 10, "|", 86018 // = 83 << 10 + 1 + 1025
|
||
|
+ * command_easy: 10, "|", 87055 // = 84 << 10 + 1 + 1038
|
||
|
+ * command_easy: 10, "|", 88093 // = 85 << 10 + 1 + 1052
|
||
|
+ * command_easy: 10, "|", 89129 // = 86 << 10 + 1 + 1064
|
||
|
+ * command_easy: 10, "|", 90166 // = 87 << 10 + 1 + 1077
|
||
|
+ * command_easy: 10, "|", 91202 // = 88 << 10 + 1 + 1089
|
||
|
+ * command_easy: 10, "|", 92239 // = 89 << 10 + 1 + 1102
|
||
|
+ * command_easy: 10, "|", 93276 // = 90 << 10 + 1 + 1115
|
||
|
+ * command_easy: 10, "|", 94315 // = 91 << 10 + 1 + 1130
|
||
|
+ * command_easy: 10, "|", 95353 // = 92 << 10 + 1 + 1144
|
||
|
+ * command_easy: 10, "|", 96392 // = 93 << 10 + 1 + 1159
|
||
|
+ * command_easy: 10, "|", 97432 // = 94 << 10 + 1 + 1175
|
||
|
+ * command_easy: 10, "|", 98468 // = 95 << 10 + 1 + 1187
|
||
|
+ * command_easy: 10, "|", 99507 // = 96 << 10 + 1 + 1202
|
||
|
+ * command_easy: 10, "|", 100544 // = 97 << 10 + 1 + 1215
|
||
|
+ * command_easy: 10, "|", 101581 // = 98 << 10 + 1 + 1228
|
||
|
+ * command_easy: 10, "|", 102619 // = 99 << 10 + 1 + 1242
|
||
|
+ * command_easy: 10, "|", 103655 // = 100 << 10 + 1 + 1254
|
||
|
+ * command_easy: 10, "|", 104694 // = 101 << 10 + 1 + 1269
|
||
|
+ * command_easy: 10, "|", 105730 // = 102 << 10 + 1 + 1281
|
||
|
+ * command_easy: 10, "|", 106767 // = 103 << 10 + 1 + 1294
|
||
|
+ * command_easy: 10, "|", 107804 // = 104 << 10 + 1 + 1307
|
||
|
+ * command_easy: 10, "|", 108841 // = 105 << 10 + 1 + 1320
|
||
|
+ * command_easy: 10, "|", 109878 // = 106 << 10 + 1 + 1333
|
||
|
+ * command_easy: 10, "|", 110917 // = 107 << 10 + 1 + 1348
|
||
|
+ * command_easy: 10, "|", 111954 // = 108 << 10 + 1 + 1361
|
||
|
+ * command_easy: 10, "|", 112991 // = 109 << 10 + 1 + 1374
|
||
|
+ * command_easy: 10, "|", 114028 // = 110 << 10 + 1 + 1387
|
||
|
+ * command_easy: 10, "|", 115066 // = 111 << 10 + 1 + 1401
|
||
|
+ * command_easy: 10, "|", 116104 // = 112 << 10 + 1 + 1415
|
||
|
+ * command_easy: 10, "|", 117140 // = 113 << 10 + 1 + 1427
|
||
|
+ * command_easy: 10, "|", 118176 // = 114 << 10 + 1 + 1439
|
||
|
+ * command_easy: 10, "|", 119213 // = 115 << 10 + 1 + 1452
|
||
|
+ * command_easy: 10, "|", 120250 // = 116 << 10 + 1 + 1465
|
||
|
+ * command_easy: 10, "|", 121287 // = 117 << 10 + 1 + 1478
|
||
|
+ * command_easy: 10, "|", 122325 // = 118 << 10 + 1 + 1492
|
||
|
+ * command_easy: 10, "|", 123363 // = 119 << 10 + 1 + 1506
|
||
|
+ * command_easy: 10, "|", 124401 // = 120 << 10 + 1 + 1520
|
||
|
+ */
|
||
|
+ compressed,
|
||
|
+ true,
|
||
|
+ "|categories|categories | categories |ategories|Categories |categories the | categories|s cat"
|
||
|
+ + "egories |categories of |Categories|categories and |tegories|categorie|, categories |catego"
|
||
|
+ + "ries, | Categories |categories in |categories to |e categories |categories\"|categories.|c"
|
||
|
+ + "ategories\">|categories\n|categor|categories]|categories for |egories|categori|categories "
|
||
|
+ + "a |categories that | Categories|categories. |.categories| categories, |gories|categories w"
|
||
|
+ + "ith |categories'|categories from |categories by |ories|ries| the categories|catego|categor"
|
||
|
+ + "ies. The |CATEGORIES|categories on |categories as |categories is |cat|categorieing |catego"
|
||
|
+ + "ries\n\t|categories:| categories. |categoriesed |s|ies|cate|categories(|Categories, |ca|ca"
|
||
|
+ + "tegories at |categoriesly | the categories of |categ|c| Categories, |Categories\"|.categor"
|
||
|
+ + "ies(|CATEGORIES |Categories\">|categories=\"| categories.|.com/categories| the categories "
|
||
|
+ + "of the |Categories'|categories. This |categories,|.categories |Categories(|Categories.|cat"
|
||
|
+ + "egories not | categories=\"|categorieser | CATEGORIES |categoriesal | CATEGORIES|categorie"
|
||
|
+ + "s='|CATEGORIES\"|Categories. | categories(|categoriesful | Categories. |categoriesive |cat"
|
||
|
+ + "egoriesless |CATEGORIES'|categoriesest | Categories.|CATEGORIES\">| categories='|Categorie"
|
||
|
+ + "s,|categoriesize |CATEGORIES.|\302\240categories| categories,|Categories=\"|CATEGORIES="
|
||
|
+ + "\"|categoriesous |CATEGORIES, |Categories='| Categories,| CATEGORIES=\"| CATEGORIES, |CATE"
|
||
|
+ + "GORIES,|CATEGORIES(|CATEGORIES. | CATEGORIES.|CATEGORIES='| CATEGORIES. | Categories=\"| C"
|
||
|
+ + "ATEGORIES='| Categories='"
|
||
|
+ );
|
||
|
+ }
|
||
|
+
|
||
|
+ @Test
|
||
|
+ public void testAllTransforms4() {
|
||
|
+ byte[] compressed = {
|
||
|
+ (byte) 0x1b, (byte) 0x40, (byte) 0x03, (byte) 0x00, (byte) 0x00, (byte) 0x00, (byte) 0x80,
|
||
|
+ (byte) 0xe3, (byte) 0xb4, (byte) 0x0d, (byte) 0x00, (byte) 0x00, (byte) 0x07, (byte) 0x5b,
|
||
|
+ (byte) 0x26, (byte) 0x31, (byte) 0x40, (byte) 0x02, (byte) 0x00, (byte) 0xe0, (byte) 0x4e,
|
||
|
+ (byte) 0x1b, (byte) 0x51, (byte) 0x3e, (byte) 0x42, (byte) 0x51, (byte) 0x3e, (byte) 0x81,
|
||
|
+ (byte) 0x02, (byte) 0x51, (byte) 0x3e, (byte) 0x11, (byte) 0x04, (byte) 0xa2, (byte) 0x7c,
|
||
|
+ (byte) 0xe2, (byte) 0x0b, (byte) 0x44, (byte) 0xf9, (byte) 0x24, (byte) 0x1b, (byte) 0x10,
|
||
|
+ (byte) 0xe5, (byte) 0x93, (byte) 0x84, (byte) 0x50, (byte) 0x94, (byte) 0x4f, (byte) 0xba,
|
||
|
+ (byte) 0x02, (byte) 0x51, (byte) 0x3e, (byte) 0x69, (byte) 0x0c, (byte) 0x45, (byte) 0xf9,
|
||
|
+ (byte) 0x64, (byte) 0x39, (byte) 0x20, (byte) 0xca, (byte) 0x27, (byte) 0x13, (byte) 0x22,
|
||
|
+ (byte) 0x51, (byte) 0x3e, (byte) 0xd9, (byte) 0x11, (byte) 0x8a, (byte) 0xf2, (byte) 0xc9,
|
||
|
+ (byte) 0xa2, (byte) 0x58, (byte) 0x94, (byte) 0x4f, (byte) 0x4e, (byte) 0x05, (byte) 0xa2,
|
||
|
+ (byte) 0x7c, (byte) 0x72, (byte) 0x2c, (byte) 0x12, (byte) 0xe5, (byte) 0x93, (byte) 0x83,
|
||
|
+ (byte) 0xa1, (byte) 0x28, (byte) 0x9f, (byte) 0xfc, (byte) 0x8c, (byte) 0x45, (byte) 0xf9,
|
||
|
+ (byte) 0x14, (byte) 0x6e, (byte) 0x40, (byte) 0x94, (byte) 0x4f, (byte) 0x71, (byte) 0x47,
|
||
|
+ (byte) 0x44, (byte) 0xf9, (byte) 0x14, (byte) 0x80, (byte) 0x48, (byte) 0x94, (byte) 0x4f,
|
||
|
+ (byte) 0x81, (byte) 0xc8, (byte) 0x44, (byte) 0xf9, (byte) 0x14, (byte) 0x8e, (byte) 0x50,
|
||
|
+ (byte) 0x94, (byte) 0x4f, (byte) 0x41, (byte) 0x49, (byte) 0x45, (byte) 0xf9, (byte) 0x14,
|
||
|
+ (byte) 0x9b, (byte) 0x58, (byte) 0x94, (byte) 0x4f, (byte) 0x11, (byte) 0xca, (byte) 0x45,
|
||
|
+ (byte) 0xf9, (byte) 0x94, (byte) 0xa3, (byte) 0x40, (byte) 0x94, (byte) 0x4f, (byte) 0x99,
|
||
|
+ (byte) 0x4a, (byte) 0x44, (byte) 0xf9, (byte) 0x94, (byte) 0xb3, (byte) 0x48, (byte) 0x94,
|
||
|
+ (byte) 0x4f, (byte) 0x59, (byte) 0xcb, (byte) 0x44, (byte) 0xf9, (byte) 0x94, (byte) 0xb8,
|
||
|
+ (byte) 0x50, (byte) 0x94, (byte) 0x4f, (byte) 0x09, (byte) 0x4c, (byte) 0x45, (byte) 0xf9,
|
||
|
+ (byte) 0x94, (byte) 0xcb, (byte) 0x58, (byte) 0x94, (byte) 0x4f, (byte) 0x19, (byte) 0xcd,
|
||
|
+ (byte) 0x45, (byte) 0xf9, (byte) 0x54, (byte) 0xd8, (byte) 0x80, (byte) 0x28, (byte) 0x9f,
|
||
|
+ (byte) 0xca, (byte) 0x9b, (byte) 0x10, (byte) 0xe5, (byte) 0x53, (byte) 0x99, (byte) 0x23,
|
||
|
+ (byte) 0xa2, (byte) 0x7c, (byte) 0xaa, (byte) 0x73, (byte) 0x46, (byte) 0x94, (byte) 0x4f,
|
||
|
+ (byte) 0x25, (byte) 0x0f, (byte) 0x89, (byte) 0xf2, (byte) 0xa9, (byte) 0xf0, (byte) 0x29,
|
||
|
+ (byte) 0x51, (byte) 0x3e, (byte) 0xd5, (byte) 0x40, (byte) 0x26, (byte) 0xca, (byte) 0xa7,
|
||
|
+ (byte) 0x62, (byte) 0xe8, (byte) 0x44, (byte) 0xf9, (byte) 0x54, (byte) 0x0d, (byte) 0xa1,
|
||
|
+ (byte) 0x28, (byte) 0x9f, (byte) 0xca, (byte) 0xa1, (byte) 0x14, (byte) 0xe5, (byte) 0x53,
|
||
|
+ (byte) 0x61, (byte) 0xa4, (byte) 0xa2, (byte) 0x7c, (byte) 0xaa, (byte) 0x8c, (byte) 0x56,
|
||
|
+ (byte) 0x94, (byte) 0x4f, (byte) 0x45, (byte) 0x12, (byte) 0x8b, (byte) 0xf2, (byte) 0xa9,
|
||
|
+ (byte) 0x52, (byte) 0x6a, (byte) 0x51, (byte) 0x3e, (byte) 0x95, (byte) 0x4c, (byte) 0x2e,
|
||
|
+ (byte) 0xca, (byte) 0xa7, (byte) 0xda, (byte) 0xe9, (byte) 0x45, (byte) 0xf9, (byte) 0xd4,
|
||
|
+ (byte) 0x44, (byte) 0x81, (byte) 0x28, (byte) 0x9f, (byte) 0xba, (byte) 0xa8, (byte) 0x10,
|
||
|
+ (byte) 0xe5, (byte) 0x53, (byte) 0x37, (byte) 0x25, (byte) 0xa2, (byte) 0x7c, (byte) 0x6a,
|
||
|
+ (byte) 0xaa, (byte) 0x46, (byte) 0x94, (byte) 0x4f, (byte) 0xad, (byte) 0x15, (byte) 0x89,
|
||
|
+ (byte) 0xf2, (byte) 0xa9, (byte) 0xc5, (byte) 0x2a, (byte) 0x51, (byte) 0x3e, (byte) 0xb5,
|
||
|
+ (byte) 0x5a, (byte) 0x26, (byte) 0xca, (byte) 0xa7, (byte) 0x5e, (byte) 0xeb, (byte) 0x44,
|
||
|
+ (byte) 0xf9, (byte) 0xd4, (byte) 0x6c, (byte) 0xa1, (byte) 0x28, (byte) 0x9f, (byte) 0xba,
|
||
|
+ (byte) 0xad, (byte) 0x14, (byte) 0xe5, (byte) 0x53, (byte) 0xcf, (byte) 0xa5, (byte) 0xa2,
|
||
|
+ (byte) 0x7c, (byte) 0x6a, (byte) 0xbd, (byte) 0x56, (byte) 0x94, (byte) 0x4f, (byte) 0xbd,
|
||
|
+ (byte) 0x17, (byte) 0x8b, (byte) 0xf2, (byte) 0xa9, (byte) 0x09, (byte) 0x6b, (byte) 0x51,
|
||
|
+ (byte) 0x3e, (byte) 0x35, (byte) 0x63, (byte) 0x2e, (byte) 0xca, (byte) 0xa7, (byte) 0xd6,
|
||
|
+ (byte) 0xec, (byte) 0x45, (byte) 0xf9, (byte) 0x34, (byte) 0x9b, (byte) 0x01, (byte) 0x51,
|
||
|
+ (byte) 0x3e, (byte) 0x0d, (byte) 0x67, (byte) 0x41, (byte) 0x94, (byte) 0x4f, (byte) 0x43,
|
||
|
+ (byte) 0x9a, (byte) 0x10, (byte) 0xe5, (byte) 0xd3, (byte) 0xa8, (byte) 0x36, (byte) 0x44,
|
||
|
+ (byte) 0xf9, (byte) 0x34, (byte) 0xb1, (byte) 0x11, (byte) 0x51, (byte) 0x3e, (byte) 0xcd,
|
||
|
+ (byte) 0x6d, (byte) 0x45, (byte) 0x94, (byte) 0x4f, (byte) 0xe3, (byte) 0x9b, (byte) 0x11,
|
||
|
+ (byte) 0xe5, (byte) 0xd3, (byte) 0x14, (byte) 0x77, (byte) 0x44, (byte) 0xf9, (byte) 0x34,
|
||
|
+ (byte) 0xcc, (byte) 0x21, (byte) 0x51, (byte) 0x3e, (byte) 0x8d, (byte) 0x75, (byte) 0x49,
|
||
|
+ (byte) 0x94, (byte) 0x4f, (byte) 0x83, (byte) 0x9e, (byte) 0x12, (byte) 0xe5, (byte) 0xd3,
|
||
|
+ (byte) 0xb8, (byte) 0xb7, (byte) 0x44, (byte) 0xf9, (byte) 0x34, (byte) 0xfa, (byte) 0x31,
|
||
|
+ (byte) 0x51, (byte) 0x3e, (byte) 0x0d, (byte) 0x80, (byte) 0x4d, (byte) 0x94, (byte) 0x4f,
|
||
|
+ (byte) 0x73, (byte) 0xa0, (byte) 0x13, (byte) 0xe5, (byte) 0xd3, (byte) 0x34, (byte) 0xf8,
|
||
|
+ (byte) 0x44, (byte) 0xf9, (byte) 0x34, (byte) 0x13, (byte) 0x42, (byte) 0x51, (byte) 0x3e,
|
||
|
+ (byte) 0x4d, (byte) 0x87, (byte) 0x51, (byte) 0x94, (byte) 0x4f, (byte) 0x53, (byte) 0xa2,
|
||
|
+ (byte) 0x14, (byte) 0xe5, (byte) 0xd3, (byte) 0xb4, (byte) 0x38, (byte) 0x45, (byte) 0xf9,
|
||
|
+ (byte) 0x34, (byte) 0x34, (byte) 0x52, (byte) 0x51, (byte) 0x3e, (byte) 0x0d, (byte) 0x8f,
|
||
|
+ (byte) 0x55, (byte) 0x94, (byte) 0x4f, (byte) 0x23, (byte) 0xa4, (byte) 0x15, (byte) 0xe5,
|
||
|
+ (byte) 0xd3, (byte) 0x24, (byte) 0x79, (byte) 0x45, (byte) 0xf9, (byte) 0x34, (byte) 0x4f,
|
||
|
+ (byte) 0x62, (byte) 0x51, (byte) 0x3e, (byte) 0x8d, (byte) 0x95, (byte) 0x59, (byte) 0x94,
|
||
|
+ (byte) 0x4f, (byte) 0xd3, (byte) 0xa5, (byte) 0x16, (byte) 0xe5, (byte) 0xd3, (byte) 0x98,
|
||
|
+ (byte) 0xb9, (byte) 0x45, (byte) 0xf9, (byte) 0x34, (byte) 0x6e, (byte) 0x72, (byte) 0x51,
|
||
|
+ (byte) 0x3e, (byte) 0xcd, (byte) 0x9d, (byte) 0x5d, (byte) 0x94, (byte) 0x4f, (byte) 0x13,
|
||
|
+ (byte) 0xa8, (byte) 0x17, (byte) 0xe5, (byte) 0xd3, (byte) 0x1c, (byte) 0xfa, (byte) 0x45,
|
||
|
+ (byte) 0xf9, (byte) 0xb4, (byte) 0x90, (byte) 0x02, (byte) 0x51, (byte) 0x3e, (byte) 0xed,
|
||
|
+ (byte) 0xa5, (byte) 0x41, (byte) 0x94, (byte) 0x4f, (byte) 0xeb, (byte) 0xa9, (byte) 0x10,
|
||
|
+ (byte) 0xe5, (byte) 0xd3, (byte) 0x9a, (byte) 0x3a, (byte) 0x44, (byte) 0xf9, (byte) 0xb4,
|
||
|
+ (byte) 0xac, (byte) 0x12, (byte) 0x51, (byte) 0x3e, (byte) 0x6d, (byte) 0xad, (byte) 0x45,
|
||
|
+ (byte) 0x94, (byte) 0x4f, (byte) 0xbb, (byte) 0xab, (byte) 0x11, (byte) 0xe5, (byte) 0xd3,
|
||
|
+ (byte) 0x0a, (byte) 0x7b, (byte) 0x44, (byte) 0xf9, (byte) 0xb4, (byte) 0xc9, (byte) 0x22,
|
||
|
+ (byte) 0x51, (byte) 0x3e, (byte) 0x2d, (byte) 0xb4, (byte) 0x49, (byte) 0x94, (byte) 0x4f,
|
||
|
+ (byte) 0x7b, (byte) 0xad, (byte) 0x12, (byte) 0xe5, (byte) 0xd3, (byte) 0x82, (byte) 0xbb,
|
||
|
+ (byte) 0x44, (byte) 0xf9, (byte) 0xb4, (byte) 0xe7, (byte) 0x32, (byte) 0x51, (byte) 0x3e,
|
||
|
+ (byte) 0xad, (byte) 0xbb, (byte) 0x4d, (byte) 0x94, (byte) 0x4f, (byte) 0x5b, (byte) 0xaf,
|
||
|
+ (byte) 0x13, (byte) 0xe5, (byte) 0xd3, (byte) 0xf6, (byte) 0xfb, (byte) 0x44, (byte) 0xf9,
|
||
|
+ (byte) 0xb4, (byte) 0x05, (byte) 0x43, (byte) 0x51, (byte) 0x3e, (byte) 0xed, (byte) 0xc2,
|
||
|
+ (byte) 0x51, (byte) 0x94, (byte) 0x4f, (byte) 0x1b, (byte) 0xb1, (byte) 0x14, (byte) 0xe5,
|
||
|
+ (byte) 0xd3, (byte) 0x62, (byte) 0x3c, (byte) 0x45, (byte) 0xf9, (byte) 0xb4, (byte) 0x1f,
|
||
|
+ (byte) 0x53, (byte) 0x51, (byte) 0x3e, (byte) 0xad, (byte) 0xc9, (byte) 0x55, (byte) 0x94,
|
||
|
+ (byte) 0x4f, (byte) 0xeb, (byte) 0xb2, (byte) 0x15, (byte) 0xe5, (byte) 0xd3, (byte) 0xda,
|
||
|
+ (byte) 0x7c, (byte) 0x45, (byte) 0xf9, (byte) 0xb4, (byte) 0x3e, (byte) 0x63
|
||
|
+ };
|
||
|
+ checkSynth(
|
||
|
+ /*
|
||
|
+ * // The stream consists of word "time" with all possible transforms.
|
||
|
+ * main_header
|
||
|
+ * metablock_header_easy: 833, 1
|
||
|
+ * command_easy: 4, "|", 2 // = 0 << 10 + 1 + 1
|
||
|
+ * command_easy: 4, "|", 1031 // = 1 << 10 + 1 + 6
|
||
|
+ * command_easy: 4, "|", 2061 // = 2 << 10 + 1 + 12
|
||
|
+ * command_easy: 4, "|", 3092 // = 3 << 10 + 1 + 19
|
||
|
+ * command_easy: 4, "|", 4120 // = 4 << 10 + 1 + 23
|
||
|
+ * command_easy: 4, "|", 5150 // = 5 << 10 + 1 + 29
|
||
|
+ * command_easy: 4, "|", 6184 // = 6 << 10 + 1 + 39
|
||
|
+ * command_easy: 4, "|", 7214 // = 7 << 10 + 1 + 45
|
||
|
+ * command_easy: 4, "|", 8246 // = 8 << 10 + 1 + 53
|
||
|
+ * command_easy: 4, "|", 9279 // = 9 << 10 + 1 + 62
|
||
|
+ * command_easy: 4, "|", 10308 // = 10 << 10 + 1 + 67
|
||
|
+ * command_easy: 4, "|", 11342 // = 11 << 10 + 1 + 77
|
||
|
+ * command_easy: 4, "|", 12369 // = 12 << 10 + 1 + 80
|
||
|
+ * command_easy: 4, "|", 13397 // = 13 << 10 + 1 + 84
|
||
|
+ * command_easy: 4, "|", 14429 // = 14 << 10 + 1 + 92
|
||
|
+ * command_easy: 4, "|", 15460 // = 15 << 10 + 1 + 99
|
||
|
+ * command_easy: 4, "|", 16491 // = 16 << 10 + 1 + 106
|
||
|
+ * command_easy: 4, "|", 17524 // = 17 << 10 + 1 + 115
|
||
|
+ * command_easy: 4, "|", 18557 // = 18 << 10 + 1 + 124
|
||
|
+ * command_easy: 4, "|", 19589 // = 19 << 10 + 1 + 132
|
||
|
+ * command_easy: 4, "|", 20619 // = 20 << 10 + 1 + 138
|
||
|
+ * command_easy: 4, "|", 21649 // = 21 << 10 + 1 + 144
|
||
|
+ * command_easy: 4, "|", 22680 // = 22 << 10 + 1 + 151
|
||
|
+ * command_easy: 4, "|", 23710 // = 23 << 10 + 1 + 157
|
||
|
+ * command_easy: 4, "|", 24736 // = 24 << 10 + 1 + 159
|
||
|
+ * command_easy: 4, "|", 25766 // = 25 << 10 + 1 + 165
|
||
|
+ * command_easy: 4, "|", 26800 // = 26 << 10 + 1 + 175
|
||
|
+ * command_easy: 4, "|", 27826 // = 27 << 10 + 1 + 177
|
||
|
+ * command_easy: 4, "|", 28853 // = 28 << 10 + 1 + 180
|
||
|
+ * command_easy: 4, "|", 29885 // = 29 << 10 + 1 + 188
|
||
|
+ * command_easy: 4, "|", 30920 // = 30 << 10 + 1 + 199
|
||
|
+ * command_easy: 4, "|", 31950 // = 31 << 10 + 1 + 205
|
||
|
+ * command_easy: 4, "|", 32981 // = 32 << 10 + 1 + 212
|
||
|
+ * command_easy: 4, "|", 34011 // = 33 << 10 + 1 + 218
|
||
|
+ * command_easy: 4, "|", 35043 // = 34 << 10 + 1 + 226
|
||
|
+ * command_easy: 4, "|", 36068 // = 35 << 10 + 1 + 227
|
||
|
+ * command_easy: 4, "|", 37103 // = 36 << 10 + 1 + 238
|
||
|
+ * command_easy: 4, "|", 38133 // = 37 << 10 + 1 + 244
|
||
|
+ * command_easy: 4, "|", 39168 // = 38 << 10 + 1 + 255
|
||
|
+ * command_easy: 4, "|", 40201 // = 39 << 10 + 1 + 264
|
||
|
+ * command_easy: 4, "|", 41226 // = 40 << 10 + 1 + 265
|
||
|
+ * command_easy: 4, "|", 42251 // = 41 << 10 + 1 + 266
|
||
|
+ * command_easy: 4, "|", 43285 // = 42 << 10 + 1 + 276
|
||
|
+ * command_easy: 4, "|", 44310 // = 43 << 10 + 1 + 277
|
||
|
+ * command_easy: 4, "|", 45345 // = 44 << 10 + 1 + 288
|
||
|
+ * command_easy: 4, "|", 46374 // = 45 << 10 + 1 + 293
|
||
|
+ * command_easy: 4, "|", 47407 // = 46 << 10 + 1 + 302
|
||
|
+ * command_easy: 4, "|", 48440 // = 47 << 10 + 1 + 311
|
||
|
+ * command_easy: 4, "|", 49473 // = 48 << 10 + 1 + 320
|
||
|
+ * command_easy: 4, "|", 50498 // = 49 << 10 + 1 + 321
|
||
|
+ * command_easy: 4, "|", 51530 // = 50 << 10 + 1 + 329
|
||
|
+ * command_easy: 4, "|", 52561 // = 51 << 10 + 1 + 336
|
||
|
+ * command_easy: 4, "|", 53591 // = 52 << 10 + 1 + 342
|
||
|
+ * command_easy: 4, "|", 54623 // = 53 << 10 + 1 + 350
|
||
|
+ * command_easy: 4, "|", 55655 // = 54 << 10 + 1 + 358
|
||
|
+ * command_easy: 4, "|", 56680 // = 55 << 10 + 1 + 359
|
||
|
+ * command_easy: 4, "|", 57705 // = 56 << 10 + 1 + 360
|
||
|
+ * command_easy: 4, "|", 58730 // = 57 << 10 + 1 + 361
|
||
|
+ * command_easy: 4, "|", 59760 // = 58 << 10 + 1 + 367
|
||
|
+ * command_easy: 4, "|", 60791 // = 59 << 10 + 1 + 374
|
||
|
+ * command_easy: 4, "|", 61816 // = 60 << 10 + 1 + 375
|
||
|
+ * command_easy: 4, "|", 62849 // = 61 << 10 + 1 + 384
|
||
|
+ * command_easy: 4, "|", 63881 // = 62 << 10 + 1 + 392
|
||
|
+ * command_easy: 4, "|", 64919 // = 63 << 10 + 1 + 406
|
||
|
+ * command_easy: 4, "|", 65944 // = 64 << 10 + 1 + 407
|
||
|
+ * command_easy: 4, "|", 66969 // = 65 << 10 + 1 + 408
|
||
|
+ * command_easy: 4, "|", 68001 // = 66 << 10 + 1 + 416
|
||
|
+ * command_easy: 4, "|", 69031 // = 67 << 10 + 1 + 422
|
||
|
+ * command_easy: 4, "|", 70062 // = 68 << 10 + 1 + 429
|
||
|
+ * command_easy: 4, "|", 71092 // = 69 << 10 + 1 + 435
|
||
|
+ * command_easy: 4, "|", 72123 // = 70 << 10 + 1 + 442
|
||
|
+ * command_easy: 4, "|", 73154 // = 71 << 10 + 1 + 449
|
||
|
+ * command_easy: 4, "|", 74185 // = 72 << 10 + 1 + 456
|
||
|
+ * command_easy: 4, "|", 75219 // = 73 << 10 + 1 + 466
|
||
|
+ * command_easy: 4, "|", 76261 // = 74 << 10 + 1 + 484
|
||
|
+ * command_easy: 4, "|", 77291 // = 75 << 10 + 1 + 490
|
||
|
+ * command_easy: 4, "|", 78327 // = 76 << 10 + 1 + 502
|
||
|
+ * command_easy: 4, "|", 79357 // = 77 << 10 + 1 + 508
|
||
|
+ * command_easy: 4, "|", 80388 // = 78 << 10 + 1 + 515
|
||
|
+ * command_easy: 4, "|", 81418 // = 79 << 10 + 1 + 521
|
||
|
+ * command_easy: 4, "|", 82448 // = 80 << 10 + 1 + 527
|
||
|
+ * command_easy: 4, "|", 83482 // = 81 << 10 + 1 + 537
|
||
|
+ * command_easy: 4, "|", 84514 // = 82 << 10 + 1 + 545
|
||
|
+ * command_easy: 4, "|", 85546 // = 83 << 10 + 1 + 553
|
||
|
+ * command_easy: 4, "|", 86577 // = 84 << 10 + 1 + 560
|
||
|
+ * command_easy: 4, "|", 87609 // = 85 << 10 + 1 + 568
|
||
|
+ * command_easy: 4, "|", 88639 // = 86 << 10 + 1 + 574
|
||
|
+ * command_easy: 4, "|", 89670 // = 87 << 10 + 1 + 581
|
||
|
+ * command_easy: 4, "|", 90700 // = 88 << 10 + 1 + 587
|
||
|
+ * command_easy: 4, "|", 91731 // = 89 << 10 + 1 + 594
|
||
|
+ * command_easy: 4, "|", 92762 // = 90 << 10 + 1 + 601
|
||
|
+ * command_easy: 4, "|", 93795 // = 91 << 10 + 1 + 610
|
||
|
+ * command_easy: 4, "|", 94827 // = 92 << 10 + 1 + 618
|
||
|
+ * command_easy: 4, "|", 95860 // = 93 << 10 + 1 + 627
|
||
|
+ * command_easy: 4, "|", 96894 // = 94 << 10 + 1 + 637
|
||
|
+ * command_easy: 4, "|", 97924 // = 95 << 10 + 1 + 643
|
||
|
+ * command_easy: 4, "|", 98957 // = 96 << 10 + 1 + 652
|
||
|
+ * command_easy: 4, "|", 99988 // = 97 << 10 + 1 + 659
|
||
|
+ * command_easy: 4, "|", 101019 // = 98 << 10 + 1 + 666
|
||
|
+ * command_easy: 4, "|", 102051 // = 99 << 10 + 1 + 674
|
||
|
+ * command_easy: 4, "|", 103081 // = 100 << 10 + 1 + 680
|
||
|
+ * command_easy: 4, "|", 104114 // = 101 << 10 + 1 + 689
|
||
|
+ * command_easy: 4, "|", 105144 // = 102 << 10 + 1 + 695
|
||
|
+ * command_easy: 4, "|", 106175 // = 103 << 10 + 1 + 702
|
||
|
+ * command_easy: 4, "|", 107206 // = 104 << 10 + 1 + 709
|
||
|
+ * command_easy: 4, "|", 108237 // = 105 << 10 + 1 + 716
|
||
|
+ * command_easy: 4, "|", 109268 // = 106 << 10 + 1 + 723
|
||
|
+ * command_easy: 4, "|", 110301 // = 107 << 10 + 1 + 732
|
||
|
+ * command_easy: 4, "|", 111332 // = 108 << 10 + 1 + 739
|
||
|
+ * command_easy: 4, "|", 112363 // = 109 << 10 + 1 + 746
|
||
|
+ * command_easy: 4, "|", 113394 // = 110 << 10 + 1 + 753
|
||
|
+ * command_easy: 4, "|", 114426 // = 111 << 10 + 1 + 761
|
||
|
+ * command_easy: 4, "|", 115458 // = 112 << 10 + 1 + 769
|
||
|
+ * command_easy: 4, "|", 116488 // = 113 << 10 + 1 + 775
|
||
|
+ * command_easy: 4, "|", 117518 // = 114 << 10 + 1 + 781
|
||
|
+ * command_easy: 4, "|", 118549 // = 115 << 10 + 1 + 788
|
||
|
+ * command_easy: 4, "|", 119580 // = 116 << 10 + 1 + 795
|
||
|
+ * command_easy: 4, "|", 120611 // = 117 << 10 + 1 + 802
|
||
|
+ * command_easy: 4, "|", 121643 // = 118 << 10 + 1 + 810
|
||
|
+ * command_easy: 4, "|", 122675 // = 119 << 10 + 1 + 818
|
||
|
+ * command_easy: 4, "|", 123707 // = 120 << 10 + 1 + 826
|
||
|
+ */
|
||
|
+ compressed,
|
||
|
+ true,
|
||
|
+ "|time|time | time |ime|Time |time the | time|s time |time of |Time|time and |me|tim|, time |"
|
||
|
+ + "time, | Time |time in |time to |e time |time\"|time.|time\">|time\n|t|time]|time for |e|ti"
|
||
|
+ + "|time a |time that | Time|time. |.time| time, ||time with |time'|time from |time by ||| th"
|
||
|
+ + "e time||time. The |TIME|time on |time as |time is ||timing |time\n\t|time:| time. |timeed "
|
||
|
+ + "||||time(|Time, ||time at |timely | the time of ||| Time, |Time\"|.time(|TIME |Time\">|tim"
|
||
|
+ + "e=\"| time.|.com/time| the time of the |Time'|time. This |time,|.time |Time(|Time.|time no"
|
||
|
+ + "t | time=\"|timeer | TIME |timeal | TIME|time='|TIME\"|Time. | time(|timeful | Time. |time"
|
||
|
+ + "ive |timeless |TIME'|timeest | Time.|TIME\">| time='|Time,|timeize |TIME.|\302\240time| ti"
|
||
|
+ + "me,|Time=\"|TIME=\"|timeous |TIME, |Time='| Time,| TIME=\"| TIME, |TIME,|TIME(|TIME. | TIM"
|
||
|
+ + "E.|TIME='| TIME. | Time=\"| TIME='| Time='"
|
||
|
+ );
|
||
|
+ }
|
||
|
+
|
||
|
@Test
|
||
|
public void testBaseDictWord() {
|
||
|
byte[] compressed = {
|
||
|
@@ -446,6 +914,28 @@ public void testCopyLengthTooLong() {
|
||
|
);
|
||
|
}
|
||
|
|
||
|
+ @Test
|
||
|
+ public void testCopyTooLong() {
|
||
|
+ byte[] compressed = {
|
||
|
+ (byte) 0xa1, (byte) 0x08, (byte) 0x00, (byte) 0x00, (byte) 0x00, (byte) 0x00, (byte) 0x00,
|
||
|
+ (byte) 0x1c, (byte) 0xa7, (byte) 0x6d, (byte) 0x00, (byte) 0x00, (byte) 0x38, (byte) 0xd8,
|
||
|
+ (byte) 0x32, (byte) 0x89, (byte) 0x01, (byte) 0x12, (byte) 0x00, (byte) 0x00, (byte) 0x77,
|
||
|
+ (byte) 0xda, (byte) 0x34, (byte) 0xab, (byte) 0xdb, (byte) 0x50, (byte) 0x00
|
||
|
+ };
|
||
|
+ checkSynth(
|
||
|
+ /*
|
||
|
+ * // Has a copy length that goes over the end of the meta-block,
|
||
|
+ * // with a ringbuffer wrap.
|
||
|
+ * main_header: 10
|
||
|
+ * metablock_header_easy: 2, 1
|
||
|
+ * command_easy: 1024, "a", 1
|
||
|
+ */
|
||
|
+ compressed,
|
||
|
+ false,
|
||
|
+ ""
|
||
|
+ );
|
||
|
+ }
|
||
|
+
|
||
|
@Test
|
||
|
public void testCustomHuffmanCode() {
|
||
|
byte[] compressed = {
|
||
|
@@ -2199,6 +2689,23 @@ public void testSimplePrefixOutOfRangeSymbols() {
|
||
|
);
|
||
|
}
|
||
|
|
||
|
+/* DISABLED: Java decoder does not tolerate extra input after the brotli stream.
|
||
|
+ @Test
|
||
|
+ public void testSimplePrefixPlusExtraData() {
|
||
|
+ byte[] compressed = {
|
||
|
+ (byte) 0x1b, (byte) 0x03, (byte) 0x00, (byte) 0x00, (byte) 0xa0, (byte) 0xc3, (byte) 0xc4,
|
||
|
+ (byte) 0xc6, (byte) 0xc8, (byte) 0x02, (byte) 0x00, (byte) 0x70, (byte) 0xb0, (byte) 0x65,
|
||
|
+ (byte) 0x12, (byte) 0x03, (byte) 0x24, (byte) 0x00, (byte) 0x00, (byte) 0xee, (byte) 0xb4,
|
||
|
+ (byte) 0x51, (byte) 0xa0, (byte) 0x1d, (byte) 0x55, (byte) 0xaa
|
||
|
+ };
|
||
|
+ checkSynth(
|
||
|
+ compressed,
|
||
|
+ true,
|
||
|
+ "abcd"
|
||
|
+ );
|
||
|
+ }
|
||
|
+*/
|
||
|
+
|
||
|
@Test
|
||
|
public void testTooManySymbolsRepeated() {
|
||
|
byte[] compressed = {
|
||
|
@@ -2246,7 +2753,7 @@ public void testTransformedDictWord() {
|
||
|
* main_header
|
||
|
* metablock_header_easy: 9, 1
|
||
|
* command_inscopy_easy: 0, 4
|
||
|
- * command_dist_easy: 5121
|
||
|
+ * command_dist_easy: 5121 // 5 << 10 + 1
|
||
|
*/
|
||
|
compressed,
|
||
|
true,
|
||
|
@@ -2270,7 +2777,7 @@ public void testTransformedDictWordTooLong() {
|
||
|
* main_header
|
||
|
* metablock_header_easy: 4, 1
|
||
|
* command_inscopy_easy: 0, 4
|
||
|
- * command_dist_easy: 5121
|
||
|
+ * command_dist_easy: 5121 // 5 << 10 + 1
|
||
|
*/
|
||
|
compressed,
|
||
|
false,
|
||
|
@@ -2280,4 +2787,4 @@ public void testTransformedDictWordTooLong() {
|
||
|
|
||
|
/* GENERATED CODE END */
|
||
|
|
||
|
-}
|
||
|
\ No newline at end of file
|
||
|
+}
|
||
|
diff --git a/java/org/brotli/dec/Transform.java b/java/org/brotli/dec/Transform.java
|
||
|
index b90f2e96..3279ee73 100644
|
||
|
--- a/java/org/brotli/dec/Transform.java
|
||
|
+++ b/java/org/brotli/dec/Transform.java
|
||
|
@@ -10,13 +10,58 @@
|
||
|
|
||
|
/**
|
||
|
* Transformations on dictionary words.
|
||
|
+ *
|
||
|
+ * Transform descriptor is a triplet: {prefix, operator, suffix}.
|
||
|
+ * "prefix" and "suffix" are short strings inserted before and after transformed dictionary word.
|
||
|
+ * "operator" is applied to dictionary word itself.
|
||
|
+ *
|
||
|
+ * Some operators have "built-in" parameters, i.e. parameter is defined by operator ordinal. Other
|
||
|
+ * operators have "external" parameters, supplied via additional table encoded in shared dictionary.
|
||
|
+ *
|
||
|
+ * Operators:
|
||
|
+ * - IDENTITY (0): dictionary word is inserted "as is"
|
||
|
+ * - OMIT_LAST_N (1 - 9): last N octets of dictionary word are not inserted; N == ordinal
|
||
|
+ * - OMIT_FIRST_M (12-20): first M octets of dictionary word are not inserted; M == ordinal - 11
|
||
|
+ * - UPPERCASE_FIRST (10): first "scalar" is XOR'ed with number 32
|
||
|
+ * - UPPERCASE_ALL (11): all "scalars" are XOR'ed with number 32
|
||
|
+ * - SHIFT_FIRST (21): first "scalar" is shifted by a number from the parameter table
|
||
|
+ * - SHIFT_ALL (22): all "scalars" are shifted by a number from the parameter table
|
||
|
+ *
|
||
|
+ * Here "scalar" is a variable length character coding similar to UTF-8 encoding.
|
||
|
+ * UPPERCASE_XXX / SHIFT_XXX operators were designed to change the case of UTF-8 encoded characters.
|
||
|
+ * While UPPERCASE_XXX works well only on ASCII charset, SHIFT is much more generic and could be
|
||
|
+ * used for most (all?) alphabets.
|
||
|
*/
|
||
|
final class Transform {
|
||
|
|
||
|
- static final int NUM_TRANSFORMS = 121;
|
||
|
- private static final int[] TRANSFORMS = new int[NUM_TRANSFORMS * 3];
|
||
|
- private static final byte[] PREFIX_SUFFIX = new byte[217];
|
||
|
- private static final int[] PREFIX_SUFFIX_HEADS = new int[51];
|
||
|
+ static final class Transforms {
|
||
|
+ final int numTransforms;
|
||
|
+ final int[] triplets;
|
||
|
+ final byte[] prefixSuffixStorage;
|
||
|
+ final int[] prefixSuffixHeads;
|
||
|
+ final short[] params;
|
||
|
+
|
||
|
+ Transforms(int numTransforms, int prefixSuffixLen, int prefixSuffixCount) {
|
||
|
+ this.numTransforms = numTransforms;
|
||
|
+ this.triplets = new int[numTransforms * 3];
|
||
|
+ this.params = new short[numTransforms];
|
||
|
+ this.prefixSuffixStorage = new byte[prefixSuffixLen];
|
||
|
+ this.prefixSuffixHeads = new int[prefixSuffixCount + 1];
|
||
|
+ }
|
||
|
+ }
|
||
|
+
|
||
|
+ static final int NUM_RFC_TRANSFORMS = 121;
|
||
|
+ static final Transforms RFC_TRANSFORMS = new Transforms(NUM_RFC_TRANSFORMS, 167, 50);
|
||
|
+
|
||
|
+ private static final int OMIT_FIRST_LAST_LIMIT = 9;
|
||
|
+
|
||
|
+ private static final int IDENTITY = 0;
|
||
|
+ private static final int OMIT_LAST_BASE = IDENTITY + 1 - 1; // there is no OMIT_LAST_0.
|
||
|
+ private static final int UPPERCASE_FIRST = OMIT_LAST_BASE + OMIT_FIRST_LAST_LIMIT + 1;
|
||
|
+ private static final int UPPERCASE_ALL = UPPERCASE_FIRST + 1;
|
||
|
+ private static final int OMIT_FIRST_BASE = UPPERCASE_ALL + 1 - 1; // there is no OMIT_FIRST_0.
|
||
|
+ private static final int SHIFT_FIRST = OMIT_FIRST_BASE + OMIT_FIRST_LAST_LIMIT + 1;
|
||
|
+ private static final int SHIFT_ALL = SHIFT_FIRST + 1;
|
||
|
|
||
|
// Bundle of 0-terminated strings.
|
||
|
private static final String PREFIX_SUFFIX_SRC = "# #s #, #e #.# the #.com/#\u00C2\u00A0# of # and"
|
||
|
@@ -29,71 +74,87 @@
|
||
|
+ " G% ! *A *% H! D I!+! J!+ K +- *4! A L!*4 M N +6 O!*% +.! K *G P +%( ! G *D +D "
|
||
|
+ " Q +# *K!*G!+D!+# +G +A +4!+% +K!+4!*D!+K!*K";
|
||
|
|
||
|
- private static void unpackTransforms(byte[] prefixSuffix, int[] prefixSuffixHeads,
|
||
|
- int[] transforms, String prefixSuffixSrc, String transformsSrc) {
|
||
|
+ private static void unpackTransforms(byte[] prefixSuffix,
|
||
|
+ int[] prefixSuffixHeads, int[] transforms, String prefixSuffixSrc, String transformsSrc) {
|
||
|
int n = prefixSuffixSrc.length();
|
||
|
int index = 1;
|
||
|
+ int j = 0;
|
||
|
for (int i = 0; i < n; ++i) {
|
||
|
char c = prefixSuffixSrc.charAt(i);
|
||
|
- prefixSuffix[i] = (byte) c;
|
||
|
if (c == 35) { // == #
|
||
|
- prefixSuffixHeads[index++] = i + 1;
|
||
|
- prefixSuffix[i] = 0;
|
||
|
+ prefixSuffixHeads[index++] = j;
|
||
|
+ } else {
|
||
|
+ prefixSuffix[j++] = (byte) c;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
- for (int i = 0; i < NUM_TRANSFORMS * 3; ++i) {
|
||
|
+ for (int i = 0; i < NUM_RFC_TRANSFORMS * 3; ++i) {
|
||
|
transforms[i] = transformsSrc.charAt(i) - 32;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
static {
|
||
|
- unpackTransforms(PREFIX_SUFFIX, PREFIX_SUFFIX_HEADS, TRANSFORMS, PREFIX_SUFFIX_SRC,
|
||
|
- TRANSFORMS_SRC);
|
||
|
+ unpackTransforms(RFC_TRANSFORMS.prefixSuffixStorage, RFC_TRANSFORMS.prefixSuffixHeads,
|
||
|
+ RFC_TRANSFORMS.triplets, PREFIX_SUFFIX_SRC, TRANSFORMS_SRC);
|
||
|
}
|
||
|
|
||
|
- static int transformDictionaryWord(byte[] dst, int dstOffset, ByteBuffer data, int wordOffset,
|
||
|
- int len, int transformIndex) {
|
||
|
+ static int transformDictionaryWord(byte[] dst, int dstOffset, ByteBuffer src, int srcOffset,
|
||
|
+ int len, Transforms transforms, int transformIndex) {
|
||
|
int offset = dstOffset;
|
||
|
+ int[] triplets = transforms.triplets;
|
||
|
+ byte[] prefixSuffixStorage = transforms.prefixSuffixStorage;
|
||
|
+ int[] prefixSuffixHeads = transforms.prefixSuffixHeads;
|
||
|
int transformOffset = 3 * transformIndex;
|
||
|
- int transformPrefix = PREFIX_SUFFIX_HEADS[TRANSFORMS[transformOffset]];
|
||
|
- int transformType = TRANSFORMS[transformOffset + 1];
|
||
|
- int transformSuffix = PREFIX_SUFFIX_HEADS[TRANSFORMS[transformOffset + 2]];
|
||
|
+ int prefixIdx = triplets[transformOffset];
|
||
|
+ int transformType = triplets[transformOffset + 1];
|
||
|
+ int suffixIdx = triplets[transformOffset + 2];
|
||
|
+ int prefix = prefixSuffixHeads[prefixIdx];
|
||
|
+ int prefixEnd = prefixSuffixHeads[prefixIdx + 1];
|
||
|
+ int suffix = prefixSuffixHeads[suffixIdx];
|
||
|
+ int suffixEnd = prefixSuffixHeads[suffixIdx + 1];
|
||
|
+
|
||
|
+ int omitFirst = transformType - OMIT_FIRST_BASE;
|
||
|
+ int omitLast = transformType - OMIT_LAST_BASE;
|
||
|
+ if (omitFirst < 1 || omitFirst > OMIT_FIRST_LAST_LIMIT) {
|
||
|
+ omitFirst = 0;
|
||
|
+ }
|
||
|
+ if (omitLast < 1 || omitLast > OMIT_FIRST_LAST_LIMIT) {
|
||
|
+ omitLast = 0;
|
||
|
+ }
|
||
|
|
||
|
// Copy prefix.
|
||
|
- while (PREFIX_SUFFIX[transformPrefix] != 0) {
|
||
|
- dst[offset++] = PREFIX_SUFFIX[transformPrefix++];
|
||
|
+ while (prefix != prefixEnd) {
|
||
|
+ dst[offset++] = prefixSuffixStorage[prefix++];
|
||
|
}
|
||
|
|
||
|
// Copy trimmed word.
|
||
|
- int omitFirst = transformType >= 12 ? (transformType - 11) : 0;
|
||
|
if (omitFirst > len) {
|
||
|
omitFirst = len;
|
||
|
}
|
||
|
- wordOffset += omitFirst;
|
||
|
+ srcOffset += omitFirst;
|
||
|
len -= omitFirst;
|
||
|
- len -= transformType <= 9 ? transformType : 0; // Omit last.
|
||
|
+ len -= omitLast;
|
||
|
int i = len;
|
||
|
while (i > 0) {
|
||
|
- dst[offset++] = data.get(wordOffset++);
|
||
|
+ dst[offset++] = src.get(srcOffset++);
|
||
|
i--;
|
||
|
}
|
||
|
|
||
|
// Ferment.
|
||
|
- if (transformType == 11 || transformType == 10) {
|
||
|
+ if (transformType == UPPERCASE_FIRST || transformType == UPPERCASE_ALL) {
|
||
|
int uppercaseOffset = offset - len;
|
||
|
- if (transformType == 10) {
|
||
|
+ if (transformType == UPPERCASE_FIRST) {
|
||
|
len = 1;
|
||
|
}
|
||
|
while (len > 0) {
|
||
|
- int tmp = dst[uppercaseOffset] & 0xFF;
|
||
|
- if (tmp < 0xc0) {
|
||
|
- if (tmp >= 97 && tmp <= 122) { // in [a..z] range
|
||
|
+ int c0 = dst[uppercaseOffset] & 0xFF;
|
||
|
+ if (c0 < 0xC0) {
|
||
|
+ if (c0 >= 97 && c0 <= 122) { // in [a..z] range
|
||
|
dst[uppercaseOffset] ^= (byte) 32;
|
||
|
}
|
||
|
uppercaseOffset += 1;
|
||
|
len -= 1;
|
||
|
- } else if (tmp < 0xe0) {
|
||
|
+ } else if (c0 < 0xE0) {
|
||
|
dst[uppercaseOffset + 1] ^= (byte) 32;
|
||
|
uppercaseOffset += 2;
|
||
|
len -= 2;
|
||
|
@@ -103,11 +164,71 @@ static int transformDictionaryWord(byte[] dst, int dstOffset, ByteBuffer data, i
|
||
|
len -= 3;
|
||
|
}
|
||
|
}
|
||
|
+ } else if (transformType == SHIFT_FIRST || transformType == SHIFT_ALL) {
|
||
|
+ int shiftOffset = offset - len;
|
||
|
+ short param = transforms.params[transformIndex];
|
||
|
+ /* Limited sign extension: scalar < (1 << 24). */
|
||
|
+ int scalar = (param & 0x7FFF) + (0x1000000 - (param & 0x8000));
|
||
|
+ while (len > 0) {
|
||
|
+ int step = 1;
|
||
|
+ int c0 = dst[shiftOffset] & 0xFF;
|
||
|
+ if (c0 < 0x80) {
|
||
|
+ /* 1-byte rune / 0sssssss / 7 bit scalar (ASCII). */
|
||
|
+ scalar += c0;
|
||
|
+ dst[shiftOffset] = (byte) (scalar & 0x7F);
|
||
|
+ } else if (c0 < 0xC0) {
|
||
|
+ /* Continuation / 10AAAAAA. */
|
||
|
+ } else if (c0 < 0xE0) {
|
||
|
+ /* 2-byte rune / 110sssss AAssssss / 11 bit scalar. */
|
||
|
+ if (len >= 2) {
|
||
|
+ byte c1 = dst[shiftOffset + 1];
|
||
|
+ scalar += (c1 & 0x3F) | ((c0 & 0x1F) << 6);
|
||
|
+ dst[shiftOffset] = (byte) (0xC0 | ((scalar >> 6) & 0x1F));
|
||
|
+ dst[shiftOffset + 1] = (byte) ((c1 & 0xC0) | (scalar & 0x3F));
|
||
|
+ step = 2;
|
||
|
+ } else {
|
||
|
+ step = len;
|
||
|
+ }
|
||
|
+ } else if (c0 < 0xF0) {
|
||
|
+ /* 3-byte rune / 1110ssss AAssssss BBssssss / 16 bit scalar. */
|
||
|
+ if (len >= 3) {
|
||
|
+ byte c1 = dst[shiftOffset + 1];
|
||
|
+ byte c2 = dst[shiftOffset + 2];
|
||
|
+ scalar += (c2 & 0x3F) | ((c1 & 0x3F) << 6) | ((c0 & 0x0F) << 12);
|
||
|
+ dst[shiftOffset] = (byte) (0xE0 | ((scalar >> 12) & 0x0F));
|
||
|
+ dst[shiftOffset + 1] = (byte) ((c1 & 0xC0) | ((scalar >> 6) & 0x3F));
|
||
|
+ dst[shiftOffset + 2] = (byte) ((c2 & 0xC0) | (scalar & 0x3F));
|
||
|
+ step = 3;
|
||
|
+ } else {
|
||
|
+ step = len;
|
||
|
+ }
|
||
|
+ } else if (c0 < 0xF8) {
|
||
|
+ /* 4-byte rune / 11110sss AAssssss BBssssss CCssssss / 21 bit scalar. */
|
||
|
+ if (len >= 4) {
|
||
|
+ byte c1 = dst[shiftOffset + 1];
|
||
|
+ byte c2 = dst[shiftOffset + 2];
|
||
|
+ byte c3 = dst[shiftOffset + 3];
|
||
|
+ scalar += (c3 & 0x3F) | ((c2 & 0x3F) << 6) | ((c1 & 0x3F) << 12) | ((c0 & 0x07) << 18);
|
||
|
+ dst[shiftOffset] = (byte) (0xF0 | ((scalar >> 18) & 0x07));
|
||
|
+ dst[shiftOffset + 1] = (byte) ((c1 & 0xC0) | ((scalar >> 12) & 0x3F));
|
||
|
+ dst[shiftOffset + 2] = (byte) ((c2 & 0xC0) | ((scalar >> 6) & 0x3F));
|
||
|
+ dst[shiftOffset + 3] = (byte) ((c3 & 0xC0) | (scalar & 0x3F));
|
||
|
+ step = 4;
|
||
|
+ } else {
|
||
|
+ step = len;
|
||
|
+ }
|
||
|
+ }
|
||
|
+ shiftOffset += step;
|
||
|
+ len -= step;
|
||
|
+ if (transformType == SHIFT_FIRST) {
|
||
|
+ len = 0;
|
||
|
+ }
|
||
|
+ }
|
||
|
}
|
||
|
|
||
|
// Copy suffix.
|
||
|
- while (PREFIX_SUFFIX[transformSuffix] != 0) {
|
||
|
- dst[offset++] = PREFIX_SUFFIX[transformSuffix++];
|
||
|
+ while (suffix != suffixEnd) {
|
||
|
+ dst[offset++] = prefixSuffixStorage[suffix++];
|
||
|
}
|
||
|
|
||
|
return offset - dstOffset;
|
||
|
diff --git a/java/org/brotli/dec/TransformTest.java b/java/org/brotli/dec/TransformTest.java
|
||
|
index 616ba351..6e04f0dc 100644
|
||
|
--- a/java/org/brotli/dec/TransformTest.java
|
||
|
+++ b/java/org/brotli/dec/TransformTest.java
|
||
|
@@ -36,8 +36,8 @@ private static long crc64(byte[] data) {
|
||
|
public void testTrimAll() {
|
||
|
byte[] output = new byte[0];
|
||
|
byte[] input = {119, 111, 114, 100}; // "word"
|
||
|
- Transform.transformDictionaryWord(
|
||
|
- output, 0, ByteBuffer.wrap(input), 0, input.length, 39);
|
||
|
+ Transform.transformDictionaryWord(output, 0,
|
||
|
+ ByteBuffer.wrap(input), 0, input.length, Transform.RFC_TRANSFORMS, 39);
|
||
|
byte[] expectedOutput = new byte[0];
|
||
|
assertArrayEquals(expectedOutput, output);
|
||
|
}
|
||
|
@@ -46,8 +46,8 @@ public void testTrimAll() {
|
||
|
public void testCapitalize() {
|
||
|
byte[] output = new byte[6];
|
||
|
byte[] input = {113, -61, -90, -32, -92, -86}; // "qæप"
|
||
|
- Transform.transformDictionaryWord(
|
||
|
- output, 0, ByteBuffer.wrap(input), 0, input.length, 44);
|
||
|
+ Transform.transformDictionaryWord(output, 0,
|
||
|
+ ByteBuffer.wrap(input), 0, input.length, Transform.RFC_TRANSFORMS, 44);
|
||
|
byte[] expectedOutput = {81, -61, -122, -32, -92, -81}; // "QÆय"
|
||
|
assertArrayEquals(expectedOutput, output);
|
||
|
}
|
||
|
@@ -60,9 +60,9 @@ public void testAllTransforms() {
|
||
|
byte[] testWord = {111, 49, 50, 51, 52, 53, 54, 55, 56, 57, 97, 98, 99, 100, 101, 102};
|
||
|
byte[] output = new byte[2259];
|
||
|
int offset = 0;
|
||
|
- for (int i = 0; i < Transform.NUM_TRANSFORMS; ++i) {
|
||
|
- offset += Transform.transformDictionaryWord(
|
||
|
- output, offset, ByteBuffer.wrap(testWord), 0, testWord.length, i);
|
||
|
+ for (int i = 0; i < Transform.NUM_RFC_TRANSFORMS; ++i) {
|
||
|
+ offset += Transform.transformDictionaryWord(output, offset,
|
||
|
+ ByteBuffer.wrap(testWord), 0, testWord.length, Transform.RFC_TRANSFORMS, i);
|
||
|
output[offset++] = -1;
|
||
|
}
|
||
|
assertEquals(output.length, offset);
|
||
|
|