///////////////////////////////////////////////////////////////////////////////
//
/// \file       x86.c
/// \brief      Filter for x86 binaries (BCJ filter)
///
//  Authors:    Igor Pavlov
//              Lasse Collin
//
//  This file has been put into the public domain.
//  You can do whatever you want with this file.
//
///////////////////////////////////////////////////////////////////////////////

#include "simple_private.h"


/// Evaluates to true when byte `b` is 0x00 or 0xFF. The filter only
/// converts an operand whose most significant byte passes this test.
#define Test86MSByte(b) ((b) == 0 || (b) == 0xFF)


/// State that x86_code() carries from one call to the next.
typedef struct {
	/// Shifting history of recently rejected opcode bytes. Bit 0 is set
	/// when an 0xE8/0xE9 byte is left unconverted, and bit 4 is set as
	/// well if the byte four positions after it was 0x00 or 0xFF. The
	/// value is masked with 0x77 and shifted left once for every byte
	/// of distance to the next opcode byte.
	uint32_t prev_mask;

	/// Stream position (now_pos + buffer offset) of the most recently
	/// seen 0xE8/0xE9 byte.
	uint32_t prev_pos;
} lzma_simple_x86;


/// \brief      Convert x86 relative branch operands in place
///
/// Scans `buffer` for 0xE8 and 0xE9 bytes (the x86 CALL rel32 and JMP rel32
/// opcodes). When the four bytes following such a byte pass the filter's
/// checks, they are read as a little-endian 32-bit value and the position
/// of the end of the five-byte instruction is added to it (encoder) or
/// subtracted from it (decoder).
///
/// \param      simple_ptr  Pointer to a lzma_simple_x86 state structure;
///                         it is read on entry and updated before a
///                         normal return
/// \param      now_pos     Stream position of buffer[0]
/// \param      is_encoder  true to add the position, false to subtract it
/// \param      buffer      Data to filter; modified in place
/// \param      size        Number of bytes available in buffer
///
/// \return     Offset of the first byte that was not examined. The value
///             is zero, with the state left untouched, when size is less
///             than five.
static size_t
x86_code(void *simple_ptr, uint32_t now_pos, bool is_encoder,
		uint8_t *buffer, size_t size)
{
	// Indexed by (prev_mask >> 1) & 7: whether a conversion is allowed
	// for that history pattern.
	static const bool MASK_TO_ALLOWED_STATUS[8]
		= { true, true, true, false, true, false, false, false };

	// Indexed by prev_mask >> 1: selects which byte of the converted
	// value is re-tested in the inner loop below.
	static const uint32_t MASK_TO_BIT_NUMBER[8]
		= { 0, 1, 2, 2, 3, 3, 3, 3 };

	lzma_simple_x86 *simple = simple_ptr;
	uint32_t prev_mask = simple->prev_mask;
	uint32_t prev_pos = simple->prev_pos;

	// An opcode byte plus its four operand bytes must be available.
	if (size < 5)
		return 0;

	// Clamp the remembered position so that it is at most five bytes
	// behind the start of this buffer.
	if (now_pos - prev_pos > 5)
		prev_pos = now_pos - 5;

	// Last offset at which a complete five-byte instruction still fits.
	const size_t limit = size - 5;
	size_t buffer_pos = 0;

	while (buffer_pos <= limit) {
		uint8_t b = buffer[buffer_pos];
		if (b != 0xE8 && b != 0xE9) {
			++buffer_pos;
			continue;
		}

		// Stream position of this opcode byte, and its distance from
		// the previously seen opcode byte.
		const uint32_t pos = now_pos + (uint32_t)(buffer_pos);
		const uint32_t offset = pos - prev_pos;
		prev_pos = pos;

		if (offset > 5) {
			// The previous opcode byte is too far back to matter.
			prev_mask = 0;
		} else {
			// Age the history by one step per byte of distance.
			for (uint32_t i = 0; i < offset; ++i) {
				prev_mask &= 0x77;
				prev_mask <<= 1;
			}
		}

		// Most significant byte of the little-endian operand.
		b = buffer[buffer_pos + 4];

		if (Test86MSByte(b)
				&& MASK_TO_ALLOWED_STATUS[
					(prev_mask >> 1) & 0x7]
				&& (prev_mask >> 1) < 0x10) {

			uint32_t src = ((uint32_t)(b) << 24)
				| ((uint32_t)(buffer[buffer_pos + 3]) << 16)
				| ((uint32_t)(buffer[buffer_pos + 2]) << 8)
				| (uint32_t)(buffer[buffer_pos + 1]);

			uint32_t dest;
			while (true) {
				// pos + 5 is the position just past this
				// five-byte instruction.
				if (is_encoder)
					dest = src + (pos + 5);
				else
					dest = src - (pos + 5);

				if (prev_mask == 0)
					break;

				const uint32_t i = MASK_TO_BIT_NUMBER[
						prev_mask >> 1];

				b = (uint8_t)(dest >> (24 - i * 8));

				if (!Test86MSByte(b))
					break;

				// Flip the low (32 - 8 * i) bits and convert
				// again. The shift count is 8, 16 or 24 here,
				// since i is 1, 2 or 3 for every non-zero
				// prev_mask that passes the test above.
				src = dest ^ ((1U << (32 - i * 8)) - 1);
			}

			// The top byte is written as 0xFF when bit 24 of dest
			// is set and as 0x00 otherwise.
			buffer[buffer_pos + 4]
				= (uint8_t)(~(((dest >> 24) & 1) - 1));
			buffer[buffer_pos + 3] = (uint8_t)(dest >> 16);
			buffer[buffer_pos + 2] = (uint8_t)(dest >> 8);
			buffer[buffer_pos + 1] = (uint8_t)(dest);
			buffer_pos += 5;
			prev_mask = 0;

		} else {
			// Not converted: step over the opcode byte only and
			// record it in the history.
			++buffer_pos;
			prev_mask |= 1;
			if (Test86MSByte(b))
				prev_mask |= 0x10;
		}
	}

	simple->prev_mask = prev_mask;
	simple->prev_pos = prev_pos;

	return buffer_pos;
}


1262940b44dSPeter Avalos static lzma_ret
x86_coder_init(lzma_next_coder * next,const lzma_allocator * allocator,const lzma_filter_info * filters,bool is_encoder)12715ab8c86SJohn Marino x86_coder_init(lzma_next_coder *next, const lzma_allocator *allocator,
1282940b44dSPeter Avalos const lzma_filter_info *filters, bool is_encoder)
1292940b44dSPeter Avalos {
1302940b44dSPeter Avalos const lzma_ret ret = lzma_simple_coder_init(next, allocator, filters,
13146a2189dSzrj &x86_code, sizeof(lzma_simple_x86), 5, 1, is_encoder);
1322940b44dSPeter Avalos
1332940b44dSPeter Avalos if (ret == LZMA_OK) {
13446a2189dSzrj lzma_simple_coder *coder = next->coder;
13546a2189dSzrj lzma_simple_x86 *simple = coder->simple;
13646a2189dSzrj simple->prev_mask = 0;
13746a2189dSzrj simple->prev_pos = (uint32_t)(-5);
1382940b44dSPeter Avalos }
1392940b44dSPeter Avalos
1402940b44dSPeter Avalos return ret;
1412940b44dSPeter Avalos }
1422940b44dSPeter Avalos
1432940b44dSPeter Avalos
1442940b44dSPeter Avalos extern lzma_ret
lzma_simple_x86_encoder_init(lzma_next_coder * next,const lzma_allocator * allocator,const lzma_filter_info * filters)14515ab8c86SJohn Marino lzma_simple_x86_encoder_init(lzma_next_coder *next,
14615ab8c86SJohn Marino const lzma_allocator *allocator,
1472940b44dSPeter Avalos const lzma_filter_info *filters)
1482940b44dSPeter Avalos {
1492940b44dSPeter Avalos return x86_coder_init(next, allocator, filters, true);
1502940b44dSPeter Avalos }
1512940b44dSPeter Avalos
1522940b44dSPeter Avalos
1532940b44dSPeter Avalos extern lzma_ret
lzma_simple_x86_decoder_init(lzma_next_coder * next,const lzma_allocator * allocator,const lzma_filter_info * filters)15415ab8c86SJohn Marino lzma_simple_x86_decoder_init(lzma_next_coder *next,
15515ab8c86SJohn Marino const lzma_allocator *allocator,
1562940b44dSPeter Avalos const lzma_filter_info *filters)
1572940b44dSPeter Avalos {
1582940b44dSPeter Avalos return x86_coder_init(next, allocator, filters, false);
1592940b44dSPeter Avalos }
160