/* Copyright (c) 2013. The YARA Authors. All Rights Reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: 1. Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. 2. Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. 3. Neither the name of the copyright holder nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ /* This module implements a structure I've called "arena". An arena is a data container composed of a set of pages. The arena grows automatically when needed by adding new pages to hold new data. Arenas can be saved and loaded from files. */ #include #include #include #include #include #include #include #include #include #include #pragma pack(push) #pragma pack(1) typedef struct _ARENA_FILE_HEADER { char magic[4]; uint32_t size; uint32_t version; } ARENA_FILE_HEADER; #pragma pack(pop) #define free_space(page) \ ((page)->size - (page)->used) // // _yr_arena_new_page // // Creates a new arena page of a given size // // Args: // size_t size - Size of the page // // Returns: // A pointer to the newly created YR_ARENA_PAGE structure // static YR_ARENA_PAGE* _yr_arena_new_page( size_t size) { YR_ARENA_PAGE* new_page; new_page = (YR_ARENA_PAGE*) yr_malloc(sizeof(YR_ARENA_PAGE)); if (new_page == NULL) return NULL; new_page->address = (uint8_t*) yr_malloc(size); if (new_page->address == NULL) { yr_free(new_page); return NULL; } new_page->size = size; new_page->used = 0; new_page->next = NULL; new_page->prev = NULL; new_page->reloc_list_head = NULL; new_page->reloc_list_tail = NULL; return new_page; } // // yr_arena_page_for_address // // Returns the page within the arena where an address reside. // // Args: // YR_ARENA* arena - Pointer to the arena // void* address - Address to be located // // Returns: // A pointer the corresponding YR_ARENA_PAGE structure where the address // resides. // YR_ARENA_PAGE* yr_arena_page_for_address( YR_ARENA* arena, void* address) { YR_ARENA_PAGE* page; // Most of the times this function is called with an address within // the current page, let's check the current page first to avoid // looping through the page list. page = arena->current_page; if (page != NULL && (uint8_t*) address >= page->address && (uint8_t*) address < page->address + page->used) return page; page = arena->page_list_head; while (page != NULL) { if ((uint8_t*) address >= page->address && (uint8_t*) address < page->address + page->used) return page; page = page->next; } return NULL; } // // _yr_arena_make_ptr_relocatable // // Tells the arena that certain addresses contains a relocatable pointer. // // Args: // YR_ARENA* arena - Pointer the arena // void* address - Base address // va_list offsets - List of offsets relative to base address // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // static int _yr_arena_make_ptr_relocatable( YR_ARENA* arena, void* base, va_list offsets) { YR_RELOC* reloc; YR_ARENA_PAGE* page; size_t offset; size_t base_offset; int result = ERROR_SUCCESS; // If the arena must be relocatable. assert(arena->flags & ARENA_FLAGS_RELOCATABLE); page = yr_arena_page_for_address(arena, base); assert(page != NULL); base_offset = (uint8_t*) base - page->address; offset = va_arg(offsets, size_t); while (offset != -1) { assert(page->used >= sizeof(int64_t)); assert(base_offset + offset <= page->used - sizeof(int64_t)); reloc = (YR_RELOC*) yr_malloc(sizeof(YR_RELOC)); if (reloc == NULL) return ERROR_INSUFFICIENT_MEMORY; reloc->offset = (uint32_t) (base_offset + offset); reloc->next = NULL; if (page->reloc_list_head == NULL) page->reloc_list_head = reloc; if (page->reloc_list_tail != NULL) page->reloc_list_tail->next = reloc; page->reloc_list_tail = reloc; offset = va_arg(offsets, size_t); } return result; } // // yr_arena_create // // Creates a new arena. // // Args: // size_t initial_size - Initial size // int flags - Flags // YR_ARENA** arena - Address where a pointer to the new arena will be // written to. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_create( size_t initial_size, int flags, YR_ARENA** arena) { YR_ARENA* new_arena; YR_ARENA_PAGE* new_page; *arena = NULL; new_arena = (YR_ARENA*) yr_malloc(sizeof(YR_ARENA)); if (new_arena == NULL) return ERROR_INSUFFICIENT_MEMORY; new_page = _yr_arena_new_page(initial_size); if (new_page == NULL) { yr_free(new_arena); return ERROR_INSUFFICIENT_MEMORY; } new_arena->page_list_head = new_page; new_arena->current_page = new_page; new_arena->flags = flags | ARENA_FLAGS_COALESCED; *arena = new_arena; return ERROR_SUCCESS; } // // yr_arena_destroy // // Destroys an arena releasing its resource. // // Args: // YR_ARENA* arena - Pointer to the arena. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // void yr_arena_destroy( YR_ARENA* arena) { YR_RELOC* reloc; YR_RELOC* next_reloc; YR_ARENA_PAGE* page; YR_ARENA_PAGE* next_page; if (arena == NULL) return; page = arena->page_list_head; while(page != NULL) { next_page = page->next; reloc = page->reloc_list_head; while (reloc != NULL) { next_reloc = reloc->next; yr_free(reloc); reloc = next_reloc; } yr_free(page->address); yr_free(page); page = next_page; } yr_free(arena); } // // yr_arena_base_address // // Returns the base address for the arena. // // Args: // YR_ARENA* arena - Pointer to the arena. // // Returns: // A pointer to the arena's data. NULL if no data has been written to // the arena yet. // void* yr_arena_base_address( YR_ARENA* arena) { if (arena->page_list_head->used == 0) return NULL; return arena->page_list_head->address; } // // yr_arena_next_address // // Given an address and an offset, returns the address where // address + offset resides. The arena is a collection of non-contiguous // regions of memory (pages), if address is pointing at the end of a page, // address + offset could cross the page boundary and point at somewhere // within the next page, this function handles these situations. It works // also with negative offsets. // // Args: // YR_ARENA* arena - Pointer to the arena. // void* address - Base address. // int offset - Offset. // // Returns: // A pointer // void* yr_arena_next_address( YR_ARENA* arena, void* address, size_t offset) { YR_ARENA_PAGE* page; page = yr_arena_page_for_address(arena, address); assert(page != NULL); if ((uint8_t*) address + offset >= page->address && (uint8_t*) address + offset < page->address + page->used) { return (uint8_t*) address + offset; } if (offset > 0) { offset -= page->address + page->used - (uint8_t*) address; page = page->next; while (page != NULL) { if (offset < page->used) return page->address + offset; offset -= page->used; page = page->next; } } else { offset += page->used; page = page->prev; while (page != NULL) { if (offset < page->used) return page->address + page->used + offset; offset += page->used; page = page->prev; } } return NULL; } // // yr_arena_coalesce // // Coalesce the arena into a single page. This is a required step before // saving the arena to a file. // // Args: // YR_ARENA* arena - Pointer to the arena. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_coalesce( YR_ARENA* arena) { YR_ARENA_PAGE* page; YR_ARENA_PAGE* big_page; YR_ARENA_PAGE* next_page; YR_RELOC* reloc; uint8_t** reloc_address; uint8_t* reloc_target; size_t total_size = 0; page = arena->page_list_head; while(page != NULL) { total_size += page->used; page = page->next; } // Create a new page that will contain the entire arena. big_page = _yr_arena_new_page(total_size); if (big_page == NULL) return ERROR_INSUFFICIENT_MEMORY; // Copy data from current pages to the big page and adjust relocs. page = arena->page_list_head; while (page != NULL) { page->new_address = big_page->address + big_page->used; memcpy(page->new_address, page->address, page->used); reloc = page->reloc_list_head; while (reloc != NULL) { reloc->offset += (uint32_t) big_page->used; reloc = reloc->next; } if (big_page->reloc_list_head == NULL) big_page->reloc_list_head = page->reloc_list_head; if (big_page->reloc_list_tail != NULL) big_page->reloc_list_tail->next = page->reloc_list_head; if (page->reloc_list_tail != NULL) big_page->reloc_list_tail = page->reloc_list_tail; big_page->used += page->used; page = page->next; } // Relocate pointers. reloc = big_page->reloc_list_head; while (reloc != NULL) { reloc_address = (uint8_t**) (big_page->address + reloc->offset); reloc_target = *reloc_address; if (reloc_target != NULL) { page = yr_arena_page_for_address(arena, reloc_target); assert(page != NULL); *reloc_address = page->new_address + (reloc_target - page->address); } reloc = reloc->next; } // Release current pages. page = arena->page_list_head; while(page != NULL) { next_page = page->next; yr_free(page->address); yr_free(page); page = next_page; } arena->page_list_head = big_page; arena->current_page = big_page; arena->flags |= ARENA_FLAGS_COALESCED; return ERROR_SUCCESS; } // // yr_arena_reserve_memory // // Ensures that the arena have enough contiguous memory for future allocations. // if the available space in the current page is lower than "size", a new page // is allocated. // // Args: // YR_ARENA* arena - Pointer to the arena. // size_t size - Size of the region to be reserved. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_reserve_memory( YR_ARENA* arena, size_t size) { YR_ARENA_PAGE* new_page; size_t new_page_size; uint8_t* new_page_address; if (size > free_space(arena->current_page)) { // Requested space is bigger than current page's empty space, // lets calculate the size for a new page. new_page_size = arena->current_page->size * 2; while (new_page_size < size) new_page_size *= 2; if (arena->current_page->used == 0) { // Current page is not used at all, it can be reallocated. new_page_address = (uint8_t*) yr_realloc( arena->current_page->address, new_page_size); if (new_page_address == NULL) return ERROR_INSUFFICIENT_MEMORY; arena->current_page->address = new_page_address; arena->current_page->size = new_page_size; } else { new_page = _yr_arena_new_page(new_page_size); if (new_page == NULL) return ERROR_INSUFFICIENT_MEMORY; new_page->prev = arena->current_page; arena->current_page->next = new_page; arena->current_page = new_page; arena->flags &= ~ARENA_FLAGS_COALESCED; } } return ERROR_SUCCESS; } // // yr_arena_allocate_memory // // Allocates memory within the arena. // // Args: // YR_ARENA* arena - Pointer to the arena. // size_t size - Size of the region to be allocated. // void** allocated_memory - Address of a pointer to newly allocated // region. // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_allocate_memory( YR_ARENA* arena, size_t size, void** allocated_memory) { FAIL_ON_ERROR(yr_arena_reserve_memory(arena, size)); *allocated_memory = arena->current_page->address + \ arena->current_page->used; arena->current_page->used += size; return ERROR_SUCCESS; } // // yr_arena_allocate_struct // // Allocates a structure within the arena. This function is similar to // yr_arena_allocate_memory but additionally receives a variable-length // list of offsets within the structure where pointers reside. This allows // the arena to keep track of pointers that must be adjusted when memory // is relocated. This is an example on how to invoke this function: // // yr_arena_allocate_struct( // arena, // sizeof(MY_STRUCTURE), // (void**) &my_structure_ptr, // offsetof(MY_STRUCTURE, field_1), // offsetof(MY_STRUCTURE, field_2), // .. // offsetof(MY_STRUCTURE, field_N), // EOL); // // Args: // YR_ARENA* arena - Pointer to the arena. // size_t size - Size of the region to be allocated. // void** allocated_memory - Address of a pointer to newly allocated // region. // ... - Variable number of offsets relative to the // beginning of the struct. Offsets are of type // size_t. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_allocate_struct( YR_ARENA* arena, size_t size, void** allocated_memory, ...) { int result; va_list offsets; va_start(offsets, allocated_memory); result = yr_arena_allocate_memory(arena, size, allocated_memory); if (result == ERROR_SUCCESS && arena->flags & ARENA_FLAGS_RELOCATABLE) result = _yr_arena_make_ptr_relocatable(arena, *allocated_memory, offsets); va_end(offsets); if (result == ERROR_SUCCESS) memset(*allocated_memory, 0, size); return result; } // // yr_arena_make_ptr_relocatable // // Tells the arena that certain addresses contains a relocatable pointer. // // Args: // YR_ARENA* arena - Pointer to the arena. // void* base - Address within the arena. // ... - Variable number of size_t arguments with offsets // relative to base. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_make_ptr_relocatable( YR_ARENA* arena, void* base, ...) { int result; va_list offsets; va_start(offsets, base); result = _yr_arena_make_ptr_relocatable(arena, base, offsets); va_end(offsets); return result; } // // yr_arena_write_data // // Writes data to the arena. // // Args: // YR_ARENA* arena - Pointer to the arena. // void* data - Pointer to data to be written. // size_t size - Size of data. // void** written_data - Address where a pointer to the written data will // be returned. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_write_data( YR_ARENA* arena, const void* data, size_t size, void** written_data) { void* output; int result; if (size > free_space(arena->current_page)) { result = yr_arena_allocate_memory(arena, size, &output); if (result != ERROR_SUCCESS) return result; } else { output = arena->current_page->address + arena->current_page->used; arena->current_page->used += size; } memcpy(output, data, size); if (written_data != NULL) *written_data = output; return ERROR_SUCCESS; } // // yr_arena_write_string // // Writes string to the arena. // // Args: // YR_ARENA* arena - Pointer to the arena. // const char* string - Pointer to string to be written. // char** written_string - Address where a pointer to the written data will // be returned. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_write_string( YR_ARENA* arena, const char* string, char** written_string) { return yr_arena_write_data( arena, (void*) string, strlen(string) + 1, (void**) written_string); } // // yr_arena_append // // Appends source_arena to target_arena. This operation destroys source_arena, // after returning any pointer to source_arena is no longer valid. The data // from source_arena is guaranteed to be aligned to a 16 bytes boundary when // written to the source_arena // // Args: // YR_ARENA* target_arena - Pointer to target the arena. // YR_ARENA* source_arena - Pointer to source arena. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_append( YR_ARENA* target_arena, YR_ARENA* source_arena) { uint8_t padding_data[15]; size_t padding_size = 16 - target_arena->current_page->used % 16; if (padding_size < 16) { memset(&padding_data, 0xCC, padding_size); FAIL_ON_ERROR(yr_arena_write_data( target_arena, padding_data, padding_size, NULL)); } target_arena->current_page->next = source_arena->page_list_head; source_arena->page_list_head->prev = target_arena->current_page; target_arena->current_page = source_arena->current_page; yr_free(source_arena); return ERROR_SUCCESS; } // // yr_arena_duplicate // // Duplicates the arena, making an exact copy. This function requires the // arena to be coalesced. // // Args: // YR_ARENA* arena - Pointer to the arena. // YR_ARENA** duplicated - Address where a pointer to the new arena arena // will be returned. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_duplicate( YR_ARENA* arena, YR_ARENA** duplicated) { YR_RELOC* reloc; YR_RELOC* new_reloc; YR_ARENA_PAGE* page; YR_ARENA_PAGE* new_page; YR_ARENA* new_arena; uint8_t** reloc_address; uint8_t* reloc_target; // Arena must be coalesced and relocatable in order to be duplicated. assert(arena->flags & ARENA_FLAGS_COALESCED); assert(arena->flags & ARENA_FLAGS_RELOCATABLE); page = arena->page_list_head; FAIL_ON_ERROR(yr_arena_create(page->size, arena->flags, &new_arena)); new_page = new_arena->current_page; new_page->used = page->used; memcpy(new_page->address, page->address, page->size); reloc = page->reloc_list_head; while (reloc != NULL) { new_reloc = (YR_RELOC*) yr_malloc(sizeof(YR_RELOC)); if (new_reloc == NULL) { yr_arena_destroy(new_arena); return ERROR_INSUFFICIENT_MEMORY; } new_reloc->offset = reloc->offset; new_reloc->next = NULL; if (new_page->reloc_list_head == NULL) new_page->reloc_list_head = new_reloc; if (new_page->reloc_list_tail != NULL) new_page->reloc_list_tail->next = new_reloc; new_page->reloc_list_tail = new_reloc; reloc_address = (uint8_t**) (new_page->address + new_reloc->offset); reloc_target = *reloc_address; if (reloc_target != NULL) { assert(reloc_target >= page->address); assert(reloc_target < page->address + page->used); *reloc_address = reloc_target - \ page->address + \ new_page->address; } reloc = reloc->next; } *duplicated = new_arena; return ERROR_SUCCESS; } // // yr_arena_load_stream // // Loads an arena from a stream. The resulting arena is not relocatable, which // implies that the arena can't be duplicated with yr_arena_duplicate nor // saved with yr_arena_save_stream. // // Args: // YR_STREAM* stream - Pointer to stream object // YR_ARENA** - Address where a pointer to the loaded arena // will be returned // // Returns: // ERROR_SUCCESS if successful, appropriate error code otherwise. // int yr_arena_load_stream( YR_STREAM* stream, YR_ARENA** arena) { YR_ARENA_PAGE* page; YR_ARENA* new_arena; ARENA_FILE_HEADER header; uint32_t real_hash; uint32_t file_hash; uint32_t reloc_offset; uint8_t** reloc_address; uint8_t* reloc_target; uint32_t max_reloc_offset; int result; if (yr_stream_read(&header, sizeof(header), 1, stream) != 1) return ERROR_INVALID_FILE; if (header.magic[0] != 'Y' || header.magic[1] != 'A' || header.magic[2] != 'R' || header.magic[3] != 'A') { return ERROR_INVALID_FILE; } if (header.size < 2048) // compiled rules are always larger than 2KB return ERROR_CORRUPT_FILE; if (header.version != ARENA_FILE_VERSION) return ERROR_UNSUPPORTED_FILE_VERSION; real_hash = yr_hash(0, &header, sizeof(header)); result = yr_arena_create(header.size, ARENA_FLAGS_COALESCED, &new_arena); if (result != ERROR_SUCCESS) return result; page = new_arena->current_page; if (yr_stream_read(page->address, header.size, 1, stream) != 1) { yr_arena_destroy(new_arena); return ERROR_CORRUPT_FILE; } page->used = header.size; real_hash = yr_hash(real_hash, page->address, page->used); if (yr_stream_read(&reloc_offset, sizeof(reloc_offset), 1, stream) != 1) { yr_arena_destroy(new_arena); return ERROR_CORRUPT_FILE; } max_reloc_offset = header.size - sizeof(uint8_t*); while (reloc_offset != 0xFFFFFFFF) { if (reloc_offset > max_reloc_offset) { yr_arena_destroy(new_arena); return ERROR_CORRUPT_FILE; } //yr_arena_make_ptr_relocatable(new_arena, page->address, reloc_offset, EOL); reloc_address = (uint8_t**) (page->address + reloc_offset); reloc_target = *reloc_address; if (reloc_target == (uint8_t*) (size_t) 0xFFFABADA) { *reloc_address = 0; } else if (reloc_target < (uint8_t*) (size_t) max_reloc_offset) { *reloc_address += (size_t) page->address; } else { yr_arena_destroy(new_arena); return ERROR_CORRUPT_FILE; } if (yr_stream_read(&reloc_offset, sizeof(reloc_offset), 1, stream) != 1) { yr_arena_destroy(new_arena); return ERROR_CORRUPT_FILE; } } if (yr_stream_read(&file_hash, sizeof(file_hash), 1, stream) != 1) { yr_arena_destroy(new_arena); return ERROR_CORRUPT_FILE; } if (file_hash != real_hash) { yr_arena_destroy(new_arena); return ERROR_CORRUPT_FILE; } *arena = new_arena; return ERROR_SUCCESS; } // // yr_arena_save_stream // // Saves the arena into a stream. If the file exists its overwritten. This // function requires the arena to be coalesced. // // Args: // YR_ARENA* arena - Pointer to the arena. // YR_STREAM* stream - Pointer to stream object. // // Returns: // ERROR_SUCCESS if succeed or the corresponding error code otherwise. // int yr_arena_save_stream( YR_ARENA* arena, YR_STREAM* stream) { YR_ARENA_PAGE* page; YR_RELOC* reloc; ARENA_FILE_HEADER header; uint32_t end_marker = 0xFFFFFFFF; uint32_t file_hash; uint8_t** reloc_address; uint8_t* reloc_target; // Only coalesced and relocatable arenas can be saved. assert(arena->flags & ARENA_FLAGS_COALESCED); assert(arena->flags & ARENA_FLAGS_RELOCATABLE); page = arena->page_list_head; reloc = page->reloc_list_head; // Convert pointers to offsets before saving. while (reloc != NULL) { reloc_address = (uint8_t**) (page->address + reloc->offset); reloc_target = *reloc_address; if (reloc_target != NULL) { assert(reloc_target >= page->address); assert(reloc_target < page->address + page->used); *reloc_address = (uint8_t*) (*reloc_address - page->address); } else { *reloc_address = (uint8_t*) (size_t) 0xFFFABADA; } reloc = reloc->next; } assert(page->size < 0x80000000); // 2GB header.magic[0] = 'Y'; header.magic[1] = 'A'; header.magic[2] = 'R'; header.magic[3] = 'A'; header.size = (int32_t) page->size; header.version = ARENA_FILE_VERSION; if (yr_stream_write(&header, sizeof(header), 1, stream) != 1) return ERROR_WRITING_FILE; if (yr_stream_write(page->address, header.size, 1, stream) != 1) return ERROR_WRITING_FILE; file_hash = yr_hash(0, &header, sizeof(header)); file_hash = yr_hash(file_hash, page->address, page->used); reloc = page->reloc_list_head; // Convert offsets back to pointers. while (reloc != NULL) { if (yr_stream_write(&reloc->offset, sizeof(reloc->offset), 1, stream) != 1) return ERROR_WRITING_FILE; reloc_address = (uint8_t**) (page->address + reloc->offset); reloc_target = *reloc_address; if (reloc_target != (void*) (size_t) 0xFFFABADA) *reloc_address += (size_t) page->address; else *reloc_address = 0; reloc = reloc->next; } if (yr_stream_write(&end_marker, sizeof(end_marker), 1, stream) != 1) return ERROR_WRITING_FILE; if (yr_stream_write(&file_hash, sizeof(file_hash), 1, stream) != 1) return ERROR_WRITING_FILE; return ERROR_SUCCESS; }