aboutsummaryrefslogtreecommitdiffstats
path: root/lib/Bytecode/Reader/Reader.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'lib/Bytecode/Reader/Reader.cpp')
-rw-r--r--lib/Bytecode/Reader/Reader.cpp78
1 files changed, 56 insertions, 22 deletions
diff --git a/lib/Bytecode/Reader/Reader.cpp b/lib/Bytecode/Reader/Reader.cpp
index bedfa7e..18399c1 100644
--- a/lib/Bytecode/Reader/Reader.cpp
+++ b/lib/Bytecode/Reader/Reader.cpp
@@ -2153,19 +2153,40 @@ void BytecodeReader::ParseModule() {
error("Function declared, but bytecode stream ended before definition");
}
-static unsigned GetUncompressionBuffer(char*&buff, unsigned& sz, void* ctxt){
+/// This function handles allocation of the buffer used for decompression of
+/// compressed bytecode files. It is called by Compressor::decompress which is
+/// called by BytecodeReader::ParseBytecode.
+static unsigned GetDecompressionBuffer(char*&buff, unsigned& sz, void* ctxt){
+ // Case the context variable to our BufferInfo
BytecodeReader::BufferInfo* bi =
reinterpret_cast<BytecodeReader::BufferInfo*>(ctxt);
+
+ // Compute the new, doubled, size of the block
unsigned new_size = bi->size * 2;
+
+ // Extend or allocate the block (realloc(0,n) == malloc(n))
+ char* new_buff = (char*) ::realloc(bi->buff, new_size);
+
+ // Figure out what to return to the Compressor. If this is the first call,
+ // then bi->buff will be null. In this case we want to return the entire
+ // buffer because there was no previous allocation. Otherwise, when the
+ // buffer is reallocated, we save the new base pointer in the BufferInfo.buff
+ // field but return the address of only the extension, mid-way through the
+ // buffer (since its size was doubled). Furthermore, the sz result must be
+ // 1/2 the total size of the buffer.
if (bi->buff == 0 ) {
- buff = bi->buff = (char*) malloc(new_size);
+ buff = bi->buff = new_buff;
sz = new_size;
} else {
- bi->buff = (char*) ::realloc(bi->buff, new_size);
- buff = bi->buff + bi->size;
+ bi->buff = new_buff;
+ buff = new_buff + bi->size;
sz = bi->size;
}
+
+ // Retain the size of the allocated block
bi->size = new_size;
+
+ // Make sure we fail (return 1) if we didn't get any memory.
return (bi->buff == 0 ? 1 : 0);
}
@@ -2183,26 +2204,39 @@ void BytecodeReader::ParseBytecode(BufPtr Buf, unsigned Length,
if (Handler) Handler->handleStart(TheModule, Length);
- // Read and check signature...
- bool compressed =
- (Buf[0] == 0xEC && Buf[1] == 0xEC && Buf[2] == 0xF6 && Buf[3] == 0xED);
-
- if (compressed) {
- bi.size = Length * 2;;
- // Bytecode is compressed, have to decompress it first.
- unsigned uncompressedLength = Compressor::decompress((char*)Buf+4,Length-4,
- GetUncompressionBuffer, (void*) &bi);
-
+ // Read the four bytes of the signature.
+ unsigned Sig = read_uint();
+
+ // If this is a compressed file
+ if (Sig == ('l' | ('l' << 8) | ('v' << 16) | ('c' << 24))) {
+
+ // Compute the initial length of the uncompression buffer. Note that this
+ // is twice the length of the compressed buffer and will be doubled again
+ // in GetDecompressionBuffer for an initial allocation of 4xLength. This
+ // calculation is based on the typical compression ratio of bzip2 on LLVM
+ // bytecode files which typically ranges in the 50%-75% range. Since we
+ // tyipcally get at least 50%, doubling is insufficient. By using a 4x
+ // multiplier on the first allocation, we minimize the impact of having to
+ // copy the buffer on reallocation.
+ bi.size = Length * 2;
+
+ // Invoke the decompression of the bytecode. Note that we have to skip the
+ // file's magic number which is not part of the compressed block. Hence,
+ // the Buf+4 and Length-4.
+ unsigned decompressedLength = Compressor::decompress((char*)Buf+4,Length-4,
+ GetDecompressionBuffer, (void*) &bi);
+
+ // We must adjust the buffer pointers used by the bytecode reader to point
+ // into the new decompressed block. After decompression, the BufferInfo
+ // structure (member bi), will point to a contiguous memory area that has
+ // the decompressed data.
At = MemStart = BlockStart = Buf = (BufPtr) bi.buff;
- MemEnd = BlockEnd = Buf + uncompressedLength;
+ MemEnd = BlockEnd = Buf + decompressedLength;
- } else {
- if (!(Buf[0] == 'l' && Buf[1] == 'l' && Buf[2] == 'v' && Buf[3] == 'm'))
- error("Invalid bytecode signature: " +
- utohexstr(Buf[0]) + utohexstr(Buf[1]) + utohexstr(Buf[2]) +
- utohexstr(Buf[3]));
- else
- At += 4; // skip the bytes
+ // else if this isn't a regular (uncompressed) bytecode file, then its
+ // and error, generate that now.
+ } else if (Sig != ('l' | ('l' << 8) | ('v' << 16) | ('m' << 24))) {
+ error("Invalid bytecode signature: " + utohexstr(Sig));
}
// Tell the handler we're starting a module