corda/src/finder.cpp
Joshua Warner 1fcc097344 use size_t instead of unsigned in a bunch of appropriate places
This would theoretically break compatibility with apps using embedded
classpaths, on big-endian architectures - because of the size type
extension.  However, we don't currently support any big-endian
architectures, so it shouldn't be a problem.
2015-03-16 16:28:20 -06:00

1105 lines
26 KiB
C++

/* Copyright (c) 2008-2015, Avian Contributors
Permission to use, copy, modify, and/or distribute this software
for any purpose with or without fee is hereby granted, provided
that the above copyright notice and this permission notice appear
in all copies.
There is NO WARRANTY for this software. See license.txt for
details. */
#include <avian/system/system.h>
#include <avian/util/string.h>
#include <avian/util/runtime-array.h>
#include <avian/util/list.h>
#include <avian/util/hash.h>
#include <avian/util/tokenizer.h>
#include "avian/zlib-custom.h"
#include "avian/finder.h"
#include "avian/lzma.h"
#include "avian/append.h"
using namespace vm;
using namespace avian::util;
namespace {
// Compile-time tracing switches.  When DebugFind is true, the elements below
// report lookups and search path additions on stderr; when DebugStat is true,
// they report the outcome of stat calls on stderr.
const bool DebugFind = false;
const bool DebugStat = false;
// A single entry of the search path.  Entries form a singly linked list
// through `next`; each concrete subclass decides how a name is resolved
// inside it.
class Element {
 public:
  // Enumerates the names contained in an element.
  class Iterator {
   public:
    // Returns the next name and stores its length in *size, or returns 0
    // when the enumeration is finished.
    virtual const char* next(size_t* size) = 0;

    // Releases the iterator.
    virtual void dispose() = 0;
  };

  Element() : next(0) {}

  // Creates an iterator over the names in this element.
  virtual Iterator* iterator() = 0;

  // Returns a region holding the contents of `name`, or 0 if it is absent.
  virtual System::Region* find(const char* name) = 0;

  // Reports what kind of entry `name` is and stores its size in *length.
  virtual System::FileType stat(const char* name,
                                size_t* length,
                                bool tryDirectory) = 0;

  // URL prefix for resources found in this element.
  virtual const char* urlPrefix() = 0;

  // URL of the element itself.
  virtual const char* sourceUrl() = 0;

  // Releases the element and everything it owns.
  virtual void dispose() = 0;

  // Next entry of the search path, or 0 for the last one.
  Element* next;
};
// Search path entry backed by a directory of the file system.
class DirectoryElement : public Element {
 public:
  // Enumerates the entries of a directory, descending into subdirectories.
  // Entries whose name starts with '.' are skipped.  Every reported name is
  // the full path of the entry with its first `skip` characters removed.
  class Iterator : public Element::Iterator {
   public:
    Iterator(System* s, Alloc* allocator, const char* name, unsigned skip)
        : s(s),
          allocator(allocator),
          name(name),
          skip(skip),
          directory(0),
          last(0),
          it(0)
    {
      if (not s->success(s->open(&directory, name))) {
        // An unreadable directory simply yields no entries.
        directory = 0;
      }
    }

    // Returns the next name and stores its length in *size, or returns 0
    // when the directory is exhausted.  The returned string is owned by the
    // iterator and is released by the following call to next() or by
    // dispose().
    virtual const char* next(size_t* size)
    {
      // Finish the subdirectory discovered by the previous call first.
      if (it) {
        const char* v = it->next(size);
        if (v) {
          return v;
        }
        it->dispose();
        it = 0;
      }

      // The path handed out by the previous call is no longer needed.  Reset
      // the pointer so that it can never be released twice.
      if (last) {
        allocator->free(last, strlen(last) + 1);
        last = 0;
      }

      if (directory) {
        for (const char* v = directory->next(); v; v = directory->next()) {
          if (v[0] != '.') {
            last = append(allocator, name, "/", v);

            size_t length;
            if (s->stat(last, &length) == System::TypeDirectory) {
              // The nested iterator borrows `last` as its directory name; it
              // is always disposed before `last` is released.
              it = new (allocator->allocate(sizeof(Iterator)))
                  Iterator(s, allocator, last, skip);
            }

            const char* result = last + skip;
            *size = strlen(result);
            return result;
          }
        }
      }

      return 0;
    }

    // Releases the iterator together with any nested iterator, the last
    // reported path and the directory handle.
    virtual void dispose()
    {
      // The nested iterator refers to `last`, so it has to go first.
      if (it) {
        it->dispose();
        it = 0;
      }

      if (last) {
        allocator->free(last, strlen(last) + 1);
        last = 0;
      }

      // `directory` is 0 when the directory could not be opened.
      if (directory) {
        directory->dispose();
      }

      allocator->free(this, sizeof(*this));
    }

    System* s;
    Alloc* allocator;
    const char* name;             // directory being listed (not owned)
    unsigned skip;                // number of leading characters to drop
    System::Directory* directory; // 0 if the directory could not be opened
    const char* last;             // path returned by the last call (owned)
    Iterator* it;                 // iterator of the current subdirectory
  };

  // Takes ownership of `name`; dispose() releases it.
  DirectoryElement(System* s, Alloc* allocator, const char* name)
      : s(s),
        allocator(allocator),
        originalName(name),
        name(s->toAbsolutePath(allocator, name)),
        urlPrefix_(append(allocator, "file:", this->name, "/")),
        sourceUrl_(append(allocator, "file:", this->name))
  {
  }

  virtual Element::Iterator* iterator()
  {
    // Skip the directory name and the separator that follows it so that
    // reported names are relative to this directory.
    return new (allocator->allocate(sizeof(Iterator)))
        Iterator(s, allocator, name, strlen(name) + 1);
  }

  // Maps the file `name` inside this directory; returns 0 if that fails.
  virtual System::Region* find(const char* name)
  {
    const char* file = append(allocator, this->name, "/", name);
    System::Region* region;
    System::Status status = s->map(&region, file);
    allocator->free(file, strlen(file) + 1);

    if (s->success(status)) {
      if (DebugFind) {
        fprintf(stderr, "found %s in %s\n", name, this->name);
      }
      return region;
    } else {
      if (DebugFind) {
        fprintf(stderr, "%s not found in %s\n", name, this->name);
      }
      return 0;
    }
  }

  // Forwards to the system's stat for `name` inside this directory.  The
  // tryDirectory flag is not used by this element.
  virtual System::FileType stat(const char* name, size_t* length, bool)
  {
    const char* file = append(allocator, this->name, "/", name);
    System::FileType type = s->stat(file, length);
    if (DebugStat) {
      fprintf(stderr, "stat %s in %s: %d\n", name, this->name, type);
    }
    allocator->free(file, strlen(file) + 1);
    return type;
  }

  virtual const char* urlPrefix()
  {
    return urlPrefix_;
  }

  virtual const char* sourceUrl()
  {
    return sourceUrl_;
  }

  virtual void dispose()
  {
    allocator->free(originalName, strlen(originalName) + 1);
    allocator->free(name, strlen(name) + 1);
    allocator->free(urlPrefix_, strlen(urlPrefix_) + 1);
    allocator->free(sourceUrl_, strlen(sourceUrl_) + 1);
    allocator->free(this, sizeof(*this));
  }

  System* s;
  Alloc* allocator;
  const char* originalName;  // name as passed to the constructor
  const char* name;          // result of toAbsolutePath for originalName
  const char* urlPrefix_;    // "file:" + name + "/"
  const char* sourceUrl_;    // "file:" + name
};
// Region describing a range of bytes supplied by the caller.  The bytes are
// released together with the region only when `freePointer` was requested.
class PointerRegion : public System::Region {
 public:
  PointerRegion(System* s,
                Alloc* allocator,
                const uint8_t* start,
                size_t length,
                bool freePointer = false)
      : s(s),
        allocator(allocator),
        start_(start),
        length_(length),
        freePointer(freePointer)
  {
  }

  virtual const uint8_t* start() { return start_; }

  virtual size_t length() { return length_; }

  virtual void dispose()
  {
    // Release the bytes first (if they belong to this region), then the
    // region object itself.
    if (freePointer) {
      allocator->free(start_, length_);
    }
    allocator->free(this, sizeof(*this));
  }

  System* s;
  Alloc* allocator;
  const uint8_t* start_;
  size_t length_;
  bool freePointer;
};
// Region whose bytes live in the same allocation as the object itself:
// whoever creates it must allocate sizeof(DataRegion) + length bytes, and
// dispose() releases exactly that amount.
class DataRegion : public System::Region {
 public:
  DataRegion(System* s, Alloc* allocator, size_t length)
      : s(s), allocator(allocator), length_(length)
  {
  }

  virtual const uint8_t* start() { return data; }

  virtual size_t length() { return length_; }

  virtual void dispose()
  {
    const size_t totalSize = sizeof(*this) + length_;
    allocator->free(this, totalSize);
  }

  System* s;
  Alloc* allocator;
  size_t length_;
  // Payload; it starts right behind the fixed part of the object.
  uint8_t data[0];
};
// Hash index over the central directory entries of a jar archive.  The
// bucket table is stored in the same allocation as the index object (see
// make()), the list nodes in a separate array of `capacity` elements.
class JarIndex {
 public:
  enum CompressionMethod { Stored = 0, Deflated = 8 };

  // Central directory entry together with the hash of its file name.
  class Entry {
   public:
    Entry(uint32_t hash, const uint8_t* entry) : hash(hash), entry(entry)
    {
    }

    uint32_t hash;
    const uint8_t* entry;
  };

  // Use make() instead of calling this directly: the constructor clears
  // `capacity` table slots located behind the object.
  JarIndex(System* s, Alloc* allocator, unsigned capacity)
      : s(s),
        allocator(allocator),
        capacity(capacity),
        position(0),
        nodes(static_cast<List<Entry>*>(
            allocator->allocate(sizeof(List<Entry>) * capacity)))
  {
    memset(table, 0, sizeof(List<Entry>*) * capacity);
  }

  // Allocates an empty index with room for `capacity` entries.
  static JarIndex* make(System* s, Alloc* allocator, unsigned capacity)
  {
    return new (allocator->allocate(sizeof(JarIndex)
                                    + (sizeof(List<Entry>*) * capacity)))
        JarIndex(s, allocator, capacity);
  }

  // Builds an index for the archive held in `region`.  The result is never
  // null; it is empty when no central directory is found.
  static JarIndex* open(System* s, Alloc* allocator, System::Region* region)
  {
    JarIndex* index = make(s, allocator, 32);

    const uint8_t* start = region->start();
    const size_t regionLength = region->length();
    const uint8_t* end = start + regionLength;

    // A region shorter than the search offset cannot be scanned; bail out
    // instead of forming a pointer in front of the region.
    if (regionLength < CentralDirectorySearchStart) {
      return index;
    }

    const uint8_t* p = end - CentralDirectorySearchStart;

    // Find end of central directory record
    while (p > start) {
      if (signature(p) != CentralDirectorySignature) {
        p--;
        continue;
      }

      p = start + centralDirectoryOffset(p);

      while (p < end and signature(p) == EntrySignature) {
        index = index->add(Entry(
            hash(Slice<const uint8_t>(fileName(p), fileNameLength(p))), p));
        p = endOfEntry(p);
      }

      // The directory has been processed.  Stop here even if the entries ran
      // up to (or past) the end of the region: resuming the backwards search
      // from such a position would read outside the region and could find
      // the same record again.
      return index;
    }

    return index;
  }

  // Adds `entry` and returns the index that now contains it.  When this
  // index is full, a new one with twice the capacity is created, all entries
  // are moved over and this index is disposed, so callers must continue with
  // the returned pointer.
  JarIndex* add(const Entry& entry)
  {
    if (position < capacity) {
      // capacity starts at 32 and only ever doubles, so capacity - 1 selects
      // the low bits of the hash.
      unsigned i = entry.hash & (capacity - 1);
      table[i] = new (nodes + (position++)) List<Entry>(entry, table[i]);
      return this;
    } else {
      JarIndex* index = make(s, allocator, capacity * 2);
      for (unsigned i = 0; i < capacity; ++i) {
        index->add(nodes[i].item);
      }
      index->add(entry);
      dispose();
      return index;
    }
  }

  // Returns the node of the entry whose file name equals `name`, or 0.
  List<Entry>* findNode(const char* name)
  {
    size_t length = strlen(name);
    unsigned i = hash(name) & (capacity - 1);
    for (List<Entry>* n = table[i]; n; n = n->next) {
      const uint8_t* p = n->item.entry;
      if (equal(name, length, fileName(p), fileNameLength(p))) {
        return n;
      }
    }
    return 0;
  }

  // Returns the contents of `name`, or 0 if the archive has no such entry.
  // `start` is the beginning of the archive data.  Stored entries are
  // returned as a view into the archive; deflated entries are inflated into
  // a newly allocated region.
  System::Region* find(const char* name, const uint8_t* start)
  {
    List<Entry>* n = findNode(name);
    if (n) {
      const uint8_t* p = n->item.entry;
      switch (compressionMethod(p)) {
      case Stored: {
        return new (allocator->allocate(sizeof(PointerRegion)))
            PointerRegion(s,
                          allocator,
                          fileData(start + localHeaderOffset(p)),
                          compressedSize(p));
      }

      case Deflated: {
        DataRegion* region = new (
            allocator->allocate(sizeof(DataRegion) + uncompressedSize(p)))
            DataRegion(s, allocator, uncompressedSize(p));

        z_stream zStream;
        memset(&zStream, 0, sizeof(z_stream));

        zStream.next_in
            = const_cast<uint8_t*>(fileData(start + localHeaderOffset(p)));
        zStream.avail_in = compressedSize(p);
        zStream.next_out = region->data;
        zStream.avail_out = region->length();

        // -15 means max window size and raw deflate (no zlib wrapper)
        int r = inflateInit2(&zStream, -15);
        expect(s, r == Z_OK);

        r = inflate(&zStream, Z_FINISH);
        expect(s, r == Z_STREAM_END);

        inflateEnd(&zStream);

        return region;
      }

      default:
        abort(s);
      }
    }

    return 0;
  }

  // Reports whether `name` is a file or, if tryDirectory is set, a directory
  // of the archive.  *length receives the uncompressed size for files and 0
  // in every other case.
  System::FileType stat(const char* name, size_t* length, bool tryDirectory)
  {
    List<Entry>* node = findNode(name);
    if (node) {
      *length = uncompressedSize(node->item.entry);
      return System::TypeFile;
    } else if (tryDirectory) {
      *length = 0;

      // try again with '/' appended
      size_t nameLength = strlen(name);
      RUNTIME_ARRAY(char, n, nameLength + 2);
      memcpy(RUNTIME_ARRAY_BODY(n), name, nameLength);
      RUNTIME_ARRAY_BODY(n)[nameLength] = '/';
      RUNTIME_ARRAY_BODY(n)[nameLength + 1] = 0;

      node = findNode(RUNTIME_ARRAY_BODY(n));
      if (node) {
        return System::TypeDirectory;
      } else {
        return System::TypeDoesNotExist;
      }
    } else {
      *length = 0;
      return System::TypeDoesNotExist;
    }
  }

  // Releases the node array and the index (including its table).
  void dispose()
  {
    allocator->free(nodes, sizeof(List<Entry>) * capacity);
    allocator->free(this, sizeof(*this) + (sizeof(List<Entry>*) * capacity));
  }

  System* s;
  Alloc* allocator;
  unsigned capacity;      // number of table slots and of nodes
  unsigned position;      // number of nodes in use
  List<Entry>* nodes;     // entries in insertion order
  List<Entry>* table[0];  // hash buckets, stored behind the object
};
// Search path entry backed by a jar archive, which is either mapped from a
// file on first use or supplied as a block of memory.
class JarElement : public Element {
 public:
  // Enumerates the entry names of an archive in index order.
  class Iterator : public Element::Iterator {
   public:
    Iterator(System* s, Alloc* allocator, JarIndex* index)
        : s(s), allocator(allocator), index(index), position(0)
    {
    }

    // Returns the next entry name and stores its length in *size, or returns
    // 0 when there are no more entries.  The pointer refers to the name
    // inside the archive data, so rely on *size for its length.
    virtual const char* next(size_t* size)
    {
      // `index` is 0 when the element could not be initialized (see
      // JarElement::init); such an element has nothing to enumerate.
      if (index == 0 or position >= index->position) {
        return 0;
      }

      List<JarIndex::Entry>* n = index->nodes + (position++);
      *size = fileNameLength(n->item.entry);
      return reinterpret_cast<const char*>(fileName(n->item.entry));
    }

    virtual void dispose()
    {
      allocator->free(this, sizeof(*this));
    }

    System* s;
    Alloc* allocator;
    JarIndex* index;
    unsigned position;
  };

  // Element for the archive file `name`.  Takes ownership of `name`.  Unless
  // canonicalizePath is false, the path is converted with toAbsolutePath.
  // The file itself is opened lazily by init().
  JarElement(System* s,
             Alloc* allocator,
             const char* name,
             bool canonicalizePath = true)
      : s(s),
        allocator(allocator),
        originalName(name),
        name(name and canonicalizePath ? s->toAbsolutePath(allocator, name)
                                       : name),
        urlPrefix_(this->name ? append(allocator, "jar:file:", this->name, "!/")
                              : 0),
        sourceUrl_(this->name ? append(allocator, "file:", this->name) : 0),
        region(0),
        index(0)
  {
  }

  // Element for an archive that is already in memory.  It has no name, so
  // both URLs are 0.  The data is indexed right away.
  JarElement(System* s,
             Alloc* allocator,
             const uint8_t* jarData,
             unsigned jarLength)
      : s(s),
        allocator(allocator),
        originalName(0),
        name(0),
        urlPrefix_(name ? append(allocator, "jar:file:", name, "!/") : 0),
        sourceUrl_(name ? append(allocator, "file:", name) : 0),
        region(new (allocator->allocate(sizeof(PointerRegion)))
                   PointerRegion(s, allocator, jarData, jarLength)),
        index(JarIndex::open(s, allocator, region))
  {
  }

  virtual Element::Iterator* iterator()
  {
    init();

    return new (allocator->allocate(sizeof(Iterator)))
        Iterator(s, allocator, index);
  }

  // Maps the archive and builds its index if that has not happened yet.
  // `index` stays 0 when the file cannot be mapped.
  virtual void init()
  {
    if (index == 0) {
      System::Region* r;
      if (s->success(s->map(&r, name))) {
        region = r;
        index = JarIndex::open(s, allocator, r);
      }
    }
  }

  // Looks up `name` (leading '/' characters are ignored) in the archive.
  virtual System::Region* find(const char* name)
  {
    init();

    while (*name == '/')
      name++;

    System::Region* r = (index ? index->find(name, region->start()) : 0);
    if (DebugFind) {
      if (r) {
        fprintf(stderr, "found %s in %s\n", name, this->name);
      } else {
        fprintf(stderr, "%s not found in %s\n", name, this->name);
      }
    }
    return r;
  }

  // Stats `name` (leading '/' characters are ignored) in the archive.
  virtual System::FileType stat(const char* name,
                                size_t* length,
                                bool tryDirectory)
  {
    init();

    while (*name == '/')
      name++;

    System::FileType type = (index ? index->stat(name, length, tryDirectory)
                                   : System::TypeDoesNotExist);
    if (DebugStat) {
      fprintf(stderr, "stat %s in %s: %d\n", name, this->name, type);
    }
    return type;
  }

  virtual const char* urlPrefix()
  {
    return urlPrefix_;
  }

  virtual const char* sourceUrl()
  {
    return sourceUrl_;
  }

  virtual void dispose()
  {
    dispose(sizeof(*this));
  }

  // Releases everything owned by the element and then `size` bytes of the
  // object itself; subclasses pass their own size.
  virtual void dispose(unsigned size)
  {
    if (name) {
      // Without canonicalization both pointers refer to the same string.
      if (originalName != name) {
        allocator->free(originalName, strlen(originalName) + 1);
      }
      allocator->free(name, strlen(name) + 1);
      allocator->free(urlPrefix_, strlen(urlPrefix_) + 1);
      allocator->free(sourceUrl_, strlen(sourceUrl_) + 1);
    }
    if (index) {
      index->dispose();
    }
    if (region) {
      region->dispose();
    }
    allocator->free(this, size);
  }

  System* s;
  Alloc* allocator;
  const char* originalName;
  const char* name;
  const char* urlPrefix_;
  const char* sourceUrl_;
  System::Region* region;  // archive data, 0 until it is available
  JarIndex* index;         // 0 until the archive has been indexed
};
class BuiltinElement : public JarElement {
public:
BuiltinElement(System* s,
Alloc* allocator,
const char* name,
const char* libraryName)
: JarElement(s, allocator, name, false),
library(0),
libraryName(libraryName ? copy(allocator, libraryName) : 0)
{
}
virtual void init()
{
if (index == 0) {
if (s->success(s->load(&library, libraryName))) {
bool lzma = strncmp("lzma.", name, 5) == 0;
const char* symbolName = lzma ? name + 5 : name;
void* p = library->resolve(symbolName);
if (p) {
uint8_t* (*function)(size_t*);
memcpy(&function, &p, BytesPerWord);
size_t size = 0;
uint8_t* data = function(&size);
if (data) {
bool freePointer;
if (lzma) {
#ifdef AVIAN_USE_LZMA
size_t outSize;
data = decodeLZMA(s, allocator, data, size, &outSize);
size = outSize;
freePointer = true;
#else
abort(s);
#endif
} else {
freePointer = false;
}
region = new (allocator->allocate(sizeof(PointerRegion)))
PointerRegion(s, allocator, data, size, freePointer);
index = JarIndex::open(s, allocator, region);
} else if (DebugFind) {
fprintf(
stderr, "%s in %s returned null\n", symbolName, libraryName);
}
} else if (DebugFind) {
fprintf(stderr, "unable to find %s in %s\n", symbolName, libraryName);
}
} else if (DebugFind) {
fprintf(stderr, "unable to load %s\n", libraryName);
}
}
}
virtual const char* urlPrefix()
{
return "avianvmresource:";
}
virtual const char* sourceUrl()
{
return 0;
}
virtual void dispose()
{
if (library) {
library->disposeAll();
}
if (libraryName) {
allocator->free(libraryName, strlen(libraryName) + 1);
}
JarElement::dispose(sizeof(*this));
}
System::Library* library;
const char* libraryName;
};
// Appends `e` to the list described by *first (head) and *last (tail).
void add(Element** first, Element** last, Element* e)
{
  Element* tail = *last;
  if (tail == 0) {
    // Empty list: the new element is also the head.
    *first = e;
  } else {
    tail->next = e;
  }
  *last = e;
}
// Returns the offset of the character following the last occurrence of
// `fileSeparator` in `name`, or 0 if `name` does not contain the separator.
unsigned baseName(const char* name, char fileSeparator)
{
  unsigned base = 0;
  for (size_t i = 0; name[i]; ++i) {
    if (name[i] == fileSeparator) {
      base = static_cast<unsigned>(i + 1);
    }
  }
  return base;
}
// Forward declaration: addTokens() below calls this overload, which is
// defined after addJar().  It adds the search path entry called `name`
// (`nameLength` characters long) to the list given by *first / *last.
void add(System* s,
Element** first,
Element** last,
Alloc* allocator,
const char* name,
unsigned nameLength,
const char* bootLibrary);
// Splits `tokens` (`tokensLength` characters) at spaces and adds every token
// as a search path entry.  Each token is prefixed with the first
// `jarNameBase` characters of `jarName` before it is added.
void addTokens(System* s,
               Element** first,
               Element** last,
               Alloc* allocator,
               const char* jarName,
               unsigned jarNameBase,
               const char* tokens,
               unsigned tokensLength,
               const char* bootLibrary)
{
  Tokenizer tokenizer(String(tokens, tokensLength), ' ');

  while (tokenizer.hasMore()) {
    String token(tokenizer.next());

    // Temporary buffer: prefix + token + terminating zero.
    RUNTIME_ARRAY(char, n, jarNameBase + token.length + 1);
    char* path = RUNTIME_ARRAY_BODY(n);

    memcpy(path, jarName, jarNameBase);
    memcpy(path + jarNameBase, token.text, token.length);
    path[jarNameBase + token.length] = 0;

    add(s,
        first,
        last,
        allocator,
        path,
        jarNameBase + token.length,
        bootLibrary);
  }
}
// Reads the line at *start with readLine and returns true only if it is not
// empty and begins with a space.
bool continuationLine(const uint8_t* base,
                      unsigned total,
                      size_t* start,
                      size_t* length)
{
  if (not readLine(base, total, start, length)) {
    return false;
  }

  if (*length == 0) {
    return false;
  }

  return base[*start] == ' ';
}
// Appends a JarElement for the archive `name` to the list given by *first /
// *last.  The archive's META-INF/MANIFEST.MF, if present, is then scanned
// for "Class-Path: " lines, and every entry listed there is added as well,
// prefixed with the directory part of `name`.  `name` is handed over to the
// new JarElement.
void addJar(System* s,
Element** first,
Element** last,
Alloc* allocator,
const char* name,
const char* bootLibrary)
{
if (DebugFind) {
fprintf(stderr, "add jar %s\n", name);
}
JarElement* e = new (allocator->allocate(sizeof(JarElement)))
JarElement(s, allocator, name);
// Length of the directory prefix of `name`, including the separator.
unsigned nameBase = baseName(name, s->fileSeparator());
add(first, last, e);
System::Region* region = e->find("META-INF/MANIFEST.MF");
if (region) {
size_t start = 0;
size_t length;
while (readLine(region->start(), region->length(), &start, &length)) {
// Sum of the lengths of the continuation lines of this line.
unsigned multilineTotal = 0;
// Length of the string "Class-Path: ".
const unsigned PrefixLength = 12;
if (length > PrefixLength
and strncmp("Class-Path: ",
reinterpret_cast<const char*>(region->start() + start),
PrefixLength) == 0) {
{
// First pass: measure the continuation lines so that a buffer of the
// right size can be set up.
size_t nextStart = start + length;
size_t nextLength;
while (continuationLine(
region->start(), region->length(), &nextStart, &nextLength)) {
multilineTotal += nextLength;
nextStart += nextLength;
}
}
// Value of the attribute on its first line, without the prefix.
const char* line = reinterpret_cast<const char*>(region->start() + start
+ PrefixLength);
unsigned lineLength = length - PrefixLength;
if (multilineTotal) {
RUNTIME_ARRAY(char, n, (length - PrefixLength) + multilineTotal + 1);
memcpy(RUNTIME_ARRAY_BODY(n), line, lineLength);
unsigned offset = lineLength;
{
// Second pass: append each continuation line without its leading
// space.
size_t nextStart = start + length;
size_t nextLength;
while (continuationLine(
region->start(), region->length(), &nextStart, &nextLength)) {
unsigned continuationLength = nextLength - 1;
memcpy(RUNTIME_ARRAY_BODY(n) + offset,
region->start() + nextStart + 1,
continuationLength);
offset += continuationLength;
nextStart += nextLength;
}
}
addTokens(s,
first,
last,
allocator,
name,
nameBase,
RUNTIME_ARRAY_BODY(n),
offset,
bootLibrary);
} else {
addTokens(s,
first,
last,
allocator,
name,
nameBase,
line,
lineLength,
bootLibrary);
}
}
// NOTE(review): multilineTotal counts only the characters of the
// continuation lines, not the line terminators between them, so the next
// readLine call presumably starts slightly before the end of the last
// continuation line - confirm against readLine.
start += length + multilineTotal;
}
region->dispose();
}
}
// Adds the search path entry described by `token` (`tokenLength` characters,
// not necessarily zero-terminated) to the list given by *first / *last:
//   - "[name]" becomes a BuiltinElement resolved through `bootLibrary`,
//   - an existing file is added as a jar (see addJar),
//   - an existing directory becomes a DirectoryElement,
//   - anything else is ignored.
void add(System* s,
         Element** first,
         Element** last,
         Alloc* allocator,
         const char* token,
         unsigned tokenLength,
         const char* bootLibrary)
{
  const bool builtin = *token == '[' and token[tokenLength - 1] == ']';

  if (builtin) {
    // Copy the text between the brackets; the allocation holds that text
    // plus the terminating zero.
    const unsigned nameLength = tokenLength - 2;
    char* name = static_cast<char*>(allocator->allocate(nameLength + 1));
    memcpy(name, token + 1, nameLength);
    name[nameLength] = 0;

    if (DebugFind) {
      fprintf(stderr, "add builtin %s\n", name);
    }

    Element* element = new (allocator->allocate(sizeof(BuiltinElement)))
        BuiltinElement(s, allocator, name, bootLibrary);
    add(first, last, element);
    return;
  }

  // Zero-terminated copy of the token; it is handed over to the element
  // created for it, or released right away if no element is created.
  char* name = static_cast<char*>(allocator->allocate(tokenLength + 1));
  memcpy(name, token, tokenLength);
  name[tokenLength] = 0;

  size_t length;
  const System::FileType type = s->stat(name, &length);

  if (type == System::TypeFile) {
    addJar(s, first, last, allocator, name, bootLibrary);
  } else if (type == System::TypeDirectory) {
    if (DebugFind) {
      fprintf(stderr, "add directory %s\n", name);
    }

    Element* element = new (allocator->allocate(sizeof(DirectoryElement)))
        DirectoryElement(s, allocator, name);
    add(first, last, element);
  } else {
    if (DebugFind) {
      fprintf(stderr, "ignore nonexistent %s\n", name);
    }

    allocator->free(name, strlen(name) + 1);
  }
}
// Builds the element list for `path`, whose entries are separated by the
// system's path separator.  Returns the first element, or 0 if no entry was
// added.
Element* parsePath(System* s,
                   Alloc* allocator,
                   const char* path,
                   const char* bootLibrary)
{
  Element* head = 0;
  Element* tail = 0;

  Tokenizer tokenizer(path, s->pathSeparator());
  while (tokenizer.hasMore()) {
    String entry(tokenizer.next());
    add(s, &head, &tail, allocator, entry.text, entry.length, bootLibrary);
  }

  return head;
}
// Iterator over the names of all elements of a search path, one element
// after the other.
class MyIterator : public Finder::IteratorImp {
 public:
  // Starts with the iterator of the first element; `e` always refers to the
  // element whose iterator will be used next.
  MyIterator(System* s, Alloc* allocator, Element* path)
      : s(s),
        allocator(allocator),
        e(path ? path->next : 0),
        it(path ? path->iterator() : 0)
  {
  }

  // Returns the next name and stores its length in *size, or returns 0 once
  // every element has been exhausted.
  virtual const char* next(size_t* size)
  {
    while (it) {
      if (const char* v = it->next(size)) {
        return v;
      }

      // The current element is exhausted; continue with the following one,
      // if there is any.
      it->dispose();
      it = 0;

      if (e) {
        it = e->iterator();
        e = e->next;
      }
    }

    return 0;
  }

  virtual void dispose()
  {
    if (it) {
      it->dispose();
    }
    allocator->free(this, sizeof(*this));
  }

  System* s;
  Alloc* allocator;
  Element* e;
  Element::Iterator* it;
};
class MyFinder : public Finder {
public:
MyFinder(System* system,
Alloc* allocator,
const char* path,
const char* bootLibrary)
: system(system),
allocator(allocator),
path_(parsePath(system, allocator, path, bootLibrary)),
pathString(copy(allocator, path))
{
}
MyFinder(System* system,
Alloc* allocator,
const uint8_t* jarData,
unsigned jarLength)
: system(system),
allocator(allocator),
path_(new (allocator->allocate(sizeof(JarElement)))
JarElement(system, allocator, jarData, jarLength)),
pathString(0)
{
}
virtual IteratorImp* iterator()
{
return new (allocator->allocate(sizeof(MyIterator)))
MyIterator(system, allocator, path_);
}
virtual System::Region* find(const char* name)
{
for (Element* e = path_; e; e = e->next) {
System::Region* r = e->find(name);
if (r) {
return r;
}
}
return 0;
}
virtual System::FileType stat(const char* name,
size_t* length,
bool tryDirectory)
{
for (Element* e = path_; e; e = e->next) {
System::FileType type = e->stat(name, length, tryDirectory);
if (type != System::TypeDoesNotExist) {
return type;
}
}
return System::TypeDoesNotExist;
}
virtual const char* urlPrefix(const char* name)
{
void* finderElementPtr = NULL;
return nextUrlPrefix(name, finderElementPtr);
}
virtual const char* nextUrlPrefix(const char* name, void*& finderElementPtr)
{
Element*& e = reinterpret_cast<Element*&>(finderElementPtr);
e = e ? e->next : path_;
for (; e; e = e->next) {
size_t length;
System::FileType type = e->stat(name, &length, true);
if (type != System::TypeDoesNotExist) {
return e->urlPrefix();
}
}
return 0;
}
virtual const char* sourceUrl(const char* name)
{
for (Element* e = path_; e; e = e->next) {
size_t length;
System::FileType type = e->stat(name, &length, true);
if (type != System::TypeDoesNotExist) {
return e->sourceUrl();
}
}
return 0;
}
virtual const char* path()
{
return pathString;
}
virtual void dispose()
{
for (Element* e = path_; e;) {
Element* t = e;
e = e->next;
t->dispose();
}
if (pathString) {
allocator->free(pathString, strlen(pathString) + 1);
}
allocator->free(this, sizeof(*this));
}
System* system;
Alloc* allocator;
Element* path_;
const char* pathString;
};
} // namespace
namespace vm {
// Creates a finder for the search path `path`, using allocator `a` for all
// of its storage.
AVIAN_EXPORT Finder* makeFinder(System* s,
                                Alloc* a,
                                const char* path,
                                const char* bootLibrary)
{
  void* memory = a->allocate(sizeof(MyFinder));
  return new (memory) MyFinder(s, a, path, bootLibrary);
}
// Creates a finder for a single jar archive held in memory, using allocator
// `a` for all of its storage.
Finder* makeFinder(System* s,
                   Alloc* a,
                   const uint8_t* jarData,
                   size_t jarLength)
{
  void* memory = a->allocate(sizeof(MyFinder));
  return new (memory) MyFinder(s, a, jarData, jarLength);
}
} // namespace vm