corda/src/finder.cpp

815 lines
20 KiB
C++
Raw Normal View History

2010-12-06 03:21:09 +00:00
/* Copyright (c) 2008-2010, Avian Contributors
Permission to use, copy, modify, and/or distribute this software
for any purpose with or without fee is hereby granted, provided
that the above copyright notice and this permission notice appear
in all copies.
There is NO WARRANTY for this software. See license.txt for
details. */
#include "zlib-custom.h"
#include "system.h"
#include "tokenizer.h"
#include "finder.h"
using namespace vm;
namespace {
2010-09-14 02:38:55 +00:00
const bool DebugFind = false;
const char*
append(Allocator* allocator, const char* a, const char* b, const char* c)
{
unsigned al = strlen(a);
unsigned bl = strlen(b);
unsigned cl = strlen(c);
char* p = static_cast<char*>(allocator->allocate((al + bl + cl) + 1));
memcpy(p, a, al);
memcpy(p + al, b, bl);
memcpy(p + al + bl, c, cl + 1);
return p;
}
const char*
copy(Allocator* allocator, const char* a)
{
unsigned al = strlen(a);
char* p = static_cast<char*>(allocator->allocate(al + 1));
memcpy(p, a, al + 1);
return p;
}
2007-09-17 00:13:36 +00:00
bool
equal(const void* a, unsigned al, const void* b, unsigned bl)
{
if (al == bl) {
return memcmp(a, b, al) == 0;
} else {
return false;
}
}
class Element {
public:
class Iterator {
public:
virtual const char* next(unsigned* size) = 0;
virtual void dispose() = 0;
};
2007-09-17 00:13:36 +00:00
Element(): next(0) { }
virtual Iterator* iterator() = 0;
2007-09-17 00:13:36 +00:00
virtual System::Region* find(const char* name) = 0;
virtual System::FileType stat(const char* name, unsigned* length,
bool tryDirectory) = 0;
2007-09-17 00:13:36 +00:00
virtual void dispose() = 0;
Element* next;
};
class DirectoryElement: public Element {
public:
class Iterator: public Element::Iterator {
public:
Iterator(System* s, Allocator* allocator, const char* name, unsigned skip):
s(s), allocator(allocator), name(name), skip(skip), directory(0),
last(0), it(0)
{
if (not s->success(s->open(&directory, name))) {
directory = 0;
}
}
virtual const char* next(unsigned* size) {
2008-11-28 04:44:04 +00:00
if (it) {
const char* v = it->next(size);
if (v) {
return v;
} else {
it->dispose();
it = 0;
}
}
if (last) {
allocator->free(last, strlen(last) + 1);
2008-11-28 04:44:04 +00:00
}
if (directory) {
for (const char* v = directory->next(); v; v = directory->next()) {
if (v[0] != '.') {
last = append(allocator, name, "/", v);
unsigned length;
if (s->stat(last, &length) == System::TypeDirectory) {
it = new (allocator->allocate(sizeof(Iterator)))
Iterator(s, allocator, last, skip);
2008-11-28 04:44:04 +00:00
it->name = last;
}
const char* result = last + skip;
*size = strlen(result);
return result;
}
}
}
2008-11-28 04:44:04 +00:00
return 0;
}
virtual void dispose() {
directory->dispose();
allocator->free(this, sizeof(*this));
}
System* s;
Allocator* allocator;
2008-11-28 04:44:04 +00:00
const char* name;
unsigned skip;
System::Directory* directory;
2008-11-28 04:44:04 +00:00
const char* last;
Iterator* it;
};
DirectoryElement(System* s, Allocator* allocator, const char* name):
s(s), allocator(allocator), name(name)
2007-09-17 00:13:36 +00:00
{ }
virtual Element::Iterator* iterator() {
return new (allocator->allocate(sizeof(Iterator)))
Iterator(s, allocator, name, strlen(name) + 1);
}
2007-09-17 00:13:36 +00:00
virtual System::Region* find(const char* name) {
const char* file = append(allocator, this->name, "/", name);
2007-09-17 00:13:36 +00:00
System::Region* region;
System::Status status = s->map(&region, file);
allocator->free(file, strlen(file) + 1);
2007-09-17 00:13:36 +00:00
if (s->success(status)) {
2010-09-14 02:38:55 +00:00
if (DebugFind) {
fprintf(stderr, "found %s in %s\n", name, this->name);
}
2007-09-17 00:13:36 +00:00
return region;
} else {
if (DebugFind) {
fprintf(stderr, "%s not found in %s\n", name, this->name);
}
2007-09-17 00:13:36 +00:00
return 0;
}
}
virtual System::FileType stat(const char* name, unsigned* length, bool) {
const char* file = append(allocator, this->name, "/", name);
System::FileType type = s->stat(file, length);
allocator->free(file, strlen(file) + 1);
return type;
2007-09-17 00:13:36 +00:00
}
virtual void dispose() {
allocator->free(name, strlen(name) + 1);
allocator->free(this, sizeof(*this));
2007-09-17 00:13:36 +00:00
}
System* s;
Allocator* allocator;
2007-09-17 00:13:36 +00:00
const char* name;
};
class PointerRegion: public System::Region {
public:
PointerRegion(System* s, Allocator* allocator, const uint8_t* start,
size_t length):
2007-09-17 00:13:36 +00:00
s(s),
allocator(allocator),
2007-09-17 00:13:36 +00:00
start_(start),
length_(length)
{ }
virtual const uint8_t* start() {
return start_;
}
virtual size_t length() {
return length_;
}
virtual void dispose() {
allocator->free(this, sizeof(*this));
2007-09-17 00:13:36 +00:00
}
System* s;
Allocator* allocator;
2007-09-17 00:13:36 +00:00
const uint8_t* start_;
size_t length_;
};
class DataRegion: public System::Region {
public:
DataRegion(System* s, Allocator* allocator, size_t length):
2007-09-17 00:13:36 +00:00
s(s),
allocator(allocator),
2007-09-17 00:13:36 +00:00
length_(length)
{ }
virtual const uint8_t* start() {
return data;
}
virtual size_t length() {
return length_;
}
virtual void dispose() {
allocator->free(this, sizeof(*this) + length_);
2007-09-17 00:13:36 +00:00
}
System* s;
Allocator* allocator;
2007-09-17 00:13:36 +00:00
size_t length_;
uint8_t data[0];
};
class JarIndex {
public:
static const unsigned LocalHeaderSize = 30;
static const unsigned HeaderSize = 46;
2007-09-17 00:13:36 +00:00
enum CompressionMethod {
Stored = 0,
Deflated = 8
};
class Node {
public:
Node(uint32_t hash, const uint8_t* entry, Node* next):
hash(hash), entry(entry), next(next)
{ }
uint32_t hash;
const uint8_t* entry;
Node* next;
};
JarIndex(System* s, Allocator* allocator, unsigned capacity):
2007-09-17 00:13:36 +00:00
s(s),
allocator(allocator),
2007-09-17 00:13:36 +00:00
capacity(capacity),
position(0),
nodes(static_cast<Node*>(allocator->allocate(sizeof(Node) * capacity)))
2007-09-17 00:13:36 +00:00
{
memset(table, 0, sizeof(Node*) * capacity);
}
static uint16_t get2(const uint8_t* p) {
return
(static_cast<uint16_t>(p[1]) << 8) |
(static_cast<uint16_t>(p[0]) );
}
static uint32_t get4(const uint8_t* p) {
return
(static_cast<uint32_t>(p[3]) << 24) |
(static_cast<uint32_t>(p[2]) << 16) |
(static_cast<uint32_t>(p[1]) << 8) |
(static_cast<uint32_t>(p[0]) );
}
static uint32_t signature(const uint8_t* p) {
return get4(p);
}
static uint16_t compressionMethod(const uint8_t* centralHeader) {
return get2(centralHeader + 10);
2007-09-17 00:13:36 +00:00
}
static uint32_t compressedSize(const uint8_t* centralHeader) {
return get4(centralHeader + 20);
2007-09-17 00:13:36 +00:00
}
static uint32_t uncompressedSize(const uint8_t* centralHeader) {
return get4(centralHeader + 24);
2007-09-17 00:13:36 +00:00
}
static uint16_t fileNameLength(const uint8_t* centralHeader) {
return get2(centralHeader + 28);
2007-09-17 00:13:36 +00:00
}
static uint16_t extraFieldLength(const uint8_t* centralHeader) {
return get2(centralHeader + 30);
2007-09-17 00:13:36 +00:00
}
static uint16_t commentFieldLength(const uint8_t* centralHeader) {
return get2(centralHeader + 32);
2007-09-17 00:13:36 +00:00
}
static uint32_t localHeaderOffset(const uint8_t* centralHeader) {
return get4(centralHeader + 42);
}
static uint16_t localFileNameLength(const uint8_t* localHeader) {
return get2(localHeader + 26);
}
static uint16_t localExtraFieldLength(const uint8_t* localHeader) {
return get2(localHeader + 28);
}
static uint32_t centralDirectoryOffset(const uint8_t* centralHeader) {
return get4(centralHeader + 16);
}
static const uint8_t* fileName(const uint8_t* centralHeader) {
return centralHeader + 46;
}
static const uint8_t* fileData(const uint8_t* localHeader) {
return localHeader + LocalHeaderSize + localFileNameLength(localHeader) +
localExtraFieldLength(localHeader);
}
static const uint8_t* endOfEntry(const uint8_t* p) {
return p + HeaderSize + fileNameLength(p) + extraFieldLength(p) +
commentFieldLength(p);
}
static JarIndex* make(System* s, Allocator* allocator, unsigned capacity) {
2007-09-17 00:13:36 +00:00
return new
(allocator->allocate(sizeof(JarIndex) + (sizeof(Node*) * capacity)))
JarIndex(s, allocator, capacity);
2007-09-17 00:13:36 +00:00
}
static JarIndex* open(System* s, Allocator* allocator,
System::Region* region)
{
JarIndex* index = make(s, allocator, 32);
2007-09-17 00:13:36 +00:00
const uint8_t* start = region->start();
const uint8_t* end = start + region->length();
const uint8_t* p = end - 22;
// Find end of central directory record
while (p > start) {
if (signature(p) == 0x06054b50) {
p = region->start() + centralDirectoryOffset(p);
while (p < end) {
if (signature(p) == 0x02014b50) {
index = index->add(hash(fileName(p), fileNameLength(p)), p);
p = endOfEntry(p);
} else {
return index;
}
}
2007-09-17 00:13:36 +00:00
} else {
p--;
2007-09-17 00:13:36 +00:00
}
}
return index;
}
JarIndex* add(uint32_t hash, const uint8_t* entry) {
if (position < capacity) {
unsigned i = hash & (capacity - 1);
table[i] = new (nodes + (position++)) Node(hash, entry, table[i]);
return this;
} else {
JarIndex* index = make(s, allocator, capacity * 2);
2007-09-17 00:13:36 +00:00
for (unsigned i = 0; i < capacity; ++i) {
index->add(nodes[i].hash, nodes[i].entry);
}
index->add(hash, entry);
dispose();
return index;
}
}
Node* findNode(const char* name) {
unsigned length = strlen(name);
unsigned i = hash(name) & (capacity - 1);
for (Node* n = table[i]; n; n = n->next) {
const uint8_t* p = n->entry;
if (equal(name, length, fileName(p), fileNameLength(p))) {
return n;
}
}
return 0;
}
System::Region* find(const char* name, const uint8_t* start) {
2007-09-17 00:13:36 +00:00
Node* n = findNode(name);
if (n) {
const uint8_t* p = n->entry;
switch (compressionMethod(p)) {
case Stored: {
return new (allocator->allocate(sizeof(PointerRegion)))
PointerRegion(s, allocator, fileData(start + localHeaderOffset(p)),
compressedSize(p));
2007-09-17 00:13:36 +00:00
} break;
case Deflated: {
DataRegion* region = new
(allocator->allocate(sizeof(DataRegion) + uncompressedSize(p)))
DataRegion(s, allocator, uncompressedSize(p));
2007-09-17 00:13:36 +00:00
z_stream zStream; memset(&zStream, 0, sizeof(z_stream));
zStream.next_in = const_cast<uint8_t*>(fileData(start +
localHeaderOffset(p)));
zStream.avail_in = compressedSize(p);
zStream.next_out = region->data;
zStream.avail_out = region->length();
// -15 means max window size and raw deflate (no zlib wrapper)
int r = inflateInit2(&zStream, -15);
expect(s, r == Z_OK);
r = inflate(&zStream, Z_FINISH);
expect(s, r == Z_STREAM_END);
inflateEnd(&zStream);
return region;
2007-09-17 00:13:36 +00:00
} break;
default:
abort(s);
}
}
2007-09-17 00:13:36 +00:00
return 0;
}
System::FileType stat(const char* name, unsigned* length, bool tryDirectory)
{
Node* node = findNode(name);
if (node) {
*length = uncompressedSize(node->entry);
return System::TypeFile;
} else if (tryDirectory) {
*length = 0;
// try again with '/' appended
unsigned length = strlen(name);
RUNTIME_ARRAY(char, n, length + 2);
memcpy(RUNTIME_ARRAY_BODY(n), name, length);
RUNTIME_ARRAY_BODY(n)[length] = '/';
RUNTIME_ARRAY_BODY(n)[length + 1] = 0;
2011-01-21 23:14:21 +00:00
node = findNode(RUNTIME_ARRAY_BODY(n));
if (node) {
return System::TypeDirectory;
} else {
return System::TypeDoesNotExist;
}
} else {
*length = 0;
return System::TypeDoesNotExist;
}
2007-09-17 00:13:36 +00:00
}
void dispose() {
allocator->free(nodes, sizeof(Node) * capacity);
allocator->free(this, sizeof(*this) + (sizeof(Node*) * capacity));
2007-09-17 00:13:36 +00:00
}
System* s;
Allocator* allocator;
2007-09-17 00:13:36 +00:00
unsigned capacity;
unsigned position;
2007-09-17 00:13:36 +00:00
Node* nodes;
Node* table[0];
};
class JarElement: public Element {
public:
class Iterator: public Element::Iterator {
public:
Iterator(System* s, Allocator* allocator, JarIndex* index):
s(s), allocator(allocator), index(index), position(0)
{ }
virtual const char* next(unsigned* size) {
if (position < index->position) {
JarIndex::Node* n = index->nodes + (position++);
*size = JarIndex::fileNameLength(n->entry);
return reinterpret_cast<const char*>(JarIndex::fileName(n->entry));
} else {
return 0;
}
}
virtual void dispose() {
allocator->free(this, sizeof(*this));
}
System* s;
Allocator* allocator;
JarIndex* index;
unsigned position;
};
JarElement(System* s, Allocator* allocator, const char* name):
s(s), allocator(allocator), name(name), region(0), index(0)
{ }
JarElement(System* s, Allocator* allocator, const uint8_t* jarData,
unsigned jarLength):
s(s),
allocator(allocator),
name(0),
region(new (allocator->allocate(sizeof(PointerRegion)))
PointerRegion(s, allocator, jarData, jarLength)),
index(JarIndex::open(s, allocator, region))
2007-09-17 00:13:36 +00:00
{ }
virtual Element::Iterator* iterator() {
2008-11-28 04:44:04 +00:00
init();
return new (allocator->allocate(sizeof(Iterator)))
Iterator(s, allocator, index);
}
virtual void init() {
2007-09-17 00:13:36 +00:00
if (index == 0) {
System::Region* r;
if (s->success(s->map(&r, name))) {
2007-09-17 00:13:36 +00:00
region = r;
index = JarIndex::open(s, allocator, r);
2007-09-17 00:13:36 +00:00
}
}
}
virtual System::Region* find(const char* name) {
init();
while (*name == '/') name++;
2010-09-14 02:38:55 +00:00
System::Region* r = (index ? index->find(name, region->start()) : 0);
if (DebugFind) {
if (r) {
fprintf(stderr, "found %s in %s\n", name, this->name);
} else {
fprintf(stderr, "%s not found in %s\n", name, this->name);
}
2010-09-14 02:38:55 +00:00
}
return r;
2007-09-17 00:13:36 +00:00
}
virtual System::FileType stat(const char* name, unsigned* length,
bool tryDirectory)
{
2007-09-17 00:13:36 +00:00
init();
while (*name == '/') name++;
return (index ? index->stat(name, length, tryDirectory)
: System::TypeDoesNotExist);
2007-09-17 00:13:36 +00:00
}
virtual void dispose() {
dispose(sizeof(*this));
}
virtual void dispose(unsigned size) {
allocator->free(name, strlen(name) + 1);
2007-09-17 00:13:36 +00:00
if (index) {
index->dispose();
}
if (region) {
2007-09-17 00:13:36 +00:00
region->dispose();
}
allocator->free(this, size);
2007-09-17 00:13:36 +00:00
}
System* s;
Allocator* allocator;
2007-09-17 00:13:36 +00:00
const char* name;
System::Region* region;
JarIndex* index;
};
class BuiltinElement: public JarElement {
public:
BuiltinElement(System* s, Allocator* allocator, const char* name,
const char* libraryName):
JarElement(s, allocator, name),
libraryName(libraryName ? copy(allocator, libraryName) : 0)
{ }
virtual void init() {
if (index == 0) {
if (s->success(s->load(&library, libraryName))) {
void* p = library->resolve(name);
if (p) {
uint8_t* (*function)(unsigned*);
memcpy(&function, &p, BytesPerWord);
unsigned size;
uint8_t* data = function(&size);
if (data) {
region = new (allocator->allocate(sizeof(PointerRegion)))
PointerRegion(s, allocator, data, size);
index = JarIndex::open(s, allocator, region);
}
}
}
}
}
virtual void dispose() {
library->disposeAll();
if (libraryName) {
allocator->free(libraryName, strlen(libraryName) + 1);
}
JarElement::dispose(sizeof(*this));
}
System::Library* library;
const char* libraryName;
};
2007-09-17 00:13:36 +00:00
Element*
parsePath(System* s, Allocator* allocator, const char* path,
const char* bootLibrary)
{
2007-09-17 00:13:36 +00:00
Element* first = 0;
Element* prev = 0;
for (Tokenizer t(path, s->pathSeparator()); t.hasMore();) {
Tokenizer::Token token(t.next());
2007-09-17 00:13:36 +00:00
Element* e;
if (*token.s == '[' and token.s[token.length - 1] == ']') {
char* name = static_cast<char*>(allocator->allocate(token.length - 1));
memcpy(name, token.s + 1, token.length - 1);
name[token.length - 2] = 0;
e = new (allocator->allocate(sizeof(BuiltinElement)))
BuiltinElement(s, allocator, name, bootLibrary);
} else {
char* name = static_cast<char*>(allocator->allocate(token.length + 1));
memcpy(name, token.s, token.length);
name[token.length] = 0;
unsigned length;
switch (s->stat(name, &length)) {
case System::TypeFile: {
e = new (allocator->allocate(sizeof(JarElement)))
JarElement(s, allocator, name);
} break;
case System::TypeDirectory: {
e = new (allocator->allocate(sizeof(DirectoryElement)))
DirectoryElement(s, allocator, name);
} break;
default: {
allocator->free(name, strlen(name) + 1);
e = 0;
} break;
}
2007-09-17 00:13:36 +00:00
}
if (DebugFind) {
fprintf(stderr, "add element %.*s %p\n", token.length, token.s, e);
}
2007-09-17 00:13:36 +00:00
if (e) {
if (prev) {
prev->next = e;
} else {
first = e;
}
prev = e;
}
}
2007-09-17 00:13:36 +00:00
return first;
}
class MyIterator: public Finder::IteratorImp {
public:
MyIterator(System* s, Allocator* allocator, Element* path):
s(s), allocator(allocator), e(path ? path->next : 0),
it(path ? path->iterator() : 0)
{ }
virtual const char* next(unsigned* size) {
while (it) {
const char* v = it->next(size);
if (v) {
return v;
} else {
it->dispose();
if (e) {
it = e->iterator();
e = e->next;
2008-11-28 04:44:04 +00:00
} else {
it = 0;
}
}
}
return 0;
}
virtual void dispose() {
if (it) it->dispose();
allocator->free(this, sizeof(*this));
}
System* s;
Allocator* allocator;
Element* e;
Element::Iterator* it;
};
class MyFinder: public Finder {
public:
MyFinder(System* system, Allocator* allocator, const char* path,
const char* bootLibrary):
system(system),
allocator(allocator),
path_(parsePath(system, allocator, path, bootLibrary)),
pathString(copy(allocator, path))
{ }
MyFinder(System* system, Allocator* allocator, const uint8_t* jarData,
unsigned jarLength):
system(system),
allocator(allocator),
path_(new (allocator->allocate(sizeof(JarElement)))
JarElement(system, allocator, jarData, jarLength)),
pathString(0)
{ }
virtual IteratorImp* iterator() {
return new (allocator->allocate(sizeof(MyIterator)))
MyIterator(system, allocator, path_);
}
2007-09-17 00:13:36 +00:00
virtual System::Region* find(const char* name) {
for (Element* e = path_; e; e = e->next) {
System::Region* r = e->find(name);
if (r) {
return r;
}
}
return 0;
}
virtual System::FileType stat(const char* name, unsigned* length,
bool tryDirectory)
{
2007-09-17 00:13:36 +00:00
for (Element* e = path_; e; e = e->next) {
System::FileType type = e->stat(name, length, tryDirectory);
if (type != System::TypeDoesNotExist) {
return type;
}
}
return System::TypeDoesNotExist;
}
virtual const char* path() {
return pathString;
}
virtual void dispose() {
2007-09-17 00:13:36 +00:00
for (Element* e = path_; e;) {
Element* t = e;
e = e->next;
t->dispose();
}
allocator->free(pathString, strlen(pathString) + 1);
allocator->free(this, sizeof(*this));
}
System* system;
Allocator* allocator;
2007-09-17 00:13:36 +00:00
Element* path_;
const char* pathString;
};
} // namespace
namespace vm {
Finder*
makeFinder(System* s, Allocator* a, const char* path, const char* bootLibrary)
{
return new (a->allocate(sizeof(MyFinder))) MyFinder(s, a, path, bootLibrary);
}
Finder*
makeFinder(System* s, Allocator* a, const uint8_t* jarData, unsigned jarLength)
{
return new (a->allocate(sizeof(MyFinder)))
MyFinder(s, a, jarData, jarLength);
}
} // namespace vm