tippecanoe/geojson.c

631 lines
15 KiB
C
Raw Normal View History

2014-09-15 22:02:33 +00:00
#include <stdio.h>
#include <stdlib.h>
#include <math.h>
#include <string.h>
#include <unistd.h>
#include <sys/stat.h>
#include <sys/types.h>
#include <sys/mman.h>
#include <string.h>
#include <fcntl.h>
#include <ctype.h>
2014-09-15 22:27:35 +00:00
#include <errno.h>
#include <limits.h>
2014-09-15 22:18:08 +00:00
#include "jsonpull.h"
2014-09-22 23:06:44 +00:00
#include "tile.h"
2014-09-15 22:18:08 +00:00
/* Highest zoom level handled by this file; tiles are produced from here down to 0. */
#define BASE_ZOOM 14

/*
 * GeoJSON geometry kinds, used as indices into the lookup tables in this file.
 * Each comment gives the nesting of the geometry's "coordinates" member,
 * where a position is one [longitude, latitude] array.
 */
#define GEOM_POINT 0           /* a single position */
#define GEOM_MULTIPOINT 1      /* array of positions */
#define GEOM_LINESTRING 2      /* array of positions */
#define GEOM_MULTILINESTRING 3 /* array of arrays of positions */
#define GEOM_POLYGON 4         /* array of arrays of positions (rings) */
#define GEOM_MULTIPOLYGON 5    /* array of arrays of arrays of positions */

/* Number of GEOM_* kinds, i.e. the length of every per-kind table. */
#define GEOM_TYPES 6

/* The GeoJSON "type" string for each GEOM_* kind. */
char *geometry_names[GEOM_TYPES] = {
	[GEOM_POINT] = "Point",
	[GEOM_MULTIPOINT] = "MultiPoint",
	[GEOM_LINESTRING] = "LineString",
	[GEOM_MULTILINESTRING] = "MultiLineString",
	[GEOM_POLYGON] = "Polygon",
	[GEOM_MULTIPOLYGON] = "MultiPolygon",
};
2014-09-15 23:32:06 +00:00
int geometry_within[GEOM_TYPES] = {
-1, /* point */
GEOM_POINT, /* multipoint */
GEOM_POINT, /* linestring */
GEOM_LINESTRING, /* multilinestring */
GEOM_LINESTRING, /* polygon */
GEOM_POLYGON, /* multipolygon */
2014-09-15 22:02:33 +00:00
};
2014-09-16 00:33:54 +00:00
int mb_geometry[GEOM_TYPES] = {
2014-09-16 21:11:50 +00:00
VT_POINT,
VT_POINT,
VT_LINE,
VT_LINE,
VT_POLYGON,
VT_POLYGON,
2014-09-16 00:33:54 +00:00
};
// http://wiki.openstreetmap.org/wiki/Slippy_map_tilenames
void latlon2tile(double lat, double lon, int zoom, unsigned int *x, unsigned int *y) {
double lat_rad = lat * M_PI / 180;
unsigned long long n = 1LL << zoom;
*x = n * ((lon + 180) / 360);
*y = n * (1 - (log(tan(lat_rad) + 1/cos(lat_rad)) / M_PI)) / 2;
}
// http://wiki.openstreetmap.org/wiki/Slippy_map_tilenames
void tile2latlon(unsigned int x, unsigned int y, int zoom, double *lat, double *lon) {
unsigned long long n = 1LL << zoom;
*lon = 360.0 * x / n - 180.0;
float lat_rad = atan(sinh(M_PI * (1 - 2.0 * y / n)));
*lat = lat_rad * 180 / M_PI;
}
/*
 * Interleave the bits of wx and wy into a single 64-bit key: bit k of wx
 * becomes bit 2k+1 of the result and bit k of wy becomes bit 2k, so the most
 * significant bits of both coordinates end up at the top of the key.
 *
 * All arithmetic is unsigned; shifting a signed value into the sign bit, as
 * happens for the top bit of wx, would be undefined behavior.
 */
unsigned long long encode(unsigned int wx, unsigned int wy) {
	unsigned long long out = 0;
	int bit;

	for (bit = 31; bit >= 0; bit--) {
		unsigned long long pair = ((unsigned long long) ((wx >> bit) & 1) << 1) | ((wy >> bit) & 1);
		out |= pair << (2 * bit);
	}

	return out;
}
/*
 * Split a 64-bit interleaved key back into its two 32-bit coordinates:
 * odd-numbered bits of index go to *wx and even-numbered bits to *wy, with
 * bits 2k+1 and 2k both landing at position k.
 */
void decode(unsigned long long index, unsigned *wx, unsigned *wy) {
	int bit;

	*wx = 0;
	*wy = 0;

	for (bit = 31; bit >= 0; bit--) {
		unsigned long long pair = index >> (2 * bit);
		*wx |= ((pair >> 1) & 1) << bit;
		*wy |= (pair & 1) << bit;
	}
}
// http://www.tbray.org/ongoing/When/200x/2003/03/22/Binary
/*
 * Binary search over a sorted array of nel elements, each width bytes wide.
 * cmp is called as cmp(element, key). Returns a pointer to the last element
 * that does not compare greater than key, or to the first element of the
 * array when every element compares greater (or the array is empty).
 */
void *search(const void *key, const void *base, size_t nel, size_t width,
	     int (*cmp)(const void *, const void *)) {
	char *elems = (char *) base;
	long long lo = -1;
	long long hi = nel;

	/* Invariant: everything at or below lo is <= key, everything at or above hi is > key. */
	while (hi - lo > 1) {
		long long mid = (lo + hi) >> 1;

		if (cmp(elems + mid * width, key) > 0) {
			hi = mid;
		} else {
			lo = mid;
		}
	}

	return elems + (lo < 0 ? 0 : lo) * width;
}
2014-09-17 22:48:29 +00:00
/*
 * qsort/search comparator for struct index: orders entries by their index
 * field and returns -1, 0 or 1.
 */
int indexcmp(const void *v1, const void *v2) {
	const struct index *lhs = v1;
	const struct index *rhs = v2;

	return (lhs->index > rhs->index) - (lhs->index < rhs->index);
}
2014-09-22 19:22:58 +00:00
/*
 * Look up the (string, type) pair in pool p, adding it if it is not there.
 *
 * Entries are kept in a binary tree rooted at p->vals, ordered by string and
 * then by type, and are also chained in insertion order from p->head to
 * p->tail. A new entry is numbered with the next value of p->n. The string is
 * stored by pointer, not copied, so s must outlive the pool.
 *
 * Returns the existing or newly created entry. Exits the program if memory
 * for a new entry cannot be allocated.
 */
struct pool_val *pool(struct pool *p, char *s, int type) {
	struct pool_val **v = &(p->vals);

	while (*v != NULL) {
		int cmp = strcmp(s, (*v)->s);

		if (cmp == 0) {
			cmp = type - (*v)->type;
		}

		if (cmp == 0) {
			return *v;
		} else if (cmp < 0) {
			v = &((*v)->left);
		} else {
			v = &((*v)->right);
		}
	}

	struct pool_val *nv = malloc(sizeof *nv);
	if (nv == NULL) {
		perror("malloc");
		exit(EXIT_FAILURE);
	}

	nv->left = NULL;
	nv->right = NULL;
	nv->next = NULL;
	nv->s = s;
	nv->type = type;
	nv->n = p->n++;

	/* Link into the tree at the empty slot the search ended on. */
	*v = nv;

	/* Append to the insertion-order list. */
	if (p->tail != NULL) {
		p->tail->next = nv;
	}
	p->tail = nv;
	if (p->head == NULL) {
		p->head = nv;
	}

	return nv;
}
void pool_free(struct pool *p) {
while (p->head != NULL) {
struct pool_val *next = p->head->next;
free(p->head);
p->head = next;
2014-09-22 19:22:58 +00:00
}
p->head = NULL;
p->tail = NULL;
p->vals = NULL;
2014-09-22 19:22:58 +00:00
}
/*
 * fwrite() wrapper that treats a short write as fatal: prints a message to
 * stderr and exits. On success returns the number of items written, which is
 * always nitems.
 */
size_t fwrite_check(const void *ptr, size_t size, size_t nitems, FILE *stream) {
	size_t written = fwrite(ptr, size, nitems, stream);

	if (written == nitems) {
		return written;
	}

	fprintf(stderr, "Write failed\n");
	exit(EXIT_FAILURE);
}
/* Write n to out in native binary form and advance *fpos by its size. */
void serialize_int(FILE *out, int n, long long *fpos) {
	fwrite_check(&n, sizeof n, 1, out);
	*fpos += sizeof n;
}
/* Write the unsigned value n to out in native binary form and advance *fpos by its size. */
void serialize_uint(FILE *out, unsigned n, long long *fpos) {
	fwrite_check(&n, sizeof n, 1, out);
	*fpos += sizeof n;
}
/*
 * Write string s to out as an int byte count (which includes the terminating
 * NUL) followed by the bytes of s and the NUL itself. *fpos is advanced past
 * both the count and the bytes.
 */
void serialize_string(FILE *out, char *s, long long *fpos) {
	int len = strlen(s);
	int stored = len + 1;

	serialize_int(out, stored, fpos);

	/* s already ends in a NUL, so the string and its terminator go out together. */
	fwrite_check(s, sizeof(char), stored, out);
	*fpos += stored;
}
/*
 * Recursively serialize the coordinates of a GeoJSON geometry.
 *
 *   t     GEOM_* kind that j is expected to hold
 *   j     the JSON array of coordinates for that kind
 *   bbox  if not NULL, {minx, miny, maxx, maxy} in zoom-32 tile units,
 *         widened to include every position written
 *   fpos  running byte offset in out, advanced by everything written
 *   out   destination stream
 *   op    drawing operation to emit if j turns out to be a single position
 *
 * Each position is written as the operation (int) followed by its x and y
 * (unsigned) at zoom 32. Within a list of positions the first is a VT_MOVETO
 * and the rest are VT_LINETO, except in a MultiPoint, where every position is
 * a VT_MOVETO. A VT_CLOSEPATH is written after each polygon.
 *
 * Malformed input is reported on stderr and skipped.
 */
void parse_geometry(int t, json_object *j, unsigned *bbox, long long *fpos, FILE *out, int op) {
	if (j == NULL || j->type != JSON_ARRAY) {
		fprintf(stderr, "expected array for type %d\n", t);
		return;
	}

	int within = geometry_within[t];
	if (within >= 0) {
		int i;
		for (i = 0; i < j->length; i++) {
			if (within == GEOM_POINT) {
				/*
				 * Decide on the GeoJSON kind itself: mb_geometry[] holds VT_*
				 * values, which are not comparable with GEOM_* constants.
				 */
				if (i == 0 || t == GEOM_MULTIPOINT) {
					op = VT_MOVETO;
				} else {
					op = VT_LINETO;
				}
			}

			parse_geometry(within, j->array[i], bbox, fpos, out, op);
		}
	} else {
		/* A position has at least two numbers; any further ones (e.g. altitude) are ignored. */
		if (j->length >= 2 && j->array[0] != NULL && j->array[1] != NULL &&
		    j->array[0]->type == JSON_NUMBER && j->array[1]->type == JSON_NUMBER) {
			unsigned x, y;
			double lon = j->array[0]->number;
			double lat = j->array[1]->number;
			latlon2tile(lat, lon, 32, &x, &y);

			if (bbox != NULL) {
				if (x < bbox[0]) {
					bbox[0] = x;
				}
				if (y < bbox[1]) {
					bbox[1] = y;
				}
				if (x > bbox[2]) {
					bbox[2] = x;
				}
				if (y > bbox[3]) {
					bbox[3] = y;
				}
			}

			serialize_int(out, op, fpos);
			serialize_uint(out, x, fpos);
			serialize_uint(out, y, fpos);
		} else {
			fprintf(stderr, "malformed point\n");
		}
	}

	if (t == GEOM_POLYGON) {
		serialize_int(out, VT_CLOSEPATH, fpos);
	}
}
2014-09-15 22:02:33 +00:00
2014-09-17 23:00:19 +00:00
/*
 * Read one native-format int from the buffer at *f into *n and advance *f
 * past it. memcpy is used so the source does not have to be int-aligned.
 */
void deserialize_int(char **f, int *n) {
	char *src = *f;

	memcpy(n, src, sizeof *n);
	*f = src + sizeof *n;
}
2014-09-22 19:22:58 +00:00
/*
 * Read a string written by serialize_string() from the buffer at *f: an int
 * byte count followed by that many bytes. The bytes are not copied; the pool
 * entry for (string, type) refers to them where they sit in the buffer. *f is
 * advanced past the string, and the pool entry is returned.
 */
struct pool_val *deserialize_string(char **f, struct pool *p, int type) {
	int len;
	deserialize_int(f, &len);

	char *text = *f;
	*f = text + len;

	return pool(p, text, type);
}
void range_search(struct index *ix, long long n, unsigned long long start, unsigned long long end, struct index **pstart, struct index **pend) {
struct index istart, iend;
istart.index = start;
iend.index = end;
*pstart = search(&istart, ix, n, sizeof(struct index), indexcmp);
*pend = search(&iend, ix, n, sizeof(struct index), indexcmp);
if (*pend >= ix + n) {
*pend = ix + n - 1;
}
while (*pstart > ix && indexcmp(*pstart - 1, &istart) == 0) {
(*pstart)--;
}
if (indexcmp(*pstart, &istart) < 0) {
(*pstart)++;
}
if (indexcmp(*pend, &iend) > 0) {
(*pend)--;
}
}
2014-09-23 23:01:19 +00:00
void check(struct index *ix, long long n, char *metabase, unsigned *file_bbox, struct pool *file_keys) {
fprintf(stderr, "\n");
int z;
for (z = BASE_ZOOM; z >= 0; z--) {
struct index *i, *j = NULL;
for (i = ix; i < ix + n && i != NULL; i = j) {
unsigned wx, wy;
decode(i->index, &wx, &wy);
2014-09-23 01:08:37 +00:00
unsigned tx = 0, ty = 0;
if (z != 0) {
tx = wx >> (32 - z);
ty = wy >> (32 - z);
}
2014-09-23 00:46:48 +00:00
// printf("%lld in %lld\n", (long long)(i - ix), (long long)n);
for (j = i + 1; j < ix + n; j++) {
unsigned wx2, wy2;
decode(j->index, &wx2, &wy2);
2014-09-23 01:08:37 +00:00
unsigned tx2 = 0, ty2 = 0;
if (z != 0) {
tx2 = wx2 >> (32 - z);
ty2 = wy2 >> (32 - z);
}
if (tx2 != tx || ty2 != ty) {
break;
}
}
2014-09-23 01:08:37 +00:00
printf("%d/%u/%u %x %x %lld to %lld\n", z, tx, ty, wx, wy, (long long)(i - ix), (long long)(j - ix));
2014-09-23 23:01:19 +00:00
write_tile(i, j, metabase, file_bbox, z, tx, ty, z == BASE_ZOOM ? 12 : 10, BASE_ZOOM, file_keys);
}
}
}
2014-09-23 23:01:19 +00:00
/*
 * Write s to fp escaped for use inside a JSON string: backslash and double
 * quote get a leading backslash, and control characters below 0x20 are
 * written as \u00XX. Every other byte, including the bytes of multi-byte
 * UTF-8 sequences, is copied through unchanged.
 */
void quote(FILE *fp, char *s) {
	for (; *s != '\0'; s++) {
		/*
		 * Examine the byte as unsigned: where plain char is signed, bytes
		 * 0x80 and above are negative and would be mistaken for controls.
		 */
		unsigned char c = (unsigned char) *s;

		if (c == '\\' || c == '\"') {
			fputc('\\', fp);
			fputc(c, fp);
		} else if (c < ' ') {
			fprintf(fp, "\\u%04x", c);
		} else {
			fputc(c, fp);
		}
	}
}
void read_json(FILE *f, char *fname) {
char metaname[] = "/tmp/meta.XXXXXXXX";
char indexname[] = "/tmp/index.XXXXXXXX";
int metafd = mkstemp(metaname);
int indexfd = mkstemp(indexname);
FILE *metafile = fopen(metaname, "wb");
FILE *indexfile = fopen(indexname, "wb");
long long fpos = 0;
unlink(metaname);
unlink(indexname);
unsigned file_bbox[] = { UINT_MAX, UINT_MAX, 0, 0 };
json_pull *jp = json_begin_file(f);
long long seq = 0;
2014-09-15 22:02:33 +00:00
while (1) {
json_object *j = json_read(jp);
if (j == NULL) {
if (jp->error != NULL) {
fprintf(stderr, "%d: %s\n", jp->line, jp->error);
}
json_free(jp->root);
break;
}
json_object *type = json_hash_get(j, "type");
if (type == NULL || type->type != JSON_STRING || strcmp(type->string, "Feature") != 0) {
continue;
}
json_object *geometry = json_hash_get(j, "geometry");
if (geometry == NULL) {
fprintf(stderr, "%d: feature with no geometry\n", jp->line);
goto next_feature;
}
json_object *geometry_type = json_hash_get(geometry, "type");
if (geometry_type == NULL || geometry_type->type != JSON_STRING) {
fprintf(stderr, "%d: geometry without type string\n", jp->line);
goto next_feature;
}
json_object *properties = json_hash_get(j, "properties");
if (properties == NULL || properties->type != JSON_HASH) {
fprintf(stderr, "%d: feature without properties hash\n", jp->line);
goto next_feature;
}
json_object *coordinates = json_hash_get(geometry, "coordinates");
if (coordinates == NULL || coordinates->type != JSON_ARRAY) {
fprintf(stderr, "%d: feature without coordinates array\n", jp->line);
goto next_feature;
}
int t;
for (t = 0; t < GEOM_TYPES; t++) {
if (strcmp(geometry_type->string, geometry_names[t]) == 0) {
break;
}
}
if (t >= GEOM_TYPES) {
fprintf(stderr, "%d: Can't handle geometry type %s\n", jp->line, geometry_type->string);
goto next_feature;
}
2014-09-15 22:02:33 +00:00
{
long long start = fpos;
unsigned bbox[] = { UINT_MAX, UINT_MAX, 0, 0 };
serialize_int(metafile, mb_geometry[t], &fpos);
parse_geometry(t, coordinates, bbox, &fpos, metafile, VT_MOVETO);
serialize_int(metafile, VT_END, &fpos);
char *metakey[properties->length];
char *metaval[properties->length];
int metatype[properties->length];
int m = 0;
int i;
for (i = 0; i < properties->length; i++) {
if (properties->keys[i]->type == JSON_STRING) {
metakey[m] = properties->keys[i]->string;
if (properties->values[i] != NULL && properties->values[i]->type == JSON_STRING) {
2014-09-16 21:11:50 +00:00
metatype[m] = VT_STRING;
metaval[m] = properties->values[i]->string;
m++;
} else if (properties->values[i] != NULL && properties->values[i]->type == JSON_NUMBER) {
2014-09-16 21:11:50 +00:00
metatype[m] = VT_NUMBER;
metaval[m] = properties->values[i]->string;
m++;
2014-09-15 23:32:06 +00:00
} else if (properties->values[i] != NULL && (properties->values[i]->type == JSON_TRUE || properties->values[i]->type == JSON_FALSE)) {
2014-09-16 21:11:50 +00:00
metatype[m] = VT_BOOLEAN;
2014-09-15 23:32:06 +00:00
metaval[m] = properties->values[i]->string;
m++;
2014-09-15 22:27:35 +00:00
} else {
fprintf(stderr, "%d: Unsupported metafile type\n", jp->line);
2014-09-15 23:32:06 +00:00
goto next_feature;
2014-09-15 22:02:33 +00:00
}
}
}
serialize_int(metafile, m, &fpos);
for (i = 0; i < m; i++) {
serialize_int(metafile, metatype[i], &fpos);
serialize_string(metafile, metakey[i], &fpos);
serialize_string(metafile, metaval[i], &fpos);
}
int z = 14;
unsigned cx = bbox[0] / 2 + bbox[2] / 2;
unsigned cy = bbox[1] / 2 + bbox[3] / 2;
/* XXX do proper overlap instead of whole bounding box */
2014-09-23 01:08:37 +00:00
if (z == 0) {
struct index ix;
ix.index = encode(cx, cy);
2014-09-23 01:08:37 +00:00
ix.fpos = start;
fwrite_check(&ix, sizeof(struct index), 1, indexfile);
} else {
unsigned x, y;
for (x = bbox[0] >> (32 - z); x <= bbox[2] >> (32 - z); x++) {
for (y = bbox[1] >> (32 - z); y <= bbox[3] >> (32 - z); y++) {
struct index ix;
if (x == cx >> (32 - z) && y == cy >> (32 - z)) {
ix.index = encode(cx, cy);
} else {
ix.index = encode(x << (32 - z), y << (32 - z));
}
2014-09-23 01:08:37 +00:00
ix.fpos = start;
fwrite_check(&ix, sizeof(struct index), 1, indexfile);
}
}
}
for (i = 0; i < 2; i++) {
if (bbox[i] < file_bbox[i]) {
file_bbox[i] = bbox[i];
}
}
for (i = 2; i < 4; i++) {
if (bbox[i] > file_bbox[i]) {
file_bbox[i] = bbox[i];
}
}
if (seq % 100000 == 0) {
fprintf(stderr, "Read %.1f million features\r", seq / 1000000.0);
}
seq++;
2014-09-15 22:02:33 +00:00
}
2014-09-15 22:27:35 +00:00
next_feature:
json_free(j);
2014-09-15 22:27:35 +00:00
/* XXX check for any non-features in the outer object */
2014-09-15 22:02:33 +00:00
}
json_end(jp);
fclose(metafile);
fclose(indexfile);
printf("bbox: %x %x %x %x\n", file_bbox[0], file_bbox[1], file_bbox[2], file_bbox[3]);
struct stat indexst;
fstat(indexfd, &indexst);
struct index *index = mmap(NULL, indexst.st_size, PROT_READ | PROT_WRITE, MAP_PRIVATE, indexfd, 0);
if (index == MAP_FAILED) {
perror("mmap index");
exit(EXIT_FAILURE);
}
struct stat metast;
fstat(metafd, &metast);
char *meta = mmap(NULL, metast.st_size, PROT_READ, MAP_PRIVATE, metafd, 0);
2014-09-17 23:00:19 +00:00
if (meta == MAP_FAILED) {
perror("mmap meta");
exit(EXIT_FAILURE);
}
2014-09-23 23:01:19 +00:00
struct pool file_keys;
file_keys.n = 0;
file_keys.vals = NULL;
file_keys.head = NULL;
file_keys.tail = NULL;
qsort(index, indexst.st_size / sizeof(struct index), sizeof(struct index), indexcmp);
2014-09-23 23:01:19 +00:00
check(index, indexst.st_size / sizeof(struct index), meta, file_bbox, &file_keys);
munmap(index, indexst.st_size);
munmap(meta, metast.st_size);
close(indexfd);
close(metafd);
2014-09-23 23:01:19 +00:00
FILE *fp = fopen("tiles/metadata.json", "w");
if (fp == NULL) {
fprintf(stderr, "metadata.json: %s\n", strerror(errno));
} else {
fprintf(fp, "{\n");
fprintf(fp, "\"name\": \"");
quote(fp, fname);
fprintf(fp, "\",\n");
fprintf(fp, "\"description\": \"");
quote(fp, fname);
fprintf(fp, "\",\n");
double minlat = 0, minlon = 0, maxlat = 0, maxlon = 0, midlat = 0, midlon = 0;
fprintf(fp, "\"version\": 1,\n");
fprintf(fp, "\"minzoom\": %d,\n", 0);
fprintf(fp, "\"maxzoom\": %d,\n", BASE_ZOOM);
fprintf(fp, "\"center\": \"%f,%f,%d\",\n", midlon, midlat, BASE_ZOOM);
fprintf(fp, "\"bounds\": \"%f,%f,%f,%f\",\n", minlon, minlat, maxlon, maxlat);
fprintf(fp, "\"type\": \"overlay\",\n");
fprintf(fp, "\"json\": \"{");
fprintf(fp, "\\\"vector_layers\\\": [ { \\\"id\\\": \\\"");
quote(fp, "name");
fprintf(fp, "\\\", \\\"description\\\": \\\"\\\", \\\"minzoom\\\": %d, \\\"maxzoom\\\": %d, \\\"fields\\\": {", 0, BASE_ZOOM);
struct pool_val *pv;
for (pv = file_keys.head; pv != NULL; pv = pv->next) {
fprintf(fp, "\\\"");
quote(fp, pv->s);
if (pv->type == VT_NUMBER) {
fprintf(fp, "\\\": \\\"Number\\\"");
} else {
fprintf(fp, "\\\": \\\"String\\\"");
}
if (pv->next != NULL) {
fprintf(fp, ", ");
}
}
fprintf(fp, "} } ]");
fprintf(fp, "}\",\n");
fprintf(fp, "\"format\": \"%s\"\n", "pbf"); // no trailing comma
fprintf(fp, "}\n");
fclose(fp);
}
2014-09-15 22:02:33 +00:00
}
2014-09-15 22:27:35 +00:00
/*
 * Process each file named on the command line in turn, or standard input
 * when no files are named. A file that cannot be opened is reported on
 * stderr and skipped.
 */
int main(int argc, char **argv) {
	if (argc <= 1) {
		read_json(stdin, "standard input");
		return 0;
	}

	for (int i = 1; i < argc; i++) {
		FILE *f = fopen(argv[i], "r");

		if (f == NULL) {
			fprintf(stderr, "%s: %s: %s\n", argv[0], argv[i], strerror(errno));
			continue;
		}

		read_json(f, argv[i]);
		fclose(f);
	}

	return 0;
}