https://github.com/mapbox/tippecanoe
Raw File
Tip revision: 18c1c1b507283c1aa5c4f9a5242528bc299c58a3 authored by Eric Fischer on 07 November 2018, 23:16:44 UTC
Merge branch 'master' into blake-properties
Tip revision: 18c1c1b
mvt.cpp
#include <stdio.h>
#include <string.h>
#include <string>
#include <vector>
#include <map>
#include <zlib.h>
#include <errno.h>
#include <limits.h>
#include <ctype.h>
#include <math.h>
#include <cmath>
#include "mvt.hpp"
#include "geometry.hpp"
#include "protozero/varint.hpp"
#include "protozero/pbf_reader.hpp"
#include "protozero/pbf_writer.hpp"
#include "milo/dtoa_milo.h"
#include "jsonpull/jsonpull.h"

static std::string quote(std::string const &s);

int mvt_format = mvt_blake;

mvt_geometry::mvt_geometry(int nop, long long nx, long long ny) {
	this->op = nop;
	this->x = nx;
	this->y = ny;
}

mvt_geometry::mvt_geometry(int nop, long long nx, long long ny, std::vector<double> nelevations) {
	this->op = nop;
	this->x = nx;
	this->y = ny;
	this->elevations = nelevations;
}

// https://github.com/mapbox/mapnik-vector-tile/blob/master/src/vector_tile_compression.hpp
bool is_compressed(std::string const &data) {
	return data.size() > 2 && (((uint8_t) data[0] == 0x78 && (uint8_t) data[1] == 0x9C) || ((uint8_t) data[0] == 0x1F && (uint8_t) data[1] == 0x8B));
}

// https://github.com/mapbox/mapnik-vector-tile/blob/master/src/vector_tile_compression.hpp
int decompress(std::string const &input, std::string &output) {
	z_stream inflate_s;
	inflate_s.zalloc = Z_NULL;
	inflate_s.zfree = Z_NULL;
	inflate_s.opaque = Z_NULL;
	inflate_s.avail_in = 0;
	inflate_s.next_in = Z_NULL;
	if (inflateInit2(&inflate_s, 32 + 15) != Z_OK) {
		fprintf(stderr, "Decompression error: %s\n", inflate_s.msg);
	}
	inflate_s.next_in = (Bytef *) input.data();
	inflate_s.avail_in = input.size();
	inflate_s.next_out = (Bytef *) output.data();
	inflate_s.avail_out = output.size();

	while (true) {
		size_t existing_output = inflate_s.next_out - (Bytef *) output.data();

		output.resize(existing_output + 2 * inflate_s.avail_in + 100);
		inflate_s.next_out = (Bytef *) output.data() + existing_output;
		inflate_s.avail_out = output.size() - existing_output;

		int ret = inflate(&inflate_s, 0);
		if (ret < 0) {
			fprintf(stderr, "Decompression error: ");
			if (ret == Z_DATA_ERROR) {
				fprintf(stderr, "data error");
			}
			if (ret == Z_STREAM_ERROR) {
				fprintf(stderr, "stream error");
			}
			if (ret == Z_MEM_ERROR) {
				fprintf(stderr, "out of memory");
			}
			if (ret == Z_BUF_ERROR) {
				fprintf(stderr, "no data in buffer");
			}
			fprintf(stderr, "\n");
			return 0;
		}

		if (ret == Z_STREAM_END) {
			break;
		}

		// ret must be Z_OK or Z_NEED_DICT;
		// continue decompresing
	}

	output.resize(inflate_s.next_out - (Bytef *) output.data());
	inflateEnd(&inflate_s);
	return 1;
}

// https://github.com/mapbox/mapnik-vector-tile/blob/master/src/vector_tile_compression.hpp
int compress(std::string const &input, std::string &output) {
	z_stream deflate_s;
	deflate_s.zalloc = Z_NULL;
	deflate_s.zfree = Z_NULL;
	deflate_s.opaque = Z_NULL;
	deflate_s.avail_in = 0;
	deflate_s.next_in = Z_NULL;
	deflateInit2(&deflate_s, Z_BEST_COMPRESSION, Z_DEFLATED, 31, 8, Z_DEFAULT_STRATEGY);
	deflate_s.next_in = (Bytef *) input.data();
	deflate_s.avail_in = input.size();
	size_t length = 0;
	do {
		size_t increase = input.size() / 2 + 1024;
		output.resize(length + increase);
		deflate_s.avail_out = increase;
		deflate_s.next_out = (Bytef *) (output.data() + length);
		int ret = deflate(&deflate_s, Z_FINISH);
		if (ret != Z_STREAM_END && ret != Z_OK && ret != Z_BUF_ERROR) {
			return -1;
		}
		length += (increase - deflate_s.avail_out);
	} while (deflate_s.avail_out == 0);
	deflateEnd(&deflate_s);
	output.resize(length);
	return 0;
}

mvt_scaling read_scaling(protozero::pbf_reader message) {
	protozero::pbf_reader dimension_reader(message);
	mvt_scaling dimension;

	dimension.offset = 0;
	dimension.multiplier = 1;
	dimension.base = 0;

	while (dimension_reader.next()) {
		switch (dimension_reader.tag()) {
		case 1:
			dimension.offset = dimension_reader.get_sint64();
			break;

		case 2:
			dimension.multiplier = dimension_reader.get_double();
			break;

		case 3:
			dimension.base = dimension_reader.get_double();
			break;

		default:
			dimension_reader.skip();
			break;
		}
	}

	return dimension;
}

bool mvt_tile::decode(std::string &message, bool &was_compressed) {
	layers.clear();
	std::string src;

	if (is_compressed(message)) {
		std::string uncompressed;
		if (decompress(message, uncompressed) == 0) {
			exit(EXIT_FAILURE);
		}
		src = uncompressed;
		was_compressed = true;
	} else {
		src = message;
		was_compressed = false;
	}

	protozero::pbf_reader reader(src);

	while (reader.next()) {
		switch (reader.tag()) {
		case 3: /* layer */
		{
			protozero::pbf_reader layer_reader(reader.get_message());
			mvt_layer layer;

			while (layer_reader.next()) {
				switch (layer_reader.tag()) {
				case 1: /* name */
					layer.name = layer_reader.get_string();
					break;

				case 3: /* key */
					layer.keys.push_back(layer_reader.get_string());
					break;

				case 4: /* value */
				{
					protozero::pbf_reader value_reader(layer_reader.get_message());
					mvt_value value;

					value.type = mvt_null;
					value.numeric_value.null_value = 0;

					while (value_reader.next()) {
						switch (value_reader.tag()) {
						case 1: /* string */
							value.type = mvt_string;
							value.string_value = value_reader.get_string();
							break;

						case 2: /* float */
							value.type = mvt_float;
							value.numeric_value.float_value = value_reader.get_float();
							break;

						case 3: /* double */
							value.type = mvt_double;
							value.numeric_value.double_value = value_reader.get_double();
							break;

						case 4: /* int */
							value.type = mvt_int;
							value.numeric_value.int_value = value_reader.get_int64();
							break;

						case 5: /* uint */
							value.type = mvt_uint;
							value.numeric_value.uint_value = value_reader.get_uint64();
							break;

						case 6: /* sint */
							value.type = mvt_sint;
							value.numeric_value.sint_value = value_reader.get_sint64();
							break;

						case 7: /* bool */
							value.type = mvt_bool;
							value.numeric_value.bool_value = value_reader.get_bool();
							break;

						default:
							value_reader.skip();
							break;
						}
					}

					layer.values.push_back(value);
					break;
				}

				case 5: /* extent */
					layer.extent = layer_reader.get_uint32();
					break;

				case 6: /* string values */
					layer.string_values.push_back(layer_reader.get_string());
					break;

				case 7: /* floats */
				{
					auto pi = layer_reader.get_packed_float();
					for (auto it = pi.first; it != pi.second; ++it) {
						layer.float_values.push_back(*it);
					}
					break;
				}

				case 8: /* doubles */
				{
					auto pi = layer_reader.get_packed_double();
					for (auto it = pi.first; it != pi.second; ++it) {
						layer.double_values.push_back(*it);
					}
					break;
				}

				case 9: /* integers */
				{
					auto pi = layer_reader.get_packed_fixed64();
					for (auto it = pi.first; it != pi.second; ++it) {
						layer.uint64_values.push_back(*it);
					}
					break;
				}

				case 10: /* elevation scaling */
				{
					layer.elevation_scaling = read_scaling(layer_reader.get_message());
					layer.has_elevation_scaling = true;
					break;
				}

				case 11: /* attribute scaling */
				{
					layer.attribute_scalings.push_back(read_scaling(layer_reader.get_message()));
					break;
				}

				case 12: /* tile x */
					layer.x = layer_reader.get_uint32();
					break;

				case 13: /* tile y */
					layer.y = layer_reader.get_uint32();
					break;

				case 14: /* zoom */
					layer.zoom = layer_reader.get_uint32();
					break;

				case 15: /* version */
					layer.version = layer_reader.get_uint32();
					break;

				case 2: /* feature */
				{
					protozero::pbf_reader feature_reader(layer_reader.get_message());
					mvt_feature feature;
					std::vector<uint32_t> geoms;

					while (feature_reader.next()) {
						switch (feature_reader.tag()) {
						case 1: /* id */
							feature.id = feature_reader.get_uint64();
							feature.has_id = true;
							break;

						case 2: /* tags */
						{
							auto pi = feature_reader.get_packed_uint32();
							for (auto it = pi.first; it != pi.second; ++it) {
								feature.tags.push_back(*it);
							}
							break;
						}

						case 3: /* feature type */
							feature.type = feature_reader.get_enum();
							break;

						case 4: /* geometry */
						{
							auto pi = feature_reader.get_packed_uint32();
							for (auto it = pi.first; it != pi.second; ++it) {
								geoms.push_back(*it);
							}
							break;
						}

						case 5: /* properties */
						{
							auto pi = feature_reader.get_packed_uint64();
							for (auto it = pi.first; it != pi.second; ++it) {
								feature.properties.push_back(*it);
							}
							break;
						}

						case 6: /* node attributes */
						{
							auto pi = feature_reader.get_packed_uint64();
							for (auto it = pi.first; it != pi.second; ++it) {
								feature.node_attributes.push_back(*it);
							}
							break;
						}

						case 7: /* elevations */
						{
							auto pi = feature_reader.get_packed_sint32();
							for (auto it = pi.first; it != pi.second; ++it) {
								feature.elevations.push_back(*it);
							}
							break;
						}

						case 10: /* string id */
						{
							feature.string_id = feature_reader.get_string();
							break;
						}

						case 8: /* knots */
						{
							auto pi = feature_reader.get_packed_uint64();
							for (auto it = pi.first; it != pi.second; ++it) {
								feature.knots.push_back(*it);
							}
							break;
						}

						case 9: /* spline degree */
							feature.spline_degree = feature_reader.get_uint32();
							break;

						default:
							feature_reader.skip();
							break;
						}
					}

					long long px = 0, py = 0;
					for (size_t g = 0; g < geoms.size(); g++) {
						uint32_t geom = geoms[g];
						uint32_t op = geom & 7;
						uint32_t count = geom >> 3;

						if (op == mvt_moveto || op == mvt_lineto) {
							for (size_t k = 0; k < count && g + 2 < geoms.size(); k++) {
								px += protozero::decode_zigzag32(geoms[g + 1]);
								py += protozero::decode_zigzag32(geoms[g + 2]);
								g += 2;

								mvt_geometry decoded = mvt_geometry(op, px, py);
								feature.geometry.push_back(decoded);
							}
						} else {
							feature.geometry.push_back(mvt_geometry(op, 0, 0));
						}
					}

					layer.features.push_back(feature);
					break;
				}

				default:
					layer_reader.skip();
					break;
				}
			}

			for (size_t i = 0; i < layer.keys.size(); i++) {
				layer.key_map.insert(std::pair<std::string, size_t>(layer.keys[i], i));
			}
			for (size_t i = 0; i < layer.values.size(); i++) {
				layer.value_map.insert(std::pair<mvt_value, size_t>(layer.values[i], i));
			}

			// This has to wait until the layer is decoded because we might not know
			// the values or elevation scales until after the features.

			for (size_t i = 0; i < layer.features.size(); i++) {
				std::vector<mvt_geometry> &geom = layer.features[i].geometry;
				std::vector<int> &elevations = layer.features[i].elevations;

				long current_elevation = layer.elevation_scaling.offset;
				size_t off = 0;

				if (elevations.size() != 0) {
					for (size_t j = 0; j < geom.size(); j++) {
						if (geom[j].op == mvt_moveto || geom[j].op == mvt_lineto) {
							if (off < elevations.size()) {
								double el;

								current_elevation += elevations[off];
								el = layer.elevation_scaling.base + layer.elevation_scaling.multiplier * current_elevation;

								geom[j].elevations.push_back(el);

								off++;
							} else {
								fprintf(stderr, "Ran out of elevations\n");
								exit(EXIT_FAILURE);
							}
						}
					}
				}

				elevations.clear();
			}

			layers.push_back(layer);
			break;
		}

		default:
			reader.skip();
			break;
		}
	}

	return true;
}

std::string mvt_tile::encode(int z) {
	std::string data;

	protozero::pbf_writer writer(data);

	for (size_t i = 0; i < layers.size(); i++) {
		std::string layer_string;
		protozero::pbf_writer layer_writer(layer_string);
		bool layer_is3d = false;

		layer_writer.add_uint32(15, layers[i].version); /* version */
		layer_writer.add_string(1, layers[i].name);     /* name */
		layer_writer.add_uint32(5, layers[i].extent);   /* extent */

		if (layers[i].zoom >= 0 && layers[i].x >= 0 && layers[i].y >= 0) {
			layer_writer.add_uint32(12, layers[i].x);
			layer_writer.add_uint32(13, layers[i].y);
			layer_writer.add_uint32(14, layers[i].zoom);
		}

		for (size_t j = 0; j < layers[i].keys.size(); j++) {
			layer_writer.add_string(3, layers[i].keys[j]); /* key */
		}

		for (size_t v = 0; v < layers[i].values.size(); v++) {
			std::string value_string;
			protozero::pbf_writer value_writer(value_string);
			mvt_value &pbv = layers[i].values[v];

			if (pbv.type == mvt_string) {
				value_writer.add_string(1, pbv.string_value);
			} else if (pbv.type == mvt_float) {
				value_writer.add_float(2, pbv.numeric_value.float_value);
			} else if (pbv.type == mvt_double) {
				value_writer.add_double(3, pbv.numeric_value.double_value);
			} else if (pbv.type == mvt_int) {
				value_writer.add_int64(4, pbv.numeric_value.int_value);
			} else if (pbv.type == mvt_uint) {
				value_writer.add_uint64(5, pbv.numeric_value.uint_value);
			} else if (pbv.type == mvt_sint) {
				value_writer.add_sint64(6, pbv.numeric_value.sint_value);
			} else if (pbv.type == mvt_bool) {
				value_writer.add_bool(7, pbv.numeric_value.bool_value);
			} else {
				fprintf(stderr, "Internal error: trying to write undefined attribute type to tile\n");
				exit(EXIT_FAILURE);
			}

			layer_writer.add_message(4, value_string);
		}

		for (size_t v = 0; v < layers[i].string_values.size(); v++) {
			layer_writer.add_string(6, layers[i].string_values[v]);
		}

		layer_writer.add_packed_float(7, std::begin(layers[i].float_values), std::end(layers[i].float_values));
		layer_writer.add_packed_double(8, std::begin(layers[i].double_values), std::end(layers[i].double_values));
		layer_writer.add_packed_fixed64(9, std::begin(layers[i].uint64_values), std::end(layers[i].uint64_values));

		for (size_t f = 0; f < layers[i].features.size(); f++) {
			std::vector<mvt_geometry> &geom = layers[i].features[f].geometry;

			for (size_t g = 0; g < geom.size(); g++) {
				if (geom[g].elevations.size() > 0) {
					mvt_scaling dim;

					// Use approximately the same resolution as ground resolution
					// for elevation resolution:
					// 1 meter at zoom level 13

					// dim.multiplier = exp(log(0.5) * (z - 13));
					// Use shifts instead of log for exact precision
					if (z <= 13) {
						dim.multiplier = 1 << (13 - z);
					} else {
						dim.multiplier = 1.0 / (1 << (z - 13));
					}

					// Arbitrary base and offset, just to make sure encoding and decoding work
					dim.base = dim.multiplier * 4;
					dim.offset = 50;

					layers[i].elevation_scaling = dim;
					layers[i].has_elevation_scaling = true;
				}
			}
		}

		for (size_t f = 0; f < layers[i].features.size(); f++) {
			std::string feature_string;
			protozero::pbf_writer feature_writer(feature_string);

			feature_writer.add_enum(3, layers[i].features[f].type);
			feature_writer.add_packed_uint32(2, std::begin(layers[i].features[f].tags), std::end(layers[i].features[f].tags));
			feature_writer.add_packed_uint64(5, std::begin(layers[i].features[f].properties), std::end(layers[i].features[f].properties));
			feature_writer.add_packed_uint64(6, std::begin(layers[i].features[f].node_attributes), std::end(layers[i].features[f].node_attributes));

			if (layers[i].features[f].has_id) {
				feature_writer.add_uint64(1, layers[i].features[f].id);
			}
			if (layers[i].features[f].string_id.size() != 0) {
				feature_writer.add_string(10, layers[i].features[f].string_id);
			}

			std::vector<long> elevations;
			long current_elevation = layers[i].elevation_scaling.offset;

			int px = 0, py = 0;
			int cmd_idx = -1;
			int cmd = -1;
			int length = 0;

			std::vector<mvt_geometry> &geom = layers[i].features[f].geometry;
			bool feature_is3d = false;

			std::vector<uint32_t> geometry;
			for (size_t g = 0; g < geom.size(); g++) {
				int op = geom[g].op;

				if (op != cmd) {
					if (cmd_idx >= 0) {
						geometry[cmd_idx] = (length << 3) | (cmd & ((1 << 3) - 1));
					}

					cmd = op;
					length = 0;
					cmd_idx = geometry.size();
					geometry.push_back(0);
				}

				if (op == mvt_moveto || op == mvt_lineto) {
					long long wwx = geom[g].x;
					long long wwy = geom[g].y;

					int dx = wwx - px;
					int dy = wwy - py;

					geometry.push_back(protozero::encode_zigzag32(dx));
					geometry.push_back(protozero::encode_zigzag32(dy));

					px = wwx;
					py = wwy;
					length++;

					double el;
					if (geom[g].elevations.size() > 0) {
						el = geom[g].elevations[0];
						feature_is3d = true;
						layer_is3d = true;
					} else {
						el = 0;  // XXX detect
					}

					el = std::round((el - layers[i].elevation_scaling.base) / layers[i].elevation_scaling.multiplier);
					int64_t delta = el - current_elevation;

					elevations.push_back(delta);
					current_elevation += delta;
				} else if (op == mvt_closepath) {
					length++;
				} else {
					fprintf(stderr, "\nInternal error: corrupted geometry\n");
					exit(EXIT_FAILURE);
				}
			}

			if (cmd_idx >= 0) {
				geometry[cmd_idx] = (length << 3) | (cmd & ((1 << 3) - 1));
			}

			feature_writer.add_packed_uint32(4, std::begin(geometry), std::end(geometry));

			if (feature_is3d) {
				feature_writer.add_packed_sint32(7, std::begin(elevations), std::end(elevations));
			}

			feature_writer.add_packed_uint64(8, std::begin(layers[i].features[f].knots), std::end(layers[i].features[f].knots));

			if (layers[i].features[f].spline_degree != 2) {
				feature_writer.add_uint32(9, layers[i].features[f].spline_degree);
			}

			layer_writer.add_message(2, feature_string);
		}

		if (layer_is3d) {
			std::string dimension_string;
			protozero::pbf_writer dimension_writer(dimension_string);

			dimension_writer.add_sint64(1, layers[i].elevation_scaling.offset);
			dimension_writer.add_double(2, layers[i].elevation_scaling.multiplier);
			dimension_writer.add_double(3, layers[i].elevation_scaling.base);

			layer_writer.add_message(10, dimension_string);
		}

		for (size_t d = 0; d < layers[i].attribute_scalings.size(); d++) {
			std::string dimension_string;
			protozero::pbf_writer dimension_writer(dimension_string);

			dimension_writer.add_sint64(1, layers[i].attribute_scalings[d].offset);
			dimension_writer.add_double(2, layers[i].attribute_scalings[d].multiplier);
			dimension_writer.add_double(3, layers[i].attribute_scalings[d].base);

			layer_writer.add_message(11, dimension_string);
		}

		writer.add_message(3, layer_string);
	}

	return data;
}

bool mvt_value::operator<(const mvt_value &o) const {
	if (type < o.type) {
		return true;
	}
	if (type == o.type) {
		if ((type == mvt_string && string_value < o.string_value) ||
		    (type == mvt_float && numeric_value.float_value < o.numeric_value.float_value) ||
		    (type == mvt_double && numeric_value.double_value < o.numeric_value.double_value) ||
		    (type == mvt_int && numeric_value.int_value < o.numeric_value.int_value) ||
		    (type == mvt_uint && numeric_value.uint_value < o.numeric_value.uint_value) ||
		    (type == mvt_sint && numeric_value.sint_value < o.numeric_value.sint_value) ||
		    (type == mvt_bool && numeric_value.bool_value < o.numeric_value.bool_value) ||
		    (type == mvt_hash && toString() < o.toString()) ||
		    (type == mvt_list && toString() < o.toString()) ||
		    (type == mvt_null && numeric_value.null_value < o.numeric_value.null_value)) {
			return true;
		}
	}

	return false;
}

static std::string quote(std::string const &s) {
	std::string buf;

	for (size_t i = 0; i < s.size(); i++) {
		unsigned char ch = s[i];

		if (ch == '\\' || ch == '\"') {
			buf.push_back('\\');
			buf.push_back(ch);
		} else if (ch < ' ') {
			char tmp[7];
			sprintf(tmp, "\\u%04x", ch);
			buf.append(std::string(tmp));
		} else {
			buf.push_back(ch);
		}
	}

	return buf;
}

std::string mvt_value::toString() const {
	if (type == mvt_string) {
		return std::string("\"") + quote(string_value) + "\"";
	} else if (type == mvt_int) {
		return std::to_string(numeric_value.int_value);
	} else if (type == mvt_double) {
		double v = numeric_value.double_value;
		if (v == (long long) v) {
			return std::to_string((long long) v);
		} else {
			return milo::dtoa_milo(v);
		}
	} else if (type == mvt_float) {
		double v = numeric_value.float_value;
		if (v == (long long) v) {
			return std::to_string((long long) v);
		} else {
			return milo::dtoa_milo(v);
		}
	} else if (type == mvt_sint) {
		return std::to_string(numeric_value.sint_value);
	} else if (type == mvt_uint) {
		return std::to_string(numeric_value.uint_value);
	} else if (type == mvt_bool) {
		return numeric_value.bool_value ? "true" : "false";
	} else if (type == mvt_list) {
		std::string ret = "[";

		for (size_t i = 0; i < list_value.size(); i++) {
			ret.append(list_value[i].toString());
			if (i + 1 < list_value.size()) {
				ret.append(",");
			}
		}

		ret.append("]");
		return ret;
	} else if (type == mvt_hash) {
		std::string ret = "{";

		for (size_t i = 0; i < list_value.size() && i < hash_keys.size(); i++) {
			ret.append("\"");
			ret.append(quote(hash_keys[i]));
			ret.append("\":");
			ret.append(list_value[i].toString());

			if (i + 1 < list_value.size()) {
				ret.append(",");
			}
		}

		ret.append("}");
		return ret;
	} else if (type == mvt_null) {
		return "null";
	} else {
		return "unknown";
	}
}

size_t mvt_layer::tag_key(std::string const &key) {
	size_t ko;

	std::map<std::string, size_t>::iterator ki = key_map.find(key);

	if (ki == key_map.end()) {
		ko = keys.size();
		keys.push_back(key);
		key_map.insert(std::pair<std::string, size_t>(key, ko));
	} else {
		ko = ki->second;
	}

	return ko;
}

size_t tag_object(mvt_layer &layer, json_object *j) {
	mvt_value tv;

	if (j->type == JSON_NUMBER) {
		long long v;
		if (is_integer(j->string, &v)) {
			if (v >= 0) {
				tv.type = mvt_int;
				tv.numeric_value.int_value = v;
			} else {
				tv.type = mvt_sint;
				tv.numeric_value.sint_value = v;
			}
		} else {
			tv.type = mvt_double;
			tv.numeric_value.double_value = atof(j->string);
		}
	} else if (j->type == JSON_TRUE) {
		tv.type = mvt_bool;
		tv.numeric_value.bool_value = 1;
	} else if (j->type == JSON_FALSE) {
		tv.type = mvt_bool;
		tv.numeric_value.bool_value = 0;
	} else if (j->type == JSON_STRING) {
		tv.type = mvt_string;
		tv.string_value = std::string(j->string);
	} else if (j->type == JSON_NULL) {
		tv.type = mvt_null;
		tv.numeric_value.null_value = 0;
	}

	return layer.tag_value(tv);
}

size_t mvt_layer::tag_value(mvt_value const &value) {
	size_t vo;

	std::map<mvt_value, size_t>::iterator vi = value_map.find(value);

	if (vi == value_map.end()) {
		vo = values.size();
		values.push_back(value);
		value_map.insert(std::pair<mvt_value, size_t>(value, vo));
	} else {
		vo = vi->second;
	}

	return vo;
}

void mvt_layer::tag(mvt_feature &feature, std::string key, mvt_value value) {
	if (value.type == mvt_hash || value.type == mvt_list) {
		json_pull *jp = json_begin_string((char *) value.string_value.c_str());
		json_object *jo = json_read_tree(jp);
		if (jo == NULL) {
			fprintf(stderr, "Internal error: failed to reconstruct JSON in tag %s\n", value.string_value.c_str());
			exit(EXIT_FAILURE);
		}
		size_t ko = tag_key(key);
		size_t vo = tag_object(*this, jo);
		feature.tags.push_back(ko);
		feature.tags.push_back(vo);
		json_free(jo);
		json_end(jp);
	} else {
		feature.tags.push_back(tag_key(key));
		feature.tags.push_back(tag_value(value));
	}
}

size_t mvt_layer::tag_v3_key(std::string key) {
	std::map<std::string, size_t>::iterator ki = key_map.find(key);
	size_t ko;

	if (ki == key_map.end()) {
		ko = keys.size();
		keys.push_back(key);
		key_map.insert(std::pair<std::string, size_t>(key, ko));
	} else {
		ko = ki->second;
	}

	return ko;
}

void mvt_layer::tag_v3_value(mvt_value value, std::vector<unsigned long> &onto) {
	std::map<mvt_value, unsigned long>::iterator vi = property_map.find(value);
	unsigned long vo;

	if (vi == property_map.end()) {
		if (value.type == mvt_string) {
			vo = (string_values.size() << 4) | 0;
			string_values.push_back(value.string_value);
			onto.push_back(vo);
		} else if (value.type == mvt_float) {
			vo = (float_values.size() << 4) | 1;
			float_values.push_back(value.numeric_value.float_value);
			onto.push_back(vo);
		} else if (value.type == mvt_double) {
			vo = (double_values.size() << 4) | 2;
			double_values.push_back(value.numeric_value.double_value);
			onto.push_back(vo);
		} else if (value.type == mvt_uint) {
			if (value.numeric_value.uint_value <= (1L << 61) - 1) {
				vo = (value.numeric_value.uint_value << 4) | 5;
			} else {
				vo = (uint64_values.size() << 4) | 3;
				uint64_values.push_back(value.numeric_value.uint_value);
			}
			onto.push_back(vo);
		} else if (value.type == mvt_int || value.type == mvt_sint) {
			long val;
			if (value.type == mvt_int) {
				val = value.numeric_value.int_value;
			} else {
				val = value.numeric_value.sint_value;
			}

			if (val >= -(1L << 60) + 1 && val <= (1L << 60) - 1) {
				vo = (protozero::encode_zigzag64(val) << 4) | 6;
			} else {
				vo = (uint64_values.size() << 4) | 4;
				uint64_values.push_back(protozero::encode_zigzag64(val));
			}
			onto.push_back(vo);
		} else if (value.type == mvt_bool) {
			vo = ((value.numeric_value.bool_value + 1) << 4) | 7;
			onto.push_back(vo);
		} else if (value.type == mvt_null) {
			vo = (0 << 4) | 7;
			onto.push_back(vo);
		} else if (value.type == mvt_list) {
			bool all_ints = true;
			for (size_t i = 0; i < value.list_value.size(); i++) {
				mvt_value &v = value.list_value[i];

				// Only try to delta-encode lists whose values are all smallish integers,
				// to avoid precision loss below

				if ((v.type == mvt_sint && v.numeric_value.sint_value < INT_MAX && v.numeric_value.sint_value > INT_MIN) ||
				    (v.type == mvt_uint && v.numeric_value.uint_value < INT_MAX) ||
				    (v.type == mvt_int && v.numeric_value.int_value < INT_MAX && v.numeric_value.int_value > INT_MIN)) {
					;
				} else {
					all_ints = false;
					break;
				}
			}

			if (all_ints) {
				if (delta_list_scaling < 0) {
					delta_list_scaling = attribute_scalings.size();

					mvt_scaling sc;
					sc.offset = 0;
					sc.multiplier = 1;
					sc.base = 0;
					attribute_scalings.push_back(sc);
				}

				vo = 10 | (value.list_value.size() << 4);
				onto.push_back(vo);
				onto.push_back(delta_list_scaling);  // which scaling

				long here = 0;
				for (size_t i = 0; i < value.list_value.size(); i++) {
					mvt_value &v = value.list_value[i];
					long val;

					if (v.type == mvt_sint) {
						val = v.numeric_value.sint_value;
					} else if (v.type == mvt_uint) {
						val = v.numeric_value.uint_value;
					} else if (v.type == mvt_int) {
						val = v.numeric_value.int_value;
					} else {
						fprintf(stderr, "Delta-encoded list: can't happen\n");
						exit(EXIT_FAILURE);
					}

					onto.push_back(protozero::encode_zigzag64(val - here) + 1);
					here = val;
				}
			} else {
				vo = 8 | (value.list_value.size() << 4);
				onto.push_back(vo);

				for (size_t i = 0; i < value.list_value.size(); i++) {
					tag_v3_value(value.list_value[i], onto);
				}
			}

			return;  // Can't save duplicate
		} else if (value.type == mvt_hash) {
			vo = 9 | (value.list_value.size() << 4);
			onto.push_back(vo);

			for (size_t i = 0; i < value.list_value.size() && i < value.hash_keys.size(); i++) {
				onto.push_back(tag_v3_key(value.hash_keys[i]));
				tag_v3_value(value.list_value[i], onto);
			}

			return;  // Can't save duplicate
		} else {
			fprintf(stderr, "Internal error: unknown value type %d\n", value.type);
			exit(EXIT_FAILURE);
		}

		property_map.insert(std::pair<mvt_value, size_t>(value, vo));
	} else {
		vo = vi->second;
		onto.push_back(vo);
	}
}

void mvt_layer::tag_v3(mvt_feature &feature, std::string key, mvt_value value) {
	size_t ko = tag_v3_key(key);
	feature.properties.push_back(ko);

	tag_v3_value(value, feature.properties);
}

void mvt_layer::reorder_values() {
	std::vector<mvt_value> orig_values = values;
	std::vector<std::string> orig_keys = keys;

	std::sort(values.begin(), values.end());
	std::sort(keys.begin(), keys.end());

	std::map<mvt_value, size_t> new_value_map;
	for (size_t i = 0; i < values.size(); i++) {
		new_value_map.insert(std::pair<mvt_value, size_t>(values[i], i));
	}

	std::map<std::string, size_t> new_key_map;
	for (size_t i = 0; i < keys.size(); i++) {
		new_key_map.insert(std::pair<std::string, size_t>(keys[i], i));
	}

	for (size_t i = 0; i < features.size(); i++) {
		for (size_t j = 1; j < features[i].tags.size(); j += 2) {
			mvt_value v = orig_values[features[i].tags[j]];
			auto f = new_value_map.find(v);

			if (f == new_value_map.end()) {
				std::string vs = v.toString();
				fprintf(stderr, "Internal error: value %s was lost\n", vs.c_str());
				exit(EXIT_FAILURE);
			}

			features[i].tags[j] = f->second;
		}

		for (size_t j = 0; j < features[i].tags.size(); j += 2) {
			std::string k = orig_keys[features[i].tags[j]];
			auto f = new_key_map.find(k);

			if (f == new_key_map.end()) {
				fprintf(stderr, "Internal error: key %s was lost\n", k.c_str());
				exit(EXIT_FAILURE);
			}

			features[i].tags[j] = f->second;
		}
	}
}

mvt_value mvt_layer::decode_property(std::vector<unsigned long> const &property, size_t &off) const {
	int type = property[off] & 0x0F;
	mvt_value ret;

	switch (type) {
	case 0: /* string reference */
		ret.type = mvt_string;
		if (property[off] >> 4 >= string_values.size()) {
			fprintf(stderr, "Out of bounds string reference: %lu vs %zu\n", property[off] >> 4, string_values.size());
			exit(EXIT_FAILURE);
		}
		ret.string_value = string_values[property[off] >> 4];
		return ret;

	case 1: /* float reference */
		ret.type = mvt_float;
		if (property[off] >> 4 >= float_values.size()) {
			fprintf(stderr, "Out of bounds float reference: %lu vs %zu\n", property[off] >> 4, float_values.size());
			exit(EXIT_FAILURE);
		}
		ret.numeric_value.float_value = float_values[property[off] >> 4];
		return ret;

	case 2: /* double reference */
		ret.type = mvt_double;
		if (property[off] >> 4 >= double_values.size()) {
			fprintf(stderr, "Out of bounds double reference: %lu vs %zu\n", property[off] >> 4, double_values.size());
			exit(EXIT_FAILURE);
		}
		ret.numeric_value.double_value = double_values[property[off] >> 4];
		return ret;

	case 3: /* unsigned int reference */
		ret.type = mvt_uint;
		if (property[off] >> 4 >= uint64_values.size()) {
			fprintf(stderr, "Out of bounds uint reference: %lu vs %zu\n", property[off] >> 4, uint64_values.size());
			exit(EXIT_FAILURE);
		}
		ret.numeric_value.uint_value = uint64_values[property[off] >> 4];
		return ret;

	case 4: /* signed int reference */
		ret.type = mvt_sint;
		if (property[off] >> 4 >= uint64_values.size()) {
			fprintf(stderr, "Out of bounds sint reference: %lu vs %zu\n", property[off] >> 4, uint64_values.size());
			exit(EXIT_FAILURE);
		}
		ret.numeric_value.sint_value = protozero::decode_zigzag64(uint64_values[property[off] >> 4]);
		return ret;

	case 5: /* unsigned integer */
		ret.type = mvt_uint;
		ret.numeric_value.uint_value = property[off] >> 4;
		return ret;

	case 6: /* signed integer */
		ret.type = mvt_sint;
		ret.numeric_value.sint_value = protozero::decode_zigzag64(property[off] >> 4);
		return ret;

	case 7: /* boolean */
		if ((property[off] >> 4) == 0) {
			ret.type = mvt_null;
			ret.numeric_value.null_value = 0;
		} else {
			ret.type = mvt_bool;
			ret.numeric_value.bool_value = (property[off] >> 4) - 1;
		}
		return ret;

	case 8: /* list */
	{
		ret.type = mvt_list;
		size_t len = property[off] >> 4;
		off++;

		for (size_t i = 0; i < len; i++) {
			mvt_value v1 = decode_property(property, off);
			off++;

			ret.list_value.push_back(v1);
		}

		off--;  // so caller can increment
		return ret;
	}

	case 9: /* hash */
	{
		ret.type = mvt_hash;
		size_t len = property[off] >> 4;
		off++;

		for (size_t i = 0; i < len; i++) {
			if (property[off] >= keys.size()) {
				fprintf(stderr, "Out of bounds hash key reference\n");
				exit(EXIT_FAILURE);
			}

			mvt_value v1;
			v1.type = mvt_string;
			v1.string_value = keys[property[off]];
			off++;

			mvt_value v2 = decode_property(property, off);
			off++;

			ret.hash_keys.push_back(v1.string_value);
			ret.list_value.push_back(v2);
		}

		off--;  // so caller can increment
		return ret;
	}

	case 10: /* delta-encoded list */
	{
		ret.type = mvt_list;
		size_t len = property[off] >> 4;
		off++;

		if (off >= property.size()) {
			fprintf(stderr, "Not enough elements in list attribute\n");
			exit(EXIT_FAILURE);
		}
		size_t scaling = property[off];
		off++;

		if (scaling >= attribute_scalings.size()) {
			fprintf(stderr, "Reference to nonexistent attribute scaling\n");
			exit(EXIT_FAILURE);
		}

		long here = 0;

		for (size_t i = 0; i < len; i++) {
			if (off >= property.size()) {
				fprintf(stderr, "Not enough elements in list attribute\n");
				exit(EXIT_FAILURE);
			}
			unsigned long increment = property[off];
			off++;

			double val;

			if (increment == 0) {
				val = NAN;
			} else {
				long inc = protozero::decode_zigzag64(increment - 1);
				here += inc;
				val = attribute_scalings[scaling].base + attribute_scalings[scaling].multiplier * (here + attribute_scalings[scaling].offset);
			}

			mvt_value v;
			v.type = mvt_double;
			v.numeric_value.double_value = val;

			ret.list_value.push_back(v);
		}

		off--;  // so caller can increment
		return ret;
	}

	default:
		ret.type = mvt_string;
		ret.string_value = std::to_string(property[off]);
		return ret;
	}
}

bool is_integer(const char *s, long long *v) {
	errno = 0;
	char *endptr;

	*v = strtoll(s, &endptr, 0);
	if (*v == 0 && errno != 0) {
		return 0;
	}
	if ((*v == LLONG_MIN || *v == LLONG_MAX) && (errno == ERANGE || errno == EINVAL)) {
		return 0;
	}
	if (*endptr != '\0') {
		// Special case: If it is an integer followed by .0000 or similar,
		// it is still an integer

		if (*endptr != '.') {
			return 0;
		}
		endptr++;
		for (; *endptr != '\0'; endptr++) {
			if (*endptr != '0') {
				return 0;
			}
		}

		return 1;
	}

	return 1;
}

bool is_unsigned_integer(const char *s, unsigned long long *v) {
	errno = 0;
	char *endptr;

	// Special check because MacOS stroull() returns 1
	// for -18446744073709551615
	while (isspace(*s)) {
		s++;
	}
	if (*s == '-') {
		return 0;
	}

	*v = strtoull(s, &endptr, 0);
	if (*v == 0 && errno != 0) {
		return 0;
	}
	if ((*v == ULLONG_MAX) && (errno == ERANGE || errno == EINVAL)) {
		return 0;
	}
	if (*endptr != '\0') {
		// Special case: If it is an integer followed by .0000 or similar,
		// it is still an integer

		if (*endptr != '.') {
			return 0;
		}
		endptr++;
		for (; *endptr != '\0'; endptr++) {
			if (*endptr != '0') {
				return 0;
			}
		}

		return 1;
	}

	return 1;
}

mvt_value json_to_mvt_value(json_object *o) {
	mvt_value tv;

	if (o->type == JSON_NUMBER) {
		return stringified_to_mvt_value(mvt_double, o->string);
	} else if (o->type == JSON_STRING) {
		tv.type = mvt_string;
		tv.string_value = o->string;
	} else if (o->type == JSON_NULL) {
		tv.type = mvt_null;
		tv.numeric_value.null_value = 0;
	} else if (o->type == JSON_TRUE) {
		tv.type = mvt_bool;
		tv.numeric_value.bool_value = 1;
	} else if (o->type == JSON_FALSE) {
		tv.type = mvt_bool;
		tv.numeric_value.bool_value = 0;
	} else if (o->type == JSON_ARRAY) {
		tv.type = mvt_list;

		for (size_t i = 0; i < o->length; i++) {
			tv.list_value.push_back(json_to_mvt_value(o->array[i]));
		}
	} else if (o->type == JSON_HASH) {
		tv.type = mvt_hash;

		for (size_t i = 0; i < o->length; i++) {
			tv.hash_keys.push_back(o->keys[i]->string);
			tv.list_value.push_back(json_to_mvt_value(o->values[i]));
		}
	}

	return tv;
}

mvt_value stringified_to_mvt_value(int type, const char *s) {
	mvt_value tv;

	if (type == mvt_double) {
		long long v;
		unsigned long long uv;
		if (is_unsigned_integer(s, &uv)) {
			if (uv <= LLONG_MAX) {
				tv.type = mvt_int;
				tv.numeric_value.int_value = uv;
			} else {
				tv.type = mvt_uint;
				tv.numeric_value.uint_value = uv;
			}
		} else if (is_integer(s, &v)) {
			tv.type = mvt_sint;
			tv.numeric_value.sint_value = v;
		} else {
			errno = 0;
			char *endptr;

			float f = strtof(s, &endptr);

			if (endptr == s || ((f == HUGE_VAL || f == HUGE_VALF || f == HUGE_VALL) && errno == ERANGE)) {
				double d = strtod(s, &endptr);
				if (endptr == s || ((d == HUGE_VAL || d == HUGE_VALF || d == HUGE_VALL) && errno == ERANGE)) {
					fprintf(stderr, "Warning: numeric value %s could not be represented\n", s);
				}
				tv.type = mvt_double;
				tv.numeric_value.double_value = d;
			} else {
				double d = atof(s);
				if (f == d) {
					tv.type = mvt_float;
					tv.numeric_value.float_value = f;
				} else {
					// Conversion succeeded, but lost precision, so use double
					tv.type = mvt_double;
					tv.numeric_value.double_value = d;
				}
			}
		}
	} else if (type == mvt_bool) {
		tv.type = mvt_bool;
		tv.numeric_value.bool_value = (s[0] == 't');
	} else if (type == mvt_null) {
		tv.type = mvt_null;
		tv.numeric_value.null_value = 0;
	} else if (type == mvt_string) {
		tv.type = mvt_string;
		tv.string_value = s;
	} else if (type == mvt_hash || type == mvt_list) {
		json_pull *jp = json_begin_string(s);
		json_object *jo = json_read_tree(jp);
		if (jo == NULL) {
			fprintf(stderr, "Internal error: failed to reconstruct JSON in stringified_to_mvt_value %s\n", s);
			exit(EXIT_FAILURE);
		}

		if (jo->type == JSON_ARRAY) {
			tv.type = mvt_list;

			for (size_t i = 0; i < jo->length; i++) {
				tv.list_value.push_back(json_to_mvt_value(jo->array[i]));
			}
		} else if (jo->type == JSON_HASH) {
			tv.type = mvt_hash;

			for (size_t i = 0; i < jo->length; i++) {
				tv.hash_keys.push_back(jo->keys[i]->string);
				tv.list_value.push_back(json_to_mvt_value(jo->values[i]));
			}
		} else {
			fprintf(stderr, "Expected a list or hash, not %s\n", s);
			exit(EXIT_FAILURE);
		}

		json_free(jo);
		json_end(jp);
	} else {
		fprintf(stderr, "Internal error: unknown type\n");
		exit(EXIT_FAILURE);
	}

	return tv;
}

std::vector<mvt_geometry> to_feature(drawvec &geom, mvt_layer &layer, std::vector<unsigned long> &onto) {
	std::vector<mvt_geometry> out;

	std::map<std::string, std::vector<mvt_value>> node_attributes;

	for (size_t i = 0; i < geom.size(); i++) {
		mvt_geometry g(geom[i].op, geom[i].x, geom[i].y, geom[i].elevations);

		if (geom[i].attributes.size() != 0) {
			mvt_value v = stringified_to_mvt_value(mvt_hash, geom[i].attributes.c_str());

			// We have a list by name within each node;
			// we need a list by node within each name.

			for (size_t j = 0; j < v.hash_keys.size() && j < v.list_value.size(); j++) {
				if (node_attributes.count(v.hash_keys[j]) == 0) {
					mvt_value null_value;
					null_value.type = mvt_null;
					null_value.numeric_value.null_value = 0;

					std::vector<mvt_value> attrib;
					for (size_t k = 0; k < geom.size(); k++) {
						attrib.push_back(null_value);
					}

					node_attributes.insert(std::pair<std::string, std::vector<mvt_value>>(v.hash_keys[j], attrib));
				}

				auto f = node_attributes.find(v.hash_keys[j]);
				if (f == node_attributes.end()) {
					fprintf(stderr, "Internal error: node attribute lookup failure\n");
					exit(EXIT_FAILURE);
				}

				f->second[i] = v.list_value[j];
			}
		}

		out.push_back(g);
	}

	for (auto f : node_attributes) {
		std::string key = f.first;
		std::vector<mvt_value> val = f.second;

		mvt_value merged;
		merged.type = mvt_list;

		for (size_t i = 0; i < val.size(); i++) {
			merged.list_value.push_back(val[i]);
		}

		onto.push_back(layer.tag_v3_key(key));
		layer.tag_v3_value(merged, onto);
	}

	return out;
}
back to top