nbt_parsing.c - nbtfsutils - Rivoreo Source Code Repositories

 /*
  * -----------------------------------------------------------------------------
  * "THE BEER-WARE LICENSE" (Revision 42):
  * Lukas Niederbremer <webmaster@flippeh.de> and Clark Gaebel <cg.wowus.cg@gmail.com>
  * wrote this file. As long as you retain this notice you can do whatever you
  * want with this stuff. If we meet some day, and you think this stuff is worth
  * it, you can buy us a beer in return.
  * -----------------------------------------------------------------------------
  */
 #include "nbt.h"

 #include <assert.h>
 #include <errno.h>
 #include <inttypes.h>
 #include <stdio.h>
 #include <stdlib.h>
 #include <string.h>
 #include <zlib.h>

 /* works around a bug in icc */
 int fileno(FILE*);

 /* are we running on a little-endian system? */
 static inline int little_endian()
 {
     union {
         uint16_t i;
         char c[2];
     } t = { 0x0001 };

     return *t.c == 1;
 }

 static inline void* swap_bytes(void* s, size_t len)
 {
     for(char* b = s,
             * e = b + len - 1;
         b < e;
         b++, e--)
     {
         char t = *b;

         *b = *e;
         *e = t;
     }

     return s;
 }

 /* big endian to native endian. works in-place */
 static inline void* be2ne(void* s, size_t len)
 {
     return little_endian() ? swap_bytes(s, len) : s;
 }

 /* native endian to big endian. works the exact same as its inverse */
 #define ne2be be2ne

 /* A special form of memcpy which copies `n' bytes into `dest', then returns
  * `src' + n.
  */
 static inline const void* memscan(void* dest, const void* src, size_t n)
 {
     memcpy(dest, src, n);
     return (const char*)src + n;
 }

 /* Does a memscan, then goes from big endian to native endian on the
  * destination.
  */
 static inline const void* swapped_memscan(void* dest, const void* src, size_t n)
 {
     const void* ret = memscan(dest, src, n);
     return be2ne(dest, n), ret;
 }

 #define CHECKED_MALLOC(var, n, on_error) do { \
     if((var = malloc(n)) == NULL)             \
     {                                         \
         errno = NBT_EMEM;                     \
         on_error;                             \
     }                                         \
 } while(0)

 #define CHECKED_GZWRITE(fp, ptr, len) do {        \
     if(gzwrite((fp), (ptr), (len)) != (int)(len)) \
         return NBT_EGZ;                           \
 } while(0)

 /* Parses a tag, given a name (may be NULL) and a type. Fills in the payload. */
 static nbt_node* parse_unnamed_tag(nbt_type type, char* name, const char** memory, size_t* length);

 /*
  * Reads some bytes from the memory stream. This macro will read `n'
  * bytes into `dest', call either memscan or swapped_memscan depending on
  * `scanner', then fix the length. If anything funky goes down, `on_failure'
  * will be executed.
  */
 #define READ_GENERIC(dest, n, scanner, on_failure) do { \
     if(*length < (n)) { on_failure; }                   \
     *memory = scanner((dest), *memory, (n));            \
     *length -= (n);                                     \
 } while(0)

 /*
  * Reads a string from memory, moving the pointer and updating the length
  * appropriately. Returns NULL on failure.
  */
 static inline char* read_string(const char** memory, size_t* length)
 {
     int16_t string_length;
     char* ret = NULL;

     READ_GENERIC(&string_length, sizeof string_length, swapped_memscan, goto parse_error);

     if(string_length < 0)               goto parse_error;
     if(*length < (size_t)string_length) goto parse_error;

     CHECKED_MALLOC(ret, string_length + 1, goto parse_error);

     READ_GENERIC(ret, (size_t)string_length, memscan, goto parse_error);

     ret[string_length] = '\0'; /* don't forget to NULL-terminate ;) */
     return ret;

 parse_error:
     if(errno == NBT_OK)
         errno = NBT_ERR;

     free(ret);
     return NULL;
 }

 static inline struct nbt_byte_array read_byte_array(const char** memory, size_t* length)
 {
     struct nbt_byte_array ret;
     ret.data = NULL;

     READ_GENERIC(&ret.length, sizeof ret.length, swapped_memscan, goto parse_error);

     if(ret.length < 0) goto parse_error;

     CHECKED_MALLOC(ret.data, ret.length, goto parse_error);

     READ_GENERIC(ret.data, (size_t)ret.length, memscan, goto parse_error);

     return ret;

 parse_error:
     if(errno == NBT_OK)
         errno = NBT_ERR;

     free(ret.data);
     ret.data = NULL;
     return ret;
 }

 static struct tag_list* read_list(const char** memory, size_t* length)
 {
     uint8_t type;
     int32_t elems;
     struct tag_list* ret = NULL;

     READ_GENERIC(&type, sizeof type, swapped_memscan, goto parse_error);
     READ_GENERIC(&elems, sizeof elems, swapped_memscan, goto parse_error);

     CHECKED_MALLOC(ret, sizeof *ret, goto parse_error);

     ret->data = NULL; /* the first value in a list is a sentinel. don't even try to read it. */
     INIT_LIST_HEAD(&ret->entry);

     for(int32_t i = 0; i < elems; i++)
     {
         struct tag_list* new;

         CHECKED_MALLOC(new, sizeof *new, goto parse_error);

         new->data = parse_unnamed_tag((nbt_type)type, NULL, memory, length);

         if(new->data == NULL)
         {
             free(new);
             goto parse_error;
         }

         list_add_tail(&new->entry, &ret->entry);
     }

     return ret;

 parse_error:
     if(errno == NBT_OK)
         errno = NBT_ERR;

     nbt_free_list(ret);
     return NULL;
 }

 static struct tag_list* read_compound(const char** memory, size_t* length)
 {
     struct tag_list* ret;

     CHECKED_MALLOC(ret, sizeof *ret, goto parse_error);

     ret->data = NULL;
     INIT_LIST_HEAD(&ret->entry);

     for(;;)
     {
         uint8_t type;
         char* name = NULL;
         struct tag_list* new_entry;

         READ_GENERIC(&type, sizeof type, swapped_memscan, goto parse_error);

         if(type == 0) break; /* TAG_END == 0. We've hit the end of the list when type == TAG_END. */

         name = read_string(memory, length);
         if(name == NULL) goto parse_error;

         CHECKED_MALLOC(new_entry, sizeof *new_entry,
             free(name);
             goto parse_error;
         );

         new_entry->data = parse_unnamed_tag((nbt_type)type, name, memory, length);

         if(new_entry->data == NULL)
         {
             free(new_entry);
             free(name);
             goto parse_error;
         }

         list_add_tail(&new_entry->entry, &ret->entry);
     }

     return ret;

 parse_error:
     if(errno == NBT_OK)
         errno = NBT_ERR;
     nbt_free_list(ret);

     return NULL;
 }

 /*
  * Parses a tag, given a name (may be NULL) and a type. Fills in the payload.
  */
 static inline nbt_node* parse_unnamed_tag(nbt_type type, char* name, const char** memory, size_t* length)
 {
     nbt_node* node;

     CHECKED_MALLOC(node, sizeof *node, goto parse_error);

     node->type = type;
     node->name = name;

 #define COPY_INTO_PAYLOAD(payload_name) \
     READ_GENERIC(&node->payload.payload_name, sizeof node->payload.payload_name, swapped_memscan, goto parse_error);

     switch(type)
     {
     case TAG_BYTE:
         COPY_INTO_PAYLOAD(tag_byte);
         break;
     case TAG_SHORT:
         COPY_INTO_PAYLOAD(tag_short);
         break;
     case TAG_INT:
         COPY_INTO_PAYLOAD(tag_int);
         break;
     case TAG_LONG:
         COPY_INTO_PAYLOAD(tag_long);
         break;
     case TAG_FLOAT:
         COPY_INTO_PAYLOAD(tag_float);
         break;
     case TAG_DOUBLE:
         COPY_INTO_PAYLOAD(tag_double);
         break;
     case TAG_BYTE_ARRAY:
         node->payload.tag_byte_array = read_byte_array(memory, length);
         break;
     case TAG_STRING:
         node->payload.tag_string = read_string(memory, length);
         break;
     case TAG_LIST:
         node->payload.tag_list = read_list(memory, length);
         break;
     case TAG_COMPOUND:
         node->payload.tag_compound = read_compound(memory, length);
         break;

     default:
         goto parse_error; /* Unknown node or TAG_END. Either way, we shouldn't be parsing this. */
     }

 #undef COPY_INTO_PAYLOAD

     if(errno != NBT_OK) goto parse_error;

     return node;

 parse_error:
     if(errno == NBT_OK)
         errno = NBT_ERR;

     free(node);
     return NULL;
 }


 nbt_node* nbt_parse(const void* mem, size_t len)
 {
     errno = NBT_OK;

     const char** memory = (const char**)&mem;
     size_t* length = &len;

     /*
      * this needs to stay up here since it's referenced by the parse_error
      * block.
      */
     char* name = NULL;

     uint8_t type;
     READ_GENERIC(&type, sizeof type, memscan, goto parse_error);

     name = read_string(memory, length);
     if(name == NULL) goto parse_error;

     nbt_node* ret = parse_unnamed_tag((nbt_type)type, name, memory, length);

     /* We can't check for NULL, because it COULD be an empty tree. */
     if(errno != NBT_OK) goto parse_error;

     return ret;

 parse_error:
     if(errno == NBT_OK)
         errno = NBT_ERR;

     free(name);
     return NULL;
 }

 typedef struct {
     char*  d; /*  data  */
     size_t l; /* length */
 } buffer_t;

 /* parses the whole file into a buffer */
 static inline buffer_t __parse_file(gzFile fp)
 {
     buffer_t ret = { NULL, 0 };

     /* WARNING: This loop runs in O(n^2). TODO: Fix this! */
     for(;;)
     {
         { /* resize buffer */
             char* temp = realloc(ret.d, ret.l + 4096);
             if(temp == NULL) goto parse_error;
             ret.d = temp;
         }

         /* copy in */
         size_t bytes_read = gzread(fp, ret.d + ret.l, 4096);

         int err;
         gzerror(fp, &err);
         if(err) { errno = NBT_EGZ; goto parse_error; }

         if(bytes_read == 0) break;

         /* fix ret.l */
         ret.l += bytes_read;
     }

     return ret;

 parse_error:
     if(errno == NBT_OK)
         errno = NBT_EMEM;

     free(ret.d);
     ret.d = NULL;

     return ret;
 }

 /*
  * No incremental parsing goes on. We just dump the whole decompressed file into
  * memory then pass the job off to nbt_parse.
  */
 nbt_node* nbt_parse_file(FILE* fp)
 {
     nbt_node* ret;

     errno = NBT_OK;

     /*
      * We need to keep these declarations up here as opposed to where they're
      * used because they're referenced by the parse_error block.
      */
     buffer_t buf = { NULL, 0 };
     gzFile f = Z_NULL;

     if(fp == NULL) return NULL;

     int fd = fileno(fp);
     if(fd == -1)    goto parse_error;

     f = gzdopen(fd, "rb");
     if(f == Z_NULL) goto parse_error;

     buf = __parse_file(f);

     if(buf.d == NULL)      goto parse_error;
     if(gzclose(f) != Z_OK) goto parse_error;

     ret = nbt_parse(buf.d, buf.l);

     free(buf.d);

     return ret;

 parse_error:
     if(errno == NBT_OK)
         errno = NBT_EGZ;

     free(buf.d);

     if(f != Z_NULL)
         gzclose(f);

     return NULL;
 }

 /* spaces, not tabs ;) */
 static inline void indent(FILE* fp, size_t amount)
 {
     for(size_t i = 0; i < amount; i++)
         fprintf(fp, "    ");
 }

 static nbt_status __nbt_dump_ascii(const nbt_node* tree, FILE* fp, size_t ident);

 /* prints the node's name, or (null) if it has none. */
 #define SAFE_NAME(node) ((node)->name ? (node)->name : "<null>")

 static inline void dump_byte_array(const struct nbt_byte_array ba, FILE* fp)
 {
     assert(ba.length >= 0);

     fprintf(fp, "[ ");
     for(int32_t i = 0; i < ba.length; ++i)
         fprintf(fp, "%i ", (int)ba.data[i]);
     fprintf(fp, "]");
 }

 static inline nbt_status dump_list_contents_ascii(const struct tag_list* list, FILE* fp, size_t ident)
 {
     const struct list_head* pos;

     list_for_each(pos, &list->entry)
     {
         const struct tag_list* entry = list_entry(pos, const struct tag_list, entry);
         nbt_status err;

         if((err = __nbt_dump_ascii(entry->data, fp, ident)) != NBT_OK)
             return err;
     }

     return NBT_OK;
 }

 static inline nbt_status __nbt_dump_ascii(const nbt_node* tree, FILE* fp, size_t ident)
 {
     if(tree == NULL) return NBT_OK;

     indent(fp, ident);

     if(tree->type == TAG_BYTE)
         fprintf(fp, "TAG_Byte(\"%s\"): %i\n", SAFE_NAME(tree), (int)tree->payload.tag_byte);
     else if(tree->type == TAG_SHORT)
         fprintf(fp, "TAG_Short(\"%s\"): %i\n", SAFE_NAME(tree), (int)tree->payload.tag_short);
     else if(tree->type == TAG_INT)
         fprintf(fp, "TAG_Int(\"%s\"): %i\n", SAFE_NAME(tree), (int)tree->payload.tag_int);
     else if(tree->type == TAG_LONG)
         fprintf(fp, "TAG_Long(\"%s\"): %" PRIi64 "\n", SAFE_NAME(tree), tree->payload.tag_long);
     else if(tree->type == TAG_FLOAT)
         fprintf(fp, "TAG_Float(\"%s\"): %f\n", SAFE_NAME(tree), (double)tree->payload.tag_float);
     else if(tree->type == TAG_DOUBLE)
         fprintf(fp, "TAG_Double(\"%s\"): %f\n", SAFE_NAME(tree), tree->payload.tag_double);
     else if(tree->type == TAG_BYTE_ARRAY)
     {
         fprintf(fp, "TAG_Byte_Array(\"%s\"): ", SAFE_NAME(tree));
         dump_byte_array(tree->payload.tag_byte_array, fp);
         fprintf(fp, "\n");
     }
     else if(tree->type == TAG_STRING)
     {
         if(tree->payload.tag_string == NULL)
             return NBT_ERR;

         fprintf(fp, "TAG_String(\"%s\"): %s\n", SAFE_NAME(tree), tree->payload.tag_string);
     }
     else if(tree->type == TAG_LIST)
     {
         fprintf(fp, "TAG_List(\"%s\")\n", SAFE_NAME(tree));
         indent(fp, ident);
         fprintf(fp, "{\n");

         nbt_status err;
         if((err = dump_list_contents_ascii(tree->payload.tag_list, fp, ident + 1)) != NBT_OK)
             return err;

         indent(fp, ident);
         fprintf(fp, "}\n");
     }
     else if(tree->type == TAG_COMPOUND)
     {
         fprintf(fp, "TAG_Compound(\"%s\")\n", SAFE_NAME(tree));
         indent(fp, ident);
         fprintf(fp, "{\n");

         nbt_status err;
         if((err = dump_list_contents_ascii(tree->payload.tag_compound, fp, ident + 1)) != NBT_OK)
             return err;

         indent(fp, ident);
         fprintf(fp, "}\n");
     }

     else
         return NBT_ERR;

     return NBT_OK;
 }

 nbt_status nbt_dump_ascii(const nbt_node* tree, FILE* fp)
 {
     return __nbt_dump_ascii(tree, fp, 0);
 }

 static nbt_status dump_byte_array_binary(const struct nbt_byte_array ba, gzFile fp)
 {
     int32_t dumped_length = ba.length;

     ne2be(&dumped_length, sizeof dumped_length);

     CHECKED_GZWRITE(fp, &dumped_length, sizeof dumped_length);

     if(ba.length) assert(ba.data);

     CHECKED_GZWRITE(fp, ba.data, ba.length);

     return NBT_OK;
 }

 static nbt_status dump_string_binary(const char* name, gzFile fp)
 {
     assert(name);

     size_t len = strlen(name);

     if(len > 32767 /* SHORT_MAX */)
         return NBT_ERR;

     { /* dump the length */
         int16_t dumped_len = (int16_t)len;
         ne2be(&dumped_len, sizeof dumped_len);

         CHECKED_GZWRITE(fp, &dumped_len, sizeof dumped_len);
     }

     CHECKED_GZWRITE(fp, name, len);

     return NBT_OK;
 }

 /*
  * Is the list all one type? If yes, return the type. Otherwise, return
  * TAG_INVALID
  */
 static inline nbt_type list_is_homogenous(const struct tag_list* list)
 {
     nbt_type type = TAG_INVALID;

     const struct list_head* pos;
     list_for_each(pos, &list->entry)
     {
         const struct tag_list* cur = list_entry(pos, const struct tag_list, entry);

         assert(cur->data->type != TAG_INVALID);

         if(cur->data->type == TAG_INVALID)
             return TAG_INVALID;

         /* if we're the first type, just set it to our current type */
         if(type == TAG_INVALID) type = cur->data->type;

         if(type != cur->data->type)
             return TAG_INVALID;
     }

     return type;
 }

 static nbt_status __dump_binary(const nbt_node*, bool, gzFile);

 static nbt_status dump_list_binary(const struct tag_list* list, gzFile fp)
 {
     nbt_type type;

     size_t len = list_length(&list->entry);

     if(len == 0) /* empty lists can just be silently ignored */
         return NBT_OK;

     if(len > 2147483647 /* INT_MAX */)
         return NBT_ERR;

     assert(list_is_homogenous(list) != TAG_INVALID);
     if((type = list_is_homogenous(list)) == TAG_INVALID)
         return NBT_ERR;

     {
         int8_t _type = (int8_t)type;
         ne2be(&_type, sizeof _type); /* unnecessary, but left in to keep similar code looking similar */
         CHECKED_GZWRITE(fp, &_type, sizeof _type);
     }

     {
         int32_t dumped_len = (int32_t)len;
         ne2be(&dumped_len, sizeof dumped_len);
         CHECKED_GZWRITE(fp, &dumped_len, sizeof dumped_len);
     }

     const struct list_head* pos;
     list_for_each(pos, &list->entry)
     {
         const struct tag_list* entry = list_entry(pos, const struct tag_list, entry);
         nbt_status ret;

         if((ret = __dump_binary(entry->data, false, fp)) != NBT_OK)
             return ret;
     }

     return NBT_OK;
 }

 static nbt_status dump_compound_binary(const struct tag_list* list, gzFile fp)
 {
     if(list_empty(&list->entry)) /* empty lists can just be silently ignored */
         return NBT_OK;

     const struct list_head* pos;
     list_for_each(pos, &list->entry)
     {
         const struct tag_list* entry = list_entry(pos, const struct tag_list, entry);
         nbt_status ret;

         if((ret = __dump_binary(entry->data, true, fp)) != NBT_OK)
             return ret;
     }

     /* write out TAG_End */
     uint8_t zero = 0;
     CHECKED_GZWRITE(fp, &zero, sizeof zero);

     return NBT_OK;
 }

 /*
  * @param dump_type   Should we dump the type, or just skip it? We need to skip
  *                    when dumping lists, because the list header already says
  *                    the type.
  */
 static inline nbt_status __dump_binary(const nbt_node* tree, bool dump_type, gzFile fp)
 {
     if(dump_type)
     { /* write out the type */
         int8_t type = (int8_t)tree->type;

         CHECKED_GZWRITE(fp, &type, sizeof type);
     }

     if(tree->name)
     {
         nbt_status err;

         if((err = dump_string_binary(tree->name, fp)) != NBT_OK)
             return err;
     }

 #define DUMP_NUM(type, x) do {               \
     type temp = x;                           \
     ne2be(&temp, sizeof temp);               \
     CHECKED_GZWRITE(fp, &temp, sizeof temp); \
 } while(0)

     if(tree->type == TAG_BYTE)
         DUMP_NUM(int8_t, tree->payload.tag_byte);
     else if(tree->type == TAG_SHORT)
         DUMP_NUM(int16_t, tree->payload.tag_short);
     else if(tree->type == TAG_INT)
         DUMP_NUM(int32_t, tree->payload.tag_int);
     else if(tree->type == TAG_LONG)
         DUMP_NUM(int64_t, tree->payload.tag_long);
     else if(tree->type == TAG_FLOAT)
         DUMP_NUM(float, tree->payload.tag_float);
     else if(tree->type == TAG_DOUBLE)
         DUMP_NUM(double, tree->payload.tag_double);
     else if(tree->type == TAG_BYTE_ARRAY)
         return dump_byte_array_binary(tree->payload.tag_byte_array, fp);
     else if(tree->type == TAG_STRING)
         return dump_string_binary(tree->payload.tag_string, fp);
     else if(tree->type == TAG_LIST)
         return dump_list_binary(tree->payload.tag_list, fp);
     else if(tree->type == TAG_COMPOUND)
         return dump_compound_binary(tree->payload.tag_compound, fp);

     else
         return NBT_ERR;

     return NBT_OK;

 #undef DUMP_NUM
 }

 nbt_status nbt_dump_binary(const nbt_node* tree, FILE* fp)
 {
     if(tree == NULL) return NBT_OK;

     int fd = fileno(fp);
     if(fd == -1) return NBT_EGZ;

     gzFile f = gzdopen(fd, "wb");
     if(f == Z_NULL) return NBT_EGZ;

     nbt_status r = __dump_binary(tree, true, f);

     gzclose(f);

     return r;
 }
	/*
	* -----------------------------------------------------------------------------
	* "THE BEER-WARE LICENSE" (Revision 42):
	* Lukas Niederbremer <webmaster@flippeh.de> and Clark Gaebel <cg.wowus.cg@gmail.com>
	* wrote this file. As long as you retain this notice you can do whatever you
	* want with this stuff. If we meet some day, and you think this stuff is worth
	* it, you can buy us a beer in return.
	* -----------------------------------------------------------------------------
	*/
	#include "nbt.h"

	#include <assert.h>
	#include <errno.h>
	#include <inttypes.h>
	#include <stdio.h>
	#include <stdlib.h>
	#include <string.h>
	#include <zlib.h>

	/* works around a bug in icc */
	int fileno(FILE*);

	/* are we running on a little-endian system? */
	static inline int little_endian()
	{
	union {
	uint16_t i;
	char c[2];
	} t = { 0x0001 };

	return *t.c == 1;
	}

	static inline void* swap_bytes(void* s, size_t len)
	{
	for(char* b = s,
	* e = b + len - 1;
	b < e;
	b++, e--)
	{
	char t = *b;

	b = e;
	*e = t;
	}

	return s;
	}

	/* big endian to native endian. works in-place */
	static inline void* be2ne(void* s, size_t len)
	{
	return little_endian() ? swap_bytes(s, len) : s;
	}

	/* native endian to big endian. works the exact same as its inverse */
	#define ne2be be2ne

	/* A special form of memcpy which copies `n' bytes into `dest', then returns
	* `src' + n.
	*/
	static inline const void* memscan(void* dest, const void* src, size_t n)
	{
	memcpy(dest, src, n);
	return (const char*)src + n;
	}

	/* Does a memscan, then goes from big endian to native endian on the
	* destination.
	*/
	static inline const void* swapped_memscan(void* dest, const void* src, size_t n)
	{
	const void* ret = memscan(dest, src, n);
	return be2ne(dest, n), ret;
	}

	#define CHECKED_MALLOC(var, n, on_error) do { \
	if((var = malloc(n)) == NULL) \
	{ \
	errno = NBT_EMEM; \
	on_error; \
	} \
	} while(0)

	#define CHECKED_GZWRITE(fp, ptr, len) do { \
	if(gzwrite((fp), (ptr), (len)) != (int)(len)) \
	return NBT_EGZ; \
	} while(0)

	/* Parses a tag, given a name (may be NULL) and a type. Fills in the payload. */
	static nbt_node* parse_unnamed_tag(nbt_type type, char* name, const char** memory, size_t* length);

	/*
	* Reads some bytes from the memory stream. This macro will read `n'
	* bytes into `dest', call either memscan or swapped_memscan depending on
	* `scanner', then fix the length. If anything funky goes down, `on_failure'
	* will be executed.
	*/
	#define READ_GENERIC(dest, n, scanner, on_failure) do { \
	if(*length < (n)) { on_failure; } \
	memory = scanner((dest), memory, (n)); \
	*length -= (n); \
	} while(0)

	/*
	* Reads a string from memory, moving the pointer and updating the length
	* appropriately. Returns NULL on failure.
	*/
	static inline char* read_string(const char** memory, size_t* length)
	{
	int16_t string_length;
	char* ret = NULL;

	READ_GENERIC(&string_length, sizeof string_length, swapped_memscan, goto parse_error);

	if(string_length < 0) goto parse_error;
	if(*length < (size_t)string_length) goto parse_error;

	CHECKED_MALLOC(ret, string_length + 1, goto parse_error);

	READ_GENERIC(ret, (size_t)string_length, memscan, goto parse_error);

	ret[string_length] = '\0'; /* don't forget to NULL-terminate ;) */
	return ret;

	parse_error:
	if(errno == NBT_OK)
	errno = NBT_ERR;

	free(ret);
	return NULL;
	}

	static inline struct nbt_byte_array read_byte_array(const char** memory, size_t* length)
	{
	struct nbt_byte_array ret;
	ret.data = NULL;

	READ_GENERIC(&ret.length, sizeof ret.length, swapped_memscan, goto parse_error);

	if(ret.length < 0) goto parse_error;

	CHECKED_MALLOC(ret.data, ret.length, goto parse_error);

	READ_GENERIC(ret.data, (size_t)ret.length, memscan, goto parse_error);

	return ret;

	parse_error:
	if(errno == NBT_OK)
	errno = NBT_ERR;

	free(ret.data);
	ret.data = NULL;
	return ret;
	}

	static struct tag_list* read_list(const char** memory, size_t* length)
	{
	uint8_t type;
	int32_t elems;
	struct tag_list* ret = NULL;

	READ_GENERIC(&type, sizeof type, swapped_memscan, goto parse_error);
	READ_GENERIC(&elems, sizeof elems, swapped_memscan, goto parse_error);

	CHECKED_MALLOC(ret, sizeof *ret, goto parse_error);

	ret->data = NULL; /* the first value in a list is a sentinel. don't even try to read it. */
	INIT_LIST_HEAD(&ret->entry);

	for(int32_t i = 0; i < elems; i++)
	{
	struct tag_list* new;

	CHECKED_MALLOC(new, sizeof *new, goto parse_error);

	new->data = parse_unnamed_tag((nbt_type)type, NULL, memory, length);

	if(new->data == NULL)
	{
	free(new);
	goto parse_error;
	}

	list_add_tail(&new->entry, &ret->entry);
	}

	return ret;

	parse_error:
	if(errno == NBT_OK)
	errno = NBT_ERR;

	nbt_free_list(ret);
	return NULL;
	}

	static struct tag_list* read_compound(const char** memory, size_t* length)
	{
	struct tag_list* ret;

	CHECKED_MALLOC(ret, sizeof *ret, goto parse_error);

	ret->data = NULL;
	INIT_LIST_HEAD(&ret->entry);

	for(;;)
	{
	uint8_t type;
	char* name = NULL;
	struct tag_list* new_entry;

	READ_GENERIC(&type, sizeof type, swapped_memscan, goto parse_error);

	if(type == 0) break; /* TAG_END == 0. We've hit the end of the list when type == TAG_END. */

	name = read_string(memory, length);
	if(name == NULL) goto parse_error;

	CHECKED_MALLOC(new_entry, sizeof *new_entry,
	free(name);
	goto parse_error;
	);

	new_entry->data = parse_unnamed_tag((nbt_type)type, name, memory, length);

	if(new_entry->data == NULL)
	{
	free(new_entry);
	free(name);
	goto parse_error;
	}

	list_add_tail(&new_entry->entry, &ret->entry);
	}

	return ret;

	parse_error:
	if(errno == NBT_OK)
	errno = NBT_ERR;
	nbt_free_list(ret);

	return NULL;
	}

	/*
	* Parses a tag, given a name (may be NULL) and a type. Fills in the payload.
	*/
	static inline nbt_node* parse_unnamed_tag(nbt_type type, char* name, const char** memory, size_t* length)
	{
	nbt_node* node;

	CHECKED_MALLOC(node, sizeof *node, goto parse_error);

	node->type = type;
	node->name = name;

	#define COPY_INTO_PAYLOAD(payload_name) \
	READ_GENERIC(&node->payload.payload_name, sizeof node->payload.payload_name, swapped_memscan, goto parse_error);

	switch(type)
	{
	case TAG_BYTE:
	COPY_INTO_PAYLOAD(tag_byte);
	break;
	case TAG_SHORT:
	COPY_INTO_PAYLOAD(tag_short);
	break;
	case TAG_INT:
	COPY_INTO_PAYLOAD(tag_int);
	break;
	case TAG_LONG:
	COPY_INTO_PAYLOAD(tag_long);
	break;
	case TAG_FLOAT:
	COPY_INTO_PAYLOAD(tag_float);
	break;
	case TAG_DOUBLE:
	COPY_INTO_PAYLOAD(tag_double);
	break;
	case TAG_BYTE_ARRAY:
	node->payload.tag_byte_array = read_byte_array(memory, length);
	break;
	case TAG_STRING:
	node->payload.tag_string = read_string(memory, length);
	break;
	case TAG_LIST:
	node->payload.tag_list = read_list(memory, length);
	break;
	case TAG_COMPOUND:
	node->payload.tag_compound = read_compound(memory, length);
	break;

	default:
	goto parse_error; /* Unknown node or TAG_END. Either way, we shouldn't be parsing this. */
	}

	#undef COPY_INTO_PAYLOAD

	if(errno != NBT_OK) goto parse_error;

	return node;

	parse_error:
	if(errno == NBT_OK)
	errno = NBT_ERR;

	free(node);
	return NULL;
	}


	nbt_node* nbt_parse(const void* mem, size_t len)
	{
	errno = NBT_OK;

	const char memory = (const char)&mem;
	size_t* length = &len;

	/*
	* this needs to stay up here since it's referenced by the parse_error
	* block.
	*/
	char* name = NULL;

	uint8_t type;
	READ_GENERIC(&type, sizeof type, memscan, goto parse_error);

	name = read_string(memory, length);
	if(name == NULL) goto parse_error;

	nbt_node* ret = parse_unnamed_tag((nbt_type)type, name, memory, length);

	/* We can't check for NULL, because it COULD be an empty tree. */
	if(errno != NBT_OK) goto parse_error;

	return ret;

	parse_error:
	if(errno == NBT_OK)
	errno = NBT_ERR;

	free(name);
	return NULL;
	}

	typedef struct {
	char* d; /* data */
	size_t l; /* length */
	} buffer_t;

	/* parses the whole file into a buffer */
	static inline buffer_t __parse_file(gzFile fp)
	{
	buffer_t ret = { NULL, 0 };

	/* WARNING: This loop runs in O(n^2). TODO: Fix this! */
	for(;;)
	{
	{ /* resize buffer */
	char* temp = realloc(ret.d, ret.l + 4096);
	if(temp == NULL) goto parse_error;
	ret.d = temp;
	}

	/* copy in */
	size_t bytes_read = gzread(fp, ret.d + ret.l, 4096);

	int err;
	gzerror(fp, &err);
	if(err) { errno = NBT_EGZ; goto parse_error; }

	if(bytes_read == 0) break;

	/* fix ret.l */
	ret.l += bytes_read;
	}

	return ret;

	parse_error:
	if(errno == NBT_OK)
	errno = NBT_EMEM;

	free(ret.d);
	ret.d = NULL;

	return ret;
	}

	/*
	* No incremental parsing goes on. We just dump the whole decompressed file into
	* memory then pass the job off to nbt_parse.
	*/
	nbt_node* nbt_parse_file(FILE* fp)
	{
	nbt_node* ret;

	errno = NBT_OK;

	/*
	* We need to keep these declarations up here as opposed to where they're
	* used because they're referenced by the parse_error block.
	*/
	buffer_t buf = { NULL, 0 };
	gzFile f = Z_NULL;

	if(fp == NULL) return NULL;

	int fd = fileno(fp);
	if(fd == -1) goto parse_error;

	f = gzdopen(fd, "rb");
	if(f == Z_NULL) goto parse_error;

	buf = __parse_file(f);

	if(buf.d == NULL) goto parse_error;
	if(gzclose(f) != Z_OK) goto parse_error;

	ret = nbt_parse(buf.d, buf.l);

	free(buf.d);

	return ret;

	parse_error:
	if(errno == NBT_OK)
	errno = NBT_EGZ;

	free(buf.d);

	if(f != Z_NULL)
	gzclose(f);

	return NULL;
	}

	/* spaces, not tabs ;) */
	static inline void indent(FILE* fp, size_t amount)
	{
	for(size_t i = 0; i < amount; i++)
	fprintf(fp, " ");
	}

	static nbt_status __nbt_dump_ascii(const nbt_node* tree, FILE* fp, size_t ident);

	/* prints the node's name, or (null) if it has none. */
	#define SAFE_NAME(node) ((node)->name ? (node)->name : "<null>")

	static inline void dump_byte_array(const struct nbt_byte_array ba, FILE* fp)
	{
	assert(ba.length >= 0);

	fprintf(fp, "[ ");
	for(int32_t i = 0; i < ba.length; ++i)
	fprintf(fp, "%i ", (int)ba.data[i]);
	fprintf(fp, "]");
	}

	static inline nbt_status dump_list_contents_ascii(const struct tag_list* list, FILE* fp, size_t ident)
	{
	const struct list_head* pos;

	list_for_each(pos, &list->entry)
	{
	const struct tag_list* entry = list_entry(pos, const struct tag_list, entry);
	nbt_status err;

	if((err = __nbt_dump_ascii(entry->data, fp, ident)) != NBT_OK)
	return err;
	}

	return NBT_OK;
	}

	static inline nbt_status __nbt_dump_ascii(const nbt_node* tree, FILE* fp, size_t ident)
	{
	if(tree == NULL) return NBT_OK;

	indent(fp, ident);

	if(tree->type == TAG_BYTE)
	fprintf(fp, "TAG_Byte(\"%s\"): %i\n", SAFE_NAME(tree), (int)tree->payload.tag_byte);
	else if(tree->type == TAG_SHORT)
	fprintf(fp, "TAG_Short(\"%s\"): %i\n", SAFE_NAME(tree), (int)tree->payload.tag_short);
	else if(tree->type == TAG_INT)
	fprintf(fp, "TAG_Int(\"%s\"): %i\n", SAFE_NAME(tree), (int)tree->payload.tag_int);
	else if(tree->type == TAG_LONG)
	fprintf(fp, "TAG_Long(\"%s\"): %" PRIi64 "\n", SAFE_NAME(tree), tree->payload.tag_long);
	else if(tree->type == TAG_FLOAT)
	fprintf(fp, "TAG_Float(\"%s\"): %f\n", SAFE_NAME(tree), (double)tree->payload.tag_float);
	else if(tree->type == TAG_DOUBLE)
	fprintf(fp, "TAG_Double(\"%s\"): %f\n", SAFE_NAME(tree), tree->payload.tag_double);
	else if(tree->type == TAG_BYTE_ARRAY)
	{
	fprintf(fp, "TAG_Byte_Array(\"%s\"): ", SAFE_NAME(tree));
	dump_byte_array(tree->payload.tag_byte_array, fp);
	fprintf(fp, "\n");
	}
	else if(tree->type == TAG_STRING)
	{
	if(tree->payload.tag_string == NULL)
	return NBT_ERR;

	fprintf(fp, "TAG_String(\"%s\"): %s\n", SAFE_NAME(tree), tree->payload.tag_string);
	}
	else if(tree->type == TAG_LIST)
	{
	fprintf(fp, "TAG_List(\"%s\")\n", SAFE_NAME(tree));
	indent(fp, ident);
	fprintf(fp, "{\n");

	nbt_status err;
	if((err = dump_list_contents_ascii(tree->payload.tag_list, fp, ident + 1)) != NBT_OK)
	return err;

	indent(fp, ident);
	fprintf(fp, "}\n");
	}
	else if(tree->type == TAG_COMPOUND)
	{
	fprintf(fp, "TAG_Compound(\"%s\")\n", SAFE_NAME(tree));
	indent(fp, ident);
	fprintf(fp, "{\n");

	nbt_status err;
	if((err = dump_list_contents_ascii(tree->payload.tag_compound, fp, ident + 1)) != NBT_OK)
	return err;

	indent(fp, ident);
	fprintf(fp, "}\n");
	}

	else
	return NBT_ERR;

	return NBT_OK;
	}

	nbt_status nbt_dump_ascii(const nbt_node* tree, FILE* fp)
	{
	return __nbt_dump_ascii(tree, fp, 0);
	}

	static nbt_status dump_byte_array_binary(const struct nbt_byte_array ba, gzFile fp)
	{
	int32_t dumped_length = ba.length;

	ne2be(&dumped_length, sizeof dumped_length);

	CHECKED_GZWRITE(fp, &dumped_length, sizeof dumped_length);

	if(ba.length) assert(ba.data);

	CHECKED_GZWRITE(fp, ba.data, ba.length);

	return NBT_OK;
	}

	static nbt_status dump_string_binary(const char* name, gzFile fp)
	{
	assert(name);

	size_t len = strlen(name);

	if(len > 32767 /* SHORT_MAX */)
	return NBT_ERR;

	{ /* dump the length */
	int16_t dumped_len = (int16_t)len;
	ne2be(&dumped_len, sizeof dumped_len);

	CHECKED_GZWRITE(fp, &dumped_len, sizeof dumped_len);
	}

	CHECKED_GZWRITE(fp, name, len);

	return NBT_OK;
	}

	/*
	* Is the list all one type? If yes, return the type. Otherwise, return
	* TAG_INVALID
	*/
	static inline nbt_type list_is_homogenous(const struct tag_list* list)
	{
	nbt_type type = TAG_INVALID;

	const struct list_head* pos;
	list_for_each(pos, &list->entry)
	{
	const struct tag_list* cur = list_entry(pos, const struct tag_list, entry);

	assert(cur->data->type != TAG_INVALID);

	if(cur->data->type == TAG_INVALID)
	return TAG_INVALID;

	/* if we're the first type, just set it to our current type */
	if(type == TAG_INVALID) type = cur->data->type;

	if(type != cur->data->type)
	return TAG_INVALID;
	}

	return type;
	}

	static nbt_status __dump_binary(const nbt_node*, bool, gzFile);

	static nbt_status dump_list_binary(const struct tag_list* list, gzFile fp)
	{
	nbt_type type;

	size_t len = list_length(&list->entry);

	if(len == 0) /* empty lists can just be silently ignored */
	return NBT_OK;

	if(len > 2147483647 /* INT_MAX */)
	return NBT_ERR;

	assert(list_is_homogenous(list) != TAG_INVALID);
	if((type = list_is_homogenous(list)) == TAG_INVALID)
	return NBT_ERR;

	{
	int8_t _type = (int8_t)type;
	ne2be(&_type, sizeof _type); /* unnecessary, but left in to keep similar code looking similar */
	CHECKED_GZWRITE(fp, &_type, sizeof _type);
	}

	{
	int32_t dumped_len = (int32_t)len;
	ne2be(&dumped_len, sizeof dumped_len);
	CHECKED_GZWRITE(fp, &dumped_len, sizeof dumped_len);
	}

	const struct list_head* pos;
	list_for_each(pos, &list->entry)
	{
	const struct tag_list* entry = list_entry(pos, const struct tag_list, entry);
	nbt_status ret;

	if((ret = __dump_binary(entry->data, false, fp)) != NBT_OK)
	return ret;
	}

	return NBT_OK;
	}

	static nbt_status dump_compound_binary(const struct tag_list* list, gzFile fp)
	{
	if(list_empty(&list->entry)) /* empty lists can just be silently ignored */
	return NBT_OK;

	const struct list_head* pos;
	list_for_each(pos, &list->entry)
	{
	const struct tag_list* entry = list_entry(pos, const struct tag_list, entry);
	nbt_status ret;

	if((ret = __dump_binary(entry->data, true, fp)) != NBT_OK)
	return ret;
	}

	/* write out TAG_End */
	uint8_t zero = 0;
	CHECKED_GZWRITE(fp, &zero, sizeof zero);

	return NBT_OK;
	}

	/*
	* @param dump_type Should we dump the type, or just skip it? We need to skip
	* when dumping lists, because the list header already says
	* the type.
	*/
	static inline nbt_status __dump_binary(const nbt_node* tree, bool dump_type, gzFile fp)
	{
	if(dump_type)
	{ /* write out the type */
	int8_t type = (int8_t)tree->type;

	CHECKED_GZWRITE(fp, &type, sizeof type);
	}

	if(tree->name)
	{
	nbt_status err;

	if((err = dump_string_binary(tree->name, fp)) != NBT_OK)
	return err;
	}

	#define DUMP_NUM(type, x) do { \
	type temp = x; \
	ne2be(&temp, sizeof temp); \
	CHECKED_GZWRITE(fp, &temp, sizeof temp); \
	} while(0)

	if(tree->type == TAG_BYTE)
	DUMP_NUM(int8_t, tree->payload.tag_byte);
	else if(tree->type == TAG_SHORT)
	DUMP_NUM(int16_t, tree->payload.tag_short);
	else if(tree->type == TAG_INT)
	DUMP_NUM(int32_t, tree->payload.tag_int);
	else if(tree->type == TAG_LONG)
	DUMP_NUM(int64_t, tree->payload.tag_long);
	else if(tree->type == TAG_FLOAT)
	DUMP_NUM(float, tree->payload.tag_float);
	else if(tree->type == TAG_DOUBLE)
	DUMP_NUM(double, tree->payload.tag_double);
	else if(tree->type == TAG_BYTE_ARRAY)
	return dump_byte_array_binary(tree->payload.tag_byte_array, fp);
	else if(tree->type == TAG_STRING)
	return dump_string_binary(tree->payload.tag_string, fp);
	else if(tree->type == TAG_LIST)
	return dump_list_binary(tree->payload.tag_list, fp);
	else if(tree->type == TAG_COMPOUND)
	return dump_compound_binary(tree->payload.tag_compound, fp);

	else
	return NBT_ERR;

	return NBT_OK;

	#undef DUMP_NUM
	}

	nbt_status nbt_dump_binary(const nbt_node* tree, FILE* fp)
	{
	if(tree == NULL) return NBT_OK;

	int fd = fileno(fp);
	if(fd == -1) return NBT_EGZ;

	gzFile f = gzdopen(fd, "wb");
	if(f == Z_NULL) return NBT_EGZ;

	nbt_status r = __dump_binary(tree, true, f);

	gzclose(f);

	return r;
	}