From d1853fc98e5745fb1a5bc0a289954874805ecffd Mon Sep 17 00:00:00 2001
From: Brendan Hansen <brendan.f.hansen@gmail.com>
Date: Sun, 16 Jan 2022 14:40:56 -0600
Subject: [PATCH] lots of changes

---
 lib/stb_image.c                             |   93 +
 lib/stb_image.h                             | 7897 +++++++++++++++++++
 lib/stb_image.onyx                          |   13 +
 run_tree/assets/shaders/world_fragment.glsl |    6 +-
 run_tree/assets/shaders/world_vertex.glsl   |    9 +-
 run_tree/assets/textures/block.png          |  Bin 0 -> 2406 bytes
 run_tree/lib/stb_image.so                   |  Bin 0 -> 156624 bytes
 run_tree/run.sh                             |    2 +-
 src/build.onyx                              |   16 +-
 src/chunk.onyx                              |   59 +-
 src/input.onyx                              |    2 +-
 src/main.onyx                               |    6 +
 src/mesh.onyx                               |   12 +-
 src/physics.onyx                            |    2 +-
 src/player.onyx                             |    4 +-
 src/texture.onyx                            |   38 +
 src/world.onyx                              |   10 +-
 src/worldgen.onyx                           |   20 +
 18 files changed, 8147 insertions(+), 42 deletions(-)
 create mode 100644 lib/stb_image.c
 create mode 100644 lib/stb_image.h
 create mode 100644 lib/stb_image.onyx
 create mode 100644 run_tree/assets/textures/block.png
 create mode 100755 run_tree/lib/stb_image.so
 create mode 100644 src/texture.onyx
 create mode 100644 src/worldgen.onyx

diff --git a/lib/stb_image.c b/lib/stb_image.c
new file mode 100644
index 0000000..7be2139
--- /dev/null
+++ b/lib/stb_image.c
@@ -0,0 +1,93 @@
+#define ONYX_LIBRARY_NAME stb_image
+#include "onyx_library.h"
+
+static wasm_func_t* stbi_heap_alloc = NULL; // cached export handle, resolved on first use
+// STBI_MALLOC hook: asks the wasm export "stbi_heap_alloc" for `size` bytes; returns NULL when it yields offset 0.
+static void *__onyx_stbi_heap_alloc_wrapper(int size) {
+    if (stbi_heap_alloc == NULL) {
+        wasm_extern_t *stbi_heap_alloc_extern = runtime->wasm_extern_lookup_by_name(runtime->wasm_module, runtime->wasm_instance, "stbi_heap_alloc");
+        stbi_heap_alloc = runtime->wasm_extern_as_func(stbi_heap_alloc_extern);
+        assert(stbi_heap_alloc != NULL);
+    }
+
+    wasm_val_t args[] = { WASM_I32_VAL(size) };
+    wasm_val_t results[] = { WASM_I32_VAL(0) }; // pre-zeroed: stays offset 0 if the call writes no result
+    wasm_val_vec_t args_arr = WASM_ARRAY_VEC(args);
+    wasm_val_vec_t results_arr = WASM_ARRAY_VEC(results);
+    runtime->wasm_func_call(stbi_heap_alloc, &args_arr, &results_arr);
+    return results[0].of.i32 != 0 ? ONYX_PTR(results[0].of.i32) : NULL; // offset 0 must reach stb_image as NULL
+}
+
+static wasm_func_t* stbi_heap_resize = NULL; // cached export handle, resolved on first use
+// STBI_REALLOC hook: resizes `ptr` to `size` bytes via the wasm export "stbi_heap_resize"; NULL when it yields offset 0.
+static void *__onyx_stbi_heap_resize_wrapper(void* ptr, int size) {
+    if (stbi_heap_resize == NULL) {
+        wasm_extern_t *stbi_heap_resize_extern = runtime->wasm_extern_lookup_by_name(runtime->wasm_module, runtime->wasm_instance, "stbi_heap_resize");
+        stbi_heap_resize = runtime->wasm_extern_as_func(stbi_heap_resize_extern);
+        assert(stbi_heap_resize != NULL); // fail loudly on a missing export, like the alloc wrapper does
+    }
+    // Turn the host pointer back into an offset from the wasm memory base; a NULL pointer is sent as offset 0.
+    int onyx_ptr = 0;
+    if (ptr != NULL) onyx_ptr = (int) ((char*) ptr - runtime->wasm_memory_data(runtime->wasm_memory));
+    wasm_val_t args[] = { WASM_I32_VAL(onyx_ptr), WASM_I32_VAL(size) };
+    wasm_val_t results[] = { WASM_I32_VAL(0) }; // pre-zeroed: stays offset 0 if the call writes no result
+    wasm_val_vec_t args_arr = WASM_ARRAY_VEC(args);
+    wasm_val_vec_t results_arr = WASM_ARRAY_VEC(results);
+    runtime->wasm_func_call(stbi_heap_resize, &args_arr, &results_arr);
+    return results[0].of.i32 != 0 ? ONYX_PTR(results[0].of.i32) : NULL; // offset 0 must reach stb_image as NULL
+}
+
+static wasm_func_t* stbi_heap_free = NULL; // cached export handle, resolved on first use
+// STBI_FREE hook: releases `ptr` through the wasm export "stbi_heap_free"; a NULL pointer is a no-op.
+static void __onyx_stbi_heap_free_wrapper(void *ptr) {
+    if (ptr == NULL) return;
+
+    if (stbi_heap_free == NULL) {
+        wasm_extern_t *stbi_heap_free_extern = runtime->wasm_extern_lookup_by_name(runtime->wasm_module, runtime->wasm_instance, "stbi_heap_free");
+        stbi_heap_free = runtime->wasm_extern_as_func(stbi_heap_free_extern);
+        assert(stbi_heap_free != NULL); // fail loudly on a missing export, like the alloc wrapper does
+    }
+
+    int onyx_ptr = (int) ((char*) ptr - runtime->wasm_memory_data(runtime->wasm_memory));
+    wasm_val_t args[] = { WASM_I32_VAL(onyx_ptr) };
+    wasm_val_vec_t results = {0,0}; // empty vector: no result value is read back from the call
+    wasm_val_vec_t args_arr = WASM_ARRAY_VEC(args);
+    runtime->wasm_func_call(stbi_heap_free, &args_arr, &results);
+}
+
+#define STBI_MALLOC(s)        __onyx_stbi_heap_alloc_wrapper(s)       // stb_image's malloc/realloc/free are replaced by the wrappers above
+#define STBI_REALLOC(p,newsz) __onyx_stbi_heap_resize_wrapper(p,newsz)
+#define STBI_FREE(p)          __onyx_stbi_heap_free_wrapper(p)
+
+#define STB_IMAGE_IMPLEMENTATION // emit the stb_image implementation here; the three overrides above must come before the include
+#include "stb_image.h"
+
+#define PTR WASM_I32 // pointer arguments are declared as 32-bit wasm integers
+#define INT WASM_I32
+#define FLOAT WASM_F32
+#define PARAM(n, k) (params->data[n].of.k) // member `k` of the n-th argument value
+
+// Binding for stbi_load: params 0-3 are wasm offsets (filename, x, y, comp), param 4 is desired_channels; result is the pixel buffer's offset or 0.
+ONYX_DEF(stbi_load, (PTR, PTR, PTR, PTR, INT), (PTR)) {
+    char *filename = (char *) ONYX_PTR(PARAM(0, i32));
+    int *out_x = (int *) ONYX_PTR(PARAM(1, i32));
+    int *out_y = (int *) ONYX_PTR(PARAM(2, i32));
+    int *out_comp = (int *) ONYX_PTR(PARAM(3, i32));
+    unsigned char *pixels = stbi_load(filename, out_x, out_y, out_comp, PARAM(4, i32));
+    unsigned char *memory_base = (unsigned char *) runtime->wasm_memory_data(runtime->wasm_memory);
+    if (pixels != NULL) results->data[0] = WASM_I32_VAL(pixels - memory_base);
+    else                results->data[0] = WASM_I32_VAL(0);
+    return NULL;
+}
+
+ONYX_DEF(stbi_image_free, (PTR), ()) { // binding for stbi_image_free: one pointer argument, no result values
+    stbi_image_free(ONYX_PTR(PARAM(0, i32))); // argument 0 is converted with ONYX_PTR and handed to stb_image's free
+    return NULL; // NOTE(review): presumably NULL means "no trap" - confirm against onyx_library.h
+}
+
+ONYX_LIBRARY { // functions this library exposes; each entry names an ONYX_DEF defined above
+    ONYX_FUNC(stbi_load)
+    ONYX_FUNC(stbi_image_free)
+
+    NULL // NOTE(review): presumably the end-of-list sentinel - confirm against onyx_library.h
+};
diff --git a/lib/stb_image.h b/lib/stb_image.h
new file mode 100644
index 0000000..d60371b
--- /dev/null
+++ b/lib/stb_image.h
@@ -0,0 +1,7897 @@
+/* stb_image - v2.27 - public domain image loader - http://nothings.org/stb
+                                  no warranty implied; use at your own risk
+
+   Do this:
+      #define STB_IMAGE_IMPLEMENTATION
+   before you include this file in *one* C or C++ file to create the implementation.
+
+   // i.e. it should look like this:
+   #include ...
+   #include ...
+   #include ...
+   #define STB_IMAGE_IMPLEMENTATION
+   #include "stb_image.h"
+
+   You can #define STBI_ASSERT(x) before the #include to avoid using assert.h.
+   And #define STBI_MALLOC, STBI_REALLOC, and STBI_FREE to avoid using malloc,realloc,free
+
+
+   QUICK NOTES:
+      Primarily of interest to game developers and other people who can
+          avoid problematic images and only need the trivial interface
+
+      JPEG baseline & progressive (12 bpc/arithmetic not supported, same as stock IJG lib)
+      PNG 1/2/4/8/16-bit-per-channel
+
+      TGA (not sure what subset, if a subset)
+      BMP non-1bpp, non-RLE
+      PSD (composited view only, no extra channels, 8/16 bit-per-channel)
+
+      GIF (*comp always reports as 4-channel)
+      HDR (radiance rgbE format)
+      PIC (Softimage PIC)
+      PNM (PPM and PGM binary only)
+
+      Animated GIF still needs a proper API, but here's one way to do it:
+          http://gist.github.com/urraka/685d9a6340b26b830d49
+
+      - decode from memory or through FILE (define STBI_NO_STDIO to remove code)
+      - decode from arbitrary I/O callbacks
+      - SIMD acceleration on x86/x64 (SSE2) and ARM (NEON)
+
+   Full documentation under "DOCUMENTATION" below.
+
+
+LICENSE
+
+  See end of file for license information.
+
+RECENT REVISION HISTORY:
+
+      2.27  (2021-07-11) document stbi_info better, 16-bit PNM support, bug fixes
+      2.26  (2020-07-13) many minor fixes
+      2.25  (2020-02-02) fix warnings
+      2.24  (2020-02-02) fix warnings; thread-local failure_reason and flip_vertically
+      2.23  (2019-08-11) fix clang static analysis warning
+      2.22  (2019-03-04) gif fixes, fix warnings
+      2.21  (2019-02-25) fix typo in comment
+      2.20  (2019-02-07) support utf8 filenames in Windows; fix warnings and platform ifdefs
+      2.19  (2018-02-11) fix warning
+      2.18  (2018-01-30) fix warnings
+      2.17  (2018-01-29) bugfix, 1-bit BMP, 16-bitness query, fix warnings
+      2.16  (2017-07-23) all functions have 16-bit variants; optimizations; bugfixes
+      2.15  (2017-03-18) fix png-1,2,4; all Imagenet JPGs; no runtime SSE detection on GCC
+      2.14  (2017-03-03) remove deprecated STBI_JPEG_OLD; fixes for Imagenet JPGs
+      2.13  (2016-12-04) experimental 16-bit API, only for PNG so far; fixes
+      2.12  (2016-04-02) fix typo in 2.11 PSD fix that caused crashes
+      2.11  (2016-04-02) 16-bit PNGS; enable SSE2 in non-gcc x64
+                         RGB-format JPEG; remove white matting in PSD;
+                         allocate large structures on the stack;
+                         correct channel count for PNG & BMP
+      2.10  (2016-01-22) avoid warning introduced in 2.09
+      2.09  (2016-01-16) 16-bit TGA; comments in PNM files; STBI_REALLOC_SIZED
+
+   See end of file for full revision history.
+
+
+ ============================    Contributors    =========================
+
+ Image formats                          Extensions, features
+    Sean Barrett (jpeg, png, bmp)          Jetro Lauha (stbi_info)
+    Nicolas Schulz (hdr, psd)              Martin "SpartanJ" Golini (stbi_info)
+    Jonathan Dummer (tga)                  James "moose2000" Brown (iPhone PNG)
+    Jean-Marc Lienher (gif)                Ben "Disch" Wenger (io callbacks)
+    Tom Seddon (pic)                       Omar Cornut (1/2/4-bit PNG)
+    Thatcher Ulrich (psd)                  Nicolas Guillemot (vertical flip)
+    Ken Miller (pgm, ppm)                  Richard Mitton (16-bit PSD)
+    github:urraka (animated gif)           Junggon Kim (PNM comments)
+    Christopher Forseth (animated gif)     Daniel Gibson (16-bit TGA)
+                                           socks-the-fox (16-bit PNG)
+                                           Jeremy Sawicki (handle all ImageNet JPGs)
+ Optimizations & bugfixes                  Mikhail Morozov (1-bit BMP)
+    Fabian "ryg" Giesen                    Anael Seghezzi (is-16-bit query)
+    Arseny Kapoulkine                      Simon Breuss (16-bit PNM)
+    John-Mark Allen
+    Carmelo J Fdez-Aguera
+
+ Bug & warning fixes
+    Marc LeBlanc            David Woo          Guillaume George     Martins Mozeiko
+    Christpher Lloyd        Jerry Jansson      Joseph Thomson       Blazej Dariusz Roszkowski
+    Phil Jordan                                Dave Moore           Roy Eltham
+    Hayaki Saito            Nathan Reed        Won Chun
+    Luke Graham             Johan Duparc       Nick Verigakis       the Horde3D community
+    Thomas Ruf              Ronny Chevalier                         github:rlyeh
+    Janez Zemva             John Bartholomew   Michal Cichon        github:romigrou
+    Jonathan Blow           Ken Hamada         Tero Hanninen        github:svdijk
+    Eugene Golushkov        Laurent Gomila     Cort Stratton        github:snagar
+    Aruelien Pocheville     Sergio Gonzalez    Thibault Reuille     github:Zelex
+    Cass Everitt            Ryamond Barbiero                        github:grim210
+    Paul Du Bois            Engin Manap        Aldo Culquicondor    github:sammyhw
+    Philipp Wiesemann       Dale Weiler        Oriol Ferrer Mesia   github:phprus
+    Josh Tobin                                 Matthew Gregan       github:poppolopoppo
+    Julian Raschke          Gregory Mullen     Christian Floisand   github:darealshinji
+    Baldur Karlsson         Kevin Schmidt      JR Smith             github:Michaelangel007
+                            Brad Weinberger    Matvey Cherevko      github:mosra
+    Luca Sas                Alexander Veselov  Zack Middleton       [reserved]
+    Ryan C. Gordon          [reserved]                              [reserved]
+                     DO NOT ADD YOUR NAME HERE
+
+                     Jacko Dirks
+
+  To add your name to the credits, pick a random blank space in the middle and fill it.
+  80% of merge conflicts on stb PRs are due to people adding their name at the end
+  of the credits.
+*/
+
+#ifndef STBI_INCLUDE_STB_IMAGE_H
+#define STBI_INCLUDE_STB_IMAGE_H
+
+// DOCUMENTATION
+//
+// Limitations:
+//    - no 12-bit-per-channel JPEG
+//    - no JPEGs with arithmetic coding
+//    - GIF always returns *comp=4
+//
+// Basic usage (see HDR discussion below for HDR usage):
+//    int x,y,n;
+//    unsigned char *data = stbi_load(filename, &x, &y, &n, 0);
+//    // ... process data if not NULL ...
+//    // ... x = width, y = height, n = # 8-bit components per pixel ...
+//    // ... replace '0' with '1'..'4' to force that many components per pixel
+//    // ... but 'n' will always be the number that it would have been if you said 0
+//    stbi_image_free(data)
+//
+// Standard parameters:
+//    int *x                 -- outputs image width in pixels
+//    int *y                 -- outputs image height in pixels
+//    int *channels_in_file  -- outputs # of image components in image file
+//    int desired_channels   -- if non-zero, # of image components requested in result
+//
+// The return value from an image loader is an 'unsigned char *' which points
+// to the pixel data, or NULL on an allocation failure or if the image is
+// corrupt or invalid. The pixel data consists of *y scanlines of *x pixels,
+// with each pixel consisting of N interleaved 8-bit components; the first
+// pixel pointed to is top-left-most in the image. There is no padding between
+// image scanlines or between pixels, regardless of format. The number of
+// components N is 'desired_channels' if desired_channels is non-zero, or
+// *channels_in_file otherwise. If desired_channels is non-zero,
+// *channels_in_file has the number of components that _would_ have been
+// output otherwise. E.g. if you set desired_channels to 4, you will always
+// get RGBA output, but you can check *channels_in_file to see if it's trivially
+// opaque because e.g. there were only 3 channels in the source image.
+//
+// An output image with N components has the following components interleaved
+// in this order in each pixel:
+//
+//     N=#comp     components
+//       1           grey
+//       2           grey, alpha
+//       3           red, green, blue
+//       4           red, green, blue, alpha
+//
+// If image loading fails for any reason, the return value will be NULL,
+// and *x, *y, *channels_in_file will be unchanged. The function
+// stbi_failure_reason() can be queried for an extremely brief, end-user
+// unfriendly explanation of why the load failed. Define STBI_NO_FAILURE_STRINGS
+// to avoid compiling these strings at all, and STBI_FAILURE_USERMSG to get slightly
+// more user-friendly ones.
+//
+// Paletted PNG, BMP, GIF, and PIC images are automatically depalettized.
+//
+// To query the width, height and component count of an image without having to
+// decode the full file, you can use the stbi_info family of functions:
+//
+//   int x,y,n,ok;
+//   ok = stbi_info(filename, &x, &y, &n);
+//   // returns ok=1 and sets x, y, n if image is a supported format,
+//   // 0 otherwise.
+//
+// Note that stb_image pervasively uses ints in its public API for sizes,
+// including sizes of memory buffers. This is now part of the API and thus
+// hard to change without causing breakage. As a result, the various image
+// loaders all have certain limits on image size; these differ somewhat
+// by format but generally boil down to either just under 2GB or just under
+// 1GB. When the decoded image would be larger than this, stb_image decoding
+// will fail.
+//
+// Additionally, stb_image will reject image files that have any of their
+// dimensions set to a larger value than the configurable STBI_MAX_DIMENSIONS,
+// which defaults to 2**24 = 16777216 pixels. Due to the above memory limit,
+// the only way to have an image with such dimensions load correctly
+// is for it to have a rather extreme aspect ratio. Either way, the
+// assumption here is that such larger images are likely to be malformed
+// or malicious. If you do need to load an image with individual dimensions
+// larger than that, and it still fits in the overall size limit, you can
+// #define STBI_MAX_DIMENSIONS on your own to be something larger.
+//
+// ===========================================================================
+//
+// UNICODE:
+//
+//   If compiling for Windows and you wish to use Unicode filenames, compile
+//   with
+//       #define STBI_WINDOWS_UTF8
+//   and pass utf8-encoded filenames. Call stbi_convert_wchar_to_utf8 to convert
+//   Windows wchar_t filenames to utf8.
+//
+// ===========================================================================
+//
+// Philosophy
+//
+// stb libraries are designed with the following priorities:
+//
+//    1. easy to use
+//    2. easy to maintain
+//    3. good performance
+//
+// Sometimes I let "good performance" creep up in priority over "easy to maintain",
+// and for best performance I may provide less-easy-to-use APIs that give higher
+// performance, in addition to the easy-to-use ones. Nevertheless, it's important
+// to keep in mind that from the standpoint of you, a client of this library,
+// all you care about is #1 and #3, and stb libraries DO NOT emphasize #3 above all.
+//
+// Some secondary priorities arise directly from the first two, some of which
+// provide more explicit reasons why performance can't be emphasized.
+//
+//    - Portable ("ease of use")
+//    - Small source code footprint ("easy to maintain")
+//    - No dependencies ("ease of use")
+//
+// ===========================================================================
+//
+// I/O callbacks
+//
+// I/O callbacks allow you to read from arbitrary sources, like packaged
+// files or some other source. Data read from callbacks are processed
+// through a small internal buffer (currently 128 bytes) to try to reduce
+// overhead.
+//
+// The three functions you must define are "read" (reads some bytes of data),
+// "skip" (skips some bytes of data), "eof" (reports if the stream is at the end).
+//
+// ===========================================================================
+//
+// SIMD support
+//
+// The JPEG decoder will try to automatically use SIMD kernels on x86 when
+// supported by the compiler. For ARM Neon support, you must explicitly
+// request it.
+//
+// (The old do-it-yourself SIMD API is no longer supported in the current
+// code.)
+//
+// On x86, SSE2 will automatically be used when available based on a run-time
+// test; if not, the generic C versions are used as a fall-back. On ARM targets,
+// the typical path is to have separate builds for NEON and non-NEON devices
+// (at least this is true for iOS and Android). Therefore, the NEON support is
+// toggled by a build flag: define STBI_NEON to get NEON loops.
+//
+// If for some reason you do not want to use any of SIMD code, or if
+// you have issues compiling it, you can disable it entirely by
+// defining STBI_NO_SIMD.
+//
+// ===========================================================================
+//
+// HDR image support   (disable by defining STBI_NO_HDR)
+//
+// stb_image supports loading HDR images in general, and currently the Radiance
+// .HDR file format specifically. You can still load any file through the existing
+// interface; if you attempt to load an HDR file, it will be automatically remapped
+// to LDR, assuming gamma 2.2 and an arbitrary scale factor defaulting to 1;
+// both of these constants can be reconfigured through this interface:
+//
+//     stbi_hdr_to_ldr_gamma(2.2f);
+//     stbi_hdr_to_ldr_scale(1.0f);
+//
+// (note, do not use _inverse_ constants; stbi_image will invert them
+// appropriately).
+//
+// Additionally, there is a new, parallel interface for loading files as
+// (linear) floats to preserve the full dynamic range:
+//
+//    float *data = stbi_loadf(filename, &x, &y, &n, 0);
+//
+// If you load LDR images through this interface, those images will
+// be promoted to floating point values, run through the inverse of
+// constants corresponding to the above:
+//
+//     stbi_ldr_to_hdr_scale(1.0f);
+//     stbi_ldr_to_hdr_gamma(2.2f);
+//
+// Finally, given a filename (or an open file or memory block--see header
+// file for details) containing image data, you can query for the "most
+// appropriate" interface to use (that is, whether the image is HDR or
+// not), using:
+//
+//     stbi_is_hdr(char *filename);
+//
+// ===========================================================================
+//
+// iPhone PNG support:
+//
+// We optionally support converting iPhone-formatted PNGs (which store
+// premultiplied BGRA) back to RGB, even though they're internally encoded
+// differently. To enable this conversion, call
+// stbi_convert_iphone_png_to_rgb(1).
+//
+// Call stbi_set_unpremultiply_on_load(1) as well to force a divide per
+// pixel to remove any premultiplied alpha *only* if the image file explicitly
+// says there's premultiplied data (currently only happens in iPhone images,
+// and only if iPhone convert-to-rgb processing is on).
+//
+// ===========================================================================
+//
+// ADDITIONAL CONFIGURATION
+//
+//  - You can suppress implementation of any of the decoders to reduce
+//    your code footprint by #defining one or more of the following
+//    symbols before creating the implementation.
+//
+//        STBI_NO_JPEG
+//        STBI_NO_PNG
+//        STBI_NO_BMP
+//        STBI_NO_PSD
+//        STBI_NO_TGA
+//        STBI_NO_GIF
+//        STBI_NO_HDR
+//        STBI_NO_PIC
+//        STBI_NO_PNM   (.ppm and .pgm)
+//
+//  - You can request *only* certain decoders and suppress all other ones
+//    (this will be more forward-compatible, as addition of new decoders
+//    doesn't require you to disable them explicitly):
+//
+//        STBI_ONLY_JPEG
+//        STBI_ONLY_PNG
+//        STBI_ONLY_BMP
+//        STBI_ONLY_PSD
+//        STBI_ONLY_TGA
+//        STBI_ONLY_GIF
+//        STBI_ONLY_HDR
+//        STBI_ONLY_PIC
+//        STBI_ONLY_PNM   (.ppm and .pgm)
+//
+//   - If you use STBI_NO_PNG (or _ONLY_ without PNG), and you still
+//     want the zlib decoder to be available, #define STBI_SUPPORT_ZLIB
+//
+//  - If you define STBI_MAX_DIMENSIONS, stb_image will reject images greater
+//    than that size (in either width or height) without further processing.
+//    This is to let programs in the wild set an upper bound to prevent
+//    denial-of-service attacks on untrusted data, as one could generate a
+//    valid image of gigantic dimensions and force stb_image to allocate a
+//    huge block of memory and spend disproportionate time decoding it. By
+//    default this is set to (1 << 24), which is 16777216, but that's still
+//    very big.
+
+#ifndef STBI_NO_STDIO
+#include <stdio.h>
+#endif // STBI_NO_STDIO
+
+#define STBI_VERSION 1
+
+enum
+{
+   STBI_default = 0, // only used for desired_channels
+
+   STBI_grey       = 1,
+   STBI_grey_alpha = 2,
+   STBI_rgb        = 3,
+   STBI_rgb_alpha  = 4
+};
+
+#include <stdlib.h>
+typedef unsigned char stbi_uc;
+typedef unsigned short stbi_us;
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+#ifndef STBIDEF
+#ifdef STB_IMAGE_STATIC
+#define STBIDEF static
+#else
+#define STBIDEF extern
+#endif
+#endif
+
+//////////////////////////////////////////////////////////////////////////////
+//
+// PRIMARY API - works on images of any type
+//
+
+//
+// load image by filename, open file, or memory buffer
+//
+
+typedef struct
+{
+   int      (*read)  (void *user,char *data,int size);   // fill 'data' with 'size' bytes.  return number of bytes actually read
+   void     (*skip)  (void *user,int n);                 // skip the next 'n' bytes, or 'unget' the last -n bytes if negative
+   int      (*eof)   (void *user);                       // returns nonzero if we are at end of file/data
+} stbi_io_callbacks;
+
+////////////////////////////////////
+//
+// 8-bits-per-channel interface
+//
+
+STBIDEF stbi_uc *stbi_load_from_memory   (stbi_uc           const *buffer, int len   , int *x, int *y, int *channels_in_file, int desired_channels);
+STBIDEF stbi_uc *stbi_load_from_callbacks(stbi_io_callbacks const *clbk  , void *user, int *x, int *y, int *channels_in_file, int desired_channels);
+
+#ifndef STBI_NO_STDIO
+STBIDEF stbi_uc *stbi_load            (char const *filename, int *x, int *y, int *channels_in_file, int desired_channels);
+STBIDEF stbi_uc *stbi_load_from_file  (FILE *f, int *x, int *y, int *channels_in_file, int desired_channels);
+// for stbi_load_from_file, file pointer is left pointing immediately after image
+#endif
+
+#ifndef STBI_NO_GIF
+STBIDEF stbi_uc *stbi_load_gif_from_memory(stbi_uc const *buffer, int len, int **delays, int *x, int *y, int *z, int *comp, int req_comp);
+#endif
+
+#ifdef STBI_WINDOWS_UTF8
+STBIDEF int stbi_convert_wchar_to_utf8(char *buffer, size_t bufferlen, const wchar_t* input);
+#endif
+
+////////////////////////////////////
+//
+// 16-bits-per-channel interface
+//
+
+STBIDEF stbi_us *stbi_load_16_from_memory   (stbi_uc const *buffer, int len, int *x, int *y, int *channels_in_file, int desired_channels);
+STBIDEF stbi_us *stbi_load_16_from_callbacks(stbi_io_callbacks const *clbk, void *user, int *x, int *y, int *channels_in_file, int desired_channels);
+
+#ifndef STBI_NO_STDIO
+STBIDEF stbi_us *stbi_load_16          (char const *filename, int *x, int *y, int *channels_in_file, int desired_channels);
+STBIDEF stbi_us *stbi_load_from_file_16(FILE *f, int *x, int *y, int *channels_in_file, int desired_channels);
+#endif
+
+////////////////////////////////////
+//
+// float-per-channel interface
+//
+#ifndef STBI_NO_LINEAR
+   STBIDEF float *stbi_loadf_from_memory     (stbi_uc const *buffer, int len, int *x, int *y, int *channels_in_file, int desired_channels);
+   STBIDEF float *stbi_loadf_from_callbacks  (stbi_io_callbacks const *clbk, void *user, int *x, int *y,  int *channels_in_file, int desired_channels);
+
+   #ifndef STBI_NO_STDIO
+   STBIDEF float *stbi_loadf            (char const *filename, int *x, int *y, int *channels_in_file, int desired_channels);
+   STBIDEF float *stbi_loadf_from_file  (FILE *f, int *x, int *y, int *channels_in_file, int desired_channels);
+   #endif
+#endif
+
+#ifndef STBI_NO_HDR
+   STBIDEF void   stbi_hdr_to_ldr_gamma(float gamma);
+   STBIDEF void   stbi_hdr_to_ldr_scale(float scale);
+#endif // STBI_NO_HDR
+
+#ifndef STBI_NO_LINEAR
+   STBIDEF void   stbi_ldr_to_hdr_gamma(float gamma);
+   STBIDEF void   stbi_ldr_to_hdr_scale(float scale);
+#endif // STBI_NO_LINEAR
+
+// stbi_is_hdr is always defined, but always returns false if STBI_NO_HDR
+STBIDEF int    stbi_is_hdr_from_callbacks(stbi_io_callbacks const *clbk, void *user);
+STBIDEF int    stbi_is_hdr_from_memory(stbi_uc const *buffer, int len);
+#ifndef STBI_NO_STDIO
+STBIDEF int      stbi_is_hdr          (char const *filename);
+STBIDEF int      stbi_is_hdr_from_file(FILE *f);
+#endif // STBI_NO_STDIO
+
+
+// get a VERY brief reason for failure
+// on most compilers (and ALL modern mainstream compilers) this is threadsafe
+STBIDEF const char *stbi_failure_reason  (void);
+
+// free the loaded image -- this is just free()
+STBIDEF void     stbi_image_free      (void *retval_from_stbi_load);
+
+// get image dimensions & components without fully decoding
+STBIDEF int      stbi_info_from_memory(stbi_uc const *buffer, int len, int *x, int *y, int *comp);
+STBIDEF int      stbi_info_from_callbacks(stbi_io_callbacks const *clbk, void *user, int *x, int *y, int *comp);
+STBIDEF int      stbi_is_16_bit_from_memory(stbi_uc const *buffer, int len);
+STBIDEF int      stbi_is_16_bit_from_callbacks(stbi_io_callbacks const *clbk, void *user);
+
+#ifndef STBI_NO_STDIO
+STBIDEF int      stbi_info               (char const *filename,     int *x, int *y, int *comp);
+STBIDEF int      stbi_info_from_file     (FILE *f,                  int *x, int *y, int *comp);
+STBIDEF int      stbi_is_16_bit          (char const *filename);
+STBIDEF int      stbi_is_16_bit_from_file(FILE *f);
+#endif
+
+
+
+// for image formats that explicitly notate that they have premultiplied alpha,
+// we just return the colors as stored in the file. set this flag to force
+// unpremultiplication. results are undefined if the unpremultiply overflow.
+STBIDEF void stbi_set_unpremultiply_on_load(int flag_true_if_should_unpremultiply);
+
+// indicate whether we should process iphone images back to canonical format,
+// or just pass them through "as-is"
+STBIDEF void stbi_convert_iphone_png_to_rgb(int flag_true_if_should_convert);
+
+// flip the image vertically, so the first pixel in the output array is the bottom left
+STBIDEF void stbi_set_flip_vertically_on_load(int flag_true_if_should_flip);
+
+// as above, but only applies to images loaded on the thread that calls the function
+// this function is only available if your compiler supports thread-local variables;
+// calling it will fail to link if your compiler doesn't
+STBIDEF void stbi_set_unpremultiply_on_load_thread(int flag_true_if_should_unpremultiply);
+STBIDEF void stbi_convert_iphone_png_to_rgb_thread(int flag_true_if_should_convert);
+STBIDEF void stbi_set_flip_vertically_on_load_thread(int flag_true_if_should_flip);
+
+// ZLIB client - used by PNG, available for other purposes
+
+STBIDEF char *stbi_zlib_decode_malloc_guesssize(const char *buffer, int len, int initial_size, int *outlen);
+STBIDEF char *stbi_zlib_decode_malloc_guesssize_headerflag(const char *buffer, int len, int initial_size, int *outlen, int parse_header);
+STBIDEF char *stbi_zlib_decode_malloc(const char *buffer, int len, int *outlen);
+STBIDEF int   stbi_zlib_decode_buffer(char *obuffer, int olen, const char *ibuffer, int ilen);
+
+STBIDEF char *stbi_zlib_decode_noheader_malloc(const char *buffer, int len, int *outlen);
+STBIDEF int   stbi_zlib_decode_noheader_buffer(char *obuffer, int olen, const char *ibuffer, int ilen);
+
+
+#ifdef __cplusplus
+}
+#endif
+
+//
+//
+////   end header file   /////////////////////////////////////////////////////
+#endif // STBI_INCLUDE_STB_IMAGE_H
+
+#ifdef STB_IMAGE_IMPLEMENTATION
+
+#if defined(STBI_ONLY_JPEG) || defined(STBI_ONLY_PNG) || defined(STBI_ONLY_BMP) \
+  || defined(STBI_ONLY_TGA) || defined(STBI_ONLY_GIF) || defined(STBI_ONLY_PSD) \
+  || defined(STBI_ONLY_HDR) || defined(STBI_ONLY_PIC) || defined(STBI_ONLY_PNM) \
+  || defined(STBI_ONLY_ZLIB)
+   #ifndef STBI_ONLY_JPEG
+   #define STBI_NO_JPEG
+   #endif
+   #ifndef STBI_ONLY_PNG
+   #define STBI_NO_PNG
+   #endif
+   #ifndef STBI_ONLY_BMP
+   #define STBI_NO_BMP
+   #endif
+   #ifndef STBI_ONLY_PSD
+   #define STBI_NO_PSD
+   #endif
+   #ifndef STBI_ONLY_TGA
+   #define STBI_NO_TGA
+   #endif
+   #ifndef STBI_ONLY_GIF
+   #define STBI_NO_GIF
+   #endif
+   #ifndef STBI_ONLY_HDR
+   #define STBI_NO_HDR
+   #endif
+   #ifndef STBI_ONLY_PIC
+   #define STBI_NO_PIC
+   #endif
+   #ifndef STBI_ONLY_PNM
+   #define STBI_NO_PNM
+   #endif
+#endif
+
+#if defined(STBI_NO_PNG) && !defined(STBI_SUPPORT_ZLIB) && !defined(STBI_NO_ZLIB)
+#define STBI_NO_ZLIB
+#endif
+
+
+#include <stdarg.h>
+#include <stddef.h> // ptrdiff_t on osx
+#include <stdlib.h>
+#include <string.h>
+#include <limits.h>
+
+#if !defined(STBI_NO_LINEAR) || !defined(STBI_NO_HDR)
+#include <math.h>  // ldexp, pow
+#endif
+
+#ifndef STBI_NO_STDIO
+#include <stdio.h>
+#endif
+
+#ifndef STBI_ASSERT
+#include <assert.h>
+#define STBI_ASSERT(x) assert(x)
+#endif
+
+#ifdef __cplusplus
+#define STBI_EXTERN extern "C"
+#else
+#define STBI_EXTERN extern
+#endif
+
+
+#ifndef _MSC_VER
+   #ifdef __cplusplus
+   #define stbi_inline inline
+   #else
+   #define stbi_inline
+   #endif
+#else
+   #define stbi_inline __forceinline
+#endif
+
+#ifndef STBI_NO_THREAD_LOCALS
+   #if defined(__cplusplus) &&  __cplusplus >= 201103L
+      #define STBI_THREAD_LOCAL       thread_local
+   #elif defined(__GNUC__) && __GNUC__ < 5
+      #define STBI_THREAD_LOCAL       __thread
+   #elif defined(_MSC_VER)
+      #define STBI_THREAD_LOCAL       __declspec(thread)
+   #elif defined (__STDC_VERSION__) && __STDC_VERSION__ >= 201112L && !defined(__STDC_NO_THREADS__)
+      #define STBI_THREAD_LOCAL       _Thread_local
+   #endif
+
+   #ifndef STBI_THREAD_LOCAL
+      #if defined(__GNUC__)
+        #define STBI_THREAD_LOCAL       __thread
+      #endif
+   #endif
+#endif
+
+#ifdef _MSC_VER
+typedef unsigned short stbi__uint16;
+typedef   signed short stbi__int16;
+typedef unsigned int   stbi__uint32;
+typedef   signed int   stbi__int32;
+#else
+#include <stdint.h>
+typedef uint16_t stbi__uint16;
+typedef int16_t  stbi__int16;
+typedef uint32_t stbi__uint32;
+typedef int32_t  stbi__int32;
+#endif
+
+// should produce compiler error if size is wrong
+typedef unsigned char validate_uint32[sizeof(stbi__uint32)==4 ? 1 : -1];
+
+#ifdef _MSC_VER
+#define STBI_NOTUSED(v)  (void)(v)
+#else
+#define STBI_NOTUSED(v)  (void)sizeof(v)
+#endif
+
+#ifdef _MSC_VER
+#define STBI_HAS_LROTL
+#endif
+
+#ifdef STBI_HAS_LROTL
+   #define stbi_lrot(x,y)  _lrotl(x,y)
+#else
+   #define stbi_lrot(x,y)  (((x) << (y)) | ((x) >> (-(y) & 31)))
+#endif
+
+#if defined(STBI_MALLOC) && defined(STBI_FREE) && (defined(STBI_REALLOC) || defined(STBI_REALLOC_SIZED))
+// ok
+#elif !defined(STBI_MALLOC) && !defined(STBI_FREE) && !defined(STBI_REALLOC) && !defined(STBI_REALLOC_SIZED)
+// ok
+#else
+#error "Must define all or none of STBI_MALLOC, STBI_FREE, and STBI_REALLOC (or STBI_REALLOC_SIZED)."
+#endif
+
+#ifndef STBI_MALLOC
+#define STBI_MALLOC(sz)           malloc(sz)
+#define STBI_REALLOC(p,newsz)     realloc(p,newsz)
+#define STBI_FREE(p)              free(p)
+#endif
+
+#ifndef STBI_REALLOC_SIZED
+#define STBI_REALLOC_SIZED(p,oldsz,newsz) STBI_REALLOC(p,newsz)
+#endif
+
+// x86/x64 detection
+#if defined(__x86_64__) || defined(_M_X64)
+#define STBI__X64_TARGET
+#elif defined(__i386) || defined(_M_IX86)
+#define STBI__X86_TARGET
+#endif
+
+#if defined(__GNUC__) && defined(STBI__X86_TARGET) && !defined(__SSE2__) && !defined(STBI_NO_SIMD)
+// gcc doesn't support sse2 intrinsics unless you compile with -msse2,
+// which in turn means it gets to use SSE2 everywhere. This is unfortunate,
+// but previous attempts to provide the SSE2 functions with runtime
+// detection caused numerous issues. The way architecture extensions are
+// exposed in GCC/Clang is, sadly, not really suited for one-file libs.
+// New behavior: if compiled with -msse2, we use SSE2 without any
+// detection; if not, we don't use it at all.
+#define STBI_NO_SIMD
+#endif
+
+#if defined(__MINGW32__) && defined(STBI__X86_TARGET) && !defined(STBI_MINGW_ENABLE_SSE2) && !defined(STBI_NO_SIMD)
+// Note that __MINGW32__ doesn't actually mean 32-bit, so we have to avoid STBI__X64_TARGET
+//
+// 32-bit MinGW wants ESP to be 16-byte aligned, but this is not in the
+// Windows ABI and VC++ as well as Windows DLLs don't maintain that invariant.
+// As a result, enabling SSE2 on 32-bit MinGW is dangerous when not
+// simultaneously enabling "-mstackrealign".
+//
+// See https://github.com/nothings/stb/issues/81 for more information.
+//
+// So default to no SSE2 on 32-bit MinGW. If you've read this far and added
+// -mstackrealign to your build settings, feel free to #define STBI_MINGW_ENABLE_SSE2.
+#define STBI_NO_SIMD
+#endif
+
+#if !defined(STBI_NO_SIMD) && (defined(STBI__X86_TARGET) || defined(STBI__X64_TARGET))
+#define STBI_SSE2
+#include <emmintrin.h>
+
+#ifdef _MSC_VER
+
+#if _MSC_VER >= 1400  // not VC6
+#include <intrin.h> // __cpuid
+static int stbi__cpuid3(void)   // returns element 3 of the __cpuid(info,1) output
+{
+   int info[4];
+   __cpuid(info,1);
+   return info[3];
+}
+#else
+static int stbi__cpuid3(void)   // fallback: runs CPUID with eax=1 via inline asm and returns edx
+{
+   int res;
+   __asm {
+      mov  eax,1
+      cpuid
+      mov  res,edx
+   }
+   return res;
+}
+#endif
+
+#define STBI_SIMD_ALIGN(type, name) __declspec(align(16)) type name
+
+#if !defined(STBI_NO_JPEG) && defined(STBI_SSE2)
+static int stbi__sse2_available(void)   // MSVC variant: decided at run time from stbi__cpuid3()
+{
+   int info3 = stbi__cpuid3();
+   return ((info3 >> 26) & 1) != 0;   // 1 when bit 26 of that word is set, else 0
+}
+#endif
+
+#else // assume GCC-style if not VC++
+#define STBI_SIMD_ALIGN(type, name) type name __attribute__((aligned(16)))
+
+#if !defined(STBI_NO_JPEG) && defined(STBI_SSE2)
+static int stbi__sse2_available(void)   // non-MSVC variant: no run-time detection, always reports 1
+{
+   // If we're even attempting to compile this on GCC/Clang, that means
+   // -msse2 is on, which means the compiler is allowed to use SSE2
+   // instructions at will, and so are we.
+   return 1;
+}
+#endif
+
+#endif
+#endif
+
+// ARM NEON
+#if defined(STBI_NO_SIMD) && defined(STBI_NEON)
+#undef STBI_NEON
+#endif
+
+#ifdef STBI_NEON
+#include <arm_neon.h>
+#ifdef _MSC_VER
+#define STBI_SIMD_ALIGN(type, name) __declspec(align(16)) type name
+#else
+#define STBI_SIMD_ALIGN(type, name) type name __attribute__((aligned(16)))
+#endif
+#endif
+
+#ifndef STBI_SIMD_ALIGN
+#define STBI_SIMD_ALIGN(type, name) type name
+#endif
+
+#ifndef STBI_MAX_DIMENSIONS
+#define STBI_MAX_DIMENSIONS (1 << 24)
+#endif
+
+///////////////////////////////////////////////
+//
+//  stbi__context struct and start_xxx functions
+
+// stbi__context structure is our basic context used by all images, so it
+// contains all the IO context, plus some basic image information
+typedef struct
+{
+   stbi__uint32 img_x, img_y;   // NOTE(review): presumably image width/height; written outside this section -- confirm
+   int img_n, img_out_n;        // NOTE(review): presumably source/output channel counts -- confirm against the loaders
+
+   stbi_io_callbacks io;        // read/skip/eof callbacks; io.read is NULL for memory-backed contexts
+   void *io_user_data;          // opaque pointer handed to every callback as its first argument
+
+   int read_from_callbacks;     // nonzero while the read callback may still supply data; cleared by a 0-byte refill
+   int buflen;                  // number of bytes requested from io.read on each refill
+   stbi_uc buffer_start[128];   // staging buffer that callback reads are refilled into
+   int callback_already_read;   // running total of the cursor offsets accumulated at each refill
+
+   stbi_uc *img_buffer, *img_buffer_end;                     // read cursor and one-past-the-end of available bytes
+   stbi_uc *img_buffer_original, *img_buffer_original_end;   // initial window, restored by stbi__rewind
+} stbi__context;
+
+
+static void stbi__refill_buffer(stbi__context *s);
+
+// set up a context that decodes straight out of a caller-supplied memory buffer
+static void stbi__start_mem(stbi__context *s, stbi_uc const *buffer, int len)
+{
+   stbi_uc *first = (stbi_uc *) buffer;   // the context stores non-const pointers
+   s->img_buffer     = s->img_buffer_original     = first;
+   s->img_buffer_end = s->img_buffer_original_end = first + len;
+   s->read_from_callbacks = s->callback_already_read = 0;
+   s->io.read = NULL;   // a NULL read callback marks a pure memory context
+}
+
+// initialize a callback-based context: copies the callback table, then primes the staging buffer
+static void stbi__start_callbacks(stbi__context *s, stbi_io_callbacks *c, void *user)
+{
+   s->io = *c;
+   s->io_user_data = user;
+   s->buflen = sizeof(s->buffer_start);
+   s->read_from_callbacks = 1;
+   s->callback_already_read = 0;
+   s->img_buffer = s->img_buffer_original = s->buffer_start;   // must precede the refill, which measures from img_buffer_original
+   stbi__refill_buffer(s);   // first read; sets img_buffer and img_buffer_end
+   s->img_buffer_original_end = s->img_buffer_end;   // remember the first window so stbi__rewind can restore it
+}
+
+#ifndef STBI_NO_STDIO
+
+static int stbi__stdio_read(void *user, char *data, int size)   // read callback for stdio: 'user' is the FILE*
+{
+   return (int) fread(data,1,size,(FILE*) user);   // count of bytes fread delivered
+}
+
+// skip callback for stdio streams: moves the FILE* carried in 'user' forward by n bytes
+static void stbi__stdio_skip(void *user, int n)
+{
+   FILE *stream = (FILE *) user;
+   int peeked;
+   fseek(stream, n, SEEK_CUR);
+   peeked = fgetc(stream);                       /* have to read a byte to reset feof()'s flag */
+   if (peeked != EOF) ungetc(peeked, stream);    /* a real byte came back, so push it onto the stream again */
+}
+
+static int stbi__stdio_eof(void *user)   // eof callback for stdio: 'user' is the FILE*
+{
+   return feof((FILE*) user) || ferror((FILE *) user);   // a stream error is reported as end-of-file too
+}
+
+static stbi_io_callbacks stbi__stdio_callbacks =   // callback table that adapts a FILE* to stbi_io_callbacks
+{
+   stbi__stdio_read,
+   stbi__stdio_skip,
+   stbi__stdio_eof,
+};
+
+static void stbi__start_file(stbi__context *s, FILE *f)   // initialize a context that reads from an open FILE*
+{
+   stbi__start_callbacks(s, &stbi__stdio_callbacks, (void *) f);   // the FILE* travels as the callbacks' user pointer
+}
+
+//static void stop_file(stbi__context *s) { }
+
+#endif // !STBI_NO_STDIO
+
+static void stbi__rewind(stbi__context *s)
+{
+   // A true rewind would go back to the start of the stream. Restoring the
+   // initial buffer window is enough here, because rewinding only happens after
+   // a format 'test', and those only ever look at at most 92 bytes.
+   s->img_buffer_end = s->img_buffer_original_end;
+   s->img_buffer = s->img_buffer_original;
+}
+
+enum
+{
+   STBI_ORDER_RGB,
+   STBI_ORDER_BGR
+};
+
+typedef struct   // per-load metadata; stbi__load_main initializes it and passes it to each format loader
+{
+   int bits_per_channel;   // stbi__load_main defaults this to 8; the postprocess steps accept 8 or 16
+   int num_channels;       // reset to 0 by stbi__load_main
+   int channel_order;      // STBI_ORDER_RGB or STBI_ORDER_BGR
+} stbi__result_info;
+
+#ifndef STBI_NO_JPEG
+static int      stbi__jpeg_test(stbi__context *s);
+static void    *stbi__jpeg_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri);
+static int      stbi__jpeg_info(stbi__context *s, int *x, int *y, int *comp);
+#endif
+
+#ifndef STBI_NO_PNG
+static int      stbi__png_test(stbi__context *s);
+static void    *stbi__png_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri);
+static int      stbi__png_info(stbi__context *s, int *x, int *y, int *comp);
+static int      stbi__png_is16(stbi__context *s);
+#endif
+
+#ifndef STBI_NO_BMP
+static int      stbi__bmp_test(stbi__context *s);
+static void    *stbi__bmp_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri);
+static int      stbi__bmp_info(stbi__context *s, int *x, int *y, int *comp);
+#endif
+
+#ifndef STBI_NO_TGA
+static int      stbi__tga_test(stbi__context *s);
+static void    *stbi__tga_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri);
+static int      stbi__tga_info(stbi__context *s, int *x, int *y, int *comp);
+#endif
+
+#ifndef STBI_NO_PSD
+static int      stbi__psd_test(stbi__context *s);
+static void    *stbi__psd_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri, int bpc);
+static int      stbi__psd_info(stbi__context *s, int *x, int *y, int *comp);
+static int      stbi__psd_is16(stbi__context *s);
+#endif
+
+#ifndef STBI_NO_HDR
+static int      stbi__hdr_test(stbi__context *s);
+static float   *stbi__hdr_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri);
+static int      stbi__hdr_info(stbi__context *s, int *x, int *y, int *comp);
+#endif
+
+#ifndef STBI_NO_PIC
+static int      stbi__pic_test(stbi__context *s);
+static void    *stbi__pic_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri);
+static int      stbi__pic_info(stbi__context *s, int *x, int *y, int *comp);
+#endif
+
+#ifndef STBI_NO_GIF
+static int      stbi__gif_test(stbi__context *s);
+static void    *stbi__gif_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri);
+static void    *stbi__load_gif_main(stbi__context *s, int **delays, int *x, int *y, int *z, int *comp, int req_comp);
+static int      stbi__gif_info(stbi__context *s, int *x, int *y, int *comp);
+#endif
+
+#ifndef STBI_NO_PNM
+static int      stbi__pnm_test(stbi__context *s);
+static void    *stbi__pnm_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri);
+static int      stbi__pnm_info(stbi__context *s, int *x, int *y, int *comp);
+static int      stbi__pnm_is16(stbi__context *s);
+#endif
+
+static
+#ifdef STBI_THREAD_LOCAL
+STBI_THREAD_LOCAL
+#endif
+const char *stbi__g_failure_reason;
+
+STBIDEF const char *stbi_failure_reason(void)   // returns the most recently recorded failure string
+{
+   return stbi__g_failure_reason;   // the pointer is returned as stored; nothing is copied
+}
+
+#ifndef STBI_NO_FAILURE_STRINGS
+static int stbi__err(const char *str)   // records 'str' as the current failure reason
+{
+   stbi__g_failure_reason = str;   // stores the pointer only; the string itself is not copied
+   return 0;   // always 0
+}
+#endif
+
+static void *stbi__malloc(size_t size)   // single allocation entry point for the helpers below
+{
+    return STBI_MALLOC(size);   // STBI_MALLOC defaults to malloc unless the user overrides it
+}
+
+// stb_image uses ints pervasively, including for offset calculations.
+// therefore the largest decoded image size we can support with the
+// current code, even on 64-bit targets, is INT_MAX. this is not a
+// significant limitation for the intended use case.
+//
+// we do, however, need to make sure our size calculations don't
+// overflow. hence a few helper functions for size calculations that
+// multiply integers together, making sure that they're non-negative
+// and no overflow occurs.
+
+// Overflow-safe check for "a + b": returns 1 when the sum does not exceed
+// INT_MAX, 0 otherwise. A negative b is rejected outright.
+static int stbi__addsizes_valid(int a, int b)
+{
+   int headroom;
+   if (b < 0) return 0;
+   // Since 0 <= b <= INT_MAX, INT_MAX - b cannot overflow; comparing against
+   // it is equivalent to "a + b <= INT_MAX" without risking overflow.
+   headroom = INT_MAX - b;
+   return a <= headroom;
+}
+
+// Overflow-safe check for "a * b": returns 1 when both factors are
+// non-negative and the product fits in an int, 0 otherwise.
+static int stbi__mul2sizes_valid(int a, int b)
+{
+   if (b < 0 || a < 0) return 0;
+   // multiplying by zero can never overflow (and must not reach the division);
+   // otherwise compare against INT_MAX/b instead of forming a*b
+   return (b == 0) ? 1 : (a <= INT_MAX/b);
+}
+
+#if !defined(STBI_NO_JPEG) || !defined(STBI_NO_PNG) || !defined(STBI_NO_TGA) || !defined(STBI_NO_HDR)
+// validates "a*b + add": 1 if there are no negative factors/addend and no int overflow, else 0
+static int stbi__mad2sizes_valid(int a, int b, int add)
+{
+   if (!stbi__mul2sizes_valid(a, b)) return 0;   // a*b is only formed once proven safe
+   return stbi__addsizes_valid(a*b, add);
+}
+#endif
+
+// validates "a*b*c + add": 1 if there are no negative factors/addend and no int overflow, else 0
+static int stbi__mad3sizes_valid(int a, int b, int c, int add)
+{
+   if (!stbi__mul2sizes_valid(a, b) || !stbi__mul2sizes_valid(a*b, c)) return 0;
+   return stbi__addsizes_valid(a*b*c, add);   // products are only formed once proven safe
+}
+
+// returns 1 if "a*b*c*d + add" has no negative terms/factors and doesn't overflow
+#if !defined(STBI_NO_LINEAR) || !defined(STBI_NO_HDR) || !defined(STBI_NO_PNM)
+static int stbi__mad4sizes_valid(int a, int b, int c, int d, int add)
+{
+   if (!stbi__mul2sizes_valid(a, b) || !stbi__mul2sizes_valid(a*b, c)) return 0;
+   return stbi__mul2sizes_valid(a*b*c, d) && stbi__addsizes_valid(a*b*c*d, add);
+}
+#endif
+
+#if !defined(STBI_NO_JPEG) || !defined(STBI_NO_PNG) || !defined(STBI_NO_TGA) || !defined(STBI_NO_HDR)
+// mallocs with size overflow checking: a*b + add bytes, or NULL when the
+// size fails validation (negative term, int overflow) or the allocation fails
+static void *stbi__malloc_mad2(int a, int b, int add)
+{
+   return stbi__mad2sizes_valid(a, b, add) ? stbi__malloc(a*b + add) : NULL;
+}
+#endif
+
+static void *stbi__malloc_mad3(int a, int b, int c, int add)
+{
+   // the size is validated first, so a*b*c + add is never computed when it would overflow
+   return stbi__mad3sizes_valid(a, b, c, add) ? stbi__malloc(a*b*c + add) : NULL;
+}
+
+#if !defined(STBI_NO_LINEAR) || !defined(STBI_NO_HDR) || !defined(STBI_NO_PNM)
+static void *stbi__malloc_mad4(int a, int b, int c, int d, int add)
+{
+   // the size is validated first, so a*b*c*d + add is never computed when it would overflow
+   return stbi__mad4sizes_valid(a, b, c, d, add) ? stbi__malloc(a*b*c*d + add) : NULL;
+}
+#endif
+
+// stbi__err - error
+// stbi__errpf - error returning pointer to float
+// stbi__errpuc - error returning pointer to unsigned char
+
+#ifdef STBI_NO_FAILURE_STRINGS
+   #define stbi__err(x,y)  0
+#elif defined(STBI_FAILURE_USERMSG)
+   #define stbi__err(x,y)  stbi__err(y)
+#else
+   #define stbi__err(x,y)  stbi__err(x)
+#endif
+
+#define stbi__errpf(x,y)   ((float *)(size_t) (stbi__err(x,y)?NULL:NULL))
+#define stbi__errpuc(x,y)  ((unsigned char *)(size_t) (stbi__err(x,y)?NULL:NULL))
+
+STBIDEF void stbi_image_free(void *retval_from_stbi_load)   // releases a buffer returned by one of the load functions
+{
+   STBI_FREE(retval_from_stbi_load);   // STBI_FREE defaults to free unless the user overrides it
+}
+
+#ifndef STBI_NO_LINEAR
+static float   *stbi__ldr_to_hdr(stbi_uc *data, int x, int y, int comp);
+#endif
+
+#ifndef STBI_NO_HDR
+static stbi_uc *stbi__hdr_to_ldr(float   *data, int x, int y, int comp);
+#endif
+
+static int stbi__vertically_flip_on_load_global = 0;
+
+STBIDEF void stbi_set_flip_vertically_on_load(int flag_true_if_should_flip)   // sets the process-wide flip flag
+{
+   stbi__vertically_flip_on_load_global = flag_true_if_should_flip;   // plain static store, no synchronization
+}
+
+#ifndef STBI_THREAD_LOCAL
+#define stbi__vertically_flip_on_load  stbi__vertically_flip_on_load_global
+#else
+static STBI_THREAD_LOCAL int stbi__vertically_flip_on_load_local, stbi__vertically_flip_on_load_set;
+
+STBIDEF void stbi_set_flip_vertically_on_load_thread(int flag_true_if_should_flip)   // per-thread flip override
+{
+   stbi__vertically_flip_on_load_local = flag_true_if_should_flip;
+   stbi__vertically_flip_on_load_set = 1;   // once set, this thread's value takes precedence over the global flag
+}
+
+#define stbi__vertically_flip_on_load  (stbi__vertically_flip_on_load_set       \
+                                         ? stbi__vertically_flip_on_load_local  \
+                                         : stbi__vertically_flip_on_load_global)
+#endif // STBI_THREAD_LOCAL
+
+static void *stbi__load_main(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri, int bpc)
+{  // tries each compiled-in format test in turn and returns the first matching loader's result
+   memset(ri, 0, sizeof(*ri)); // make sure it's initialized if we add new fields
+   ri->bits_per_channel = 8; // default is 8 so most paths don't have to be changed
+   ri->channel_order = STBI_ORDER_RGB; // all current input & output are this, but this is here so we can add BGR order
+   ri->num_channels = 0;
+
+   // test the formats with a very explicit header first (at least a FOURCC
+   // or distinctive magic number first)
+   #ifndef STBI_NO_PNG
+   if (stbi__png_test(s))  return stbi__png_load(s,x,y,comp,req_comp, ri);
+   #endif
+   #ifndef STBI_NO_BMP
+   if (stbi__bmp_test(s))  return stbi__bmp_load(s,x,y,comp,req_comp, ri);
+   #endif
+   #ifndef STBI_NO_GIF
+   if (stbi__gif_test(s))  return stbi__gif_load(s,x,y,comp,req_comp, ri);
+   #endif
+   #ifndef STBI_NO_PSD
+   if (stbi__psd_test(s))  return stbi__psd_load(s,x,y,comp,req_comp, ri, bpc);   // the only loader that receives bpc
+   #else
+   STBI_NOTUSED(bpc);
+   #endif
+   #ifndef STBI_NO_PIC
+   if (stbi__pic_test(s))  return stbi__pic_load(s,x,y,comp,req_comp, ri);
+   #endif
+
+   // then the formats that can end up attempting to load with just 1 or 2
+   // bytes matching expectations; these are prone to false positives, so
+   // try them later
+   #ifndef STBI_NO_JPEG
+   if (stbi__jpeg_test(s)) return stbi__jpeg_load(s,x,y,comp,req_comp, ri);
+   #endif
+   #ifndef STBI_NO_PNM
+   if (stbi__pnm_test(s))  return stbi__pnm_load(s,x,y,comp,req_comp, ri);
+   #endif
+
+   #ifndef STBI_NO_HDR
+   if (stbi__hdr_test(s)) {
+      float *hdr = stbi__hdr_load(s, x,y,comp,req_comp, ri);
+      return stbi__hdr_to_ldr(hdr, *x, *y, req_comp ? req_comp : *comp);   // NOTE(review): hdr is not checked here; relies on stbi__hdr_to_ldr accepting NULL -- confirm
+   }
+   #endif
+
+   #ifndef STBI_NO_TGA
+   // test tga last because it's a crappy test!
+   if (stbi__tga_test(s))
+      return stbi__tga_load(s,x,y,comp,req_comp, ri);
+   #endif
+
+   return stbi__errpuc("unknown image type", "Image not of any known type, or corrupt");   // no format test matched
+}
+
+// Narrows w*h*channels 16-bit samples to 8 bits each. Consumes 'orig': it is freed
+// on success and on failure. Returns the new buffer, or NULL if allocation fails.
+static stbi_uc *stbi__convert_16_to_8(stbi__uint16 *orig, int w, int h, int channels)
+{
+   int i, img_len = w * h * channels;
+   stbi_uc *reduced = (stbi_uc *) stbi__malloc(img_len);
+   if (reduced == NULL) {
+      STBI_FREE(orig); // callers overwrite their only pointer with our result, so release it here
+      return stbi__errpuc("outofmem", "Out of memory");
+   }
+   for (i = 0; i < img_len; ++i)
+      reduced[i] = (stbi_uc)((orig[i] >> 8) & 0xFF); // the top byte of each 16-bit sample is a sufficient approximation
+   STBI_FREE(orig);
+   return reduced;
+}
+
+// Widens w*h*channels 8-bit samples to 16 bits each. Consumes 'orig': it is freed
+// on success and on failure. Returns the new buffer, or NULL if allocation fails.
+static stbi__uint16 *stbi__convert_8_to_16(stbi_uc *orig, int w, int h, int channels)
+{
+   int i, img_len = w * h * channels;
+   stbi__uint16 *enlarged = (stbi__uint16 *) stbi__malloc((size_t) img_len * 2); // multiply as size_t: img_len*2 could overflow int
+   if (enlarged == NULL) {
+      STBI_FREE(orig); // callers overwrite their only pointer with our result, so release it here
+      return (stbi__uint16 *) stbi__errpuc("outofmem", "Out of memory");
+   }
+   for (i = 0; i < img_len; ++i)
+      enlarged[i] = (stbi__uint16)((orig[i] << 8) + orig[i]); // replicate to high and low byte, maps 0->0, 255->0xffff
+   STBI_FREE(orig);
+   return enlarged;
+}
+
+// Reverses the row order of an image in place; each row is w*bytes_per_pixel bytes.
+static void stbi__vertical_flip(void *image, int w, int h, int bytes_per_pixel)
+{
+   size_t stride = (size_t)w * bytes_per_pixel;
+   stbi_uc *base = (stbi_uc *)image;
+   stbi_uc scratch[2048];
+   int top;
+   // walk inward from both ends; with an odd h the middle row stays where it is
+   for (top = 0; top < (h>>1); top++) {
+      stbi_uc *upper = base + top*stride;
+      stbi_uc *lower = base + (h - top - 1)*stride;
+      size_t remaining;
+      // exchange the two rows through the fixed-size scratch buffer, one chunk at a time
+      for (remaining = stride; remaining; ) {
+         size_t chunk = (remaining < sizeof(scratch)) ? remaining : sizeof(scratch);
+         memcpy(scratch, upper, chunk);
+         memcpy(upper, lower, chunk);
+         memcpy(lower, scratch, chunk);
+         upper += chunk; lower += chunk;
+         remaining -= chunk;
+      }
+   }
+}
+
+#ifndef STBI_NO_GIF
+static void stbi__vertical_flip_slices(void *image, int w, int h, int z, int bytes_per_pixel)
+{
+   // the buffer holds z consecutive slices of w*h pixels; flip each one independently
+   int slice_bytes = w * h * bytes_per_pixel;
+   stbi_uc *cursor = (stbi_uc *)image;
+   int remaining;
+
+   for (remaining = z; remaining > 0; --remaining, cursor += slice_bytes) {
+      stbi__vertical_flip(cursor, w, h, bytes_per_pixel);
+   }
+}
+#endif
+
+// Loads an image via stbi__load_main, narrows it to 8 bits per channel if needed and
+// applies the optional vertical flip. Returns NULL if loading or the conversion fails.
+static unsigned char *stbi__load_and_postprocess_8bit(stbi__context *s, int *x, int *y, int *comp, int req_comp)
+{
+   stbi__result_info ri;
+   void *result = stbi__load_main(s, x, y, comp, req_comp, &ri, 8);
+
+   if (result == NULL)
+      return NULL;
+
+   // it is the responsibility of the loaders to make sure we get either 8 or 16 bit.
+   STBI_ASSERT(ri.bits_per_channel == 8 || ri.bits_per_channel == 16);
+   if (ri.bits_per_channel != 8) {
+      result = stbi__convert_16_to_8((stbi__uint16 *) result, *x, *y, req_comp == 0 ? *comp : req_comp);
+      ri.bits_per_channel = 8;
+   }
+
+   // @TODO: move stbi__convert_format to here
+   // the conversion above returns NULL when out of memory, so re-check before touching pixels
+   if (result != NULL && stbi__vertically_flip_on_load) {
+      int channels = req_comp ? req_comp : *comp;
+      stbi__vertical_flip(result, *x, *y, channels * sizeof(stbi_uc));
+   }
+   return (unsigned char *) result;
+}
+
+// Loads an image via stbi__load_main, widens it to 16 bits per channel if needed and
+// applies the optional vertical flip. Returns NULL if loading or the conversion fails.
+static stbi__uint16 *stbi__load_and_postprocess_16bit(stbi__context *s, int *x, int *y, int *comp, int req_comp)
+{
+   stbi__result_info ri;
+   void *result = stbi__load_main(s, x, y, comp, req_comp, &ri, 16);
+
+   if (result == NULL)
+      return NULL;
+
+   // it is the responsibility of the loaders to make sure we get either 8 or 16 bit.
+   STBI_ASSERT(ri.bits_per_channel == 8 || ri.bits_per_channel == 16);
+   if (ri.bits_per_channel != 16) {
+      result = stbi__convert_8_to_16((stbi_uc *) result, *x, *y, req_comp == 0 ? *comp : req_comp);
+      ri.bits_per_channel = 16;
+   }
+
+   // @TODO: move stbi__convert_format16 to here
+   // @TODO: special case RGB-to-Y (and RGBA-to-YA) for 8-bit-to-16-bit case to keep more precision
+   // the conversion above returns NULL when out of memory, so re-check before touching pixels
+   if (result != NULL && stbi__vertically_flip_on_load) {
+      int channels = req_comp ? req_comp : *comp;
+      stbi__vertical_flip(result, *x, *y, channels * sizeof(stbi__uint16));
+   }
+   return (stbi__uint16 *) result;
+}
+
+#if !defined(STBI_NO_HDR) && !defined(STBI_NO_LINEAR)
+static void stbi__float_postprocess(float *result, int *x, int *y, int *comp, int req_comp)
+{
+   int channels;
+   if (result == NULL || !stbi__vertically_flip_on_load) return;   // nothing to flip
+   channels = req_comp ? req_comp : *comp;
+   stbi__vertical_flip(result, *x, *y, channels * sizeof(float));
+}
+#endif
+
+#ifndef STBI_NO_STDIO
+
+#if defined(_WIN32) && defined(STBI_WINDOWS_UTF8)
+STBI_EXTERN __declspec(dllimport) int __stdcall MultiByteToWideChar(unsigned int cp, unsigned long flags, const char *str, int cbmb, wchar_t *widestr, int cchwide);
+STBI_EXTERN __declspec(dllimport) int __stdcall WideCharToMultiByte(unsigned int cp, unsigned long flags, const wchar_t *widestr, int cchwide, char *str, int cbmb, const char *defchar, int *used_default);
+#endif
+
+#if defined(_WIN32) && defined(STBI_WINDOWS_UTF8)
+STBIDEF int stbi_convert_wchar_to_utf8(char *buffer, size_t bufferlen, const wchar_t* input)   // thin wrapper over WideCharToMultiByte
+{
+	return WideCharToMultiByte(65001 /* UTF8 */, 0, input, -1, buffer, (int) bufferlen, NULL, NULL);   // result is passed through unchanged
+}
+#endif
+
+static FILE *stbi__fopen(char const *filename, char const *mode)   // fopen wrapper; returns 0 when the file cannot be opened
+{
+   FILE *f;
+#if defined(_WIN32) && defined(STBI_WINDOWS_UTF8)
+   wchar_t wMode[64];
+   wchar_t wFilename[1024];
+	if (0 == MultiByteToWideChar(65001 /* UTF8 */, 0, filename, -1, wFilename, sizeof(wFilename)/sizeof(*wFilename)))
+      return 0;
+   // a 0 result from the conversion is treated as failure for both the filename and the mode
+	if (0 == MultiByteToWideChar(65001 /* UTF8 */, 0, mode, -1, wMode, sizeof(wMode)/sizeof(*wMode)))
+      return 0;
+
+#if defined(_MSC_VER) && _MSC_VER >= 1400
+	if (0 != _wfopen_s(&f, wFilename, wMode))
+		f = 0;
+#else
+   f = _wfopen(wFilename, wMode);
+#endif
+
+#elif defined(_MSC_VER) && _MSC_VER >= 1400
+   if (0 != fopen_s(&f, filename, mode))
+      f=0;
+#else
+   f = fopen(filename, mode);
+#endif
+   return f;
+}
+
+
+STBIDEF stbi_uc *stbi_load(char const *filename, int *x, int *y, int *comp, int req_comp)
+{
+   unsigned char *pixels;
+   FILE *fp = stbi__fopen(filename, "rb");
+   if (fp == NULL) return stbi__errpuc("can't fopen", "Unable to open file");
+   pixels = stbi_load_from_file(fp,x,y,comp,req_comp);
+   fclose(fp);   // this function opened the file, so it closes it whether or not decoding worked
+   return pixels;
+}
+
+STBIDEF stbi_uc *stbi_load_from_file(FILE *f, int *x, int *y, int *comp, int req_comp)
+{
+   stbi__context ctx;
+   unsigned char *pixels;
+   stbi__start_file(&ctx,f);
+   pixels = stbi__load_and_postprocess_8bit(&ctx,x,y,comp,req_comp);
+   if (pixels != NULL) {
+      // seek back over the bytes that were buffered but never consumed ('unget' them)
+      fseek(f, - (int) (ctx.img_buffer_end - ctx.img_buffer), SEEK_CUR);
+   }
+   return pixels;
+}
+
+STBIDEF stbi__uint16 *stbi_load_from_file_16(FILE *f, int *x, int *y, int *comp, int req_comp)
+{
+   stbi__context ctx;
+   stbi__uint16 *pixels;
+   stbi__start_file(&ctx,f);
+   pixels = stbi__load_and_postprocess_16bit(&ctx,x,y,comp,req_comp);
+   if (pixels != NULL) {
+      // seek back over the bytes that were buffered but never consumed ('unget' them)
+      fseek(f, - (int) (ctx.img_buffer_end - ctx.img_buffer), SEEK_CUR);
+   }
+   return pixels;
+}
+
+STBIDEF stbi_us *stbi_load_16(char const *filename, int *x, int *y, int *comp, int req_comp)
+{
+   stbi__uint16 *pixels;
+   FILE *fp = stbi__fopen(filename, "rb");
+   if (fp == NULL) return (stbi_us *) stbi__errpuc("can't fopen", "Unable to open file");
+   pixels = stbi_load_from_file_16(fp,x,y,comp,req_comp);
+   fclose(fp);   // this function opened the file, so it closes it whether or not decoding worked
+   return pixels;
+}
+
+
+#endif //!STBI_NO_STDIO
+
+STBIDEF stbi_us *stbi_load_16_from_memory(stbi_uc const *buffer, int len, int *x, int *y, int *channels_in_file, int desired_channels)
+{
+   stbi__context ctx;   // decode state for this call, reading from the caller's buffer
+   stbi__start_mem(&ctx, buffer, len);
+   return stbi__load_and_postprocess_16bit(&ctx, x, y, channels_in_file, desired_channels);
+}
+
+STBIDEF stbi_us *stbi_load_16_from_callbacks(stbi_io_callbacks const *clbk, void *user, int *x, int *y, int *channels_in_file, int desired_channels)
+{
+   stbi__context ctx;   // decode state for this call, fed by the caller's callbacks
+   stbi__start_callbacks(&ctx, (stbi_io_callbacks *)clbk, user);
+   return stbi__load_and_postprocess_16bit(&ctx, x, y, channels_in_file, desired_channels);
+}
+
+STBIDEF stbi_uc *stbi_load_from_memory(stbi_uc const *buffer, int len, int *x, int *y, int *comp, int req_comp)
+{
+   stbi__context ctx;   // decode state for this call, reading from the caller's buffer
+   stbi__start_mem(&ctx, buffer, len);
+   return stbi__load_and_postprocess_8bit(&ctx, x, y, comp, req_comp);
+}
+
+STBIDEF stbi_uc *stbi_load_from_callbacks(stbi_io_callbacks const *clbk, void *user, int *x, int *y, int *comp, int req_comp)
+{
+   stbi__context ctx;   // decode state for this call, fed by the caller's callbacks
+   stbi__start_callbacks(&ctx, (stbi_io_callbacks *) clbk, user);
+   return stbi__load_and_postprocess_8bit(&ctx, x, y, comp, req_comp);
+}
+
+#ifndef STBI_NO_GIF
+// Decodes a GIF held in memory via stbi__load_gif_main and applies the optional per-slice vertical flip.
+STBIDEF stbi_uc *stbi_load_gif_from_memory(stbi_uc const *buffer, int len, int **delays, int *x, int *y, int *z, int *comp, int req_comp)
+{
+   unsigned char *result;
+   stbi__context s;
+   stbi__start_mem(&s,buffer,len);
+   result = (unsigned char*) stbi__load_gif_main(&s, delays, x, y, z, comp, req_comp);
+   // a failed load yields NULL, and the size outputs may not have been written, so only flip real data
+   if (result != NULL && stbi__vertically_flip_on_load) {
+      stbi__vertical_flip_slices( result, *x, *y, *z, *comp );
+   }
+   return result;
+}
+#endif
+
+#ifndef STBI_NO_LINEAR
+static float *stbi__loadf_main(stbi__context *s, int *x, int *y, int *comp, int req_comp)
+{
+   unsigned char *data;
+   #ifndef STBI_NO_HDR
+   if (stbi__hdr_test(s)) {   // HDR input: load the float data directly
+      stbi__result_info ri;
+      float *hdr_data = stbi__hdr_load(s,x,y,comp,req_comp, &ri);
+      if (hdr_data)
+         stbi__float_postprocess(hdr_data,x,y,comp,req_comp);   // optional vertical flip
+      return hdr_data;
+   }
+   #endif
+   data = stbi__load_and_postprocess_8bit(s, x, y, comp, req_comp);   // otherwise load as 8-bit...
+   if (data)
+      return stbi__ldr_to_hdr(data, *x, *y, req_comp ? req_comp : *comp);   // ...and convert to float
+   return stbi__errpf("unknown image type", "Image not of any known type, or corrupt");   // NOTE(review): replaces any failure reason recorded by the 8-bit path
+}
+
+STBIDEF float *stbi_loadf_from_memory(stbi_uc const *buffer, int len, int *x, int *y, int *comp, int req_comp)
+{
+   stbi__context ctx;   // decode state for this call, reading from the caller's buffer
+   stbi__start_mem(&ctx, buffer, len);
+   return stbi__loadf_main(&ctx, x, y, comp, req_comp);
+}
+
+STBIDEF float *stbi_loadf_from_callbacks(stbi_io_callbacks const *clbk, void *user, int *x, int *y, int *comp, int req_comp)
+{
+   stbi__context ctx;   // decode state for this call, fed by the caller's callbacks
+   stbi__start_callbacks(&ctx, (stbi_io_callbacks *) clbk, user);
+   return stbi__loadf_main(&ctx, x, y, comp, req_comp);
+}
+
+#ifndef STBI_NO_STDIO
+STBIDEF float *stbi_loadf(char const *filename, int *x, int *y, int *comp, int req_comp)
+{
+   float *pixels;
+   FILE *fp = stbi__fopen(filename, "rb");
+   if (fp == NULL) return stbi__errpf("can't fopen", "Unable to open file");
+   pixels = stbi_loadf_from_file(fp,x,y,comp,req_comp);
+   fclose(fp);   // this function opened the file, so it closes it whether or not decoding worked
+   return pixels;
+}
+
+STBIDEF float *stbi_loadf_from_file(FILE *f, int *x, int *y, int *comp, int req_comp)
+{
+   stbi__context ctx;   // decode state for this call, reading through the stdio callbacks
+   stbi__start_file(&ctx, f);
+   return stbi__loadf_main(&ctx, x, y, comp, req_comp);
+}
+#endif // !STBI_NO_STDIO
+
+#endif // !STBI_NO_LINEAR
+
+// the is-hdr-or-not queries are defined regardless of which features are
+// compiled in, for API simplicity; if STBI_NO_HDR is defined, they always
+// report false!
+
+STBIDEF int stbi_is_hdr_from_memory(stbi_uc const *buffer, int len)   // result of stbi__hdr_test on a memory buffer
+{
+   #ifndef STBI_NO_HDR
+   stbi__context s;
+   stbi__start_mem(&s,buffer,len);
+   return stbi__hdr_test(&s);
+   #else
+   STBI_NOTUSED(buffer);
+   STBI_NOTUSED(len);
+   return 0;   // HDR support compiled out: always reports "not HDR"
+   #endif
+}
+
+#ifndef STBI_NO_STDIO
+// reports whether the named file passes the HDR test; a file that cannot be opened yields 0
+STBIDEF int      stbi_is_hdr          (char const *filename)
+{
+   int is_hdr;
+   FILE *fp = stbi__fopen(filename, "rb");
+   if (fp == NULL) return 0;
+   is_hdr = stbi_is_hdr_from_file(fp);
+   fclose(fp);
+   return is_hdr;
+}
+
+STBIDEF int stbi_is_hdr_from_file(FILE *f)   // result of stbi__hdr_test on an open file; the file position is restored
+{
+   #ifndef STBI_NO_HDR
+   long pos = ftell(f);   // remember where the caller's stream was
+   int res;
+   stbi__context s;
+   stbi__start_file(&s,f);
+   res = stbi__hdr_test(&s);
+   fseek(f, pos, SEEK_SET);   // undo whatever the test read
+   return res;
+   #else
+   STBI_NOTUSED(f);
+   return 0;   // HDR support compiled out: always reports "not HDR"
+   #endif
+}
+#endif // !STBI_NO_STDIO
+
+STBIDEF int      stbi_is_hdr_from_callbacks(stbi_io_callbacks const *clbk, void *user)   // result of stbi__hdr_test on callback input
+{
+   #ifndef STBI_NO_HDR
+   stbi__context s;
+   stbi__start_callbacks(&s, (stbi_io_callbacks *) clbk, user);
+   return stbi__hdr_test(&s);
+   #else
+   STBI_NOTUSED(clbk);
+   STBI_NOTUSED(user);
+   return 0;   // HDR support compiled out: always reports "not HDR"
+   #endif
+}
+
+#ifndef STBI_NO_LINEAR
+static float stbi__l2h_gamma=2.2f, stbi__l2h_scale=1.0f;
+
+STBIDEF void   stbi_ldr_to_hdr_gamma(float gamma) { stbi__l2h_gamma = gamma; }
+STBIDEF void   stbi_ldr_to_hdr_scale(float scale) { stbi__l2h_scale = scale; }
+#endif
+
+static float stbi__h2l_gamma_i=1.0f/2.2f, stbi__h2l_scale_i=1.0f;
+
+STBIDEF void   stbi_hdr_to_ldr_gamma(float gamma) { stbi__h2l_gamma_i = 1/gamma; }
+STBIDEF void   stbi_hdr_to_ldr_scale(float scale) { stbi__h2l_scale_i = 1/scale; }
+
+
+//////////////////////////////////////////////////////////////////////////////
+//
+// Common code used by all image loaders
+//
+
+enum
+{
+   STBI__SCAN_load=0,
+   STBI__SCAN_type,
+   STBI__SCAN_header
+};
+
+// Pulls the next chunk from the read callback into buffer_start and points the cursor at it.
+static void stbi__refill_buffer(stbi__context *s)
+{
+   int n = (s->io.read)(s->io_user_data,(char*)s->buffer_start,s->buflen);
+   s->callback_already_read += (int) (s->img_buffer - s->img_buffer_original);
+   s->img_buffer = s->buffer_start;
+   if (n <= 0) {
+      // end of file (or a callback returning a negative count): treat the same as if from
+      // memory, leaving one readable 0 byte so img_buffer is safe even for a 0-byte file
+      s->read_from_callbacks = 0;
+      s->img_buffer_end = s->buffer_start+1;
+      *s->img_buffer = 0;
+   } else {
+      s->img_buffer_end = s->buffer_start + n;
+   }
+}
+
+// returns the next input byte, or 0 once the input is exhausted
+stbi_inline static stbi_uc stbi__get8(stbi__context *s)
+{
+   // buffer drained: refill if the callbacks can still supply data, else report 0
+   if (s->img_buffer >= s->img_buffer_end) {
+      if (!s->read_from_callbacks) return 0;
+      stbi__refill_buffer(s);
+   }
+   return *s->img_buffer++;
+}
+
+#if defined(STBI_NO_JPEG) && defined(STBI_NO_HDR) && defined(STBI_NO_PIC) && defined(STBI_NO_PNM)
+// nothing
+#else
+stbi_inline static int stbi__at_eof(stbi__context *s)   // nonzero once no more input is available
+{
+   if (s->io.read) {
+      if (!(s->io.eof)(s->io_user_data)) return 0;   // the callback source reports more data
+      // if feof() is true, check if buffer = end
+      // special case: we've only got the special 0 character at the end
+      if (s->read_from_callbacks == 0) return 1;
+   }
+
+   return s->img_buffer >= s->img_buffer_end;   // otherwise: at EOF once the buffered bytes are used up
+}
+#endif
+
+#if defined(STBI_NO_JPEG) && defined(STBI_NO_PNG) && defined(STBI_NO_BMP) && defined(STBI_NO_PSD) && defined(STBI_NO_TGA) && defined(STBI_NO_GIF) && defined(STBI_NO_PIC)
+// nothing
+#else
+// Advances the read position by n bytes; a negative n jumps to the end of the buffered data.
+static void stbi__skip(stbi__context *s, int n)
+{
+   int blen = (int) (s->img_buffer_end - s->img_buffer);   // bytes still buffered
+   if (n == 0) return;  // already there!
+   if (n < 0) {
+      s->img_buffer = s->img_buffer_end;
+      return;
+   }
+   if (blen < n) {
+      // park the cursor at the end instead of forming an out-of-range pointer
+      s->img_buffer = s->img_buffer_end;
+      if (s->io.read) (s->io.skip)(s->io_user_data, n - blen);   // callback source: skip the rest there
+      return;
+   }
+   s->img_buffer += n;
+}
+#endif
+
+#if defined(STBI_NO_PNG) && defined(STBI_NO_TGA) && defined(STBI_NO_HDR) && defined(STBI_NO_PNM)
+// nothing
+#else
+static int stbi__getn(stbi__context *s, stbi_uc *buffer, int n)
+{
+   // Copy exactly n input bytes into buffer. Returns 1 on success, 0 when
+   // fewer than n bytes are available or n is negative.
+   int blen = (int) (s->img_buffer_end - s->img_buffer);
+   if (n < 0) return 0;
+   if (s->io.read) {
+      if (blen < n) {
+         int res, count;
+         // hand over what is buffered, then read the rest straight into buffer
+         memcpy(buffer, s->img_buffer, blen);
+         count = (s->io.read)(s->io_user_data, (char*) buffer + blen, n - blen);
+         res = (count == (n-blen));
+         s->img_buffer = s->img_buffer_end;
+         return res;
+      }
+   }
+   // compare lengths: forming img_buffer+n past the end of the buffer would be undefined behaviour
+   if (n > blen) return 0;
+   memcpy(buffer, s->img_buffer, n);
+   s->img_buffer += n;
+   return 1;
+}
+#endif
+
+#if defined(STBI_NO_JPEG) && defined(STBI_NO_PNG) && defined(STBI_NO_PSD) && defined(STBI_NO_PIC)
+// nothing
+#else
+static int stbi__get16be(stbi__context *s)
+{  // read a 16-bit big-endian value: most significant byte first
+   int hi = stbi__get8(s), lo = stbi__get8(s);
+   return (hi << 8) | lo;
+}
+#endif
+
+#if defined(STBI_NO_PNG) && defined(STBI_NO_PSD) && defined(STBI_NO_PIC)
+// nothing
+#else
+static stbi__uint32 stbi__get32be(stbi__context *s)
+{  // read a 32-bit big-endian value as two 16-bit halves, high half first
+   stbi__uint32 hi = stbi__get16be(s), lo = stbi__get16be(s);
+   return (hi << 16) | lo;
+}
+#endif
+
+#if defined(STBI_NO_BMP) && defined(STBI_NO_TGA) && defined(STBI_NO_GIF)
+// nothing
+#else
+static int stbi__get16le(stbi__context *s)
+{  // read a 16-bit little-endian value: least significant byte first
+   int lo = stbi__get8(s), hi = stbi__get8(s);
+   return lo | (hi << 8);
+}
+#endif
+
+#ifndef STBI_NO_BMP
+static stbi__uint32 stbi__get32le(stbi__context *s)
+{  // read a 32-bit little-endian value as two 16-bit halves, low half first
+   stbi__uint32 lo = stbi__get16le(s);
+   stbi__uint32 hi = stbi__get16le(s);
+   return lo | (hi << 16);
+}
+#endif
+
+#define STBI__BYTECAST(x)  ((stbi_uc) ((x) & 255))  // truncate int to byte without warnings
+
+#if defined(STBI_NO_JPEG) && defined(STBI_NO_PNG) && defined(STBI_NO_BMP) && defined(STBI_NO_PSD) && defined(STBI_NO_TGA) && defined(STBI_NO_GIF) && defined(STBI_NO_PIC) && defined(STBI_NO_PNM)
+// nothing
+#else
+//////////////////////////////////////////////////////////////////////////////
+//
+//  generic converter from built-in img_n to req_comp
+//    individual types do this automatically as much as possible (e.g. jpeg
+//    does all cases internally since it needs to colorspace convert anyway,
+//    and it never has alpha, so very few cases ). png can automatically
+//    interleave an alpha=255 channel, but falls back to this for other cases
+//
+//  assume data buffer is malloced, so malloc a new one and free that one
+//  only failure mode is malloc failing
+
+static stbi_uc stbi__compute_y(int r, int g, int b)
+{  // weighted sum of r,g,b with weights 77, 150, 29 (total 256), scaled back by >>8
+   return (stbi_uc) ((77*r + 150*g + 29*b) >> 8);
+}
+#endif
+
+#if defined(STBI_NO_PNG) && defined(STBI_NO_BMP) && defined(STBI_NO_PSD) && defined(STBI_NO_TGA) && defined(STBI_NO_GIF) && defined(STBI_NO_PIC) && defined(STBI_NO_PNM)
+// nothing
+#else
+static unsigned char *stbi__convert_format(unsigned char *data, int img_n, int req_comp, unsigned int x, unsigned int y)
+{
+   int i,j;
+   unsigned char *good;
+   // Converts an x-by-y image of 8-bit samples from img_n to req_comp channels per pixel.
+   if (req_comp == img_n) return data;   // nothing to do: the input buffer itself is returned
+   STBI_ASSERT(req_comp >= 1 && req_comp <= 4);
+   // Otherwise a newly allocated buffer is returned and data is freed (it is freed on the failure paths too).
+   good = (unsigned char *) stbi__malloc_mad3(req_comp, x, y, 0);
+   if (good == NULL) {
+      STBI_FREE(data);
+      return stbi__errpuc("outofmem", "Out of memory");
+   }
+   // one pass per scanline; src and dest advance together through the row
+   for (j=0; j < (int) y; ++j) {
+      unsigned char *src  = data + j * x * img_n   ;
+      unsigned char *dest = good + j * x * req_comp;
+
+      #define STBI__COMBO(a,b)  ((a)*8+(b))
+      #define STBI__CASE(a,b)   case STBI__COMBO(a,b): for(i=x-1; i >= 0; --i, src += a, dest += b)
+      // convert source image with img_n components to one with req_comp components;
+      // avoid switch per pixel, so use switch per scanline and massive macros
+      switch (STBI__COMBO(img_n, req_comp)) {
+         STBI__CASE(1,2) { dest[0]=src[0]; dest[1]=255;                                     } break;
+         STBI__CASE(1,3) { dest[0]=dest[1]=dest[2]=src[0];                                  } break;
+         STBI__CASE(1,4) { dest[0]=dest[1]=dest[2]=src[0]; dest[3]=255;                     } break;
+         STBI__CASE(2,1) { dest[0]=src[0];                                                  } break;
+         STBI__CASE(2,3) { dest[0]=dest[1]=dest[2]=src[0];                                  } break;
+         STBI__CASE(2,4) { dest[0]=dest[1]=dest[2]=src[0]; dest[3]=src[1];                  } break;
+         STBI__CASE(3,4) { dest[0]=src[0];dest[1]=src[1];dest[2]=src[2];dest[3]=255;        } break;
+         STBI__CASE(3,1) { dest[0]=stbi__compute_y(src[0],src[1],src[2]);                   } break;
+         STBI__CASE(3,2) { dest[0]=stbi__compute_y(src[0],src[1],src[2]); dest[1] = 255;    } break;
+         STBI__CASE(4,1) { dest[0]=stbi__compute_y(src[0],src[1],src[2]);                   } break;
+         STBI__CASE(4,2) { dest[0]=stbi__compute_y(src[0],src[1],src[2]); dest[1] = src[3]; } break;
+         STBI__CASE(4,3) { dest[0]=src[0];dest[1]=src[1];dest[2]=src[2];                    } break;
+         default: STBI_ASSERT(0); STBI_FREE(data); STBI_FREE(good); return stbi__errpuc("unsupported", "Unsupported format conversion");
+      }
+      #undef STBI__CASE
+   }
+
+   STBI_FREE(data);
+   return good;
+}
+#endif
+
+#if defined(STBI_NO_PNG) && defined(STBI_NO_PSD)
+// nothing
+#else
+static stbi__uint16 stbi__compute_y_16(int r, int g, int b)
+{  // weighted sum of r,g,b with weights 77, 150, 29 (total 256), scaled back by >>8
+   return (stbi__uint16) ((77*r + 150*g + 29*b) >> 8);
+}
+#endif
+
+#if defined(STBI_NO_PNG) && defined(STBI_NO_PSD)
+// nothing
+#else
+static stbi__uint16 *stbi__convert_format16(stbi__uint16 *data, int img_n, int req_comp, unsigned int x, unsigned int y)
+{
+   // Converts an x-by-y image of 16-bit samples from img_n to req_comp channels per pixel.
+   int i,j;
+   stbi__uint16 *good;
+   if (req_comp == img_n) return data;   // nothing to do: the input buffer itself is returned
+   STBI_ASSERT(req_comp >= 1 && req_comp <= 4);
+   // overflow-checked size (2 bytes per sample), matching the 8-bit converter; plain req_comp*x*y*2 can wrap
+   good = (stbi__uint16 *) stbi__malloc_mad3(req_comp * 2, x, y, 0);
+   if (good == NULL) {
+      STBI_FREE(data);
+      return (stbi__uint16 *) stbi__errpuc("outofmem", "Out of memory");
+   }
+   // one pass per scanline; src and dest advance together through the row
+   for (j=0; j < (int) y; ++j) {
+      stbi__uint16 *src  = data + j * x * img_n   ;
+      stbi__uint16 *dest = good + j * x * req_comp;
+
+      #define STBI__COMBO(a,b)  ((a)*8+(b))
+      #define STBI__CASE(a,b)   case STBI__COMBO(a,b): for(i=x-1; i >= 0; --i, src += a, dest += b)
+      // convert source image with img_n components to one with req_comp components;
+      // avoid switch per pixel, so use switch per scanline and massive macros
+      switch (STBI__COMBO(img_n, req_comp)) {
+         STBI__CASE(1,2) { dest[0]=src[0]; dest[1]=0xffff;                                     } break;
+         STBI__CASE(1,3) { dest[0]=dest[1]=dest[2]=src[0];                                     } break;
+         STBI__CASE(1,4) { dest[0]=dest[1]=dest[2]=src[0]; dest[3]=0xffff;                     } break;
+         STBI__CASE(2,1) { dest[0]=src[0];                                                     } break;
+         STBI__CASE(2,3) { dest[0]=dest[1]=dest[2]=src[0];                                     } break;
+         STBI__CASE(2,4) { dest[0]=dest[1]=dest[2]=src[0]; dest[3]=src[1];                     } break;
+         STBI__CASE(3,4) { dest[0]=src[0];dest[1]=src[1];dest[2]=src[2];dest[3]=0xffff;        } break;
+         STBI__CASE(3,1) { dest[0]=stbi__compute_y_16(src[0],src[1],src[2]);                   } break;
+         STBI__CASE(3,2) { dest[0]=stbi__compute_y_16(src[0],src[1],src[2]); dest[1] = 0xffff; } break;
+         STBI__CASE(4,1) { dest[0]=stbi__compute_y_16(src[0],src[1],src[2]);                   } break;
+         STBI__CASE(4,2) { dest[0]=stbi__compute_y_16(src[0],src[1],src[2]); dest[1] = src[3]; } break;
+         STBI__CASE(4,3) { dest[0]=src[0];dest[1]=src[1];dest[2]=src[2];                       } break;
+         default: STBI_ASSERT(0); STBI_FREE(data); STBI_FREE(good); return (stbi__uint16*) stbi__errpuc("unsupported", "Unsupported format conversion");
+      }
+      #undef STBI__CASE
+   }
+
+   STBI_FREE(data);
+   return good;
+}
+#endif
+
+#ifndef STBI_NO_LINEAR
+static float   *stbi__ldr_to_hdr(stbi_uc *data, int x, int y, int comp)
+{
+   // Convert 8-bit samples to float: colour channels go through the
+   // stbi__l2h_gamma / stbi__l2h_scale curve, alpha is divided by 255.
+   // data is freed on every path where it is non-NULL.
+   int px, ch, color_n, total;
+   float *output;
+   if (data == NULL) return NULL;
+   output = (float *) stbi__malloc_mad4(x, y, comp, sizeof(float), 0);
+   if (!output) { STBI_FREE(data); return stbi__errpf("outofmem", "Out of memory"); }
+   color_n = (comp & 1) ? comp : comp-1;   // an even component count means the last channel is alpha
+   total = x*y;
+   for (px=0; px < total; ++px) {
+      const stbi_uc *in = data + px*comp;
+      float *out = output + px*comp;
+      for (ch=0; ch < color_n; ++ch)
+         out[ch] = (float) (pow(in[ch]/255.0f, stbi__l2h_gamma) * stbi__l2h_scale);
+      if (color_n < comp) out[color_n] = in[color_n]/255.0f;
+   }
+   STBI_FREE(data);
+   return output;
+}
+#endif
+
+#ifndef STBI_NO_HDR
+#define stbi__float2int(x)   ((int) (x))
+static stbi_uc *stbi__hdr_to_ldr(float   *data, int x, int y, int comp)
+{
+   // Convert float samples to 8-bit: colour channels go through the
+   // stbi__h2l_scale_i / stbi__h2l_gamma_i curve, alpha is scaled directly;
+   // results are biased by 0.5, clamped to 0..255 and truncated. Frees data.
+   int px, ch, color_n, total;
+   stbi_uc *output;
+   if (data == NULL) return NULL;
+   output = (stbi_uc *) stbi__malloc_mad3(x, y, comp, 0);
+   if (!output) { STBI_FREE(data); return stbi__errpuc("outofmem", "Out of memory"); }
+   color_n = (comp & 1) ? comp : comp-1;   // an even component count means the last channel is alpha
+   total = x*y;
+   for (px=0; px < total; ++px) {
+      const float *in = data + px*comp;
+      stbi_uc *out = output + px*comp;
+      for (ch=0; ch < comp; ++ch) {
+         float z = (ch < color_n)
+            ? (float) pow(in[ch]*stbi__h2l_scale_i, stbi__h2l_gamma_i) * 255 + 0.5f
+            : in[ch] * 255 + 0.5f;
+         if (z < 0) z = 0; else if (z > 255) z = 255;
+         out[ch] = (stbi_uc) stbi__float2int(z);
+      }
+   }
+   STBI_FREE(data);
+   return output;
+}
+#endif
+
+//////////////////////////////////////////////////////////////////////////////
+//
+//  "baseline" JPEG/JFIF decoder
+//
+//    simple implementation
+//      - doesn't support delayed output of y-dimension
+//      - simple interface (only one output format: 8-bit interleaved RGB)
+//      - doesn't try to recover corrupt jpegs
+//      - doesn't allow partial loading, loading multiple at once
+//      - still fast on x86 (copying globals into locals doesn't help x86)
+//      - allocates lots of intermediate memory (full size of all components)
+//        - non-interleaved case requires this anyway
+//        - allows good upsampling (see next)
+//    high-quality
+//      - upsampled channels are bilinearly interpolated, even across blocks
+//      - quality integer IDCT derived from IJG's 'slow'
+//    performance
+//      - fast huffman; reasonable integer IDCT
+//      - some SIMD kernels for common paths on targets with SSE2/NEON
+//      - uses a lot of intermediate memory, could cache poorly
+
+#ifndef STBI_NO_JPEG
+
+// huffman decoding acceleration
+#define FAST_BITS   9  // larger handles more cases; smaller stomps less cache
+
+typedef struct
+{
+   stbi_uc  fast[1 << FAST_BITS];   // top FAST_BITS bits of the stream -> symbol index; 255 = not accelerated
+   // weirdly, repacking this into AoS is a 10% speed loss, instead of a win
+   stbi__uint16 code[256];          // huffman code assigned to each symbol index
+   stbi_uc  values[256];            // value returned by the decoder for each symbol index
+   stbi_uc  size[257];              // code length in bits for each symbol index; the list is terminated by a 0 entry
+   unsigned int maxcode[18];        // per code length: largest code + 1, preshifted left to 16 bits
+   int    delta[17];   // old 'firstsymbol' - old 'firstcode'
+} stbi__huffman;
+
+typedef struct
+{
+   stbi__context *s;                        // input stream the entropy decoder pulls bytes from
+   stbi__huffman huff_dc[4];
+   stbi__huffman huff_ac[4];
+   stbi__uint16 dequant[4][64];
+   stbi__int16 fast_ac[4][1 << FAST_BITS];  // NOTE(review): presumably one stbi__build_fast_ac table per AC huffman table -- confirm
+
+// sizes for components, interleaved MCUs
+   int img_h_max, img_v_max;
+   int img_mcu_x, img_mcu_y;
+   int img_mcu_w, img_mcu_h;
+
+// definition of jpeg image component
+   struct
+   {
+      int id;
+      int h,v;
+      int tq;
+      int hd,ha;
+      int dc_pred;                          // running DC value; each decoded DC difference is added to it
+
+      int x,y,w2,h2;
+      stbi_uc *data;
+      void *raw_data, *raw_coeff;
+      stbi_uc *linebuf;
+      short   *coeff;   // progressive only
+      int      coeff_w, coeff_h; // number of 8x8 coefficient blocks
+   } img_comp[4];
+
+   stbi__uint32   code_buffer; // jpeg entropy-coded buffer
+   int            code_bits;   // number of valid bits
+   unsigned char  marker;      // marker seen while filling entropy buffer
+   int            nomore;      // flag if we saw a marker so must stop
+
+   int            progressive;
+   int            spec_start;  // first zigzag index handled by the current progressive scan
+   int            spec_end;    // last zigzag index handled by the current progressive scan
+   int            succ_high;   // 0 on a first pass, non-zero on a refinement pass
+   int            succ_low;    // bit position: coefficients are scaled by 1 << succ_low
+   int            eob_run;     // remaining blocks for which the progressive AC decoder only counts down (first pass) or refines existing coefficients
+   int            jfif;
+   int            app14_color_transform; // Adobe APP14 tag
+   int            rgb;
+
+   int scan_n, order[4];
+   int restart_interval, todo;
+
+// kernels
+   void (*idct_block_kernel)(stbi_uc *out, int out_stride, short data[64]);
+   void (*YCbCr_to_RGB_kernel)(stbi_uc *out, const stbi_uc *y, const stbi_uc *pcb, const stbi_uc *pcr, int count, int step);
+   stbi_uc *(*resample_row_hv_2_kernel)(stbi_uc *out, stbi_uc *in_near, stbi_uc *in_far, int w, int hs);
+} stbi__jpeg;
+
+static int stbi__build_huffman(stbi__huffman *h, int *count)
+{
+   // Build the decode tables in h from count[0..15] (number of codes of length 1..16).
+   // Returns 1 on success, or the stbi__err() result when the counts are corrupt.
+   int i,j,k=0;
+   unsigned int code;
+   // build size list for each symbol (from JPEG spec); the tables hold at most
+   // 256 symbols, so reject counts that would write past h->size / h->code
+   for (i=0; i < 16; ++i)
+      for (j=0; j < count[i]; ++j) {
+         if (k >= 256) return stbi__err("bad size list","Corrupt JPEG");
+         h->size[k++] = (stbi_uc) (i+1);
+      }
+   h->size[k] = 0;
+   // compute actual symbols (from jpeg spec)
+   code = 0; k = 0;
+   for(j=1; j <= 16; ++j) {
+      // compute delta to add to code to compute symbol id
+      h->delta[j] = k - code;
+      if (h->size[k] == j) {
+         while (h->size[k] == j)
+            h->code[k++] = (stbi__uint16) (code++);
+         if (code-1 >= (1u << j)) return stbi__err("bad code lengths","Corrupt JPEG");
+      }
+      // compute largest code + 1 for this size, preshifted as needed later
+      h->maxcode[j] = code << (16-j);
+      code <<= 1;
+   }
+   h->maxcode[j] = 0xffffffff;
+   // build non-spec acceleration table; 255 is flag for not-accelerated
+   memset(h->fast, 255, 1 << FAST_BITS);
+   for (i=0; i < k; ++i) {
+      int s = h->size[i];
+      if (s <= FAST_BITS) {
+         int c = h->code[i] << (FAST_BITS-s);
+         int m = 1 << (FAST_BITS-s);
+         for (j=0; j < m; ++j) h->fast[c+j] = (stbi_uc) i;
+      }
+   }
+   return 1;
+}
+
+// build a table that decodes both magnitude and value of small ACs in
+// one go.
+static void stbi__build_fast_ac(stbi__int16 *fast_ac, stbi__huffman *h)
+{
+   // For every FAST_BITS-wide bit pattern, precompute value, zero run and total bit
+   // length when code plus magnitude bits fit in the pattern; 0 means "no fast entry".
+   int i;
+   for (i=0; i < (1 << FAST_BITS); ++i) {
+      int sym = h->fast[i];
+      int rs, run, magbits, len, k, m;
+      fast_ac[i] = 0;
+      if (sym >= 255) continue;   // pattern not covered by the fast huffman table
+      rs = h->values[sym];
+      run = (rs >> 4) & 15;
+      magbits = rs & 15;
+      len = h->size[sym];
+      if (!magbits || len + magbits > FAST_BITS) continue;
+      // magnitude code followed by receive_extend code
+      k = ((i << len) & ((1 << FAST_BITS) - 1)) >> (FAST_BITS - magbits);
+      m = 1 << (magbits - 1);
+      if (k < m) k += (~0U << magbits) + 1;
+      // if the result is small enough, we can fit it in fast_ac table
+      if (k >= -128 && k <= 127)
+         fast_ac[i] = (stbi__int16) ((k * 256) + (run * 16) + (len + magbits));
+   }
+}
+
+static void stbi__grow_buffer_unsafe(stbi__jpeg *j)
+{  // append input bytes to code_buffer until it holds more than 24 bits
+   do {
+      unsigned int byte = 0;
+      if (!j->nomore) byte = stbi__get8(j->s);
+      if (byte == 0xff) {
+         int next;
+         do { next = stbi__get8(j->s); } while (next == 0xff); // consume fill bytes
+         if (next != 0) {   // 0xff followed by a non-zero byte is a marker: record it and stop reading
+            j->marker = (unsigned char) next; j->nomore = 1;
+            return;
+         }
+      }
+      j->code_buffer |= byte << (24 - j->code_bits);
+      j->code_bits += 8;
+   } while (j->code_bits <= 24);
+}
+
+// stbi__bmask[n] = (1 << n) - 1: mask selecting the low n bits, for n in 0..16
+static const stbi__uint32 stbi__bmask[17]={0,1,3,7,15,31,63,127,255,511,1023,2047,4095,8191,16383,32767,65535};
+
+// decode a jpeg huffman value from the bitstream
+stbi_inline static int stbi__jpeg_huff_decode(stbi__jpeg *j, stbi__huffman *h)
+{
+   // Decode one huffman symbol using table h and consume its bits.
+   // Returns the symbol's value, or -1 if the bits match no code or too few bits are left.
+   unsigned int temp;
+   int c,k;
+   if (j->code_bits < 16) stbi__grow_buffer_unsafe(j);
+
+   // look at the top FAST_BITS and determine what symbol ID it is,
+   // if the code is <= FAST_BITS
+   c = (j->code_buffer >> (32 - FAST_BITS)) & ((1 << FAST_BITS)-1);
+   k = h->fast[c];
+   if (k < 255) {
+      int s = h->size[k];
+      if (s > j->code_bits) return -1;
+      j->code_buffer <<= s;
+      j->code_bits -= s;
+      return h->values[k];
+   }
+
+   // naive test is to shift the code_buffer down so k bits are
+   // valid, then test against maxcode. To speed this up, we've
+   // preshifted maxcode left so that it has (16-k) 0s at the
+   // end; in other words, regardless of the number of bits, it
+   // wants to be compared against something shifted to have 16;
+   // that way we don't need to shift inside the loop.
+   temp = j->code_buffer >> 16;
+   for (k=FAST_BITS+1 ; ; ++k)
+      if (temp < h->maxcode[k])
+         break;
+   if (k == 17) {
+      // error! code not found
+      j->code_bits -= 16;
+      return -1;
+   }
+
+   if (k > j->code_bits)
+      return -1;
+
+   // convert the huffman code to the symbol id
+   c = ((j->code_buffer >> (32 - k)) & stbi__bmask[k]) + h->delta[k];
+   if (c < 0 || c >= 256) return -1; // corrupt table: symbol id would index outside size/code/values
+   STBI_ASSERT((((j->code_buffer) >> (32 - h->size[c])) & stbi__bmask[h->size[c]]) == h->code[c]);
+   // convert the id to a symbol
+   j->code_bits -= k;
+   j->code_buffer <<= k;
+   return h->values[c];
+}
+
+// stbi__jbias[n] = 1 - 2^n for n in 0..15: the offset stbi__extend_receive adds when the leading bit of the n-bit field is 0
+static const int stbi__jbias[16] = {0,-1,-3,-7,-15,-31,-63,-127,-255,-511,-1023,-2047,-4095,-8191,-16383,-32767};
+
+// combined JPEG 'receive' and JPEG 'extend', since baseline
+// always extends everything it receives.
+stbi_inline static int stbi__extend_receive(stbi__jpeg *j, int n)
+{  // read an n-bit field and sign-extend it; returns 0 if the stream cannot supply n bits
+   unsigned int k;
+   int sgn;
+   if (j->code_bits < n) stbi__grow_buffer_unsafe(j);
+   if (j->code_bits < n) return 0; // out of bits (refill stopped at a marker): don't let code_bits go negative
+   sgn = j->code_buffer >> 31; // sign bit always in MSB; 0 if MSB clear (positive), 1 if MSB set (negative)
+   k = stbi_lrot(j->code_buffer, n);
+   j->code_buffer = k & ~stbi__bmask[n];
+   k &= stbi__bmask[n];
+   j->code_bits -= n;
+   return k + (stbi__jbias[n] & (sgn - 1));
+}
+
+// get some unsigned bits
+stbi_inline static int stbi__jpeg_get_bits(stbi__jpeg *j, int n)
+{  // read n bits as an unsigned value; returns 0 if the stream cannot supply n bits
+   unsigned int k;
+   if (j->code_bits < n) stbi__grow_buffer_unsafe(j);
+   if (j->code_bits < n) return 0; // out of bits (refill stopped at a marker): don't let code_bits go negative
+   k = stbi_lrot(j->code_buffer, n);
+   j->code_buffer = k & ~stbi__bmask[n];
+   j->code_bits -= n;
+   return k & stbi__bmask[n];
+}
+
+stbi_inline static int stbi__jpeg_get_bit(stbi__jpeg *j)
+{  // read one bit: non-zero if it is set, 0 if it is clear or the stream cannot supply it
+   unsigned int k;
+   if (j->code_bits < 1) stbi__grow_buffer_unsafe(j);
+   if (j->code_bits < 1) return 0; // out of bits (refill stopped at a marker): don't let code_bits go negative
+   k = j->code_buffer;
+   j->code_buffer <<= 1; --j->code_bits;
+   return k & 0x80000000;
+}
+
+// given a value that's at position X in the zigzag stream,
+// where does it appear in the 8x8 matrix coded as row-major?
+static const stbi_uc stbi__jpeg_dezigzag[64+15] =
+{
+    0,  1,  8, 16,  9,  2,  3, 10,
+   17, 24, 32, 25, 18, 11,  4,  5,
+   12, 19, 26, 33, 40, 48, 41, 34,
+   27, 20, 13,  6,  7, 14, 21, 28,
+   35, 42, 49, 56, 57, 50, 43, 36,
+   29, 22, 15, 23, 30, 37, 44, 51,
+   58, 59, 52, 45, 38, 31, 39, 46,
+   53, 60, 61, 54, 47, 55, 62, 63,
+   // let corrupt input sample past end: the block decoder adds a run of up to 15 to an index below 64 before the lookup
+   63, 63, 63, 63, 63, 63, 63, 63,
+   63, 63, 63, 63, 63, 63, 63
+};
+
+// decode one 64-entry block--
+static int stbi__jpeg_decode_block(stbi__jpeg *j, short data[64], stbi__huffman *hdc, stbi__huffman *hac, stbi__int16 *fac, int b, stbi__uint16 *dequant)
+{
+   // Decode one 8x8 block of component b into data: coefficients are multiplied by dequant and
+   // stored de-zigzagged. Returns 1 on success, or the stbi__err() result for a corrupt stream.
+   int diff,dc,k;
+   int t;
+   if (j->code_bits < 16) stbi__grow_buffer_unsafe(j);
+   t = stbi__jpeg_huff_decode(j, hdc);
+   if (t < 0 || t > 15) return stbi__err("bad huffman code","Corrupt JPEG");
+   // 0 all the ac values now so we can do it 32-bits at a time
+   memset(data,0,64*sizeof(data[0]));
+   diff = t ? stbi__extend_receive(j, t) : 0;
+   dc = j->img_comp[b].dc_pred + diff;
+   j->img_comp[b].dc_pred = dc;
+   data[0] = (short) (dc * dequant[0]);
+
+   // decode AC components, see JPEG spec
+   k = 1;
+   do {
+      unsigned int zig;
+      int c,r,s;
+      if (j->code_bits < 16) stbi__grow_buffer_unsafe(j);
+      c = (j->code_buffer >> (32 - FAST_BITS)) & ((1 << FAST_BITS)-1);
+      r = fac[c];
+      if (r) { // fast-AC path
+         k += (r >> 4) & 15; // run
+         s = r & 15; // combined length
+         if (s > j->code_bits) return stbi__err("bad huffman code", "Combined length longer than code bits available");
+         j->code_buffer <<= s;
+         j->code_bits -= s;
+         // decode into unzigzag'd location
+         zig = stbi__jpeg_dezigzag[k++];
+         data[zig] = (short) ((r >> 8) * dequant[zig]);
+      } else {
+         int rs = stbi__jpeg_huff_decode(j, hac);
+         if (rs < 0) return stbi__err("bad huffman code","Corrupt JPEG");
+         s = rs & 15;
+         r = rs >> 4;
+         if (s == 0) {
+            if (rs != 0xf0) break; // end block
+            k += 16;
+         } else {
+            k += r;
+            // decode into unzigzag'd location
+            zig = stbi__jpeg_dezigzag[k++];
+            data[zig] = (short) (stbi__extend_receive(j,s) * dequant[zig]);
+         }
+      }
+   } while (k < 64);
+   return 1;
+}
+
+static int stbi__jpeg_decode_block_prog_dc(stbi__jpeg *j, short data[64], stbi__huffman *hdc, int b)
+{
+   // Progressive DC scan for one block of component b. The first pass
+   // (succ_high == 0) decodes the DC difference and stores the DC scaled by
+   // 1 << succ_low; a refinement pass adds one more bit at position succ_low.
+   // Returns 1 on success, or the stbi__err() result for a corrupt stream.
+   int t, diff, dc;
+   if (j->spec_end != 0) return stbi__err("can't merge dc and ac", "Corrupt JPEG");
+   if (j->code_bits < 16) stbi__grow_buffer_unsafe(j);
+   if (j->succ_high != 0) {
+      // refinement scan for DC coefficient
+      if (stbi__jpeg_get_bit(j)) data[0] += (short) (1 << j->succ_low);
+      return 1;
+   }
+   // first scan for DC coefficient, must be first
+   memset(data,0,64*sizeof(data[0])); // 0 all the ac values now
+   t = stbi__jpeg_huff_decode(j, hdc);
+   if (t < 0 || t > 15) return stbi__err("can't merge dc and ac", "Corrupt JPEG");
+   diff = 0;
+   if (t) diff = stbi__extend_receive(j, t);
+   dc = j->img_comp[b].dc_pred + diff;
+   j->img_comp[b].dc_pred = dc;
+   data[0] = (short) (dc * (1 << j->succ_low));
+   return 1;
+}
+
+// @OPTIMIZE: store non-zigzagged during the decode passes,
+// and only de-zigzag when dequantizing
+static int stbi__jpeg_decode_block_prog_ac(stbi__jpeg *j, short data[64], stbi__huffman *hac, stbi__int16 *fac)
+{
+   // Decode one block's AC coefficients in the band spec_start..spec_end of a progressive scan
+   // (first pass or refinement). Returns 1 on success, or the stbi__err() result for a corrupt stream.
+   int k;
+   if (j->spec_start == 0) return stbi__err("can't merge dc and ac", "Corrupt JPEG");
+   if (j->succ_high == 0) {
+      int shift = j->succ_low;
+      if (j->eob_run) {
+         --j->eob_run;
+         return 1;
+      }
+      k = j->spec_start;
+      do {
+         unsigned int zig;
+         int c,r,s;
+         if (j->code_bits < 16) stbi__grow_buffer_unsafe(j);
+         c = (j->code_buffer >> (32 - FAST_BITS)) & ((1 << FAST_BITS)-1);
+         r = fac[c];
+         if (r) { // fast-AC path
+            k += (r >> 4) & 15; // run
+            s = r & 15; // combined length
+            if (s > j->code_bits) return stbi__err("bad huffman code", "Combined length longer than code bits available");
+            j->code_buffer <<= s;
+            j->code_bits -= s;
+            zig = stbi__jpeg_dezigzag[k++];
+            data[zig] = (short) ((r >> 8) * (1 << shift));
+         } else {
+            int rs = stbi__jpeg_huff_decode(j, hac);
+            if (rs < 0) return stbi__err("bad huffman code","Corrupt JPEG");
+            s = rs & 15;
+            r = rs >> 4;
+            if (s == 0) {
+               if (r < 15) {
+                  j->eob_run = (1 << r);
+                  if (r)
+                     j->eob_run += stbi__jpeg_get_bits(j, r);
+                  --j->eob_run;
+                  break;
+               }
+               k += 16;
+            } else {
+               k += r;
+               zig = stbi__jpeg_dezigzag[k++];
+               data[zig] = (short) (stbi__extend_receive(j,s) * (1 << shift));
+            }
+         }
+      } while (k <= j->spec_end);
+   } else {
+      // refinement scan for these AC coefficients
+
+      short bit = (short) (1 << j->succ_low);
+
+      if (j->eob_run) {
+         --j->eob_run;
+         for (k = j->spec_start; k <= j->spec_end; ++k) {
+            short *p = &data[stbi__jpeg_dezigzag[k]];
+            if (*p != 0)
+               if (stbi__jpeg_get_bit(j))
+                  if ((*p & bit)==0) {
+                     if (*p > 0)
+                        *p += bit;
+                     else
+                        *p -= bit;
+                  }
+         }
+      } else {
+         k = j->spec_start;
+         do {
+            int r,s;
+            int rs = stbi__jpeg_huff_decode(j, hac); // @OPTIMIZE see if we can use the fast path here, advance-by-r is so slow, eh
+            if (rs < 0) return stbi__err("bad huffman code","Corrupt JPEG");
+            s = rs & 15;
+            r = rs >> 4;
+            if (s == 0) {
+               if (r < 15) {
+                  j->eob_run = (1 << r) - 1;
+                  if (r)
+                     j->eob_run += stbi__jpeg_get_bits(j, r);
+                  r = 64; // force end of block
+               } else {
+                  // r=15 s=0 should write 16 0s, so we just do
+                  // a run of 15 0s and then write s (which is 0),
+                  // so we don't have to do anything special here
+               }
+            } else {
+               if (s != 1) return stbi__err("bad huffman code", "Corrupt JPEG");
+               // sign bit
+               if (stbi__jpeg_get_bit(j))
+                  s = bit;
+               else
+                  s = -bit;
+            }
+
+            // advance by r
+            while (k <= j->spec_end) {
+               short *p = &data[stbi__jpeg_dezigzag[k++]];
+               if (*p != 0) {
+                  if (stbi__jpeg_get_bit(j))
+                     if ((*p & bit)==0) {
+                        if (*p > 0)
+                           *p += bit;
+                        else
+                           *p -= bit;
+                     }
+               } else {
+                  if (r == 0) {
+                     *p = (short) s;
+                     break;
+                  }
+                  --r;
+               }
+            }
+         } while (k <= j->spec_end);
+      }
+   }
+   return 1;
+}
+
+// take a -128..127 value and stbi__clamp it and convert to 0..255
+stbi_inline static stbi_uc stbi__clamp(int x)
+{
+   // Saturate x to the range 0..255.
+   // A single unsigned comparison recognises the in-range case, because a
+   // negative x turns into a value above 255 when viewed as unsigned.
+   if ((unsigned int) x <= 255)
+      return (stbi_uc) x;
+   return (x < 0) ? 0 : 255;
+}
+
+#define stbi__f2f(x)  ((int) (((x) * 4096 + 0.5)))
+#define stbi__fsh(x)  ((x) * 4096)
+
+// one 1-D 8-point IDCT pass, derived from jidctint -- DCT_ISLOW; declares its own locals and leaves x0..x3 and t0..t3 for the caller to combine
+#define STBI__IDCT_1D(s0,s1,s2,s3,s4,s5,s6,s7) \
+   int t0,t1,t2,t3,p1,p2,p3,p4,p5,x0,x1,x2,x3; \
+   p2 = s2;                                    \
+   p3 = s6;                                    \
+   p1 = (p2+p3) * stbi__f2f(0.5411961f);       \
+   t2 = p1 + p3*stbi__f2f(-1.847759065f);      \
+   t3 = p1 + p2*stbi__f2f( 0.765366865f);      \
+   p2 = s0;                                    \
+   p3 = s4;                                    \
+   t0 = stbi__fsh(p2+p3);                      \
+   t1 = stbi__fsh(p2-p3);                      \
+   x0 = t0+t3;                                 \
+   x3 = t0-t3;                                 \
+   x1 = t1+t2;                                 \
+   x2 = t1-t2;                                 \
+   t0 = s7;                                    \
+   t1 = s5;                                    \
+   t2 = s3;                                    \
+   t3 = s1;                                    \
+   p3 = t0+t2;                                 \
+   p4 = t1+t3;                                 \
+   p1 = t0+t3;                                 \
+   p2 = t1+t2;                                 \
+   p5 = (p3+p4)*stbi__f2f( 1.175875602f);      \
+   t0 = t0*stbi__f2f( 0.298631336f);           \
+   t1 = t1*stbi__f2f( 2.053119869f);           \
+   t2 = t2*stbi__f2f( 3.072711026f);           \
+   t3 = t3*stbi__f2f( 1.501321110f);           \
+   p1 = p5 + p1*stbi__f2f(-0.899976223f);      \
+   p2 = p5 + p2*stbi__f2f(-2.562915447f);      \
+   p3 = p3*stbi__f2f(-1.961570560f);           \
+   p4 = p4*stbi__f2f(-0.390180644f);           \
+   t3 += p1+p4;                                \
+   t2 += p2+p3;                                \
+   t1 += p2+p4;                                \
+   t0 += p1+p3;
+
+static void stbi__idct_block(stbi_uc *out, int out_stride, short data[64])
+{
+   int i,val[64],*v=val;
+   stbi_uc *o;
+   short *d = data;
+   // 2-D inverse DCT of the 64 coefficients in data; writes 8 rows of 8 clamped bytes to out, rows out_stride bytes apart
+   // columns
+   for (i=0; i < 8; ++i,++d, ++v) {
+      // if all zeroes, shortcut -- this avoids dequantizing 0s and IDCTing
+      if (d[ 8]==0 && d[16]==0 && d[24]==0 && d[32]==0
+           && d[40]==0 && d[48]==0 && d[56]==0) {
+         //    no shortcut                 0     seconds
+         //    (1|2|3|4|5|6|7)==0          0     seconds
+         //    all separate               -0.047 seconds
+         //    1 && 2|3 && 4|5 && 6|7:    -0.047 seconds
+         int dcterm = d[0]*4;
+         v[0] = v[8] = v[16] = v[24] = v[32] = v[40] = v[48] = v[56] = dcterm;
+      } else {
+         STBI__IDCT_1D(d[ 0],d[ 8],d[16],d[24],d[32],d[40],d[48],d[56])
+         // constants scaled things up by 1<<12; let's bring them back
+         // down, but keep 2 extra bits of precision
+         x0 += 512; x1 += 512; x2 += 512; x3 += 512;
+         v[ 0] = (x0+t3) >> 10;
+         v[56] = (x0-t3) >> 10;
+         v[ 8] = (x1+t2) >> 10;
+         v[48] = (x1-t2) >> 10;
+         v[16] = (x2+t1) >> 10;
+         v[40] = (x2-t1) >> 10;
+         v[24] = (x3+t0) >> 10;
+         v[32] = (x3-t0) >> 10;
+      }
+   }
+   // rows: second 1-D pass over the intermediate values in val, producing the output bytes
+   for (i=0, v=val, o=out; i < 8; ++i,v+=8,o+=out_stride) {
+      // no fast case since the first 1D IDCT spread components out
+      STBI__IDCT_1D(v[0],v[1],v[2],v[3],v[4],v[5],v[6],v[7])
+      // constants scaled things up by 1<<12, plus we had 1<<2 from first
+      // loop, plus horizontal and vertical each scale by sqrt(8) so together
+      // we've got an extra 1<<3, so 1<<17 total we need to remove.
+      // so we want to round that, which means adding 0.5 * 1<<17,
+      // aka 65536. Also, we'll end up with -128 to 127 that we want
+      // to encode as 0..255 by adding 128, so we'll add that before the shift
+      x0 += 65536 + (128<<17);
+      x1 += 65536 + (128<<17);
+      x2 += 65536 + (128<<17);
+      x3 += 65536 + (128<<17);
+      // tried computing the shifts into temps, or'ing the temps to see
+      // if any were out of range, but that was slower
+      o[0] = stbi__clamp((x0+t3) >> 17);
+      o[7] = stbi__clamp((x0-t3) >> 17);
+      o[1] = stbi__clamp((x1+t2) >> 17);
+      o[6] = stbi__clamp((x1-t2) >> 17);
+      o[2] = stbi__clamp((x2+t1) >> 17);
+      o[5] = stbi__clamp((x2-t1) >> 17);
+      o[3] = stbi__clamp((x3+t0) >> 17);
+      o[4] = stbi__clamp((x3-t0) >> 17);
+   }
+}
+
+#ifdef STBI_SSE2
+// sse2 integer IDCT: transforms the 64 coefficients in data[] and writes the 8x8
+// block of bytes to out, out_stride bytes between rows. not the fastest possible
+// implementation, but bit-identical to the generic C version so it's fully "transparent".
+static void stbi__idct_simd(stbi_uc *out, int out_stride, short data[64])
+{
+   // This is constructed to match our regular (generic) integer IDCT exactly.
+   __m128i row0, row1, row2, row3, row4, row5, row6, row7;
+   __m128i tmp;
+
+   // dot product constant: even elems=x, odd elems=y
+   #define dct_const(x,y)  _mm_setr_epi16((x),(y),(x),(y),(x),(y),(x),(y))
+
+   // out(0) = c0[even]*x + c0[odd]*y   (c0, x, y 16-bit, out 32-bit)
+   // out(1) = c1[even]*x + c1[odd]*y
+   #define dct_rot(out0,out1, x,y,c0,c1) \
+      __m128i c0##lo = _mm_unpacklo_epi16((x),(y)); \
+      __m128i c0##hi = _mm_unpackhi_epi16((x),(y)); \
+      __m128i out0##_l = _mm_madd_epi16(c0##lo, c0); \
+      __m128i out0##_h = _mm_madd_epi16(c0##hi, c0); \
+      __m128i out1##_l = _mm_madd_epi16(c0##lo, c1); \
+      __m128i out1##_h = _mm_madd_epi16(c0##hi, c1)
+
+   // out = in << 12  (in 16-bit, out 32-bit): the unpack puts "in" in the top 16 bits, the arithmetic shift by 4 sign-extends
+   #define dct_widen(out, in) \
+      __m128i out##_l = _mm_srai_epi32(_mm_unpacklo_epi16(_mm_setzero_si128(), (in)), 4); \
+      __m128i out##_h = _mm_srai_epi32(_mm_unpackhi_epi16(_mm_setzero_si128(), (in)), 4)
+
+   // wide add
+   #define dct_wadd(out, a, b) \
+      __m128i out##_l = _mm_add_epi32(a##_l, b##_l); \
+      __m128i out##_h = _mm_add_epi32(a##_h, b##_h)
+
+   // wide sub
+   #define dct_wsub(out, a, b) \
+      __m128i out##_l = _mm_sub_epi32(a##_l, b##_l); \
+      __m128i out##_h = _mm_sub_epi32(a##_h, b##_h)
+
+   // butterfly a/b, add bias, then shift by "s" and pack (to 16-bit, with signed saturation)
+   #define dct_bfly32o(out0, out1, a,b,bias,s) \
+      { \
+         __m128i abiased_l = _mm_add_epi32(a##_l, bias); \
+         __m128i abiased_h = _mm_add_epi32(a##_h, bias); \
+         dct_wadd(sum, abiased, b); \
+         dct_wsub(dif, abiased, b); \
+         out0 = _mm_packs_epi32(_mm_srai_epi32(sum_l, s), _mm_srai_epi32(sum_h, s)); \
+         out1 = _mm_packs_epi32(_mm_srai_epi32(dif_l, s), _mm_srai_epi32(dif_h, s)); \
+      }
+
+   // 8-bit interleave step (for transposes)
+   #define dct_interleave8(a, b) \
+      tmp = a; \
+      a = _mm_unpacklo_epi8(a, b); \
+      b = _mm_unpackhi_epi8(tmp, b)
+
+   // 16-bit interleave step (for transposes)
+   #define dct_interleave16(a, b) \
+      tmp = a; \
+      a = _mm_unpacklo_epi16(a, b); \
+      b = _mm_unpackhi_epi16(tmp, b)
+   // one 1-D IDCT pass over row0..row7 (8 lanes at a time); results are written back into row0..row7
+   #define dct_pass(bias,shift) \
+      { \
+         /* even part */ \
+         dct_rot(t2e,t3e, row2,row6, rot0_0,rot0_1); \
+         __m128i sum04 = _mm_add_epi16(row0, row4); \
+         __m128i dif04 = _mm_sub_epi16(row0, row4); \
+         dct_widen(t0e, sum04); \
+         dct_widen(t1e, dif04); \
+         dct_wadd(x0, t0e, t3e); \
+         dct_wsub(x3, t0e, t3e); \
+         dct_wadd(x1, t1e, t2e); \
+         dct_wsub(x2, t1e, t2e); \
+         /* odd part */ \
+         dct_rot(y0o,y2o, row7,row3, rot2_0,rot2_1); \
+         dct_rot(y1o,y3o, row5,row1, rot3_0,rot3_1); \
+         __m128i sum17 = _mm_add_epi16(row1, row7); \
+         __m128i sum35 = _mm_add_epi16(row3, row5); \
+         dct_rot(y4o,y5o, sum17,sum35, rot1_0,rot1_1); \
+         dct_wadd(x4, y0o, y4o); \
+         dct_wadd(x5, y1o, y5o); \
+         dct_wadd(x6, y2o, y5o); \
+         dct_wadd(x7, y3o, y4o); \
+         dct_bfly32o(row0,row7, x0,x7,bias,shift); \
+         dct_bfly32o(row1,row6, x1,x6,bias,shift); \
+         dct_bfly32o(row2,row5, x2,x5,bias,shift); \
+         dct_bfly32o(row3,row4, x3,x4,bias,shift); \
+      }
+
+   __m128i rot0_0 = dct_const(stbi__f2f(0.5411961f), stbi__f2f(0.5411961f) + stbi__f2f(-1.847759065f));
+   __m128i rot0_1 = dct_const(stbi__f2f(0.5411961f) + stbi__f2f( 0.765366865f), stbi__f2f(0.5411961f));
+   __m128i rot1_0 = dct_const(stbi__f2f(1.175875602f) + stbi__f2f(-0.899976223f), stbi__f2f(1.175875602f));
+   __m128i rot1_1 = dct_const(stbi__f2f(1.175875602f), stbi__f2f(1.175875602f) + stbi__f2f(-2.562915447f));
+   __m128i rot2_0 = dct_const(stbi__f2f(-1.961570560f) + stbi__f2f( 0.298631336f), stbi__f2f(-1.961570560f));
+   __m128i rot2_1 = dct_const(stbi__f2f(-1.961570560f), stbi__f2f(-1.961570560f) + stbi__f2f( 3.072711026f));
+   __m128i rot3_0 = dct_const(stbi__f2f(-0.390180644f) + stbi__f2f( 2.053119869f), stbi__f2f(-0.390180644f));
+   __m128i rot3_1 = dct_const(stbi__f2f(-0.390180644f), stbi__f2f(-0.390180644f) + stbi__f2f( 1.501321110f));
+
+   // rounding biases in column/row passes, see stbi__idct_block for explanation.
+   __m128i bias_0 = _mm_set1_epi32(512);
+   __m128i bias_1 = _mm_set1_epi32(65536 + (128<<17));
+
+   // load the eight rows of coefficients (aligned loads, so data must be 16-byte aligned)
+   row0 = _mm_load_si128((const __m128i *) (data + 0*8));
+   row1 = _mm_load_si128((const __m128i *) (data + 1*8));
+   row2 = _mm_load_si128((const __m128i *) (data + 2*8));
+   row3 = _mm_load_si128((const __m128i *) (data + 3*8));
+   row4 = _mm_load_si128((const __m128i *) (data + 4*8));
+   row5 = _mm_load_si128((const __m128i *) (data + 5*8));
+   row6 = _mm_load_si128((const __m128i *) (data + 6*8));
+   row7 = _mm_load_si128((const __m128i *) (data + 7*8));
+
+   // column pass
+   dct_pass(bias_0, 10);
+
+   {
+      // 16bit 8x8 transpose pass 1
+      dct_interleave16(row0, row4);
+      dct_interleave16(row1, row5);
+      dct_interleave16(row2, row6);
+      dct_interleave16(row3, row7);
+
+      // transpose pass 2
+      dct_interleave16(row0, row2);
+      dct_interleave16(row1, row3);
+      dct_interleave16(row4, row6);
+      dct_interleave16(row5, row7);
+
+      // transpose pass 3
+      dct_interleave16(row0, row1);
+      dct_interleave16(row2, row3);
+      dct_interleave16(row4, row5);
+      dct_interleave16(row6, row7);
+   }
+
+   // row pass
+   dct_pass(bias_1, 17);
+
+   {
+      // pack to unsigned 8-bit with saturation (this is what clamps the result to 0..255)
+      __m128i p0 = _mm_packus_epi16(row0, row1); // a0a1a2a3...a7b0b1b2b3...b7
+      __m128i p1 = _mm_packus_epi16(row2, row3);
+      __m128i p2 = _mm_packus_epi16(row4, row5);
+      __m128i p3 = _mm_packus_epi16(row6, row7);
+
+      // 8bit 8x8 transpose pass 1
+      dct_interleave8(p0, p2); // a0e0a1e1...
+      dct_interleave8(p1, p3); // c0g0c1g1...
+
+      // transpose pass 2
+      dct_interleave8(p0, p1); // a0c0e0g0...
+      dct_interleave8(p2, p3); // b0d0f0h0...
+
+      // transpose pass 3
+      dct_interleave8(p0, p2); // a0b0c0d0...
+      dct_interleave8(p1, p3); // a4b4c4d4...
+
+      // store: each register holds two 8-byte output rows; shuffle 0x4e swaps the 64-bit halves to reach the second one
+      _mm_storel_epi64((__m128i *) out, p0); out += out_stride;
+      _mm_storel_epi64((__m128i *) out, _mm_shuffle_epi32(p0, 0x4e)); out += out_stride;
+      _mm_storel_epi64((__m128i *) out, p2); out += out_stride;
+      _mm_storel_epi64((__m128i *) out, _mm_shuffle_epi32(p2, 0x4e)); out += out_stride;
+      _mm_storel_epi64((__m128i *) out, p1); out += out_stride;
+      _mm_storel_epi64((__m128i *) out, _mm_shuffle_epi32(p1, 0x4e)); out += out_stride;
+      _mm_storel_epi64((__m128i *) out, p3); out += out_stride;
+      _mm_storel_epi64((__m128i *) out, _mm_shuffle_epi32(p3, 0x4e));
+   }
+
+#undef dct_const
+#undef dct_rot
+#undef dct_widen
+#undef dct_wadd
+#undef dct_wsub
+#undef dct_bfly32o
+#undef dct_interleave8
+#undef dct_interleave16
+#undef dct_pass
+}
+
+#endif // STBI_SSE2
+
+#ifdef STBI_NEON
+
+// NEON integer IDCT: transforms the 64 coefficients in data[] and writes 8 rows of
+// 8 bytes to out, out_stride bytes apart. should produce bit-identical results to the generic C version.
+static void stbi__idct_simd(stbi_uc *out, int out_stride, short data[64])
+{
+   int16x8_t row0, row1, row2, row3, row4, row5, row6, row7;
+
+   int16x4_t rot0_0 = vdup_n_s16(stbi__f2f(0.5411961f));
+   int16x4_t rot0_1 = vdup_n_s16(stbi__f2f(-1.847759065f));
+   int16x4_t rot0_2 = vdup_n_s16(stbi__f2f( 0.765366865f));
+   int16x4_t rot1_0 = vdup_n_s16(stbi__f2f( 1.175875602f));
+   int16x4_t rot1_1 = vdup_n_s16(stbi__f2f(-0.899976223f));
+   int16x4_t rot1_2 = vdup_n_s16(stbi__f2f(-2.562915447f));
+   int16x4_t rot2_0 = vdup_n_s16(stbi__f2f(-1.961570560f));
+   int16x4_t rot2_1 = vdup_n_s16(stbi__f2f(-0.390180644f));
+   int16x4_t rot3_0 = vdup_n_s16(stbi__f2f( 0.298631336f));
+   int16x4_t rot3_1 = vdup_n_s16(stbi__f2f( 2.053119869f));
+   int16x4_t rot3_2 = vdup_n_s16(stbi__f2f( 3.072711026f));
+   int16x4_t rot3_3 = vdup_n_s16(stbi__f2f( 1.501321110f));
+
+#define dct_long_mul(out, inq, coeff) \
+   int32x4_t out##_l = vmull_s16(vget_low_s16(inq), coeff); \
+   int32x4_t out##_h = vmull_s16(vget_high_s16(inq), coeff)
+
+#define dct_long_mac(out, acc, inq, coeff) \
+   int32x4_t out##_l = vmlal_s16(acc##_l, vget_low_s16(inq), coeff); \
+   int32x4_t out##_h = vmlal_s16(acc##_h, vget_high_s16(inq), coeff)
+
+#define dct_widen(out, inq) \
+   int32x4_t out##_l = vshll_n_s16(vget_low_s16(inq), 12); \
+   int32x4_t out##_h = vshll_n_s16(vget_high_s16(inq), 12)
+
+// wide add
+#define dct_wadd(out, a, b) \
+   int32x4_t out##_l = vaddq_s32(a##_l, b##_l); \
+   int32x4_t out##_h = vaddq_s32(a##_h, b##_h)
+
+// wide sub
+#define dct_wsub(out, a, b) \
+   int32x4_t out##_l = vsubq_s32(a##_l, b##_l); \
+   int32x4_t out##_h = vsubq_s32(a##_h, b##_h)
+
+// butterfly a/b, then shift using "shiftop" by "s" and pack
+#define dct_bfly32o(out0,out1, a,b,shiftop,s) \
+   { \
+      dct_wadd(sum, a, b); \
+      dct_wsub(dif, a, b); \
+      out0 = vcombine_s16(shiftop(sum_l, s), shiftop(sum_h, s)); \
+      out1 = vcombine_s16(shiftop(dif_l, s), shiftop(dif_h, s)); \
+   }
+
+#define dct_pass(shiftop, shift) \
+   { \
+      /* even part */ \
+      int16x8_t sum26 = vaddq_s16(row2, row6); \
+      dct_long_mul(p1e, sum26, rot0_0); \
+      dct_long_mac(t2e, p1e, row6, rot0_1); \
+      dct_long_mac(t3e, p1e, row2, rot0_2); \
+      int16x8_t sum04 = vaddq_s16(row0, row4); \
+      int16x8_t dif04 = vsubq_s16(row0, row4); \
+      dct_widen(t0e, sum04); \
+      dct_widen(t1e, dif04); \
+      dct_wadd(x0, t0e, t3e); \
+      dct_wsub(x3, t0e, t3e); \
+      dct_wadd(x1, t1e, t2e); \
+      dct_wsub(x2, t1e, t2e); \
+      /* odd part */ \
+      int16x8_t sum15 = vaddq_s16(row1, row5); \
+      int16x8_t sum17 = vaddq_s16(row1, row7); \
+      int16x8_t sum35 = vaddq_s16(row3, row5); \
+      int16x8_t sum37 = vaddq_s16(row3, row7); \
+      int16x8_t sumodd = vaddq_s16(sum17, sum35); \
+      dct_long_mul(p5o, sumodd, rot1_0); \
+      dct_long_mac(p1o, p5o, sum17, rot1_1); \
+      dct_long_mac(p2o, p5o, sum35, rot1_2); \
+      dct_long_mul(p3o, sum37, rot2_0); \
+      dct_long_mul(p4o, sum15, rot2_1); \
+      dct_wadd(sump13o, p1o, p3o); \
+      dct_wadd(sump24o, p2o, p4o); \
+      dct_wadd(sump23o, p2o, p3o); \
+      dct_wadd(sump14o, p1o, p4o); \
+      dct_long_mac(x4, sump13o, row7, rot3_0); \
+      dct_long_mac(x5, sump24o, row5, rot3_1); \
+      dct_long_mac(x6, sump23o, row3, rot3_2); \
+      dct_long_mac(x7, sump14o, row1, rot3_3); \
+      dct_bfly32o(row0,row7, x0,x7,shiftop,shift); \
+      dct_bfly32o(row1,row6, x1,x6,shiftop,shift); \
+      dct_bfly32o(row2,row5, x2,x5,shiftop,shift); \
+      dct_bfly32o(row3,row4, x3,x4,shiftop,shift); \
+   }
+
+   // load the eight rows of coefficients
+   row0 = vld1q_s16(data + 0*8);
+   row1 = vld1q_s16(data + 1*8);
+   row2 = vld1q_s16(data + 2*8);
+   row3 = vld1q_s16(data + 3*8);
+   row4 = vld1q_s16(data + 4*8);
+   row5 = vld1q_s16(data + 5*8);
+   row6 = vld1q_s16(data + 6*8);
+   row7 = vld1q_s16(data + 7*8);
+
+   // add DC bias: 1024 goes into lane 0 of row0 only (the DC coefficient), all other lanes get 0
+   row0 = vaddq_s16(row0, vsetq_lane_s16(1024, vdupq_n_s16(0), 0));
+
+   // column pass (rounding narrowing shift by 10)
+   dct_pass(vrshrn_n_s32, 10);
+
+   // 16bit 8x8 transpose
+   {
+// these three map to a single VTRN.16, VTRN.32, and VSWP, respectively.
+// whether compilers actually get this is another story, sadly.
+#define dct_trn16(x, y) { int16x8x2_t t = vtrnq_s16(x, y); x = t.val[0]; y = t.val[1]; }
+#define dct_trn32(x, y) { int32x4x2_t t = vtrnq_s32(vreinterpretq_s32_s16(x), vreinterpretq_s32_s16(y)); x = vreinterpretq_s16_s32(t.val[0]); y = vreinterpretq_s16_s32(t.val[1]); }
+#define dct_trn64(x, y) { int16x8_t x0 = x; int16x8_t y0 = y; x = vcombine_s16(vget_low_s16(x0), vget_low_s16(y0)); y = vcombine_s16(vget_high_s16(x0), vget_high_s16(y0)); }
+
+      // pass 1
+      dct_trn16(row0, row1); // a0b0a2b2a4b4a6b6
+      dct_trn16(row2, row3);
+      dct_trn16(row4, row5);
+      dct_trn16(row6, row7);
+
+      // pass 2
+      dct_trn32(row0, row2); // a0b0c0d0a4b4c4d4
+      dct_trn32(row1, row3);
+      dct_trn32(row4, row6);
+      dct_trn32(row5, row7);
+
+      // pass 3
+      dct_trn64(row0, row4); // a0b0c0d0e0f0g0h0
+      dct_trn64(row1, row5);
+      dct_trn64(row2, row6);
+      dct_trn64(row3, row7);
+
+#undef dct_trn16
+#undef dct_trn32
+#undef dct_trn64
+   }
+
+   // row pass
+   // vrshrn_n_s32 only supports shifts up to 16, we need
+   // 17. so do a non-rounding shift of 16 first then follow
+   // up with a rounding shift by 1.
+   dct_pass(vshrn_n_s32, 16);
+
+   {
+      // pack and round: the rounding shift by 1 completes the shift by 17, and the unsigned saturating narrow clamps to 0..255
+      uint8x8_t p0 = vqrshrun_n_s16(row0, 1);
+      uint8x8_t p1 = vqrshrun_n_s16(row1, 1);
+      uint8x8_t p2 = vqrshrun_n_s16(row2, 1);
+      uint8x8_t p3 = vqrshrun_n_s16(row3, 1);
+      uint8x8_t p4 = vqrshrun_n_s16(row4, 1);
+      uint8x8_t p5 = vqrshrun_n_s16(row5, 1);
+      uint8x8_t p6 = vqrshrun_n_s16(row6, 1);
+      uint8x8_t p7 = vqrshrun_n_s16(row7, 1);
+
+      // again, these can translate into one instruction, but often don't.
+#define dct_trn8_8(x, y) { uint8x8x2_t t = vtrn_u8(x, y); x = t.val[0]; y = t.val[1]; }
+#define dct_trn8_16(x, y) { uint16x4x2_t t = vtrn_u16(vreinterpret_u16_u8(x), vreinterpret_u16_u8(y)); x = vreinterpret_u8_u16(t.val[0]); y = vreinterpret_u8_u16(t.val[1]); }
+#define dct_trn8_32(x, y) { uint32x2x2_t t = vtrn_u32(vreinterpret_u32_u8(x), vreinterpret_u32_u8(y)); x = vreinterpret_u8_u32(t.val[0]); y = vreinterpret_u8_u32(t.val[1]); }
+
+      // sadly can't use interleaved stores here since we only write
+      // 8 bytes to each scan line!
+
+      // 8x8 8-bit transpose pass 1
+      dct_trn8_8(p0, p1);
+      dct_trn8_8(p2, p3);
+      dct_trn8_8(p4, p5);
+      dct_trn8_8(p6, p7);
+
+      // pass 2
+      dct_trn8_16(p0, p2);
+      dct_trn8_16(p1, p3);
+      dct_trn8_16(p4, p6);
+      dct_trn8_16(p5, p7);
+
+      // pass 3
+      dct_trn8_32(p0, p4);
+      dct_trn8_32(p1, p5);
+      dct_trn8_32(p2, p6);
+      dct_trn8_32(p3, p7);
+
+      // store one 8-byte row per output scan line
+      vst1_u8(out, p0); out += out_stride;
+      vst1_u8(out, p1); out += out_stride;
+      vst1_u8(out, p2); out += out_stride;
+      vst1_u8(out, p3); out += out_stride;
+      vst1_u8(out, p4); out += out_stride;
+      vst1_u8(out, p5); out += out_stride;
+      vst1_u8(out, p6); out += out_stride;
+      vst1_u8(out, p7);
+
+#undef dct_trn8_8
+#undef dct_trn8_16
+#undef dct_trn8_32
+   }
+
+#undef dct_long_mul
+#undef dct_long_mac
+#undef dct_widen
+#undef dct_wadd
+#undef dct_wsub
+#undef dct_bfly32o
+#undef dct_pass
+}
+
+#endif // STBI_NEON
+
+#define STBI__MARKER_none  0xff
+// Return the next JPEG marker code. A marker left pending in j->marker is
+// handed back (and cleared) first; otherwise one is read from the stream.
+// STBI__MARKER_none (0xff, never a valid marker) means no marker was found.
+static stbi_uc stbi__get_marker(stbi__jpeg *j)
+{
+   stbi_uc code = j->marker;
+   if (code != STBI__MARKER_none) { j->marker = STBI__MARKER_none; return code; }
+   // a marker has to be introduced by a 0xff byte
+   if (stbi__get8(j->s) != 0xff) return STBI__MARKER_none;
+   // skip any further 0xff fill bytes; the first other byte is the marker code
+   do { code = stbi__get8(j->s); } while (code == 0xff);
+   return code;
+}
+
+// in each scan, we'll have scan_n components, and the order
+// of the components is specified by order[]
+#define STBI__RESTART(x)     ((x) >= 0xd0 && (x) <= 0xd7)
+
+// Reset the entropy decoder state and the DC predictors of all four components;
+// used at the start of a scan and again after each restart interval.
+static void stbi__jpeg_reset(stbi__jpeg *j)
+{
+   int c;
+   for (c = 0; c < 4; ++c) j->img_comp[c].dc_pred = 0;
+   j->code_buffer = 0;
+   j->code_bits = 0;
+   j->nomore = 0;
+   j->eob_run = 0;
+   j->marker = STBI__MARKER_none;
+   // no restart_interval: count down from 0x7fffffff MCUs instead; plenty, since we don't even allow 1<<30 pixels
+   j->todo = j->restart_interval ? j->restart_interval : 0x7fffffff;
+}
+// decode the entropy-coded data of the current scan (uses the scan_n/order[]/spec_start fields of z); returns 0 if a block fails to decode, 1 otherwise -- including when the data stops early
+static int stbi__parse_entropy_coded_data(stbi__jpeg *z)
+{
+   stbi__jpeg_reset(z); // every scan starts with clean decoder state and zeroed DC predictors
+   if (!z->progressive) { // baseline: each block is decoded and run through the idct right away
+      if (z->scan_n == 1) {
+         int i,j;
+         STBI_SIMD_ALIGN(short, data[64]);
+         int n = z->order[0];
+         // non-interleaved data, we just need to process one block at a time,
+         // in trivial scanline order
+         // number of blocks to do just depends on how many actual "pixels" this
+         // component has, independent of interleaved MCU blocking and such
+         int w = (z->img_comp[n].x+7) >> 3;
+         int h = (z->img_comp[n].y+7) >> 3;
+         for (j=0; j < h; ++j) {
+            for (i=0; i < w; ++i) {
+               int ha = z->img_comp[n].ha;
+               if (!stbi__jpeg_decode_block(z, data, z->huff_dc+z->img_comp[n].hd, z->huff_ac+ha, z->fast_ac[ha], n, z->dequant[z->img_comp[n].tq])) return 0;
+               z->idct_block_kernel(z->img_comp[n].data+z->img_comp[n].w2*j*8+i*8, z->img_comp[n].w2, data);
+               // every data block is an MCU, so countdown the restart interval
+               if (--z->todo <= 0) {
+                  if (z->code_bits < 24) stbi__grow_buffer_unsafe(z);
+                  // if it's NOT a restart, then just bail, so we get corrupt data
+                  // rather than no data
+                  if (!STBI__RESTART(z->marker)) return 1;
+                  stbi__jpeg_reset(z);
+               }
+            }
+         }
+         return 1;
+      } else { // interleaved
+         int i,j,k,x,y;
+         STBI_SIMD_ALIGN(short, data[64]);
+         for (j=0; j < z->img_mcu_y; ++j) {
+            for (i=0; i < z->img_mcu_x; ++i) {
+               // scan an interleaved mcu... process scan_n components in order
+               for (k=0; k < z->scan_n; ++k) {
+                  int n = z->order[k];
+                  // scan out an mcu's worth of this component; that's just determined
+                  // by the basic H and V specified for the component
+                  for (y=0; y < z->img_comp[n].v; ++y) {
+                     for (x=0; x < z->img_comp[n].h; ++x) {
+                        int x2 = (i*z->img_comp[n].h + x)*8;
+                        int y2 = (j*z->img_comp[n].v + y)*8;
+                        int ha = z->img_comp[n].ha;
+                        if (!stbi__jpeg_decode_block(z, data, z->huff_dc+z->img_comp[n].hd, z->huff_ac+ha, z->fast_ac[ha], n, z->dequant[z->img_comp[n].tq])) return 0;
+                        z->idct_block_kernel(z->img_comp[n].data+z->img_comp[n].w2*y2+x2, z->img_comp[n].w2, data);
+                     }
+                  }
+               }
+               // after all interleaved components, that's an interleaved MCU,
+               // so now count down the restart interval
+               if (--z->todo <= 0) {
+                  if (z->code_bits < 24) stbi__grow_buffer_unsafe(z);
+                  if (!STBI__RESTART(z->marker)) return 1;
+                  stbi__jpeg_reset(z);
+               }
+            }
+         }
+         return 1;
+      }
+   } else { // progressive: blocks accumulate in img_comp[n].coeff; no idct is run in this function
+      if (z->scan_n == 1) {
+         int i,j;
+         int n = z->order[0];
+         // non-interleaved data, we just need to process one block at a time,
+         // in trivial scanline order
+         // number of blocks to do just depends on how many actual "pixels" this
+         // component has, independent of interleaved MCU blocking and such
+         int w = (z->img_comp[n].x+7) >> 3;
+         int h = (z->img_comp[n].y+7) >> 3;
+         for (j=0; j < h; ++j) {
+            for (i=0; i < w; ++i) {
+               short *data = z->img_comp[n].coeff + 64 * (i + j * z->img_comp[n].coeff_w);
+               if (z->spec_start == 0) {
+                  if (!stbi__jpeg_decode_block_prog_dc(z, data, &z->huff_dc[z->img_comp[n].hd], n))
+                     return 0;
+               } else {
+                  int ha = z->img_comp[n].ha;
+                  if (!stbi__jpeg_decode_block_prog_ac(z, data, &z->huff_ac[ha], z->fast_ac[ha]))
+                     return 0;
+               }
+               // every data block is an MCU, so countdown the restart interval
+               if (--z->todo <= 0) {
+                  if (z->code_bits < 24) stbi__grow_buffer_unsafe(z);
+                  if (!STBI__RESTART(z->marker)) return 1;
+                  stbi__jpeg_reset(z);
+               }
+            }
+         }
+         return 1;
+      } else { // interleaved
+         int i,j,k,x,y;
+         for (j=0; j < z->img_mcu_y; ++j) {
+            for (i=0; i < z->img_mcu_x; ++i) {
+               // scan an interleaved mcu... process scan_n components in order
+               for (k=0; k < z->scan_n; ++k) {
+                  int n = z->order[k];
+                  // scan out an mcu's worth of this component; that's just determined
+                  // by the basic H and V specified for the component
+                  for (y=0; y < z->img_comp[n].v; ++y) {
+                     for (x=0; x < z->img_comp[n].h; ++x) {
+                        int x2 = (i*z->img_comp[n].h + x);
+                        int y2 = (j*z->img_comp[n].v + y);
+                        short *data = z->img_comp[n].coeff + 64 * (x2 + y2 * z->img_comp[n].coeff_w);
+                        if (!stbi__jpeg_decode_block_prog_dc(z, data, &z->huff_dc[z->img_comp[n].hd], n)) // always the DC decoder here; spec_start is not consulted
+                           return 0;
+                     }
+                  }
+               }
+               // after all interleaved components, that's an interleaved MCU,
+               // so now count down the restart interval
+               if (--z->todo <= 0) {
+                  if (z->code_bits < 24) stbi__grow_buffer_unsafe(z);
+                  if (!STBI__RESTART(z->marker)) return 1;
+                  stbi__jpeg_reset(z);
+               }
+            }
+         }
+         return 1;
+      }
+   }
+}
+
+static void stbi__jpeg_dequantize(short *data, stbi__uint16 *dequant)
+{
+   // scale each of the block's 64 coefficients, in place, by the matching table entry
+   int k = 64;
+   while (k--) data[k] *= dequant[k];
+}
+
+// For progressive images, dequantize and inverse-DCT every stored coefficient block
+// into its component's pixel plane; does nothing for non-progressive images.
+static void stbi__jpeg_finish(stbi__jpeg *z)
+{
+   int c, bx, by;
+   if (!z->progressive) return;
+   for (c = 0; c < z->s->img_n; ++c) {
+      int blocks_w = (z->img_comp[c].x + 7) >> 3;
+      int blocks_h = (z->img_comp[c].y + 7) >> 3;
+      for (by = 0; by < blocks_h; ++by) {
+         for (bx = 0; bx < blocks_w; ++bx) {
+            short *block = z->img_comp[c].coeff + 64 * (bx + by * z->img_comp[c].coeff_w);
+            stbi__jpeg_dequantize(block, z->dequant[z->img_comp[c].tq]);
+            z->idct_block_kernel(z->img_comp[c].data + z->img_comp[c].w2*by*8 + bx*8, z->img_comp[c].w2, block);
+         }
+      }
+   }
+}
+
+// Handle one marker segment that may precede a frame or scan header: DRI, DQT,
+// DHT, and APPn/COM (skipped, apart from noting the JFIF and Adobe tags).
+// Returns 1 if the segment was consumed; a missing, unknown or malformed one fails.
+static int stbi__process_marker(stbi__jpeg *z, int m)
+{
+   int L;
+   switch (m) {
+      case STBI__MARKER_none: // no marker found
+         return stbi__err("expected marker","Corrupt JPEG");
+
+      case 0xDD: // DRI - specify restart interval
+         if (stbi__get16be(z->s) != 4) return stbi__err("bad DRI len","Corrupt JPEG");
+         z->restart_interval = stbi__get16be(z->s);
+         return 1;
+
+      case 0xDB: // DQT - define quantization table
+         L = stbi__get16be(z->s)-2;
+         while (L > 0) {
+            int q = stbi__get8(z->s);
+            int p = q >> 4, sixteen = (p != 0);
+            int t = q & 15,i;
+            if (p != 0 && p != 1) return stbi__err("bad DQT type","Corrupt JPEG");
+            if (t > 3) return stbi__err("bad DQT table","Corrupt JPEG");
+
+            for (i=0; i < 64; ++i)
+               z->dequant[t][stbi__jpeg_dezigzag[i]] = (stbi__uint16)(sixteen ? stbi__get16be(z->s) : stbi__get8(z->s));
+            L -= (sixteen ? 129 : 65);
+         }
+         return L==0;
+
+      case 0xC4: // DHT - define huffman table
+         L = stbi__get16be(z->s)-2;
+         while (L > 0) {
+            stbi_uc *v;
+            int sizes[16],i,n=0;
+            int q = stbi__get8(z->s);
+            int tc = q >> 4, th = q & 15;
+            if (tc > 1 || th > 3) return stbi__err("bad DHT header","Corrupt JPEG");
+            for (i=0; i < 16; ++i) {
+               sizes[i] = stbi__get8(z->s);
+               n += sizes[i];
+            }
+            // a table can describe at most 256 symbols (the huffman values[] array holds 256);
+            // reject a larger total before anything below is built or copied past its end
+            if (n > 256) return stbi__err("bad DHT header","Corrupt JPEG");
+            L -= 17;
+            if (tc == 0) {
+               if (!stbi__build_huffman(z->huff_dc+th, sizes)) return 0;
+               v = z->huff_dc[th].values;
+            } else {
+               if (!stbi__build_huffman(z->huff_ac+th, sizes)) return 0;
+               v = z->huff_ac[th].values;
+            }
+            for (i=0; i < n; ++i)
+               v[i] = stbi__get8(z->s);
+            if (tc != 0)
+               stbi__build_fast_ac(z->fast_ac[th], z->huff_ac + th);
+            L -= n;
+         }
+         return L==0;
+   }
+
+   // check for comment block or APP blocks
+   if ((m >= 0xE0 && m <= 0xEF) || m == 0xFE) {
+      L = stbi__get16be(z->s);
+      if (L < 2) return stbi__err(m == 0xFE ? "bad COM len" : "bad APP len","Corrupt JPEG");
+      L -= 2;
+
+      if (m == 0xE0 && L >= 5) { // JFIF APP0 segment
+         static const unsigned char tag[5] = {'J','F','I','F','\0'};
+         int ok = 1;
+         int i;
+         for (i=0; i < 5; ++i)
+            if (stbi__get8(z->s) != tag[i])
+               ok = 0;
+         L -= 5;
+         if (ok)
+            z->jfif = 1;
+      } else if (m == 0xEE && L >= 12) { // Adobe APP14 segment
+         static const unsigned char tag[6] = {'A','d','o','b','e','\0'};
+         int ok = 1;
+         int i;
+         for (i=0; i < 6; ++i)
+            if (stbi__get8(z->s) != tag[i])
+               ok = 0;
+         L -= 6;
+         if (ok) {
+            stbi__get8(z->s); // version
+            stbi__get16be(z->s); // flags0
+            stbi__get16be(z->s); // flags1
+            z->app14_color_transform = stbi__get8(z->s); // color transform
+            L -= 6;
+         }
+      }
+
+      stbi__skip(z->s, L);
+      return 1;
+   }
+
+   return stbi__err("unknown marker","Corrupt JPEG");
+}
+
+// after we see SOS: parse the scan header -- how many components the scan holds,
+// which DC/AC huffman tables each one uses (z->order[] records the order they are
+// listed in), and the spectral-selection / successive-approximation parameters.
+static int stbi__process_scan_header(stbi__jpeg *z)
+{
+   int i, aa;
+   int Ls = stbi__get16be(z->s);
+   z->scan_n = stbi__get8(z->s);
+   if (z->scan_n < 1 || z->scan_n > 4 || z->scan_n > (int) z->s->img_n) return stbi__err("bad SOS component count","Corrupt JPEG");
+   if (Ls != 6+2*z->scan_n) return stbi__err("bad SOS len","Corrupt JPEG");
+   for (i=0; i < z->scan_n; ++i) {
+      int id = stbi__get8(z->s), which;
+      int q = stbi__get8(z->s);
+      for (which = 0; which < z->s->img_n; ++which)
+         if (z->img_comp[which].id == id)
+            break;
+      // no frame component has this id: report a reason like every other failure path here
+      if (which == z->s->img_n) return stbi__err("bad SOS component","Corrupt JPEG");
+      z->img_comp[which].hd = q >> 4;   if (z->img_comp[which].hd > 3) return stbi__err("bad DC huff","Corrupt JPEG");
+      z->img_comp[which].ha = q & 15;   if (z->img_comp[which].ha > 3) return stbi__err("bad AC huff","Corrupt JPEG");
+      z->order[i] = which;
+   }
+
+   z->spec_start = stbi__get8(z->s);
+   z->spec_end   = stbi__get8(z->s); // should be 63, but might be 0
+   aa = stbi__get8(z->s);
+   z->succ_high = (aa >> 4);
+   z->succ_low  = (aa & 15);
+   if (z->progressive) {
+      if (z->spec_start > 63 || z->spec_end > 63  || z->spec_start > z->spec_end || z->succ_high > 13 || z->succ_low > 13)
+         return stbi__err("bad SOS", "Corrupt JPEG");
+   } else {
+      if (z->spec_start != 0) return stbi__err("bad SOS","Corrupt JPEG");
+      if (z->succ_high != 0 || z->succ_low != 0) return stbi__err("bad SOS","Corrupt JPEG");
+      z->spec_end = 63;
+   }
+
+   return 1;
+}
+
+// Free the raw_data, raw_coeff and linebuf buffers of components 0..ncomp-1 and
+// clear the pointers to them. Returns `why` unchanged so callers can return it directly.
+static int stbi__free_jpeg_components(stbi__jpeg *z, int ncomp, int why)
+{
+   int c;
+   for (c = 0; ncomp > c; c++) {
+      if (z->img_comp[c].raw_data != NULL) {
+         STBI_FREE(z->img_comp[c].raw_data);
+         z->img_comp[c].raw_data = NULL; z->img_comp[c].data = NULL;
+      }
+      if (z->img_comp[c].raw_coeff != NULL) {
+         STBI_FREE(z->img_comp[c].raw_coeff);
+         z->img_comp[c].raw_coeff = 0; z->img_comp[c].coeff = 0;
+      }
+      if (z->img_comp[c].linebuf != NULL) {
+         STBI_FREE(z->img_comp[c].linebuf);
+         z->img_comp[c].linebuf = NULL;
+      }
+   }
+   return why;
+}
+// parse the SOF frame header: sample precision, image size, and each component's id, sampling factors and quantization table; when scan == STBI__SCAN_load it also allocates the per-component buffers. returns 1 on success
+static int stbi__process_frame_header(stbi__jpeg *z, int scan)
+{
+   stbi__context *s = z->s;
+   int Lf,p,i,q, h_max=1,v_max=1,c;
+   Lf = stbi__get16be(s);         if (Lf < 11) return stbi__err("bad SOF len","Corrupt JPEG"); // JPEG
+   p  = stbi__get8(s);            if (p != 8) return stbi__err("only 8-bit","JPEG format not supported: 8-bit only"); // JPEG baseline
+   s->img_y = stbi__get16be(s);   if (s->img_y == 0) return stbi__err("no header height", "JPEG format not supported: delayed height"); // Legal, but we don't handle it--but neither does IJG
+   s->img_x = stbi__get16be(s);   if (s->img_x == 0) return stbi__err("0 width","Corrupt JPEG"); // JPEG requires
+   if (s->img_y > STBI_MAX_DIMENSIONS) return stbi__err("too large","Very large image (corrupt?)");
+   if (s->img_x > STBI_MAX_DIMENSIONS) return stbi__err("too large","Very large image (corrupt?)");
+   c = stbi__get8(s);
+   if (c != 3 && c != 1 && c != 4) return stbi__err("bad component count","Corrupt JPEG");
+   s->img_n = c;
+   for (i=0; i < c; ++i) {
+      z->img_comp[i].data = NULL;
+      z->img_comp[i].linebuf = NULL;
+   }
+
+   if (Lf != 8+3*s->img_n) return stbi__err("bad SOF len","Corrupt JPEG");
+
+   z->rgb = 0; // counts components whose ids are 'R','G','B' in that order (3-component images only)
+   for (i=0; i < s->img_n; ++i) {
+      static const unsigned char rgb[3] = { 'R', 'G', 'B' };
+      z->img_comp[i].id = stbi__get8(s);
+      if (s->img_n == 3 && z->img_comp[i].id == rgb[i])
+         ++z->rgb;
+      q = stbi__get8(s);
+      z->img_comp[i].h = (q >> 4);  if (!z->img_comp[i].h || z->img_comp[i].h > 4) return stbi__err("bad H","Corrupt JPEG");
+      z->img_comp[i].v = q & 15;    if (!z->img_comp[i].v || z->img_comp[i].v > 4) return stbi__err("bad V","Corrupt JPEG");
+      z->img_comp[i].tq = stbi__get8(s);  if (z->img_comp[i].tq > 3) return stbi__err("bad TQ","Corrupt JPEG");
+   }
+
+   if (scan != STBI__SCAN_load) return 1; // anything but a full load stops here, before any allocation
+
+   if (!stbi__mad3sizes_valid(s->img_x, s->img_y, s->img_n, 0)) return stbi__err("too large", "Image too large to decode");
+
+   for (i=0; i < s->img_n; ++i) {
+      if (z->img_comp[i].h > h_max) h_max = z->img_comp[i].h;
+      if (z->img_comp[i].v > v_max) v_max = z->img_comp[i].v;
+   }
+
+   // check that plane subsampling factors are integer ratios; our resamplers can't deal with fractional ratios
+   // and I've never seen a non-corrupted JPEG file actually use them
+   for (i=0; i < s->img_n; ++i) {
+      if (h_max % z->img_comp[i].h != 0) return stbi__err("bad H","Corrupt JPEG");
+      if (v_max % z->img_comp[i].v != 0) return stbi__err("bad V","Corrupt JPEG");
+   }
+
+   // compute interleaved mcu info
+   z->img_h_max = h_max;
+   z->img_v_max = v_max;
+   z->img_mcu_w = h_max * 8;
+   z->img_mcu_h = v_max * 8;
+   // these sizes can't be more than 17 bits
+   z->img_mcu_x = (s->img_x + z->img_mcu_w-1) / z->img_mcu_w;
+   z->img_mcu_y = (s->img_y + z->img_mcu_h-1) / z->img_mcu_h;
+
+   for (i=0; i < s->img_n; ++i) {
+      // number of effective pixels (e.g. for non-interleaved MCU)
+      z->img_comp[i].x = (s->img_x * z->img_comp[i].h + h_max-1) / h_max;
+      z->img_comp[i].y = (s->img_y * z->img_comp[i].v + v_max-1) / v_max;
+      // to simplify generation, we'll allocate enough memory to decode
+      // the bogus oversized data from using interleaved MCUs and their
+      // big blocks (e.g. a 16x16 iMCU on an image of width 33); we won't
+      // discard the extra data until colorspace conversion
+      //
+      // img_mcu_x, img_mcu_y: <=17 bits; comp[i].h and .v are <=4 (checked earlier)
+      // so these muls can't overflow with 32-bit ints (which we require)
+      z->img_comp[i].w2 = z->img_mcu_x * z->img_comp[i].h * 8;
+      z->img_comp[i].h2 = z->img_mcu_y * z->img_comp[i].v * 8;
+      z->img_comp[i].coeff = 0;
+      z->img_comp[i].raw_coeff = 0;
+      z->img_comp[i].linebuf = NULL;
+      z->img_comp[i].raw_data = stbi__malloc_mad2(z->img_comp[i].w2, z->img_comp[i].h2, 15); // the extra 15 presumably leaves room to round data up to 16 bytes below
+      if (z->img_comp[i].raw_data == NULL)
+         return stbi__free_jpeg_components(z, i+1, stbi__err("outofmem", "Out of memory"));
+      // align blocks for idct using mmx/sse
+      z->img_comp[i].data = (stbi_uc*) (((size_t) z->img_comp[i].raw_data + 15) & ~15);
+      if (z->progressive) {
+         // w2, h2 are multiples of 8 (see above)
+         z->img_comp[i].coeff_w = z->img_comp[i].w2 / 8;
+         z->img_comp[i].coeff_h = z->img_comp[i].h2 / 8;
+         z->img_comp[i].raw_coeff = stbi__malloc_mad3(z->img_comp[i].w2, z->img_comp[i].h2, sizeof(short), 15);
+         if (z->img_comp[i].raw_coeff == NULL)
+            return stbi__free_jpeg_components(z, i+1, stbi__err("outofmem", "Out of memory"));
+         z->img_comp[i].coeff = (short*) (((size_t) z->img_comp[i].raw_coeff + 15) & ~15);
+      }
+   }
+
+   return 1;
+}
+
+// use comparisons since in some cases we handle more than one case (e.g. SOF)
+#define stbi__DNL(x)         ((x) == 0xdc) // its payload is checked against img_y in stbi__decode_jpeg_image
+#define stbi__SOI(x)         ((x) == 0xd8) // must be the first marker, else "no SOI"
+#define stbi__EOI(x)         ((x) == 0xd9) // ends the marker loop in stbi__decode_jpeg_image
+#define stbi__SOF(x)         ((x) == 0xc0 || (x) == 0xc1 || (x) == 0xc2) // evaluates x up to three times: pass a plain variable
+#define stbi__SOS(x)         ((x) == 0xda) // followed by a scan header and entropy-coded data
+
+#define stbi__SOF_progressive(x)   ((x) == 0xc2) // the one stbi__SOF value that sets z->progressive
+
+static int stbi__decode_jpeg_header(stbi__jpeg *z, int scan)
+{
+   int marker;
+   // reset the per-file state that marker parsing fills in
+   z->marker = STBI__MARKER_none; // initialize cached marker to empty
+   z->app14_color_transform = -1; // valid values are 0,1,2
+   z->jfif = 0;
+   marker = stbi__get_marker(z);
+   if (!stbi__SOI(marker)) return stbi__err("no SOI","Corrupt JPEG");
+   if (scan == STBI__SCAN_type) return 1; // a type probe only needs the SOI check
+   // process every segment that precedes the frame header
+   for (marker = stbi__get_marker(z); !stbi__SOF(marker); ) {
+      if (!stbi__process_marker(z,marker)) return 0;
+      // some files have extra padding after their blocks, so ok, we'll scan
+      for (;;) {
+         marker = stbi__get_marker(z);
+         if (marker != STBI__MARKER_none) break;
+         if (stbi__at_eof(z->s)) return stbi__err("no SOF", "Corrupt JPEG");
+      }
+   }
+   z->progressive = stbi__SOF_progressive(marker);
+   return stbi__process_frame_header(z, scan) ? 1 : 0;
+}
+
+// decode image to YCbCr format; returns 1 on success, 0 on failure (component buffers are left for the caller to free)
+static int stbi__decode_jpeg_image(stbi__jpeg *j)
+{
+   int m;
+   for (m = 0; m < 4; m++) { // NULL every per-component pointer so cleanup after an early header error is safe
+      j->img_comp[m].raw_data = NULL;
+      j->img_comp[m].raw_coeff = NULL;
+      j->img_comp[m].linebuf = NULL; // otherwise stays uninitialized until the frame header has been fully parsed
+   }
+   j->restart_interval = 0;
+   if (!stbi__decode_jpeg_header(j, STBI__SCAN_load)) return 0;
+   m = stbi__get_marker(j);
+   while (!stbi__EOI(m)) {
+      if (stbi__SOS(m)) {
+         if (!stbi__process_scan_header(j)) return 0;
+         if (!stbi__parse_entropy_coded_data(j)) return 0;
+         if (j->marker == STBI__MARKER_none ) {
+            // handle 0s at the end of image data from IP Kamera 9060
+            while (!stbi__at_eof(j->s)) {
+               int x = stbi__get8(j->s);
+               if (x == 255) {
+                  j->marker = stbi__get8(j->s);
+                  break;
+               }
+            }
+            // if we reach eof without hitting a marker, stbi__get_marker() below will fail and we'll eventually return 0
+         }
+      } else if (stbi__DNL(m)) {
+         int Ld = stbi__get16be(j->s);
+         stbi__uint32 NL = stbi__get16be(j->s);
+         if (Ld != 4) return stbi__err("bad DNL len", "Corrupt JPEG");
+         if (NL != j->s->img_y) return stbi__err("bad DNL height", "Corrupt JPEG");
+      } else {
+         if (!stbi__process_marker(j, m)) return 0;
+      }
+      m = stbi__get_marker(j);
+   }
+   if (j->progressive) stbi__jpeg_finish(j); // progressive-only post-pass, run once every scan has been read
+   return 1;
+}
+
+// static jfif-centered resampling (across block boundaries)
+
+typedef stbi_uc *(*resample_row_func)(stbi_uc *out, stbi_uc *in0, stbi_uc *in1,
+                                    int w, int hs); // w: input samples in the row, hs: horizontal expansion; returns the row to read (out, or in0 itself)
+
+#define stbi__div4(x) ((stbi_uc) ((x) >> 2)) // truncating divide by 4; callers add 2 first to round
+
+static stbi_uc *resample_row_1(stbi_uc *out, stbi_uc *in_near, stbi_uc *in_far, int w, int hs)
+{
+   STBI_NOTUSED(hs);
+   STBI_NOTUSED(w);
+   STBI_NOTUSED(in_far);
+   STBI_NOTUSED(out);
+   return in_near; // no expansion in either axis: the caller reads straight from the source row
+}
+
+static stbi_uc* stbi__resample_row_v_2(stbi_uc *out, stbi_uc *in_near, stbi_uc *in_far, int w, int hs)
+{
+   // vertical 2x: each output sample blends the two source rows 3:1 (nearer row weighted 3), rounded
+   int x = 0;
+   STBI_NOTUSED(hs);
+   for (; x < w; x++)
+      out[x] = stbi__div4(in_far[x] + 3*in_near[x] + 2);
+   return out;
+}
+
+static stbi_uc*  stbi__resample_row_h_2(stbi_uc *out, stbi_uc *in_near, stbi_uc *in_far, int w, int hs)
+{
+   // horizontal 2x: every input sample yields two outputs, each blended 3:1 with the left/right neighbor
+   const stbi_uc *src = in_near;
+   int last = w - 1;
+   int x;
+   STBI_NOTUSED(in_far);
+   STBI_NOTUSED(hs);
+
+   if (last == 0) {
+      // if only one sample, can't do any interpolation
+      out[0] = out[1] = src[0];
+      return out;
+   }
+
+   // the outermost outputs have no outer neighbor, so they copy the edge sample
+   out[0] = src[0];
+   out[1] = stbi__div4(3*src[0] + src[1] + 2);
+   for (x = 1; x < last; x++) {
+      int center = 3*src[x] + 2;
+      out[2*x]   = stbi__div4(center + src[x-1]);
+      out[2*x+1] = stbi__div4(center + src[x+1]);
+   }
+   out[2*last]   = stbi__div4(3*src[last-1] + src[last] + 2);
+   out[2*last+1] = src[last];
+   return out;
+}
+
+#define stbi__div16(x) ((stbi_uc) ((x) >> 4))
+
+static stbi_uc *stbi__resample_row_hv_2(stbi_uc *out, stbi_uc *in_near, stbi_uc *in_far, int w, int hs)
+{
+   // 2x in both axes: blend the rows 3:1 vertically, then blend neighboring column sums 3:1 horizontally
+   int x, left, cur;
+   STBI_NOTUSED(hs);
+
+   cur = 3*in_near[0] + in_far[0];   // vertical blend of column 0, still scaled by 4
+   if (w == 1) {
+      out[0] = out[1] = stbi__div4(cur + 2);
+      return out;
+   }
+
+   out[0] = stbi__div4(cur + 2);     // left edge: no horizontal neighbor
+   for (x = 1; x < w; x++) {
+      left = cur;
+      cur  = 3*in_near[x] + in_far[x];
+      out[2*x-1] = stbi__div16(3*left + cur + 8);
+      out[2*x]   = stbi__div16(3*cur + left + 8);
+   }
+   out[2*w-1] = stbi__div4(cur + 2); // right edge, same treatment as the left
+
+   return out;
+}
+
+#if defined(STBI_SSE2) || defined(STBI_NEON)
+static stbi_uc *stbi__resample_row_hv_2_simd(stbi_uc *out, stbi_uc *in_near, stbi_uc *in_far, int w, int hs)
+{
+   // need to generate 2x2 samples for every one in input (vectorized counterpart of stbi__resample_row_hv_2)
+   int i=0,t0,t1; // t0/t1: vertically filtered sums (3*near + far) of the previous/current input pixel
+
+   if (w == 1) {
+      out[0] = out[1] = stbi__div4(3*in_near[0] + in_far[0] + 2);
+      return out;
+   }
+
+   t1 = 3*in_near[0] + in_far[0];
+   // process groups of 8 pixels for as long as we can.
+   // note we can't handle the last pixel in a row in this loop
+   // because we need to handle the filter boundary conditions.
+   for (; i < ((w-1) & ~7); i += 8) { // i+8 <= w-1 here, so the [i+8] reads below stay inside the row
+#if defined(STBI_SSE2)
+      // load and perform the vertical filtering pass
+      // this uses 3*x + y = 4*x + (y - x)
+      __m128i zero  = _mm_setzero_si128();
+      __m128i farb  = _mm_loadl_epi64((__m128i *) (in_far + i));
+      __m128i nearb = _mm_loadl_epi64((__m128i *) (in_near + i));
+      __m128i farw  = _mm_unpacklo_epi8(farb, zero);
+      __m128i nearw = _mm_unpacklo_epi8(nearb, zero);
+      __m128i diff  = _mm_sub_epi16(farw, nearw);
+      __m128i nears = _mm_slli_epi16(nearw, 2);
+      __m128i curr  = _mm_add_epi16(nears, diff); // current row
+
+      // horizontal filter works the same based on shifted vers of current
+      // row. "prev" is current row shifted right by 1 pixel; we need to
+      // insert the previous pixel value (from t1).
+      // "next" is current row shifted left by 1 pixel, with first pixel
+      // of next block of 8 pixels added in.
+      __m128i prv0 = _mm_slli_si128(curr, 2);
+      __m128i nxt0 = _mm_srli_si128(curr, 2);
+      __m128i prev = _mm_insert_epi16(prv0, t1, 0);
+      __m128i next = _mm_insert_epi16(nxt0, 3*in_near[i+8] + in_far[i+8], 7);
+
+      // horizontal filter, polyphase implementation since it's convenient:
+      // even pixels = 3*cur + prev = cur*4 + (prev - cur)
+      // odd  pixels = 3*cur + next = cur*4 + (next - cur)
+      // note the shared term.
+      __m128i bias  = _mm_set1_epi16(8);
+      __m128i curs = _mm_slli_epi16(curr, 2);
+      __m128i prvd = _mm_sub_epi16(prev, curr);
+      __m128i nxtd = _mm_sub_epi16(next, curr);
+      __m128i curb = _mm_add_epi16(curs, bias);
+      __m128i even = _mm_add_epi16(prvd, curb);
+      __m128i odd  = _mm_add_epi16(nxtd, curb);
+
+      // interleave even and odd pixels, then undo scaling.
+      __m128i int0 = _mm_unpacklo_epi16(even, odd);
+      __m128i int1 = _mm_unpackhi_epi16(even, odd);
+      __m128i de0  = _mm_srli_epi16(int0, 4);
+      __m128i de1  = _mm_srli_epi16(int1, 4);
+
+      // pack and write output
+      __m128i outv = _mm_packus_epi16(de0, de1);
+      _mm_storeu_si128((__m128i *) (out + i*2), outv);
+#elif defined(STBI_NEON)
+      // load and perform the vertical filtering pass
+      // this uses 3*x + y = 4*x + (y - x)
+      uint8x8_t farb  = vld1_u8(in_far + i);
+      uint8x8_t nearb = vld1_u8(in_near + i);
+      int16x8_t diff  = vreinterpretq_s16_u16(vsubl_u8(farb, nearb));
+      int16x8_t nears = vreinterpretq_s16_u16(vshll_n_u8(nearb, 2));
+      int16x8_t curr  = vaddq_s16(nears, diff); // current row
+
+      // horizontal filter works the same based on shifted vers of current
+      // row. "prev" is current row shifted right by 1 pixel; we need to
+      // insert the previous pixel value (from t1).
+      // "next" is current row shifted left by 1 pixel, with first pixel
+      // of next block of 8 pixels added in.
+      int16x8_t prv0 = vextq_s16(curr, curr, 7);
+      int16x8_t nxt0 = vextq_s16(curr, curr, 1);
+      int16x8_t prev = vsetq_lane_s16(t1, prv0, 0);
+      int16x8_t next = vsetq_lane_s16(3*in_near[i+8] + in_far[i+8], nxt0, 7);
+
+      // horizontal filter, polyphase implementation since it's convenient:
+      // even pixels = 3*cur + prev = cur*4 + (prev - cur)
+      // odd  pixels = 3*cur + next = cur*4 + (next - cur)
+      // note the shared term.
+      int16x8_t curs = vshlq_n_s16(curr, 2);
+      int16x8_t prvd = vsubq_s16(prev, curr);
+      int16x8_t nxtd = vsubq_s16(next, curr);
+      int16x8_t even = vaddq_s16(curs, prvd);
+      int16x8_t odd  = vaddq_s16(curs, nxtd);
+
+      // undo scaling and round, then store with even/odd phases interleaved
+      uint8x8x2_t o;
+      o.val[0] = vqrshrun_n_s16(even, 4);
+      o.val[1] = vqrshrun_n_s16(odd,  4);
+      vst2_u8(out + i*2, o);
+#endif
+
+      // "previous" value for next iter
+      t1 = 3*in_near[i+7] + in_far[i+7];
+   }
+
+   t0 = t1;
+   t1 = 3*in_near[i] + in_far[i];
+   out[i*2] = stbi__div16(3*t1 + t0 + 8); // left-leaning output of pixel i; its right-leaning twin comes from the loop below or the final edge store
+
+   for (++i; i < w; ++i) { // scalar tail: same recurrence as stbi__resample_row_hv_2
+      t0 = t1;
+      t1 = 3*in_near[i]+in_far[i];
+      out[i*2-1] = stbi__div16(3*t0 + t1 + 8);
+      out[i*2  ] = stbi__div16(3*t1 + t0 + 8);
+   }
+   out[w*2-1] = stbi__div4(t1+2); // right edge: no horizontal neighbor
+
+   STBI_NOTUSED(hs);
+
+   return out;
+}
+#endif
+
+static stbi_uc *stbi__resample_row_generic(stbi_uc *out, stbi_uc *in_near, stbi_uc *in_far, int w, int hs)
+{
+   // nearest-neighbor fallback: repeat each input sample hs times
+   stbi_uc *dst = out;
+   int x, rep;
+   STBI_NOTUSED(in_far);
+   for (x = 0; x < w; x++)
+      for (rep = 0; rep < hs; rep++) *dst++ = in_near[x];
+   return out;
+}
+
+// this is a reduced-precision calculation of YCbCr-to-RGB introduced
+// to make sure the code produces the same results in both SIMD and scalar
+#define stbi__float2fixed(x)  (((int) ((x) * 4096.0f + 0.5f)) << 8)
+static void stbi__YCbCr_to_RGB_row(stbi_uc *out, const stbi_uc *y, const stbi_uc *pcb, const stbi_uc *pcr, int count, int step)
+{
+   stbi_uc *px = out; // current output pixel; moves forward by step bytes per input sample
+   int k;
+   for (k = 0; k < count; k++, px += step) {
+      int cb = pcb[k] - 128;
+      int cr = pcr[k] - 128;
+      int y_fixed = (y[k] << 20) + (1<<19); // luma with 20 fractional bits, plus one half for rounding
+      int r = y_fixed +  cr* stbi__float2fixed(1.40200f);
+      int g = y_fixed + (cr*-stbi__float2fixed(0.71414f)) + ((cb*-stbi__float2fixed(0.34414f)) & 0xffff0000);
+      int b = y_fixed                                     +   cb* stbi__float2fixed(1.77200f);
+      r >>= 20;
+      g >>= 20;
+      b >>= 20;
+      // clamp each channel to 0..255
+      if (r < 0) r = 0; else if (r > 255) r = 255;
+      if (g < 0) g = 0; else if (g > 255) g = 255;
+      if (b < 0) b = 0; else if (b > 255) b = 255;
+      px[0] = (stbi_uc)r;
+      px[1] = (stbi_uc)g;
+      px[2] = (stbi_uc)b;
+      px[3] = 255; // written even when step is 3; the next pixel (if any) overwrites it
+   }
+}
+
+#if defined(STBI_SSE2) || defined(STBI_NEON)
+static void stbi__YCbCr_to_RGB_simd(stbi_uc *out, stbi_uc const *y, stbi_uc const *pcb, stbi_uc const *pcr, int count, int step)
+{
+   int i = 0; // pixels converted so far; the SIMD loops advance it 8 at a time
+
+#ifdef STBI_SSE2
+   // step == 3 is pretty ugly on the final interleave, and i'm not convinced
+   // it's useful in practice (you wouldn't use it for textures, for example).
+   // so just accelerate step == 4 case.
+   if (step == 4) {
+      // this is a fairly straightforward implementation and not super-optimized.
+      __m128i signflip  = _mm_set1_epi8(-0x80);
+      __m128i cr_const0 = _mm_set1_epi16(   (short) ( 1.40200f*4096.0f+0.5f));
+      __m128i cr_const1 = _mm_set1_epi16( - (short) ( 0.71414f*4096.0f+0.5f));
+      __m128i cb_const0 = _mm_set1_epi16( - (short) ( 0.34414f*4096.0f+0.5f));
+      __m128i cb_const1 = _mm_set1_epi16(   (short) ( 1.77200f*4096.0f+0.5f));
+      __m128i y_bias = _mm_set1_epi8((char) (unsigned char) 128);
+      __m128i xw = _mm_set1_epi16(255); // alpha channel
+
+      for (; i+7 < count; i += 8) {
+         // load
+         __m128i y_bytes = _mm_loadl_epi64((__m128i *) (y+i));
+         __m128i cr_bytes = _mm_loadl_epi64((__m128i *) (pcr+i));
+         __m128i cb_bytes = _mm_loadl_epi64((__m128i *) (pcb+i));
+         __m128i cr_biased = _mm_xor_si128(cr_bytes, signflip); // -128
+         __m128i cb_biased = _mm_xor_si128(cb_bytes, signflip); // -128
+
+         // unpack to short (and left-shift cr, cb by 8)
+         __m128i yw  = _mm_unpacklo_epi8(y_bias, y_bytes);
+         __m128i crw = _mm_unpacklo_epi8(_mm_setzero_si128(), cr_biased);
+         __m128i cbw = _mm_unpacklo_epi8(_mm_setzero_si128(), cb_biased);
+
+         // color transform
+         __m128i yws = _mm_srli_epi16(yw, 4);
+         __m128i cr0 = _mm_mulhi_epi16(cr_const0, crw);
+         __m128i cb0 = _mm_mulhi_epi16(cb_const0, cbw);
+         __m128i cb1 = _mm_mulhi_epi16(cbw, cb_const1);
+         __m128i cr1 = _mm_mulhi_epi16(crw, cr_const1);
+         __m128i rws = _mm_add_epi16(cr0, yws);
+         __m128i gwt = _mm_add_epi16(cb0, yws);
+         __m128i bws = _mm_add_epi16(yws, cb1);
+         __m128i gws = _mm_add_epi16(gwt, cr1);
+
+         // descale
+         __m128i rw = _mm_srai_epi16(rws, 4);
+         __m128i bw = _mm_srai_epi16(bws, 4);
+         __m128i gw = _mm_srai_epi16(gws, 4);
+
+         // back to byte, set up for transpose
+         __m128i brb = _mm_packus_epi16(rw, bw);
+         __m128i gxb = _mm_packus_epi16(gw, xw);
+
+         // transpose to interleave channels
+         __m128i t0 = _mm_unpacklo_epi8(brb, gxb);
+         __m128i t1 = _mm_unpackhi_epi8(brb, gxb);
+         __m128i o0 = _mm_unpacklo_epi16(t0, t1);
+         __m128i o1 = _mm_unpackhi_epi16(t0, t1);
+
+         // store
+         _mm_storeu_si128((__m128i *) (out + 0), o0);
+         _mm_storeu_si128((__m128i *) (out + 16), o1);
+         out += 32; // 8 pixels * 4 bytes each
+      }
+   }
+#endif
+
+#ifdef STBI_NEON
+   // in this version, step=3 support would be easy to add. but is there demand?
+   if (step == 4) {
+      // this is a fairly straightforward implementation and not super-optimized.
+      uint8x8_t signflip = vdup_n_u8(0x80);
+      int16x8_t cr_const0 = vdupq_n_s16(   (short) ( 1.40200f*4096.0f+0.5f));
+      int16x8_t cr_const1 = vdupq_n_s16( - (short) ( 0.71414f*4096.0f+0.5f));
+      int16x8_t cb_const0 = vdupq_n_s16( - (short) ( 0.34414f*4096.0f+0.5f));
+      int16x8_t cb_const1 = vdupq_n_s16(   (short) ( 1.77200f*4096.0f+0.5f));
+
+      for (; i+7 < count; i += 8) {
+         // load
+         uint8x8_t y_bytes  = vld1_u8(y + i);
+         uint8x8_t cr_bytes = vld1_u8(pcr + i);
+         uint8x8_t cb_bytes = vld1_u8(pcb + i);
+         int8x8_t cr_biased = vreinterpret_s8_u8(vsub_u8(cr_bytes, signflip));
+         int8x8_t cb_biased = vreinterpret_s8_u8(vsub_u8(cb_bytes, signflip));
+
+         // expand to s16
+         int16x8_t yws = vreinterpretq_s16_u16(vshll_n_u8(y_bytes, 4));
+         int16x8_t crw = vshll_n_s8(cr_biased, 7);
+         int16x8_t cbw = vshll_n_s8(cb_biased, 7);
+
+         // color transform
+         int16x8_t cr0 = vqdmulhq_s16(crw, cr_const0);
+         int16x8_t cb0 = vqdmulhq_s16(cbw, cb_const0);
+         int16x8_t cr1 = vqdmulhq_s16(crw, cr_const1);
+         int16x8_t cb1 = vqdmulhq_s16(cbw, cb_const1);
+         int16x8_t rws = vaddq_s16(yws, cr0);
+         int16x8_t gws = vaddq_s16(vaddq_s16(yws, cb0), cr1);
+         int16x8_t bws = vaddq_s16(yws, cb1);
+
+         // undo scaling, round, convert to byte
+         uint8x8x4_t o;
+         o.val[0] = vqrshrun_n_s16(rws, 4);
+         o.val[1] = vqrshrun_n_s16(gws, 4);
+         o.val[2] = vqrshrun_n_s16(bws, 4);
+         o.val[3] = vdup_n_u8(255);
+
+         // store, interleaving r/g/b/a
+         vst4_u8(out, o);
+         out += 8*4;
+      }
+   }
+#endif
+
+   for (; i < count; ++i) { // scalar tail: leftover pixels, or all of them when no SIMD loop ran (e.g. step != 4); same math as stbi__YCbCr_to_RGB_row
+      int y_fixed = (y[i] << 20) + (1<<19); // rounding
+      int r,g,b;
+      int cr = pcr[i] - 128;
+      int cb = pcb[i] - 128;
+      r = y_fixed + cr* stbi__float2fixed(1.40200f);
+      g = y_fixed + cr*-stbi__float2fixed(0.71414f) + ((cb*-stbi__float2fixed(0.34414f)) & 0xffff0000);
+      b = y_fixed                                   +   cb* stbi__float2fixed(1.77200f);
+      r >>= 20;
+      g >>= 20;
+      b >>= 20;
+      if ((unsigned) r > 255) { if (r < 0) r = 0; else r = 255; }
+      if ((unsigned) g > 255) { if (g < 0) g = 0; else g = 255; }
+      if ((unsigned) b > 255) { if (b < 0) b = 0; else b = 255; }
+      out[0] = (stbi_uc)r;
+      out[1] = (stbi_uc)g;
+      out[2] = (stbi_uc)b;
+      out[3] = 255;
+      out += step;
+   }
+}
+#endif
+
+// install the decode kernels: portable C versions first, then SIMD overrides where the build provides them
+static void stbi__setup_jpeg(stbi__jpeg *j)
+{
+   j->resample_row_hv_2_kernel = stbi__resample_row_hv_2;
+   j->YCbCr_to_RGB_kernel = stbi__YCbCr_to_RGB_row;
+   j->idct_block_kernel = stbi__idct_block;
+
+#ifdef STBI_SSE2
+   if (stbi__sse2_available()) { // checked at run time; the C kernels stay in place otherwise
+      j->resample_row_hv_2_kernel = stbi__resample_row_hv_2_simd;
+      j->YCbCr_to_RGB_kernel = stbi__YCbCr_to_RGB_simd;
+      j->idct_block_kernel = stbi__idct_simd;
+   }
+#endif
+
+#ifdef STBI_NEON
+   j->resample_row_hv_2_kernel = stbi__resample_row_hv_2_simd; // NEON builds switch unconditionally
+   j->YCbCr_to_RGB_kernel = stbi__YCbCr_to_RGB_simd;
+   j->idct_block_kernel = stbi__idct_simd;
+#endif
+}
+
+// release the temporary buffers of every component counted in s->img_n
+static void stbi__cleanup_jpeg(stbi__jpeg *j)
+{
+   (void) stbi__free_jpeg_components(j, j->s->img_n, 0); // return value is not needed here
+}
+
+typedef struct
+{
+   resample_row_func resample; // row kernel, picked from hs/vs in load_jpeg_image
+   stbi_uc *line0,*line1; // the two source rows being blended; both start at the component's first row
+   int hs,vs;   // expansion factor in each axis
+   int w_lores; // horizontal pixels pre-expansion
+   int ystep;   // how far through vertical expansion we are
+   int ypos;    // which pre-expansion row we're on
+} stbi__resample;
+
+// fast 0..255 * 0..255 => 0..255 rounded multiplication (shift/add stand-in for dividing by 255)
+static stbi_uc stbi__blinn_8x8(stbi_uc x, stbi_uc y)
+{
+   unsigned int biased = 128u + (unsigned int) x * (unsigned int) y;
+   return (stbi_uc) (((biased >> 8) + biased) >> 8);
+}
+
+static stbi_uc *load_jpeg_image(stbi__jpeg *z, int *out_x, int *out_y, int *comp, int req_comp)
+{
+   int n, decode_n, is_rgb; // n: channels written per output pixel; decode_n: source components resampled; is_rgb: source is treated as RGB (no YCbCr conversion)
+   z->s->img_n = 0; // make stbi__cleanup_jpeg safe
+
+   // validate req_comp
+   if (req_comp < 0 || req_comp > 4) return stbi__errpuc("bad req_comp", "Internal error");
+
+   // load a jpeg image from whichever source, but leave in YCbCr format
+   if (!stbi__decode_jpeg_image(z)) { stbi__cleanup_jpeg(z); return NULL; }
+
+   // determine actual number of components to generate
+   n = req_comp ? req_comp : z->s->img_n >= 3 ? 3 : 1;
+
+   is_rgb = z->s->img_n == 3 && (z->rgb == 3 || (z->app14_color_transform == 0 && !z->jfif));
+
+   if (z->s->img_n == 3 && n < 3 && !is_rgb)
+      decode_n = 1; // grey output from YCbCr only needs the first (luma) component
+   else
+      decode_n = z->s->img_n;
+
+   // nothing to do if no components requested; check this now to avoid
+   // accessing uninitialized coutput[0] later
+   if (decode_n <= 0) { stbi__cleanup_jpeg(z); return NULL; }
+
+   // resample and color-convert
+   {
+      int k;
+      unsigned int i,j;
+      stbi_uc *output;
+      stbi_uc *coutput[4] = { NULL, NULL, NULL, NULL };
+
+      stbi__resample res_comp[4];
+
+      for (k=0; k < decode_n; ++k) {
+         stbi__resample *r = &res_comp[k];
+
+         // allocate line buffer big enough for upsampling off the edges
+         // with upsample factor of 4
+         z->img_comp[k].linebuf = (stbi_uc *) stbi__malloc(z->s->img_x + 3);
+         if (!z->img_comp[k].linebuf) { stbi__cleanup_jpeg(z); return stbi__errpuc("outofmem", "Out of memory"); }
+
+         r->hs      = z->img_h_max / z->img_comp[k].h;
+         r->vs      = z->img_v_max / z->img_comp[k].v;
+         r->ystep   = r->vs >> 1;
+         r->w_lores = (z->s->img_x + r->hs-1) / r->hs;
+         r->ypos    = 0;
+         r->line0   = r->line1 = z->img_comp[k].data;
+
+         if      (r->hs == 1 && r->vs == 1) r->resample = resample_row_1;
+         else if (r->hs == 1 && r->vs == 2) r->resample = stbi__resample_row_v_2;
+         else if (r->hs == 2 && r->vs == 1) r->resample = stbi__resample_row_h_2;
+         else if (r->hs == 2 && r->vs == 2) r->resample = z->resample_row_hv_2_kernel;
+         else                               r->resample = stbi__resample_row_generic;
+      }
+
+      // this is the last allocation; once it succeeds nothing below returns an error
+      output = (stbi_uc *) stbi__malloc_mad3(n, z->s->img_x, z->s->img_y, 1); // trailing 1: presumably one spare byte, since the loops below store out[3]/out[1] even when n is smaller
+      if (!output) { stbi__cleanup_jpeg(z); return stbi__errpuc("outofmem", "Out of memory"); }
+
+      // now go ahead and resample
+      for (j=0; j < z->s->img_y; ++j) {
+         stbi_uc *out = output + n * z->s->img_x * j;
+         for (k=0; k < decode_n; ++k) {
+            stbi__resample *r = &res_comp[k];
+            int y_bot = r->ystep >= (r->vs >> 1); // selects which of line0/line1 is passed as the nearer row
+            coutput[k] = r->resample(z->img_comp[k].linebuf,
+                                     y_bot ? r->line1 : r->line0,
+                                     y_bot ? r->line0 : r->line1,
+                                     r->w_lores, r->hs);
+            if (++r->ystep >= r->vs) { // finished this source row pair: slide the window down one row
+               r->ystep = 0;
+               r->line0 = r->line1;
+               if (++r->ypos < z->img_comp[k].y) // line1 stops advancing at the component's last row
+                  r->line1 += z->img_comp[k].w2;
+            }
+         }
+         if (n >= 3) {
+            stbi_uc *y = coutput[0];
+            if (z->s->img_n == 3) {
+               if (is_rgb) {
+                  for (i=0; i < z->s->img_x; ++i) {
+                     out[0] = y[i];
+                     out[1] = coutput[1][i];
+                     out[2] = coutput[2][i];
+                     out[3] = 255;
+                     out += n;
+                  }
+               } else {
+                  z->YCbCr_to_RGB_kernel(out, y, coutput[1], coutput[2], z->s->img_x, n);
+               }
+            } else if (z->s->img_n == 4) {
+               if (z->app14_color_transform == 0) { // CMYK
+                  for (i=0; i < z->s->img_x; ++i) {
+                     stbi_uc m = coutput[3][i];
+                     out[0] = stbi__blinn_8x8(coutput[0][i], m);
+                     out[1] = stbi__blinn_8x8(coutput[1][i], m);
+                     out[2] = stbi__blinn_8x8(coutput[2][i], m);
+                     out[3] = 255;
+                     out += n;
+                  }
+               } else if (z->app14_color_transform == 2) { // YCCK
+                  z->YCbCr_to_RGB_kernel(out, y, coutput[1], coutput[2], z->s->img_x, n);
+                  for (i=0; i < z->s->img_x; ++i) {
+                     stbi_uc m = coutput[3][i];
+                     out[0] = stbi__blinn_8x8(255 - out[0], m);
+                     out[1] = stbi__blinn_8x8(255 - out[1], m);
+                     out[2] = stbi__blinn_8x8(255 - out[2], m);
+                     out += n;
+                  }
+               } else { // YCbCr + alpha?  Ignore the fourth channel for now
+                  z->YCbCr_to_RGB_kernel(out, y, coutput[1], coutput[2], z->s->img_x, n);
+               }
+            } else
+               for (i=0; i < z->s->img_x; ++i) {
+                  out[0] = out[1] = out[2] = y[i];
+                  out[3] = 255; // not used if n==3
+                  out += n;
+               }
+         } else {
+            if (is_rgb) {
+               if (n == 1)
+                  for (i=0; i < z->s->img_x; ++i)
+                     *out++ = stbi__compute_y(coutput[0][i], coutput[1][i], coutput[2][i]);
+               else {
+                  for (i=0; i < z->s->img_x; ++i, out += 2) {
+                     out[0] = stbi__compute_y(coutput[0][i], coutput[1][i], coutput[2][i]);
+                     out[1] = 255;
+                  }
+               }
+            } else if (z->s->img_n == 4 && z->app14_color_transform == 0) {
+               for (i=0; i < z->s->img_x; ++i) {
+                  stbi_uc m = coutput[3][i];
+                  stbi_uc r = stbi__blinn_8x8(coutput[0][i], m);
+                  stbi_uc g = stbi__blinn_8x8(coutput[1][i], m);
+                  stbi_uc b = stbi__blinn_8x8(coutput[2][i], m);
+                  out[0] = stbi__compute_y(r, g, b);
+                  out[1] = 255;
+                  out += n;
+               }
+            } else if (z->s->img_n == 4 && z->app14_color_transform == 2) {
+               for (i=0; i < z->s->img_x; ++i) {
+                  out[0] = stbi__blinn_8x8(255 - coutput[0][i], coutput[3][i]);
+                  out[1] = 255;
+                  out += n;
+               }
+            } else {
+               stbi_uc *y = coutput[0];
+               if (n == 1)
+                  for (i=0; i < z->s->img_x; ++i) out[i] = y[i];
+               else
+                  for (i=0; i < z->s->img_x; ++i) { *out++ = y[i]; *out++ = 255; }
+            }
+         }
+      }
+      stbi__cleanup_jpeg(z);
+      *out_x = z->s->img_x;
+      *out_y = z->s->img_y;
+      if (comp) *comp = z->s->img_n >= 3 ? 3 : 1; // report original components, not output
+      return output;
+   }
+}
+
+static void *stbi__jpeg_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri)
+{
+   unsigned char* result;
+   stbi__jpeg* j = (stbi__jpeg*) stbi__malloc(sizeof(stbi__jpeg));
+   if (!j) return stbi__errpuc("outofmem", "Out of memory");
+   memset(j, 0, sizeof(stbi__jpeg)); // fresh heap memory is garbage: zero it so error-path cleanup never sees wild per-component pointers
+   STBI_NOTUSED(ri);
+   j->s = s; stbi__setup_jpeg(j); // bind the input stream, then install the decode kernels
+   result = load_jpeg_image(j, x,y,comp,req_comp); // NULL on failure, otherwise the decoded pixel buffer
+   STBI_FREE(j); // only the decoder state is released here; the pixel buffer is handed back
+   return result;
+}
+
+static int stbi__jpeg_test(stbi__context *s)
+{
+   stbi__jpeg *probe = (stbi__jpeg *) stbi__malloc(sizeof(*probe));
+   int is_jpeg;
+   if (probe == NULL) return stbi__err("outofmem", "Out of memory");
+   probe->s = s;
+   stbi__setup_jpeg(probe);
+   is_jpeg = stbi__decode_jpeg_header(probe, STBI__SCAN_type); // SCAN_type stops right after the SOI check
+   stbi__rewind(s); // rewind the stream after the probe
+   STBI_FREE(probe);
+   return is_jpeg;
+}
+
+static int stbi__jpeg_info_raw(stbi__jpeg *j, int *x, int *y, int *comp)
+{
+   int ok = stbi__decode_jpeg_header(j, STBI__SCAN_header);
+   if (!ok) stbi__rewind( j->s ); // header did not parse: rewind the stream and report failure
+   else {
+      if (x != NULL) *x = j->s->img_x; // each output is optional
+      if (y != NULL) *y = j->s->img_y;
+      if (comp != NULL) *comp = (j->s->img_n < 3) ? 1 : 3;
+   }
+   return ok ? 1 : 0;
+}
+
+static int stbi__jpeg_info(stbi__context *s, int *x, int *y, int *comp)
+{
+   stbi__jpeg *dec = (stbi__jpeg *) stbi__malloc(sizeof(*dec)); // scratch decoder state, freed before returning
+   int ok;
+   if (dec == NULL) return stbi__err("outofmem", "Out of memory");
+   dec->s = s;
+   ok = stbi__jpeg_info_raw(dec, x, y, comp);
+   STBI_FREE(dec);
+   return ok;
+}
+#endif
+
+// public domain zlib decode    v0.2  Sean Barrett 2006-11-18
+//    simple implementation
+//      - all input must be provided in an upfront buffer
+//      - all output is written to a single output buffer (can malloc/realloc)
+//    performance
+//      - fast huffman
+
+#ifndef STBI_NO_ZLIB
+
+// fast-way is faster to check than jpeg huffman, but slow way is slower
+#define STBI__ZFAST_BITS  9 // accelerate all cases in default tables
+#define STBI__ZFAST_MASK  ((1 << STBI__ZFAST_BITS) - 1) // selects the low STBI__ZFAST_BITS bits of the bit buffer
+#define STBI__ZNSYMS 288 // number of symbols in literal/length alphabet
+
+// zlib-style huffman encoding
+// (jpegs packs from left, zlib from right, so can't share code)
+typedef struct
+{
+   stbi__uint16 fast[1 << STBI__ZFAST_BITS]; // indexed by the next STBI__ZFAST_BITS input bits; entry is (code length << 9) | symbol, 0 = not in table
+   stbi__uint16 firstcode[16]; // first code of each length
+   int maxcode[17]; // per-length upper bound, preshifted to 16 bits; [16] is a sentinel
+   stbi__uint16 firstsymbol[16]; // index into size[]/value[] of the first entry of each length
+   stbi_uc  size[STBI__ZNSYMS]; // code length of each entry
+   stbi__uint16 value[STBI__ZNSYMS]; // symbol of each entry
+} stbi__zhuffman;
+
+stbi_inline static int stbi__bitreverse16(int n)
+{
+  n = ((n & 0x5555) << 1) | ((n & 0xAAAA) >>  1);   // swap adjacent bits
+  n = ((n & 0x3333) << 2) | ((n & 0xCCCC) >>  2);   // swap bit pairs
+  n = ((n & 0x0F0F) << 4) | ((n & 0xF0F0) >>  4);   // swap nibbles
+  n = ((n & 0x00FF) << 8) | ((n & 0xFF00) >>  8);   // swap bytes
+  return n;
+}
+
+stbi_inline static int stbi__bit_reverse(int v, int bits)
+{
+   int reversed16;
+   STBI_ASSERT(bits <= 16);
+   reversed16 = stbi__bitreverse16(v); // reverse as a full 16-bit field first...
+   return reversed16 >> (16-bits);     // ...then shift away the unused low bits (e.g. 11 bits: shift away 5)
+}
+
+static int stbi__zbuild_huffman(stbi__zhuffman *z, const stbi_uc *sizelist, int num)
+{
+   int i,k=0; // k: running count of symbols with shorter codes (start index for each length)
+   int code, next_code[16], sizes[17];
+
+   // DEFLATE spec for generating codes
+   memset(sizes, 0, sizeof(sizes));
+   memset(z->fast, 0, sizeof(z->fast));
+   for (i=0; i < num; ++i)
+      ++sizes[sizelist[i]]; // histogram of code lengths
+   sizes[0] = 0; // length 0 marks an unused symbol (skipped below), so it is not counted
+   for (i=1; i < 16; ++i)
+      if (sizes[i] > (1 << i)) // more codes of length i than i bits can express
+         return stbi__err("bad sizes", "Corrupt PNG");
+   code = 0;
+   for (i=1; i < 16; ++i) {
+      next_code[i] = code;
+      z->firstcode[i] = (stbi__uint16) code;
+      z->firstsymbol[i] = (stbi__uint16) k;
+      code = (code + sizes[i]);
+      if (sizes[i])
+         if (code-1 >= (1 << i)) return stbi__err("bad codelengths","Corrupt PNG");
+      z->maxcode[i] = code << (16-i); // preshift for inner loop
+      code <<= 1;
+      k += sizes[i];
+   }
+   z->maxcode[16] = 0x10000; // sentinel
+   for (i=0; i < num; ++i) { // second pass: give each used symbol its code and fill the lookup tables
+      int s = sizelist[i];
+      if (s) {
+         int c = next_code[s] - z->firstcode[s] + z->firstsymbol[s];
+         stbi__uint16 fastv = (stbi__uint16) ((s << 9) | i); // packed fast-table entry: length above bit 9, symbol below
+         z->size [c] = (stbi_uc     ) s;
+         z->value[c] = (stbi__uint16) i;
+         if (s <= STBI__ZFAST_BITS) {
+            int j = stbi__bit_reverse(next_code[s],s);
+            while (j < (1 << STBI__ZFAST_BITS)) { // replicate into every fast slot whose low s bits equal the bit-reversed code
+               z->fast[j] = fastv;
+               j += (1 << s);
+            }
+         }
+         ++next_code[s];
+      }
+   }
+   return 1;
+}
+
+// zlib-from-memory implementation for PNG reading
+//    because PNG allows splitting the zlib stream arbitrarily,
+//    and it's annoying structurally to have PNG call ZLIB call PNG,
+//    we require PNG read all the IDATs and combine them into a single
+//    memory buffer
+
+typedef struct
+{
+   stbi_uc *zbuffer, *zbuffer_end; // input read cursor and the end of the input
+   int num_bits; // number of valid bits currently held in code_buffer
+   stbi__uint32 code_buffer; // bit reservoir; bits are consumed from the least significant end
+
+   char *zout; // output write cursor
+   char *zout_start; // start of the output buffer
+   char *zout_end; // end of the current output capacity
+   int   z_expandable; // nonzero if stbi__zexpand may realloc the output buffer
+
+   stbi__zhuffman z_length, z_distance; // z_length decodes literal/length symbols; z_distance presumably the distance codes
+} stbi__zbuf;
+
+stbi_inline static int stbi__zeof(stbi__zbuf *z)
+{
+   return !(z->zbuffer < z->zbuffer_end); // 1 once the read cursor has reached (or passed) the end of input
+}
+
+stbi_inline static stbi_uc stbi__zget8(stbi__zbuf *z)
+{
+   return (z->zbuffer < z->zbuffer_end) ? *z->zbuffer++ : 0; // past the end: yield 0 and leave the cursor alone
+}
+
+static void stbi__fill_bits(stbi__zbuf *z)
+{
+   // top up the bit buffer one byte at a time; at least one byte is attempted,
+   // and filling stops as soon as more than 24 bits are held
+   for (;;) {
+      if (z->code_buffer >= (1U << z->num_bits)) { z->zbuffer = z->zbuffer_end; return; } /* treat this as EOF so we fail. */
+      z->code_buffer |= (unsigned int) stbi__zget8(z) << z->num_bits;
+      z->num_bits += 8;
+      if (z->num_bits > 24) break;
+   }
+}
+
+stbi_inline static unsigned int stbi__zreceive(stbi__zbuf *z, int n)
+{
+   unsigned int bits;
+   if (n > z->num_bits) stbi__fill_bits(z); // refill when fewer than n bits are buffered
+   bits = z->code_buffer & ((1 << n) - 1);  // take the low n bits...
+   z->num_bits -= n;
+   z->code_buffer >>= n;                    // ...and consume them
+   return bits;
+}
+
+static int stbi__zhuffman_decode_slowpath(stbi__zbuf *a, stbi__zhuffman *z)
+{
+   int len, idx, msb_first;
+   // the fast table missed, so search the per-length limits the way the jpeg
+   // decoder does; that needs the next 16 bits with the first-read bit on top
+   msb_first = stbi__bit_reverse(a->code_buffer, 16);
+   len = STBI__ZFAST_BITS+1;
+   while (msb_first >= z->maxcode[len])
+      ++len;   // terminates: maxcode[16] is a sentinel above any 16-bit value
+   if (len >= 16) return -1; // invalid code!
+   // code size is len, so:
+   idx = (msb_first >> (16-len)) - z->firstcode[len] + z->firstsymbol[len];
+   if (idx >= STBI__ZNSYMS) return -1; // some data was corrupt somewhere!
+   if (z->size[idx] != len) return -1;  // was originally an assert, but report failure instead.
+   a->num_bits -= len;
+   a->code_buffer >>= len;
+   return z->value[idx];
+}
+
+stbi_inline static int stbi__zhuffman_decode(stbi__zbuf *a, stbi__zhuffman *z)
+{
+   int entry, len;
+   // keep at least 16 bits buffered before peeking; needing a refill when the
+   // input is already exhausted is treated as an error
+   if (a->num_bits < 16) {
+      if (stbi__zeof(a)) return -1;   /* report error for unexpected end of data. */
+      stbi__fill_bits(a);
+   }
+   entry = z->fast[a->code_buffer & STBI__ZFAST_MASK];
+   if (entry == 0) // not resolved by the fast table
+      return stbi__zhuffman_decode_slowpath(a, z);
+   // a fast-table entry packs the code length above bit 9 and the symbol in the low 9 bits
+   len = entry >> 9;
+   a->num_bits -= len;
+   a->code_buffer >>= len;
+   return entry & 511;
+}
+
+static int stbi__zexpand(stbi__zbuf *z, char *zout, int n)  // need to make room for n bytes; returns 1 on success, 0 (via stbi__err) on failure
+{
+   char *grown;
+   unsigned int used, cap, old_cap;
+   z->zout = zout; // record the caller's write cursor first, even if growing fails below
+   if (!z->z_expandable) return stbi__err("output buffer limit","Corrupt PNG");
+   used = (unsigned int) (z->zout - z->zout_start);
+   cap  = old_cap = (unsigned) (z->zout_end - z->zout_start);
+   if (UINT_MAX - used < (unsigned) n) return stbi__err("outofmem", "Out of memory");
+   while (used + n > cap) {
+      if(cap > UINT_MAX / 2) return stbi__err("outofmem", "Out of memory");
+      cap = cap ? cap * 2 : 1; // doubling 0 never grows (the loop would spin forever), so an empty buffer starts at 1 byte
+   }
+   grown = (char *) STBI_REALLOC_SIZED(z->zout_start, old_cap, cap);
+   STBI_NOTUSED(old_cap);
+   if (grown == NULL) return stbi__err("outofmem", "Out of memory"); // z->zout_start is left pointing at the old buffer
+   z->zout_start = grown;
+   z->zout       = grown + used;
+   z->zout_end   = grown + cap;
+   return 1;
+}
+
+static const int stbi__zlength_base[31] = { // base match length, indexed by (length symbol - 257)
+   3,4,5,6,7,8,9,10,11,13,
+   15,17,19,23,27,31,35,43,51,59,
+   67,83,99,115,131,163,195,227,258,0,0 };
+
+static const int stbi__zlength_extra[31]= // count of extra bits read and added to the base length
+{ 0,0,0,0,0,0,0,0,1,1,1,1,2,2,2,2,3,3,3,3,4,4,4,4,5,5,5,5,0,0,0 };
+
+static const int stbi__zdist_base[32] = { 1,2,3,4,5,7,9,13,17,25,33,49,65,97,129,193, // base match distance, indexed by distance symbol
+257,385,513,769,1025,1537,2049,3073,4097,6145,8193,12289,16385,24577,0,0};
+
+static const int stbi__zdist_extra[32] = // extra distance bits; only 30 values are listed, so entries 30 and 31 are zero-initialized
+{ 0,0,0,0,1,1,2,2,3,3,4,4,5,5,6,6,7,7,8,8,9,9,10,10,11,11,12,12,13,13};
+
+// Decode one huffman-coded block into the output buffer using a->z_length / a->z_distance.
+// Returns 1 once the end-of-block symbol (256) is read; a failure value on corrupt data or failed growth.
+static int stbi__parse_huffman_block(stbi__zbuf *a)
+{
+   char *zout = a->zout;
+   for(;;) {
+      int z = stbi__zhuffman_decode(a, &a->z_length);
+      if (z < 256) {
+         if (z < 0) return stbi__err("bad huffman code","Corrupt PNG"); // error in huffman codes
+         if (zout >= a->zout_end) {
+            if (!stbi__zexpand(a, zout, 1)) return 0;
+            zout = a->zout;
+         }
+         *zout++ = (char) z;
+      } else {
+         stbi_uc *p;
+         int len,dist;
+         if (z == 256) { a->zout = zout; return 1; } // end of block: publish the write cursor
+         if (z >= 286) return stbi__err("bad huffman code","Corrupt PNG"); // length symbols 286/287 never occur in valid DEFLATE data
+         z -= 257;
+         len = stbi__zlength_base[z];
+         if (stbi__zlength_extra[z]) len += stbi__zreceive(a, stbi__zlength_extra[z]);
+         z = stbi__zhuffman_decode(a, &a->z_distance);
+         if (z < 0 || z >= 30) return stbi__err("bad huffman code","Corrupt PNG"); // symbols 30/31 are invalid; their base of 0 would copy from unwritten output
+         dist = stbi__zdist_base[z];
+         if (stbi__zdist_extra[z]) dist += stbi__zreceive(a, stbi__zdist_extra[z]);
+         if (zout - a->zout_start < dist) return stbi__err("bad dist","Corrupt PNG");
+         if (zout + len > a->zout_end) {
+            if (!stbi__zexpand(a, zout, len)) return 0;
+            zout = a->zout;
+         }
+         p = (stbi_uc *) (zout - dist);
+         if (dist == 1) { // run of one byte; common in images.
+            stbi_uc v = *p;
+            if (len) { do *zout++ = v; while (--len); }
+         } else {
+            if (len) { do *zout++ = *p++; while (--len); }
+         }
+      }
+   }
+}
+
+static int stbi__compute_huffman_codes(stbi__zbuf *a)
+{  // reads the transmitted code lengths of a block and builds a->z_length / a->z_distance from them
+   static const stbi_uc length_dezigzag[19] = { 16,17,18,0,8,7,9,6,10,5,11,4,12,3,13,2,14,1,15 }; // order in which the code-length sizes arrive
+   stbi__zhuffman z_codelength;
+   stbi_uc lencodes[286+32+137];//padding for maximum single op
+   stbi_uc codelength_sizes[19];
+   int i,n;
+
+   int hlit  = stbi__zreceive(a,5) + 257; // how many entries of lencodes feed z_length
+   int hdist = stbi__zreceive(a,5) + 1;   // how many following entries feed z_distance
+   int hclen = stbi__zreceive(a,4) + 4;   // how many 3-bit code-length sizes follow
+   int ntot  = hlit + hdist;
+
+   memset(codelength_sizes, 0, sizeof(codelength_sizes)); // sizes that are not transmitted stay 0
+   for (i=0; i < hclen; ++i) {
+      int s = stbi__zreceive(a,3);
+      codelength_sizes[length_dezigzag[i]] = (stbi_uc) s;
+   }
+   if (!stbi__zbuild_huffman(&z_codelength, codelength_sizes, 19)) return 0;
+
+   n = 0;
+   while (n < ntot) {
+      int c = stbi__zhuffman_decode(a, &z_codelength);
+      if (c < 0 || c >= 19) return stbi__err("bad codelengths", "Corrupt PNG");
+      if (c < 16)
+         lencodes[n++] = (stbi_uc) c; // 0..15: a literal code length
+      else {
+         stbi_uc fill = 0;
+         if (c == 16) { // repeat the previous length 3..6 times
+            c = stbi__zreceive(a,2)+3;
+            if (n == 0) return stbi__err("bad codelengths", "Corrupt PNG"); // nothing to repeat yet
+            fill = lencodes[n-1];
+         } else if (c == 17) { // run of 3..10 zero lengths
+            c = stbi__zreceive(a,3)+3;
+         } else if (c == 18) { // run of 11..138 zero lengths
+            c = stbi__zreceive(a,7)+11;
+         } else {
+            return stbi__err("bad codelengths", "Corrupt PNG");
+         }
+         if (ntot - n < c) return stbi__err("bad codelengths", "Corrupt PNG"); // run would pass the announced total
+         memset(lencodes+n, fill, c);
+         n += c;
+      }
+   }
+   if (n != ntot) return stbi__err("bad codelengths","Corrupt PNG");
+   if (!stbi__zbuild_huffman(&a->z_length, lencodes, hlit)) return 0;
+   if (!stbi__zbuild_huffman(&a->z_distance, lencodes+hlit, hdist)) return 0;
+   return 1;
+}
+
+static int stbi__parse_uncompressed_block(stbi__zbuf *a)
+{
+   stbi_uc hdr[4];
+   int size, size_check, filled = 0;
+   int partial = a->num_bits & 7;
+   // throw away the bits left over from the current partial byte
+   if (partial) stbi__zreceive(a, partial);
+   // whole bytes already sitting in the bit buffer are the start of the header
+   for (; a->num_bits > 0; a->num_bits -= 8) {
+      hdr[filled++] = (stbi_uc) (a->code_buffer & 255); // suppress MSVC run-time check
+      a->code_buffer >>= 8;
+   }
+   if (a->num_bits < 0) return stbi__err("zlib corrupt","Corrupt PNG");
+   // the remaining header bytes come straight from the input
+   for (; filled < 4; ++filled)
+      hdr[filled] = stbi__zget8(a);
+   size       = hdr[1] * 256 + hdr[0];
+   size_check = hdr[3] * 256 + hdr[2];
+   // the second 16-bit field must be the bitwise complement of the first
+   if (size_check != (size ^ 0xffff)) return stbi__err("zlib corrupt","Corrupt PNG");
+   if (a->zbuffer + size > a->zbuffer_end) return stbi__err("read past buffer","Corrupt PNG");
+   if (a->zout + size > a->zout_end)
+      if (!stbi__zexpand(a, a->zout, size)) return 0;
+   memcpy(a->zout, a->zbuffer, size);
+   a->zout += size;
+   a->zbuffer += size;
+   return 1;
+}
+
+static int stbi__parse_zlib_header(stbi__zbuf *a)
+{
+   int cmf, flg;
+   // the stream opens with two bytes, CMF then FLG; cinfo (cmf >> 4) is not needed
+   cmf = stbi__zget8(a);
+   flg = stbi__zget8(a);
+   if (stbi__zeof(a)) return stbi__err("bad zlib header","Corrupt PNG"); // zlib spec
+   if ((cmf*256+flg) % 31 != 0) return stbi__err("bad zlib header","Corrupt PNG"); // zlib spec
+   if (flg & 32) return stbi__err("no preset dict","Corrupt PNG"); // preset dictionary not allowed in png
+   if ((cmf & 15) != 8) return stbi__err("bad compression","Corrupt PNG"); // DEFLATE required for png
+   // the window size, 1 << (8 + cinfo), is ignored because the output is fully buffered
+   return 1;
+}
+
+static const stbi_uc stbi__zdefault_length[STBI__ZNSYMS] = // code lengths used to build z_length for block type 1
+{
+   8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,8, 8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,
+   8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,8, 8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,
+   8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,8, 8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,
+   8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,8, 8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,
+   8,8,8,8,8,8,8,8,8,8,8,8,8,8,8,8, 9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,
+   9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9, 9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,
+   9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9, 9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,
+   9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9, 9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,
+   7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7, 7,7,7,7,7,7,7,7,8,8,8,8,8,8,8,8
+};
+static const stbi_uc stbi__zdefault_distance[32] = // code lengths used to build z_distance for block type 1
+{
+   5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5,5
+};
+/*
+Init algorithm:
+{
+   int i;   // use <= to match clearly with spec
+   for (i=0; i <= 143; ++i)     stbi__zdefault_length[i]   = 8;
+   for (   ; i <= 255; ++i)     stbi__zdefault_length[i]   = 9;
+   for (   ; i <= 279; ++i)     stbi__zdefault_length[i]   = 7;
+   for (   ; i <= 287; ++i)     stbi__zdefault_length[i]   = 8;
+
+   for (i=0; i <=  31; ++i)     stbi__zdefault_distance[i] = 5;
+}
+*/
+
+static int stbi__parse_zlib(stbi__zbuf *a, int parse_header)
+{
+   int last, btype;
+   if (parse_header && !stbi__parse_zlib_header(a)) return 0;
+   a->num_bits = 0;
+   a->code_buffer = 0;
+   do {
+      last  = stbi__zreceive(a,1);   // non-zero on the last block of the stream
+      btype = stbi__zreceive(a,2);
+      switch (btype) {
+         case 0:   // uncompressed block
+            if (!stbi__parse_uncompressed_block(a)) return 0;
+            continue;
+         case 3:   // not an accepted block type
+            return 0;
+         case 1:   // use fixed code lengths
+            if (!stbi__zbuild_huffman(&a->z_length  , stbi__zdefault_length  , STBI__ZNSYMS)) return 0;
+            if (!stbi__zbuild_huffman(&a->z_distance, stbi__zdefault_distance,  32)) return 0;
+            break;
+         default:  // 2: code lengths are read from the stream
+            if (!stbi__compute_huffman_codes(a)) return 0;
+            break;
+      }
+      if (!stbi__parse_huffman_block(a)) return 0;
+   } while (!last);
+   return 1;
+}
+
+static int stbi__do_zlib(stbi__zbuf *a, char *obuf, int olen, int exp, int parse_header)
+{
+   // aim the output cursors at the caller's buffer, record whether it may grow, then inflate
+   a->z_expandable = exp;
+   a->zout_start   = obuf;
+   a->zout_end     = obuf + olen;
+   a->zout         = a->zout_start;
+   return stbi__parse_zlib(a, parse_header);
+}
+
+STBIDEF char *stbi_zlib_decode_malloc_guesssize(const char *buffer, int len, int initial_size, int *outlen)
+{
+   stbi__zbuf zb;
+   char *out = (char *) stbi__malloc(initial_size);
+   if (!out) return NULL;
+   zb.zbuffer     = (stbi_uc *) buffer;
+   zb.zbuffer_end = zb.zbuffer + len;
+   // expandable output of initial_size bytes; a zlib header is parsed first
+   if (!stbi__do_zlib(&zb, out, initial_size, 1, 1)) {
+      STBI_FREE(zb.zout_start); // the buffer may have been reallocated, so free the current one
+      return NULL;
+   }
+   if (outlen) *outlen = (int) (zb.zout - zb.zout_start);
+   return zb.zout_start;
+}
+
+STBIDEF char *stbi_zlib_decode_malloc(char const *buffer, int len, int *outlen)
+{  // same as stbi_zlib_decode_malloc_guesssize with an initial output size of 16384 bytes
+   return stbi_zlib_decode_malloc_guesssize(buffer, len, 16384, outlen);
+}
+
+STBIDEF char *stbi_zlib_decode_malloc_guesssize_headerflag(const char *buffer, int len, int initial_size, int *outlen, int parse_header)
+{
+   stbi__zbuf zb;
+   char *out = (char *) stbi__malloc(initial_size);
+   if (!out) return NULL;
+   zb.zbuffer     = (stbi_uc *) buffer;
+   zb.zbuffer_end = zb.zbuffer + len;
+   // expandable output; parse_header selects whether a zlib header is parsed first
+   if (!stbi__do_zlib(&zb, out, initial_size, 1, parse_header)) {
+      STBI_FREE(zb.zout_start); // the buffer may have been reallocated, so free the current one
+      return NULL;
+   }
+   if (outlen) *outlen = (int) (zb.zout - zb.zout_start);
+   return zb.zout_start;
+}
+
+STBIDEF int stbi_zlib_decode_buffer(char *obuffer, int olen, char const *ibuffer, int ilen)
+{
+   stbi__zbuf zb;
+   zb.zbuffer     = (stbi_uc *) ibuffer;
+   zb.zbuffer_end = zb.zbuffer + ilen;
+   // caller-owned output that may not grow; a zlib header is parsed first
+   if (!stbi__do_zlib(&zb, obuffer, olen, 0, 1))
+      return -1;
+   return (int) (zb.zout - zb.zout_start); // number of bytes written
+}
+
+STBIDEF char *stbi_zlib_decode_noheader_malloc(char const *buffer, int len, int *outlen)
+{
+   stbi__zbuf zb;
+   char *out = (char *) stbi__malloc(16384);
+   if (!out) return NULL;
+   zb.zbuffer     = (stbi_uc *) buffer;
+   zb.zbuffer_end = zb.zbuffer + len;
+   // expandable output starting at 16384 bytes; no zlib header is parsed
+   if (!stbi__do_zlib(&zb, out, 16384, 1, 0)) {
+      STBI_FREE(zb.zout_start); // the buffer may have been reallocated, so free the current one
+      return NULL;
+   }
+   if (outlen) *outlen = (int) (zb.zout - zb.zout_start);
+   return zb.zout_start;
+}
+
+STBIDEF int stbi_zlib_decode_noheader_buffer(char *obuffer, int olen, const char *ibuffer, int ilen)
+{
+   stbi__zbuf zb;
+   zb.zbuffer     = (stbi_uc *) ibuffer;
+   zb.zbuffer_end = zb.zbuffer + ilen;
+   // caller-owned output that may not grow; no zlib header is parsed
+   if (!stbi__do_zlib(&zb, obuffer, olen, 0, 0))
+      return -1;
+   return (int) (zb.zout - zb.zout_start); // number of bytes written
+}
+#endif
+
+// public domain "baseline" PNG decoder   v0.10  Sean Barrett 2006-11-18
+//    simple implementation
+//      - only 8-bit samples
+//      - no CRC checking
+//      - allocates lots of intermediate memory
+//        - avoids problem of streaming data between subsystems
+//        - avoids explicit window management
+//    performance
+//      - uses stb_zlib, a PD zlib implementation with fast huffman decoding
+
+#ifndef STBI_NO_PNG
+typedef struct
+{
+   stbi__uint32 length; // first big-endian 32-bit field of a chunk header
+   stbi__uint32 type;   // second big-endian 32-bit field; matched against STBI__PNG_TYPE(...) tags
+} stbi__pngchunk;
+
+static stbi__pngchunk stbi__get_chunk_header(stbi__context *s)
+{
+   stbi__pngchunk hdr;
+   hdr.length = stbi__get32be(s); // read order matters: length comes before type in the stream
+   hdr.type   = stbi__get32be(s);
+   return hdr;
+}
+
+static int stbi__check_png_header(stbi__context *s)
+{
+   static const stbi_uc png_sig[8] = { 137,80,78,71,13,10,26,10 }; // the 8 bytes every accepted file starts with
+   const stbi_uc *want = png_sig;
+   while (want != png_sig + 8)
+      if (stbi__get8(s) != *want++) return stbi__err("bad png sig","Not a PNG");
+   return 1;
+}
+
+typedef struct
+{
+   stbi__context *s;                // input stream plus image info (img_x, img_y, img_n)
+   stbi_uc *idata, *expanded, *out; // out: decoded pixel buffer. NOTE(review): idata/expanded presumably hold raw IDAT bytes and their inflated form - confirm
+   int depth;                       // bit depth read from IHDR (1, 2, 4, 8 or 16)
+} stbi__png;
+
+
+enum { // scanline filter kinds; values 0..4 are the filter byte found at the start of each raw scanline
+   STBI__F_none=0,
+   STBI__F_sub=1,
+   STBI__F_up=2,
+   STBI__F_avg=3,
+   STBI__F_paeth=4,
+   // synthetic filters used for first scanline to avoid needing a dummy row of 0s
+   STBI__F_avg_first,
+   STBI__F_paeth_first
+};
+
+static stbi_uc first_row_filter[5] = // maps a stream filter byte (0..4) to the filter applied on row 0, which has no row above it
+{
+   STBI__F_none,
+   STBI__F_sub,
+   STBI__F_none,        // "up" on row 0 becomes "none"
+   STBI__F_avg_first,
+   STBI__F_paeth_first
+};
+
+static int stbi__paeth(int a, int b, int c)
+{
+   int est = a + b - c;
+   int da = abs(est-a);
+   int db = abs(est-b);
+   int dc = abs(est-c);
+   // the input closest to the estimate wins; ties go to a, then b, then c
+   if (da <= db && da <= dc) return a;
+   return (db <= dc) ? b : c;
+}
+
+static const stbi_uc stbi__depth_scale_table[9] = { 0, 0xff, 0x55, 0, 0x11, 0,0,0, 0x01 }; // indexed by bit depth: multiplier applied to unpacked grayscale samples to reach 0..255
+
+// create the png data from post-deflated data: unfilters 'raw' row by row into a newly allocated a->out (out_n components per pixel), then unpacks sub-8-bit samples or byte-swaps 16-bit ones
+static int stbi__create_png_image_raw(stbi__png *a, stbi_uc *raw, stbi__uint32 raw_len, int out_n, stbi__uint32 x, stbi__uint32 y, int depth, int color)
+{
+   int bytes = (depth == 16? 2 : 1); // bytes per sample in the output
+   stbi__context *s = a->s;
+   stbi__uint32 i,j,stride = x*out_n*bytes; // stride: bytes per output row
+   stbi__uint32 img_len, img_width_bytes;
+   int k;
+   int img_n = s->img_n; // copy it into a local for later
+
+   int output_bytes = out_n*bytes; // bytes per output pixel
+   int filter_bytes = img_n*bytes; // bytes per input pixel; also the distance the filters look back
+   int width = x;
+
+   STBI_ASSERT(out_n == s->img_n || out_n == s->img_n+1);
+   a->out = (stbi_uc *) stbi__malloc_mad3(x, y, output_bytes, 0); // extra bytes to write off the end into (NOTE(review): the last argument is 0 here - confirm whether any slack is actually requested)
+   if (!a->out) return stbi__err("outofmem", "Out of memory");
+
+   if (!stbi__mad3sizes_valid(img_n, x, depth, 7)) return stbi__err("too large", "Corrupt PNG");
+   img_width_bytes = (((img_n * x * depth) + 7) >> 3); // packed bytes per input row, rounded up
+   img_len = (img_width_bytes + 1) * y;                // each input row also carries one filter byte
+
+   // we used to check for exact match between raw_len and img_len on non-interlaced PNGs,
+   // but issue #276 reported a PNG in the wild that had extra data at the end (all zeros),
+   // so just check for raw_len < img_len always.
+   if (raw_len < img_len) return stbi__err("not enough pixels","Corrupt PNG");
+
+   for (j=0; j < y; ++j) {
+      stbi_uc *cur = a->out + stride*j;
+      stbi_uc *prior;
+      int filter = *raw++; // filter byte that starts this input row
+
+      if (filter > 4)
+         return stbi__err("invalid filter","Corrupt PNG");
+
+      if (depth < 8) {
+         if (img_width_bytes > x) return stbi__err("invalid width","Corrupt PNG");
+         cur += x*out_n - img_width_bytes; // store output to the rightmost img_len bytes, so we can decode in place
+         filter_bytes = 1;        // packed rows are filtered one byte at a time
+         width = img_width_bytes; // so the row "width" is counted in bytes
+      }
+      prior = cur - stride; // bugfix: need to compute this after 'cur +=' computation above
+
+      // if first row, use special filter that doesn't sample previous row
+      if (j == 0) filter = first_row_filter[filter];
+
+      // handle first byte explicitly
+      for (k=0; k < filter_bytes; ++k) {
+         switch (filter) {
+            case STBI__F_none       : cur[k] = raw[k]; break;
+            case STBI__F_sub        : cur[k] = raw[k]; break;
+            case STBI__F_up         : cur[k] = STBI__BYTECAST(raw[k] + prior[k]); break;
+            case STBI__F_avg        : cur[k] = STBI__BYTECAST(raw[k] + (prior[k]>>1)); break;
+            case STBI__F_paeth      : cur[k] = STBI__BYTECAST(raw[k] + stbi__paeth(0,prior[k],0)); break;
+            case STBI__F_avg_first  : cur[k] = raw[k]; break;
+            case STBI__F_paeth_first: cur[k] = raw[k]; break;
+         }
+      }
+
+      if (depth == 8) {
+         if (img_n != out_n)
+            cur[img_n] = 255; // first pixel
+         raw += img_n;
+         cur += out_n;
+         prior += out_n;
+      } else if (depth == 16) {
+         if (img_n != out_n) {
+            cur[filter_bytes]   = 255; // first pixel top byte
+            cur[filter_bytes+1] = 255; // first pixel bottom byte
+         }
+         raw += filter_bytes;
+         cur += output_bytes;
+         prior += output_bytes;
+      } else {
+         raw += 1;
+         cur += 1;
+         prior += 1;
+      }
+
+      // this is a little gross, so that we don't switch per-pixel or per-component
+      if (depth < 8 || img_n == out_n) {
+         int nk = (width - 1)*filter_bytes; // bytes left in the row after the first pixel/byte
+         #define STBI__CASE(f) \
+             case f:     \
+                for (k=0; k < nk; ++k)
+         switch (filter) {
+            // "none" filter turns into a memcpy here; make that explicit.
+            case STBI__F_none:         memcpy(cur, raw, nk); break;
+            STBI__CASE(STBI__F_sub)          { cur[k] = STBI__BYTECAST(raw[k] + cur[k-filter_bytes]); } break;
+            STBI__CASE(STBI__F_up)           { cur[k] = STBI__BYTECAST(raw[k] + prior[k]); } break;
+            STBI__CASE(STBI__F_avg)          { cur[k] = STBI__BYTECAST(raw[k] + ((prior[k] + cur[k-filter_bytes])>>1)); } break;
+            STBI__CASE(STBI__F_paeth)        { cur[k] = STBI__BYTECAST(raw[k] + stbi__paeth(cur[k-filter_bytes],prior[k],prior[k-filter_bytes])); } break;
+            STBI__CASE(STBI__F_avg_first)    { cur[k] = STBI__BYTECAST(raw[k] + (cur[k-filter_bytes] >> 1)); } break;
+            STBI__CASE(STBI__F_paeth_first)  { cur[k] = STBI__BYTECAST(raw[k] + stbi__paeth(cur[k-filter_bytes],0,0)); } break;
+         }
+         #undef STBI__CASE
+         raw += nk;
+      } else {
+         STBI_ASSERT(img_n+1 == out_n);
+         #define STBI__CASE(f) \
+             case f:     \
+                for (i=x-1; i >= 1; --i, cur[filter_bytes]=255,raw+=filter_bytes,cur+=output_bytes,prior+=output_bytes) \
+                   for (k=0; k < filter_bytes; ++k)
+         switch (filter) {
+            STBI__CASE(STBI__F_none)         { cur[k] = raw[k]; } break;
+            STBI__CASE(STBI__F_sub)          { cur[k] = STBI__BYTECAST(raw[k] + cur[k- output_bytes]); } break;
+            STBI__CASE(STBI__F_up)           { cur[k] = STBI__BYTECAST(raw[k] + prior[k]); } break;
+            STBI__CASE(STBI__F_avg)          { cur[k] = STBI__BYTECAST(raw[k] + ((prior[k] + cur[k- output_bytes])>>1)); } break;
+            STBI__CASE(STBI__F_paeth)        { cur[k] = STBI__BYTECAST(raw[k] + stbi__paeth(cur[k- output_bytes],prior[k],prior[k- output_bytes])); } break;
+            STBI__CASE(STBI__F_avg_first)    { cur[k] = STBI__BYTECAST(raw[k] + (cur[k- output_bytes] >> 1)); } break;
+            STBI__CASE(STBI__F_paeth_first)  { cur[k] = STBI__BYTECAST(raw[k] + stbi__paeth(cur[k- output_bytes],0,0)); } break;
+         }
+         #undef STBI__CASE
+
+         // the loop above sets the high byte of the pixels' alpha, but for
+         // 16 bit png files we also need the low byte set. we'll do that here.
+         if (depth == 16) {
+            cur = a->out + stride*j; // start at the beginning of the row again
+            for (i=0; i < x; ++i,cur+=output_bytes) {
+               cur[filter_bytes+1] = 255;
+            }
+         }
+      }
+   }
+
+   // we make a separate pass to expand bits to pixels; for performance,
+   // this could run two scanlines behind the above code, so it won't
+   // interfere with filtering but will still be in the cache.
+   if (depth < 8) {
+      for (j=0; j < y; ++j) {
+         stbi_uc *cur = a->out + stride*j;
+         stbi_uc *in  = a->out + stride*j + x*out_n - img_width_bytes; // packed data sits right-aligned in the row
+         // unpack 1/2/4-bit into a 8-bit buffer. allows us to keep the common 8-bit path optimal at minimal cost for 1/2/4-bit
+         // png guarantees byte alignment, if width is not multiple of 8/4/2 we'll decode dummy trailing data that will be skipped in the later loop
+         stbi_uc scale = (color == 0) ? stbi__depth_scale_table[depth] : 1; // scale grayscale values to 0..255 range
+
+         // note that the final byte might overshoot and write more data than desired.
+         // we can allocate enough data that this never writes out of memory, but it
+         // could also overwrite the next scanline. can it overwrite non-empty data
+         // on the next scanline? yes, consider 1-pixel-wide scanlines with 1-bit-per-pixel.
+         // so we need to explicitly clamp the final ones
+
+         if (depth == 4) {
+            for (k=x*img_n; k >= 2; k-=2, ++in) {
+               *cur++ = scale * ((*in >> 4)       );
+               *cur++ = scale * ((*in     ) & 0x0f);
+            }
+            if (k > 0) *cur++ = scale * ((*in >> 4)       );
+         } else if (depth == 2) {
+            for (k=x*img_n; k >= 4; k-=4, ++in) {
+               *cur++ = scale * ((*in >> 6)       );
+               *cur++ = scale * ((*in >> 4) & 0x03);
+               *cur++ = scale * ((*in >> 2) & 0x03);
+               *cur++ = scale * ((*in     ) & 0x03);
+            }
+            if (k > 0) *cur++ = scale * ((*in >> 6)       );
+            if (k > 1) *cur++ = scale * ((*in >> 4) & 0x03);
+            if (k > 2) *cur++ = scale * ((*in >> 2) & 0x03);
+         } else if (depth == 1) {
+            for (k=x*img_n; k >= 8; k-=8, ++in) {
+               *cur++ = scale * ((*in >> 7)       );
+               *cur++ = scale * ((*in >> 6) & 0x01);
+               *cur++ = scale * ((*in >> 5) & 0x01);
+               *cur++ = scale * ((*in >> 4) & 0x01);
+               *cur++ = scale * ((*in >> 3) & 0x01);
+               *cur++ = scale * ((*in >> 2) & 0x01);
+               *cur++ = scale * ((*in >> 1) & 0x01);
+               *cur++ = scale * ((*in     ) & 0x01);
+            }
+            if (k > 0) *cur++ = scale * ((*in >> 7)       );
+            if (k > 1) *cur++ = scale * ((*in >> 6) & 0x01);
+            if (k > 2) *cur++ = scale * ((*in >> 5) & 0x01);
+            if (k > 3) *cur++ = scale * ((*in >> 4) & 0x01);
+            if (k > 4) *cur++ = scale * ((*in >> 3) & 0x01);
+            if (k > 5) *cur++ = scale * ((*in >> 2) & 0x01);
+            if (k > 6) *cur++ = scale * ((*in >> 1) & 0x01);
+         }
+         if (img_n != out_n) {
+            int q;
+            // insert alpha = 255
+            cur = a->out + stride*j;
+            if (img_n == 1) {
+               for (q=x-1; q >= 0; --q) { // back to front, so source samples are read before being overwritten
+                  cur[q*2+1] = 255;
+                  cur[q*2+0] = cur[q];
+               }
+            } else {
+               STBI_ASSERT(img_n == 3);
+               for (q=x-1; q >= 0; --q) { // back to front, so source samples are read before being overwritten
+                  cur[q*4+3] = 255;
+                  cur[q*4+2] = cur[q*3+2];
+                  cur[q*4+1] = cur[q*3+1];
+                  cur[q*4+0] = cur[q*3+0];
+               }
+            }
+         }
+      }
+   } else if (depth == 16) {
+      // force the image data from big-endian to platform-native.
+      // this is done in a separate pass due to the decoding relying
+      // on the data being untouched, but could probably be done
+      // per-line during decode if care is taken.
+      stbi_uc *cur = a->out;
+      stbi__uint16 *cur16 = (stbi__uint16*)cur;
+
+      for(i=0; i < x*y*out_n; ++i,cur16++,cur+=2) {
+         *cur16 = (cur[0] << 8) | cur[1];
+      }
+   }
+
+   return 1;
+}
+
+static int stbi__create_png_image(stbi__png *a, stbi_uc *image_data, stbi__uint32 image_data_len, int out_n, int depth, int color, int interlaced)
+{
+   // per-pass start offset and step, in x and in y, for the seven interlace passes
+   static const int xorig[7] = { 0,4,0,2,0,1,0 };
+   static const int yorig[7] = { 0,0,4,0,2,0,1 };
+   static const int xspc[7]  = { 8,8,4,4,2,2,1 };
+   static const int yspc[7]  = { 8,8,8,4,4,2,2 };
+   int out_bytes = out_n * (depth == 16 ? 2 : 1);
+   stbi_uc *final;
+   int p;
+   if (!interlaced)
+      return stbi__create_png_image_raw(a, image_data, image_data_len, out_n, a->s->img_x, a->s->img_y, depth, color);
+
+   // de-interlacing: decode each pass as a small image and scatter it into 'final'
+   final = (stbi_uc *) stbi__malloc_mad3(a->s->img_x, a->s->img_y, out_bytes, 0);
+   if (!final) return stbi__err("outofmem", "Out of memory");
+   for (p=0; p < 7; ++p) {
+      int i,j,x,y;
+      stbi__uint32 img_len;
+      x = (a->s->img_x - xorig[p] + xspc[p]-1) / xspc[p]; // pass width; can be 0 for small images
+      y = (a->s->img_y - yorig[p] + yspc[p]-1) / yspc[p]; // pass height
+      if (!x || !y) continue;
+      // input bytes this pass occupies: a filter byte plus the packed row, for each row
+      img_len = ((((a->s->img_n * x * depth) + 7) >> 3) + 1) * y;
+      if (!stbi__create_png_image_raw(a, image_data, image_data_len, out_n, x, y, depth, color)) {
+         STBI_FREE(final);
+         return 0;
+      }
+      for (j=0; j < y; ++j) {
+         int out_y = j*yspc[p]+yorig[p];
+         for (i=0; i < x; ++i) {
+            int out_x = i*xspc[p]+xorig[p];
+            memcpy(final + out_y*a->s->img_x*out_bytes + out_x*out_bytes,
+                   a->out + (j*x+i)*out_bytes, out_bytes);
+         }
+      }
+      STBI_FREE(a->out);
+      image_data += img_len;
+      image_data_len -= img_len;
+   }
+   a->out = final;
+
+   return 1;
+}
+
+static int stbi__compute_transparency(stbi__png *z, stbi_uc tc[3], int out_n)
+{
+   stbi_uc *px = z->out;
+   stbi__uint32 n, total = z->s->img_x * z->s->img_y;
+
+   // colour-key transparency: pixels equal to tc become fully transparent.
+   // the 4-component path relies on alpha already being 255 in the output
+   STBI_ASSERT(out_n == 2 || out_n == 4);
+
+   if (out_n != 2) {
+      // 4 components: only matching pixels are touched
+      for (n=0; n < total; ++n, px += 4) {
+         if (px[0] != tc[0] || px[1] != tc[1] || px[2] != tc[2]) continue;
+         px[3] = 0;
+      }
+      return 1;
+   }
+   // 2 components: the second byte is rewritten for every pixel
+   for (n=0; n < total; ++n, px += 2) {
+      if (px[0] == tc[0]) px[1] = 0;
+      else                px[1] = 255;
+   }
+   return 1;
+}
+
+static int stbi__compute_transparency16(stbi__png *z, stbi__uint16 tc[3], int out_n)
+{
+   stbi__uint16 *px = (stbi__uint16*) z->out;
+   stbi__uint32 n, total = z->s->img_x * z->s->img_y;
+
+   // colour-key transparency: pixels equal to tc become fully transparent.
+   // the 4-component path relies on alpha already being 65535 in the output
+   STBI_ASSERT(out_n == 2 || out_n == 4);
+
+   if (out_n != 2) {
+      // 4 components: only matching pixels are touched
+      for (n = 0; n < total; ++n, px += 4) {
+         if (px[0] != tc[0] || px[1] != tc[1] || px[2] != tc[2]) continue;
+         px[3] = 0;
+      }
+      return 1;
+   }
+   // 2 components: the second sample is rewritten for every pixel
+   for (n = 0; n < total; ++n, px += 2) {
+      if (px[0] == tc[0]) px[1] = 0;
+      else                px[1] = 65535;
+   }
+   return 1;
+}
+
+// Replace the one-byte-per-pixel index image in a->out with a pal_img_n-component image
+// looked up from palette. pal_img_n == 3 copies three bytes per entry, anything else four.
+// Returns 1 on success; on allocation failure a->out is left untouched.
+static int stbi__expand_png_palette(stbi__png *a, stbi_uc *palette, int len, int pal_img_n)
+{
+   stbi__uint32 idx, total = a->s->img_x * a->s->img_y;
+   stbi_uc *indices = a->out;   // one palette index per pixel
+   stbi_uc *expanded, *dst;
+
+   STBI_NOTUSED(len);
+
+   expanded = (stbi_uc *) stbi__malloc_mad2(total, pal_img_n, 0);
+   if (expanded == NULL) return stbi__err("outofmem", "Out of memory");
+
+   // palette entries sit 4 bytes apart. nothing below exits early, so the
+   // new buffer cannot leak before it replaces a->out
+   dst = expanded;
+   for (idx=0; idx < total; ++idx) {
+      const stbi_uc *entry = palette + indices[idx]*4;
+      dst[0] = entry[0];
+      dst[1] = entry[1];
+      dst[2] = entry[2];
+      if (pal_img_n == 3) {
+         dst += 3;
+      } else {
+         dst[3] = entry[3];
+         dst += 4;
+      }
+   }
+
+   // drop the index image and hand over the expanded one
+   STBI_FREE(a->out);
+   a->out = expanded;
+
+   return 1;
+}
+
+static int stbi__unpremultiply_on_load_global = 0; // process-wide default; written by stbi_set_unpremultiply_on_load
+static int stbi__de_iphone_flag_global = 0;        // process-wide default; written by stbi_convert_iphone_png_to_rgb
+
+STBIDEF void stbi_set_unpremultiply_on_load(int flag_true_if_should_unpremultiply)
+{  // stores the global flag that stbi__de_iphone reads (via stbi__unpremultiply_on_load) before undoing premultiplied alpha
+   stbi__unpremultiply_on_load_global = flag_true_if_should_unpremultiply;
+}
+
+STBIDEF void stbi_convert_iphone_png_to_rgb(int flag_true_if_should_convert)
+{  // stores the global value that the stbi__de_iphone_flag macro falls back to
+   stbi__de_iphone_flag_global = flag_true_if_should_convert;
+}
+
+#ifndef STBI_THREAD_LOCAL // no thread-local storage: the flag macros are plain aliases of the globals
+#define stbi__unpremultiply_on_load  stbi__unpremultiply_on_load_global
+#define stbi__de_iphone_flag  stbi__de_iphone_flag_global
+#else // thread-local storage available: a per-thread value, once set, overrides the global
+static STBI_THREAD_LOCAL int stbi__unpremultiply_on_load_local, stbi__unpremultiply_on_load_set; // per-thread value and "has been set" marker
+static STBI_THREAD_LOCAL int stbi__de_iphone_flag_local, stbi__de_iphone_flag_set;               // per-thread value and "has been set" marker
+
+STBIDEF void stbi__unpremultiply_on_load_thread(int flag_true_if_should_unpremultiply)
+{
+   stbi__unpremultiply_on_load_local = flag_true_if_should_unpremultiply;
+   stbi__unpremultiply_on_load_set = 1; // from now on this thread ignores the global flag
+}
+
+STBIDEF void stbi_convert_iphone_png_to_rgb_thread(int flag_true_if_should_convert)
+{
+   stbi__de_iphone_flag_local = flag_true_if_should_convert;
+   stbi__de_iphone_flag_set = 1; // from now on this thread ignores the global flag
+}
+
+#define stbi__unpremultiply_on_load  (stbi__unpremultiply_on_load_set           \
+                                       ? stbi__unpremultiply_on_load_local      \
+                                       : stbi__unpremultiply_on_load_global)
+#define stbi__de_iphone_flag  (stbi__de_iphone_flag_set                         \
+                                ? stbi__de_iphone_flag_local                    \
+                                : stbi__de_iphone_flag_global)
+#endif // STBI_THREAD_LOCAL
+
+static void stbi__de_iphone(stbi__png *z)
+{
+   stbi__context *s = z->s;
+   stbi__uint32 n, total = s->img_x * s->img_y;
+   stbi_uc *px = z->out;
+   stbi_uc tmp;
+
+   if (s->img_out_n == 3) {  // convert bgr to rgb
+      for (n=0; n < total; ++n, px += 3) {
+         tmp = px[0];
+         px[0] = px[2];
+         px[2] = tmp;
+      }
+      return;
+   }
+
+   STBI_ASSERT(s->img_out_n == 4);
+   if (!stbi__unpremultiply_on_load) {
+      // convert bgr to rgb, leaving the fourth byte alone
+      for (n=0; n < total; ++n, px += 4) {
+         tmp = px[0];
+         px[0] = px[2];
+         px[2] = tmp;
+      }
+      return;
+   }
+
+   // convert bgr to rgb and unpremultiply: scale by 255/alpha, rounding to nearest
+   for (n=0; n < total; ++n, px += 4) {
+      stbi_uc alpha = px[3];
+      tmp = px[0];
+      if (alpha) {
+         stbi_uc half = alpha / 2;
+         px[0] = (px[2] * 255 + half) / alpha;
+         px[1] = (px[1] * 255 + half) / alpha;
+         px[2] = ( tmp  * 255 + half) / alpha;
+      } else {
+         px[0] = px[2];
+         px[2] = tmp;
+      }
+   }
+}
+
+#define STBI__PNG_TYPE(a,b,c,d)  (((unsigned) (a) << 24) + ((unsigned) (b) << 16) + ((unsigned) (c) << 8) + (unsigned) (d)) // packs four chunk-name characters into one 32-bit tag, first character in the top byte
+// Walks the PNG chunk stream of z->s. scan selects how far to go (STBI__SCAN_type, STBI__SCAN_header or STBI__SCAN_load). Returns 1 on success, 0 on failure.
+static int stbi__parse_png_file(stbi__png *z, int scan, int req_comp)
+{
+   stbi_uc palette[1024]={0}, pal_img_n=0; // palette is zero-filled so entries PLTE does not supply are still defined; pal_img_n: 0 = not paletted, else 3 or 4
+   stbi_uc has_trans=0, tc[3]={0};         // tc: 8-bit transparent colour key taken from tRNS
+   stbi__uint16 tc16[3];                   // same key for 16-bit images; only read when has_trans is set and depth is 16
+   stbi__uint32 ioff=0, idata_limit=0, i, pal_len=0; // ioff: IDAT bytes gathered so far; idata_limit: capacity of z->idata
+   int first=1,k,interlace=0, color=0, is_iphone=0;
+   stbi__context *s = z->s;
+   // req_comp (requested channel count) only influences the output layout chosen at IEND.
+   z->expanded = NULL;
+   z->idata = NULL;
+   z->out = NULL;
+
+   if (!stbi__check_png_header(s)) return 0;
+
+   if (scan == STBI__SCAN_type) return 1;
+
+   for (;;) {
+      stbi__pngchunk c = stbi__get_chunk_header(s);
+      switch (c.type) {
+         case STBI__PNG_TYPE('C','g','B','I'):
+            is_iphone = 1; // remembered for the zlib-header flag and the optional de-iphone pass at IEND
+            stbi__skip(s, c.length);
+            break;
+         case STBI__PNG_TYPE('I','H','D','R'): {
+            int comp,filter;
+            if (!first) return stbi__err("multiple IHDR","Corrupt PNG");
+            first = 0;
+            if (c.length != 13) return stbi__err("bad IHDR len","Corrupt PNG");
+            s->img_x = stbi__get32be(s);
+            s->img_y = stbi__get32be(s);
+            if (s->img_y > STBI_MAX_DIMENSIONS) return stbi__err("too large","Very large image (corrupt?)");
+            if (s->img_x > STBI_MAX_DIMENSIONS) return stbi__err("too large","Very large image (corrupt?)");
+            z->depth = stbi__get8(s);  if (z->depth != 1 && z->depth != 2 && z->depth != 4 && z->depth != 8 && z->depth != 16)  return stbi__err("1/2/4/8/16-bit only","PNG not supported: 1/2/4/8/16-bit only");
+            color = stbi__get8(s);  if (color > 6)         return stbi__err("bad ctype","Corrupt PNG");
+            if (color == 3 && z->depth == 16)                  return stbi__err("bad ctype","Corrupt PNG");
+            if (color == 3) pal_img_n = 3; else if (color & 1) return stbi__err("bad ctype","Corrupt PNG");
+            comp  = stbi__get8(s);  if (comp) return stbi__err("bad comp method","Corrupt PNG");
+            filter= stbi__get8(s);  if (filter) return stbi__err("bad filter method","Corrupt PNG");
+            interlace = stbi__get8(s); if (interlace>1) return stbi__err("bad interlace method","Corrupt PNG");
+            if (!s->img_x || !s->img_y) return stbi__err("0-pixel image","Corrupt PNG");
+            if (!pal_img_n) {
+               s->img_n = (color & 2 ? 3 : 1) + (color & 4 ? 1 : 0); // bit 2 of color: RGB vs grey, bit 4: alpha present
+               if ((1 << 30) / s->img_x / s->img_n < s->img_y) return stbi__err("too large", "Image too large to decode");
+               if (scan == STBI__SCAN_header) return 1;
+            } else {
+               // if paletted, then pal_n is our final components, and
+               // img_n is # components to decompress/filter.
+               s->img_n = 1;
+               if ((1 << 30) / s->img_x / 4 < s->img_y) return stbi__err("too large","Corrupt PNG");
+               // if SCAN_header, have to scan to see if we have a tRNS
+            }
+            break;
+         }
+
+         case STBI__PNG_TYPE('P','L','T','E'):  {
+            if (first) return stbi__err("first not IHDR", "Corrupt PNG");
+            if (c.length > 256*3) return stbi__err("invalid PLTE","Corrupt PNG");
+            pal_len = c.length / 3;
+            if (pal_len * 3 != c.length) return stbi__err("invalid PLTE","Corrupt PNG");
+            for (i=0; i < pal_len; ++i) { // stored as RGBA quads, alpha defaulting to opaque
+               palette[i*4+0] = stbi__get8(s);
+               palette[i*4+1] = stbi__get8(s);
+               palette[i*4+2] = stbi__get8(s);
+               palette[i*4+3] = 255;
+            }
+            break;
+         }
+
+         case STBI__PNG_TYPE('t','R','N','S'): {
+            if (first) return stbi__err("first not IHDR", "Corrupt PNG");
+            if (z->idata) return stbi__err("tRNS after IDAT","Corrupt PNG");
+            if (pal_img_n) {
+               if (scan == STBI__SCAN_header) { s->img_n = 4; return 1; }
+               if (pal_len == 0) return stbi__err("tRNS before PLTE","Corrupt PNG");
+               if (c.length > pal_len) return stbi__err("bad tRNS len","Corrupt PNG");
+               pal_img_n = 4;
+               for (i=0; i < c.length; ++i) // per-entry alpha overrides the 255 written by PLTE
+                  palette[i*4+3] = stbi__get8(s);
+            } else {
+               if (!(s->img_n & 1)) return stbi__err("tRNS with alpha","Corrupt PNG");
+               if (c.length != (stbi__uint32) s->img_n*2) return stbi__err("bad tRNS len","Corrupt PNG");
+               has_trans = 1;
+               if (z->depth == 16) {
+                  for (k = 0; k < s->img_n; ++k) tc16[k] = (stbi__uint16)stbi__get16be(s); // copy the values as-is
+               } else {
+                  for (k = 0; k < s->img_n; ++k) tc[k] = (stbi_uc)(stbi__get16be(s) & 255) * stbi__depth_scale_table[z->depth]; // non 8-bit images will be larger
+               }
+            }
+            break;
+         }
+
+         case STBI__PNG_TYPE('I','D','A','T'): {
+            if (first) return stbi__err("first not IHDR", "Corrupt PNG");
+            if (pal_img_n && !pal_len) return stbi__err("no PLTE","Corrupt PNG");
+            if (scan == STBI__SCAN_header) { s->img_n = pal_img_n; return 1; }
+            if ((int)(ioff + c.length) < (int)ioff) return 0; // accumulated size would wrap as a signed int
+            if (ioff + c.length > idata_limit) {
+               stbi__uint32 idata_limit_old = idata_limit;
+               stbi_uc *p;
+               if (idata_limit == 0) idata_limit = c.length > 4096 ? c.length : 4096;
+               while (ioff + c.length > idata_limit) // grow geometrically until the new chunk fits
+                  idata_limit *= 2;
+               STBI_NOTUSED(idata_limit_old);
+               p = (stbi_uc *) STBI_REALLOC_SIZED(z->idata, idata_limit_old, idata_limit); if (p == NULL) return stbi__err("outofmem", "Out of memory");
+               z->idata = p;
+            }
+            if (!stbi__getn(s, z->idata+ioff,c.length)) return stbi__err("outofdata","Corrupt PNG");
+            ioff += c.length;
+            break;
+         }
+
+         case STBI__PNG_TYPE('I','E','N','D'): {
+            stbi__uint32 raw_len, bpl;
+            if (first) return stbi__err("first not IHDR", "Corrupt PNG");
+            if (scan != STBI__SCAN_load) return 1;
+            if (z->idata == NULL) return stbi__err("no IDAT","Corrupt PNG");
+            // initial guess for decoded data size to avoid unnecessary reallocs
+            bpl = (s->img_x * z->depth + 7) / 8; // bytes per line, per component
+            raw_len = bpl * s->img_y * s->img_n /* pixels */ + s->img_y /* filter mode per row */;
+            z->expanded = (stbi_uc *) stbi_zlib_decode_malloc_guesssize_headerflag((char *) z->idata, ioff, raw_len, (int *) &raw_len, !is_iphone);
+            if (z->expanded == NULL) return 0; // zlib should set error
+            STBI_FREE(z->idata); z->idata = NULL;
+            if ((req_comp == s->img_n+1 && req_comp != 3 && !pal_img_n) || has_trans)
+               s->img_out_n = s->img_n+1; // make room for an alpha channel while creating the image
+            else
+               s->img_out_n = s->img_n;
+            if (!stbi__create_png_image(z, z->expanded, raw_len, s->img_out_n, z->depth, color, interlace)) return 0;
+            if (has_trans) {
+               if (z->depth == 16) {
+                  if (!stbi__compute_transparency16(z, tc16, s->img_out_n)) return 0;
+               } else {
+                  if (!stbi__compute_transparency(z, tc, s->img_out_n)) return 0;
+               }
+            }
+            if (is_iphone && stbi__de_iphone_flag && s->img_out_n > 2)
+               stbi__de_iphone(z);
+            if (pal_img_n) {
+               // pal_img_n == 3 or 4
+               s->img_n = pal_img_n; // record the actual colors we had
+               s->img_out_n = pal_img_n;
+               if (req_comp >= 3) s->img_out_n = req_comp;
+               if (!stbi__expand_png_palette(z, palette, pal_len, s->img_out_n))
+                  return 0;
+            } else if (has_trans) {
+               // non-paletted image with tRNS -> source image has (constant) alpha
+               ++s->img_n;
+            }
+            STBI_FREE(z->expanded); z->expanded = NULL;
+            // end of PNG chunk, read and skip CRC
+            stbi__get32be(s);
+            return 1;
+         }
+
+         default:
+            // if critical, fail
+            if (first) return stbi__err("first not IHDR", "Corrupt PNG");
+            if ((c.type & (1 << 29)) == 0) { // bit 29 clear = first chunk-name letter is upper case
+               #ifndef STBI_NO_FAILURE_STRINGS
+               // not threadsafe
+               static char invalid_chunk[] = "XXXX PNG chunk not known";
+               invalid_chunk[0] = STBI__BYTECAST(c.type >> 24);
+               invalid_chunk[1] = STBI__BYTECAST(c.type >> 16);
+               invalid_chunk[2] = STBI__BYTECAST(c.type >>  8);
+               invalid_chunk[3] = STBI__BYTECAST(c.type >>  0);
+               #endif
+               return stbi__err(invalid_chunk, "PNG not supported: unknown PNG chunk type");
+            }
+            stbi__skip(s, c.length);
+            break;
+      }
+      // end of PNG chunk, read and skip CRC
+      stbi__get32be(s);
+   }
+}
+// Full PNG decode: parses p->s, converts to req_comp channels when asked, stores size in *x/*y (and *n if non-NULL), releases p's buffers; returns the pixels or NULL.
+static void *stbi__do_png(stbi__png *p, int *x, int *y, int *n, int req_comp, stbi__result_info *ri)
+{
+   void *result=NULL;
+   if (req_comp < 0 || req_comp > 4) return stbi__errpuc("bad req_comp", "Internal error");
+   if (stbi__parse_png_file(p, STBI__SCAN_load, req_comp)) {
+      if (p->depth <= 8)
+         ri->bits_per_channel = 8;
+      else if (p->depth == 16)
+         ri->bits_per_channel = 16;
+      else
+         return stbi__errpuc("bad bits_per_channel", "PNG not supported: unsupported color depth");
+      result = p->out; // take ownership of the decoded image...
+      p->out = NULL;   // ...so the STBI_FREE(p->out) below does not release it
+      if (req_comp && req_comp != p->s->img_out_n) {
+         if (ri->bits_per_channel == 8)
+            result = stbi__convert_format((unsigned char *) result, p->s->img_out_n, req_comp, p->s->img_x, p->s->img_y);
+         else
+            result = stbi__convert_format16((stbi__uint16 *) result, p->s->img_out_n, req_comp, p->s->img_x, p->s->img_y);
+         p->s->img_out_n = req_comp;
+         if (result == NULL) return result;
+      }
+      *x = p->s->img_x;
+      *y = p->s->img_y;
+      if (n) *n = p->s->img_n; // n is optional; x and y are written unconditionally
+   }
+   STBI_FREE(p->out);      p->out      = NULL; // also reached when parsing failed, to drop partial buffers
+   STBI_FREE(p->expanded); p->expanded = NULL;
+   STBI_FREE(p->idata);    p->idata    = NULL;
+
+   return result;
+}
+// PNG loader entry: wraps the context in a stbi__png and hands it to stbi__do_png.
+static void *stbi__png_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri)
+{
+   stbi__png png;
+   png.s = s;
+   return stbi__do_png(&png, x, y, comp, req_comp, ri);
+}
+// Reports what stbi__check_png_header says about the stream; the stream is rewound either way.
+static int stbi__png_test(stbi__context *s)
+{
+   int is_png = stbi__check_png_header(s);
+   // restore the read position before returning the verdict
+   stbi__rewind(s);
+   return is_png;
+}
+// Header-only query: stores width, height and component count through each non-NULL out pointer.
+static int stbi__png_info_raw(stbi__png *p, int *x, int *y, int *comp)
+{
+   stbi__context *ctx = p->s;
+   // a failed scan rewinds the stream before reporting failure
+   if (!stbi__parse_png_file(p, STBI__SCAN_header, 0)) { stbi__rewind(ctx); return 0; }
+   // every output pointer is optional
+   if (x != NULL) *x = ctx->img_x;
+   if (y != NULL) *y = ctx->img_y;
+   if (comp != NULL) *comp = ctx->img_n;
+   return 1;
+}
+// PNG info query: wraps the context in a stbi__png and delegates to stbi__png_info_raw.
+static int stbi__png_info(stbi__context *s, int *x, int *y, int *comp)
+{
+   stbi__png png;
+   png.s = s;
+   return stbi__png_info_raw(&png, x, y, comp);
+}
+// Returns 1 when the PNG header declares a bit depth of 16, otherwise 0 (also when the header scan fails).
+static int stbi__png_is16(stbi__context *s)
+{
+   stbi__png png;
+   png.s = s;
+   // stbi__png_info_raw rewinds the stream itself when the header scan fails
+   if (!stbi__png_info_raw(&png, NULL, NULL, NULL))
+      return 0;
+   if (png.depth == 16) return 1;
+   // not 16-bit: rewind before reporting 0
+   stbi__rewind(png.s);
+   return 0;
+}
+#endif
+
+// Microsoft/Windows BMP image
+
+#ifndef STBI_NO_BMP
+static int stbi__bmp_test_raw(stbi__context *s)
+{
+   int hsz;
+   // the stream must open with the two bytes 'B','M'
+   if (stbi__get8(s) != 'B') return 0;
+   if (stbi__get8(s) != 'M') return 0;
+   stbi__get32le(s); // discard filesize
+   stbi__get16le(s); // discard reserved
+   stbi__get16le(s); // discard reserved
+   stbi__get32le(s); // discard data offset
+   hsz = stbi__get32le(s);
+   // accept only the info-header sizes the parser handles
+   return (hsz == 12 || hsz == 40 || hsz == 56 || hsz == 108 || hsz == 124);
+}
+// BMP probe: runs stbi__bmp_test_raw, then rewinds the stream and returns its verdict.
+static int stbi__bmp_test(stbi__context *s)
+{
+   int is_bmp = stbi__bmp_test_raw(s);
+   stbi__rewind(s);
+   return is_bmp;
+}
+
+
+// returns the index (0..31) of the highest set bit, or -1 if z is zero
+static int stbi__high_bit(unsigned int z)
+{
+   // narrow the search window step by step: 16, 8, 4, 2, then 1 bit(s)
+   static const int widths[5] = { 16, 8, 4, 2, 1 };
+   int n = 0, i;
+   if (z == 0) return -1;
+   for (i = 0; i < 5; ++i) {
+      if (z >= (1u << widths[i])) { n += widths[i]; z >>= widths[i]; }
+   }
+   return n;
+}
+// population count: number of 1 bits in a
+static int stbi__bitcount(unsigned int a)
+{
+   int count = 0;
+   while (a != 0) {   // one iteration per set bit
+      a &= a - 1;     // clears the lowest set bit
+      ++count;
+   }
+   return count;
+}
+// v: channel bits already masked out of a pixel; shift: right-shift amount, negative meaning shift left; bits: width of the value (0..8).
+// extract an arbitrarily-aligned N-bit value (N=bits)
+// from v, and then make it 8-bits long and fractionally
+// extend it to the full 8-bit range.
+static int stbi__shiftsigned(unsigned int v, int shift, int bits)
+{
+   static unsigned int mul_table[9] = { // indexed by bits: multiplier that repeats the N-bit pattern
+      0,
+      0xff/*0b11111111*/, 0x55/*0b01010101*/, 0x49/*0b01001001*/, 0x11/*0b00010001*/,
+      0x21/*0b00100001*/, 0x41/*0b01000001*/, 0x81/*0b10000001*/, 0x01/*0b00000001*/,
+   };
+   static unsigned int shift_table[9] = { // indexed by bits: right shift applied to the product
+      0, 0,0,1,0,2,4,6,0,
+   };
+   if (shift < 0)
+      v <<= -shift;
+   else
+      v >>= shift;
+   STBI_ASSERT(v < 256); // after alignment the value must fit in one byte
+   v >>= (8-bits);       // drop the unused low bits so v is an N-bit number
+   STBI_ASSERT(bits >= 0 && bits <= 8);
+   return (int) ((unsigned) v * mul_table[bits]) >> shift_table[bits]; // the (int) cast binds to the product, then the shift is applied
+}
+// BMP header fields filled in by stbi__bmp_parse_header and read by stbi__bmp_load.
+typedef struct
+{
+   int bpp, offset, hsz; // bits per pixel; data offset read from the file header; info-header size in bytes
+   unsigned int mr,mg,mb,ma, all_a; // red/green/blue/alpha bit masks; all_a: starting value for the loader's OR of alpha values
+   int extra_read; // bytes consumed outside the hsz-byte info header: 14 for the file header, +12 when bitfield masks follow
+} stbi__bmp_data;
+// Fills in default channel masks for an uncompressed BMP; returns 1 on success, 0 for a compression mode without defaults.
+static int stbi__bmp_set_mask_defaults(stbi__bmp_data *info, int compress)
+{
+   // BI_BITFIELDS specifies masks explicitly, don't override
+   if (compress == 3) return 1;
+   // only compression mode 0 has default masks; anything else is an error
+   if (compress != 0) return 0;
+   switch (info->bpp) {
+      case 16: // three 5-bit fields
+         info->mr = 31u << 10;
+         info->mg = 31u <<  5;
+         info->mb = 31u <<  0;
+         break;
+      case 32: // four 8-bit fields, alpha in the top byte
+         info->mr = 0xffu << 16;
+         info->mg = 0xffu <<  8;
+         info->mb = 0xffu <<  0;
+         info->ma = 0xffu << 24;
+         info->all_a = 0; // if all_a is 0 at end, then we loaded alpha channel but it was all 0
+         break;
+      default: // otherwise, use defaults, which is all-0
+         info->mr = info->mg = info->mb = info->ma = 0;
+         break;
+   }
+   return 1;
+}
+// Reads the BMP file header and info header from s into info and s->img_x/img_y; returns (void *) 1 on success, or the stbi__errpuc result on failure.
+static void *stbi__bmp_parse_header(stbi__context *s, stbi__bmp_data *info)
+{
+   int hsz;
+   if (stbi__get8(s) != 'B' || stbi__get8(s) != 'M') return stbi__errpuc("not BMP", "Corrupt BMP");
+   stbi__get32le(s); // discard filesize
+   stbi__get16le(s); // discard reserved
+   stbi__get16le(s); // discard reserved
+   info->offset = stbi__get32le(s);
+   info->hsz = hsz = stbi__get32le(s);
+   info->mr = info->mg = info->mb = info->ma = 0;
+   info->extra_read = 14; // the file header read so far: 2 + 4 + 2 + 2 + 4 bytes
+
+   if (info->offset < 0) return stbi__errpuc("bad BMP", "bad BMP");
+
+   if (hsz != 12 && hsz != 40 && hsz != 56 && hsz != 108 && hsz != 124) return stbi__errpuc("unknown BMP", "BMP type not supported: unknown");
+   if (hsz == 12) { // the 12-byte header stores 16-bit dimensions
+      s->img_x = stbi__get16le(s);
+      s->img_y = stbi__get16le(s);
+   } else {
+      s->img_x = stbi__get32le(s);
+      s->img_y = stbi__get32le(s);
+   }
+   if (stbi__get16le(s) != 1) return stbi__errpuc("bad BMP", "bad BMP");
+   info->bpp = stbi__get16le(s);
+   if (hsz != 12) {
+      int compress = stbi__get32le(s);
+      if (compress == 1 || compress == 2) return stbi__errpuc("BMP RLE", "BMP type not supported: RLE");
+      if (compress >= 4) return stbi__errpuc("BMP JPEG/PNG", "BMP type not supported: unsupported compression"); // this includes PNG/JPEG modes
+      if (compress == 3 && info->bpp != 16 && info->bpp != 32) return stbi__errpuc("bad BMP", "bad BMP"); // bitfields requires 16 or 32 bits/pixel
+      stbi__get32le(s); // discard sizeof
+      stbi__get32le(s); // discard hres
+      stbi__get32le(s); // discard vres
+      stbi__get32le(s); // discard colorsused
+      stbi__get32le(s); // discard max important
+      if (hsz == 40 || hsz == 56) {
+         if (hsz == 56) { // the 56-byte header has four more 32-bit fields, skipped here
+            stbi__get32le(s);
+            stbi__get32le(s);
+            stbi__get32le(s);
+            stbi__get32le(s);
+         }
+         if (info->bpp == 16 || info->bpp == 32) {
+            if (compress == 0) {
+               stbi__bmp_set_mask_defaults(info, compress);
+            } else if (compress == 3) {
+               info->mr = stbi__get32le(s);
+               info->mg = stbi__get32le(s);
+               info->mb = stbi__get32le(s);
+               info->extra_read += 12; // the three masks are counted separately from hsz
+               // not documented, but generated by photoshop and handled by mspaint
+               if (info->mr == info->mg && info->mg == info->mb) {
+                  // ?!?!?
+                  return stbi__errpuc("bad BMP", "bad BMP");
+               }
+            } else
+               return stbi__errpuc("bad BMP", "bad BMP");
+         }
+      } else {
+         // V4/V5 header
+         int i;
+         if (hsz != 108 && hsz != 124)
+            return stbi__errpuc("bad BMP", "bad BMP");
+         info->mr = stbi__get32le(s);
+         info->mg = stbi__get32le(s);
+         info->mb = stbi__get32le(s);
+         info->ma = stbi__get32le(s);
+         if (compress != 3) // override mr/mg/mb unless in BI_BITFIELDS mode, as per docs
+            stbi__bmp_set_mask_defaults(info, compress);
+         stbi__get32le(s); // discard color space
+         for (i=0; i < 12; ++i)
+            stbi__get32le(s); // discard color space parameters
+         if (hsz == 124) {
+            stbi__get32le(s); // discard rendering intent
+            stbi__get32le(s); // discard offset of profile data
+            stbi__get32le(s); // discard size of profile data
+            stbi__get32le(s); // discard reserved
+         }
+      }
+   }
+   return (void *) 1; // non-NULL sentinel: callers only compare the result against NULL
+}
+// Decodes a BMP from s into a newly allocated 8-bit-per-channel buffer. *x/*y receive the size, *comp (optional) the source component
+// count (3 or 4). A req_comp of 0 keeps the source layout. Returns NULL (the stbi__errpuc result) on any failure.
+static void *stbi__bmp_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri)
+{
+   stbi_uc *out;
+   unsigned int mr=0,mg=0,mb=0,ma=0, all_a;
+   stbi_uc pal[256][4] = {{0}}; // zero-filled so pixel indices at or above psize yield defined values instead of stack garbage
+   int psize=0,i,j,width;
+   int flip_vertically, pad, target;
+   stbi__bmp_data info;
+   STBI_NOTUSED(ri);
+
+   info.all_a = 255;
+   if (stbi__bmp_parse_header(s, &info) == NULL)
+      return NULL; // error code already set
+
+   flip_vertically = ((int) s->img_y) > 0; // a positive height means the rows must be flipped after decoding
+   s->img_y = abs((int) s->img_y);
+
+   if (s->img_y > STBI_MAX_DIMENSIONS) return stbi__errpuc("too large","Very large image (corrupt?)");
+   if (s->img_x > STBI_MAX_DIMENSIONS) return stbi__errpuc("too large","Very large image (corrupt?)");
+
+   mr = info.mr;
+   mg = info.mg;
+   mb = info.mb;
+   ma = info.ma;
+   all_a = info.all_a;
+
+   if (info.hsz == 12) { // palette size is inferred from the space between the header and the pixel data
+      if (info.bpp < 24)
+         psize = (info.offset - info.extra_read - 24) / 3;
+   } else {
+      if (info.bpp < 16)
+         psize = (info.offset - info.extra_read - info.hsz) >> 2;
+   }
+   if (psize == 0) {
+      // pixel data may follow the header after a bounded gap (at most 256*4 bytes), but may never start inside the header
+      int header_end = info.extra_read + info.hsz;
+      if (info.offset < header_end || info.offset - header_end > 256*4) return stbi__errpuc("bad offset", "Corrupt BMP");
+   }
+
+   if (info.bpp == 24 && ma == 0xff000000)
+      s->img_n = 3;
+   else
+      s->img_n = ma ? 4 : 3;
+   if (req_comp && req_comp >= 3) // we can directly decode 3 or 4
+      target = req_comp;
+   else
+      target = s->img_n; // if they want monochrome, we'll post-convert
+
+   // sanity-check size
+   if (!stbi__mad3sizes_valid(target, s->img_x, s->img_y, 0))
+      return stbi__errpuc("too large", "Corrupt BMP");
+
+   out = (stbi_uc *) stbi__malloc_mad3(target, s->img_x, s->img_y, 0);
+   if (!out) return stbi__errpuc("outofmem", "Out of memory");
+   if (info.bpp < 16) { // paletted image
+      int z=0;
+      if (psize == 0 || psize > 256) { STBI_FREE(out); return stbi__errpuc("invalid", "Corrupt BMP"); }
+      for (i=0; i < psize; ++i) { // file order is B,G,R; stored here as R,G,B
+         pal[i][2] = stbi__get8(s);
+         pal[i][1] = stbi__get8(s);
+         pal[i][0] = stbi__get8(s);
+         if (info.hsz != 12) stbi__get8(s);
+         pal[i][3] = 255;
+      }
+      stbi__skip(s, info.offset - info.extra_read - info.hsz - psize * (info.hsz == 12 ? 3 : 4));
+      if (info.bpp == 1) width = (s->img_x + 7) >> 3;
+      else if (info.bpp == 4) width = (s->img_x + 1) >> 1;
+      else if (info.bpp == 8) width = s->img_x;
+      else { STBI_FREE(out); return stbi__errpuc("bad bpp", "Corrupt BMP"); }
+      pad = (-width)&3; // bytes needed to round each row up to a multiple of 4
+      if (info.bpp == 1) {
+         for (j=0; j < (int) s->img_y; ++j) {
+            int bit_offset = 7, v = stbi__get8(s);
+            for (i=0; i < (int) s->img_x; ++i) {
+               int color = (v>>bit_offset)&0x1;
+               out[z++] = pal[color][0];
+               out[z++] = pal[color][1];
+               out[z++] = pal[color][2];
+               if (target == 4) out[z++] = 255;
+               if (i+1 == (int) s->img_x) break;
+               if((--bit_offset) < 0) {
+                  bit_offset = 7;
+                  v = stbi__get8(s);
+               }
+            }
+            stbi__skip(s, pad);
+         }
+      } else {
+         for (j=0; j < (int) s->img_y; ++j) {
+            for (i=0; i < (int) s->img_x; i += 2) { // two pixels per iteration: one byte at 4 bpp, two bytes at 8 bpp
+               int v=stbi__get8(s),v2=0;
+               if (info.bpp == 4) {
+                  v2 = v & 15;
+                  v >>= 4;
+               }
+               out[z++] = pal[v][0];
+               out[z++] = pal[v][1];
+               out[z++] = pal[v][2];
+               if (target == 4) out[z++] = 255;
+               if (i+1 == (int) s->img_x) break;
+               v = (info.bpp == 8) ? stbi__get8(s) : v2;
+               out[z++] = pal[v][0];
+               out[z++] = pal[v][1];
+               out[z++] = pal[v][2];
+               if (target == 4) out[z++] = 255;
+            }
+            stbi__skip(s, pad);
+         }
+      }
+   } else {
+      int rshift=0,gshift=0,bshift=0,ashift=0,rcount=0,gcount=0,bcount=0,acount=0;
+      int z = 0;
+      int easy=0;
+      stbi__skip(s, info.offset - info.extra_read - info.hsz); // jump over any gap between the header and the pixel data
+      if (info.bpp == 24) width = 3 * s->img_x;
+      else if (info.bpp == 16) width = 2*s->img_x;
+      else /* bpp = 32 and pad = 0 */ width=0;
+      pad = (-width) & 3;
+      if (info.bpp == 24) {
+         easy = 1;
+      } else if (info.bpp == 32) {
+         if (mb == 0xff && mg == 0xff00 && mr == 0x00ff0000 && ma == 0xff000000)
+            easy = 2;
+      }
+      if (!easy) {
+         if (!mr || !mg || !mb) { STBI_FREE(out); return stbi__errpuc("bad masks", "Corrupt BMP"); }
+         // right shift amt to put high bit in position #7
+         rshift = stbi__high_bit(mr)-7; rcount = stbi__bitcount(mr);
+         gshift = stbi__high_bit(mg)-7; gcount = stbi__bitcount(mg);
+         bshift = stbi__high_bit(mb)-7; bcount = stbi__bitcount(mb);
+         ashift = stbi__high_bit(ma)-7; acount = stbi__bitcount(ma);
+         if (rcount > 8 || gcount > 8 || bcount > 8 || acount > 8) { STBI_FREE(out); return stbi__errpuc("bad masks", "Corrupt BMP"); }
+      }
+      for (j=0; j < (int) s->img_y; ++j) {
+         if (easy) { // byte-aligned B,G,R(,A) pixels: copy with a channel swap
+            for (i=0; i < (int) s->img_x; ++i) {
+               unsigned char a;
+               out[z+2] = stbi__get8(s);
+               out[z+1] = stbi__get8(s);
+               out[z+0] = stbi__get8(s);
+               z += 3;
+               a = (easy == 2 ? stbi__get8(s) : 255);
+               all_a |= a;
+               if (target == 4) out[z++] = a;
+            }
+         } else { // general case: pull each channel out through its bit mask
+            int bpp = info.bpp;
+            for (i=0; i < (int) s->img_x; ++i) {
+               stbi__uint32 v = (bpp == 16 ? (stbi__uint32) stbi__get16le(s) : stbi__get32le(s));
+               unsigned int a;
+               out[z++] = STBI__BYTECAST(stbi__shiftsigned(v & mr, rshift, rcount));
+               out[z++] = STBI__BYTECAST(stbi__shiftsigned(v & mg, gshift, gcount));
+               out[z++] = STBI__BYTECAST(stbi__shiftsigned(v & mb, bshift, bcount));
+               a = (ma ? stbi__shiftsigned(v & ma, ashift, acount) : 255);
+               all_a |= a;
+               if (target == 4) out[z++] = STBI__BYTECAST(a);
+            }
+         }
+         stbi__skip(s, pad);
+      }
+   }
+
+   // if alpha channel is all 0s, replace with all 255s
+   if (target == 4 && all_a == 0)
+      for (i=4*s->img_x*s->img_y-1; i >= 0; i -= 4)
+         out[i] = 255;
+
+   if (flip_vertically) { // swap rows pairwise from the outside in
+      stbi_uc t;
+      for (j=0; j < (int) s->img_y>>1; ++j) {
+         stbi_uc *p1 = out +      j     *s->img_x*target;
+         stbi_uc *p2 = out + (s->img_y-1-j)*s->img_x*target;
+         for (i=0; i < (int) s->img_x*target; ++i) {
+            t = p1[i]; p1[i] = p2[i]; p2[i] = t;
+         }
+      }
+   }
+
+   if (req_comp && req_comp != target) {
+      out = stbi__convert_format(out, target, req_comp, s->img_x, s->img_y);
+      if (out == NULL) return out; // stbi__convert_format frees input on failure
+   }
+
+   *x = s->img_x;
+   *y = s->img_y;
+   if (comp) *comp = s->img_n;
+   return out;
+}
+#endif
+
+// Targa Truevision - TGA
+// by Jonathan Dummer
+#ifndef STBI_NO_TGA
+// maps a TGA bit depth to an STBI_* component count; returns 0 for an unsupported depth
+static int stbi__tga_get_comp(int bits_per_pixel, int is_grey, int* is_rgb16)
+{
+   // is_rgb16 is optional; when given it is set to 1 only for 15/16-bit RGB
+   if (is_rgb16) *is_rgb16 = 0;
+   if (bits_per_pixel == 8) return STBI_grey;
+   if (bits_per_pixel == 16 && is_grey) return STBI_grey_alpha;
+   if (bits_per_pixel == 15 || bits_per_pixel == 16) {
+      // only RGB or RGBA (incl. 16bit) or grey allowed
+      if (is_rgb16) *is_rgb16 = 1;
+      return STBI_rgb;
+   }
+   // 24 bits -> 3 components, 32 bits -> 4 components
+   if (bits_per_pixel == 24 || bits_per_pixel == 32) return bits_per_pixel/8;
+   return 0;
+}
+// Reads a TGA header and reports width, height and component count through each non-NULL out pointer; returns 1 on success, or rewinds and returns 0.
+static int stbi__tga_info(stbi__context *s, int *x, int *y, int *comp)
+{
+    int tga_w, tga_h, tga_comp, tga_image_type, tga_bits_per_pixel, tga_colormap_bpp;
+    int sz, tga_colormap_type;
+    stbi__get8(s);                   // discard Offset
+    tga_colormap_type = stbi__get8(s); // colormap type
+    if( tga_colormap_type > 1 ) {
+        stbi__rewind(s);
+        return 0;      // only RGB or indexed allowed
+    }
+    tga_image_type = stbi__get8(s); // image type
+    if ( tga_colormap_type == 1 ) { // colormapped (paletted) image
+        if (tga_image_type != 1 && tga_image_type != 9) { // a colormap requires image type 1 or 9
+            stbi__rewind(s);
+            return 0;
+        }
+        stbi__skip(s,4);       // skip index of first colormap entry and number of entries
+        sz = stbi__get8(s);    //   check bits per palette color entry
+        if ( (sz != 8) && (sz != 15) && (sz != 16) && (sz != 24) && (sz != 32) ) {
+            stbi__rewind(s);
+            return 0;
+        }
+        stbi__skip(s,4);       // skip image x and y origin
+        tga_colormap_bpp = sz;
+    } else { // "normal" image w/o colormap - only RGB or grey allowed, +/- RLE
+        if ( (tga_image_type != 2) && (tga_image_type != 3) && (tga_image_type != 10) && (tga_image_type != 11) ) {
+            stbi__rewind(s);
+            return 0; // only RGB or grey allowed, +/- RLE
+        }
+        stbi__skip(s,9); // skip colormap specification and image x/y origin
+        tga_colormap_bpp = 0; // 0 marks "no colormap" for the component lookup below
+    }
+    tga_w = stbi__get16le(s);
+    if( tga_w < 1 ) {
+        stbi__rewind(s);
+        return 0;   // test width
+    }
+    tga_h = stbi__get16le(s);
+    if( tga_h < 1 ) {
+        stbi__rewind(s);
+        return 0;   // test height
+    }
+    tga_bits_per_pixel = stbi__get8(s); // bits per pixel
+    stbi__get8(s); // ignore alpha bits
+    if (tga_colormap_bpp != 0) {
+        if((tga_bits_per_pixel != 8) && (tga_bits_per_pixel != 16)) {
+            // when using a colormap, tga_bits_per_pixel is the size of the indexes
+            // I don't think anything but 8 or 16bit indexes makes sense
+            stbi__rewind(s);
+            return 0;
+        }
+        tga_comp = stbi__tga_get_comp(tga_colormap_bpp, 0, NULL); // components come from the palette entry size
+    } else {
+        tga_comp = stbi__tga_get_comp(tga_bits_per_pixel, (tga_image_type == 3) || (tga_image_type == 11), NULL); // types 3 and 11 are the grey variants
+    }
+    if(!tga_comp) {
+      stbi__rewind(s);
+      return 0;
+    }
+    if (x) *x = tga_w;
+    if (y) *y = tga_h;
+    if (comp) *comp = tga_comp;
+    return 1;                   // seems to have passed everything
+}
+// TGA probe: checks that the header fields hold supported values; always rewinds the stream; returns 1 if every check passes, else 0.
+static int stbi__tga_test(stbi__context *s)
+{
+   int res = 0;
+   int sz, tga_color_type; // sz is reused for each single-byte field as it is read
+   stbi__get8(s);      //   discard Offset
+   tga_color_type = stbi__get8(s);   //   color type
+   if ( tga_color_type > 1 ) goto errorEnd;   //   only RGB or indexed allowed
+   sz = stbi__get8(s);   //   image type
+   if ( tga_color_type == 1 ) { // colormapped (paletted) image
+      if (sz != 1 && sz != 9) goto errorEnd; // colortype 1 demands image type 1 or 9
+      stbi__skip(s,4);       // skip index of first colormap entry and number of entries
+      sz = stbi__get8(s);    //   check bits per palette color entry
+      if ( (sz != 8) && (sz != 15) && (sz != 16) && (sz != 24) && (sz != 32) ) goto errorEnd;
+      stbi__skip(s,4);       // skip image x and y origin
+   } else { // "normal" image w/o colormap
+      if ( (sz != 2) && (sz != 3) && (sz != 10) && (sz != 11) ) goto errorEnd; // only RGB or grey allowed, +/- RLE
+      stbi__skip(s,9); // skip colormap specification and image x/y origin
+   }
+   if ( stbi__get16le(s) < 1 ) goto errorEnd;      //   test width
+   if ( stbi__get16le(s) < 1 ) goto errorEnd;      //   test height
+   sz = stbi__get8(s);   //   bits per pixel
+   if ( (tga_color_type == 1) && (sz != 8) && (sz != 16) ) goto errorEnd; // for colormapped images, bpp is size of an index
+   if ( (sz != 8) && (sz != 15) && (sz != 16) && (sz != 24) && (sz != 32) ) goto errorEnd;
+
+   res = 1; // if we got this far, everything's good and we can return 1 instead of 0
+
+errorEnd: // shared exit for success and failure: the stream is rewound in both cases
+   stbi__rewind(s);
+   return res;
+}
+// read 16bit value and convert to 24bit RGB
+// (writes exactly three bytes to out)
+static void stbi__tga_read_rgb16(stbi__context *s, stbi_uc* out)
+{
+   // we have 3 channels with 5bits each: r in bits 10-14, g in bits 5-9, b in bits 0-4
+   int packed = (stbi__uint16) stbi__get16le(s);
+   int shift, channel = 0;
+   // Stepping the shift 10, 5, 0 yields r, g, b in that order. Note that this saves
+   // the data in RGB(A) order, so it doesn't need to be swapped later
+   for (shift = 10; shift >= 0; shift -= 5) {
+      int five = (packed >> shift) & 31;
+      // rescale 0..31 to 0..255
+      out[channel++] = (stbi_uc) ((five * 255) / 31);
+   }
+
+   // some people claim that the most significant bit might be used for alpha
+   // (possibly if an alpha-bit is set in the "image descriptor byte")
+   // but that only made 16bit test images completely translucent..
+   // so let's treat all 15 and 16bit TGAs as RGB with no alpha.
+}
+
+static void *stbi__tga_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri)
+{
+   //   read in the TGA header stuff
+   int tga_offset = stbi__get8(s);
+   int tga_indexed = stbi__get8(s);
+   int tga_image_type = stbi__get8(s);
+   int tga_is_RLE = 0;
+   int tga_palette_start = stbi__get16le(s);
+   int tga_palette_len = stbi__get16le(s);
+   int tga_palette_bits = stbi__get8(s);
+   int tga_x_origin = stbi__get16le(s);
+   int tga_y_origin = stbi__get16le(s);
+   int tga_width = stbi__get16le(s);
+   int tga_height = stbi__get16le(s);
+   int tga_bits_per_pixel = stbi__get8(s);
+   int tga_comp, tga_rgb16=0;
+   int tga_inverted = stbi__get8(s);
+   // int tga_alpha_bits = tga_inverted & 15; // the 4 lowest bits - unused (useless?)
+   //   image data
+   unsigned char *tga_data;
+   unsigned char *tga_palette = NULL;
+   int i, j;
+   unsigned char raw_data[4] = {0};
+   int RLE_count = 0;
+   int RLE_repeating = 0;
+   int read_next_pixel = 1;
+   STBI_NOTUSED(ri);
+   STBI_NOTUSED(tga_x_origin); // @TODO
+   STBI_NOTUSED(tga_y_origin); // @TODO
+
+   if (tga_height > STBI_MAX_DIMENSIONS) return stbi__errpuc("too large","Very large image (corrupt?)");
+   if (tga_width > STBI_MAX_DIMENSIONS) return stbi__errpuc("too large","Very large image (corrupt?)");
+
+   //   do a tiny bit of precessing
+   if ( tga_image_type >= 8 )
+   {
+      tga_image_type -= 8;
+      tga_is_RLE = 1;
+   }
+   tga_inverted = 1 - ((tga_inverted >> 5) & 1);
+
+   //   If I'm paletted, then I'll use the number of bits from the palette
+   if ( tga_indexed ) tga_comp = stbi__tga_get_comp(tga_palette_bits, 0, &tga_rgb16);
+   else tga_comp = stbi__tga_get_comp(tga_bits_per_pixel, (tga_image_type == 3), &tga_rgb16);
+
+   if(!tga_comp) // shouldn't really happen, stbi__tga_test() should have ensured basic consistency
+      return stbi__errpuc("bad format", "Can't find out TGA pixelformat");
+
+   //   tga info
+   *x = tga_width;
+   *y = tga_height;
+   if (comp) *comp = tga_comp;
+
+   if (!stbi__mad3sizes_valid(tga_width, tga_height, tga_comp, 0))
+      return stbi__errpuc("too large", "Corrupt TGA");
+
+   tga_data = (unsigned char*)stbi__malloc_mad3(tga_width, tga_height, tga_comp, 0);
+   if (!tga_data) return stbi__errpuc("outofmem", "Out of memory");
+
+   // skip to the data's starting position (offset usually = 0)
+   stbi__skip(s, tga_offset );
+
+   if ( !tga_indexed && !tga_is_RLE && !tga_rgb16 ) {
+      for (i=0; i < tga_height; ++i) {
+         int row = tga_inverted ? tga_height -i - 1 : i;
+         stbi_uc *tga_row = tga_data + row*tga_width*tga_comp;
+         stbi__getn(s, tga_row, tga_width * tga_comp);
+      }
+   } else  {
+      //   do I need to load a palette?
+      if ( tga_indexed)
+      {
+         if (tga_palette_len == 0) {  /* you have to have at least one entry! */
+            STBI_FREE(tga_data);
+            return stbi__errpuc("bad palette", "Corrupt TGA");
+         }
+
+         //   any data to skip? (offset usually = 0)
+         stbi__skip(s, tga_palette_start );
+         //   load the palette
+         tga_palette = (unsigned char*)stbi__malloc_mad2(tga_palette_len, tga_comp, 0);
+         if (!tga_palette) {
+            STBI_FREE(tga_data);
+            return stbi__errpuc("outofmem", "Out of memory");
+         }
+         if (tga_rgb16) {
+            stbi_uc *pal_entry = tga_palette;
+            STBI_ASSERT(tga_comp == STBI_rgb);
+            for (i=0; i < tga_palette_len; ++i) {
+               stbi__tga_read_rgb16(s, pal_entry);
+               pal_entry += tga_comp;
+            }
+         } else if (!stbi__getn(s, tga_palette, tga_palette_len * tga_comp)) {
+               STBI_FREE(tga_data);
+               STBI_FREE(tga_palette);
+               return stbi__errpuc("bad palette", "Corrupt TGA");
+         }
+      }
+      //   load the data
+      for (i=0; i < tga_width * tga_height; ++i)
+      {
+         //   if I'm in RLE mode, do I need to get a RLE stbi__pngchunk?
+         if ( tga_is_RLE )
+         {
+            if ( RLE_count == 0 )
+            {
+               //   yep, get the next byte as a RLE command
+               int RLE_cmd = stbi__get8(s);
+               RLE_count = 1 + (RLE_cmd & 127);
+               RLE_repeating = RLE_cmd >> 7;
+               read_next_pixel = 1;
+            } else if ( !RLE_repeating )
+            {
+               read_next_pixel = 1;
+            }
+         } else
+         {
+            read_next_pixel = 1;
+         }
+         //   OK, if I need to read a pixel, do it now
+         if ( read_next_pixel )
+         {
+            //   load however much data we did have
+            if ( tga_indexed )
+            {
+               // read in index, then perform the lookup
+               int pal_idx = (tga_bits_per_pixel == 8) ? stbi__get8(s) : stbi__get16le(s);
+               if ( pal_idx >= tga_palette_len ) {
+                  // invalid index
+                  pal_idx = 0;
+               }
+               pal_idx *= tga_comp;
+               for (j = 0; j < tga_comp; ++j) {
+                  raw_data[j] = tga_palette[pal_idx+j];
+               }
+            } else if(tga_rgb16) {
+               STBI_ASSERT(tga_comp == STBI_rgb);
+               stbi__tga_read_rgb16(s, raw_data);
+            } else {
+               //   read in the data raw
+               for (j = 0; j < tga_comp; ++j) {
+                  raw_data[j] = stbi__get8(s);
+               }
+            }
+            //   clear the reading flag for the next pixel
+            read_next_pixel = 0;
+         } // end of reading a pixel
+
+         // copy data
+         for (j = 0; j < tga_comp; ++j)
+           tga_data[i*tga_comp+j] = raw_data[j];
+
+         //   in case we're in RLE mode, keep counting down
+         --RLE_count;
+      }
+      //   do I need to invert the image?
+      if ( tga_inverted )
+      {
+         for (j = 0; j*2 < tga_height; ++j)
+         {
+            int index1 = j * tga_width * tga_comp;
+            int index2 = (tga_height - 1 - j) * tga_width * tga_comp;
+            for (i = tga_width * tga_comp; i > 0; --i)
+            {
+               unsigned char temp = tga_data[index1];
+               tga_data[index1] = tga_data[index2];
+               tga_data[index2] = temp;
+               ++index1;
+               ++index2;
+            }
+         }
+      }
+      //   clear my palette, if I had one
+      if ( tga_palette != NULL )
+      {
+         STBI_FREE( tga_palette );
+      }
+   }
+
+   // swap RGB - if the source data was RGB16, it already is in the right order
+   if (tga_comp >= 3 && !tga_rgb16)
+   {
+      unsigned char* tga_pixel = tga_data;
+      for (i=0; i < tga_width * tga_height; ++i)
+      {
+         unsigned char temp = tga_pixel[0];
+         tga_pixel[0] = tga_pixel[2];
+         tga_pixel[2] = temp;
+         tga_pixel += tga_comp;
+      }
+   }
+
+   // convert to target component count
+   if (req_comp && req_comp != tga_comp)
+      tga_data = stbi__convert_format(tga_data, tga_comp, req_comp, tga_width, tga_height);
+
+   //   the things I do to get rid of an error message, and yet keep
+   //   Microsoft's C compilers happy... [8^(
+   tga_palette_start = tga_palette_len = tga_palette_bits =
+         tga_x_origin = tga_y_origin = 0;
+   STBI_NOTUSED(tga_palette_start);
+   //   OK, done
+   return tga_data;
+}
+#endif
+
+// *************************************************************************************************
+// Photoshop PSD loader -- PD by Thatcher Ulrich, integration by Nicolas Schulz, tweaked by STB
+
+#ifndef STBI_NO_PSD
+// Returns 1 when the next four bytes are the PSD signature 0x38425053 ("8BPS"); calls stbi__rewind afterwards.
+static int stbi__psd_test(stbi__context *s) {
+   const int is_psd = (stbi__get32be(s) == 0x38425053) ? 1 : 0;
+   stbi__rewind(s);
+   return is_psd;
+}
+
+// Decodes one RLE-compressed channel of pixelCount samples from s into p,
+// writing every 4th byte (p addresses one channel of a 4-byte-per-pixel buffer).
+// Returns 1 on success, 0 if a run would exceed the remaining sample count.
+static int stbi__psd_decode_rle(stbi__context *s, stbi_uc *p, int pixelCount)
+{
+   int done = 0;
+
+   while (done < pixelCount) {
+      int remaining = pixelCount - done;
+      int run = stbi__get8(s);
+
+      if (run == 128)
+         continue; // no-op control byte
+      if (run < 128) {
+         // literal run: the next run+1 source bytes are copied as-is
+         int k;
+         run += 1;
+         if (run > remaining) return 0; // corrupt data
+         done += run;
+         for (k = 0; k < run; ++k, p += 4)
+            *p = stbi__get8(s);
+      } else {
+         // replicate run: the control byte is read as a negative 8-bit count,
+         // so the next source byte is repeated (257 - control byte) times
+         stbi_uc fill;
+         int k;
+         run = 257 - run;
+         if (run > remaining) return 0; // corrupt data
+         fill = stbi__get8(s);
+         done += run;
+         for (k = 0; k < run; ++k, p += 4)
+            *p = fill;
+      }
+   }
+
+   return 1;
+}
+
+static void *stbi__psd_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri, int bpc)
+{  // Decodes a version-1, RGB-mode PSD (8 or 16 bits per channel) into a 4-channel buffer; reports size via *x, *y and channels via *comp.
+   int pixelCount;
+   int channelCount, compression;
+   int channel, i;
+   int bitdepth;
+   int w,h;
+   stbi_uc *out;
+   STBI_NOTUSED(ri); // note: ri is nevertheless read and written below (bits_per_channel)
+
+   // Check identifier
+   if (stbi__get32be(s) != 0x38425053)   // "8BPS"
+      return stbi__errpuc("not PSD", "Corrupt PSD image");
+
+   // Check file type version.
+   if (stbi__get16be(s) != 1)
+      return stbi__errpuc("wrong version", "Unsupported version of PSD image");
+
+   // Skip 6 reserved bytes.
+   stbi__skip(s, 6 );
+
+   // Read the number of channels (R, G, B, A, etc).
+   channelCount = stbi__get16be(s);
+   if (channelCount < 0 || channelCount > 16)
+      return stbi__errpuc("wrong channel count", "Unsupported number of channels in PSD image");
+
+   // Read the rows and columns of the image (height is stored before width).
+   h = stbi__get32be(s);
+   w = stbi__get32be(s);
+
+   if (h > STBI_MAX_DIMENSIONS) return stbi__errpuc("too large","Very large image (corrupt?)");
+   if (w > STBI_MAX_DIMENSIONS) return stbi__errpuc("too large","Very large image (corrupt?)");
+
+   // Make sure the depth is 8 or 16 bits.
+   bitdepth = stbi__get16be(s);
+   if (bitdepth != 8 && bitdepth != 16)
+      return stbi__errpuc("unsupported bit depth", "PSD bit depth is not 8 or 16 bit");
+
+   // Make sure the color mode is RGB.
+   // Valid options are:
+   //   0: Bitmap
+   //   1: Grayscale
+   //   2: Indexed color
+   //   3: RGB color
+   //   4: CMYK color
+   //   7: Multichannel
+   //   8: Duotone
+   //   9: Lab color
+   if (stbi__get16be(s) != 3)
+      return stbi__errpuc("wrong color format", "PSD is not in RGB color format");
+
+   // Skip the Mode Data.  (It's the palette for indexed color; other info for other modes.)
+   stbi__skip(s,stbi__get32be(s) );
+
+   // Skip the image resources.  (resolution, pen tool paths, etc)
+   stbi__skip(s, stbi__get32be(s) );
+
+   // Skip the reserved data.
+   stbi__skip(s, stbi__get32be(s) );
+
+   // Find out if the data is compressed.
+   // Known values:
+   //   0: no compression
+   //   1: RLE compressed
+   compression = stbi__get16be(s);
+   if (compression > 1)
+      return stbi__errpuc("bad compression", "PSD has an unknown compression format");
+
+   // Check size
+   if (!stbi__mad3sizes_valid(4, w, h, 0))
+      return stbi__errpuc("too large", "Corrupt PSD");
+
+   // Create the destination image.
+   // 16-bit output (8 bytes per pixel) is used only for uncompressed 16-bit data when the caller passed bpc == 16.
+   if (!compression && bitdepth == 16 && bpc == 16) {
+      out = (stbi_uc *) stbi__malloc_mad3(8, w, h, 0);
+      ri->bits_per_channel = 16;
+   } else
+      out = (stbi_uc *) stbi__malloc(4 * w*h); // 8-bit output: 4 bytes per pixel
+
+   if (!out) return stbi__errpuc("outofmem", "Out of memory");
+   pixelCount = w*h;
+
+   // Initialize the data to zero.
+   //memset( out, 0, pixelCount * 4 );
+
+   // Finally, the image data.
+   if (compression) {
+      // RLE as used by .PSD and .TIFF
+      // Loop until you get the number of unpacked bytes you are expecting:
+      //     Read the next source byte into n.
+      //     If n is between 0 and 127 inclusive, copy the next n+1 bytes literally.
+      //     Else if n is between -127 and -1 inclusive, copy the next byte -n+1 times.
+      //     Else if n is 128, noop.
+      // Endloop
+
+      // The RLE-compressed data is preceded by a 2-byte data count for each row in the data,
+      // which we're going to just skip.
+      stbi__skip(s, h * channelCount * 2 );
+
+      // Read the RLE data by channel.
+      for (channel = 0; channel < 4; channel++) {
+         stbi_uc *p;
+
+         p = out+channel;
+         if (channel >= channelCount) {
+            // Fill this channel with default data (255 for alpha, 0 for color).
+            for (i = 0; i < pixelCount; i++, p += 4)
+               *p = (channel == 3 ? 255 : 0);
+         } else {
+            // Read the RLE data.
+            if (!stbi__psd_decode_rle(s, p, pixelCount)) {
+               STBI_FREE(out);
+               return stbi__errpuc("corrupt", "bad RLE data");
+            }
+         }
+      }
+
+   } else {
+      // We're at the raw image data.  It's each channel in order (Red, Green, Blue, Alpha, ...)
+      // where each channel consists of an 8-bit (or 16-bit) value for each pixel in the image.
+
+      // Read the data by channel.
+      for (channel = 0; channel < 4; channel++) {
+         if (channel >= channelCount) {
+            // Fill this channel with default data (full alpha, zero color).
+            if (bitdepth == 16 && bpc == 16) {
+               stbi__uint16 *q = ((stbi__uint16 *) out) + channel;
+               stbi__uint16 val = channel == 3 ? 65535 : 0;
+               for (i = 0; i < pixelCount; i++, q += 4)
+                  *q = val;
+            } else {
+               stbi_uc *p = out+channel;
+               stbi_uc val = channel == 3 ? 255 : 0;
+               for (i = 0; i < pixelCount; i++, p += 4)
+                  *p = val;
+            }
+         } else {
+            if (ri->bits_per_channel == 16) {    // output bpc
+               stbi__uint16 *q = ((stbi__uint16 *) out) + channel;
+               for (i = 0; i < pixelCount; i++, q += 4)
+                  *q = (stbi__uint16) stbi__get16be(s);
+            } else {
+               stbi_uc *p = out+channel;
+               if (bitdepth == 16) {  // input bpc: keep only the high byte of each 16-bit sample
+                  for (i = 0; i < pixelCount; i++, p += 4)
+                     *p = (stbi_uc) (stbi__get16be(s) >> 8);
+               } else {
+                  for (i = 0; i < pixelCount; i++, p += 4)
+                     *p = stbi__get8(s);
+               }
+            }
+         }
+      }
+   }
+
+   // remove weird white matte from PSD
+   if (channelCount >= 4) { // only when the alpha channel came from the file
+      if (ri->bits_per_channel == 16) {
+         for (i=0; i < w*h; ++i) {
+            stbi__uint16 *pixel = (stbi__uint16 *) out + 4*i;
+            if (pixel[3] != 0 && pixel[3] != 65535) { // partially transparent pixels only
+               float a = pixel[3] / 65535.0f;
+               float ra = 1.0f / a;
+               float inv_a = 65535.0f * (1 - ra);
+               pixel[0] = (stbi__uint16) (pixel[0]*ra + inv_a);
+               pixel[1] = (stbi__uint16) (pixel[1]*ra + inv_a);
+               pixel[2] = (stbi__uint16) (pixel[2]*ra + inv_a);
+            }
+         }
+      } else {
+         for (i=0; i < w*h; ++i) {
+            unsigned char *pixel = out + 4*i;
+            if (pixel[3] != 0 && pixel[3] != 255) { // partially transparent pixels only
+               float a = pixel[3] / 255.0f;
+               float ra = 1.0f / a;
+               float inv_a = 255.0f * (1 - ra);
+               pixel[0] = (unsigned char) (pixel[0]*ra + inv_a);
+               pixel[1] = (unsigned char) (pixel[1]*ra + inv_a);
+               pixel[2] = (unsigned char) (pixel[2]*ra + inv_a);
+            }
+         }
+      }
+   }
+
+   // convert to desired output format
+   if (req_comp && req_comp != 4) {
+      if (ri->bits_per_channel == 16)
+         out = (stbi_uc *) stbi__convert_format16((stbi__uint16 *) out, 4, req_comp, w, h);
+      else
+         out = stbi__convert_format(out, 4, req_comp, w, h);
+      if (out == NULL) return out; // stbi__convert_format frees input on failure
+   }
+
+   if (comp) *comp = 4; // reports 4 channels regardless of req_comp
+   *y = h;
+   *x = w;
+
+   return out;
+}
+#endif
+
+// *************************************************************************************************
+// Softimage PIC loader
+// by Tom Seddon
+//
+// See http://softimage.wiki.softimage.com/index.php/INFO:_PIC_file_format
+// See http://ozviz.wasp.uwa.edu.au/~pbourke/dataformats/softimagepic/
+
+#ifndef STBI_NO_PIC
+// Reads up to 4 bytes from s and compares them with str[0..3]; stops at the
+// first mismatch and returns 0, otherwise returns 1.
+static int stbi__pic_is4(stbi__context *s,const char *str) {
+   const char *end = str + 4;
+   while (str != end) {
+      if (stbi__get8(s) != (stbi_uc) *str++) return 0;
+   }
+   return 1;
+}
+
+// Checks the PIC header layout: the 4-byte magic 53 80 F6 34, then 84 bytes
+// that are read and discarded, then the 4-byte tag "PICT".
+// Returns 1 if both markers match, 0 otherwise. Does not rewind the stream.
+static int stbi__pic_test_core(stbi__context *s)
+{
+   int skipped = 0;
+
+   if (stbi__pic_is4(s,"\x53\x80\xF6\x34")) {
+      // discard the bytes between the magic number and the "PICT" tag
+      while (skipped++ < 84)
+         stbi__get8(s);
+      return stbi__pic_is4(s,"PICT") ? 1 : 0;
+   }
+   return 0;
+}
+
+typedef struct
+{  // one channel-packet descriptor, filled byte-by-byte from the file in stbi__pic_load_core
+   stbi_uc size,type,channel; // size: must be 8 ("8bpp"); type: compression (0 raw, 1 pure RLE, 2 mixed RLE); channel: bitmask of channels carried
+} stbi__pic_packet;
+
+// Reads one byte from s into dest[i] for each of the four channel bits
+// (0x80 >> i) set in `channel`; other entries of dest are left untouched.
+// Returns dest, or the stbi__errpuc result if the stream hits EOF first.
+static stbi_uc *stbi__readval(stbi__context *s, int channel, stbi_uc *dest)
+{
+   int slot;
+   for (slot = 0; slot < 4; ++slot) {
+      if ((channel & (0x80 >> slot)) == 0) continue;
+      if (stbi__at_eof(s)) return stbi__errpuc("bad file","PIC file too short");
+      dest[slot] = stbi__get8(s);
+   }
+   return dest;
+}
+
+// Copies src[i] to dest[i] for each i in 0..3 whose bit (0x80 >> i) is set in `channel`.
+static void stbi__copyval(int channel,stbi_uc *dest,const stbi_uc *src)
+{
+   int slot = 0;
+   for (; slot < 4; ++slot) {
+      if (channel & (0x80 >> slot)) dest[slot] = src[slot];
+   }
+}
+
+static stbi_uc *stbi__pic_load_core(stbi__context *s,int width,int height,int *comp, stbi_uc *result)
+{  // Reads the packet list, then decodes every scanline into `result` (4 bytes per pixel); sets *comp to 3 or 4. Returns result, or 0 / the stbi__errpuc result on error.
+   int act_comp=0,num_packets=0,y,chained;
+   stbi__pic_packet packets[10];
+
+   // this will (should...) cater for even some bizarre stuff like having data
+   // for the same channel in multiple packets.
+   do {
+      stbi__pic_packet *packet;
+
+      if (num_packets==sizeof(packets)/sizeof(packets[0])) // packets[] is full
+         return stbi__errpuc("bad format","too many packets");
+
+      packet = &packets[num_packets++];
+
+      chained = stbi__get8(s); // nonzero means another packet descriptor follows
+      packet->size    = stbi__get8(s);
+      packet->type    = stbi__get8(s);
+      packet->channel = stbi__get8(s);
+
+      act_comp |= packet->channel; // union of all channel bits seen so far
+
+      if (stbi__at_eof(s))          return stbi__errpuc("bad file","file too short (reading packets)");
+      if (packet->size != 8)  return stbi__errpuc("bad format","packet isn't 8bpp");
+   } while (chained);
+
+   *comp = (act_comp & 0x10 ? 4 : 3); // has alpha channel?
+
+   for(y=0; y<height; ++y) {
+      int packet_idx;
+
+      for(packet_idx=0; packet_idx < num_packets; ++packet_idx) {
+         stbi__pic_packet *packet = &packets[packet_idx];
+         stbi_uc *dest = result+y*width*4; // start of row y; every packet rewrites the same row
+
+         switch (packet->type) {
+            default:
+               return stbi__errpuc("bad format","packet has bad compression type");
+
+            case 0: {//uncompressed
+               int x;
+
+               for(x=0;x<width;++x, dest+=4)
+                  if (!stbi__readval(s,packet->channel,dest))
+                     return 0;
+               break;
+            }
+
+            case 1://Pure RLE
+               {
+                  int left=width, i;
+
+                  while (left>0) {
+                     stbi_uc count,value[4];
+
+                     count=stbi__get8(s);
+                     if (stbi__at_eof(s))   return stbi__errpuc("bad file","file too short (pure read count)");
+
+                     if (count > left) // clamp the run to the scanline instead of failing
+                        count = (stbi_uc) left;
+
+                     if (!stbi__readval(s,packet->channel,value))  return 0;
+
+                     for(i=0; i<count; ++i,dest+=4)
+                        stbi__copyval(packet->channel,dest,value);
+                     left -= count;
+                  }
+               }
+               break;
+
+            case 2: {//Mixed RLE
+               int left=width;
+               while (left>0) {
+                  int count = stbi__get8(s), i;
+                  if (stbi__at_eof(s))  return stbi__errpuc("bad file","file too short (mixed read count)");
+
+                  if (count >= 128) { // Repeated
+                     stbi_uc value[4];
+
+                     if (count==128) // 128: a 16-bit big-endian run length follows
+                        count = stbi__get16be(s);
+                     else
+                        count -= 127; // 129..255 -> run length 2..128
+                     if (count > left)
+                        return stbi__errpuc("bad file","scanline overrun");
+
+                     if (!stbi__readval(s,packet->channel,value))
+                        return 0;
+
+                     for(i=0;i<count;++i, dest += 4)
+                        stbi__copyval(packet->channel,dest,value);
+                  } else { // Raw
+                     ++count; // 0..127 -> 1..128 literal pixels
+                     if (count>left) return stbi__errpuc("bad file","scanline overrun");
+
+                     for(i=0;i<count;++i, dest+=4)
+                        if (!stbi__readval(s,packet->channel,dest))
+                           return 0;
+                  }
+                  left-=count;
+               }
+               break;
+            }
+         }
+      }
+   }
+
+   return result;
+}
+
+// Loads a Softimage PIC image into a buffer with req_comp channels (or the detected count when
+// req_comp is 0). Writes the size to *px/*py; returns 0 (or the stbi__errpuc result) on failure.
+static void *stbi__pic_load(stbi__context *s,int *px,int *py,int *comp,int req_comp, stbi__result_info *ri)
+{
+   stbi_uc *result;
+   int i, x,y, internal_comp;
+   STBI_NOTUSED(ri);
+
+   if (!comp) comp = &internal_comp;
+
+   for (i=0; i<92; ++i)
+      stbi__get8(s);
+
+   x = stbi__get16be(s);
+   y = stbi__get16be(s);
+
+   if (y > STBI_MAX_DIMENSIONS) return stbi__errpuc("too large","Very large image (corrupt?)");
+   if (x > STBI_MAX_DIMENSIONS) return stbi__errpuc("too large","Very large image (corrupt?)");
+
+   if (stbi__at_eof(s))  return stbi__errpuc("bad file","file too short (pic header)");
+   if (!stbi__mad3sizes_valid(x, y, 4, 0)) return stbi__errpuc("too large", "PIC image too large to decode");
+
+   stbi__get32be(s); //skip `ratio'
+   stbi__get16be(s); //skip `fields'
+   stbi__get16be(s); //skip `pad'
+
+   // intermediate buffer is RGBA
+   result = (stbi_uc *) stbi__malloc_mad3(x, y, 4, 0);
+   if (!result) return stbi__errpuc("outofmem", "Out of memory");
+   memset(result, 0xff, x*y*4);
+
+   if (!stbi__pic_load_core(s,x,y,comp, result)) {
+      STBI_FREE(result);
+      return 0; // stop here: *comp may be unset and stbi__convert_format must not be handed a NULL buffer
+   }
+   *px = x;
+   *py = y;
+   if (req_comp == 0) req_comp = *comp;
+   return stbi__convert_format(result,4,req_comp,x,y);
+}
+
+// Probes for a PIC header via stbi__pic_test_core, then calls stbi__rewind on the stream.
+static int stbi__pic_test(stbi__context *s) {
+   int matched = stbi__pic_test_core(s);
+   stbi__rewind(s);
+   return matched;
+}
+#endif
+
+// *************************************************************************************************
+// GIF loader -- public domain by Jean-Marc Lienher -- simplified/shrunk by stb
+
+#ifndef STBI_NO_GIF
+typedef struct
+{  // one entry of the GIF LZW code table
+   stbi__int16 prefix; // index of the preceding code in the chain, or -1 for a root code
+   stbi_uc first;      // first byte of the string this code expands to
+   stbi_uc suffix;     // byte this code appends; used as the palette index when drawing
+} stbi__gif_lzw;
+
+typedef struct
+{  // GIF decoder state, kept across frames
+   int w,h;                      // logical screen size, read by stbi__gif_header
+   stbi_uc *out;                 // output buffer (always 4 components)
+   stbi_uc *background;          // The current "background" as far as a gif is concerned
+   stbi_uc *history;             // one byte per pixel: nonzero if the current frame wrote that pixel
+   int flags, bgindex, ratio, transparent, eflags; // header flags / background index / ratio; transparent palette index (-1 = none); graphic-control flags
+   stbi_uc  pal[256][4];         // global color table (read when flags & 0x80)
+   stbi_uc lpal[256][4];         // local color table (read when lflags & 0x80)
+   stbi__gif_lzw codes[8192];    // LZW code table
+   stbi_uc *color_table;         // table in use for the current image: pal or lpal
+   int parse, step;              // interlace passes remaining, and row advance in bytes
+   int lflags;                   // flags byte of the current image descriptor
+   int start_x, start_y;         // frame rectangle origin, as byte offsets into out
+   int max_x, max_y;             // frame rectangle end (exclusive), as byte offsets
+   int cur_x, cur_y;             // write cursor, as byte offsets
+   int line_size;                // bytes per output row (w * 4)
+   int delay;                    // frame delay: 10 * the file's 1/100 s value
+} stbi__gif;
+
+// Returns 1 if the next six bytes are "GIF87a" or "GIF89a", else 0; reading stops at the first mismatch.
+static int stbi__gif_test_raw(stbi__context *s)
+{
+   static const char magic[4] = { 'G', 'I', 'F', '8' };
+   int k, version;
+   for (k = 0; k < 4; ++k) if (stbi__get8(s) != magic[k]) return 0;
+   version = stbi__get8(s);
+   return ((version == '9' || version == '7') && stbi__get8(s) == 'a') ? 1 : 0;
+}
+
+// Signature probe: runs stbi__gif_test_raw, then calls stbi__rewind on the stream.
+static int stbi__gif_test(stbi__context *s) {
+   int looks_like_gif = stbi__gif_test_raw(s);
+   stbi__rewind(s);
+   return looks_like_gif;
+}
+
+// Reads num_entries 3-byte palette entries from s, storing each reversed
+// (file byte 0 -> pal[i][2]) with alpha 255, or 0 for entry index transp.
+static void stbi__gif_parse_colortable(stbi__context *s, stbi_uc pal[256][4], int num_entries, int transp)
+{
+   int entry, ch;
+   for (entry = 0; entry < num_entries; ++entry) {
+      for (ch = 2; ch >= 0; --ch) pal[entry][ch] = stbi__get8(s);
+      pal[entry][3] = (stbi_uc) (entry == transp ? 0 : 255);
+   }
+}
+
+// Parses the GIF signature and logical screen descriptor into g (w, h, flags,
+// bgindex, ratio; transparent reset to -1) and, unless is_info is set, the
+// global color table when flags bit 0x80 is present. Returns 1 on success or
+// the stbi__err result on a bad signature / oversized image.
+static int stbi__gif_header(stbi__context *s, stbi__gif *g, int *comp, int is_info)
+{
+   static const char sig[4] = { 'G', 'I', 'F', '8' };
+   int k, version;
+
+   for (k = 0; k < 4; ++k)
+      if (stbi__get8(s) != sig[k]) return stbi__err("not GIF", "Corrupt GIF");
+   version = stbi__get8(s);
+   if (!(version == '7' || version == '9')) return stbi__err("not GIF", "Corrupt GIF");
+   if (stbi__get8(s) != 'a')                return stbi__err("not GIF", "Corrupt GIF");
+
+   stbi__g_failure_reason = "";
+   g->w = stbi__get16le(s);
+   g->h = stbi__get16le(s);
+   g->flags = stbi__get8(s);
+   g->bgindex = stbi__get8(s);
+   g->ratio = stbi__get8(s);
+   g->transparent = -1;
+
+   if (g->w > STBI_MAX_DIMENSIONS || g->h > STBI_MAX_DIMENSIONS)
+      return stbi__err("too large","Very large image (corrupt?)");
+   if (comp) *comp = 4;  // can't actually tell whether it's 3 or 4 until we parse the comments
+   if (!is_info && (g->flags & 0x80))
+      stbi__gif_parse_colortable(s,g->pal, 2 << (g->flags & 7), -1);
+   return 1;
+}
+
+// Reads only the GIF header (into a temporary heap-allocated stbi__gif) to report *x, *y and *comp.
+// Returns 1 on success; on header failure calls stbi__rewind on the stream and returns 0.
+static int stbi__gif_info_raw(stbi__context *s, int *x, int *y, int *comp)
+{
+   int ok;
+   stbi__gif *hdr = (stbi__gif *) stbi__malloc(sizeof(stbi__gif));
+   if (!hdr) return stbi__err("outofmem", "Out of memory");
+   ok = stbi__gif_header(s, hdr, comp, 1) ? 1 : 0;
+   if (ok && x) *x = hdr->w;
+   if (ok && y) *y = hdr->h;
+   STBI_FREE(hdr);
+   if (!ok) stbi__rewind( s );
+   return ok;
+}
+
+static void stbi__out_gif_code(stbi__gif *g, stbi__uint16 code)
+{  // Writes the pixel(s) that LZW `code` expands to into g->out, advancing the cursor (and interlace pass) as it goes.
+   stbi_uc *p, *c;
+   int idx;
+
+   // recurse to decode the prefixes, since the linked-list is backwards,
+   // and working backwards through an interleaved image would be nasty
+   if (g->codes[code].prefix >= 0)
+      stbi__out_gif_code(g, g->codes[code].prefix);
+
+   if (g->cur_y >= g->max_y) return; // cursor is past the frame rectangle: drop the pixel
+
+   idx = g->cur_x + g->cur_y; // both are byte offsets, so idx is a byte offset into out
+   p = &g->out[idx];
+   g->history[idx / 4] = 1; // mark this pixel as touched by the current frame
+
+   c = &g->color_table[g->codes[code].suffix * 4];
+   if (c[3] > 128) { // don't render transparent pixels;
+      p[0] = c[2];
+      p[1] = c[1];
+      p[2] = c[0];
+      p[3] = c[3];
+   }
+   g->cur_x += 4;
+
+   if (g->cur_x >= g->max_x) { // end of row: wrap to the left edge and step down
+      g->cur_x = g->start_x;
+      g->cur_y += g->step;
+
+      while (g->cur_y >= g->max_y && g->parse > 0) { // ran off the bottom: start the next interlace pass, if any remain
+         g->step = (1 << g->parse) * g->line_size;
+         g->cur_y = g->start_y + (g->step >> 1);
+         --g->parse;
+      }
+   }
+}
+
+static stbi_uc *stbi__process_gif_raster(stbi__context *s, stbi__gif *g)
+{  // Runs the LZW decoder over the image data sub-blocks, drawing via stbi__out_gif_code. Returns g->out, or NULL / the stbi__errpuc result on bad data.
+   stbi_uc lzw_cs;
+   stbi__int32 len, init_code;
+   stbi__uint32 first;
+   stbi__int32 codesize, codemask, avail, oldcode, bits, valid_bits, clear;
+   stbi__gif_lzw *p;
+
+   lzw_cs = stbi__get8(s);
+   if (lzw_cs > 12) return NULL; // reject minimum code sizes above 12 bits
+   clear = 1 << lzw_cs;
+   first = 1; // stays set until the first clear code is seen
+   codesize = lzw_cs + 1;
+   codemask = (1 << codesize) - 1;
+   bits = 0;
+   valid_bits = 0;
+   for (init_code = 0; init_code < clear; init_code++) { // root codes: each expands to its own byte value
+      g->codes[init_code].prefix = -1;
+      g->codes[init_code].first = (stbi_uc) init_code;
+      g->codes[init_code].suffix = (stbi_uc) init_code;
+   }
+
+   // support no starting clear code
+   avail = clear+2;
+   oldcode = -1;
+
+   len = 0;
+   for(;;) {
+      if (valid_bits < codesize) { // not enough bits buffered: pull one more byte
+         if (len == 0) {
+            len = stbi__get8(s); // start new block
+            if (len == 0)
+               return g->out;
+         }
+         --len;
+         bits |= (stbi__int32) stbi__get8(s) << valid_bits;
+         valid_bits += 8;
+      } else {
+         stbi__int32 code = bits & codemask;
+         bits >>= codesize;
+         valid_bits -= codesize;
+         // @OPTIMIZE: is there some way we can accelerate the non-clear path?
+         if (code == clear) {  // clear code
+            codesize = lzw_cs + 1;
+            codemask = (1 << codesize) - 1;
+            avail = clear + 2;
+            oldcode = -1;
+            first = 0;
+         } else if (code == clear + 1) { // end of stream code
+            stbi__skip(s, len);
+            while ((len = stbi__get8(s)) > 0)
+               stbi__skip(s,len);
+            return g->out;
+         } else if (code <= avail) {
+            if (first) {
+               return stbi__errpuc("no clear code", "Corrupt GIF");
+            }
+
+            if (oldcode >= 0) { // add a new table entry: previous string plus one byte
+               p = &g->codes[avail++];
+               if (avail > 8192) {
+                  return stbi__errpuc("too many codes", "Corrupt GIF");
+               }
+
+               p->prefix = (stbi__int16) oldcode;
+               p->first = g->codes[oldcode].first;
+               p->suffix = (code == avail) ? p->first : g->codes[code].first;
+            } else if (code == avail)
+               return stbi__errpuc("illegal code in raster", "Corrupt GIF");
+
+            stbi__out_gif_code(g, (stbi__uint16) code);
+
+            if ((avail & codemask) == 0 && avail <= 0x0FFF) { // table filled the current width: widen codes by one bit
+               codesize++;
+               codemask = (1 << codesize) - 1;
+            }
+
+            oldcode = code;
+         } else {
+            return stbi__errpuc("illegal code in raster", "Corrupt GIF");
+         }
+      }
+   }
+}
+
+// this function is designed to support animated gifs, although stb_image doesn't support it
+// two back is the image from two frames ago, used for a very specific disposal format
+static stbi_uc *stbi__gif_load_next(stbi__context *s, stbi__gif *g, int *comp, int req_comp, stbi_uc *two_back)
+{  // Decodes the next frame into g->out (4 bytes per pixel). Returns g->out, (stbi_uc *) s at the stream terminator, or 0 / NULL / the stbi__errpuc result on error.
+   int dispose;
+   int first_frame;
+   int pi;
+   int pcount;
+   STBI_NOTUSED(req_comp);
+
+   // on first frame, any non-written pixels get the background colour (non-transparent)
+   first_frame = 0;
+   if (g->out == 0) { // no buffers yet: this is the first frame, so parse the header and allocate
+      if (!stbi__gif_header(s, g, comp,0)) return 0; // stbi__g_failure_reason set by stbi__gif_header
+      if (!stbi__mad3sizes_valid(4, g->w, g->h, 0))
+         return stbi__errpuc("too large", "GIF image is too large");
+      pcount = g->w * g->h;
+      g->out = (stbi_uc *) stbi__malloc(4 * pcount);
+      g->background = (stbi_uc *) stbi__malloc(4 * pcount);
+      g->history = (stbi_uc *) stbi__malloc(pcount);
+      if (!g->out || !g->background || !g->history) // buffers that did get allocated are not freed here
+         return stbi__errpuc("outofmem", "Out of memory");
+
+      // image is treated as "transparent" at the start - ie, nothing overwrites the current background;
+      // background colour is only used for pixels that are not rendered first frame, after that "background"
+      // color refers to the color that was there the previous frame.
+      memset(g->out, 0x00, 4 * pcount);
+      memset(g->background, 0x00, 4 * pcount); // state of the background (starts transparent)
+      memset(g->history, 0x00, pcount);        // pixels that were affected previous frame
+      first_frame = 1;
+   } else {
+      // second frame - how do we dispose of the previous one?
+      dispose = (g->eflags & 0x1C) >> 2;
+      pcount = g->w * g->h;
+
+      if ((dispose == 3) && (two_back == 0)) {
+         dispose = 2; // if I don't have an image to revert back to, default to the old background
+      }
+
+      if (dispose == 3) { // use previous graphic
+         for (pi = 0; pi < pcount; ++pi) {
+            if (g->history[pi]) {
+               memcpy( &g->out[pi * 4], &two_back[pi * 4], 4 );
+            }
+         }
+      } else if (dispose == 2) {
+         // restore what was changed last frame to background before that frame;
+         for (pi = 0; pi < pcount; ++pi) {
+            if (g->history[pi]) {
+               memcpy( &g->out[pi * 4], &g->background[pi * 4], 4 );
+            }
+         }
+      } else {
+         // This is a non-disposal case either way, so just
+         // leave the pixels as is, and they will become the new background
+         // 1: do not dispose
+         // 0:  not specified.
+      }
+
+      // background is what out is after the undoing of the previous frame;
+      memcpy( g->background, g->out, 4 * g->w * g->h );
+   }
+
+   // clear my history;
+   memset( g->history, 0x00, g->w * g->h );        // pixels that were affected previous frame
+
+   for (;;) { // walk the blocks until an image is decoded, the terminator is hit, or an error occurs
+      int tag = stbi__get8(s);
+      switch (tag) {
+         case 0x2C: /* Image Descriptor */
+         {
+            stbi__int32 x, y, w, h;
+            stbi_uc *o;
+
+            x = stbi__get16le(s);
+            y = stbi__get16le(s);
+            w = stbi__get16le(s);
+            h = stbi__get16le(s);
+            if (((x + w) > (g->w)) || ((y + h) > (g->h)))
+               return stbi__errpuc("bad Image Descriptor", "Corrupt GIF");
+
+            // all cursor fields below are byte offsets into g->out
+            g->line_size = g->w * 4;
+            g->start_x = x * 4;
+            g->start_y = y * g->line_size;
+            g->max_x   = g->start_x + w * 4;
+            g->max_y   = g->start_y + h * g->line_size;
+            g->cur_x   = g->start_x;
+            g->cur_y   = g->start_y;
+
+            // if the width of the specified rectangle is 0, that means
+            // we may not see *any* pixels or the image is malformed;
+            // to make sure this is caught, move the current y down to
+            // max_y (which is what out_gif_code checks).
+            if (w == 0)
+               g->cur_y = g->max_y;
+
+            g->lflags = stbi__get8(s);
+
+            if (g->lflags & 0x40) {
+               g->step = 8 * g->line_size; // first interlaced spacing
+               g->parse = 3;
+            } else {
+               g->step = g->line_size;
+               g->parse = 0;
+            }
+
+            if (g->lflags & 0x80) { // image carries its own local color table
+               stbi__gif_parse_colortable(s,g->lpal, 2 << (g->lflags & 7), g->eflags & 0x01 ? g->transparent : -1);
+               g->color_table = (stbi_uc *) g->lpal;
+            } else if (g->flags & 0x80) { // fall back to the global color table
+               g->color_table = (stbi_uc *) g->pal;
+            } else
+               return stbi__errpuc("missing color table", "Corrupt GIF");
+
+            o = stbi__process_gif_raster(s, g);
+            if (!o) return NULL;
+
+            // if this was the first frame,
+            pcount = g->w * g->h;
+            if (first_frame && (g->bgindex > 0)) {
+               // if first frame, any pixel not drawn to gets the background color
+               for (pi = 0; pi < pcount; ++pi) {
+                  if (g->history[pi] == 0) {
+                     g->pal[g->bgindex][3] = 255; // just in case it was made transparent, undo that; It will be reset next frame if need be;
+                     memcpy( &g->out[pi * 4], &g->pal[g->bgindex], 4 );
+                  }
+               }
+            }
+
+            return o;
+         }
+
+         case 0x21: // Extension block; only the Graphic Control Extension (0xF9) is interpreted, others are skipped.
+         {
+            int len;
+            int ext = stbi__get8(s);
+            if (ext == 0xF9) { // Graphic Control Extension.
+               len = stbi__get8(s);
+               if (len == 4) {
+                  g->eflags = stbi__get8(s);
+                  g->delay = 10 * stbi__get16le(s); // delay - 1/100th of a second, saving as 1/1000ths.
+
+                  // unset old transparent
+                  if (g->transparent >= 0) {
+                     g->pal[g->transparent][3] = 255;
+                  }
+                  if (g->eflags & 0x01) {
+                     g->transparent = stbi__get8(s);
+                     if (g->transparent >= 0) {
+                        g->pal[g->transparent][3] = 0;
+                     }
+                  } else {
+                     // don't need transparent
+                     stbi__skip(s, 1);
+                     g->transparent = -1;
+                  }
+               } else {
+                  stbi__skip(s, len);
+                  break;
+               }
+            }
+            while ((len = stbi__get8(s)) != 0) { // skip remaining sub-blocks up to the zero-length terminator
+               stbi__skip(s, len);
+            }
+            break;
+         }
+
+         case 0x3B: // gif stream termination code
+            return (stbi_uc *) s; // using '1' causes warning on some compilers
+
+         default:
+            return stbi__errpuc("unknown code", "Corrupt GIF");
+      }
+   }
+}
+
+// Out-of-memory exit for stbi__load_gif_main: frees decoder buffers, `out` and `*delays`, then reports the error.
+static void *stbi__load_gif_main_outofmem(stbi__gif *g, stbi_uc *out, int **delays)
+{
+   STBI_FREE(g->out);
+   STBI_FREE(g->history);
+   STBI_FREE(g->background);
+   if (out) STBI_FREE(out);
+   if (delays && *delays) { STBI_FREE(*delays); *delays = 0; } // reset so the caller is not left with a dangling pointer
+   return stbi__errpuc("outofmem", "Out of memory");
+}
+
+// Decodes every frame of a GIF into one buffer of consecutive 4-channel frames (converted to req_comp at the end).
+// *x/*y get the frame size, *z the frame count and, when delays is non-NULL, *delays one delay in ms per frame.
+static void *stbi__load_gif_main(stbi__context *s, int **delays, int *x, int *y, int *z, int *comp, int req_comp)
+{
+   if (stbi__gif_test(s)) {
+      int layers = 0;
+      stbi_uc *u = 0;
+      stbi_uc *out = 0;
+      stbi_uc *two_back = 0;
+      stbi__gif g;
+      int stride;
+      int out_size = 0;
+      int delays_size = 0;
+
+      STBI_NOTUSED(out_size);
+      STBI_NOTUSED(delays_size);
+
+      memset(&g, 0, sizeof(g));
+      if (delays) *delays = 0;
+
+      do {
+         u = stbi__gif_load_next(s, &g, comp, req_comp, two_back);
+         if (u == (stbi_uc *) s) u = 0;  // end of animated gif marker
+
+         if (u) {
+            *x = g.w;
+            *y = g.h;
+            ++layers;
+            stride = g.w * g.h * 4;
+
+            if (out) {
+               void *tmp = (stbi_uc*) STBI_REALLOC_SIZED( out, out_size, layers * stride );
+               if (!tmp)
+                  return stbi__load_gif_main_outofmem(&g, out, delays);
+               else {
+                   out = (stbi_uc*) tmp;
+                   out_size = layers * stride;
+               }
+
+               if (delays) {
+                  int *new_delays = (int*) STBI_REALLOC_SIZED( *delays, delays_size, sizeof(int) * layers );
+                  if (!new_delays)
+                     return stbi__load_gif_main_outofmem(&g, out, delays);
+                  *delays = new_delays;
+                  delays_size = layers * sizeof(int);
+               }
+            } else {
+               out = (stbi_uc*)stbi__malloc( layers * stride );
+               if (!out)
+                  return stbi__load_gif_main_outofmem(&g, out, delays);
+               out_size = layers * stride;
+               if (delays) {
+                  *delays = (int*) stbi__malloc( layers * sizeof(int) );
+                  if (!*delays)
+                     return stbi__load_gif_main_outofmem(&g, out, delays);
+                  delays_size = layers * sizeof(int);
+               }
+            }
+            memcpy( out + ((layers - 1) * stride), u, stride );
+            if (layers >= 2) {
+               two_back = out + (layers - 2) * stride; // frame before the one just stored; recomputed each pass because realloc may move out
+            }
+
+            if (delays) {
+               (*delays)[layers - 1U] = g.delay;
+            }
+         }
+      } while (u != 0);
+
+      // free temp buffer;
+      STBI_FREE(g.out);
+      STBI_FREE(g.history);
+      STBI_FREE(g.background);
+
+      // do the final conversion after loading everything;
+      if (req_comp && req_comp != 4)
+         out = stbi__convert_format(out, 4, req_comp, layers * g.w, g.h);
+
+      *z = layers;
+      return out;
+   } else {
+      return stbi__errpuc("not GIF", "Image was not as a gif type.");
+   }
+}
+
+// Single-image GIF entry point: decodes only the first frame and returns it (converted from 4 channels to req_comp when asked), or NULL.
+static void *stbi__gif_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri)
+{
+   stbi_uc *u = 0;
+   stbi__gif g;
+   memset(&g, 0, sizeof(g));
+   STBI_NOTUSED(ri);
+   u = stbi__gif_load_next(s, &g, comp, req_comp, 0);
+   if (u == (stbi_uc *) s) u = 0;  // the context pointer itself is the end-of-stream sentinel, not pixel data
+   if (u) {
+      *x = g.w;
+      *y = g.h;
+
+      // moved conversion to after successful load so that the same
+      // can be done for multiple frames.
+      if (req_comp && req_comp != 4)
+         u = stbi__convert_format(u, 4, req_comp, g.w, g.h);
+   } else if (g.out) {
+      // if there was an error and we allocated an image buffer, free it!
+      STBI_FREE(g.out);
+   }
+
+   // free buffers needed for multiple frame loading;
+   STBI_FREE(g.history);
+   STBI_FREE(g.background);
+
+   return u;
+}
+
+static int stbi__gif_info(stbi__context *s, int *x, int *y, int *comp)
+{
+   return stbi__gif_info_raw(s,x,y,comp); // thin forwarder: the result is whatever stbi__gif_info_raw returns
+}
+#endif
+
+// *************************************************************************************************
+// Radiance RGBE HDR loader
+// originally by Nicolas Schulz
+#ifndef STBI_NO_HDR
+// Returns 1 (after rewinding) when the next bytes of s equal signature; returns 0 at the first mismatch without rewinding.
+static int stbi__hdr_test_core(stbi__context *s, const char *signature)
+{
+   const char *expected;
+   for (expected = signature; *expected; ++expected)
+      if (stbi__get8(s) != *expected) return 0;
+   stbi__rewind(s);
+   return 1;
+}
+
+// Nonzero when the stream starts with either accepted signature line; the stream is rewound after each attempt.
+static int stbi__hdr_test(stbi__context* s)
+{
+   int matched = stbi__hdr_test_core(s, "#?RADIANCE\n");
+   stbi__rewind(s);
+   if (matched) return matched;
+   matched = stbi__hdr_test_core(s, "#?RGBE\n");
+   stbi__rewind(s);
+   return matched;
+}
+
+#define STBI__HDR_BUFLEN  1024
+// Reads one line (without its '\n') into buffer, NUL-terminates it and returns buffer; buffer must hold STBI__HDR_BUFLEN chars.
+static char *stbi__hdr_gettoken(stbi__context *z, char *buffer)
+{
+   int len=0;
+   char c = '\0';
+   c = (char) stbi__get8(z);
+
+   while (!stbi__at_eof(z) && c != '\n') {
+      buffer[len++] = c;
+      if (len == STBI__HDR_BUFLEN-1) {
+         // buffer is full (one slot kept for the terminator): discard the rest of the line
+         while (!stbi__at_eof(z) && stbi__get8(z) != '\n')
+            ;
+         break;
+      }
+      c = (char) stbi__get8(z);
+   }
+
+   buffer[len] = 0;
+   return buffer;
+}
+
+static void stbi__hdr_convert(float *output, stbi_uc *input, int req_comp) // one 4-byte RGBE pixel -> req_comp floats
+{
+   if ( input[3] != 0 ) {
+      float f1;
+      // Scale shared by all three mantissas: 2^(exponent byte - 136)
+      f1 = (float) ldexp(1.0f, input[3] - (int)(128 + 8));
+      if (req_comp <= 2)
+         output[0] = (input[0] + input[1] + input[2]) * f1 / 3; // 1 or 2 channels: average R, G, B into a single value
+      else {
+         output[0] = input[0] * f1;
+         output[1] = input[1] * f1;
+         output[2] = input[2] * f1;
+      }
+      if (req_comp == 2) output[1] = 1; // the extra channel of 2- and 4-channel output is always written as 1
+      if (req_comp == 4) output[3] = 1;
+   } else { // zero exponent byte: colour channels are written as 0
+      switch (req_comp) {
+         case 4: output[3] = 1; /* fallthrough */
+         case 3: output[0] = output[1] = output[2] = 0;
+                 break;
+         case 2: output[1] = 1; /* fallthrough */
+         case 1: output[0] = 0;
+                 break;
+      }
+   }
+}
+
+// Decodes a Radiance RGBE image into a newly allocated float buffer of width*height*req_comp values (req_comp 0 means 3).
+// Returns the stbi__errpf result on a bad header, an oversized image, an allocation failure or corrupt RLE data.
+static float *stbi__hdr_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri)
+{
+   char buffer[STBI__HDR_BUFLEN];
+   char *token;
+   int valid = 0;
+   int width, height;
+   stbi_uc *scanline;
+   float *hdr_data;
+   int len;
+   unsigned char count, value;
+   int i, j, k, c1,c2, z;
+   const char *headerToken;
+   STBI_NOTUSED(ri);
+
+   // Check identifier
+   headerToken = stbi__hdr_gettoken(s,buffer);
+   if (strcmp(headerToken, "#?RADIANCE") != 0 && strcmp(headerToken, "#?RGBE") != 0)
+      return stbi__errpf("not HDR", "Corrupt HDR image");
+
+   // Parse header
+   for(;;) {
+      token = stbi__hdr_gettoken(s,buffer);
+      if (token[0] == 0) break;
+      if (strcmp(token, "FORMAT=32-bit_rle_rgbe") == 0) valid = 1;
+   }
+
+   if (!valid)    return stbi__errpf("unsupported format", "Unsupported HDR format");
+
+   // Parse width and height
+   // can't use sscanf() if we're not using stdio!
+   token = stbi__hdr_gettoken(s,buffer);
+   if (strncmp(token, "-Y ", 3))  return stbi__errpf("unsupported data layout", "Unsupported HDR format");
+   token += 3;
+   height = (int) strtol(token, &token, 10);
+   while (*token == ' ') ++token;
+   if (strncmp(token, "+X ", 3))  return stbi__errpf("unsupported data layout", "Unsupported HDR format");
+   token += 3;
+   width = (int) strtol(token, NULL, 10);
+
+   if (height > STBI_MAX_DIMENSIONS) return stbi__errpf("too large","Very large image (corrupt?)");
+   if (width > STBI_MAX_DIMENSIONS) return stbi__errpf("too large","Very large image (corrupt?)");
+
+   *x = width;
+   *y = height;
+
+   if (comp) *comp = 3;
+   if (req_comp == 0) req_comp = 3;
+
+   if (!stbi__mad4sizes_valid(width, height, req_comp, sizeof(float), 0))
+      return stbi__errpf("too large", "HDR image is too large");
+
+   // Read data
+   hdr_data = (float *) stbi__malloc_mad4(width, height, req_comp, sizeof(float), 0);
+   if (!hdr_data) return stbi__errpf("outofmem", "Out of memory");
+
+   // Load image data
+   // image data is stored as some number of scanlines, either flat or run-length encoded
+   if ( width < 8 || width >= 32768) {
+      // Read flat data
+      for (j=0; j < height; ++j) {
+         for (i=0; i < width; ++i) {
+            stbi_uc rgbe[4];
+           main_decode_loop:
+            stbi__getn(s, rgbe, 4);
+            stbi__hdr_convert(hdr_data + j * width * req_comp + i * req_comp, rgbe, req_comp);
+         }
+      }
+   } else {
+      // Read RLE-encoded data
+      scanline = NULL;
+
+      for (j = 0; j < height; ++j) {
+         c1 = stbi__get8(s);
+         c2 = stbi__get8(s);
+         len = stbi__get8(s);
+         if (c1 != 2 || c2 != 2 || (len & 0x80)) {
+            // not run-length encoded, so we have to actually use THIS data as a decoded
+            // pixel (note this can't be a valid pixel--one of RGB must be >= 128)
+            stbi_uc rgbe[4];
+            rgbe[0] = (stbi_uc) c1;
+            rgbe[1] = (stbi_uc) c2;
+            rgbe[2] = (stbi_uc) len;
+            rgbe[3] = (stbi_uc) stbi__get8(s);
+            stbi__hdr_convert(hdr_data, rgbe, req_comp);
+            i = 1;
+            j = 0;
+            STBI_FREE(scanline);
+            goto main_decode_loop; // yes, this makes no sense
+         }
+         len <<= 8;
+         len |= stbi__get8(s);
+         if (len != width) { STBI_FREE(hdr_data); STBI_FREE(scanline); return stbi__errpf("invalid decoded scanline length", "corrupt HDR"); }
+         if (scanline == NULL) {
+            scanline = (stbi_uc *) stbi__malloc_mad2(width, 4, 0);
+            if (!scanline) {
+               STBI_FREE(hdr_data);
+               return stbi__errpf("outofmem", "Out of memory");
+            }
+         }
+
+         for (k = 0; k < 4; ++k) {
+            int nleft;
+            i = 0;
+            while ((nleft = width - i) > 0) {
+               count = stbi__get8(s);
+               if (count > 128) {
+                  // Run
+                  value = stbi__get8(s);
+                  count -= 128;
+                  if (count > nleft) { STBI_FREE(hdr_data); STBI_FREE(scanline); return stbi__errpf("corrupt", "bad RLE data in HDR"); }
+                  for (z = 0; z < count; ++z)
+                     scanline[i++ * 4 + k] = value;
+               } else {
+                  // Dump; a zero count advances nothing, so reject it or a malformed stream can stall this loop
+                  if ((count == 0) || (count > nleft)) { STBI_FREE(hdr_data); STBI_FREE(scanline); return stbi__errpf("corrupt", "bad RLE data in HDR"); }
+                  for (z = 0; z < count; ++z)
+                     scanline[i++ * 4 + k] = stbi__get8(s);
+               }
+            }
+         }
+         for (i=0; i < width; ++i)
+            stbi__hdr_convert(hdr_data+(j*width + i)*req_comp, scanline + i*4, req_comp);
+      }
+      if (scanline) STBI_FREE(scanline);
+   }
+
+   return hdr_data;
+}
+
+// Reads only the HDR header: stores height/width in *y/*x and 3 in *comp and returns 1, or rewinds and returns 0.
+static int stbi__hdr_info(stbi__context *s, int *x, int *y, int *comp)
+{
+   char buffer[STBI__HDR_BUFLEN];
+   char *token;
+   int valid = 0;
+   int dummy;
+   if (!x) x = &dummy;
+   if (!y) y = &dummy;
+   if (!comp) comp = &dummy;
+
+   if (stbi__hdr_test(s) == 0) {
+       stbi__rewind( s );
+       return 0;
+   }
+
+   for(;;) { // scan header lines up to the first empty one, looking for the only supported FORMAT
+      token = stbi__hdr_gettoken(s,buffer);
+      if (token[0] == 0) break;
+      if (strcmp(token, "FORMAT=32-bit_rle_rgbe") == 0) valid = 1;
+   }
+
+   if (!valid) {
+       stbi__rewind( s );
+       return 0;
+   }
+   token = stbi__hdr_gettoken(s,buffer); // resolution line, accepted only in the form "-Y <height> +X <width>"
+   if (strncmp(token, "-Y ", 3)) {
+       stbi__rewind( s );
+       return 0;
+   }
+   token += 3;
+   *y = (int) strtol(token, &token, 10);
+   while (*token == ' ') ++token;
+   if (strncmp(token, "+X ", 3)) {
+       stbi__rewind( s );
+       return 0;
+   }
+   token += 3;
+   *x = (int) strtol(token, NULL, 10);
+   *comp = 3;
+   return 1;
+}
+#endif // STBI_NO_HDR
+
+#ifndef STBI_NO_BMP
+// Parses the BMP header via stbi__bmp_parse_header and reports size/channel count; rewinds and returns 0 if parsing fails.
+static int stbi__bmp_info(stbi__context *s, int *x, int *y, int *comp)
+{
+   void *p;
+   stbi__bmp_data info;
+   info.all_a = 255;
+   p = stbi__bmp_parse_header(s, &info);
+   if (p == NULL) {
+      stbi__rewind( s );
+      return 0;
+   }
+   if (x) *x = s->img_x;
+   if (y) *y = s->img_y;
+   if (comp) {
+      if (info.bpp == 24 && info.ma == 0xff000000) // 24 bpp with this mask value is reported as 3 channels
+         *comp = 3;
+      else
+         *comp = info.ma ? 4 : 3; // otherwise 4 channels exactly when info.ma is nonzero
+   }
+   return 1;
+}
+#endif
+
+#ifndef STBI_NO_PSD
+static int stbi__psd_info(stbi__context *s, int *x, int *y, int *comp) // header-only probe: 1 on success, else rewind and 0
+{
+   int channelCount, dummy, depth;
+   if (!x) x = &dummy;
+   if (!y) y = &dummy;
+   if (!comp) comp = &dummy;
+   if (stbi__get32be(s) != 0x38425053) { // signature bytes: ASCII "8BPS"
+       stbi__rewind( s );
+       return 0;
+   }
+   if (stbi__get16be(s) != 1) { // only the value 1 is accepted in the next 16-bit field
+       stbi__rewind( s );
+       return 0;
+   }
+   stbi__skip(s, 6);
+   channelCount = stbi__get16be(s);
+   if (channelCount < 0 || channelCount > 16) {
+       stbi__rewind( s );
+       return 0;
+   }
+   *y = stbi__get32be(s); // height is stored before width
+   *x = stbi__get32be(s);
+   depth = stbi__get16be(s);
+   if (depth != 8 && depth != 16) {
+       stbi__rewind( s );
+       return 0;
+   }
+   if (stbi__get16be(s) != 3) { // only the value 3 is accepted in this 16-bit field
+       stbi__rewind( s );
+       return 0;
+   }
+   *comp = 4; // always reported as 4 channels, whatever channelCount was
+   return 1;
+}
+
+static int stbi__psd_is16(stbi__context *s) // 1 when the PSD header declares a depth of 16; otherwise rewinds and returns 0
+{
+   int channelCount, depth;
+   if (stbi__get32be(s) != 0x38425053) { // signature bytes: ASCII "8BPS"
+       stbi__rewind( s );
+       return 0;
+   }
+   if (stbi__get16be(s) != 1) {
+       stbi__rewind( s );
+       return 0;
+   }
+   stbi__skip(s, 6);
+   channelCount = stbi__get16be(s);
+   if (channelCount < 0 || channelCount > 16) {
+       stbi__rewind( s );
+       return 0;
+   }
+   // Skip the two 32-bit size fields explicitly: a read wrapped in STBI_NOTUSED() may never run if the macro uses sizeof.
+   stbi__skip(s, 8);
+   depth = stbi__get16be(s);
+   if (depth != 16) {
+       stbi__rewind( s );
+       return 0;
+   }
+   return 1;
+}
+#endif
+
+#ifndef STBI_NO_PIC
+// Header-only probe for PIC files: stores width/height and 3 or 4 in *comp and returns 1; on any failure rewinds and returns 0.
+static int stbi__pic_info(stbi__context *s, int *x, int *y, int *comp)
+{
+   int act_comp=0,num_packets=0,chained,dummy;
+   stbi__pic_packet packets[10];
+
+   if (!x) x = &dummy;
+   if (!y) y = &dummy;
+   if (!comp) comp = &dummy;
+
+   if (!stbi__pic_is4(s,"\x53\x80\xF6\x34")) {
+      stbi__rewind(s);
+      return 0;
+   }
+
+   stbi__skip(s, 88);
+
+   *x = stbi__get16be(s);
+   *y = stbi__get16be(s);
+   if (stbi__at_eof(s)) {
+      stbi__rewind( s);
+      return 0;
+   }
+   if ( (*x) != 0 && (1 << 28) / (*x) < (*y)) { // reject sizes whose pixel count would exceed 1 << 28
+      stbi__rewind( s );
+      return 0;
+   }
+
+   stbi__skip(s, 8);
+
+   do {
+      stbi__pic_packet *packet;
+      if (num_packets==sizeof(packets)/sizeof(packets[0])) {
+         stbi__rewind( s ); // packet table full: rewind like every other failure path here
+         return 0;
+      }
+      packet = &packets[num_packets++];
+      chained = stbi__get8(s);
+      packet->size    = stbi__get8(s);
+      packet->type    = stbi__get8(s);
+      packet->channel = stbi__get8(s);
+      act_comp |= packet->channel;
+
+      if (stbi__at_eof(s)) {
+          stbi__rewind( s );
+          return 0;
+      }
+      if (packet->size != 8) {
+          stbi__rewind( s );
+          return 0;
+      }
+   } while (chained);
+
+   *comp = (act_comp & 0x10 ? 4 : 3); // 4 channels when any packet's channel mask has bit 0x10 set
+   return 1;
+}
+#endif
+
+// *************************************************************************************************
+// Portable Gray Map and Portable Pixel Map loader
+// by Ken Miller
+//
+// PGM: http://netpbm.sourceforge.net/doc/pgm.html
+// PPM: http://netpbm.sourceforge.net/doc/ppm.html
+//
+// Known limitations:
+//    Does not support comments in the header section
+//    Does not support ASCII image data (formats P2 and P3)
+
+#ifndef STBI_NO_PNM
+
+static int      stbi__pnm_test(stbi__context *s)
+{
+   // Accepted files start with the two characters "P5" or "P6".
+   char magic  = (char) stbi__get8(s);
+   char format = (char) stbi__get8(s);
+   if (magic == 'P' && (format == '5' || format == '6'))
+      return 1;
+   // Anything else: rewind the stream before reporting failure.
+   stbi__rewind( s );
+   return 0;
+}
+
+// Loads a binary P5/P6 image: returns the pixel buffer (converted to req_comp when requested) or a failure result.
+static void *stbi__pnm_load(stbi__context *s, int *x, int *y, int *comp, int req_comp, stbi__result_info *ri)
+{
+   stbi_uc *out;
+
+   ri->bits_per_channel = stbi__pnm_info(s, (int *)&s->img_x, (int *)&s->img_y, (int *)&s->img_n);
+   if (ri->bits_per_channel == 0)
+      return 0;
+
+   if (s->img_y > STBI_MAX_DIMENSIONS) return stbi__errpuc("too large","Very large image (corrupt?)");
+   if (s->img_x > STBI_MAX_DIMENSIONS) return stbi__errpuc("too large","Very large image (corrupt?)");
+
+   *x = s->img_x;
+   *y = s->img_y;
+   if (comp) *comp = s->img_n;
+
+   if (!stbi__mad4sizes_valid(s->img_n, s->img_x, s->img_y, ri->bits_per_channel / 8, 0))
+      return stbi__errpuc("too large", "PNM too large");
+
+   out = (stbi_uc *) stbi__malloc_mad4(s->img_n, s->img_x, s->img_y, ri->bits_per_channel / 8, 0);
+   if (!out) return stbi__errpuc("outofmem", "Out of memory");
+   // a short read must fail here, otherwise uninitialized heap bytes are handed back as pixels
+   if (!stbi__getn(s, out, s->img_n * s->img_x * s->img_y * (ri->bits_per_channel / 8))) { STBI_FREE(out); return stbi__errpuc("bad PNM", "PNM file truncated"); }
+   if (req_comp && req_comp != s->img_n) { // NOTE(review): the same converter is used for 16-bit data -- confirm it handles that
+      out = stbi__convert_format(out, s->img_n, req_comp, s->img_x, s->img_y);
+      if (out == NULL) return out; // stbi__convert_format frees input on failure
+   }
+   return out;
+}
+
+static int      stbi__pnm_isspace(char c) // nonzero for space, tab, newline, vertical tab, form feed or carriage return
+{
+   return c == ' ' || c == '\t' || c == '\n' || c == '\v' || c == '\f' || c == '\r';
+}
+
+static void     stbi__pnm_skip_whitespace(stbi__context *s, char *c) // *c is the current lookahead character, updated in place
+{
+   for (;;) {
+      while (!stbi__at_eof(s) && stbi__pnm_isspace(*c))
+         *c = (char) stbi__get8(s);
+      // done unless the lookahead starts a '#' comment
+      if (stbi__at_eof(s) || *c != '#')
+         break;
+      // consume the comment up to its line end, then loop to skip the whitespace that follows
+      while (!stbi__at_eof(s) && *c != '\n' && *c != '\r' )
+         *c = (char) stbi__get8(s);
+   }
+}
+
+static int      stbi__pnm_isdigit(char c) // nonzero for the characters '0' through '9'
+{
+   return c >= '0' && c <= '9';
+}
+
+// Parses the decimal digits starting at lookahead *c; consumes the whole run and saturates at 2147483647 instead of overflowing.
+static int      stbi__pnm_getinteger(stbi__context *s, char *c)
+{
+   int value = 0;
+   while (!stbi__at_eof(s) && stbi__pnm_isdigit(*c)) {
+      if (value > (2147483647 - (*c - '0')) / 10) value = 2147483647; // value*10 + digit would overflow a 32-bit int (UB)
+      else value = value*10 + (*c - '0');
+      *c = (char) stbi__get8(s);
+   }
+   return value;
+}
+
+// Parses a P5/P6 header from the start of the stream into *x, *y, *comp; returns 8 or 16 (bits per channel), or 0 on a bad magic.
+static int      stbi__pnm_info(stbi__context *s, int *x, int *y, int *comp)
+{
+   int maxv, dummy;
+   char c, p, t;
+   if (!x) x = &dummy;
+   if (!y) y = &dummy;
+   if (!comp) comp = &dummy;
+
+   stbi__rewind(s);
+
+   // Get identifier
+   p = (char) stbi__get8(s);
+   t = (char) stbi__get8(s);
+   if (p != 'P' || (t != '5' && t != '6')) {
+       stbi__rewind(s);
+       return 0;
+   }
+
+   *comp = (t == '6') ? 3 : 1;  // '5' is 1-component .pgm; '6' is 3-component .ppm
+
+   c = (char) stbi__get8(s); // prime the one-character lookahead shared by the helpers below
+   stbi__pnm_skip_whitespace(s, &c);
+
+   *x = stbi__pnm_getinteger(s, &c); // read width
+   stbi__pnm_skip_whitespace(s, &c);
+
+   *y = stbi__pnm_getinteger(s, &c); // read height
+   stbi__pnm_skip_whitespace(s, &c);
+
+   maxv = stbi__pnm_getinteger(s, &c);  // read max value
+   if (maxv > 65535)
+      return stbi__err("max value > 65535", "PPM image supports only 8-bit and 16-bit images");
+   else if (maxv > 255)
+      return 16; // samples above 255 are reported as 16 bits per channel
+   else
+      return 8;
+}
+
+static int stbi__pnm_is16(stbi__context *s)
+{
+   // stbi__pnm_info returns the bits per channel it found; only an exact 16 counts as a 16-bit file
+   int bits_per_channel = stbi__pnm_info(s, NULL, NULL, NULL);
+   return (bits_per_channel == 16) ? 1 : 0;
+}
+#endif
+
+// Tries each compiled-in format's info routine in order and returns 1 at the first that succeeds; otherwise reports "unknown image type".
+static int stbi__info_main(stbi__context *s, int *x, int *y, int *comp)
+{
+   #ifndef STBI_NO_JPEG
+   if (stbi__jpeg_info(s, x, y, comp)) return 1;
+   #endif
+   #ifndef STBI_NO_PNG
+   if (stbi__png_info(s, x, y, comp))  return 1;
+   #endif
+
+   #ifndef STBI_NO_GIF
+   if (stbi__gif_info(s, x, y, comp))  return 1;
+   #endif
+
+   #ifndef STBI_NO_BMP
+   if (stbi__bmp_info(s, x, y, comp))  return 1;
+   #endif
+
+   #ifndef STBI_NO_PSD
+   if (stbi__psd_info(s, x, y, comp))  return 1;
+   #endif
+
+   #ifndef STBI_NO_PIC
+   if (stbi__pic_info(s, x, y, comp))  return 1;
+   #endif
+
+   #ifndef STBI_NO_PNM
+   if (stbi__pnm_info(s, x, y, comp))  return 1;
+   #endif
+
+   #ifndef STBI_NO_HDR
+   if (stbi__hdr_info(s, x, y, comp))  return 1;
+   #endif
+
+   // test tga last because it's a crappy test!
+   #ifndef STBI_NO_TGA
+   if (stbi__tga_info(s, x, y, comp))
+       return 1;
+   #endif
+   return stbi__err("unknown image type", "Image not of any known type, or corrupt");
+}
+
+// Returns 1 when any compiled-in 16-bit probe (PNG, PSD, PNM) accepts the stream, otherwise 0.
+static int stbi__is_16_main(stbi__context *s)
+{
+   #ifndef STBI_NO_PNG
+   if (stbi__png_is16(s))  return 1;
+   #endif
+   #ifndef STBI_NO_PSD
+   if (stbi__psd_is16(s))  return 1;
+   #endif
+
+   #ifndef STBI_NO_PNM
+   if (stbi__pnm_is16(s))  return 1;
+   #endif
+   return 0;
+}
+
+#ifndef STBI_NO_STDIO
+STBIDEF int stbi_info(char const *filename, int *x, int *y, int *comp) // opens filename and forwards to stbi_info_from_file
+{
+    FILE *f = stbi__fopen(filename, "rb");
+    int result;
+    if (!f) return stbi__err("can't fopen", "Unable to open file");
+    result = stbi_info_from_file(f, x, y, comp);
+    fclose(f); // the handle was opened here, so it is closed here whatever the result
+    return result;
+}
+
+STBIDEF int stbi_info_from_file(FILE *f, int *x, int *y, int *comp) // probes f, then seeks back to where the caller had it
+{
+   int r;
+   stbi__context s;
+   long pos = ftell(f); // remember the caller's position; NOTE(review): an ftell failure is not checked
+   stbi__start_file(&s, f);
+   r = stbi__info_main(&s,x,y,comp);
+   fseek(f,pos,SEEK_SET); // seek back to the remembered position
+   return r;
+}
+
+STBIDEF int stbi_is_16_bit(char const *filename) // opens filename and forwards to stbi_is_16_bit_from_file
+{
+    FILE *f = stbi__fopen(filename, "rb");
+    int result;
+    if (!f) return stbi__err("can't fopen", "Unable to open file");
+    result = stbi_is_16_bit_from_file(f);
+    fclose(f); // the handle was opened here, so it is closed here whatever the result
+    return result;
+}
+
+STBIDEF int stbi_is_16_bit_from_file(FILE *f) // probes f, then seeks back to where the caller had it
+{
+   int r;
+   stbi__context s;
+   long pos = ftell(f); // remember the caller's position; NOTE(review): an ftell failure is not checked
+   stbi__start_file(&s, f);
+   r = stbi__is_16_main(&s);
+   fseek(f,pos,SEEK_SET); // seek back to the remembered position
+   return r;
+}
+#endif // !STBI_NO_STDIO
+
+STBIDEF int stbi_info_from_memory(stbi_uc const *buffer, int len, int *x, int *y, int *comp) // info probe over an in-memory image
+{
+   stbi__context s;
+   stbi__start_mem(&s,buffer,len); // set up a context over buffer/len
+   return stbi__info_main(&s,x,y,comp);
+}
+
+STBIDEF int stbi_info_from_callbacks(stbi_io_callbacks const *c, void *user, int *x, int *y, int *comp) // info probe over user I/O callbacks
+{
+   stbi__context s;
+   stbi__start_callbacks(&s, (stbi_io_callbacks *) c, user); // the cast drops const to match stbi__start_callbacks
+   return stbi__info_main(&s,x,y,comp);
+}
+
+STBIDEF int stbi_is_16_bit_from_memory(stbi_uc const *buffer, int len) // 16-bit probe over an in-memory image
+{
+   stbi__context s;
+   stbi__start_mem(&s,buffer,len); // set up a context over buffer/len
+   return stbi__is_16_main(&s);
+}
+
+STBIDEF int stbi_is_16_bit_from_callbacks(stbi_io_callbacks const *c, void *user) // 16-bit probe over user I/O callbacks
+{
+   stbi__context s;
+   stbi__start_callbacks(&s, (stbi_io_callbacks *) c, user); // the cast drops const to match stbi__start_callbacks
+   return stbi__is_16_main(&s);
+}
+
+#endif // STB_IMAGE_IMPLEMENTATION
+
+/*
+   revision history:
+      2.20  (2019-02-07) support utf8 filenames in Windows; fix warnings and platform ifdefs
+      2.19  (2018-02-11) fix warning
+      2.18  (2018-01-30) fix warnings
+      2.17  (2018-01-29) change stbi__shiftsigned to avoid clang -O2 bug
+                         1-bit BMP
+                         *_is_16_bit api
+                         avoid warnings
+      2.16  (2017-07-23) all functions have 16-bit variants;
+                         STBI_NO_STDIO works again;
+                         compilation fixes;
+                         fix rounding in unpremultiply;
+                         optimize vertical flip;
+                         disable raw_len validation;
+                         documentation fixes
+      2.15  (2017-03-18) fix png-1,2,4 bug; now all Imagenet JPGs decode;
+                         warning fixes; disable run-time SSE detection on gcc;
+                         uniform handling of optional "return" values;
+                         thread-safe initialization of zlib tables
+      2.14  (2017-03-03) remove deprecated STBI_JPEG_OLD; fixes for Imagenet JPGs
+      2.13  (2016-11-29) add 16-bit API, only supported for PNG right now
+      2.12  (2016-04-02) fix typo in 2.11 PSD fix that caused crashes
+      2.11  (2016-04-02) allocate large structures on the stack
+                         remove white matting for transparent PSD
+                         fix reported channel count for PNG & BMP
+                         re-enable SSE2 in non-gcc 64-bit
+                         support RGB-formatted JPEG
+                         read 16-bit PNGs (only as 8-bit)
+      2.10  (2016-01-22) avoid warning introduced in 2.09 by STBI_REALLOC_SIZED
+      2.09  (2016-01-16) allow comments in PNM files
+                         16-bit-per-pixel TGA (not bit-per-component)
+                         info() for TGA could break due to .hdr handling
+                         info() for BMP to shares code instead of sloppy parse
+                         can use STBI_REALLOC_SIZED if allocator doesn't support realloc
+                         code cleanup
+      2.08  (2015-09-13) fix to 2.07 cleanup, reading RGB PSD as RGBA
+      2.07  (2015-09-13) fix compiler warnings
+                         partial animated GIF support
+                         limited 16-bpc PSD support
+                         #ifdef unused functions
+                         bug with < 92 byte PIC,PNM,HDR,TGA
+      2.06  (2015-04-19) fix bug where PSD returns wrong '*comp' value
+      2.05  (2015-04-19) fix bug in progressive JPEG handling, fix warning
+      2.04  (2015-04-15) try to re-enable SIMD on MinGW 64-bit
+      2.03  (2015-04-12) extra corruption checking (mmozeiko)
+                         stbi_set_flip_vertically_on_load (nguillemot)
+                         fix NEON support; fix mingw support
+      2.02  (2015-01-19) fix incorrect assert, fix warning
+      2.01  (2015-01-17) fix various warnings; suppress SIMD on gcc 32-bit without -msse2
+      2.00b (2014-12-25) fix STBI_MALLOC in progressive JPEG
+      2.00  (2014-12-25) optimize JPG, including x86 SSE2 & NEON SIMD (ryg)
+                         progressive JPEG (stb)
+                         PGM/PPM support (Ken Miller)
+                         STBI_MALLOC,STBI_REALLOC,STBI_FREE
+                         GIF bugfix -- seemingly never worked
+                         STBI_NO_*, STBI_ONLY_*
+      1.48  (2014-12-14) fix incorrectly-named assert()
+      1.47  (2014-12-14) 1/2/4-bit PNG support, both direct and paletted (Omar Cornut & stb)
+                         optimize PNG (ryg)
+                         fix bug in interlaced PNG with user-specified channel count (stb)
+      1.46  (2014-08-26)
+              fix broken tRNS chunk (colorkey-style transparency) in non-paletted PNG
+      1.45  (2014-08-16)
+              fix MSVC-ARM internal compiler error by wrapping malloc
+      1.44  (2014-08-07)
+              various warning fixes from Ronny Chevalier
+      1.43  (2014-07-15)
+              fix MSVC-only compiler problem in code changed in 1.42
+      1.42  (2014-07-09)
+              don't define _CRT_SECURE_NO_WARNINGS (affects user code)
+              fixes to stbi__cleanup_jpeg path
+              added STBI_ASSERT to avoid requiring assert.h
+      1.41  (2014-06-25)
+              fix search&replace from 1.36 that messed up comments/error messages
+      1.40  (2014-06-22)
+              fix gcc struct-initialization warning
+      1.39  (2014-06-15)
+              fix to TGA optimization when req_comp != number of components in TGA;
+              fix to GIF loading because BMP wasn't rewinding (whoops, no GIFs in my test suite)
+              add support for BMP version 5 (more ignored fields)
+      1.38  (2014-06-06)
+              suppress MSVC warnings on integer casts truncating values
+              fix accidental rename of 'skip' field of I/O
+      1.37  (2014-06-04)
+              remove duplicate typedef
+      1.36  (2014-06-03)
+              convert to header file single-file library
+              if de-iphone isn't set, load iphone images color-swapped instead of returning NULL
+      1.35  (2014-05-27)
+              various warnings
+              fix broken STBI_SIMD path
+              fix bug where stbi_load_from_file no longer left file pointer in correct place
+              fix broken non-easy path for 32-bit BMP (possibly never used)
+              TGA optimization by Arseny Kapoulkine
+      1.34  (unknown)
+              use STBI_NOTUSED in stbi__resample_row_generic(), fix one more leak in tga failure case
+      1.33  (2011-07-14)
+              make stbi_is_hdr work in STBI_NO_HDR (as specified), minor compiler-friendly improvements
+      1.32  (2011-07-13)
+              support for "info" function for all supported filetypes (SpartanJ)
+      1.31  (2011-06-20)
+              a few more leak fixes, bug in PNG handling (SpartanJ)
+      1.30  (2011-06-11)
+              added ability to load files via callbacks to accommodate custom input streams (Ben Wenger)
+              removed deprecated format-specific test/load functions
+              removed support for installable file formats (stbi_loader) -- would have been broken for IO callbacks anyway
+              error cases in bmp and tga give messages and don't leak (Raymond Barbiero, grisha)
+              fix inefficiency in decoding 32-bit BMP (David Woo)
+      1.29  (2010-08-16)
+              various warning fixes from Aurelien Pocheville
+      1.28  (2010-08-01)
+              fix bug in GIF palette transparency (SpartanJ)
+      1.27  (2010-08-01)
+              cast-to-stbi_uc to fix warnings
+      1.26  (2010-07-24)
+              fix bug in file buffering for PNG reported by SpartanJ
+      1.25  (2010-07-17)
+              refix trans_data warning (Won Chun)
+      1.24  (2010-07-12)
+              perf improvements reading from files on platforms with lock-heavy fgetc()
+              minor perf improvements for jpeg
+              deprecated type-specific functions so we'll get feedback if they're needed
+              attempt to fix trans_data warning (Won Chun)
+      1.23    fixed bug in iPhone support
+      1.22  (2010-07-10)
+              removed image *writing* support
+              stbi_info support from Jetro Lauha
+              GIF support from Jean-Marc Lienher
+              iPhone PNG-extensions from James Brown
+              warning-fixes from Nicolas Schulz and Janez Zemva (i.e. Janez (U+017D)emva)
+      1.21    fix use of 'stbi_uc' in header (reported by jon blow)
+      1.20    added support for Softimage PIC, by Tom Seddon
+      1.19    bug in interlaced PNG corruption check (found by ryg)
+      1.18  (2008-08-02)
+              fix a threading bug (local mutable static)
+      1.17    support interlaced PNG
+      1.16    major bugfix - stbi__convert_format converted one too many pixels
+      1.15    initialize some fields for thread safety
+      1.14    fix threadsafe conversion bug
+              header-file-only version (#define STBI_HEADER_FILE_ONLY before including)
+      1.13    threadsafe
+      1.12    const qualifiers in the API
+      1.11    Support installable IDCT, colorspace conversion routines
+      1.10    Fixes for 64-bit (don't use "unsigned long")
+              optimized upsampling by Fabian "ryg" Giesen
+      1.09    Fix format-conversion for PSD code (bad global variables!)
+      1.08    Thatcher Ulrich's PSD code integrated by Nicolas Schulz
+      1.07    attempt to fix C++ warning/errors again
+      1.06    attempt to fix C++ warning/errors again
+      1.05    fix TGA loading to return correct *comp and use good luminance calc
+      1.04    default float alpha is 1, not 255; use 'void *' for stbi_image_free
+      1.03    bugfixes to STBI_NO_STDIO, STBI_NO_HDR
+      1.02    support for (subset of) HDR files, float interface for preferred access to them
+      1.01    fix bug: possible bug in handling right-side up bmps... not sure
+              fix bug: the stbi__bmp_load() and stbi__tga_load() functions didn't work at all
+      1.00    interface to zlib that skips zlib header
+      0.99    correct handling of alpha in palette
+      0.98    TGA loader by lonesock; dynamically add loaders (untested)
+      0.97    jpeg errors on too large a file; also catch another malloc failure
+      0.96    fix detection of invalid v value - particleman@mollyrocket forum
+      0.95    during header scan, seek to markers in case of padding
+      0.94    STBI_NO_STDIO to disable stdio usage; rename all #defines the same
+      0.93    handle jpegtran output; verbose errors
+      0.92    read 4,8,16,24,32-bit BMP files of several formats
+      0.91    output 24-bit Windows 3.0 BMP files
+      0.90    fix a few more warnings; bump version number to approach 1.0
+      0.61    bugfixes due to Marc LeBlanc, Christopher Lloyd
+      0.60    fix compiling as c++
+      0.59    fix warnings: merge Dave Moore's -Wall fixes
+      0.58    fix bug: zlib uncompressed mode len/nlen was wrong endian
+      0.57    fix bug: jpg last huffman symbol before marker was >9 bits but less than 16 available
+      0.56    fix bug: zlib uncompressed mode len vs. nlen
+      0.55    fix bug: restart_interval not initialized to 0
+      0.54    allow NULL for 'int *comp'
+      0.53    fix bug in png 3->4; speedup png decoding
+      0.52    png handles req_comp=3,4 directly; minor cleanup; jpeg comments
+      0.51    obey req_comp requests, 1-component jpegs return as 1-component,
+              on 'test' only check type, not whether we support this variant
+      0.50  (2006-11-19)
+              first released version
+*/
+
+
+/*
+------------------------------------------------------------------------------
+This software is available under 2 licenses -- choose whichever you prefer.
+------------------------------------------------------------------------------
+ALTERNATIVE A - MIT License
+Copyright (c) 2017 Sean Barrett
+Permission is hereby granted, free of charge, to any person obtaining a copy of
+this software and associated documentation files (the "Software"), to deal in
+the Software without restriction, including without limitation the rights to
+use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
+of the Software, and to permit persons to whom the Software is furnished to do
+so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+------------------------------------------------------------------------------
+ALTERNATIVE B - Public Domain (www.unlicense.org)
+This is free and unencumbered software released into the public domain.
+Anyone is free to copy, modify, publish, use, compile, sell, or distribute this
+software, either in source code form or as a compiled binary, for any purpose,
+commercial or non-commercial, and by any means.
+In jurisdictions that recognize copyright laws, the author or authors of this
+software dedicate any and all copyright interest in the software to the public
+domain. We make this dedication for the benefit of the public at large and to
+the detriment of our heirs and successors. We intend this dedication to be an
+overt act of relinquishment in perpetuity of all present and future rights to
+this software under copyright law.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
+ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
+WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
+------------------------------------------------------------------------------
+*/
diff --git a/lib/stb_image.onyx b/lib/stb_image.onyx
new file mode 100644
index 0000000..d937507
--- /dev/null
+++ b/lib/stb_image.onyx
@@ -0,0 +1,13 @@
+package stb_image
+
+#library "stb_image"
+
+#foreign "stb_image" {
+    stbi_load       :: (filename: cstr, width: ^i32, height: ^i32, channels: ^i32, desired_channels: i32) -> ^u8 ---
+    stbi_image_free :: (image_data: ^u8) -> void ---
+}
+
+#export "stbi_heap_alloc"  calloc
+#export "stbi_heap_resize" cresize
+#export "stbi_heap_free"   cfree
+
diff --git a/run_tree/assets/shaders/world_fragment.glsl b/run_tree/assets/shaders/world_fragment.glsl
index f1f7549..f54d2ff 100644
--- a/run_tree/assets/shaders/world_fragment.glsl
+++ b/run_tree/assets/shaders/world_fragment.glsl
@@ -1,9 +1,13 @@
 #version 300 es
 precision mediump float;
 
+uniform sampler2D u_sampler;
+
 in vec4 v_color;
+in vec2 v_tex;
+in float v_tex_enabled;
 
 out vec4 fragColor;
 void main() {
-    fragColor = v_color;
+    fragColor = vec4((v_color * mix(vec4(1), texture(u_sampler, v_tex), v_tex_enabled)).xyz, 1);
 }
diff --git a/run_tree/assets/shaders/world_vertex.glsl b/run_tree/assets/shaders/world_vertex.glsl
index 8f50ed8..5e53074 100644
--- a/run_tree/assets/shaders/world_vertex.glsl
+++ b/run_tree/assets/shaders/world_vertex.glsl
@@ -1,6 +1,7 @@
 #version 300 es
 layout(location = 0) in vec3 a_pos;
-layout(location = 1) in uint a_data;
+layout(location = 1) in vec2 a_tex;
+layout(location = 2) in uint a_data;
 
 layout(std140) uniform u_world_matrix_block {
     mat4 u_view;
@@ -9,6 +10,8 @@ layout(std140) uniform u_world_matrix_block {
 };
 
 out vec4 v_color;
+out vec2 v_tex;
+out float v_tex_enabled;
 
 void main() {
     gl_Position = u_view * u_world * u_model * vec4(a_pos, 1);
@@ -19,5 +22,7 @@ void main() {
         float((a_data & 0x00F00U) >>  8U) / 15.0
     ) * (float((a_data & 0x0F000U) >> 12U) / 15.0);
 
-    v_color = vec4(block_color, 1);
+    v_color       = vec4(block_color, 1);
+    v_tex         = a_tex;
+    v_tex_enabled = float((a_data & 0x10000U) >> 16U);
 }
diff --git a/run_tree/assets/textures/block.png b/run_tree/assets/textures/block.png
new file mode 100644
index 0000000000000000000000000000000000000000..38fcfe9c36745ae9dfc20b7a57d920afccfb2ed4
GIT binary patch
literal 2406
zcmV-s37PhZP)<h;3K|Lk000e1NJLTq001BW001Be0ssI2{21+{0004nX+uL$Nkc;*
zaB^>EX>4Tx04R}tkv&MmP!xqvQ>8^J3audGkfAzR5EXIMDionYs1;guFnQ@8G-*gu
zTpR`0f`dPcRR<SmT^(EnLGTB}(aA~CMM}J{DYS_3!sC6MchBLy`v9R{W}4MC4rsb<
zrV?>6lU)@9ukfKCVFWQCGs~Ehq$E7+>z=x)?qWR4yYJ8HRdW^td?N8IGfbO!gLrz=
zHaPDSM_5r-iO-40Ou8WPBi9v|-#8bVEbz>TnNH0UM~KBj2P+-Sil#<9MI2Q%o$`f@
z%PQwB&RV(3TKD8H4CVBdWv<g2Mgogif&>u?swklh8!_5-QY@tCJnrEiYWgK|DdZ}F
zkz)ZBXpozJ@IUxHTPr^~;U<ORK=+H|e2f5rU7%5OobO}DX`BH5XW&Y2`zv)|=9BbV
zTZ<k6ecQmrbz4*RfXf|V@X3%(xheT+3Hdzmen#Jv1;V#L&zd{8);UfefHci2c>^3A
z0;2`WUiWx+uybzz_O#~r0}-xrfPyDkMgRZ+32;bRa{vG?BLDy{BLR4&KXw2B00(qQ
zO+^Rh0T2@j3D?dt)Bpeg8FWQhbVF}#ZDnqB07G(RVRU6=Aa`kWXdp*PO;A^X4i^9b
z2Tw^vK~zY`RaRSj<hBh3smo|Q9*@0VJISW~`u~4UA2vzbZT4c1$8*zNlt=<NebB74
z<&z{55C|Nc0|L;Tt6><<+kNyw7|i_q{2W67a6XpfH2TqthlpTaEC9rf07N8&5Cwp`
zrdL$}3P7Vq^yi*f0rsjIV|??_R22Xyy1E0Phya**^yq8%^z8{i1XM5Q{n*xZ-89Y1
z%L{&73Il+MR8_2IlzN)P<7%;_AC{MCkrZ9mEtktQP5apOr@_RGautmqK70rv)OG#%
z_};nc%1|45wOUnGO-%N%I}nkzHo8DWr|mfeCZcJY2$vs7m<SSMj4?j#p0Bg@{rmf3
zlct&d<>3PnjjnrmcoZT4PO)CElO(ymUR~#fEv~N!`W9@S=ZH!~=hKl44Z|=^)74@#
zbp3k0UM`on%XdVSW$9|Qy1%>q_VSgPH@El3P~UVblcrgIKA)L6&vQ-17K@yXC8EP_
zM??>sJ2FayU;p-ZA=z#ZPzbbARUJt*TNollGR7Ds^N(MDF~$tTKt!AMIxZHcy54Ly
zX_~6a?r<dUy*3j7KY9Qn2r&YPg8hDv3nl=dX__A6{45d5Gn(L>15maN02Pb@jRJr$
z1F(6XH##26s_k1MYNvr?BqB(>dwe924lSvU<9IskudpDZ?RG1OQ<xG<bNxg_eDG0>
zYLU?mVpUZ(Nr;HXaRku!z3>l6R}8}d;CMVb=R_E)Gse9~({xacV9a-o5rS!&=4TOU
z+g24}oB$;W@bVX;=iZ4EAY9k=UwDQGfWS@Nj^pU3^Str0y8yqcDxEOLG=J&3b_{{$
zmk3{1RR{q<-IV}-`~9B)#s(vL@OU^JS`5%jqzb5_?3x(4uItaAKLZf(Fbv!6F2)F;
z>pBM0Y!hQt4^{=RdwHHq3Ps=d0H$g3e%e3p=V*pO6grM$S(d<@IWRLbgF{oD-tMgd
z1R#VU5$E#w{QL|+6{@O&X#z7tMgZsY8NdX0JRXM&l(66Lhkl&50DSuN$$Jlhs@C<H
zV^mdARj@W)J0A+lU%q^)$L`|d_$s2_`~N;~LkRjk-nu@!7@&cn%q-%%F$jA&FmTu(
z9E++#)rxS{);HH{f}Bn#*Y=y6+t^QaGZ4}3`@8aZraapei!93w8Dpp$!)Ei&_XCRo
zOOhnkF0V5=92yizh>|o(6FK*11q?GMNuorSD1?wFX-Gm2LuN6PM~pGavct=3nlEl{
zR#wNf*leFq%PY&wkB^TcWI%zZq9}+WQAP@~226+MM5og!DinfvNo~A9mZ2Ire*5|j
zfX6gf3(&f*pPrr~&vjHdfyx`oopXRn!~{7Wk7k7AELA()zuR~p7K;UWcp4XrD<V>z
z$mV|Z*4o7)Co%*D8Dq?hoGi;gFl2~GG@g%TvAim73Iq+4NA%Wo_HZuyuDN(8q6NLa
zys9!0tX){L%jHrgB{IZJEPd~GyPYv6%QB6mQHW?5CTr5ihliV+_5OKhja{$TX0fEx
z>Eyj<#2^!Zz&v-nbFS~f2y-7u095Br9H&tQs`&Et&j!upgNPvTx0i3<`~ELtpkbI0
zL*Mtzd_igmWm!6~!@x02W7jlIRn;*@Mr_-b`~Q>0+3@q%r@4DyUtixSc(>b8S(buP
zp&<nCf0R?13q7-wsygQc91wr>9z9&w0EkehqKb1@jXIm4I-Kn7?XAQl5NF5?`4EB<
zNQI0o%Q7JoW3<*rqpCt`64<`)s;Vr{<!)D{Il-nx)Yr|@Sns=c*SE3jjInCke6=JW
z;hY=2>xXa|5xfV`_C0=(8~^=wr+pQoKOT<)jhF!Fh`01QxTbF240nfDt2`}><svJR
zj76AqGR8Dbv&b?cVwR5|KLVt=IUEil1e+(p$GiLY+o$L1;D{&~KTD<{=%6>78zRzR
zh)9ArK_pI7Q54o%0VReoQ7DF#mT?SS-@V&BBsm=phsVc9A{vHawOSF8C<|+nBxPB?
zd${u;cdkt|)ljXjv%I*!zrDUN!Cca|ZHLwY@b02<P<0Lf&aPu9kAPl4{QCK@e|>H1
zGoTQjWm!Zxg1^gRS(Xlg6b?W;xEbRvgg1mdJw43?K6nA}pMU>rKBKBHFE0wHYST0v
zn3+R&*%A>I#2A$!%+}CSBw8_9mJty$5YadcM8X^&e*XE-FJG=w`{~oC;(ncF87UcK
z?l->}B4f<W%}wXpBuS!;1Tgb<yKVcHO=65}UtXw<7exgSBKF6VGCbG?2VnH`B&*HT
ziBpD~#b+D_1o`^)BEJD+7{@tLKN8>T>#JR-<h@_t+!9eHevu`UZxW$pwj?5;4c<p1
z`J#x{j6<Lh3u}t2D>Bm}(V^{s|LwO-^R&p9%Oyxp=W?ER|M=sNpMLu3GW<@{lozR`
zL<k@t0Hk@Ii&A2#I+m;3wS}gME&G0ReFFfg$tWQWRWsbK?jnUeQ<Y+HeJbhlu9)TI
Yf8PYf8H-dQrvLx|07*qoM6N<$f<%^DDF6Tf

literal 0
HcmV?d00001

diff --git a/run_tree/lib/stb_image.so b/run_tree/lib/stb_image.so
new file mode 100755
index 0000000000000000000000000000000000000000..e8d39d62fed49716912ffc8c8633ebfc1b584b50
GIT binary patch
literal 156624
zcmeFadwg7FwLZR6dI^Y3z=9P~1Kxmg35ZC!=oC9T`fW8TQRDzkfd(qQ#5Td=A!X{Y
zHQVWiQHiHs@C0uM6^_wkpmL~A3O130I$(t=sG}B~kg7we60y?n^Q^VrnY|}TTfWEN
zAHUDX^wU{;t#>`^UGI9Y``x$eQw!fRt)anle+PMQ^vIQ7sgk56G+jK+jyx~vo#h>h
z-&c4q7v1UAl!*t)7pu%suSt34F@uNA{J~$d{8s7Xo2lV>jz)2kUrE!wI(q!+YRAzi
zZYGj4FVk{lPL9*7#2L>UG3s#CA}(*Zyx|-znj4NbYW5y|<o}XpGl4dno}=|R?;umC
zqpvctqs)VUv+$qCQ<aZ8{A-q9&vW^`=kcy9h<m<%wi<5spELmVbPt1uKS!OP?*h(}
zRAE2A)?B=ITYgiOFJp0b)T%{dLL02sx4xszgIa;UxUlkgw((5gvgO(46`7M4pZfb9
z7kuvXU;Omf_TF(4lD${s{~Y|MK4X_!?@gaMzomI+COPx6%MMBo{O01>OO8G6v@Z>v
zKl9Z2Tiy#5(I<Tg{vVD1FDHY)S19q0HOj8`D*R_2ufhM<;y?dR#Q(YYPX|uHfBv0@
z|7YO;nfN~s|IfyM_jfK1&cpvV;eQhU-;Dq6FNK4fO7lw}ytnalH=g#vhaP_XhT)mh
z-mvNY?>uJPl{0Vijvv|m??1U|<iFRQ^7Gd%`O1$Acf9+3FaNiT=dHhG!PsA(8UEvF
z=h1(jRsQiep8V62O&b%p-ZHrC<m0ZmXVVMc`tw`ge@5vOf4T83GrsVZk1fi-`HaEz
zXZG|TyXn*|jZYnSUUvA0!<W46hF5>}hVzeFu;=H;?LED(=lnaKyXY_5j!iE3<ktq*
z9ChEd@A%`Aul@dlr{1tK=zZdMb3c32)t&x(o>+7Aw4>iNboQn1`<-_Ti!<e48WnQH
zB&lsv$k`T}C(-{bWRuysZVLH3(ZD9tzj_M&OQw*&YzjNQQ|J#)A%Djd<;|kOPv&Re
z6n5awr180A3j42`!v7nmu>X-M<a4L6vj_gWF#yo&ANxdem8%`R1&7Dg*y_=H#r|R5
zJnJxzS;}k-3`cl}dH?lGDBzEMk$-1M+z#{Bov-{YO1#s|&O>LZAZPOHF`&@SXHHi;
zFHqtY%}xtDApY3L`8Q<xm%dvSZJPA@P5$NAseFs7dq=>}!!eQ+PlrMLaV+BB-Ddwq
zX8&a>_Ewnuw{KR#mrVY3smH^-*Zo}Wf5zk=G5IOmReqVt{|qYeu>pwV3;%uvHOkX(
zRQ|0B^Nuq+KeTc={c}wJ5)NAUbMgO_$=}Ao3xD5G;w>@%KW_eCX!17D!#SG14hr~l
z^VkZrbL2T9_FTP`ES}wUaSqJBzd-drsKooQ+37bsUo-i*$^Sj60w-T-<z4a!6!7;W
zP4-SO`%lkTf%7L}^0diac{vF)p1*%s?R?nm`~WQFw^$&Z{x+mj{&}kx*M2y$QNHX{
zwKGSF_hrlXFIL`{nSD-%)PKO*!{<!?gz2}{wcDSY{*}K_!>dgH6DH4F`*H2<R`c_c
zxvJ>${U+edcemBMi|1bRe?wjS*=_b8wtQWE-DmcDEDmmNJ=^RIwy2-SDe>NB<$CFx
z)gR~oai+iC^f|}!?@E(D!j6x>E%J+>#fz_8v1;YwHC;<qcP(D*Eq>btixyw8boJ6J
zm#yhqy841eZ(hD?<<bk5T(*3vrcIu*`0}+&7I!RLxn%jW4=?prcdzVPwgP~~OV+Ge
z3cDRkmMsT|OfJ8A@#R-tt%8o#OP5^Xb*x#s^lGo;%B5YGd)+IAbSz!f;dLxsy?WJZ
zZ%x-_%S63<_0q)vtXZ`Zmb#X&Sq#<1ORl)WRF<t+a^=#+Fu7DAYmnNpd|Bt>Yv91L
z%a<%)e(hqEbNMP{DK__^u(<0gac#xY70~iPF7Le7>sZyfbfsczR(OP5SFJ$l5u%RE
zm#<o59>kLtpLS*qThFKk<g;q^wJ|MCp!b&{bZa7MlIH}3NGDUja#_dZne1CUiK&j7
z6NZ(NOH7xoS$x$Mt0!ipas@_pG-h2(moJ}~R-ZNOcC8ZgS1wtxVu^WCldb{4B2OQn
zyBs8<8<DDR=c*5>l@Bjpb{QJ|<*Tk(x_AX*z3TGCS9UL5vt|t&vlMKi##Hhea`9DY
z-b+_^EMIcvMCHr6JJ7%<%2%#Zl=-m_g{TF#<?fZ8tCz0mUf#8=v%aZczG@|V!Qy3|
zSD`a6?p%2#!?XIz%hdejP}d2h{8L(RTFb9ky0#PMR$snC$V#JKt6bHt>{zAQEyIyE
zkyyhy?aalOE$cFsHRvH^C+JnN(WYOsSl4LK)}nS|n0QhRxERC4wQConNvvM7`dW-x
zmo1jD#e?MXQ`W3H<xFq+6(=uWwz7Ne$!pI#^W-znpzw6>tqb3F{+kz{e#+~rN2i@p
zJ**v_e#+}P^iIRS2Kk+asgB$<oRcY~d`9({T*Lo||8yc?4zI`B%$--fXxXwC@+|S~
zknyhpUe2|2@;86t(>VQ|;ay;|*`j}tx7hgZqn91bQZ6&R+oy2rocyb3#q)Y?AHvC7
zP41nB2@Zcw?)apw8=d?Fo?PNDT_?Z9<gIn`|1x=do&1PD=)8DUo%|S+ch<?@`l#x!
zt&=Cs?@XP%-Q@jsa+mLIb@JC(z5{jgx7hlAQ=L3x_6v3L7F%Ds^|p(fEC2R7edk~M
zsT%+KbC%92<e4et`6=Z6Q^*IVkQb(q7fsH+7%XwBf7>H+Te3-7DI!l)wLPyKkvB)=
zm5BVPh<rREudZ2<KBq<F#(gYXstKw&B3BJHc6>yRrD652B_iiuiTgV%BDbz3Ny&&D
zXBE}IbVSY=xxdzkoW8oh3nTJ3I3Z|zMDE%Uldp=%(c!Cqoe}vVRjKE#jmTdRk!K?E
zmqz5h5xFg~B{d(B9~#l$7?EQDtN!&z<cC$Io_AYB9&PIb5&7W}{Y?@1@ez3;B9HD<
zj6~!wis%<3^7#?@_K2MOdG4<ikss-Vpyi0%ol7&h5|JMl(I1b<&yUFedHBx={4)ao
zjKDu5@XrYRGXnpN!2jPO@O0wk&!)3G8`HTN4<@F0X}{1lZErE1y|3|JDazj0{}$q1
zdtd!Kki;uI>R-i_U8BF*yLWG1crMs?jXqfAxlrFVI#lI(g0XA#TUDM5_Fbd5R(USS
zca46c%5%ZJYjk~;=R$ke=m)Dj7t*^%msEK!pm&YFtIBiXylZrRmFI$a*XU_go(tby
zqsLZxE_ip19$w|S(A_oKP~~~TvupIJ=UjQY;6?eXJQunsf0gG#7Ui$<T)?9IRh|n}
zl)uVzVT$rsd7dz#{8gSON+^Go=YkdGukyUWjPh4`p2(p5Rh}mXD1VhdM)+eLkJ|mi
z3t77hJgHysf3M^JT*uezKVFyq%R2sNb^MR&_#f2qo9p<&I{uD2{wsC-Ep>cf9Us>5
zejVRa$9LE9E9&^Ab^IlDd|MsAsE$w7@#od?udm}zuH#=_$G^<+>F~S;_UmxQvxkAq
z8}B+2UH#z~XjeaYZz=JL3|fPCuTkhfNX78=_miCPTso+vhyM7c^w9W0>4vT82cPSj
z4FiK_pmA@hL)wkQb3DkL*9WZEJ-02LJ@1py^wPoOU5BP~=iPYdG_M@|eed4#73f@B
zXRLr;!zI90^Cy1vLrCO78*uNz=(INI*>FWVH~rN-b4&-R@@WP5@HRT=7ZUzWl;&m}
zOrLVz!dx;9?r(<(m(Fo$`=eu$jp^{nIse@ND?d&L!}BrJ1*whDc))42wx)BC1jBnD
zN(VC@M;wv*D-yrZeLUiL$OzFxcXQAI`{><dx8mrRax`3i8_Jg+P8E>ufsT;oQX7KQ
z2)KTZmFX~5K)$zuA26PNY(h>8)DINmLU0|-H*6b7hl~2F9_LcqF-o6;<QG?+PJ%nw
zamglge+yL88`BNNu^F4_MLO43z9Kz$w#2b(M)~?Z@HBVH_z&-`MSK0uUTOxL*P;@F
z!7ltx4E@8XN5<n{knJZAW{6zaZ%|Id{vpRm*njrjc-VUZZgUzE_FfnEYhZskb%Xev
z6;Hgb)1dyEsyYii$8og+r*l62PM=T=Qa99B0{Ehs98PT~&82QYrR02;F+ik-Q+du@
zRy!NPyV@E^v$k?GzS`)@%GxQi!G&%8sGWSIb~ah<T&v3ITq~Wu+Ho~!bExrs)Xs07
zt*;$)h4ysNb6d1R#-%ST(*7tF(ol7h{ov_Y;<8rA6ONGzY1<U95VpVjoQ71$CRZVU
zVB5;}+~#%982vb7l$-I{swRuK!Ev?Xp&#8Q74aQJvIG!&Lzy&}`VKlVxB@v)=_8<W
z7aihXO0zz4GtN}2)*G&(6Jc8c@kV!X{Wq5yN1N8M0d4vlf8D#c)}B#9&%31Byb-+d
zbkJQ1+IGUb@$_&~_O5t5oNN(ic$ksiLf5F2YpbM#JX?;kwZkA^fHardnZCS;v`V^R
zi>L&7wlCAJ9tL?9GavCLyR+GOln&a;>D(gZ)?G>GW~OuRZA=IAo6^C%=A?6P0iEBh
z_MjHD9?#?9<QW;u2F}YkGST_4^(=E~>H?_3aQOpRCuk<(sp05<z7|om!K%{;qboc;
zPgTArUIfGCKR*+#1;dns?j5<*j`Zat&@E%MM0Qe*<tN73)X^jWJrT!2YEQOj&)%-X
zIb!8fd(y$fNEtv%+!MqF70OCN^1G0XF{!D_!v}Q5S<(h<1dNqK(P$1*#k3N>@Fcc4
zb*hc)qX@udm8)+6l3}h^=MyTr1GDPW2Tk)jI@0BTfmawVW350Oq0)~{=}b{-L$R8q
zDMq}=?yMFXWqufCt|bONdxGxqY|prN?JU8K9li-;+x2r(<MUE`5??4J?kv<YcG`Qq
zwKJobSCHwpupJ==KJ!e^WEN1bO==}*+nsA0M@>mZeHNJ_@-GLU_-1N6*S1^4Z7SYJ
zg;b3Niz*R&Z&%>FI(x5E@o^?bR&b&sSv`rm+h^U+iDtDRNbQVd_o#v|tjq2`70;g}
zyRT`|Ya&VT21VE@-dwytZ=zA$jZpx0f*+%LKP5oa1-gniHpk2dnAdkV6ft)|<#$+Z
z)LKBSMi@lKad)m;EDo3RF?+{E+@;Nmvw2g!&E^Tw>e(4JJwF(SE4Rd~H%F{97|da(
z%i-ku9IB0)WjYjNc%<hca|UEa=k#fH!zbg$e)CmaF=gj^?&-aIb8UNqCJJvg;V6W|
za#1N_6M;%%@W6=EUBcMAJsm76q8U7}Fj!PTe=gk3bHwj4>~!d(FhS|CTvwH&WTPZf
zn3M}pkjnV==$Q>3n%;>Ek(BFs0E2oF<I8po>?Nu!3Wg9Z8a)?^qla^KY{+Tz4iI@^
z5=h=~=8*4SbAZV610ZjSAiud-kf$xoEh;R?r6#zGI5p;an%+l;ztfKOLiWC<(TgJn
zX0JZLtnXQcta%%jbNZA~@4y0eH5Lt{_+Ld{|Ahn0a{!8?{~1AMKQ74k?6-2-LavQc
z7)&4Vx*OqgG3SjPBmrvMo;w1yTFPNX+A|&um5+Z7I_Lj!#riw$Ttof8cE4G?p{>Ci
zn~f8P$NrOf4VRxpv!6KJx3HOF<_y|O!J@}7f1)#$a&3<#zPTm9fS1~><G`Z;(_yUA
zFnS*avm4Fqr<~cbcMhj2Y_(&jaIvy69nRK}HWU+gc^yOL#$bpEvX~jiX+v;-Z&Mb-
z0)*$Jc3*eDE8_A$OLvHzH=vp9*UyH6dV1OfPycv_24EDknGSVJou_D%=1>_9CGPYv
zg$<RWj#lMGE7Tb*6x^>g+}{yI{r`^h|MuMz{9nJb6CFAoY`zUsZ!q{}{`U3rH~c()
z>sH)3p9%<6&Sxshh1y65{&q4spEkgiK!*K$@XMf&@>cJhu%fTZ0alEnh|&R4fO5`f
zzH>!0TW*+Ic?4=eOQwNe1ULF+WCRh9@8(#Qo>xpK-b&ZXqTHt>WIpN8uaM|!=XHOg
zF_&(pMNQLR6iE+50p@&B)AXnRD9(ue1}O*pFwU$AcY-*V&TgiUUc!F|Ch@G4wLuI1
z;P^aY6B~Yl`6SP}jIQth=MQ!BUA*044BuYuBipr)XtiU(Y_0#e+@kHdwo<Np2aU7m
z{Tb7d_M`@MdDr3}yYAt9e9CA?UmU@dQNWb32~)-Zvb(*mZ7dA2nCQ73Bg6p4{Y@D6
z3&>`K1L+4EYoq@f_5uv1=(8pC*^<|Nh&27t9jHRgl-cpdt`?z9UEFr~ue;bshVK3i
zCL6H#eVy!99NjNR!{vu|vJ8TIUAE_T9km8@)Pgr{n`G1~$f#AqsP&n@vF=l);nYqv
z6pu6Js=qeKG<p|JaS(e6rEfFottL(M6~<nWoAKK{9OuB?Q0O{!LWV)=F_d~!t_i<|
zTuW{d*%D(N$fg61vEqtuM(i4^tJwDcWw4uS!JdhMWzt|jIeD-<?$luaO@sZuueo4f
zB1gmJrEu0N=YWE}jpy<j>?RBLv~dmg+i9vA?8lx_=@}-qV0Ztm7VOtg7VI42y|JMX
z3`L{vLVgshn&Gbt`SnlMg*-Xgl89}f&D^>Lh?=vfn)G8PHD^bjtvP!h+IHFNI&;E2
zic>r+>e3sBO4G#Y?b1|AxfVDo>!>9NS-kf(SG_~;RkerNqDGLtOnvChv8C{&#Svh5
z<PZOYbt?GJU<d-f0#_?Kb$(M4hszi4aud?&6PI!oTgM$-%f3Q)UNS1tj=HjbC(q9@
zyNqK<O9z7$A$?^bVF_eG;6DaZH<n;P7DVVbiI3v$*-xPkHd8yD6D)^q;nc1wn{#iH
zUhX#%p5091b-flLz<RW;h~1fIw#(_b&upS+<QGUG6j#@3-d2vanty27F0DL|vK9Xy
z%eEE;z~m$`sVm!x-^a=}#YuuSp^tv0+JxSV2_)WxmP_Jr`AC#V*EIWRLa(7mT)c4!
zgC_Lw6ZA0Fn%D1a)+R)^gTd+29<+4?A=}eJ%<&)#g3v=+T|>(C2_P3rp<Q$07FxN)
zVSO_(XinOW`lNm41|x0Hn$sn+CmA2O=fT-Xw~IN7wl0=~$vxcxhwD5=V>VwVx_Ym;
zO3(qg`fX0Ib=7<0<5Ro(kBsRCj@}0vQ&~aQIr{jHsU7{t#&ngqdVn!~>Ms*xdUn05
zI5~AgT`;(tl@&xsI<(X65H1YDqEuuGOCWy)hjk4h*C*Iq7-@yJRy`Rb?!sJ1&_XPB
z#Y{+}XgnND)44%u$kxu~6n2iB!uEBe%gU-tx<9A34_9=?-SRusS#=)1z@)dE)TXvS
zJYAdG&cql(7jkED#mxhpCra5kmHBjpvzcUM-6tg{PLqy2PyaSn<GRzozqKaD2&fE~
zZ~s@i)pfxXYtPz3Xx%yvS+?TD2Hk{pYRNqPy__zjN@G_})EP0I-|;kx8}-?q?OxZ3
z6P6|DebGhdb}TxN#HDUI=Pmy`9T_hF1yw1-V|`cs-EU&?h>a@$$gcVujQ9uKRWFgo
z6(9c2-iM?A*sgk?xO#wH_1m10>PD5DO0k&kdv?1GdndL)TFY)9TOi#iiNobLV41Mr
z*=_vS0<X?)!tY~tn>1=zAnio->jnvQ_}DZd3#6BnS*6s*G@(<OPCq%FjA9F<kIU&u
zyh^Wx!?797tDk!7+}OwTx*k(b+D*8_<!NgX)w*gK|5YqIy}(jN-!9`~^|9Ekvub!s
z`y0+<cjFv_*W<>$u9tG1z@D@VPGdvJv7drboYKaM(Nr6m>k5EjN`_h3c@{v7$P(7c
zmY@I4wMnf&r+uiw3;gKnLQUN*F6!REEV!04op_}G{>xa=*YAu(+M2-xPp4iVd<j!g
z#I;XfGcnd1Vi`W2I6SrI=|mHM4xiDqvmv^_98Y{^Y|_LT|AjNcrxTZ|g@>n5x-qIW
z7+1o^K(n0Ku)cF?o-mhlt!I#=!%oaC6eo{I74LlzCry&v%RZ+matTro2jmi8fMtCp
zoZUcKkf$OprFq>c^0kYcuq{^xajI3bkS&}Au^=HHspgR>;BYJV4JD&VkPyk)oL&K?
zQKI9gZ<y!pVqMN<i6J2)+05Ir<`u9_o_VFiG`!&TuaA?(w%^z}OwJ`+FwM;sO*GZ-
zN*CW3O7DA!bb`p`GeotC_q(008Miho)lff#D~Wd51>3xqv%4r}u1->l#HV<TEta2D
zF7|J;Jv+R_4Y#8>Ji3<s78P5Ivev`s1{PoIT)exqUN6_nkfd47BYF~jPHIQb8|u{}
z)tXD=%F&LwxP-#X)6$yc#CPw5W5*hdCV6QVw<D;I!p9ooRoLRrz=JmK=g<_LOx$oQ
zU8*Zk+)?gSpObp5=fm7*lO1NDwJ5SNB<CXk`3rPlF_Uh>j>g>7Zn@T#zPtiyiT59w
z|JECDS&K^ZQsar68F=d-6T^zeIkv(a)Usl`#Fe$$20xVIHp*1a9bR=#DqeP6oCyur
z<X4(`2NSw)&vxX$og;M_Q;s;xtLNOzzSpJvSW_CH8ow*2&cdyGIo2z@sRsWz#P!(N
z@Pf>*cA3jaLU-P;5;}rQbbA_#6PvF@4yykl`Bsq|!48$08e}V{hN@mHgte=Si_m+P
z6+Vpy(!lGMR~KH^P#hX>tX+qOhe?Jf=-w8z6@x_&U{iGj7hKLsZR<Xmkr_P!H;86?
zirzY0r!G!k$L-MFU*xnnboY;Da<rH+*hh9Njt=@XkA}<lK7u)?Z6w$I08D)sxqA@)
z42x_mWb7izt6kVX{}|_u8CQyt;qqlzCdr~^bO8H*!zu2_dZWEK)}7@C7^iLATV`L`
zE<5+BawM(j(r^``$b}Qs!`VNe8938W%$5(yj=v=Fv4deU!0jxveI~(!55R-m^l50C
z;gOfpn}*^W_m*(g3D*IzY9D(I@+&9q<Q!4ymEUx>(6H6pn_W?ANM}>HT7cc_Y1~e}
zcH8JfxbL=xeLX=K-lwSzua^hd^C~nX?mVKmscJQ5>L4-ogVB%0OeGJ{lx1*Gy@S)m
z>fNKK#jMJRIKho+EK!31em%-Z760E$B&J-6265rFX6miar$k}vK~P6MBpZ6Cxp0Yb
zE!cmJUKlg}cGZs7n$5CmBA$10TD4}PfjfwCQ2PU;*gB3l|7O}pMNX5;V@2aot(Z7R
zG;bUg<c@+1(b+MxR%(umVGZzIqc|&z7=Fj|FuYgxm}wXwX;zV1mprst-adLxERW~o
z{O789xTsIBwT`<+e=GgV^_8~g;r#hk!{U6cb`Gk=NwU&1d}R!?n9Ju)%%|FH>+onG
zCb4eE+KoA{?eV|IIH<is&Z>s)eo_auQr-<}i$0-)+8-an#j?~6T#y}^hYP_QmW$sy
zt2}}M4|zqlo&VwEaNERjc!Qjt4Bb5w_voVpCs$qmS2-Fkp97aM=;5OE1Nc9JOB4kT
z&nG=P=}3G83xQi{Z_@H^$CRrh@h>7H@wX=#i8+dL1v1rW?9%r$BG0WKk&`Hf8<Edo
zk?Ka|6Od;)ahLRMTy2)hMo;V*#wMn#=g83T;OJAaA?z#xgss!njMovk?lUcM*AXyS
zGaa*ri4a5lmeDW8tZ|LcA^rfYnWHl&I@&0v2S?K})5oZTuAI)9NT>MK=ut7m|3lHl
znk(8!Yz*b?70;(=VJq&TWX&X}A*L~RwSeCoy)u@;JL3hk?6lXak+=uR>9x9wM{y>{
zB+cX-qtjxUEMO)Wsi)(9i^N@Sq()VP(~+7-I#Qo$BXz`mv8+SToujwKhS7ID56h3)
zXjdyhyuC^`I@Nq_bbc(G=Tm_0S~f2JjSP(|!0%(j_4}Sj0bW|OY?b2bX=Wr^l9?9c
zOJhB?0sDOBRO?rD7T8=&WZg(=I#vR0qMKyQ&TZsSHFWnYbpSjmN0tlG&&bhm`RpIX
z$84Qzbj*Gw21jHT8M7xWhOx`Dy?SrJJ*<qj2XfuG*Jay$85zHe5sORPcWj?@KplEe
z2Gk9>?}@|i$A0Dp)DK#{mT<F1S0kc>y`!;%U6gj?t^nBeM!$m}yKiE2BaX3IGNb$p
z?3gG1^w86Zi{Qsj4((hK^Y%eGcj6eVcj`c^@O0ut{BL^UjR+JrN`@eN6v*uz>BPG2
z9f{-b$HB@%`9%m5)oy}uB>!+%;{CW8DQ28EEa^%aAwwR!5*NYp;T{)=$R4*SB{p1)
zQ<5z1Gn55-syGi8Hk=C?&OFXZJ<zk#$~E@>h;80WIfdhOTJ;{#;XD6L%cY(~bH46#
zs9QPXJE!>k>iH!cHC#Qrlb1OUPg=vj{)yD^*L$^wzw%R8!`mj-@XlHd?{w!ixX}$Y
zT$bA2W;J}+&!aWWJI<tr%Lr671gvO;pb`IP{CYdX@cyZ)_l*D9yB9T&YQ1QL>KUA-
zL0yj5%JGFm+;FR~$s|rqRjxT$8xKU#PgN49&R7V&YhFn7`GRmsPbW@7J5(>xX37mC
zdW$*Q$Ovy>E2A}(&tXewmX?6y2NK~YP*#UR>)lt`eu`5u=j{K;u{yikoZVe>b~l~f
z4QKxydg^SSAP!Gy(*B&~;tuDQY`R$BU9LM^(un?o9x`FD;EoJZyNlMatyah0ZdE#V
z9LmVs`gUSbi~IGnL)=)yQ$f8O__8GQ9Y%*6KefJ9M78F;d8zVs_j0j`?W)AO0is|f
zy>aUe0(7H7HQzGYkvIB7iR#X|xZih(tsnRAr!Rjfy?zVUPF}Due`wWC;!ZV$GZSRh
z-7)qmoR);=<2)Cq%R8|F7%bWuJgCm5XK-J*BRCXex499AcioEtAZ$f9F9$<EeKIIw
zP~)wYqaW2?aT7Y==wYz2iMQX(#o0P;6d(HOZ<#^F$&5NV{lTRb1_rmTG$n348I5Lw
z*6@Nn_q-+HZro_>eUCT!afrQW7<c{Io<WW>@fZ<~c#N?&+q3)N>p!4&@kj(i#4;xC
zn%;_)!6rUk#_ccqh-aC`oj~r<aMC@ll8?q-sWjnS+YT4A-b1HVoBp2bex;`kJER*d
zgX5c!nOEDhsWqb=kb9%AMKU~RzoO^Ur}d_O=h}%|XJhT?d6}Ny?M>Xk3lfPtQ@<m`
zN{V@@w#hX<JzGj>&C0><I%Tv(QO5nYyRl396_}GEVQ9{dADp=9W(xQu0opPn^6I^;
zsVy!l5I)N=l`+g?t0W#I1m>L7o}L#Y?QT{XEl9Ai^#KSfIdk0`@O%CBr$Ibanr@Ss
z9pMgNAR9)wdnNtkP%Hn4++Dh(VSUdIdXu>E0d&^<#OHgk&k4seC#8A2b2pxz<i4pi
zm0#mR6^d=oreO1OJsx^NNxLtKDBZ0}Xai$-bhC>6QdPXZXPls}-^%r%S0GHm7Ap4U
zk4Kg~8kWpi;bRw*&kZzNN-qB@9BrC|q!Ws~b6%o*@YY}#^@4m=FGIbswNb@n#E^)y
z<8u->z8H~>G$(gagSXc+M^j8(j{yK>KtFj{hc+ZJlcDm9<>D1?%j6x+Y;n>cD(ibH
z&%wLvd(gCyhTE27{YdsA)jA$=S$D`L*6`?4(t44t6ad?hESI_-FVS4LDIQ25;(2Hb
z9{sX2W{x(YDzGHtL*_7vTd{G2GP^Gaj~s>t>_)Gi$u-GXDUUnK4)2ytcJ(oAt*9Fk
zcJVb;HBZ^RRK*qIB$ptC*wl>tWLU-U_Mil!I%J14j{Jz6rXI^Nx8@PYTzGV711=Qs
z!eF)Ht5J4Ca8b<TsmY<A{xNt;!ywh*6nO8pn<2s(UtJ%|4jcOM@vAUzNN!raQSPE2
zy8F$Ih*dZvfe`89_zoCgBY4>s8A7dnuz1pRU2W8AP)2JFoz`Hq2wG7STVEh|_?mId
zr|YVXk9*z{5UbNya8sB8vIfIpW(!9Y+@u(t9K#vkKpC(h@J#WQwWdRl>h-d!cdT8p
zllDIsQ*oqx^^gi7v!|g0V+=dCIOT5q)W!OUoERNQF?L*kV8ysc_4ZwiJrhH(!DWl~
z3$;G~+h?O;x2rWe0NAq#6NenBCv6bu$gf5($i%X1$J8|vy(fDip4D9tEc!BB7>SQN
zP#Z2^Dn9VWY~DK~Hw?T5VZ-)1H$M0%Tq&`RYljMoPQZIcFrqBP6c0q<?hG8LJ{Pp|
z`#9SGs_R91N9u^$>%zSk)j@p+?gSsnrM}El3|zFsQxI5150z$Mahjg7=`CnEO=t*s
z*n&g*l$v2)R8!>u?V~KM2zx`GyU<X;Tr`||4E>#6PFCzI<#sqGRfk(%Kay@u%x!QB
z1~+1o=54Tv8~zQpFw6|e)ZLK6lP49Ky4g=gTtC6&C<E(Awcaf6xi$+SfsFtc%Vhn@
zt8U?uZ^d0m7~yfvfmiG#6TSA74rOv}LTsdPSbpp=8N$X1cl29QL_88-tG<t+Xu6{E
zu4To&0p?k8pWTXz`;-)8x4MqG1?7<<;vt#D`kvi<9;SPFHuYH3*hO$e${BU_^F1+F
zaY-8aYAxT$R)a->^Kc(tXL}xdQ{u+UFyoCi<m*>n_UH_naEVW%1&g*Jk8&<^mUJFj
z#$E$2SfY_1phT^1UYIzie&iX~zs?nK!hc-Cl`6&C?Va~fj}N7BE|xxUK5mh>AhHka
z);{p}>ontcGUG>Ji|aGCc9~8T`B8MJYHLS)7L{=Zv(MH(&eo2ZdrD2$+V`-v+hyxq
zCW$hAk4+qn?unq{+I|VmVr-rkWw^WswSvVz_hn0HL)eOuU=kZy7B=WaL+HfnXvc`M
z3Dq%x>bMP0dGy1?rd;L>2`LtE;fyD6za8u2tosm_*JAOi8ZPLIbg%%1*~+8rG_XJn
zbRDb8<Z#A9CdiW!M@IRA^;&*>X@q3XPLv(j<r91xF8`Z8g9WqI{){dv{Yy5&`>Xv~
z#<j!^x`Zyd{yc*CNT<N41Lths<Jl7zN^ps0YkAL2>7auIx`Iw1{dq+C^M^hh=_D9c
zkcsr??XlWIXWnU@dB8gJq0*EQWaMb=@NSeVNbQh&BpB)sz&6YKBdiog?~xtm9qKnm
zP3g=iU)k$kfpPe->z5$&YBg&)7+M*lPtY-XleXIbV0-6eY!xH-Jy=cDq_GMbJqy`q
zQzK1d??W~X7zJZd_~5m%DDZiH#8Eoe<>;3jD)tu;&6pj3UTP$9V*>_^(R*W!sam+8
z*b$`IxT_5-al=ovvzsL5yDG8?qe+e42t|&c9E|T?TXh>NJXSeshgYpR)QzJHb)Y-(
zv_YEPY=jN`LYMZ+)K;W-pX+$Pu<mF(4z?ujN^M0~XOzd;NsqFW#9eJ$vDS2QgtP%E
zaJyRa#azYzPzO55&2J1@(WY_}p2`hU+p;~|bliUvO2Ve{#R9;%Vum7alcs`}w@sSL
z1H6l%yB!as9G19gfoMDsiD)chd}5^wZRP>Grq#Fx_d!n8W`<J_BoWooKjH_uG|0Gp
z2X2m|M@{rdHV7<?KY}HM@zBKgQ(J>nag<xRJbq?7xvztZx2+>#$Y#uVCGm8kVwJ>O
zg`|>Jsr3$*W|j0_$6F;47ptTSE2+h_B9$caIr0e4VYrqjArRS%vnw8`uevv*>gY(M
zHW#2B*A27!O!s+=$u%$I4QlR<1uwF5;B~X)RF2Qw?y21?@}Bhiop}Eag1R{kqro6e
zr-Qz;K(45JLr^HUV5jxwa@^oZ9dNu)eAvGbzsTDgZIRJiq_{A{H5J-(!q*3tow(VF
zUm#7=iCdhQ+aJh*reP%M#J`M*Tb+1oOx*6o-;9YnotV4sW*Z`TUdqoiBfa}PJ);DL
zTpvZe{@BM`(s4Fgpw#2F47o`?J)@t3BWfzyCo|FXY@t1tx+NJ;ZDy+6*v<^F5G!FY
ztd*G&+8FpZt78@j77fCU5a#-rl#}Cz;<Ccm8Zi?2pRdZ66+ei3bMQDVBp5RMen}x_
zS@BJW!t-j%mm!P9qdrdtf6_dMN{0siZB?^##T60WPGO%W(K_=V5Jk%7`jiF!cPQx-
zUGa`un?#GUxgrbvdvIKf3M&!L&`eFpb^sw!HDQYiS?rpyNrlYc`9}rjtT9z@oX>@b
zo|8$0>%5kl=o1S*F|3aw-dPv;_tAp5yR0ybg@_9n^I2B-MKdLuC;eDfIPo+}c#J2a
zMKS|hNr4<|jV&vFj*qK}W%{i(uJyVX7c^=q;+2$ZS>X#MM!e?XvckPw<BPYsKDD8q
zH)vk5*43aMnat^l--e~-hGK)1biLFyw{X`>ed-bGQIA;fJj(THo6yJ(jUU2cQ2G}7
zh1jr`;>6lBhn_tI>3y4E1<yA#-)efc(5$JFueG3R>Wl(9tfA>mP9h&gCk@TixsqCS
zNxQqDSpu!qD7xLyOr0x{sG+mvjHG5|oWxCKGPL171}X3K?B)vrnw7ZmUM&4<V`;j6
z#7#pBBW@97v_aOj`oK)GG4L;Dn#M1eoD=x%;B$SH=H$3GNL*2sxj}*wHm0j2g%~$T
zxRm9PIqPVTvCNt#%S;A>&Z@n+;)4jgDD2ZDnq|goMUk?(K4pP_9VLCDD{fIMBU+Tr
z6<OflfMe%Y@|eJ<g(^Qg@TptnF<h~LRepLPc{yL0##}UTnzQq-7imt<$s~+*9!j|T
z#DY&uZ6w%03*w&}2{Z!C$BhJ<C;f0E0grRy<+6f~1k63>GjBH%&@%lNf23xX6?G(V
zDdLrs%Z&sz58X(hB~%;gd4ol#hGq{JkE~faJ@LCwv9wG*mTtY&EACTmSTA*_M>ilv
zk66b%%JpgevuwPV_3&W0{3<!~?khsnI}I<P1J$O1WK7DGr^Ab8LGxKG&Uz2Z^<^N+
zSzC!IH9+ZSsw8e`<B6%vgvz(g4*kPB?C>kT)H0g}rO@n9X|5>6?97152h0vjr!`(@
z=O8Gh%np_2O0Z&frbFd8QK^j>BT#M5`3pdBp3xwqKy~2Qg|qZLR*8HaVfEE*m2a@M
zM{j(_YL8!5NoNmzl~;G1!2$xSz>SZf_YK~RU#tRqL87Zbyc@4$*zeuGckkC4aqw{*
z96g4E4Nh{SljNP`lTLE8lYCkviSLV@#P|DXCGq``HWJ?-q=m%yHxs`AI)sCUM1%Gb
z+_50&+o&}BtWy8;q`~Gd2pQ}b5`Ixg-<O5>Uj<3rC8Ps4NZ?Qs689AvIufg}Kjw?R
zCW!@0Dj`V>Ym#JTNkt@y3z{TeSrTr=xa<KK#s&OUBRKvk=ob7hb|jYHPkBCZg75tT
zZV&rc!L{;i9DD!=658cXveHR9on*C>bUDd2B0;oh2SK70#Edo&QCdJmiDyI!XGDo+
zL<wd@*D4J^tkl1bG}ydO$Y4fD_z@v}Hwf`R3W5NTSVScu5>e6D*ocKlM8&WsNmh}F
ziVK<~UOk_PHfcoD@agL5i0IpKP&@($3!UU0PSWZm?{<<4oaDVCL9}QGL82AJj5ZKa
zT0lgJXG95SM2TiZ31&nuR2p8S)W4WC*nFvw!FD0xWkUL{5aM@$AfhA|QAvnIRP;4A
zVj&VyF|0|FRV1R~f+mSq&nKeI8qwq7lLYca9Q<Sy5k1LCPH~bJCpq0o&Tx`5MS^J2
z4uV80h#74lqO^dB63>Vd&WIAth!V_*o~1NATd998X|VZ?LI#sU!t;gnEfC_r1q2Z#
zv4~1SB%-3Pu@MWAh>BrNlB^;T6&Ex~ym~$nZPAD}!l$K=BanyS;0q-j9O@*8IZ2a~
z9N{Fho#ZHyAX>D8Akhk9MjMDIEg+)AGopkuqC_*I1T&&@l!iwu^^YM9HosiRV6%|$
zI3azn65_uG1Q8{%h)O~vqN1;{5et!sieXKXtRfK=7c@z{dOi_NYDCMJuOyI9;$Y-(
zM0BT<{Lx7&PO{5Mc00*mM1pA14uV80h#74lqO^dB63>Vd&WIAth!V_*jw=nHRqF2{
z4K_a~WYCishSP-fO&8+N1VKbeETWPSiKysnY{Wt&qGDK+B&$e7#RW|gubxjtTQ#C1
zaQl{{5y<;-aPMDn@PL#2*hz{`@{p5kbCQQef@skWf<!Bb8Eqh<w19{b&xjJvh!V|+
z63mEhR~r68ss9*hu=!U)21`Q1-wNs5A;f<I1Q8{%h)O~vqN1;{5et!sieXKXtRfK=
z7c@z{dOi_t*NEN*pCpi9$APrb+nwY;on*jCzU?I6agsYlf@skWf<!Bb8Eqh<w19{b
z&xjJvh!V|+63mEhQX1Z^)W3%`*!(>qg9Rbs79oB23GugrAfhA|QAvnIRP;4AVj&Vy
zF|0|FRV1R~f+mSq&nKdti0H6?@y~5PL5^_#20mxUS457liX1POW6|uR4vK^|*~&83
zX+Od_1XKH{0~ywAD{&L$Wm~aslQmmLa!n&u&Ru*S1^z-}?6@^@d_m;+LOB-AKI&Mm
z<FNjdoG+Sv)UjOY%@16zdE|;S*IvXQI{;;9fg{0E(!)x!Ka!4ZSLl>fhs1OSVmi&x
z*{(Vyrc;RNv_Pk*IwYo3jOiqyGom^qrc;XPv_hw#IwYo3iRrXMXOrrXn2z^ot=!o{
zCv*l>hs1Q6po2r7z9&vdVTHZQCl1GWoBpar{GoKo5CYX4S00Ec7pTmi6r{_j++xZE
z!CGFFHJ5(s@n;dFf2MNMlnDaciGBNseunz|2{l0=tugz4t3jG13%}i1qqv$vivnzq
z=hYGiCXF>3YO(-34aoKaC!0)@)djX$+0coV|2s>Ui32M*4Q1&J=$Rc8%PW&Q5`QHy
zFF@Rce1e>^5=2{IOKL;jxkWKg>aCUvI2`sDppLQ4<uPiMpks)vBk^0DQmvx({+jiE
zHRr4kC>t7;y+W(jyjV|0tW!ekltru$)U0=!bruKtX3V-#IfXah+r|315$lxDI%N^-
zg_`wb+<L27H|lG$Hc7F5R>XRXS*I*wy(rdKNrd2VljYE^{x@3=POSWM3~9-LEIil>
zZoXmdbSmo^(2127V8wu}699__v>Z#unmAPcS?1_Hrde2y1MwUS#+o=(UVu#oENG5-
z(@ZMcuWabV%8RSb1}v&(rvY1)%^1*$l^0-3Jjd2}j_uBl8BktaO~!L<ahjTA(pVFR
z$_ud7fK95|WSSg=5xQo}$*8Z%GSaojft5WPWCMBzH0o=zG_g(t(g5qxfJx1<WUSFp
zlVxzp7?1`49Ebx8#u^PZS%7&1T8??sY}Fk5jWrr-vH<%HXgPMqff-|shMFwE0RvVv
zi&oPdP_|v!(5SD;64gQ+*b)aO4QSNYWQl6gfHZ*MG#Rj6b8I%&XsF5JYRP~!0AS^B
zT8{?w3}`geWC2zTXgTure$tUO$C9x|LroT-_e*Okn&UtmSTNRTsL29sGN6SqZ<^M0
z`;`rySb3RUnq7|STc-i7b}|NZV&w(cVn7-|a9RyWG1ztk8ntAp$7CGX5(g#?Xw=ta
zsmE3W(g5qxfX!Bqjx__CEWv3vAPuk{pVc56&@-UXP?H7N8PBn3z!uH1WUSFplLeTG
z=Qt1t7K}9-YO(<H2Fz#!$eSih0MGlC4V_qd86Nu$m{(w@0a*e7GX`{G<pnrkKsI)0
zwi=Kn0NZXrCstm71p~6NL$k$zECJZ00i9TR0TvC|ufV2wj?D&iV&w%`GT?v$D}U8`
zv>ZJHI<fKstQgQ!---roSGJ^V=)}qk(EF8U(WIIK2JBR}U_d8UUVu#oEIlgG$Qv;8
z3t{^W=)}qku-SkW1$M@P83R_u!V9p)fHc5*G$2dBdNiODD=)yL0cn8sXh4>L^=LpR
zR$hRu2DBWT;yE@uJ7z$6nONK7IabCk$eN>PKof_`3$W9G%o)Cw037zu`1#(we1w5(
zRZ6(tqs&%h4|3#X838B?pd|vJgaFDSOSl1u6DRZ)Bo#|wr9Q<SiK}J#i<*=%T`l(`
z1sk&w%aqVEWl>jHc({@m!0{0PB?M3waitStxRR07RiROzVsnLqJY8wF9;}+awY7Ew
zwwhRZslW_eA+W`Ia2%L4V2g>B7hv9iG=Q=+nFjkO*k%JdvGM}!Hy{l_lP_PV1MHt*
zJp($i@&X))=g3#C6KFY>j5Tqnyfm3YJja1}j(jaV?U-2JCf|_|V9|ig8NT&HbJ%}X
zq`oL&eNh&zV3rYpya1Xb07?j;ELy=3vw|fR6|B_n6e?|vlRCYmOR(IIlwtpvh-FG>
znX;%WEIa_M0+<s4P(lD@5m#CuhAT-)T@@PjDYmxeSzAlm*sYqbtu-64$;8S_1(x6n
z%g}0LH?FagwMOb0uwr861z0g44WKMV(<o?@DJdH|vGM}+eyv&10DuDqEZW#@KqoE;
zFTf@PT8?=GT8{n3nmANmnoM&%$4=9<95cq6I8<JMEe2%HtYByk`?DkUMG5PRvS<af
zjI3Y*G(`ZE5I|Y9f+1!FODZZ@sox@0+FHTd8eM|rW~AWqNW?NFv`ksl6&4<VCIK`?
z0F)3wS;UnJZjXj5o}{h{jrtT@TjLs(ZN$?iQ<RiylPM`1I<fLnfl0VRV3Ps|;=qCd
zomhDRwi=KIP?o#_`?bmR8?Y)CUV!ZeqyYds4LG2{i~*fkc>#9Db8I!B<=Aeli9_Y3
z$z<X=w#0Kx8f)TEc>(4P$edZh&>Z%sN9v0b))!^b3T7Eu!2<9i07?j;ELy>M$tNpV
zQc=N5{R+fZ!9}ZJx&+H5qzwCewnwIO(OoIBs4FZy07U_eM*x)270M#63_uK53X+QH
zT&Yj7xl%G$`axm29~rO(8Jjl%wU}yljQW}^CpQELP(AF712YCR>T9x`+|V?E9P1+v
z7~5)g*d>tKZg!0Nnk)_w5OJU-4on)*sIST508JBEh&y0xliA_;4+omfj!|Ee^)x;1
zKn1t9)2snK0~+-;SsZXvOEK<%u|>0EXS5|{L!-VXivt8iA}|mK77S?A*JN?Pt)p0n
zkt#4YZ+2XK%uc_FHF?rD5C>)qXw>f%UL2rldOi?$z}Qx^V*zP5J4Ss?p0o|bfk^`z
z^;?7&2VCe%aR-cTGCQsfn4M-5YqB^%K%@#P`1nM$4H(cfpeD!KKqc;gu|>1v+JLfQ
z$;6s04iFG=U?2`G7|^J%$p_K~%+7$hXLkBcoEJK28;Aol1~lq-3NH@OG(Bfqh%`cD
zTg^^UQ`^msQD2kA0RkcsXo&-p1~lqx@`1Dgv%>&$956dZ{U+fjZ39oKKL+#+Xw<Jr
zvN%AENNaIJv9-FQ*>P<^*|20{O%?~-ctQhkbs!Eb7|^IC$J&6!Ja0gApx=N-eNC1e
z2W-|bU}qedF`!XjlO@N30cilPwmP8Iva#)EK$B&=sOWN3U`rgBG}dUS$pS3Jb8Irr
zCaYFso0W!|EWk=U$4W&j%YdE%jfR>mK(AyCQnM%;u%v8B*{~`WUN#z=;=qA8uwbl-
zL*?cASF-@+`d8kxXp6l{+0dx3$x??IBn|t!v3_vZzbN6Fg0je(qNQfNJ#M|ztQ++;
zSt`0!tXCq|DWP@BBG!{N>n&!T#ewfhvu@PaWbwUOtnZ9ir-arii&$^1S@+`Bo6NdV
zUz4?8;=5_XemP>j0tu~C7O~zg*0HUi4i`lWC;8e&OUi~$th_FU4amZ?#~RR6wqQUf
zR$hP^16q#xc#i$XnmANm7sK%!JL5TKj5Tqnya4+R$Vjrsnr2bU*sg5o#LA1S0|snY
zV2c6SA6dBubYkTNScvD?6wk5QSQCfJi>t+Wjum{~j>D_v=o!$&q4EMO8PJB>q5+H6
zW0eg{PApW~VI>Y6a2g6M7|^J%$<oBU->7difN10mm{efDu|`8pmcgaTfHVMLXB?O@
z)@Z270&I@w*lL=snq#}MMng>&U`ss5mN+nJtkF=D1(<X>Y8FkVIiPH_vY}C5lO?LH
zabV>S8Y=^O1~lqxvP8ArfHZ*M6b;y}IhKqy8fvn*+G#)<0B|4<EEsDv)MNo>;yLC`
zvr}{IH`ZvV$pXyBbL@-*GsYSXHCcfD2DE6jnx-|~c4b2+R$gY80RtA*w-y6dlua7Y
ziIo>%!Q}{w;4~SKVzA8yG-}CGkHt8!f=@xof=_{-0gd{aEcIA2APuk{4cKh;Xe_^i
z1$&_;OK>U%qyg4r99S^cXsF2o^zbAjeX|_%rrBckXl%dIP?H7NWI)TYGY-rcYc$kk
z0X7@3NnLF<O_l(jw_8q5th@}5Ee32>%@zZ)1OO%t=)}qkFloR}1vVLwB>=G5fKIHu
z09y^1QD6n1pJJ?70suV&I<fKsY&T$w0*eN;981cEPOQ8DI}Mmr;6Oabf&raac>!h&
zm{(xlfELw$13Izt0?Zq*UxA$l^dLqVGX`{G<ptPpz)l^>TMd}kmeX!PCstm70|v|}
zuq6&m8qkTA7hu7FGyvb498lS213Izt0xTMk1^}$!J5H=emVotWKqppSfF%Q3jzt6J
z6<9LX#G&#su~rOdIS#~gEEsFzP<a7*_=XpKW6tocADYAd4y?Wox9eY&a79L$t;pp1
z7t07hUI3*CfD!^Ii!9+fA;yMTMpAK2La9%&ZJ70=Cg}=Yg5`Fk4Ev8oEK@?ulto=(
z;Q?qB!1f4$5&|fTxY7bKTuDkQwyc%<6q_p?<mt+QHkl^Vu(sB0KqppSDzM4I$)y!s
zs^Ak)v|~WefKIHu0Gka+0{|8c*r`P;DH}Sm@&arzAPoRGV8Dz53kGyz<pr3G=a`S@
z*l(<fL*=E(w8nGnjOUnfc9e$73$WdQ%o(n>Lu1(A7O5{vSYMPyE0|>jpj80H2!Ij-
zD2rAw#H?URMFlJMTZG20f6*maZbk}jhmTmMgqA6by28Q(&?JD72!Ij-D2upK;j0L-
zWi6@LvR3L-Y;DbLDipQJ6eXqFWJ=10POQ9CU?*IWuB*U-IIv(qCstm783WP)%91x=
zt2UW_13Izt0?Zqb1_10dV7me{26STO1=t_Yu{EA!yJO9O^3r4m;yJdMrsbG4*2JOm
z0xTGiIkSSHIqcsTsV_=cUz9~Fm}O)I3!o4IP(lD@(F(?g=UBm#iV9ZhS0J_uF4(w6
zmteVs6nyzSVwn<JrY!0T3lBh10GlEJN(i7V;>rNTaHSxrxF(_0r`TMnm@9d0GI`Um
z;i=z%POQ9CU=gmct@SIgGY-rc(2127V99_qfU>k2utl3py8)e8c>z`oNCN=27%-{8
zqyej9;RWd7LuYi=a%?i7<=AYji9_Y3$ut?za;)H6ZnR@LdImIcsJsB14al5X!2k~X
z--*;0C9E&Xq7}?CvVsLL5CKp^0A<k%hL{yBsi<J3{(w*!*NRrbbP1OGkuvPx9<fXb
zEmIbCg@p$oFM!)307?j;EaFNh#Be1eshG}{`V?DRE14^t)?vBTGzOGyH=t2VzLNLB
zv{*RVZ^#;uMFX2OpixT}VA6oh8JbN7tSH-TK%<r{z*Ym=eryGwC1lOpsh(#*qrN5!
zu-$-k89DabPNuO%vqSSpEh!rs^)<OYT4Wl4=0F@+FrZOOzKTHSIg1`~z}URmp_@!K
zJ4Ss?76%BB{;dvl#(^0F8uc|<9H40eCyzj@*)f0G&5luDlP8NnOB|Rqpiy6w#R2EJ
z1=&@Bu}x-&ZXyEBX2+<n$>M;Eq*X!1%4I;$fJS{yK7a@m%?{1Ofs(SJQD2iMi@-n}
zSTLYbUy~1{4VayFP__ZHW7N+JKWQ6?12YCR>URoXjR2lt+W3e(&vctyv#+*@3Rolx
z3HSmRrl*6Ze9pg_0KWc!NY{uu5}gHnTgh4Lhc?`vV1@EYtki%Tp+K9h@N+T)OrOMn
zgVec^pTZ5wC$Um<qu1O>PT>aACow=b2&r=;Gld(JPhzF!##(cueF`_2K8XRkK}ek&
zom03$Ij!*R730yjSDe0V(idRk9T$l^Gkg>GxqG`_!B<`w+nYk0NtL%s8eRjQ+AH6<
z#9IULUJHD`ZUbHulG>Z;*}J#vC7br*Z|oTATk@A9$*`D;zI)p~vpFp92gNBa-|06#
zEbob|aeN(ljobd#8kftHBPPhNwWD11D9F#L%G?n?Gm7`v5@Ds`VJ>qOvfxYZY8+k@
zih^8^_xOzmA6brMCJoDrF`0k#-RbLhw&;7_wm&!Fr5>nrN*ShEuxD&8(;^ur{7=lH
zWzorHE`TsQ-jML$Tzg?zE^{HIf!``<`E+<rnaN(#dk<gI>tzeGhQ<#H{0j~UQ;1<M
z1ZLQ;z-Jb7^cK8M3eS2wwi_(IRLmmn!;9~TMZC-Cfbzdxv@!Bz3(N4f;aO=Jmn3R<
zxnsDt5s#eG&_*O4k`D8kGpixP+aDLoo8C3ZVLp8{-@j(+%L@6KPz?{AW)WT(CL8g=
z^?i9?NzWK?{wV%!c+=zpD{MH}DMixk@UiyyrGlYFcvUj0clKA|Bfi&;S4<wlcO-hF
zPrjh)=)zp4Q`*q}LU$iCKL96-&`a~1?VI;in(_1uF^HEhOO+0l4#L}Rb5fr?#%PZS
zpF1-h$}^RSeDLG>dyCZu$#ySqnv?<udF=<*TFKyz*?5(s3G~IUFTOru5=P~7|6XnM
zZfyC<HAk3&lRR?GA^JwyO}NcF0{+?G@Xl&+wn2S9N1AkE!?k~B0vjn3NY3%uZW9~c
zg#<OV0;Y!LOVLsnGjXvOSAAVOegqv1ccMA=m`H!?qg3A#KO1kF!%OKK13wAtxQPzG
zV(nYfD?G>Y^IX+lLDflLDg0$=SEvbkfmf{h#N!1<CG^w<1i5}SrG?v^g>kb$hs;9y
zfGoJ4x$uCr51?m?p#$%kroQi<IeGb~?3tpzub%ngFCw_Hp4r-1ZD;j8bMnmb{`0z?
zIk_I3tnZnVD@J>!R2{pew1O%6WLBHY{u_xlvw5PP*sxT3inNpcL$!U)lXjli@KS-Y
zH{iXg*2OtP&69qU*ziAl*k&Vx!T)Zg_~7TN=G?fjkCEcWnbjKPF!K%EUY?bXRr58E
z-ZD>Qi4A<_FDs)#E&XOmXIDyW_zgxH9XDQIGaQ+a|0F%!%BmA`OSB6Kv;PVCj03{N
zC*-q$!42B@m7(WtGW0Y$_SopqGo=?56g3^0Rwh?O;~j@$j<W^x;~2$^IKs^2T)`LH
zr}3&k$f_03_Z?%(TU~8kliNlI8W7vCv#codvNj!=fiTDS2`)DnF^<mz1<$f}ue+76
zAWrzVA_6+K-XyPRw8?bJ9NlPlE*#GJ{GDPEfseR1Ru$afluu$YVdWGr`AM0me{`)A
zV@qwuACJr<ng9LddFjS#pbwx+{A(?9dbSZa;%2q}v>MOx+58e4ekA>x6^zM~<Q$)E
zEV1D$)ycC(rpMWkN}D@K*e1trlO{OFvByOEMjxg1ljo}-8<rO!=;VpTGM;X6@GIp#
z#a5M6-S^~4FW4}N=erq?C&JB~Q^Kn=C(A^5v%ya~Ab5TMnLM9p|Dj#xL-*?YPx}Go
zxu5PLF60K)mJCeQ?y~3$(KdMn;+xfQ?LSU#@?dl^d0=eJYN+-Pb(04pi^)TvYz?&m
zS0@k3FnOS@RmYG6=_&tG)t+pbc}8E=+`f9sEE(g+E^xgX-Q<I~p)o5j>!>-J$4E6#
zWQh$glHS5*Q%l#GgR;bi9eZr%;F%&$vS+{gc(n4a8RZ|nKX#HG^x*Rq-KF8w9(IDU
z^Z79jey0c{49=A0gC=M%DwHpalww~NfvQNMsvq;(gHOKgdDFU0bzkwqYi00}J$@+8
zonqclVSlr4WIiaJZIOH)Z@<$OzF?J`S~WIHrSKKbvh?o7lG_eBe)E2Et9GmI$sLMx
zs1&~GAm5&eO+|e1|I{8%x_s5oF6-yP#_dB6??Yo{%&Kd_scpJd;M5)$Wv<1US<mE!
zimd$j2{$<*!{;HQXJgoDaHnF`Z{bxE8@|Opm9kGn;sc_6!tX@8M4@tCF4-vG5IqLs
zeC@kKd=EV*O}>X7Ef(*g$L|&K7tpWYOd$vRu0^%u#7!wov&!@R@Lj3eapI;Es%iHj
z4PSIXWo!DQ)Lk*!2!(Vw<6mE_9~QW4F<z~F`b?Qp>4@zPt?xmh#;40S2-;0`165~D
zP<<~{@y=K&#Yebfqbs&w>1**LHczI_@-*Fm7==+z<B{|uK8&7=5Bm7m!H=B$$~PA>
z*`AD-=qt#_es0hN`6@#%6S|JZuYN4y-lMckzq=HUUW)v)J-r9XmzeIflpiu>0aAwL
zT|<b7H`bZ$xxqt0W4^415ByqQ)W6l&ihsF28Qt;0vhao9KayWnn0-j%&igF{>C2zW
zE$U5Q{=@XpZ)T<&o=UGD;)10kSn&47tYq4d-An^-TK6%@c-E%%^kT-Q`5-6ACP{Yl
z#Zd4PH$BFtWX#Ph|7b63FXq)F{~C?z3uF;+72)`cYkqsJ#y7Pgm)ana&Er5Kd2_ZW
z-*7#?+H<qU>t>XTtCi1Of_TkFp2PkXW^?T9xYdirDo&HAklq+v;P<=Z+ycKJFHnX&
zE2$_sl@jYVXYXJM4@a(EH+L$e6`=R$Qa5uYsyjq@*Laxf=jYynN6K%{MQ6|TSo*|t
z!@L)X47N|Qg~oJ{+BmkjYF&4srp#dU<IxP7CuWd*c`cx|3?hL!$z_F3-zU+y9Ic`a
zbHp)+Gnl7;i0^H-P-u+Kk?35vm4WDbi^JQ7S=?1EuI#n-+FqMP4QqcXt9&MA)duz)
zM!c>imH%GflHQ1xq65RP(NfkOs>grgag!cDhvS4lOV^Q-mu@UCML*C^tZlR5`ZH<(
z`MS{+FVg07(Z8Vi{EQtvoN=+q-a^?BWZDL%DYPVc@r$}@b9&;&8^8?v%TX36<ERry
zIPkd19qpEncB9OFOyvqUeBtVsX`ei+*ma2FiOLEdEs%=S*WIJJ&&Y0O1{fz<ShG8v
zNn;darlXuZ)j@uhCE@=Zzv|!%@U>1b!+sa=>L5D8qz;}f4l-38eE68CgT%uS9Ha&u
zB$?qHoSEG$3SF1Q3;hJ7ami26y5f?}6C?vbCGO-#BC9jVFGM*t5HrUb@-;MGqtA3{
zQfuJ7uFn#v#V;PNHJiaQ3T>Nj->xpLR<}|Xd;7M2nM_tbHnAKJr||hSn;h9KUh14m
zZ4dHXj51A6^6{CO*VZ`9N7v60wyI|H>lPX0k2K$QT!<F-S82A+P_}ST13nU5k@;+f
z>D@!U2RUHcB54)sG2+-q*4TK7<%~?_^mc_4;?ueEf%CDs`&#VuW7)wkA&++*$&ZSg
zAzc$(w^f23StYnF>T}@~7M&cUhtj#J7c~R09^mwM>V*+CaOGiKhxHdXY3*%!A4>iR
zN{dW5{_isrp04jZ6Fs4KnS3vynOwq5R$EBXRHX5LTsCjpb_N&pHfFJClIoNzEck?T
zV#7L2c#&XxtF67VX>dy;lD6Z6ku-kxDUvoKY4|kYZu?#zE~(N4Kd%M}i)@l)wY}-3
zpRT3U)bB-Q$KP~)N?F<`d#12eS91EjsV&#PT-9hlJN`m$wbKZVgI#wuI?i|S?P#{2
zx4st(i^ZC*n>1aABe~C#k7shSW(}Jdht-VXS{RkDGUdOuLHR{Y9u`O5gkeOwYHgXB
zw$JF|i=RQ8JIxs_NUba?^TcMd^NsDOa`so`cP(1ie)UkU&%TQ_w;$DE4s@_QwVEu`
z_pequKnI;39Q><{PE+SBs{7Bm!kqW7R<1et?tPWl>A}GZ_v4_bYR=iz9(;3s&pG_S
z`x)pmxl}1u<w<_gH0Zt$O=CpHU4C!4gi6Oyw}S);IF~`Kp`+llq4@sYA=mR;c}L-U
zdX(S#9`xM>a-mEWuUTnh;m&N&&PEwV|AJ3hQMa4Ab0WGa8fE_)4_c>_<dW0Tj%oi#
zhM7;y4!NwP_7AUNngqh#OCoMJM1qKK8v+K;Ln#`rp~fdo;}7qKM&4<7HH8nF!UI%T
z70LA06;>#Iu=Jp=X8bnrbfTi?J#RML&BVRI8OCSdTO0AEROIiCv2I8B(ZtDmQM@fr
zsTQl($55}2os+6u_f?5PYhzGsDBu(31)M~dCG2Ys(Xc;<4mWx$zVZ&mk>N}$#v1;a
zXQQvy`A=&3yIAAMwBM~xV7GY0wvFX8vN)mVJQZl<lZ_b3yIc2FGHUaqv+}XX7alrW
zJ}uXX^OJd7x?fCxa^ep@@JJ@e(>WZ8Gbf2Nk+GSRkNSlRw#De@ZQ&PpzGU*5Tm$>p
zx;KWA3M+-F>q51#f{>L$&%qkQyV2!FFKMh!3j1{Bw*9(7jT~=S*rzM1<y;wWR98-=
zD-X@8#cBH0`>izYq_EPaF1GHqxS9Erme;-SL|z@p3tz2e4WWagc|E4vf7zb<ye_-&
zd%pRDbnc_&-aQ>_LLM9uJn~((wqQ$n9UQm5+GzGKr~R40y2ki<sP4;6t(|$PQqQaR
zuNI_A`%=>I;#=MOwxw$PPH0^WF2Ksy`Q3XUem7$D{me6e4T`9Ejz`V2v_>y^2cqE3
z+;_>v4OrL_wXkERT6iffe2@DWbw2V05A`;J?~w-iUbF&bb_DqiY=Ws$IQs{z9*Tqf
zMv?7^$v&^3aej{vb~4myD9WWm#|A?|@orjq<|!G?VJYuWGOhzgGZ7fsNnqTVbs_zQ
zoTj76p+)Vx+w+3gNN_(&gYggBYdt0P<{4S8j!Zi0V#MIRHXJdKMH;iu)OlzNusrbj
zY{_HC0p(F}d5q+GH6~MMqis9!&7ts6tCOj9?~B-F&<@1?1F<_|cBdXF;>()JgNwm7
zzDSx<txVsC*>+HbsWYWp`)&seNY1-E0Ykx$vDP?b5gI;Qqs4HNnM~HM`yLf*%iHb~
z(P6)Z^KUL>Zht%1EofI^nxo=K@MB89y&Iiyp3J6Gm&94j782=fsgmAz6P1O5v{7^+
zJ?}`|uvypSQ^r(75w_04CD-&8-bgl74Z|c8=lFiBT%wQrhz`);o&z)3vabr)GJKcS
zc{d{JA-p&IpZ(UTG`fA)sHn&ZOZRJ0qrd*U*61&=%`ve?OS^E|^nrc(>C7EibxPj}
za5@{GOpkImFT|GS%~+b3aW;kqR@RLs#DN1fIBv&aWarTC?&{<rTj3Kwv!&`DeBE|C
z5Hi(_V3&%iyWWa6`Ugny(d!0mB5;X6%4-7-{vTEN*y>yxKAfH^>+a49Jg|Y;+is2f
zdIZu{gYc}kZ2LF6FC#!sL*He&cOmyN+-abmo?FG)cX+#oa8Q8duA^`;#Df>&U<(cs
z{wfsLG2G!Uifegxid>rnN&S4q)8gkWxz7Nb<t*XExDKZ(kn6I%jL#ZRx-6HzS{<CG
zRErFC*;ECW^(qIgyN%ur%WbL5hurt%0Cg}2=V7%-UN5~_BXZ(4cbYMJF2w75D!%|I
z;oo8=ScCWPjH2g9&?h0DHM_616n8mwZ^C~VX2$sWY*$71<MM)BD`8vV-eNbmCtT|7
zNafC5??-q`@#se9gzoJgxrDiOeQPuWIXvZQPB$*{R^eA&&NIf{5y^W+GM??(Jzbi`
zd~Bt%NSCD0EIw?CIAh}`*vaUeCtLb?Ous1CR-ua4@~?MDS*@1eC|Fn;eaHn69&rmc
z;oqejMP)aB%00r;Q$C7kpX!?j?`ICWF)X*0gGD<Q$O<x5seKfheUg`fp|Cwzv<(VH
zcSU%i?U7&^!pp&T;&M-s=ValbIRBB|6Kub@ltRNuwlHmId|EJ6P2^SN;QrpG>N)$i
z>uzVk_L(~r;7kfZ-PX|kN{K_ZfJv!sJaOj{y-kTbxoj)<%I_$z?Se&8O$x?&%1^f9
z)C+i#$=Rg%NO_s^-X?S$81Y6wjvwnc#6%0slhA3hqgLS+@>Y&gH4W^l;eHA&cm;PP
z;e43Jwdk}+2xrwvAeeFqfriYxyq3;zRd6c24T~~t+a@+#iE#p~n0YQ{Moy4nLekRa
z)ks}YQ5}<brRH2g&=MOSl1<9DGtzM5epu<9#)9m#vZRudP%G61eS4i3k$^|*syzBE
z!oDv&S^^?xO-rn>%63bY-6T~u9;Ei54m9qQv{Xxpwp1Ez+vCDFE}IP8aYih6TXirr
zS{-P4PIFIH6H%pRtgf>VL3~bX8*WsQN~`*fI+|d&F1YJ=_Ts`Du8Ggt!)3uBZxF<1
zIU7NOa5{b$1il9{?4OHYlpI%MC~oL}C$3&lJ6;7okrQjd7xU8cr6Po9Z<2%2_C{96
z{><U_V;CO|XYv);^0uo1@VH+MzY-J499<wC_`Q_jV@5(eImbY;@?`OqYE4vP!oGe@
zyG_!R%lYIw()f53f1bpbl75iqM>Pu&NAs1aNxtm@_mx!hy^7Mn@6<#keJbo*t7#cY
zQ!eL|tLD24`EHebixlJGmjbALdPqKjf#V9~i}=G263K&8B~vB{3IzfO^tec6{!l8)
z6;mb%%KcQP495f1qhJw^<b7k&4|+f$KkQ!sRjx0omFIJr6m%q>a^KK#pA;cQ{5sK2
znF9^MKnBP5&7xIg<h3)+NTZI@HRIEOYl+LYQ<j7*CoN+m)m7!b0>4<*DoN5jI2txu
z6N`_sxH-*fq^Z#e&w0xchjR?wVw8DwB<?HBg3)#!5Bn!Vt<l35(0G6kpD78I3@X`7
z!mp$ml~jHujXb}Sc9PQY6s7ttk6`oZWP`yogoI}b={rk^e>Modl173!^Bc300O#B{
zW<_6<#DXR98?$0qlUl@pqWFzjaY2*BD?=U7H)cB}JX%$Z5NdZ=K4@Z1BBX?^qE#}j
zwu+45SWm1;YZcAPVw+1EfQc~ylGhJD8IW}WU~?SU;#j5jZ7Kow8<05z=$R%90Jg~h
zPOQAXJ;{K1)huB(#MU;TEFZmK8+Kyl_3cRpWX{N<5C;|w=)}qkuxP-70{aa}G3*Q&
z(5QWSN?yBEiUTuoVBUa6?JHCI-a7-*0J7+WCO&G5D#H#Edv-_(tC6yf#DlJLdzM2*
zaqWUjM{tx7M_B~dWH{oHU(#5L!L}+J8ntA3zPTAm+G}kx)agYA;0q-Wv_-YjqE>uT
zbZ(|54)^esr|a{rv-UeGP@`^C(5WaZRvL3YXGAQVvZe8PB1&xdm%qAE2@ka(b&}bl
zHgR%ks}6Byce9v{KqH!0t}h8Qwj>afkyU|!>tZ2GU`-hPJ}OYh$bXnOER^$xo>jfE
z@wB$^u*$&_^M6wY4bV9f>coaq(NncRZjGjuFj=mM=o~m0IeDGz<YOEm^2QdpvyfA{
zaF%sei4V?!OMEj`<Wdc*vFZYBOXALk-f7hnjpB7b%%;Y%8XL!I?7HvNEwy+<YS4|v
zNgFoN78P*LbI*cc(I#9VWY(kSVR4CVX|;{3GJ5J$7%I)iesrTJCjypQsHSEM8Cj}Y
z!bm&;3)JytMQ_znyatamgH%}spW2P3Jq0YzvVynn*}WY&&!@&tN{Ze^$2dr3sHZ%8
zsAnhsS7u{zdL9>n*BpflnBKJq+kG5kvv5FpF153ozEjfmjt!*m)bvU<y&~zleSq|e
zrsMWjgl)T=Xl>`IQm$=hm6?V!hAMN=Ru84vgcFp8)b{G_q4y*<@Juy&H}L%T&42Iw
zw)q$E2GAm6iN)>+dM6gU1tEQ#goFbiSnb{}B)km-qu;Y`(Mx`M!v8Z~K(*EX4VX;g
zdwryd?}bVRm24(ikocY`fl4Z<D1+XjYC^z%#nkUGDpnvDGiD|5^OBL64E!(Gm|p+4
zWbPDMum3w`sNL)D!0&?I&5sKid_u?_zZdeAGDz<&qr%+sq>#QbA>mFT{vSY+y_^3i
zWbjWQy<vsFeNW*xac3V<$e5_~&~F>l2ct9i1lKs)sBtt^<7lzQ(Q=Jr4mD0o7_w~X
zp%OB}+AL(@Y8=a0<5<)h#}d~#7QDtW0LJm`fE>;aKsdLP<zinxmo@C4ji#{bC@ki9
zfHj<wP|2W@%_Lm#8I@En_{ej?cdpX#jY{?7QNiZ($>NS=A>mtu^reOPZwJBpjKmgv
zk`P(&iM}q~#6o1jCx$gCDF$i_K5;>l#H;7C;FC{|4g1H#<fnF{xI929m4r$Lm24(q
zNQ_D<LqeV*IZ<hNl2ZQ^(qOZEPAeEZUAXWJA$?~G@y`O`!k3(uKoTM$5q(V(3z3lM
zce-TdELm9+*TCX}qQtA`6Ov|ZKI63DDEPGQSrnHCD5a86$)J+WBn*jBNo7dLGbD4A
zhDR&)k0He;(}fJmcfx}3IN|zUCB%OX2ueU=A(4bgNJL)?Cl(?h5yP4!Sw%u3E@+Z?
z^?X7iU$n#1!tm*$V^CZkpp;5NC4)*flQ1MkC6yr|&ydVi8a68R4<QXUA1Y+<Fd?CQ
zNiFC*LO6dm2tq<)A(4bgNc78V(iFr(BqU;3%Pm<&LLx3`l6dueLXt!)+3FWDvT*t!
z#RQ>bP|0QzjQ^qpDyg8N40?;I2?6^RQ@_KgSb<#3n3d}EL7nRKL8jM#kS@6C;~{18
zlJZmhV*1!7WbkJ~?s!<pR~`ZBy=A*FxBOg4-!FuOj|%Z01Htt1OCf{50_hEZ&ELKf
zeldLzg^Y=+4fO=qINGRjG*#nhvBuGIjbjcqPD>cFY_)-(g{yHaV~t}`YaB~l<5=(-
z#{d{N_4LuI1H&%p;<o4S`#eCyRuU>1RI-_by}+oXvKNqNFW9X#{EJe5oHW?{tdPMy
zLc-^S^vPEN1Am(K0ut*5k`U<yqOa{)EJS*N7}g}oD$)zY1x*sKo=-1mM@UAC*v8Ar
z0!#PqWHBbEaNFT47VS!^duSy}@m+FFRMMxyzKW)eOPX>ypImhht+sd9iOi$<4j^1u
zHpBFQnpRTHcaz#KXrhun750s2T2a!J%lYK0`PTOCGIjZGs^;6Prj=Cl&8zK=ny92t
zg?;^+cAKOrhrLR0)qJ1Dp5d_U8Rpsku$*E3wwotQ8XOlO=cb-)1O7=q_Giijac7S}
zPmlYlOab=-MR~xKTScL|sn@Cc8S3-L5@egPAQ0KR)$N>Be!rsIZSTdXyxPU~CW|$Y
z+uC8)+%hnbQD2jF_ftUFDpk#9XyVZUgvf1XP=X#IvdE@H#c)lE^E3yaJ|IKg5nAP_
zeT4jRhR(w|CQI9*nkCzKC@EVp)~M|i39!k4rdcq}qyme^8nus<3$WRM=3BpMHY;$z
zSfimP3sCp|P_r-q&oic3QD9!#(213oJt>~(vy5~Z!1g$>(|}H_ya09M4_nHbMbdyQ
z0qnFI(2127V7ui=1JG<XAWHzY#eh|@@B-{KAYF!L6H@R*OQilOVf|Cqk@$_<%*q&!
z83X4DZg~Vp32~G~aCyTqU*NbGHtb&&!BIjSWf5Gz;g~OQ+}>k^X%4LI<=L0a@%Bhb
zmQAn$1JVFA2MpM*5$3KT?AVvgb)&K)A;5wGX#l{y0VxLCZ$P7#EM2M?2X@AR83P*i
zHCf)oRx%(BAd6N5QVh1;fJQA@zpoGnw#0!+0~)ohfBn7!k}!pgaEuMyM}h5vhWnto
zP$*?kA>0#m`q@GgFl(in+$9S8=s8-x8fL0svXV!0RwlAWomcSMsd=)Ekhtlka6q2D
ziq1GT)9L<Rb$`dd7&fD7HZiFhH+tk7#Ze8LLLwShh>dpq+P;ri#m0_&?l>nFkirch
zmxBE|qGH=X{sm%3<hmK;wEYW_GPJoBzq5xnQw@Z&*?2V+h;Hw^A}bo+wTI$50HoaD
z8pE?;JeGYP$)KuBGomX8rpsg1rTMBZ8PSyk)8(=1G6!xUNwvrYMri}wNa~}-sAyWQ
zkHDx%HkJI_*le(`Bu2Dq@rsCr&^<@%b;HRR1n@q&_4jc@>0jnwJpYpUm(E`txoC}d
zV&NVKKF2hk4v(zh;ly;1@5KEdCV2vHTZd$AO>*dOM3RA|T*2gon?iUS5aIoJ79bAi
z*B0XN6LA*?B!ovEddAZzXw2pZo|5DhuGF|(4%M6OQa_44Bpo~(RC=-F##i38?Ziv!
z%874o$(FInh`q!;L*+)>0mV_Ru-sVd<t-7x=8cF8HrDb&`g(=PM1qaA>%d(Rf8HAP
zB#4|hoNQzx$!?~WxAtH?n7-~M>2St%c#xX+xAYu`8%?M+x(he7IV=)79+kUTUJ?=g
z4Q5pL|FZWs&`}oG|M(^(5)j;=U}>egDp)95QBXlZ!^`TTps5f=t0FJqrR60JyS`LH
zf}7QBm({eAmRhS=v85I(wxE$3n^3<jwX_Y2HMLe_McwVvHmy|CO3Cl@xp(H-XEzD*
zZO{3g|NopHhwSq_Gk5OXxpU{v+nqbR0c+5Pd=^4ZiHAG$*Y<71_O~ZJPz+eo$Kk9q
z5=J90;5P@hPl(4LNv_)3!^S&!h7&?dG8hfvw44FqiADq%PYZ=YOEj{lC%mVIo0wmI
z^^kBA0X!izo9%d^xdD$GSth|MJSq|4CPsUz-6iga5H0ck6TqE>Y;KWTcrDWA!B>u8
zOz2Sanus(K8~&x*v11pA$2m5NNhrtWt}_A!*cpX#>;$}vEI8Wh6K!S{6`judNBi3$
zj4~*Y1S`{6wcdl-QehwuM#EyTN)yAl8!#&`0Kx!P0M*cNq|Fi;(J2!|W63L^7oQ72
zu@?T-fe0~`U@Wyij+V_Zw2T!+TWJwa)xpw5OP#6|6Yq~N(Uu;uzyYM-i<J!9*XhDO
z+?EBBNHYlL87moTOuOx8j%l}{j8aVaM9E00$&clsn7=yN1fr!j$3QIeibFOTI^caV
zgp&b=j$!;f*?dAD4S9{VT%7tLvUh-n5{L~#i-I)yA<8a4ktSc$&_2yTAVGe1f;@ME
zt4)F#*$GBDpOV9;@VSvW#6<O(ND!AEWZ&aM`oL8(g2Ez>(BzFsFi{$kcl`<4p(_sf
zj(|CigA$g|(cLjo2G6oBLeMUQprHY@G0U*{9Q1_Tav4S^0lECmODdNye%i|Ar8uvZ
zknLaAS?Uov-Q+ZE?Eg^(K-t3QR5RX$3du#LrmYBaHPhcy+kSjA?I4xv7%)~!iDQ6B
z;)Gq^?=;h7F|s!UGn1y_0y7<=Xu$)%a1()GL~4Q{HAU&;Gatp>0V;}J02M_uV+~}m
zRVlCygjE{!K_~UWOq9@R=F!BIu6?nFMpA{t<<Z(#JkUj!mXhId+O!Fc(M*XlZzaP}
zvh_PuE?L?{$#C-9MXY^Qc~_2%bfaZ;N^k&gS-K-vJwcB(v(<Yhv{X&Ecw+&yu8&Km
zcG)zp8*IzNX4#{Jo`hnU9>RO?VoYC=lQ0E~A!L(n0CaqUPRSd=VHWgw(vx^=x1#j$
z>kmNkAytE)SOY(iPLgw@k@}z&VH^rIu(OCs3NDMp8W<4>@1ijyZSxw~gY*!eZ{h_J
zcJ6d2B^@b;Qp6G#tSm640rt({oCJCA;sKjfL{2|R<V?7)MGxu*oq{eV7H963Na;4g
zY{Ld-F(vv>^aoSAUP_J6AY)GC4fgLIVFzcr2QmMqKQ+1{aPbIj7ck<&%PA)d7x@V?
zz|tijpoDc`<Bhpc^tVtE+i=mhVOt%TV!_>PHQ+!Z%#B~4Cn;}5%DO(8ByLW3OOh{1
zrb!Z0egA8&pG>ZMu@INV66j@bWHeQbGU~ss3m0#n>5aEPR^IYqN&}XE2-$3wa(>|-
z*-Ul8ahKS_=5lm6k_kt%;VG+vI|HxmJcP3+b$wJB%M9RS#P&Qg@YmWVDbxQot5WNL
zEW@w#ExC==NERAoZi538tfjKknE#W;Sh+rR7=vO*gPbqwgbf)UnPXW^CA}ErxTRE$
z7N9la-Nk(mTB^Ivbf6MYy@A+wv=OY%!_0xNa`0%u1+0l)HAdy#sp~+bi&J0z?@5u2
zQ{!BcmT6ddFgLK&goUlph28ZSoNaWanlehprFuqXT2#zYJvhnhDulQ{K{+@wx2lCK
zt&98!e1T%%1I%@^(XDzez(Je3$dg&H-77*{R6l{;mIdpsN;lp={Ec|&cMCM=Bd#eW
zGvV7)V|(S>v9~7{EVVYnC>Q%47R@0XSN4gTie}3r=9k@=Cudx`u`Hunc!e*LQS#Wo
z*(SpZKUTsk>r%f^@>l?j58HuE`|P~XRW2bt+iA{(K>r$xYhSFrtTBMMa@I}0Dx1@b
zT-c^(V^as;EJuLjnW*6OK0QblIC6qr(%e0lEnyjhx;tu|CXq1jU6+X_R>?<i_w~P$
zdzpqH1J`=cz{#BxY=+f!8Xj({!Hb8dwlfgupD`WZDbw-7oe%+bKZFxRZFu1s0k`{`
z)%_Tj<Nl_^eY6C2R;{qJ+B*~WRzIu5cp|yvM5LiR92_t5U``V+9FCJooI;+47@0z*
zG2;LLGQ*rfUJ-ldU(h0}_Tmg1lv`OF4g$6_Y6=Fji2XZafwj{@9~nr>{GBeFGvgLS
zsd#IUfe%-8dP4Lt^3ZOj;#-JG!!H$aSpp=B?{dWl!Osh4kmo0V0oIsvLHH~pN+!d5
zHL{0+SGU{|sb_M)7n0xkJPmZ2V(%VVLBSl48B5SJPzK76n}u08YNU~v6k&?w?*MaX
z1r|KfhHEAJlM>PH37+mm^i;S0_GoeLu_5(d1itIZAXc9;Y#WFX20IK}fwR4&d?{km
z7idm~VOdoq3=vP`!YlclHz0>U(JC%)?du#-R)$%g82L4icpQiG`oSblR=zs(M~oe7
z;#%7CN9=_!s!U|T2rpKdBw<T?!H5o6wPhlUpn$k|)?Va&rr8E(R?oOZhy0@<oIUC+
zUON)PaIwrDTXz0|%Utoo*b6M`ZoF0R(L#UgI2PbAihnWmO>|ddG3s$N+<&yZ{I6)M
ztKMPpCN(TB57E7r5WHa$exWG~#6>6BdR}uPaw7r(iwynSc238ObI@)gazk4T0AMGb
zzBv(RAR-|i=b11)2KKdp;gS(-Gx=tX7!eek)36Pb2=Q09Ei8bTi4%UJcqCr4E8*Wp
zG>VW?o}Oe7Zj8-|Y}0oUe-!iGXvYL~LUpTYzw=H&*YO7kv_T$jB69EApJqG{W>BX-
z0)7X(_!o?Bkc~>Lks}$8`bvSZM9hL<D!Oi$2gnyk2bAi?3O$015s;as1rF}%k!^W`
z(j9`e-E;I?6dlU*$7t&W0TXu_Ta7k|p&_UG0jE~5uuHumN|Jp&5DAYEp6G!3eUGsi
z?mY9PhO?RDy|+{JsuVR*a|<dLW}v1D_?`*@ox#$*TGa)1xM?Y}f=9Qh0?UuU#+Y)`
z5*U|I_-I_$LN0orDF~o3ME8x#@L3_qXEM?I%=FR%faL9oibp#2vDebx4~<ON(64oI
zG;*z!kttal;t?|@;DL>G>+@?-90hjO6`Y}%>TI=jr3L6$y+|_w@wF-n4T70-x~s7f
z6&06?>GN%wjK{&3ywAi*he`%hxau@d(yS9Nj9kuL3+knyHV<^vHpB>E4{ZY%J)oLI
zS)y0S@~*ooKgY6}eGvZGap3_sB3KZ)pG!Si8mGwF6hPsg2hCWjrXLwm{&Fg?44M*N
zHt8pmg5c6AuC0w&DZF^%R9i_g<nd49ki+y6TucNutixTdFIc`uHhSLJB>1DI9o&!I
z30xOhT*fJ_EK>^daOcpq*_#?Z_VVUXH*$ybk+r<D20ce23BN_`36mfW_S7zg0So=p
zsn0W!q?%uvcM_OJ`wv7(4uW{xG^^N>sq{_6UNZQ3YF%VV3qvSToDamJo(GBBV`Vu0
zM^R>Lj1|=5B<`Bycu+6>Ry~gGde`=E1d&}SZp0YfeTWDCsJ_vtT?kBTDMeFYTXDtY
zv=Tqh9-l@L>npg^^C2qjC_-SP_vu<`3lM?{{zE|%KZT_f9v$k54Tl^yXs$SU%L1{{
z*tU5z<`joJz14b-796?}i>%OjCg-)xnKktTS$h>;j$rGMEZd`KQ3Wh8c*^cRI1$p(
z(%H{lbBB8(`LIJW5(q+Wo|Ls~cH&#{b7)6dWS2mY+EAyh(J~C~=ozpKt9)Gihd;TJ
zF=!U_FmrZ`_PZbTMWrRRk^!n<fmi^N(Ha=FhvQ1YQHqsA;>twOFP>P}cYG*j_j@Po
zT751sfA2ZP{0K4M3(PQ~k2K%GAz{o!-HoX9t^3Lk#>)2cRBbD~8&|f$E?)B}@##_S
zgLx2pjzOIv(iH}Qp9nZaV(HK(OMQ9<9BZ%?bripJsG@U)jO=-A1{6et<zZXcc<DGr
zA`Jc$subm1S0(oT)o}HTa{y#v8Ac7P^G1vrQeS}-8AKxkIBr}Cr8-M^rvrc8n=C_R
zp#qGngv&B%Y~~$0&nfGWLjtK4Xi~@+9T-RUTHFp6PKuH$1cG%d4(1^mOqR9R2pG;0
z*0P_mnc}eZf!vtiXpD5&If=G2YH&U?(i*rCrWf#`z+)5#B>Q;%&>~Y%h1kn(#7~cI
z%9N5OWy+(4U`lxpgtc12lDULk*eoRXMA#{eaufD*C@9P(NLW(&0>R`QXVe~S*0C{e
zL^n~zYMO_%tfoPv=w)!nIg-+0r6pE^I@@*Y7;zV&wHD9{+l=C6Dy#viH8+(O&F4di
z8>J5D(9qbzlX)Q-zjK|#|27<IU?}lj)eKGrV>kM398q6!0B#`;ctQtK>j0pjw<#$0
z$vNlcd3|<0PD(ijWz)TyngM8+0$6v@$Bme1Qxdb<oFOs#d4|#*l(3`<Rsn^So@itM
zR$X(WZ$>m$BBPOFS0o2iWaku#EQm%1BQn;&^f>N}Uz%nNWrDbvDD6B637qluu74fD
z_}YVLgnBqFREju9Cf0N(M<v4q8KEfCLq3hMqxb28VrctV1LH6j+E7@GwuGy5@QLvT
z9}|TXct(iF8HfCR2$lRzZ9bzOKuq(y0<8zO+<+l1sc(Z1fp`Pc7^;j9c^;{VMv4#~
zZsM=(<@4o48QH${QziW=j9XG40Et4OufPE=K%o+&4Sc~q1b&6~F`zH?S-|d&bfH2_
zlHyRA<p)R;e*FGJRspV&((Hv;(cd?kTqiQu8er1QFd&fLv5+~`3G(zJC1_CSG>hGG
zyUL9{JxSqC%)nv4L8vGbxZ{<IG#k|)(9g5Jo`Z@`iT;r~A1x)GAk+$Tb{Mz~grnOH
zoCPEk7Ge!hsEfr}Ci*&$?;y=^cTQ*Bze#SyI9`GC1gVy9qGaP;KO3O#5b+ukFqwS@
znWb0RN{k1_sdz#lBnQR+L#&aZWg9;sQ*d93R1PFSfa2qz21Pal@jB`}6>c<i(6%Zo
zt$LDSN9110+4A8LSF@arIq`UO%zNA|GI?Gz+Vvic(ZcQUpcKT;ul+(k^d2Q0(5sM;
zgue~UQy(pRVgU>T+bCCXHS!_^YEB`wGY}0HdlpG5V^89amv(9Z2ha?_&2G;+uXl_=
zZTgKc{iW+jS86<k>87^$w7e+$MR@;2J;S^TmGpAm^dSerRc(FNz5zp;chDZO1Q6YY
z_XBvRGJYNJ@43R?HQ^Yxy?y~38XWYA+o6|CUERqnvG75?x+h>ALP{@=PZ{isht4Mr
z{FQ_^dKduc=EZ}glRy+X_W6k{fHA=9S^{yy^(tyOQ{}Ub_csA8(iBwd0{Zv|M>ygJ
z662!MWPpVr3C+pZ_Q()|to6J{|3Nf4>v=wo^npeOj2A;Cfk$!{Qk)8N!lF_1S0qs~
zyk{-EhXroP35QbK;5(5)6OSC}O0UIGOlksyV-UJ<7u?@ZD>}V4(314grAk3`U&}vF
z!)UIh<*mX|@X0r7k3qA{pgHt!pt%Ui!|gs3b+d{39ixU}2v#H+Uu%MQF}OD;N|?v6
zD-(&9VglIJkHRS`>pPh!;e5lq4z{n(df*!<E{A`Bbe8pAl(56NA;r2R0u#O=y|g#7
z87O3Km-+$T0Mo|~wZ5g_d7*2CyW!?>JAEV~K5!Efm`dM>1<8zjEEC8=w*8$xBnRvU
zDZ2>Ba)murvP(}ESWpr||CK>;mJN=g31@=69M5`dxi!&!NJ{DG#PGc%3J=$_l343y
z+XfTh<Ot(j*E>Z2psY-B<UxIbWHL;LPnKk~R7W$Ig^Cin0TqxnO7MX7f$)Ig_&HdD
z;X)f$y`ww!^S7auE8x-i9z5Lo3X5vkOJLkair!yfkru#?Jp;l`e0VIozd?TCyaS`6
zkq$g!5u(<GGzk_XkWR*EcG&YKKwO}w2w%iPg*p8}q$hYTvLQ{LAZ?I}IslHnIzC2W
z27(|)vV}$%h<-|6h~ZLbW2vfKHJ$f&x0(hog#XddAv$_ubB^IvSi5hhr-Y&ca{iW;
zX5GPK<RvTyUjT(iVd=LqJnDs|lwcI-*jO58K0Puvy2s(_Js3Emt^XHXO+mf&$kiWq
z9EC$;I5=fZ?Kps6Z0fK~(Re$4b6AsGUV`*2LV~F$5dznw&K?jI5v2K6w%|aAap59Y
zE>eFzN(r*t3rax2%c1>el$PX+7{&Bbq1uTZTZPghgk`s_gQb#sbYyZTW@`UkWe&rZ
zLXVaC#$S%YivL@cDJA9)8{n@n`$J)mxiW`km%waXp;=4cbjlEjU#8m~AfN1Wd)Vx<
z&J-@Ri66lx6}=&1DJed1J^BY;<%4TO*hfcxqU3%PgNd}4J{8a<^<Dcyj?#}-9gK#O
z(Xs=W^Mj<kR<79jJ22xL?LQdZ_2FyY8N1YJ+Gu~$`Gz+y#A9jC#A8nf9<w^D2g>ts
zbs>6(GzKql+#nyxbRSH7GfSp4ao!^Ql*MlBq{uEo!;NSR(fC~aLS4;~hxn-pR}~jy
zw9JW#>Gq@k2ho~j?U(y&{-mx<!`zR_I17Ie)_+m|Ch`hHxu}1$h44QZ^>2y!H^T!3
z-qy!7g}>fFPLTER;Kk+>b5Ik)t)z1yq;QV9vkQI;@L7UAE!|4G@W*^hB(K7q*0CL>
zph5A*%C?|hWL@(HbOY!!gy!hfp$_>N_n~{{#3qT61ChLq){y$~i5Lp+U}-?>vz!gZ
z%8C*BYv?@#KlcfR{|VvmB0NjwaG;pR=D4#v*(d7X8uM?J#c`4*oWTwd**(#}Z8h_L
z=qbgugt#sQu7tmqgr_FL($b-oL(ffMTrG^pWWk{kQLH<&Mb1~XLy7uvC({OXS3bw!
zKAyN=1M5(qeXFN}B)xfA2HBSwpm*N~&<+6E`jYaD_HSjDe)#uTkFgU<x;5&r2QdM=
z0@A1iHS<!c(8+q+P<+T$|8%DBpeW(5lQMl3C_vqD-h0;Ijj-{-cJZox8$t^5W%9ot
z??8J=7p4%n6RXu07KR38_~z|M$X4C#rOp#n9}5Qe_sB6D42vu_$WO+?giyXaAcV-E
zBM<%;Q~RXYxd{~za|I@(kx6S3Mz+MyFeKiS_je@T&|_lMrs6ZX(trqa9f<30tdyY(
z;Z@o61!<tj<M`m?>#z-B!?gB$Vo3VTkB6xb`|IG~rEa2sy?6Z=G17u$6osZhj`iy8
zAd0tH$C=D~H+__BM%85R0a7khS{UVTPA?XPaa9HlNLinQW<6_ITsk_K8Duc~w+O1n
zn0aYVpBOOLp9RAH#ytEqL!%b=UF&sn@kVw+L&f~{&{@b&TG@6LvwDeei&?{uGGZ3R
zyA`wTLZ-O*lKRsr;WuHEnYt24j0C5#h@UG7MF<-0E@n?s<nVj@nx@phAc_{@_?{6e
z(|VIh7q;fqRu{JGx?}4msNSddSc<KjtLn(x1Ka-YGVIFik<_KG%vN{LjDqd(LaB#r
zw+f)Et@KKQm|(SWJ+KGicM%dvJ&k5!d3b4eLRe}c#J0xXTBr-@v#?51MU}p$JI1V{
zQFN7Q(rjg^6Me*~A5Z!B>SO-xj=ZNnk7Zd1a&~VwMO1Rj&e`Y=&_!JHC>~-svFV3=
zOC)c3=LlLX_2_fl9M00Ct$?w5^aaAJ9u;klmBOgMCcVrS^Q_!rc2}<sf7Y*gDZHWv
zN~5O+-COJBMT?=YrA{W5ZVJ{~3VLl%TQX|nsO@R}nx_AZEU(;~mbw$`qFJQfX-WI<
zTITvS&HpJ~ccL>-y-m&KVp-||m%#sTnmHKxziZ~}*F5r{QqF-*YE&-e?xxzS&M@`;
z@j9bhc|>Py##-f3b;kNNk^i(*B`no!4j<h0ahIz;dR0Im_LvpW`Zdq~rxXTBA(Tco
zg`8|!VeVC-8NT<T&}Lyd@?+Tgz5kTx`5+o*1ejsa2d_>kx{q@c{u&g+llD>Z<cu7`
ze(ED<#89K7+R9hL{#u0BP89D8-n*WLY;efny>Bkg2sq<wy!W0jYONbdEm<RD4vY81
zW^Lu}qYTMg!&O5)p%Y{NV$wNe{bM=;HWR11NHxj}GH`n1eiR5w-%c6)b?I3cbFf2c
zPRh-FaIF`gifusb2JHFZF(wpu(u6SA?)3x_UID1EzZK)7y1eQq@ays3djR_F<B_MD
z00!c4V&Y;7x|_JvH$kq0;y4;1^_05<Q4nsIJ0^|_l>hNSM}a^|3v5aIc<-AhoUQY$
zJ;NcQS2D?)wcIN(>^@p9RXF%^@1sy>4*1c?PTc`W@DRrfR#63J@sRs|4wk+j%fsWs
z?Rg&yRCp{vsEv=u)aO`$Q1*|*)SCQwn4>_TT8nJ8qP6n49);Ldt-W$Cr&^E3KY-@D
zB;aUV1ZW=@=+Sry&;l3e(KrgwLKo=K_zKYD)($s<b5!m^+;r;Zt-VQPt(*E{*GiQV
zuG*Xzn(gY#Hl{C*`8TT1QJI)gp~;kQqYlFOjr)k{<(^Y-eCpIYykaAC%|_21&8ZZ0
z1Q7QLa<yjN_aN+8t=X#M*ROBnCk=o9wux_v<fhlS&&xFy8If*GAsh{6BTSM-$M->r
zEfHlKqpiHkP9pM61gL5GW4<iFU4gI+Nr-TP=k)-Nu%5uV$RK%I)IFBe8@-l9=kzbI
z6-eKKmR}rN?Q|R5Rg|sNHay#HFUBQA<K18O?)YgAeqjj!R@J)@(!Lmne9^U`DS#hg
ze_Out3jGCFk*w(`=D8F6HI+}u%3{uj<GO?G;3(GI$0Grj`Nl9^!`b|ekHjyQ`G(6w
z&dBGiVuza;m%H#6nTfzygsDLYKj4i6zbLmSGzaCDtYV(&a(!0j%M+6vW0E`8v`LDA
zjy3u4aa~OEyN-e}oBkxiFBGT#EZvsH5`#_t?o1Xi-A}+z2h!>q->&4XZ_ARq3?hsn
zudM8yfK4gl?e`Yu@!tZ@gjjTgH=fjD`K$mIe(HtHn5W?Fb|-8N-k{4dXsE$2#|~&)
zc*t^A!e6g}T;xIEMoH~|P`@^5y3P8vMbmA=#v&lM>!VQ<a1MvSW=-&dKK5vWR)yTJ
zk2Zb0t_j-paX=F!`Ec>5*ch){6Wvj;+2u$UcEL2}=ACWs0QVVvX_+omv;%jN)@LDV
z%|+Cjg=j7^3^%c%WAF1XD3Y49<Kr!SxUwiIGNU0pD1BT%?d-!Nkx$CHu-+R!J*JD)
z+8+Klg7vSY3Kmvy>1{#;1#&U$_h$bi#RbWP7?88VQU&rkorLrAb^N$^&<d&oh+|XC
zFos4@w;<FNwhe$p;sR8oY{D)QSc)-pTdYCb&lN+}06h9z?~}R;-9Q9+fA>DwAfViI
z7zguY1Ak(yznao}pL{VU5Z)*EMRE3=*j;JzV34b8;CO?Yfkn&CSFnm8<iVJVndtc0
zyB<e~5WxZ>f)CTPtp5{wWT(=o;S$N$en(Z#i655m#^9kJqasu`Vc`z$CMT1Q^WGaj
z>`HG|<c(b;v~rdy%}x8WHlSp`I>*EnEn9YQ^fE$NV;9KMpEW3@0`3S`?adE<4!;G`
zGxgm>ebBP=Bkh?wzs67YOiyEa&Egz~Y?&qm7urcyefm6T<PJGoE<?ugyFz_s%_m*B
z6NLghuoDkC#pyI$Jp(7&xN*>*oCw?2MEXk>#|_<ZTx!!9%%&3nc8*Pn5$9ry@!G1d
z9>l;`fyDHIX&f^vaAo#T&i;~a@c;J=``{sE*kD-nflUc$JY`tqTYO6-UwO$e>@r)}
zu_V*`j1cdA#<LiAyY|GfeDrd;rTCw8g~c+jJC<pt{P_mCa7Hs2X`*n}!ZHo7k~iEv
z2-l8Vj1xA(w;~tczSW&?r8L=sF-CK=>^V3#M{-OC#l4BX7%_WYBcz}2fLT#&R-?#;
zEJr->I{PDRHHLAtOnRc)`;=eR82Y4c6y?XANLr3I!r1|LL9D&kDmj@4qU{<ZhDBo2
zo8>p1<-|=+G;FogVj1DVe8F*ZU?Vwfaz&aW*I+{*j4mLrZ4>>kS4LBtGeo4;<Gn{Z
z+A%=MTAj9Zv>%NQjqH&Q;$sOo=yMSX2Lg1|03sphmPqxm06<iU>Yp2+#PnNi!qrGR
zWAvg&;-ZB=Zihpu%tojUemFZAt%ir#76;;!{|uGCcyS;(q80iL*BuozFlhpd5tyKX
zcCM2ulepEuC4b{e{7Vz~G6H)_j9qoKR}KheXSEZrN7HN)T{3`oF8ghxITwM@RWLw)
zPv1((adkFNQ({!S|2<)92WsBYRKG|)q5=sW3WTaEhkcs@+p@DpTmG*g5ZdxLV_k_Y
z|M$N>0!N+k$uIw2IrR~~<rd>lGV}=(`i=?pHZ-S?j}?CQP5P6<M{TpWHVp<E(q)%T
zX)ftgC+1IDkaudtk~$7hnjE$!>-_H$&ZtFfE<{@~l!h@-3*z79R$K^|;vR`|ByCI1
zafG?oEC;p<u;`r)Mrd)EXuoqbjLaANa4<$9r+eV<JIY^|a`xVJCOV3AN%vZMyH_l4
zcf(To3)k5pZsc>g8HhG5<yPU2Mf`1`*F^VV9>%7-BWn=|o8xLe;M)5SeB%2}J`<5z
z`Q+HA&UveM-ZtQkVxEXR=!9)@-Zq;z4yf=davN!sHw|!X{p=^luN?LXc%o#e`IIye
zsk`0~lR0Cny&OKU!c8ohb2sJn2tslTe=6VuaQ*`j7^&fR^6aaw33_X<z^;nE-m`81
zUj1`smU?TuFyPnMd%ncbYo-Tg1aFat_nzw+GW{z53~%jDP^qu?Ok?PbsY|8>izm;S
zG98h;o;r0lf)f!IpUjB~0Td!3Ol|Liu!c%~190IcGEqB$JHM_?=PMXxq~d}^A{`{*
z&Vgbndy4`5JOLL0&{gPLV7-R19C;8$^LCgKaD`7TFcBCOO$K(o@qW{K&Hkg8f%Sw8
z)|l(k`!xpURl@w~_^h0N0FxRy`X==!hKcePEAhc=R<IO#vSQ^kKRCtxSrFubLnpQ<
zc&7WaSPFf+jK*-xidnD9&iZqbH5@%r`oc~8Jx+|xuQQ20!$cP&kw*66?T4BCilq-8
zZD2pbm?d?B3$~xOl0NCvW12yG9!!mBp3x}-o<wpFll-2CEHVs#;Ll_SXxbt)@mH@`
z{gp{{KNEc~J5jk!v{e%ER}*b9iEd`1FJ~tjV-v9zhMV}CC#8>=M5CB!QYMk;;S&t4
zkO5=3@+AZQuYCX?2=JOF(GK1SmS`Zy!rb<Jls(IXfkxn#My%b@=v2jA9Ia6bV?!H}
zx<p1lAHMIj16u!NUj;7dKn)I!k+*}ss^Yku)KvGgjU8*yH{nADW~rrkGa16SB3qj+
zlw?}mJyT%!hKDg(yzt4W=Fp!xd>Ub<F-p}gHzTq?qccx=5UK5WvIlBHEMsmk0DB4W
zCX|A0=#4*o{PD*Fm~7D2dS4Qb>B)r#{>tJLW`$Hq6Lv{HCmA&K$dTFzG>OQ1#G)wX
z-c0$7591KfmX7`F#PpG_=xcSgL)wX5fG`k@&&2|k)8;?X3yfPYypLI1cRb?jaCdDX
zkz<}liZI#ZW1<wtdlx5=sr^uQZl+y?!+j*K5rdf2FA)i1*s8^B-?W)?4a^3@d>=4Y
z%4(lN300%#i;qc452}^x7+T$TNOscyNQ*s$exKRRAgUV?X*eq+iV(eRAU;Egivgic
zxgf*j^k^6JFvxV6_gc!u7>5N?bHa$qMCujYBoZly>n*AUq3bIq*QYSLNxcA|SOe2p
z*@UDvo7$gdAnzgM1Ax??n3d>g!{X4DiO5Ezrv#)imvKluA7*V_J78pB<KpNB|8MaY
zmTxNuXlD~7V9oB-2xQ<w<#(ZakD}6&$(Cd8A@89H!g#Sbx`$I|CnKD+;xM7Ne14E>
zLI>*>3!mvV9{CkYxgC+F%7dQ{H)U#bj)A(9Q1=Q7_U`$iQ{az>ipY=)pLQw^Uj&SD
zHYNiVteSwvT0r8QpFL374Q7H2WxQbwU?DGcfQGwK{DzzOjw1vrL_2B0J)zY*br<g0
zL`3?yeUI^(ouMMDJP>POoM9iOUAy_o30Zh-W?Z<55AEq2)~VpuV-q9wC`W3xoiqq6
zifFZo6B9rX%NEFEHBsiw8HGczLNbE)$(Z6DPrO$GuVTrQgsHO-;I5Xa(Xjmq{b`9L
z!#zQB)pvh4VK{eVGI`!4d-<10_Ab<+A&1BDt<*wZjE!St8!1(SWer9G+}(ip$<|Cf
zSH5bHBHXl@q<DFI_a3;&!3S1#cL)P4uRv0~fiY9yc{RE(`Y-B&`+qLupQQ*6M5kJk
zP$k8r-$=z6rCNYcSxh&ERb?<6KfMlBMPh(+3s8nm3^(!FC)m%*FkWQv9OTNOQ3Ybb
zCLht#0dnd<BAh-Ep(d~C7!KKVfdMfoj)@AyDvGhBxrrq)guyF8O!{|O4nI4I7%Ycp
z$~70Oyq26Vn?y3+Dh^?xN~uHE@i_H_MXI)JZ|UikiR`RBDK8LZC18WkPEdW&JsN)l
zov*30;EkN&ee^4x_w{LU&--36p?_}HP&4nlaGx{p3*uIB!$wRt^VfQvTocJZci>7H
z9g_rCbyEtt0RyzE^4C%bg#R)FQr^oq8BYC!gNE(y@+FeT!`Bhm`dQ^h9tvmK3I`H~
zydrlk7g;hXXb`8j;7ZO0W#&1|m9am47YoZAuB5()A9tJl$KBe3Z{35&h4Bema4Qmx
zz#C3sg|5)gmgLa7!aII#V_TBNb%kGYeHPUf-sF7N6<&jPjCTTjAoouJH~rYKPl`GN
zHaQdYI(ACZdG)4@1TF@tsqf>66_#ML4zj)WJWH5!kgY@xvbj7PS;tg?gufGIz%Jlk
z&+W%?#Z|ms-(905-GkPrynYUBfe!#oeUr`+;o)+)(pwuq93w=ei>lFv{LKkm8)(*H
zHM}@v!lA!CX}Z=PVt9InlgV`k5!3?Lfw`EH444TgDfHGpio_C1ubKlU`1g8iF*;^Y
zbIcR&ERxgQNv{0ej>!~K;|(&PFBJo{1f9ln*5fe9V>W3nejaP0e`8?g&<5;fdnvi%
z_n;rpbfz!~bV#&bB_QgW0k*_YvpBSmRn)3hPtb`FpCzpb7C>Dk8@G#9iG<Fan@CiU
zhi2l)P?MwT%)@BgCLJq*aoGnXZn2A{I6Bn`M_1b*4qM@;Y?FH#0%ypO5E|UyIy2_q
z6sy__KMC6)ZjEq2)*OiYTW3XE3@5)P=isyV0zMDta+xJPb6yMdqYRMWS-*ymt2-2a
z?nb-p$>m8W&)3NTFXJ^#rVh>-!|$p-pu+_Si?pIOz$79I^BnqF!}$)4JZ9HntOH_$
zr(wMH=qb!uZMF>Tg>ktYlV&da581pL@zWe$vB74YKz7vzSub0t$_uGsun+=4-Dr+U
z`>@g#?kwiX8|+3PdJ#Hc<x9_}puf8_hXkMK3{zc;-Z;`VX(~n_%q@k6s{#kSS1@K4
z+^aB#XSub0Q`oz;@0(oj8(i=I<9dG<@3OAmIUqO`t!ZTNMEs5q4#4m7AT(3wnjC-j
z;v21Z0XrXTb_rNH*pnq-ILl*>2+<=3a09+8eI=cTU_^f_wi^x?x2!l=Y`lp`KoJ6p
z0PdBq0(=$VtB-u;<0~IudADK_@i3O>59cmi!@*lw8HU1e_Lh`)4639M@a{HttVFaV
z>FRClSR2y<%Q7a&YlV|HuUElway-vmiBPOBSkK60W|qU@(=A$d2z<kZ6_Do-+u*gP
z{BXJm?|555k3F2Z+)C4r4{A}LST%kNCwuYv&0G1o8*lg2@GX&itP#RPT{0S;WSAO`
zgrvVXR3uL0b{GV2D}rks1XmdZi+}*foj84Q&W=<h(4`dQ<ABUz8n9<a-mj6!>`1i3
zRm(VXizA=No(G1dtA-mBbYF)&-pG&e2AS(*Pf*OIB=|)t8Q@u?q3G`0Wqird!KVQ>
zeTRkig(g^NPnY1}-~jy5(81)Cz7EA31sgbq;nkz=|1t`?69?THZ9Ph<V=3!SiXQJ7
zH$X^-ks(oJRh_mv_SB{!{Rvx7lct8WV?b5B#_w4e)y4~pszDWk-ujvCrI*XpKwIDv
zG)#-+RM-27uJ>tpkFrB*kCtkG33Q)hpme_N^b4h0FjK;IEg@3i*e-lR=|fA1FA|D4
zcJ}Rw65k0Zpn!2X>kd+V!&;?!v_tjNs1^w7fZ%!f9T^;r-|@i__+1`64Zmxou%k_~
zL(kj7R-0s@(a1nLm5XrvSc;Q09Vtq4W+tq(AkBSR0iA(h4xOS{bjc)^5H7=N(0kYr
z<Qgf-ezZ!-4m$bM#>7H4aqAH7o}y3zoddkJZ@A*#Kpa{wP88-*ksZ#5F#~RoF!+W$
z_?|=>o`jbXSgDCFbfS4GhS4GJ7qyFw2Z!5NpU~JvQAe3un=FsM;G*MNp;1eAh3owi
z*ZcXd_p|Vh(u@rD$M1M=<Ww{_zJ<ovQWv<OJ7JVz!w<UN+x6WLjA?_??(;@?EEWag
z`7<2Lq}0e*cM!}CQs2=y?6G1U&f)R~!38c)rFcm_u5*H%7P8U_QUNXT#Z?^jP(EZ-
zgcAcPEILNUA}1kAB^RDK82V|3#tVORr!utqIm=KUNJB(}iCFAJ{0(%1J8qG!FhElr
zpuMibB+!sWWHN=>?gTl7dBh1~VWi0SIzi|t5BCWU%3|M3IB{zs7XcEU;gG2(?O?nb
zfpiB4oq7D)KY`>mAszohaK;L1&E_+%_fuT&Uc6&2A{s2Cn7Ow#6pK38+bWXT)DDk4
z8ahc&G~R&+?AH$BF%u`q@o*2Bu;qmd(vX0p!l=u6yWM$P<GlHtH_ntqHOCvwa)#zD
za`b&>oSB0!$1oZ5Cj!XQy7yr$VPG4e1_7CHdq|hlFM^6%w23BzxV&50cn7RjxmdE(
z%Edqzdb2S@z_%+E@Dc~`fS1$5=ZITM9FtoDqf%zLe3o#QIu_X@?<}{O6Gn!~J7=rm
z&H<r`F<G+-cYdP!hM26C!H)pqMzw~ML%G?%?4@fl;s~_-$=A|(8dvq<S0qC2r9W$v
zdaF;%PO4i}qu`1pUtz;d!tapDLW~HMAvNs1<eZ9p2V!;23{b`eVl}P&8r2er7n}f}
zU811wxn0?D?z5I}ub_jl#0(7$Ti0ajxr;rX;KiyB6ul>X8ZJ@-?H=rMpqInZW^vc-
z)KgKoiNfUxenMaJ*Paj)af`~Wh?IX*k3|~de9M$f<K)VfF~~(t6cfpNK`3O1RXOy_
zO8aV#g+PEO^-0ivOjzQm{Qxfa24bu?^5GGbBUUI%pM!GuzzjRQ-uwQ67L|yMV*>m$
zRS_JpPU{4!2%|5v&WzSuupQaN3(vVtvA&4Q=#|h4U`<4Z8#LnT&(O`@q7K_ou?EJ%
zG`Fs{;g5VXwTS3tIni%rM_-W>-HvEoih+y<xlE*OGLiHVQm6=Q++7=a8-Q4>X1>_N
z;A5f)r+2-Y<8krV3Un+^p@;ZlA=!$*xjm~;>@i`nM=>4cv|CXDk4cVH4ZI(SOGMKA
zab=X8^NyU2m~^=nzXG{t$U@|Ci%0;bTYw^X%eE*?oSXfT9}D}R4k`PueA=@AZ`ibq
z39b*@cyd9OeJxTPJa_^Xi3`m^jEGfOKF8w|8zWZ0SW$0cFG_UQB*eMua~Kl9k{5xo
z21a4f3{T87*^g{spa>9F#i9+AByGVP`IZNE5<(o2MObrn`Ns-PF*tT;%2Zu`xQT76
zAOxL5N_r$oY}iE{bRAFY1Nx&h`~-^#yF@-bcbt)sBIoevr`S<)cx0r@sk8}#*Sj7t
z?80IVwZLRzb?~toEDlRmaHB@@ruTW)jd%SLBul-83|*Bq9s?{_RlJX?FbP>>=U8e=
zfFKc>PQvle);%N+W~T_``5=jHY2qg=cYEazs*E7VUS%2RW2v$X^nYJv-rA2`g)PD!
zTt*q3gq=0i6K}mESE5p=|Nj+RB@A;2qgkwkbz(uRX9*jGg7+$6KSr`twJ7}nxI$S;
zL}of~rOw+N=WVX@cBAuli}SX~d0XndEjMpD9lxVuO<}Y_EWoax71yB|6<QpX;~iED
zT8Lt~L`|BFCl7-w(Vw_`lTQ|=S1mY{*A9{}v>#8}Z}Is;7q4r&9l=Z;`rNvvAQ9ms
zbjG@-3PFml^kmnl0htjES|z$mzF}Q}L;SFUV^v9U1aZqF5t|#-@W%GKYpba6k5;J)
zuiIu-_~(uz@yroW&tgv|oa`Hou#TKiFV-TX5mrY`26F(cw}3O<q3<FTmhloq5&*cw
z0<wl<5fj=ZfUHbh4XJ>aSU?JZ6S_eFS=X@C$8S;fDd8q&P*iO;#)_&@UIK8vCNpAq
z>4#F@<4t)tK55H)iOAqcBmg5lso!$$Y1mmi0PJ+Byte^h_Q7Zn%C@i(=>qX#wpoy~
zXTEquE;phWis2~rYY%WA{lW#u<2^kA{Z@d&va8ug>B@KdX6Cj70LEQZUF1{95<V>X
z=qE#H+YOCSvZWgmx-$9Y!BwK9K&Pcc6i`wG47@dLI1#Qdf>fp+1}{`tbvxR{msKKl
zb$~6-qV4P0)=j&|Mb9H3Dz*!1@^Gfk3mRCHv3LN#Vx2q;3zIn2D~0Zn<W{<ywJ6w7
zVhti>aY~<{_#F=F96O5J1%-%ToN_5BzHv+_>`)z!Ro5fsnIgV8-9U_Simu?g0=QU9
z5FlfXBNigrl{EZlCDwgHIOpx9j@F>Z?xB~DW2dcG9XuF1*h<LkaMLhQ>j_<9t3NZ1
z;JF2u_V6s6<evVt8Qi+0h=ZB%6O@+%oX;YrJ6^*DG<@;a@|H8#NP>q~oLq2Z3qaU{
zkLjK6wDYiSfd>M`=*vQv6vP?`K8nYKY@p{TiMIeaBdO^xx(VNeIJIG~i=2XYcO294
zRH2zH;ILhTg6qk`?x1W%MAE$#VZc5H5w<aXMdku5glpWjuhWja4xk?G{O)?4)=iZ3
z!7FWfx!<QPv?$iVnII0Wkz7?EW}m7NdLefrhFv?+F+9#~nz-=VgVbC`)G*z+i*Pjq
zf#D{uXL!`F8Q^5AD8evFA$kpqi*7HoQy)RrS^KguJI5kDc938e&5f%5ShnfFvN!c9
zmJ5@(xMt{W^KfE4vt+(v8RCq)rTKVAWx(B%E+$`$r5sF-)$i9iStub{9=&UL2r$P>
z;lkD%*oC87J*_~OVBe>WUg<&E9&8RagDiZ*e~Ij!>-!wMbC~T<;;cm8T5iAz%#kg&
z2RTz$9wqcF3k~n%NlbXSMar#`Ae@yR>=$%WH#@1{k;dR}d!AE$X8xKh^H;HzC7I)(
zP)89D3UzpcBk@}tJOjT&iMGR+LA%UBdv7k<FwlbQIH-}n47B7E%|YC)jNkr3-SHVT
zXE<msw`lqq>LvkA!hZl?Xu`^gAMWO=FLx?D)lLE5{Jv$6wsr-r5m1~d>2!f^cR+vV
z!umS4v83o+Fcsduh!FAMIuVP3MWp#~afarV4i<G^a3Hg12&Ps-)#03L`fMpQ)}{|0
zAL=XK3e$zM0s?7~1fs5|D|EQ3-NRv?W<StofQ=B@(dH&N&K)0OE2-M!3G#an_YwHr
ztl!OCDevI|CLgyP&4MM8$!h1HTG(#%{SCZJ>B*}+?|nnH9t3Wejl)7aCi_dlhdi!a
zAMWRkyssQgI?}WrOtVO%u7rkx-r&i?#$x;q6(m@$rWqvDI7luBlJq$M$rtcGL4x-e
z@Z<Gtkbqkmadzy%_<JEQk><5aEDdY*n<vhsF#muZj#jf22AiOujC%*gp$YQNm0vHn
zNKx609V)TD(5c`anBqyFT%SIvK3!a&9$265U!U$<pDw7!gv4fW?PHYt?zeOy_srH)
z676g;j^iy(`2T(yZr;FKOS1psGyQ*;3o;IwkU}S<Q$lR~VM>7>^Wd7pvX|7+@t=Ho
zyITHLkXe#M$L4Rx$OSTTH0V(Rhm#yQ@4>S@#{`R0AFcx!SfiFj$*5e<gcH_sHZv-B
z_h5~h=N+*|JqZu2QS(@&dyQIl;N@5=_0eqXUP%pYKo7wKvkbh%25xi(jxvFAd=;}3
zz@mcK)!Sq>5F~ZcXhT*?$R-!e+t>$^{5HD+DS>d$=nA<&LSU)kAU{(=wz)zENyv6r
z$lVrsV?xfi=FqpqMn4C0Au<r>e`Hf35m{qOlYP{BUDb8~<;h0YTVGHGKIu`b`pU3^
zvaV{I1MxEh@hJylEFknic;B^y!cQzkCPm6Q%682ET$sME#Rw5y&~x-=0Q<DKoSu#O
zH;aK1s^k7ns5iMyDSeir>!XH?4rrq&wl6twm?g46vN&75KnV|j*Ao69CV}7@g(g<E
zO?rBsvyGK)r*f0yvL0FSq#(r_h$>pF&sb=C%ui3?;@omPN@`Y>cio`5eA>z7LQXX$
zadx7>W{zE8kVCa96ux_{rhV%XOX0sTZHtvzk<=OdCTs?hL*58o3t_edvhYzyPD*Wq
zlC^q}p5&z$gsYzO1W$m&v(XW{D8c}jt2BI#!ph3uj17C9kY@4Nu4yAAJ}QzZp$U(o
zt<Fk15+;7Q50DN)gXLago9N%Z=Kj=b^zcGn?E+M8xN4I}4%6;odm8&46ggh_?k!r*
ze{QnnJW<N|pvgeX*@#`XSe#VF{F^ep*8hO9v|$3<T3x8y9u(A%mMQ9o9MsQ%9?O^D
zohTi~LH;%s40V*zzL05Jc6OeOC+=?%6ttGO!q9o!H!&KJA__xCVVAGX;e{+r-_7x<
za&RMjFt+9JWz(9yX?P2R?@)meZi3OKO$#@_fzqPlU_MF{EnLCK@)%Q}!{3&&JvmRy
zw(DWbw%=nTB}15aG&J%Myb4n`u+9^@(8(u}T#0=PQ93Wg{4a#ttD$?N(&X{k(%BbY
z>5OlMH2TXLPpH^__BAhbFY2w8^%qKDtq%Mebt%v)yCTg+=EOE^1%xH)uY;$%iT+J%
zfR5sdmS1OC;;+kie85?OvO27qfPM&~h-9lwVK5tJpxnD~D69Y)G*KA4CXuQqTGI@I
zGu+ku&-q%-qdp<keAjG#vYHp(tbDC+Ae(X9maQ16+8=geQajm29FH{FVtpFhNwEf@
z30p1GhxAC)Z@@g3)`jCDZ85g+SOX>wTUfL|6T(&D>4k?l-4cMT!u~Y;1gkjD3L9Ii
zfBOUxRPXxtIqgNu_tyS8EAP~gghNEfhOe55=MLZu*uNdhVYFnG69<2ZjxLZ4(l<Ch
z2&pc3+%>WQIN<;^qeNn5a8rm`rOVZeE1Hu@CPC@o);8>~&kH|6J%SwpK0MXm$tpDt
zbNIJ=@0)@sY5PI$`lB%?lCN)sCK64bzjnE;{LlhzO0ZhVG~G)P)-JRzBpUgU)1w%#
z@JmnUMi|Mx5K)P2(Ct0(c+HQ)O&nWzf@5Pc$WS2+j)+xlhh-)9ZV(yUAxO}w&6Kt9
zr;swJ{e*ujg+g5UZi)G~&_}a>bJV{HdO`*d&;vQ%7=H8hqnY&m8nQTfcInjdwjbq`
zLPnnxpg%D3&us3)q-=~>17dI(EqmSc{wa26HqA8bc8RL!Tvydug9vZ!1Ng=8wYqvr
z*xw0*IQqB7<#P!2q`rY4gyi`TrBAUaJV1dWw96sd_JZ(=PS_~mirP2RvklI*S2WV*
zdo)a_VCAI<jp1RyV%fO^3yA*r4RX#?P=RIdi>C({()V!qpT=xrm*er?Hx9hdF=@bP
zk%JUiG)RMuYRyEA2MlpKi_zkZNQlv5DIRF(3YkcL89TbdT-o-%%yjbOAF!JEN*L3*
zz&!xBhDN6w;Nu<OQ!~KNV{ib963G`)Oc#QmVXqf1p2Jo3VwP85EMu<&*DG-Iw`{&I
zV`Sw@#w}uadUl00O321_RU43zj^IwaMzMUw!4j7d+(rlD-=9~Axemmavh(o?)(68?
z4;Im+>%n4S%k_r5)174FvXiAC5jZL@z*7zIAv9i<p}yI`M*z&8QtCj51dnk;JX0yJ
zcZUdPL+tDhF+UsPT0;0YVVt7O`I~eLiR4WVSrr_=m2H4yEVd6ihsKD)lbnu1nlaz6
zOO;)toHUb=Mut8Yk~yI<;+E>O*;pV1p5!zL1++mkN=1oF@HCVs4KKGFp@282CoV|G
zzrSg~IOUeH;?9|x=MKau`}S}QrRktcn7g<37r+L`w7^v#A8Z9hd3pU$xWpmda7xz_
z>Qr%y_Xj8_>8tD4jDyc{VDY3+ryn*r5doQ4<&^;$8si=;)<S#3L&Tl}^avCEo7cRW
zo*FB|v}P6*m}x*V#NpX8aEvB<%@p|&_oGnp!kO1;Nz&i2B{{+&BwS-NL+`y*#;NZ^
zO;~EbhIb{-yZ%W~CM>=|SUd;eVv~xpsv8T86qW8qrCWG~N$}maSc3uC>V2l{Zt?de
zC21`(B{`5fUGvJ~Oj~z^b^eIOCo3t?P!WeQZI&_bq+SBKrmEGb6`6M<xZR>U-Qiy%
z`6E;pTZ8dSCUmx2I$uq%As!hind(alS1z=uIB2oDY#~s!bQTFV_%1Qkm$X#Al0Mg_
z;u#^E>U`{-L7OMFw-%2ehD)zy>Z+XUx>fb4HCi{iOX`hWCRHf1lo}yyU9a*jl4)zJ
z6Gg<elg-D`aSY~!wI2w}GGXD)F8Hm=4#e`sV((v@-}inNf5ihw&-HlT_uky{zITv+
zI|2$%&;Wi6@;5T%Foe!Ka?ktT8)wOPC%)hJUN1?WBMHbp3+wevH`o8%``)vgg>#+s
zoTIeD6;98<HXey^!>|RXPn;fc8}I@H&WbS&dICMf;~b#g5oW3<C3Yfy;i9|hJAkJH
zETr!iI{2U^qbq0<`1eM35ITA{|K7$t)bei&x%F!e@Z)2Ue=9?tLx|y@d~Xv7<=-}D
zCZ0ZASg&Wgx&Cbq|8l*8^Z;v!&Lcl$e8y72dx|HEUW?g4=PPtB^Y+V*13Pz5a3wZV
z@lp^hcS~sKtXOD6Y}Q8XvLO=Knx{lNoW;T4qMx9mP7gmC)X1mYdippb!C@pEkdu7j
z1W8<zB|Pjw@WF);bPALV8EevSBBi7`YpCY4Lp6H^ien%B5Vp5zEGlE{c5w)KB5pu2
zLnwRiNuRa9$sGx~?_r4#c}co^ne9YC5p=Y{0GBq0L8;5w^lap4u2Y%4_D>)+iSx_f
z%%t~crO&;j%-+S<77gv^ZUlU>)Bt_Le^7G4y>R=_^e1tEeJU`^YWOtdhwqcoPh4mQ
zB|on>{Y3g4=Nhg(x;w3D>aYo32hTbO^Y&Fi4Ib>X_WMAG&d7a;4#!1gX%rXv;mDj)
zp=BKdtY`W=k?Uy~G^<i=!xSfn(Qu1IM(nG?+BIyvU#xdIHo{1A6G~)8n$aDc&O~Ji
z2&<B;^qK0TE@wH?v}@zh5PGz~boE=WCMpaO@3S4`4UiwXX#w{T)(7IVWRi?qgW)|C
zbI3d_AjpWqs_xq!H)HwjkTV;&0D;iw%^00$0%zGk_&v^qUgU%V7VAY%m!J_g_k%0w
z49o+70n2Du88`HP%AxmhtW#)8&!i%OX}e0x^ufKhOm_n&jCDqDqz@Q`t|i=#6Sv)r
zL&?1;)+IQc#q}&)0P$~>_tTgOcmb8kO3P-)9vKD6M39{h)ul8=@+<0Zq<o-Q@K4l?
z!?51kQuI%FsqO~~PUS%UizwG{L-SOJ=9kdPCDheqdc45_)^Oqml)`E~_50CbXcV+7
zGh2E9>B9a8IcjP|xBK8kAq;m?T!#p|G`A`BQ_4_=#oMr7Rp*bnLPq?+Vfs)*++%Ue
z&<lVI&X{5o{F|zd!=zG@N->2*UFe`RD2a2kN&HZH>&@hBnwRO3J*;(IAb~?RS!w+d
z5{3PnwIG_=<~95HGRn^}H6~&ckwdDQ{k;?t%iF2N_;Qt^4O>pYj3bM#z$;K#BTtiO
zsjR%X-WKf!R!`N|YVW;|gT8fDTWjzTb2Ka6)euJ@Ok>u$wHkBmiT*7zgZkS{#kJPK
zb%GFM%Lhdw3qTpZlwj2As=7CkQ^L=A<k9%@4I~Qtx7iBbHqpOz%}ePoh5cL6qdUYb
zGQ|8XW(&5?g`M{p8?JX3sK>G3NUDsYo|&83&yme2|CVso7E}QgCVafZxiFf>M1Q?^
z{VP&!8}PkB*DSp2pJw%&Hj%UJF!!#UWrxz-9p&j*w8wGNZ8`c3%QTp+6b0f~Sb;_|
z8>(`0L6rNO*t81!<r?NMNM|CUFQDeJ4~^2x=MMSgCE(zV&e3k3rj_{YS1sReM<uR<
zlRpbF$v}M5fw)$ySy283`5M`J>k37+(g8dNfU(d)^lUQS6Weqs-!jw@_)Y!x=2T5{
zv6JSX$k@_*Iq0?T|Ab`Q_dnyk2fR}uh+qyzHZU0w^zD}@`rk)w>A3I$dN7MSXqA`0
z<9Y5nv0F&hFq5hdOt`QQdoUIf*3F1^GV+V?icC4-ET@A3+aiEY_&bo8B%@c;vsHVL
z6b_HEU>M>KFHT>hPD$^qWUP!M;tuy{sDy<i)x?@3E~7wC591fJ7Ig<MG{zzg63Wul
zLv`JkrhGEqF#tcs*2<*IGe?wu$nO~;pGEL(eqWY3P8Z|%csm4|V!?t479E4#<iit!
z1Mz#21sZ07u4dZ#HaK_il6&I$3aZXbN%r59Qxa#eL)(iej+M{Cct-|0a*GJZE}7Gl
zT*(vzI~96va@0-BKPt>40)sYu6g*Xg=>t6iSE$+kKTWa$5i1B7Hq@2Ms0mRMaS(s~
z4JcrJefF@)y>f^VTw8S3e#^Z<$je<*dHi<O)ZehH<*q62a-pW^gKE*`D$2>b;RNAM
zZK)z2O@OKMchyvNT@?HjekTa{1qS?Cg3ok;-%FJ91!j<eX&}r<z|dL7O1M;^JIUWx
zL44yw{&5+zEw%;t1vlj6%%2T;#)f2$5ROI`;(d*WA{{9l;tm~dlXqbg%7Gn;P#mB<
z8%(86!1*~jezca?6~;}IPoi<A*GjDM7$?yyP4q7qJrA0qO^u7%bRrS1+D|(nl+lx>
zz_-J1!-yJuLC2kKzH!YpujlgMD8U~Y6o^-h!!!A;kORGN8MX_$&l1MisR!#CwnMEy
ztH6p;awU}rkCe)KE=w@_Vy(fmNMaCNY=u(+&gGNNrKis#2WX<x5GbnYtaW6!s)29T
z8eNBB6zx%DZD0Lv!mvb3Oc$~^jaz_6n^c-$X@|DyneMh|2iAG^V`+yX+D13^>vj#`
zpy-+D^#xd4xP4?Vao%S@Ju;CQ(f72z+G6#$py&*b)y%~kP8G&^U$TVM-{`~<ipRYV
zN~SO*)0QUV%nl91?b!Z<aJ7o%4O(r{+kW1j-5w0NL1wIOJTUY?+0)bO`$C23nu(0@
z$zRlgO!Oz!+&Yb)-MnEED?&^1IM9c-7K>hn(66fo^f4fPBn0JSY2t>{nWAOhYUTg{
z3|Rj>L<)()oS6vWTQmdZV%T)V%0<bDCxg;o&{T^|s#r}4-i&YphVTkeYTs%Ywy)ET
zMIa=l*hw;TqS1uRMgg?8)(pvjgYoy>iF!@vxs6G}2RX25gu31aP&^aK$=I;2^Z&A@
z>X!p<HDmWrV48se?k{(;y^-Q5D!U`$-_LJGa8nf=@wd4k<bnn4vm^n7;iL2d#`Gdx
zip;jL!8iiCH~|6W90=}IyG7Q`tjB1+mzci1cm}Z({T*wzpmMQXBKIB~U^7qn_cD7?
z?`>73big8uu~O36*l(5&a<7E5v4IOEMXArA#e`Svr5Fj|X9W<mtb<zkelQvIA1q2E
zyX2Yv*X6oY`X;DKf(4`e7)arA)Q-@_M`ulUTKALI)YYI{;_@c=4~1r^zn4aBncoB@
zX&jc_OVTu`R(H*X&~@1L%9N=3RX}Np%1~26RlE1T3-B)blLNbVOCU0+_4(8(l07es
zp)sDfjx!<XO&V&K(Nl6EHHl-%Nz`cJ;pPIW#dXkNKAhzv&P@jAKnLe<1rx511wm#J
z5!DZ`(vE(5dQLr;jymf~F#-Vh+CwxYWh2f{)ASJFhuq-P30~G&H?>dtRFi-UCgV)j
zU$3^x^=8DXa@(f-`UUM4{OzbWXy(&FcbC`WsUB)vJ$DmeB!^{XY9}-~@bAA=*>%3f
zpEc^MaN1I|Y)f?3=9y9dMkDep0%Z#WQ+SyKi$VPs^cM*9H_E7+wGhQf5mcFGcbRMs
zq3EKPw#7VIn=#LT1i+HvQ!Y}f9$afH@pzlGSa@eVhqHyME=6A70WgTz23KZ9?(j$^
zycprAcK}yp0*AVa68x0;pa-;|Z9sCpE$QkvR_Q8m=vvK<B_%?ZZ-pn+s3L?XhB%%S
z5}nv$C-zWKVs&+j35PmSze5xl4Yqn@`$7vnMjVI2#DlG6TP&LuX!3nRC!m|%2*)W<
z6A*2PJ;JVqUL!$i_ASVUH-qhGcf}3=+UDR$d^%GSjAjS0OCem5i2&%XSRTA6KtCdA
zqQ7m;j`U5yogcc+;=ZhB++5`(DllI1I7ak8W-@pA9QuGPP^3spij7mhNnloPf}WUK
zyISBxv5dr)n<$po!&R?O^wxeAt8wyn-`)Cly0>;ZdI^M`?Tu6-3^_>3CD`qQKDM88
z<@133oFSh{`+2c^9>jnYnpL_zNd1Ie)h9t&K>L~y`f(LSbJHZ1o6UDxxj#vBMk;G?
z4$egD+2>M|8NV$OW_s^!u^Pr=qN(Z$(5C<0rae3;0XsG8Xgx;(pcZislud8Qi`KLA
zRT!IxGeU5s(@{ZK-Si7an@(daPo98@j*h57TEL>N;aj-91kFx_MoSSN{67?3X6_6q
zwk2e^fXeZt&rq^h;GSS?+L&M;QG;*bUm%G}#)uPAv4!3iD>>U7O`-;geO-w8V_)%U
z72WspyV1Xk*QoeY<D@>S8lx@AHh5Yira-)2L-87|=fE$0iRR#p;5lpoTq%d^4iFW}
zIy2<{$sM-B&tR8CEhge7qu0}*L^C6Gqf7rKDmS~8&?XKBb>7-_D5#P!92U*D+D3}4
z5@esN0C<iDcuG0t*@iA@_w@RUv^|v!hnfgC!wF(W&e%o91028;Q<2lIyQzr#0n#a#
zJ>o@L&UWk-OPlLhSJlDg7H`BXx=3_`ji!Bm0bG%2Atde&iECx9(b6#%;p^CKj_#t-
zaef|-K1y#4Iaz9Ds^n};5V)6%(w)smcIk`&z_?E78|=<R;2{>ka9wu{p7d0v;@m+L
zeJhd@%FGS1!Ne6vJEHk9VsYQJJLq9eAccDnCPBg%IhYW7Rb1jX!UiW^7#gqm@4wA<
z|AnauSeMM|rG4n7J2B$zzyyz)2U805Iajw@sN(lfc6zsGzM(r4$))_}nw3n|kQ_^7
z8kF<|)dVQ!VMj<0F~BTE9ZQIK;gQiw**|YJlx0Yo8GmrNrv@^+?jTJe0^tF}Ju@e~
z9{MW+I*ORAY5Z*z=^bO_(J)dTaUUMoR2eFdcrhM}0<nS-BZbF)HTBkniR5T;GUu&5
z9_<mA4FMKVo<JfpH}iT+=5?ug#lc<Yt<*-xBQ<#4$yu?}0nc4Q)-;ho*xh1LRY*-R
z6SS;2@daWHq%jcR!Q=oTZ8M^KVzY#~J3e3$g&xF_tiVJ8!R<3HGI2N*QE0PU(D32Y
zR8f&5G*hnCPoI3^A|X8U6bKG(@uA1vqLDd-!xkkTK-C9giR*?WUZU7CB8=1#<4dbh
zI2d7TB0gji(I91v#R(WtrkEb~J`5I9+eI^JDr|iLC_4{ft>u}w_DY9{0B@rc5;Oyk
zQZZAhxLv8><724kM=Cz2R4AqfNeo6wVKtvfDKMpeg?h>&PltVXaHycfTXu2!)O*Pr
zu%w>i7&;4CG^?z^g*N{H$0=w<C(4LKu}1T)^hjGedUj_qyIjsmiEvRD8MP3H4_UF8
zjKc6#gZ7xpRd2@>C)&i~TB<X@gthr55t_B9D+0Nj@WVFVTcr{qn`e=wOk~CVbcbNW
zSk8Q#rEJjhe!AzfQXA>eEr&YEG?6@+b&8{V=CiMU)|=1Hm7oWg+yzVUTM)chWtfLw
zYXE`rkW_~<cq+#2TV=)0_WgZd%T!)W)C4a0Vv1r@7I+Vi7ruTzH4IM1RT{;F-Zbkz
ztXa$4YuiUtR?VucggMb2(k!A4%HKGp43>seC$Kau!6R2$!BiNbqA+^WFdr<%=s(W%
zkUwI}C=zBkMJBH-$Z|TAjS4c9lQ^MB2qKEa$pc5{5#|Xlc9aMSb}5m$@)>Rt4H&#Z
zUkZYsH?^=^YXP;<phQVl?hOMk_Mi+QG!Tu{0io#~^c}<wq2A00z;XI%1>nQw5-VlM
zsg-AzxNF6%(`R}$@iaQC9d(I*2t6HpIcA5`%9)PGS>1<8thIWeF}^HAUx>{g3_Haf
z04)Y1c;0a1@jg%g@@5Nel<^X&vj;%v6e;vmi{vK|=<X|(K3QR9KJg)~V<>(yZY#&S
zhih};Hl)Rtg|62S^r;N!#o3@#jk(6Ynn|W)yZs+=j3;Hg0lQdr{*Tfyox@2|tZo>S
z2b5qJ)@(ki%co~ajF>}b*4s2sAPuJ5^sy*7PR947{-O5tXKYA;Vzr-ZG(o?bs*n1I
zzLAEj7He5SM(t+5=x@)ej4{F&wNGZGS>~iY6L;ubK^XqT>t)|JR(Js#aP-y10q@G@
z<ay;sy8iCH0Ty9{XcYW<e)TM-67!)}lU^?*YL*ENv%n5F*6?u8X~rDtdjDY<JPmyN
zJhh2J!Xz+y(kmQfS(Zz(vqgaH94tO2=Q0s&&4||lGa2WA6**v}UpDbf>f*wSg`h#4
zWn#elT^U;l?g6yV8fId}w>3e6KK@o$;TNY~_*?yD{N@F3#&3RbdU~NDO_Kis;$^6V
zw3QYqU4zgaS@MfvXEg{g#Ue<2Peb=Rv4!7uVKAvZ^{&-c`j^|n2@$NZxx)@?Y<V;+
zl}G#*JZO!L2d%O3aO+6%FGo)Vsv;ZO@k#~9hc=)i>|CPaa}5!D7!e;5KF4WbeHO_c
zFi*#r$S-Fi-(4t?oMkPLQ1~~7`q4GPce$Jt?;*>WX4$B;@S%$&I4>klu0X)BOdfYh
z9-$q2MFvFLlm0<{xJe2n3t4?l&M%`U)|{93mNQ)}qOh)<)t6d);45dd#A1GX-U6pk
zKbKGp>K)XBWQ|NQU_&7rSs*UHWOnwakSVf5Ko%9J1?dxQ@v!inoessH<O{Z&cuUgF
z8Im5F?~pXcko3+MZE4qHc`SoEha{oJ8F4QbYBq!8>*P`*(5aRJ<IW_-iR66_){(%v
zPA@&MKwbm%MF*&lW=)BVH4v=~6DXPLAOWB1^xngDz6fPC!3%3}8jk|&3BhX(Ul?SZ
zcI?>1)N)&ucF)g3_;G`7atZ3dEM4AxhEn?$Mj2Y;U!hI6dj04X!5nssQE^`ns#+y~
zO76x}72Ev|wzGjvFAwOuwpf|aRgJ0iy<8|si03f8cv26`XFW0DU-~Qc5P;Y5g`%>B
ziAjW!gEz6?r#{Cp1S6;LV98~$NeuRzYlfM%0Hqeog<7~kJR<mY==lL`7Q*5=1P2R=
zW1?bSPcyo(kco&55<#wd*K?O3bvd<3LcA}MY*%^m8Dq5rrmkU~Gs}%puJBSDz7<Ga
z;p1)iHiU<pw%|8EG%Vaiu>8<T>MmwP4f4c#b}gSVL0u<>ibV)lCpW$+XkFwDgt#(z
z^)7V5auu9qhh=vw0ky@ochbiP*+E^ADIM@M3sfSxA1WnP3S*y^$4F|CD~lkqK*!ck
zJWMJX%GKaSfYNMmz!nHx_-gqXFKomtnvLiR46{@$-{wThUbIrGQoR#Yd1Sl|P#<It
zGAV>vxRI`mKC77jaf)K@SZpyzfjM(^PKukyT4-WV)#B4tsE4tGTo?H&idxeozuvo>
z0Oo?I5{MWf6b?tu2suIAYgW0-{!Qo*SJ~_MiMy-LQVOqfD11*ydJsrRQW{P>StsJa
zM_zQfOI?sa<i*lZ_#iHbND5E$F+Bz!h8TXWc{=qN5ISMo5tc>Z2T+zS0^j3jyzm4=
z;1d|_Xyu5Vy>nAw8r}|%kwA6u#1_ulo{9}CSkd-G=@VMxqXn_O)ra)L*6b$QS&RP_
z9OK)FFq{Rr7-5-OOwU(}IN!~1Cq546?bxP`9-(JQ(v4xX(I_rsnT+}nWfR@S8SBsf
z(WBZ}^R*sT#zEk=A}nXTZ6mtx7GZNM<1u4!yL`F&3ygAG5n~WjqJx+=!bf*VvS@=0
zDWY-WbPrpw4wZ-;Kp;iOQPw9w{k2PStHhbygAExcT=3b3<O&y}V-d|fk=*>gY?<+f
z92+zlEluU($80?Dh7RUr<7KY#GE$+jCN+YO%(z7Y<3kn=XEPA!7jKaM3gZ?Q1UPlv
zBBjE(#bQn*e~uQUIgjrx=j*%WYzGOSmJDUwa>w;%kdQ&W)It3RGBT#L>$t^L40K!k
za*takfqICG4*H_SGI)^`I(Ts<&J11z2fOk>eBdK8RuH=0nk#f+L)Kw-E83(KIUVSg
zsO*u;RuoR?q2S0UgH@`737ITH2D4Tmeu-SOCQ7%s_gP`0lY8d}tPLn`uxsU{r_t2n
z4Ue$SVH7XU2e{6Sm_*X+6ksJ{w#o9PztP;ZK@SNuD3vAMMmSw2;W)U;&`qA;MX)=7
zha<Sa^e1WB)Fl_hY|^r%KZ#JR2Iu(t^=~q6V{(gm;JTb*mY|qzw4~#?0eUgYX;+{D
z?f__O3cG&s4gjYL_LIdlmZ*$v2HC)sNPZi8v3jbL+v*ZD5Y1nu_U|HE8af7mGy`|Q
z-koQ`erdp-$Cy#NNzWQ;2~F1tLo-;1aGjjD@pKetJS%N>FhpG$^+QI&);$ykMe+|K
zA*)+6VGj#pF8afs9>01qh?L+;i&(C~k)SUFn&&R%Y#Iyx83%^T^UZ2U)}y?A;o6*v
z@Hq<>z;go-XBa4J0ef$@oT=AxN$6j}6f%$$NWfzjEWMmT4)=C_MYtz0JCO+H6f`m;
z_d1K$I>{G1$<MJE*9$c5JCzxN;t~h02XoE}6lDu!Y7=B?BV?*RN2U_~=THRL>ooHr
zQZ6FZ2pQUhPwbXc!uW~3E*#Z$KDkn|1@pbzWehHQbM#)(&6FVI30-}Y<<kRHj|hE!
zE^|TD^Vrd|U{7N^7mZ_6lyh%Qs399OA*TW!ZOcJD!$EziqTVDok&Xd|O|c?Mck#DA
z{AZLRwUJxORZdE;ld{kfg>_6JY7{a-E9!3zG7cadq9aR2%{`w%;Zm89`~kM0F#3%8
zU$7wu5Q1Xu5sNc{dC7+G=!qu#nG?jq+Y<=={4__FG$U@8f>SEwyYxoG)AS5Yz~d%P
z?D<YCZlrhtJBa6C+91wndN^p}ukS@OT`~J;4PpRDuJa#3?n&0<zp=w5_NzxqLjz#H
zdO`4$_`NXG3?9OeLevemkil_JmTE7NriL{zYkdhj`@OKUr~XP}Clv#HK4}pnM&FX<
zGW1m7Y;%-6gBf?mgr-HSGzrZurl;ch{=~sry(=ssDI<<adml09k_S&xsLLIwphcE-
zC6?_JXrL+H!!SMeC$ZOyhiWfS<nmW1_H86cgb`U{2FL^@MLJ0a3ol2lnfdWzLq!WZ
zan;d(p>Rqu|941zkaM(J7*9gC$ZE?MVfe%vD|c{zU2&5bOPySyNb=w-lD#Pl6A<Tn
zEpWa^CmLu|v#@8%+LuAX&maIas0-47hNy7G8K+!$*9*<`HnUhoQTA14Z$h#&1d26S
z8rAH+_bb|2=RaIib=Vg?6~Fz0L-E@`cp`p}4?@-s4+tKI-+|e;EM?tIgS|%G{N>e&
zx+p#qyH8SDJ)YS~mi!E1r~w)x$g$4nn-O>`+71E}HsJ#b#CAuZNoR&G$zc5e`@XqY
zmuZ3rY=Zv5`|Rt$(C+kIuC+p2(sS1iM2RL;8(Zf>k%6od`D}}^OZelAXR*vCzbpVh
z-yBYkkxQA7r!<?{mPGXgB4N7`W(sanq2Noj;NQ<(V`pP+JEj3j2P(D|l4k}e{B#Xa
z_}L7qfGd%#zK&{A-=D&!RGt4X_Vc^)`PZ7Nzldu2>jlAKHC2DTFf&A%hP2vBUWFtx
z4krLOjK$%7sv00_&I~AK3%WmJnD}SSK{~D9h^1dv5DvdlbGJgjWWzq%9TvlM(emA3
zZ|e?wAz)!Vx~}RFr$=J<K5wYD$$c1uq=zsDWUuYpSS*ETl%6SPc)WF1j&@cVhjfd*
zpe|A%xwQ35kR@-H%95un4NQ4L8*pD)*L@@Dt2p$E?$=yjrT5Qthr0J`Zm5BxKD$F*
z^o|?qJrWx04)t%D=h+-vdVzW#oXpVm?Ovb`!q$KTbLoE4xA&CY$*8RiNLf!H=?*u@
z`8|Ow`=J}ei(cjJep(NIo6}pRu?;+3?@l)s(kWVL8K(OgqIiZ!g7Z+PnP62BSyej5
zstDVuA|*P}A&o+eNPQibR-E2}#~U6plwJ->)1O7@p#A9sOnfU!zVBbbu__IB<a6+q
z+=X-dV_bL8$2yNTb+S=JcXY_3At{e|J03ZsPs|_{G?82kY?z@JLG@t6S3={FVt(nI
z{4*Gnz_Nr$5HBcWnt=sNB+o)6Mk6pQC!}H${L&;$Z*?=NHZa-K&N(Pv78}_zl7@9v
zvezxFo5j_WEY>ZQ$V74gXiUSQgz_ht&8~N5bZ1v_hF!gLW+w0)jWYwUL41Y@8;^kr
z*8^qGOt>0Ux|rb9D7hKkA*_vR?cjbS)CCNZSQk0e#~R#~U}=-l!knw69<>4+L_%Ua
zvZ_0gycz2Q5WcKMfu{q#69!T9h@^ZxWsn^KHS&=~+U3VU+Ru3?HHWlQa!K=OwPtvB
z?CiPVs;tWVWe=R#dU*~fT-g~;<m7j>LSK`e;SD`xI58{3Dc4RZn=*$d|JXkEpyyy$
zj(Jc?5q5n`remDv`W}N|=&Ff<SmDe$)b#jYT7s`j>{ki8uSC~NVshi4VY0x+nensp
z)5lHWf;W;mk-iMh&e?99f3jaa;$$-798R1v>viEQ&fwf^u?U^tuwOmmWHOjeVOcp{
z_)|BTita)bw9Fz9beG$&?&uU%UaN6%?T>cMjHYHr{}_nA!9HThWmE$gC-H0?S0Oos
zLhcD>i(R1-jumhZg+|OpB^17Pjhj1r?N?UTZGlm(fdt1)z%fm5M5oCF8mj>>_`WdZ
z#wj;VxjAbDs^blg7^vw$L#D7xZ5~qC8|+tBjy8$d*qg$#fcyPsFz3=g9Gb)mPZT_5
z=yi(mH5gwv{hXWkr~V642&sFa2%rD&-~Z!4j~qbHAe#}`3zzuS!3E3aEiIp4F>n6z
z<*OEY@I7zYiup^*KPT_*IN#}$eOHyuoJklHURl0+*;mS40gEfk%RQl$Us}29wv|4?
z;|tzVQSMn43a(nbqI`u5|5C}na@pq=EDNrlS5aO$Z{gDUD_52;_f4Mc8}D1Q#@9>S
zc^7&r7kC!VU-_A!Z}F;%@|8qXS^njD3s<eE@Le+5cb@O8vwTj#q{+T<9vG*1JX^ka
zr0W3w&czP=y)Z9y|3ysL(|G1#gWVm+_vaDz2^gsH{pKFx??l{w{7phUO=bsG9O;^e
zzt=FObpP!%VF&TN_{-UGg!5opb_4$S{_P&(TM%~&;v)E4Fn^J6;i^UDzUAdBmjsut
zW*Pa9HA@`^6AuqoIXtJ~?^66#<ByfkO&ppk@Om<y|LOuj7XWA*V5MW^$dO+>=MrL{
zw;;55ae3t^-zAs$Mvgt-caCrAIhU~7zp(J8QKNik`9vJ%Em$#s^_RYoiMnYN>k;3?
z0Z`;?|4{}pF6+X!e;3Y0biIYY7W}QlUmpK3hRTD5OCEN>^DxiIYsX(R{%Sy7UQuzs
z{675$4fTEU#N!JJ2b}b&(?^aOb;c=!2Oih=gdxMu{Ooz-C!9Ze_@__ye&W;-XOF#j
z;<$6pI_)!`yI|7f3(vjil1p>`k%dc9z7_LV3M-9RtthWtQtn%{&^LeOBH#Rlp7Pr(
z$`=O97x`Aqul!PZrH9F;Uo(S@*Z0rQQ8||ge#~F6yj-IKb9`uDi%hC%SI=@%O(`vv
zciUcE$Y)<Y8}zKGShcczWe{(nl|jMAa3|AgLb`-calHe^z+NV>t5z<*!#DmMG&9f2
zRfZNkmMvKt^o;S{wro*wsVBH<m2dfc6k1aDlyg90u9e?8pC_i-SI^MLWfD03s+k$m
z@NRM-M{Ha4u&MjdAkl;wPAOU~Zxj+M#n2TMp`cI2&bNHo3J~u6qg-PH)&t8H4>w>a
z<Lsv~U-Qsh>3IAN#2@8;5dKcW-zV?~!vkptXW}^;e`E1C5r5P0hf#=UA^zBa!uWd>
ze?Q0H+xW{@HHo)l`$us1AIuv(?!P|xcK@*~?mw2x{fE!2f5c6E#9{eB9<cl@H_QA<
z{GE<Jm;`#J;BP+u*5R)Oe|dR$$6p?h<N-+@kmP}pd0=AR0Q_OCB@fFmc|QC>Yvz^U
z?-oz5|A0!$Ys+ZMX3J#D!n(5cW$Vn=o2@%rf2>20B7ZCs|Li}C&7x(igPyM}U$y`Z
zqp~to5rp<faK-%9R%%411i~~uh-(EptMVWcFVv<)AxF^aWviqEF&Py7f9zks|I7dS
z_VUlNrSN0^v3@F6E<w{?q8#li6Pcu(@E;oYyp`-3R-bdpvK344j*h-t;OO(9S%SXu
zm8(Kamij7|-Cn+YwP)GNTjwudw#c`5+43N?sr^(1Cb&kQN6doFqsZ|&)^k40#jeL+
z4gQ|R-v{`cR@&9I1b<bZ@9KI8e}Bc_<ZHUR9>?F<*;rD--_$u>T`%BoURhVyhxmKy
z+ODp9uERA=bGy16lF!d7z&MX7mlHqEvm&%SxU6D%xo<{b`ZXe%d=XuF-nr+WJMP@^
z=bm>V)w7S9TGgQpn#fBT)2t{DE?u=qVzlr+SIDxJ;KuU#3(IZbm~(_-I{fl1URH@_
zL2gR+mTRRm=lDIrYp$B@o4*+8eKV#{nWNte$``MyEcXcjDG(s`Ir4JbvfxtR{N)u(
z=Tr9!5Q@5L@uK-b2@yO@mOHBR-0GX;JO2VGe)a(vrH$bz&2|XmrM{=mDwRU=X*)%}
z<Ii`^Ousy@DD_`{Zs}E*3*f57i_xa7C`izPiVAshI0A+K*f%h~=;iNOgm3L7&ZgOS
z4Dl>3c(!7`Dwc}*%gckoa!+u{d>xWP2xrfkI%8htk_A%C(%I8Jw^gn}E4j72QuL30
z+3~M-_o0=mLlqUPDmm<+a4agXKu2vLS1n&vY4fy7aCXfH<2<D^rp=M^Lr}^kx65Z-
z=3!keTwXrE67sYNl%coBi02OZLc?0VynM<0<?`iQw$fJ#MQVmCGdLCSO)p=)uyR>N
za8;#e#WHA2P`*$o&|!|PD#3l`rPoZEK4Z#N)BOECc)xtAK24Yj62jOTF1z}gSySdr
z9(z9Je_rMCax#fCh)mfHXV1CbmlaHb!;s|;NS|l)T%RZx{8;&3R8DFz#K1gZ`LdOE
zjO<x4|8^hLNT}R*iSNP-E*N`3W=5jZnB}YHFVZ)ezRZ&ujm7Tq%$v7r<sG-r%S?e}
z+BEOB%J~(T!e9)+xzRi#nTN6Cyoyz;gB6vl7NVb-Hy%YiTKstz5+LWF;#;_CB}64S
z&+x(p(^EV~SI$3;|6)b?l6f5G&Qrd4uDA?RF=f#z@ETR*KwJ8yGRi5P<*qos77sen
zQ`EQLas3OAFBs5gVEzet9BIL@8BKCv|4;Qd^q@lymd`^+pp(gYmGf^CFjIbNwGaS;
zmGf7wu9#n0zH;Fm9~ZBsQv8^eEUQ?G!Lh-&dg-#oL3BAQ%NHpc6V4_m6^hUr%y6ow
z;pI|HbS_u04uqAI<ek!IVkZVCZy<2Mc}KbiV}Nq-e9YzWJdEcYJR=tz>7qIQ``EUs
z$Mb9Bk92Lv^XC&V@5A#YJP+Y{%f(2Kfz6PKN4m!0IRno*cs`705YIp0xdG1;CLulJ
z@!XH+VmuGwxdG3?7!W;$=Qupy#B&awr%y(DJXhkm0ngvzxgF0X*wfmN=TGoFglFGN
zksbr7Wq6LmvkuQWcs`705YN}~+<<3zD$?UQdK%K>na1-Fo{wVPX)p$0UM#SU!*dOm
zJLll}S1juW@r+|hd;^}(<GCHr8CX2ukLUks@5{rhDzbey34^v=Kn0p1bRPs10YiWw
zs3>8EmLWp40RuaS%#z6rKw_j3L~+7g#TFDXDk@%4v4IQPu`epN6L!-AiW+QM5V%fY
zi#+-@H}!t2YOOlE4(H&#-+SNti~W7cI{WuqYt^u8*RHBvyQ&x7BpioqHWBt{yxj|#
z3ON|>=Q1GoLsmlGH5vAhsTf|~1bIt3>>=;D4)%mkg*_U4e}zniylEQjAzR@^OeN$z
z$Q6)(g4_go^YyTY`~vbgq=IbU#`BW!3NaOO1Y`ze9%LotM7$(j0l5ou6XdAru!n3r
z1NM;PFdd*hiu7HOsgQ3$W<Vy~2z$t(kSiebAvZy8!~2ijkVhepLsnwmaC@|&GYeo3
z`2@xrG9bUfm_a3E8pa1!KwgD0f=!UGppU;BvaTHVkg4d`w?`xXDacgFym_#P{Bb_)
zAv14<J>-Lsn;;k8*`)SD4tuXjorK&1+35mYxA&XWP{=1fX;RZ6TYlQ47C?4wY*H&B
zy#r0E0dn!7Ce;X8b)-q1f^2uZNhMwAc?CbB{6pUPznWAg<T}V&$cyoIVm0Khf509x
z<)5&J?1gt6ryw7NOlt3W?OQ4}402f~r3xV1b;dks$TY}xkX4ZHK&nfX`UY}UAEjD%
zKwqt|QvD$R067tI2-Z(4g4_ssFJxQH;aLx<Qk2>O*=qpoA+sS{cl5k3A^Snj90+^J
z`Ga5&nVbrH!Uw}1vj0%nL;mq9*hBvLYHah0j^Yc~D3t>F?Qo^iA+JwUstmGt1lGob
zd;)R<<eMXv+6lRIlv2ka>qf&K{idmSH=F`_2V^?r7m#I;)5pRdG7XFDZGt@CS86xp
z$SkFfL)L_qYLAZFudw=kDr6Wk19AamCFEwv6_9_2+yvP@5B88NE0sD4`RqKUI(6~9
zZurh}DC8u_>5xYt7eG!}pwvpp9gtfg7gj5^7xG2OlaO6%V2@7nosdHzb8dk><j7js
zL;e@WURFY;JfKtq<aWqL$l(v+x<kH(c2ZK3=RNr_t~=!8^-5(zehOI&x$_C7RzoiR
zH`o&n*$6omFNse<?t=_<^Smq9E0qS>@nxm5AjfP}Y7t}=WIbftO-gNp91gi3vi)YP
z>y1fw-WH{LLT-f|4SDnxyoZCl>NTZqhy2@irPe}LzJ)eDWcT-!ItaPtec1mJ*Bi1Y
z<Q&Y}8x8q3WDaD_2e5~n^=H^a_SlPZ3;EQiN*#f``!jrZ5yCjbKBam?ehxVvvgdx3
zd&q^5%OD^B0_C1~$af&`Iskjf4Up$_M?HKH_K<IU342KI5bPo6ABH{TF35F|la9b1
zvde$M9<mnloQp8F@fGYLw?dAGoc1;BA>V*p207>(*h3D)S_nHKABQ{!iCa$}&1$B4
z%@(w4*0pu3bLyHQ{y=eAyknO(sr@+j+O!+nrqi$5o;UxTMc(i(SN0jy6V}FlG~~Lz
zO$ybQJ;-k+{_272rHPmcL001L{NyH8LVm}zX?I7$sDEiWW=UdVRx^a|d8D%ve>e7T
zQfq=b<Dqk((V@6C;BQY#lNuP*NxW1m5Z{Qu!+4&fT8@M>RtKTeb_(!E;Fkyagr!=6
z>}k3E(RluEcKG#{9|ryt@Toz5Zp42k_;11A5abgkS^HY>Jq9(YYl3`L#C|pS5#R>|
z`GN@F0Dda?tAc!agl`023?8>hB>fo?{uKC|z$XX!+z6kPfcobQ_QSweoxwg6{1WgZ
zgZ`@{{%gTM4SrIPPZ+HgDF0W3{}B9Kho58l2Jqcd<6pl<@b`e9=-7|4_NTya0iWUU
z*IGUagIQmLpX2Z|EI$nVWrLe&_&k!oH)vXyuT1d$z~k`{;U`D<TJSx<UmfHtBm8Rc
zY2cqlJnemwxF&%#D1REjzdfW$tqa;GJgyxO-w1vR+Ns+dev9Q#fj<gf&jgbDF!3dO
z|0H1$@6IdH?se?5t^F|YyTBKt97W=nW9>7+htPhlaQK@nUkknh?btPr|A(yq)!@Ge
zAGiF2Pe8l(9>;#MwQmGp48GCfcUk@v_)F0qj>jiq@bXLW@%#@1pPtsFo^$-yTmPBh
zKLP)|!#`>HTJSj|;@htV|1J1<_6^_{pdC-U8AtN}8k@h3;2%f3o+j2r_*Rxb1^)ig
z@xxC-pQsc11M$MAO^>L*5HEi+!M8y_;xQ-vD<bI!e-HRlhtIS8YVe<epYHHeEZ+eB
z0`yOwa`;Cq-w6I8@HacWsX*!eI0gO?_;~eW68duo&cIXua6kB7LI0ULcys@Q|MCoc
zE%>j%9}3zh?6dJ-4SoaqU3WVCLd!RR|2g_$We%Tj`9|>h;CDFuo0dNX{zCNMhC1b=
zzbzk0coz4)Hmd%{bDF9s%D-XYCxIUp^bfv-`AqPI;N#VAwczgne|gZpSVvFi-)iuy
z!S@gHrg)h85B&4sXP_KM%6EDT@<8!x1b-0y%Xs#u!2bY#sbgPj?UT+$yB+<;BToMO
z)#lGI@FDac$2j%#Fk3%of**ta<FyVy((<+7%QEr&ar|Fv{jUa3Uyb}TnEr&n>kOjw
zHGu!k>?XC)@n2>AH-g`Xe(A@K{hzG;Dex;W^>MAkKWh0Tj0beWl-_vv=P>a3;NNt@
zf7OPc3I1ofP3nFpeRtUO)q=0iYf|}6{?E4gzZ(3uxlL+FFn(0Ha2~>61Ne`@A4NLs
z^`|!C=jYlq?1#>iRZZ&EkpZ2=mq(HU<srQ=9JaMd-9o?R8JJ)iQN)M9KMejYhi|a{
z)5!i6)BzYfu=a^bZNz^T_z`b6sa(h2R1)NW5%@d6cX0Bswa&v3_<HcSyxXL{L|tY5
zQyO=-v~k!@aoE|U7UOwtbrP!+B@PF{ui4e4esHeCSN1wIZ;f%3J(zC*y@>q-=ZSq!
z@Zao5J?z*|vG$|E_xu9wASVqSZ8^vR-{WAD>JInT|8yOFeGP6Wd+-Z`e1d5RQy#4a
zzZm=rPWWqW_}js^J=COVWm)S#F~jl)!B0Hgq<*A=BiA_bn{y<6%`tA&{aBNl=Y(%6
zA_~7J`1#<g9sgz8e{b-k!SDPY<1;j_BL36wPh8&oz83ekT+%A>#tU>}$yXV4J7J7u
z8Gc*cgx^@c4*VkUDM8*;={m1AfTy*h2M75glb0c2JHbB<{%-1wNnEJBRJXHX&^Xz7
z9h7<`=p*4@E#Dqxc`5jK*CQ4D0r1Z{_G_$t2KbvgDpl?9WtOi5|0eiahp({w3h=-D
zImQnhewyVsfxi*_F{ivAw&i^{_`Y40x;SV*OPlLFJPv*U_;~%U_HEH_2ERCHpI|yJ
zbPZF%zYM<0;mt)LJ_CHqB&E7J<)ytXkCosPyD7EBv47E~Zw2^A!1r_PdszET;Gg-0
zQhS{HZHK+zc7wmMyHXE3`LkT-PY7Wi2mfJDrOpl7Q~&#)ItZOdolt(ZT&&dRP8|2x
zI1UA0bqU65oH!1#ahwkRq23sSaO{0+zX1F`@SPm{w$^?n_&pdKjMul`3jROAU*y<#
zw)T6$f89r^H=OWavEiQte_vmv&U5S&tbHepr7q|f-+n0gE*Oi97r*J?lflO;!wbOQ
z1U^=s6GEI<g5L)I2*y;M`}pGvZ5kS&b34W(|AKyu)k%D(IVn&%Yy>|T<BkKIH1@V>
zJOzI2IE?o>e4zb@`fT=ij2Ail+tz*<_%^>%ar?KK;9H!5uLXZ<0^YkLt~UO`{xA5>
zu#d+#fWI7k|6n;zyx2ZF8^Mp6sMLJi@76!ng?ak%tn-K_2(84JY+J`iOM5Scz~7k}
z`#Mn`r-9!GJ|&ojKz*GB{#)>m2Kj^s>@{2jzF?M8VTU&lNAh0}{yFeV9KOcdZv)?Y
zwo<=y_~$IYAN(5d@#04VfG>hCa_qCMeF*&j24C#(IhIcYKMrHr`y76^<+H#y&x&7<
zECT-q_}@Ea_;<Pthv2gw{H$Ee$v|0kuHi-J+c366rwHTUE1WpoWBG&N_k+L1xyI%8
z8aK!LgR3wOzR)S>Rkob>1iuR7;$J%c8?FD*;Ah{0IgL*H;<#;J<dFZ{v8++h-ZU|F
z8N40*4d71%`Gjw+|Fz)zEmdl><A1&Nza9MR_bJS@!6DE5go)PvAovsD7dU*W=0m`m
zcl5l;%kgP+kjL{N;a07p<JcQIo1rr+sFRRk!x#_#@8D_7#l|6Vm#vEmz`yul?0c2U
z`7-dYJruv3t^@x8_;_uWcfgPPZEX7x{2u}TYw&yU+s2R5_;w_Xtuat{&ck>g<dlO0
zwjA^Wzk4O#p9Fm*ykzrWBKV?JN)2(!S+Xr>Mc|h_iuY2^b9t0)x7-W<r8P=DgMPV<
zW8!12C;-Z%_236Tqtt^=_;=gzcYt39{sre6thLwR8?t|1soy&3GXv`6zjY_{r`M~v
z{qcU_Uk6|1gdb`5Oa$NY1r@iiQw07-@EaZbf3xww7yNhN4><ArROf#PHtWH^{E||C
z4BiJ+pKsQ;g3hCz(3!Rs?~I&lFyCH-W8gQws?=d84xigNw8Oi!n&0E|E+-C)Y#B%a
zf1p9B_Z|B;tbIE8<*z9<)(QV=8-5x1P5+_POvnB@YhMTcJMi5d`%cz=1Nft_E1Iqy
zDI@c=xk*3xHgBl7V|K^DuL6Hb(0+Erz8&5L)`O4NA5H=PPw)>r`Lo>SPdfPW?eW{z
zW#H?;&v)!gtbHB$!+1xR8H`^-r0u@}e2+gWRpanC+x*)J{#NiGIQ(|Y9|Pa#Z54M+
zzg<_{!{DEC>?31}Dd3NSU*+(1)_*$qf_LIS@5{g+0AK3ZN5(wszz=*^#T>Kj37ZYz
zmw?v`F-cv2?efI?n%~=ENz25qDI@7#-V42%@5g^`p9KFb_#VM{%+$#s<m_=a2hQfe
z*&H~V17~yKYz~~wfwMVqHV4k;!2g3BsG~+aj&zpP4Wgqjy#vJ|=Y#niudd7yG6Jt|
z^s#rJ(L{GnAB!%d4x{<bktB7I=|Fc!AIq4hz5yM=|H!X*d()T%4i45EO78-3&}&CJ
zXz6}B@H$l=RjkNr9=g@~U^kd3YT{%5V_qWvz)+k%Xo!Oj3`yvN<_6Otcs-5x;gEP9
zVS9SjONWHl#9gU0)<@4scdaB`d_JttU&MGn9sl5S3=RK(JtQ3xsJ*TXaP)-sB%cJ3
z^vbzhM>+rR$~rCw(fTPNgQT%cXPL#ajO8Mhbu8;yZeY2M<xZCSSsr7lKTP#7AG|yM
z;RvxzVVTA<on;owGM0;2*0HQ-xq;<2mOEMQXL*dJH$X~;2|xP(2RmA)(YGSWuO7kc
zL3}gP%xfX{0O`v85p5^u&E!WM`BVIK9HI2d<3ia5_^c{K-|gwe6oT#)PH3!m0{+g&
zA0=%B{%*tHPx*(6Jw%ssgl_L(I;~RFk4yU)U>3`bEJf{tZ;jU^mg7D%=V_epSwE5g
zVt+B)kL7x95!<B<a<5<3KyzNtQsOag)Tk>%y|15x59g~w0|q1yOisCMNR>Vvcqs#-
z8%t8Gn|t3=RyzmXw+UVwZ@(TmiBR;4iSTw@uM5+iajEYGAA%pvP&*&vc$-`@-=jD4
zI(SlFi~ddQN1h*o&(nU|ds6=k{t$k|ivJT@AGOVX6CzjZdUxGs*n#gH#-+Y`PwRK_
z&f$C){8QkR-c_7lJ(nBUKiGd7Uq3xJ78uPzr1Z9n^3xqS`DvwJ*5h53iIz8l^*crB
zr?dXkdH@q+Wvox(lb?@!BQP9z#jTGej2~irIpYs9UU{hjHZ%Sl<27RpaES5O7?<*&
z%J`ocm;2!c#{bH=+#h<b0l1^Uo8b%nG`{XqueU%krucu)_tOCO(~<Fu`WoOW#(My7
z>EY!bA97u;Wc?b}PiB5J<Lemj#`txNzZIpQ$M_G7k7WH?#s~K^z$C^WV0<y-a~Y?d
z3MpORGA{W~yQLC-%VkD!BJ1yD{B6cF82^ItuAHDbj2{P1<toJGM9On#G(;$WBwqx-
zn(@|bFSrk!;&Y7s>p9oZDP?>>9xfaX{T>x^A>+T#H8|aeblk`I0|l-=&E+Ql=a(5=
zzt4pJ^Nja+%GIZZJ4t^q?TCRxzq5gSm+_5yQXSqaY8K<Yj32Bs`ubfVxWkOkc+&NM
zg7H4}2G{S<q2B@-LgBv9+29M=e+R}dWc(4vdoe!r&qjYH<Fv~y`FVhG{XPTSD8}dg
z-stDD{#3?q{)55wJ05Uh#>;+f6!lz7{G?r$$^SIkA_RwicMEwN<Ntn#!Sy>?;B|~Y
z%s19LGQ#l;<HHA<^KC|W4U8+sw;FfePR6%z1yIELUo+lgumOr$|2#Aps9w$D`Y^=$
z7XhdE*IjM^Jx3ltN3s4Q*6+^xGg&`zr~%e6Ue5Rvj7z<-knv@kOhoiMLD)RN`2G3?
zlBt);)l;HR4GSE4&MV|5;8b6Q`1y-u>SH_OJ)`j5jQ5Vh4>8^^3O@;)@*!)i@p~ux
zryZFHKg@U;<Lwy#^*96UV7x2iJ;obA&uPKWiy6O>8cR4v8sVif{utxK7$3>_CyeX4
zC*aZ<@AxaD$d}EV&G<yd`?H@C#&2O<&rt@q1UQw44San&u>K>gzk7-S#Lo+iC#D-*
z&sE0H?d)eK`;mUsXRN<@hSAq^kMZ*;<NBj4oa;HqkcsGUQ9ftr7yEd(XUx1L;1tjO
ze>3H0G~>Nlf68nF=()%EIh^&6MaAa^#ut5I{G_p;Iqc_yECYPZ_<Y9Kh7GWm@p~8_
z&lP_u<7?ReHulfi=lzcLx3IpRqYRt(7{{t*`rvBR`-<^%^9`=&B;)7L@BpFwDdQWR
z+HG`nWc*pi^&Dj2moWZYejw<1$H0d$p8g71V@|IT-gw5}XZ$V3XE0v(ssZ%;V*Fgd
z_~v&E&dKnWGv4K0gX{Uk_*u_*|Mv~9=Mm#4Js;@$w))Oo7u<&WXkffG<0v-zc$59K
z|InQ4xyJapkMZB`F}R*%jGreNzl$%do?8t3!gEcy7qEXkhV;<|IOTKC1Ll0XiIz8r
z@!Eq1*K>^V^IFCqJ!J6iMtCzBZ(v-WUpF&;<zb`v0{dUa_~9c4pT&4R<D<VaxSl(V
zpRX}~#SaFT=l)*CUt+wP{ZP4}boKtx=<7Mc_}S`b24CIEC@wR!*NO3-=NMet8+{qi
zV0<v^U&Z)cjO%&7;I3u7Zx`d|S=RR%|B&%&#!DH$wyV*vWqdK?Z!@0B_zK`uenNa5
zWjy71*6)#I{OCElu-V4=g&~7q%zoZy{0hdeVf<sp=QF;T@xzS&gYhcHPcU9W9SR)X
zjPN>~XY%=;iwv-Z_4_hDvWLO-Tw8Eg0H<_qJ7{pphlz}*ed*#fzhCP!zKH$bEc%Cx
zzTiuMQ+X)qX>dJ<7dDSEKI#&K>$$tYUlBi?&(h-G!TO)}G5UHgFZ91=`~WBDb6|8N
zw&v?~*ywZid7T+g;|G37Yh!*iaEj;aml^#uBfOD}H|uYJ0@hDwJTKMY(m%>){1L{b
z{44}c`8J)?h3Y~d%QW8EOW}5c)Jv<_&k6P;_ubR%r;Ou|+f5&@v3}8D6CXW~7R+AO
z&*E^qvi^6hpE1Gc|AiYmEim9p`Os^!!3P-Og@9B17e)EGob_**VictvGL7}?Szr2J
zg{;4vI<`1=vj4?ezl+y1s$cUo<GrKs*MU=iryZw<qwgJHynPg&*v9Bf|5NmT!FW=X
z{t)1l4=tye2ugop9B^I!Ib9O|EY=@<z0ucmaN)CD>v#6*`TBO|a2B)v`fQ`G=i`FA
zpYbsFzaC}%CmBD*c$o2*8K0GJ{48O78{_*K{~hDI7=NR{=oc~m1>?zu1}|p(d&VDS
zd>`Y9ZB0Jx<b06&u(QTHd)qj@Jz2jO;~tL#2tEin<@17@Ot^CYPGS6pxdzwsW#KE2
z@zJ*#d<FZjW_&N>dhRQ@WsLu2snP$E^&bOH*YOC)AE)}*$ok)LL+J$L?=Ze<mGN^u
z;~$AW;|m!7it)ThjQ%~0pJe=d#<>~lwM0Rpe3<;G(bw}zVbg{2ySP6q{m{!8pT_;@
zJ?wux<Gt4!KYDH_xEYMMf5zZjS-*(!9gOR_oZx=Lcp?oD;m~t9A?Z5>iszK|2G?^p
zfv;!$$BhPmkc@D=%lP}R8vJqtd-S~m`Dw=eVtKB8!}w>6Z)AO1Y=QKbHyA$$jPTCK
zfH2`h-ZsFZ1Y;0le9OBA=Vp-CpYb*C8T>Bxa}DE{>@dLl9PT8>|IWCc=Ljy7@!`9S
zzMdZld@kb~|6*|Nc6zspAI6_&{|__%*oQ{{62_lnd^_XPe*OdFAMG~!(th}W@%DQR
zuIC%V*FMJY`N-h%Jo*l}9+%_$RO-cF;zlMsD+<3(aK3+gb3ChoQ~t}ix1Og5?lIP1
z6y;~P#=Cejt}WrV#)F>1m2qwHe<g78FXQ4;FHve@jrZngKNomCFW`c}@gxyTzg+uo
z>&g2?QD4CE@i_j1FV%QQFZ#XGa^UoKqWw{m&!YbX`#Hk-Cin{)N9y^#q2O-<PoTGs
zAwi6M7dW!+wBxfl_)*}Y)3os&93G4pAU~ImHssB$bFs!xH@JfJ!ylV;eZVS{;^_OV
zfA3VIe>LkbW_;mD13bp~7-Rv(XCuG&=)w5Itp9G5pV#7qyOZ@l`qYFg>G}@%`Seye
zYFzz996#rGF!5QPY$Eb=j?X~G3%MQG$pqtNXq=S-q9hJ}TO9mB_TP1saZ<{@o@abk
zUjuYw{6FIODMcZn{QPjJQIzM-UiMSB*F^j&_VaxlKlF_R`B^p4=<DysVAG57jhsJn
zeJ5$0od$#-2QLF23h2qt-?0C+gG{(@Fi{`J&&D|TTkPky6yqnA{p@4>`Y{IR#rO}5
zU&y%R^SLMhln*IU`oCoShY`ks<Z~a!XI)|NM)rS=#`z>5u8V_bv!CO`jPi4A(?{R$
zZM<7K|K)vCHS3S(_{j6+LB<DtV)9`X`*}|E`2jM{(B7MjPvCIH&tDmz&G#ct_0h!m
z4)!nY)t~cyeS+&5$<NC)&c*>T95^2FryZk!pO5FlPOd+3s*g<Vr;V4-_q*IL^BF(P
z&$}Adzm4%Lt~7vLmz9iv!S|iq7cVltnadA%r@haBhuCLO{K)!uv!CfqHbaA-%Fknb
zqey;sVZ6gtMp4SoC5(T}9WN>W!+~EE43K}%Wc_;fBju!m@yFAQqTqKkp3L>Y9QLz{
z@v5ln>t&Z$R#ajoP3(_=HQjUbu@*J9E~qT_vx~4EWd#-p%_;Tsi%RE&i~Jm{m|Ee7
zs}^{);3Zat&CN+piLK%16_ynG;qvluwT~s=%d5S-@^EpkpHo#_Tn&@JnGelMM-_`=
z+D#kghbxMGy=Z!ckHt>0;AdVK3lMvg#!Q+rb%vilV%!*i+Ju>7%nF%U9$R*P_=%NG
zeLsEbn2d}W{@Cj$kII-ZWwP%l4@?Po;k_VEb7OG3LaJWCQwOV8Ry|FfP*>TnsK_1Y
zhv$V0i}b4cW(m-W$}kp0<t-(!<f=K(#&WE4!r55)*JzdJVjbKf-ok*fipreAQlFL#
zcYunyg=G$qTbk#bNBcG*>UDM{u=#~0;xymSLxii!v7&8mxB_d88=c(pa{g6pH{3w%
z!#O#6F??SyaV;8EMFV4?;hfm$pqRR;u~6FT1EnKppoC;ru>~^dGz3dp>osj@0op>!
zgK9sosIUy{;F@J_O<Dg5C4?6)`UxFc$=L*@m(MK@7fPnlI<l3ySoGb{bQ)Qv7duas
z1z9=`u=#~~L6%MfY*|H4kfqZgTbS*zI1R9RQQbha^m%|UD=BuYaT;I?a!_kT(nP1x
zY^h(ABc+8_vJI%)g>6la$ojwoF83=-{h^#sf(|7R%jde+QD4Pam|sy;n2nk&a4ljk
zWgM$U7;wdz%*+bMG3_MIdB}vy;Ihf=&usJ(h!S1MKoOz5a{<cVQXly$F&bFl=ZA}n
z!+~?G4vkf^jn{&KMTYka1BlkJNPcdmL=>?MR1lH611eH%@e?T)|2P{oFnBiLavQeh
z?3t{NT+Q*2>&UA=$IQPWR@bboTphXKt~ts<Ob1dt=2R6H<><Adu|haIHCP^&1^2NT
zipj40^3wTSuliW7JDex!)EmLD(rN2X#|&Dp!Hr7rra6USDR#LFDs!=Zc6n}gZs9y}
zt=%E7e5_9`ia{(GYEEuVVSY_G-^FNAaDNVJqq*^LAIo*;`#F+K?cOY!ZR`whvmv`E
zTr7``!klbGE#O=O6@|t2nSiMCCNCxvwRgQQ1xE*KVOQkp20&?9HCB(u66U^MT0fwl
zlY4VjxTMl<yyR;y)PATa5I4N!I0sf4&QBhY>S-YrysS!23#8KqP_#jf2}D1EwNEOD
zdIuWGY%wye5w^mL?a2e=Ny1sB%^j~nLa(fjO*<-(ceLa?O40xh+yUqL;?{u+;=u9L
zf%}20;P}eVEy*n}l&d{s)SOYe+Q6dd6fKUF0|z|eiB(mmv!4}djr|fAnuFEnOZ=e=
zhI&**nQLXzAGoB2C3$F(V2$)BjL%Wr%gt)+wiXYr&>r)qk_@ehbwk%gs;(N`Pg19u
zwo>HYs&Q|>8r~_17m>$vqI7;)7@HE9SVz%<V(%n8KIF`7^5f45V`X_ZV+ePAxzx=y
zw8e{~q=BG{xl<%Y!MjeXPvPh;s_-}zsTPt4aNE^4j;cz?3`L^?cU;h$p=mD}_b#d7
zhP7`TOJW42_=ZceC6N&?tcXqm`Q$UI)AWR2H;n9p-0Zn}6@9*ysO5uY?vt-D+j{6b
z2N#WYYcQEv7RFW~5(I4+;hP7T*{H$jWXD>ZKUNu%Vi9e?{w1HCMf_v=iGDT(4dOhG
z<Y{CIkIn+wR>LHssstB{cUGy6-4?Z*1fZo8&gVWE$33=ru$3BHBhp5V@*XseqGH&@
zd<4s5(3BOr)VgoMJ6f3Xku0rolpkowRfld=6+-3&1vM%nwFftu19eUT_5-8mDjVRJ
z*@nbqcW{G+SeJMZ?Q-MmQkIN5o3>-%GpUEDS&p2*^RHsAbV}v1LYzsp^T?n^uD&yH
zXL7U%3M7k8sUt_bhQujJ_BKb;o}WS3W<;_DE&9R=$<s1!?&G;zE*j(=eKOY1##1?R
zM*6x^59mvGBapKMnbhe`Q-Zf5QBINxh`N%rlMumFjY+im@lG&r)?zLb0Xjw{s47`m
zpA$i?WnXXB6X`V*9>`DWlmv5tFkFSo(z)0J$OJ<Ww<-fjzz<!}z$taBqE91*k+Lz!
zqMsCfT7gYMB6TSgsI%_RFDOKpD2gep$SKUX#hChFh&=6)lpm=iDTGM)6j-n;QCNYt
zvjKQ?LT|BDf&m>|#&EH;dXX2ryNS*f%4giydV3gafCmZ&U;ZZ+c!1FEGC%40zoT=e
z=mvJT`5#6440bW1eg^HR1UQ;wr;eC3#ve0zwC{U*WDFUbQ-R(bS`xT<{n0ZfkC-%J
z6wq;#ulL7{_l*JVDCGMYlSYZ@xQSCnj+p3A89R2`m<&H-#K?(b;E=}8yrLXDThhi&
zoG@~fKM<dXQ0-e@l3na#{)CK4s5WGr53XsHFC#Jzg~CF2Ltc3)MgZ;L6ZXq2FD;Mq
zj*WqIQPaA*YDY^uoO8Ms`cttUZj}Y3Zf-a#Y<VVB?MatF>FAlQar8qIJz!LgKAYxY
zjItv4^Z-qXrzT}oI?D0+OkpuHoQBuX6v-}_tB19$3$8k;V%LL0fk7f3A2RXP?I*5&
z&A^wRUxmgN4Nk#(7|kx)-UuUR)-_!cR8(;7KzX>GvmHdIJ$M~pRf+*rjYkc_`F>?l
zg?^}D#4U1xxKk9B51g~*(S<@g4yLH2)KucAG-MOqLjACdlPC6iROS}B3C=^q+)148
z=NBU<%~+#<dS=?7&32hkD6cGaeIh%u%c`wcbOcXJKrr6=8K8%rOxw|DV<d`)Q-Wwf
zH!!rK3n!aVpC?k_t4dD0df31%cdm_`xesxt=%<!83|`GZv5(wr=K5159#daGJYzGc
z<~0%Ji%N6MThOE_auY|{1@g$`h90zX(pH8(C0Dm-{g;Q!t0R>?d)H4NdoKo4A9*T9
za)-*O9qI|*1d(bXSW=_!J#Kwa1KHDc-A~nY(U&zk3+Q@FGcy=47f;{MUJ#}l9XmPJ
z#HfjM!sN09(;m3;LD=50CSGxCKrF^tQC*Ct7bNZwEeqrqKC;YB&M&D-#_$F<ajUHM
zk}afr&zBYEcv_(#j3Jifoaz!dGqSSWFtk@1?Ifzz_{0ZSo?8?q1O8QpH!;cj`IC&F
z$@!%?r5_c!*<NxbHQJJCAP3r|de|p9w*W<yUIgJ*^XwUP=TuY}Pv%XKv6J5jFkFmL
z4GMt#Bd)YRW3o0vzpWUrnD|B4|E1^(`&Rf%U_bl$hsY4)B4nPYoYQODpuOJMmdHe-
zA@kzQ8O>R74|=_O0^f8?`0^dQ$Xb4nD|XT0Ukm&5@F({2ox8|7o&ethI^;_1@p@Aq
z)9|07D)#c-yh!;@-e?;i@|)z1_@i&u#a_Ns7kMu$OZ-JoWC3{k242q7Fpr52ky-l8
ze78(G5`Tuh`S?M;#lD{HMap;g6290=`fp?Vk?c^u;}<F4{gXY}MBCGQUdmU_=E%$B
z5I`JMzJiCuL$EvWBWNEA8AjxOA_IrKQy2NK;DYw{rSe6_Nc6;ooQtIShe7*xV#iYE
z^TxBM_v=A>`L0;xiC5eNNVwvU-eU*tW!{!ZO#gL`==^($?Gr?6KZnP%J?3Wyk5KRg
zzqjCzEW}>sdx@kyHiAcV_-}y>+P6Dl!WY>oDQF!jKZ5=lKd4M4vSaxUdQmqMqmU@F
zl=3I=9{gy7Kdx@<chq7ZtuN;y{{~yiBC(h6wwH1Eq6Zay$hpXGfl?NUz09MlV|yt-
zRR7Q+c2W)=0!BF|_F4T+y0iF0nR;-+L+nMK02#Em^Y21@Ma|`~F2qixinf>ef&9TI
zPs_LVA^XexXaWD^OX4rz!ymcGgfH_(#7xpH=RbozMKMJHmSW#43YX*rC8yNUY)2nh
z<4F01foZ<Zf8kHkE%o2Iz$ETQ)BH~xVeGeJ9!c<!a0R34HkSR#na2LYD1)d|@BaW*
CSPCNm

literal 0
HcmV?d00001

diff --git a/run_tree/run.sh b/run_tree/run.sh
index a9fbfea..ad1b01f 100755
--- a/run_tree/run.sh
+++ b/run_tree/run.sh
@@ -1,2 +1,2 @@
 
-onyx build -I ../src -o game.wasm $@ && onyxrun game.wasm
+onyx -V build -I ../src -o game.wasm "$@" && onyxrun game.wasm  # "$@" keeps each extra argument intact
diff --git a/src/build.onyx b/src/build.onyx
index f7eaea8..c4562a1 100644
--- a/src/build.onyx
+++ b/src/build.onyx
@@ -7,22 +7,26 @@
 #library_path "./lib"
 
 // Primary source files
-#load "config"
-#load "main"
 #load "camera"
-#load "mesh"
-#load "vecmath"
 #load "chunk"
-#load "world"
+#load "config"
 #load "font"
-#load "shader"
 #load "input"
+#load "main"
+#load "mesh"
 #load "physics"
 #load "player"
+#load "shader"
+#load "texture"
+#load "vecmath"
+#load "world"
+#load "worldgen"
 
 // Onyx library code
 #load "stb_truetype"
+#load "stb_image"
 
 // Onyx modules
 #load "glfw3/module"
 #load "opengles/module"
+#load "perlin/module"
diff --git a/src/chunk.onyx b/src/chunk.onyx
index d915d8c..be71bb2 100644
--- a/src/chunk.onyx
+++ b/src/chunk.onyx
@@ -7,17 +7,24 @@ Block :: #distinct u32;
 
 Block_Empty :: cast(Block) 0;
 
-block_make :: (red, green, blue: f32, brightness: f32) -> Block {
+Block_Options :: struct {
+    texture_enabled := true; // When true, block_make sets bit 16 of the packed Block value.
+}
+
+block_make :: (red, green, blue: f32, brightness: f32, options := Block_Options.{}) -> Block {
     r := cast(u32) (red        * 15.0f);
     g := cast(u32) (green      * 15.0f);
     b := cast(u32) (blue       * 15.0f);
     i := cast(u32) (brightness * 15.0f);
 
-    return ~~((i << 12) | (b << 8) | (g << 4) | r);
+    tex := 1 if options.texture_enabled else 0;
+
+    return ~~((tex << 16) | (i << 12) | (b << 8) | (g << 4) | r);
 }
 
 Chunk_Vertex :: struct {
-    position: Vector3;
+    position : Vector3;
+    texture  : Vector2;
 
     // This field is broken up by bit, but Onyx does not (nor ever will) support bit-fields.
     //
@@ -31,6 +38,7 @@ Chunk_Vertex :: struct {
 Chunk_Size :: 32
 
 Chunk :: struct {
+    coord:    Vector3i;
     position: Vector3;
     blocks: [] Block;
 
@@ -40,6 +48,7 @@ Chunk :: struct {
 
 chunk_make :: (x, y, z: i32, allocator := context.allocator) -> ^Chunk {
     chunk := new(Chunk, allocator);
+    chunk.coord = .{ x, y, z };
     chunk.position = .{
         ~~(x * Chunk_Size),
         ~~(y * Chunk_Size),
@@ -60,6 +69,10 @@ chunk_make :: (x, y, z: i32, allocator := context.allocator) -> ^Chunk {
     return true;
 }
 
+chunk_coords_to_world :: (use chunk: ^Chunk, x, y, z: i32) -> Vector3i {
+    return coord * Chunk_Size + .{x,y,z}; // chunk.coord scaled by Chunk_Size, offset by the chunk-local (x, y, z)
+}
+
 chunk_set :: (use chunk: ^Chunk, x, y, z: i32, block: Block) {
     if !in_chunk_bounds(x, y, z) do return;
     blocks[x * Chunk_Size * Chunk_Size + y * Chunk_Size + z] = block;
@@ -91,6 +104,22 @@ chunk_get :: (use chunk: ^Chunk, x, y, z: i32) -> Block {
     Vector3.{ 1, 0, 1 },
 ];
 
+#local block_textures := Vector2.[ // Values copied into each vertex's `texture` field by chunk_build_mesh.
+    Vector2.{ 0, 0 },
+    Vector2.{ 0, 1 },
+    Vector2.{ 1, 1 },
+    Vector2.{ 1, 0 },
+];
+
+#local block_texture_indicies := ([6] u32).[ // Row i is used alongside block_indicies[i] (presumably one row per block face); entries index block_textures.
+    u32.[ 0, 2, 1, 0, 3, 2 ],
+    u32.[ 0, 2, 1, 0, 3, 2 ],
+    u32.[ 0, 2, 1, 0, 3, 2 ],
+    u32.[ 0, 1, 2, 0, 2, 3 ],
+    u32.[ 0, 1, 2, 0, 2, 3 ],
+    u32.[ 0, 1, 2, 0, 2, 3 ],
+];
+
 #local block_indicies := ([6] u32).[
     u32.[ 0, 2, 1, 0, 3, 2 ],
     u32.[ 3, 6, 2, 3, 7, 6 ],
@@ -122,16 +151,18 @@ chunk_build_mesh :: (use chunk: ^Chunk) {
             if chunk_get(chunk, nx, ny, nz) != Block_Empty do continue;
             color := block;
             if i != 4 {
-                color = cast(Block) (0xb000 | (0xfff & cast(u32) color));
+                color = cast(Block) (0xb000 | (0xffff0fff & cast(u32) color));
             }
             if i == 5 {
-                color = cast(Block) (0x9000 | (0xfff & cast(u32) color));
+                color = cast(Block) (0x9000 | (0xffff0fff & cast(u32) color));
             }
 
             indicies := cast([] u32) block_indicies[i];
+            tex_indicies := cast([] u32) block_texture_indicies[i];
             for j: 6 {
                 v := block_verticies[indicies[j]];
-                verticies << .{ .{ ~~x+v.x, ~~y+v.y, ~~z+v.z }, ~~color };
+                t := block_textures[tex_indicies[j]];
+                verticies << .{ .{ ~~x+v.x, ~~y+v.y, ~~z+v.z }, t, ~~color };
             }
         }
     }
@@ -159,14 +190,14 @@ chunk_highlight_block :: (x, y, z: f32) {
     data := 0xf000;
 
     vertex_data := cast(^Chunk_Vertex) alloc.from_stack(sizeof Chunk_Vertex * 8);
-    vertex_data[0] = .{.{x-0.001,y-0.001,z-0.001},data};
-    vertex_data[1] = .{.{x-0.001,y+1.001,z-0.001},data};
-    vertex_data[2] = .{.{x+1.001,y+1.001,z-0.001},data};
-    vertex_data[3] = .{.{x+1.001,y-0.001,z-0.001},data};
-    vertex_data[4] = .{.{x-0.001,y-0.001,z+1.001},data};
-    vertex_data[5] = .{.{x-0.001,y+1.001,z+1.001},data};
-    vertex_data[6] = .{.{x+1.001,y+1.001,z+1.001},data};
-    vertex_data[7] = .{.{x+1.001,y-0.001,z+1.001},data};
+    vertex_data[0] = .{.{x-0.001,y-0.001,z-0.001},.{0,0},data};
+    vertex_data[1] = .{.{x-0.001,y+1.001,z-0.001},.{0,0},data};
+    vertex_data[2] = .{.{x+1.001,y+1.001,z-0.001},.{0,0},data};
+    vertex_data[3] = .{.{x+1.001,y-0.001,z-0.001},.{0,0},data};
+    vertex_data[4] = .{.{x-0.001,y-0.001,z+1.001},.{0,0},data};
+    vertex_data[5] = .{.{x-0.001,y+1.001,z+1.001},.{0,0},data};
+    vertex_data[6] = .{.{x+1.001,y+1.001,z+1.001},.{0,0},data};
+    vertex_data[7] = .{.{x+1.001,y-0.001,z+1.001},.{0,0},data};
 
     if block_highlight == null {
         #persist index_data := u32.[
diff --git a/src/input.onyx b/src/input.onyx
index a9a173a..a05c3f5 100644
--- a/src/input.onyx
+++ b/src/input.onyx
@@ -61,4 +61,4 @@ is_button_just_up   :: (button) => !buttons_this_frame[button] && buttons_last_f
 
 mouse_get_delta :: () -> (f64, f64) {
 	return mouse_x - last_mouse_x, mouse_y - last_mouse_y;
-}
\ No newline at end of file
+}
diff --git a/src/main.onyx b/src/main.onyx
index 62b2bbd..3da9d41 100644
--- a/src/main.onyx
+++ b/src/main.onyx
@@ -75,6 +75,8 @@ toggle_cursor_grabbed :: () {
     }
 }
 
+#local block_texture: Texture;
+
 setup_opengl :: () {
     glInit(glfwGetLoadProcAddress());
 
@@ -96,6 +98,8 @@ setup_opengl :: () {
     shader_link_world_matrix_block(world_shader);
 
     font = font_lookup(.{"./assets/fonts/calibri.ttf", 32});
+
+    block_texture = texture_make(#cstr "assets/textures/block.png");
     
     shader_use(world_shader);
     world = world_make();
@@ -145,6 +149,8 @@ draw :: () {
     glClear(GL_COLOR_BUFFER_BIT | GL_DEPTH_BUFFER_BIT);
 
     shader_use(world_shader);
+    shader_set_uniform(world_shader, #cstr "u_texture", 0);
+    texture_use(^block_texture);
     world_draw(world);
     
     glLineWidth(2);
diff --git a/src/mesh.onyx b/src/mesh.onyx
index 3c969c7..132a4c2 100644
--- a/src/mesh.onyx
+++ b/src/mesh.onyx
@@ -1,7 +1,7 @@
 use package core
 use package opengles
 
-Mesh :: struct (T: type_expr) {
+Mesh :: struct (Vertex_Type: type_expr) {
     handle: GLint;
     vertex_handle: GLint;
     index_handle: GLint;
@@ -53,13 +53,15 @@ mesh_make :: (verticies: [] $T, indicies: [] u32) -> ^Mesh(T) {
     return mesh;
 }
 
-mesh_update_verticies :: (use mesh: ^Mesh($T), verticies: [] T) {
+mesh_update_verticies :: (use mesh: ^Mesh, verticies: [] mesh.Vertex_Type) {
+    @TODO // Add bounds checking to arrays here.
+
     glBindBuffer(GL_ARRAY_BUFFER, vertex_handle);
-    glBufferSubData(GL_ARRAY_BUFFER, 0, verticies.count * sizeof T, verticies.data);
+    glBufferSubData(GL_ARRAY_BUFFER, 0, verticies.count * sizeof mesh.Vertex_Type, verticies.data);
     glBindBuffer(GL_ARRAY_BUFFER, -1);
 }
 
-mesh_draw :: (use mesh: ^Mesh($T)) {
+mesh_draw :: (use mesh: ^Mesh) {
     glBindVertexArray(handle);
     if index_count > 0 {
         glDrawElements(primitive, index_count, GL_UNSIGNED_INT, ~~0);
@@ -69,7 +71,7 @@ mesh_draw :: (use mesh: ^Mesh($T)) {
     glBindVertexArray(-1);
 }
 
-mesh_free :: (mesh: ^Mesh($T)) {
+mesh_free :: (mesh: ^Mesh) {
     glDeleteBuffers(1, ^mesh.vertex_handle);
     glDeleteBuffers(1, ^mesh.index_handle);
     glDeleteVertexArrays(1, ^mesh.handle);
diff --git a/src/physics.onyx b/src/physics.onyx
index 834ed17..8b89b6a 100644
--- a/src/physics.onyx
+++ b/src/physics.onyx
@@ -31,7 +31,7 @@ physics_apply_gravity :: (use body: ^PhysicsBody) {
 }
 
 physics_simulate :: (use body: ^PhysicsBody, dt: f32, world: ^World) {
-    aabb_buffer := (cast(^AABB) alloc.from_stack(sizeof [128] AABB))[0..128];
+    aabb_buffer := (cast(^AABB) alloc.from_stack(sizeof [256] AABB))[0..256];
 
     aabbs := world_get_aabbs(world, pos, 3, aabb_buffer);
     vel += acc * dt;
diff --git a/src/player.onyx b/src/player.onyx
index 3c634fb..52a1b41 100644
--- a/src/player.onyx
+++ b/src/player.onyx
@@ -11,7 +11,7 @@ player_make :: () -> Player {
 
     player.camera = null;
     player.body = .{
-        .{0,10,0},
+        .{0,48,0},
         .{0,0,0},
         .{0,0,0},
 
@@ -61,7 +61,7 @@ player_update :: (use player: ^Player, dt: f32) {
     physics_simulate(^body, dt, world);
 
     // Fix falling off the world
-    if body.pos.y < -10 do body.pos = .{0,10,0};
+    if body.pos.y < -10 do body.pos = .{0,48,0};
 
     camera.position = body.pos;
 
diff --git a/src/texture.onyx b/src/texture.onyx
new file mode 100644
index 0000000..5d51168
--- /dev/null
+++ b/src/texture.onyx
@@ -0,0 +1,38 @@
+
+use package core
+use package opengles
+use package stb_image
+
+Texture :: struct { // A GL texture handle together with the metadata texture_make records while loading it.
+    texture: GLint; // Texture name written by glGenTextures in texture_make; texture_use binds it.
+    width, height, channels: i32; // Filled in by stbi_load. NOTE(review): stb_image reports the file's own component count in `channels`, not the 4 requested - confirm.
+    filename: str; // The path given to texture_make, converted from a cstr.
+}
+
+texture_make :: (path: cstr) -> Texture { // Decode the image at `path` with stb_image, upload it as a 2D RGBA GL texture, and return its Texture record.
+    tex: Texture;
+    tex.filename = path |> string.from_cstr();
+    pixels := stbi_load(path, ^tex.width, ^tex.height, ^tex.channels, 4); // Ask for 4 components per pixel so the data matches the GL_RGBA upload below.
+    assert(pixels != null, "Failed to load texture.");
+    defer stbi_image_free(pixels); // The decoded pixels are only needed until they have been handed to GL.
+
+    glGenTextures(1, ^tex.texture);
+    glBindTexture(GL_TEXTURE_2D, tex.texture);
+    glTexImage2D(GL_TEXTURE_2D, 0, GL_RGBA, tex.width, tex.height, 0, GL_RGBA, GL_UNSIGNED_BYTE, pixels);
+
+    // Nearest-neighbour filtering, clamped to the edge on both axes. Are these sensible defaults?
+    glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_NEAREST);
+    glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MAG_FILTER, GL_NEAREST);
+    glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_CLAMP_TO_EDGE);
+    glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_T, GL_CLAMP_TO_EDGE); // Previously WRAP_S was set twice, leaving the T axis at the GL default.
+
+    glBindTexture(GL_TEXTURE_2D, 0); // Unbind so later GL_TEXTURE_2D calls do not modify this texture.
+
+    return tex;
+}
+
+texture_use :: (use tex: ^Texture, texture_binding := 0) { // Bind `tex` as the 2D texture on texture unit `texture_binding` (unit 0 when omitted).
+    glActiveTexture(GL_TEXTURE0 + texture_binding); // Select the unit first; the bind below applies to whichever unit is active.
+    glBindTexture(GL_TEXTURE_2D, texture); // `texture` is tex.texture, brought into scope by `use`.
+}
+
diff --git a/src/world.onyx b/src/world.onyx
index 2a1bf35..72238b0 100644
--- a/src/world.onyx
+++ b/src/world.onyx
@@ -13,16 +13,8 @@ world_make :: (allocator := context.allocator) -> ^World {
 
     for x: 0 .. 3 do for y: 0 .. 3 do for z: 0 .. 3 {
         chunk := chunk_make(x, y, z);
-
-        for z: 32 do for x: 32 {
-            chunk_set(chunk, x, 0, z, block_make(0.2, 1, 0.2, 0.8));
-        }
-        for z: 32 do for x: 32 {
-            if random.between(0, 10) >= 3 do continue;
-            chunk_set(chunk, x, 1, z, block_make(random.float(0, 1), random.float(0, 1), random.float(0, 1), 1));
-        }
-
         world.chunks[x * world.chunk_dist * world.chunk_dist + y * world.chunk_dist + z] = chunk;
+        generate_chunk(world, chunk);
     }
 
     return world;
diff --git a/src/worldgen.onyx b/src/worldgen.onyx
new file mode 100644
index 0000000..96041d2
--- /dev/null
+++ b/src/worldgen.onyx
@@ -0,0 +1,20 @@
+
+use package core
+#local perlin :: package perlin
+
+#local seed :: 1234
+
+generate_chunk :: (world: ^World, chunk: ^Chunk) { // Fill `chunk` column by column from a Perlin-noise height; `world` is not referenced in this body.
+    for cz: 32 do for cx: 32 { // NOTE(review): the literal 32 presumably equals Chunk_Size - confirm.
+        t := chunk_coords_to_world(chunk, cx, 0, cz); // Presumably the world-space position of this column - verify against chunk_coords_to_world.
+        px := cast(f64) t.x / 16; // t.x and t.z are divided by 16 before being used as noise coordinates.
+        pz := cast(f64) t.z / 16;
+        h: i32 = ~~(perlin.noise(px, ~~(10 * seed), pz) * 24 + 14); // Column height: noise scaled by 24 and offset by 14; the seed only fixes the noise y coordinate.
+
+        h -= chunk.coord.y * Chunk_Size; // Make the height relative to this chunk. NOTE(review): h is not clamped to Chunk_Size; confirm chunk_set tolerates out-of-range y.
+        if h >= 0 { chunk_set(chunk, cx, h, cz, block_make(0.2, 1, 0.2, 1)); h -= 1; } // Place the top block of the column, then step to the block beneath it.
+        for cy: 2 .. h+1 do chunk_set(chunk, cx, cy, cz, block_make(0.3, 0.3, 0.1, 1, .{texture_enabled=false})); // Untextured filler from y=2 up through h, assuming `..` excludes its upper bound.
+        for cy: 0 .. math.min(h, 2)+1 do chunk_set(chunk, cx, cy, cz, block_make(0.2, 0.2, 0.2, 0.5, .{texture_enabled=false})); // Bottom layers up to y=min(h, 2); runs last, so it overwrites y=2 from the loop above.
+    }
+}
+
-- 
2.25.1