diff --git a/.gitmodules b/.gitmodules
index 6e456528..0479e3d8 100644
--- a/.gitmodules
+++ b/.gitmodules
@@ -34,3 +34,6 @@
 [submodule "Plugins/nosWebRTC/Source/ssl-cert"]
 	path = Plugins/nosWebRTC/Source/ssl-cert
 	url = https://github.com/mediaz/ssl-cert.git
+[submodule "Plugins/nosUtilities/External/freetype"]
+	path = Plugins/nosUtilities/External/freetype
+	url = https://github.com/freetype/freetype.git
diff --git a/Plugins/CMakeLists.txt b/Plugins/CMakeLists.txt
index 589829f7..63685e54 100644
--- a/Plugins/CMakeLists.txt
+++ b/Plugins/CMakeLists.txt
@@ -42,6 +42,7 @@ add_subdirectory(nosReflect)
 add_subdirectory(nosStrings)
 add_subdirectory(nosAnimation)
 add_subdirectory(nosGraphics)
+add_subdirectory(nosGeometry)
 
 nos_get_targets(PLUGINS_COMMON_EXTERNAL_TARGETS "./External")
 nos_group_targets("${PLUGINS_COMMON_EXTERNAL_TARGETS}" "External")
diff --git a/Plugins/nosFilters/Config/BokehDof.nosdef b/Plugins/nosFilters/Config/BokehDof.nosdef
new file mode 100644
index 00000000..df5b08fb
--- /dev/null
+++ b/Plugins/nosFilters/Config/BokehDof.nosdef
@@ -0,0 +1,121 @@
+{
+	"nodes": [
+		{
+			"class_name": "BokehDof",
+			"menu_info": {
+				"category": "Filters",
+				"display_name": "Bokeh DoF"
+			},
+			"node": {
+				"class_name": "BokehDof",
+				"name": "Bokeh DoF",
+				"description": "Single-pass 2D depth-of-field. The circle of confusion (CoC) is computed from a linear view-space Z input; samples are gathered on a Vogel disc weighted by the BokehShape kernel texture, so bokeh takes the shape painted into BokehShape.",
+				"contents_type": "Job",
+				"contents": {
+					"type": "nos.sys.vulkan.GPUNode",
+					"options": {
+						"shader": "Shaders/BokehDof.frag"
+					}
+				},
+				"pins": [
+					{
+						"name": "Input",
+						"type_name": "nos.sys.vulkan.Texture",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": {
+							"filtering": "LINEAR"
+						}
+					},
+					{
+						"name": "Depth",
+						"type_name": "nos.sys.vulkan.Texture",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": {
+							"filtering": "NEAREST"
+						}
+					},
+					{
+						"name": "BokehShape",
+						"type_name": "nos.sys.vulkan.Texture",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": {
+							"filtering": "LINEAR"
+						}
+					},
+					{
+						"name": "FocusDistance",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 5.0,
+						"min": 0.0,
+						"max": 1000.0
+					},
+					{
+						"name": "FocusRange",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 2.0,
+						"min": 0.01,
+						"max": 1000.0
+					},
+					{
+						"name": "MaxRadius",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 16.0,
+						"min": 0.0,
+						"max": 128.0
+					},
+					{
+						"name": "MinRadius",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0.5,
+						"min": 0.0,
+						"max": 8.0
+					},
+					{
+						"name": "BackgroundIsFar",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 1.0,
+						"min": 0.0,
+						"max": 1.0
+					},
+					{
+						"name": "SampleCount",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 48.0,
+						"min": 4.0,
+						"max": 256.0
+					},
+					{
+						"name": "KernelRotation",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0.0,
+						"min": -6.2832,
+						"max": 6.2832
+					},
+					{
+						"name": "Output",
+						"type_name": "nos.sys.vulkan.Texture",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_OR_PROPERTY"
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosFilters/Config/BokehShape.nosdef b/Plugins/nosFilters/Config/BokehShape.nosdef
new file mode 100644
index 00000000..3a466b9a
--- /dev/null
+++ b/Plugins/nosFilters/Config/BokehShape.nosdef
@@ -0,0 +1,93 @@
+{
+	"nodes": [
+		{
+			"class_name": "BokehShape",
+			"menu_info": {
+				"category": "Filters",
+				"display_name": "Bokeh Shape"
+			},
+			"node": {
+				"class_name": "BokehShape",
+				"name": "Bokeh Shape",
+				"description": "Procedural bokeh kernel generator. Produces a unit-disc grayscale mask shaped like a regular polygon aperture (blade count, roundness, rotation), with a soft edge and optional rim brightening. Feed the Output into a Bokeh DoF node's BokehShape pin.",
+				"contents_type": "Job",
+				"contents": {
+					"type": "nos.sys.vulkan.GPUNode",
+					"options": {
+						"shader": "Shaders/BokehShape.frag"
+					}
+				},
+				"pins": [
+					{
+						"name": "BladeCount",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 6.0,
+						"min": 0.0,
+						"max": 16.0
+					},
+					{
+						"name": "Roundness",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0.3,
+						"min": 0.0,
+						"max": 1.0
+					},
+					{
+						"name": "Rotation",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0.0,
+						"min": -6.2832,
+						"max": 6.2832
+					},
+					{
+						"name": "EdgeSoftness",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0.04,
+						"min": 0.0,
+						"max": 0.5
+					},
+					{
+						"name": "RimBoost",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0.0,
+						"min": 0.0,
+						"max": 4.0
+					},
+					{
+						"name": "RimWidth",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0.08,
+						"min": 0.005,
+						"max": 0.5
+					},
+					{
+						"name": "Output",
+						"type_name": "nos.sys.vulkan.Texture",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_OR_PROPERTY",
+						"data": {
+							"resolution": "CUSTOM",
+							"width": 128,
+							"height": 128,
+							"format": "R16_UNORM",
+							"usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET",
+							"filtering": "LINEAR"
+						}
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosFilters/Config/DepthOfField.nosdef b/Plugins/nosFilters/Config/DepthOfField.nosdef
new file mode 100644
index 00000000..1db5a70f
--- /dev/null
+++ b/Plugins/nosFilters/Config/DepthOfField.nosdef
@@ -0,0 +1,990 @@
+{ "nodes": [
+    {
+      "class_name": "nos.filters.DepthOfField",
+      "node": {
+        "id": "5899940c-437e-4f71-b119-bb80fb5d1e1a",
+        "name": "DepthOfField",
+        "class_name": "nos.filters.DepthOfField",
+        "pins": [
+          {
+            "id": "1950c2e6-a0f6-485b-8a02-bded8a2f6ed5",
+            "name": "Depth",
+            "type_name": "nos.sys.vulkan.Texture",
+            "show_as": "INPUT_PIN",
+            "can_show_as": "INPUT_PIN_OR_PROPERTY",
+            "visualizer": {
+            },
+            "data": {
+              "resolution": "HD",
+              "width": 1920,
+              "height": 1080,
+              "format": "R16G16B16A16_SFLOAT",
+              "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED"
+            },
+            "def": {
+            },
+            "advanced_property": true,
+            "meta_data_map": [
+              { "key": "AdvancedProperty", "value": "true" }
+            ],
+            "contents_type": "PortalPin",
+            "contents": { "source_id": "74a1bfd0-4f2d-447b-945c-8d0cb67a2120" }
+          },
+          {
+            "id": "e0b8f433-212f-48f6-ba4f-c8a194e1a707",
+            "name": "FocusDistance",
+            "type_name": "float",
+            "show_as": "INPUT_PIN",
+            "can_show_as": "INPUT_PIN_OR_PROPERTY",
+            "visualizer": {
+            },
+            "data": 5.0,
+            "min": 0.0,
+            "max": 1000.0,
+            "def": 5.0,
+            "step": 10.0,
+            "contents_type": "PortalPin",
+            "contents": { "source_id": "e709c7b4-9a59-4546-be53-0dc51abc5605" }
+          },
+          {
+            "id": "68187c92-92f3-40d0-8b24-df6f33f9f649",
+            "name": "FocusRange",
+            "type_name": "float",
+            "show_as": "INPUT_PIN",
+            "can_show_as": "INPUT_PIN_OR_PROPERTY",
+            "visualizer": {
+            },
+            "data": 2.0,
+            "min": 0.01,
+            "max": 1000.0,
+            "def": 2.0,
+            "step": 9.9999,
+            "contents_type": "PortalPin",
+            "contents": { "source_id": "534a26e9-1ebd-4ed2-89fb-bdf5d34b6ec1" }
+          },
+          {
+            "id": "42554a0a-2d70-4ec4-a2ea-594ad71559f3",
+            "name": "MaxRadius",
+            "type_name": "float",
+            "show_as": "INPUT_PIN",
+            "can_show_as": "INPUT_PIN_OR_PROPERTY",
+            "visualizer": {
+            },
+            "data": 16.0,
+            "min": 0.0,
+            "max": 128.0,
+            "def": 16.0,
+            "step": 1.28,
+            "contents_type": "PortalPin",
+            "contents": { "source_id": "63f77504-73aa-4b89-8849-65e27649b272" }
+          },
+          {
+            "id": "312c4450-a4ad-4690-ba3d-afcbc93da6eb",
+            "name": "MinRadius",
+            "type_name": "float",
+            "show_as": "INPUT_PIN",
+            "can_show_as": "INPUT_PIN_OR_PROPERTY",
+            "visualizer": {
+            },
+            "data": 0.5,
+            "min": 0.0,
+            "max": 8.0,
+            "def": 0.5,
+            "step": 0.08,
+            "contents_type": "PortalPin",
+            "contents": { "source_id": "97561978-6da1-4a33-a6bc-c654008a8261" }
+          },
+          {
+            "id": "ce6c0d45-8ce1-47ef-bd73-addda06d826e",
+            "name": "Output",
+            "type_name": "nos.sys.vulkan.Texture",
+            "show_as": "OUTPUT_PIN",
+            "can_show_as": "OUTPUT_PIN_OR_PROPERTY",
+            "visualizer": {
+            },
+            "data": {
+              "resolution": "HD",
+              "width": 1920,
+              "height": 1080,
+              "format": "R16G16B16A16_SFLOAT",
+              "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET"
+            },
+            "def": {
+              "resolution": "HD",
+              "width": 1920,
+              "height": 1080,
+              "format": "R16G16B16A16_SFLOAT",
+              "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET"
+            },
+            "advanced_property": true,
+            "meta_data_map": [
+              { "key": "AdvancedProperty", "value": "true" }
+            ],
+            "contents_type": "PortalPin",
+            "contents": { "source_id": "c278680b-43b5-40ce-b1af-a4551c2e58f0" }
+          },
+          {
+            "id": "2be9d3ba-9386-43b0-ae1c-58168be2a289",
+            "name": "Input",
+            "type_name": "nos.sys.vulkan.Texture",
+            "show_as": "INPUT_PIN",
+            "can_show_as": "INPUT_PIN_OR_PROPERTY",
+            "visualizer": {
+            },
+            "data": {
+              "resolution": "HD",
+              "width": 1920,
+              "height": 1080,
+              "format": "R16G16B16A16_SFLOAT",
+              "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED",
+              "filtering": "LINEAR"
+            },
+            "def": {
+              "filtering": "LINEAR"
+            },
+            "advanced_property": true,
+            "meta_data_map": [
+              { "key": "AdvancedProperty", "value": "true" }
+            ],
+            "contents_type": "PortalPin",
+            "contents": { "source_id": "479248dc-200d-4a4d-87d2-f2c7c77f667f" }
+          }
+        ],
+        "pos": { "x": 0.0, "y": 0.0 },
+        "contents_type": "Graph",
+        "contents": { "nodes": [
+            {
+              "id": "393281e0-2cb8-4b90-a98e-a8e708719229",
+              "name": "Output",
+              "class_name": "nos.internal.GraphOutput",
+              "pins": [
+                {
+                  "id": "2e4ec877-e014-49ae-ae1d-881a0e4d1ac5",
+                  "name": "Input",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_ONLY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET"
+                  },
+                  "def": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET"
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "c278680b-43b5-40ce-b1af-a4551c2e58f0",
+                  "name": "Output",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "OUTPUT_PIN",
+                  "can_show_as": "OUTPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET"
+                  },
+                  "referred_by": [
+                    "ce6c0d45-8ce1-47ef-bd73-addda06d826e"
+                  ],
+                  "def": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET"
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" },
+                    { "key": "PinHidden", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                }
+              ],
+              "pos": { "x": 1329.0, "y": 1025.0 },
+              "contents_type": "Job",
+              "contents": { "type": "" },
+              "function_category": "Default Node",
+              "plugin_version": { "major": 0, "minor": 0, "patch": 0 }
+            },
+            {
+              "id": "6a261add-ff1c-49ba-b9b7-a3bbad8e1fb3",
+              "name": "Directional DoF (1)",
+              "class_name": "nos.filters.DirectionalDof",
+              "pins": [
+                {
+                  "id": "b1b03fce-6863-42e6-a78a-260743b5441d",
+                  "name": "Input",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET",
+                    "filtering": "LINEAR"
+                  },
+                  "def": {
+                    "filtering": "LINEAR"
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "14aab6c6-10ce-4a39-9c6f-8c5633fe59e2",
+                  "name": "Depth",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED"
+                  },
+                  "def": {
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "d6a91b7a-b576-487b-bd2c-89fee90a37d1",
+                  "name": "FocusDistance",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 7.4,
+                  "min": 0.0,
+                  "max": 1000.0,
+                  "def": 5.0,
+                  "step": 10.0,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "55bffdc3-e0fa-4c0f-9ead-5a3b96c232bf",
+                  "name": "FocusRange",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 3.1,
+                  "min": 0.01,
+                  "max": 1000.0,
+                  "def": 2.0,
+                  "step": 9.9999,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "bdc5ae5a-10cc-4c3c-b013-573a64bd8ec6",
+                  "name": "MaxRadius",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 5.0,
+                  "min": 0.0,
+                  "max": 128.0,
+                  "def": 16.0,
+                  "step": 1.28,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "d77d3716-69f5-4c5d-a342-414dc11597fb",
+                  "name": "MinRadius",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 0.0,
+                  "min": 0.0,
+                  "max": 8.0,
+                  "def": 0.5,
+                  "step": 0.08,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "ad25df82-1942-4f9f-a062-c072261a2d92",
+                  "name": "BackgroundIsFar",
+                  "type_name": "float",
+                  "show_as": "PROPERTY",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 1.0,
+                  "min": 0.0,
+                  "max": 1.0,
+                  "def": 1.0,
+                  "step": 0.01,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "aaff92e1-63fe-4253-8edb-1f34a76019c9",
+                  "name": "Direction",
+                  "type_name": "nos.fb.vec2",
+                  "show_as": "PROPERTY",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": { "x": 0.0, "y": 1.0 },
+                  "min": { "x": -1.0, "y": -1.0 },
+                  "max": { "x": 1.0, "y": 1.0 },
+                  "def": { "x": 1.0, "y": 0.0 },
+                  "step": 0.02,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "ad6603e0-2b1d-4bf6-a1d1-af0fc05978a2",
+                  "name": "SampleCount",
+                  "type_name": "float",
+                  "show_as": "PROPERTY",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 12.0,
+                  "min": 1.0,
+                  "max": 64.0,
+                  "def": 12.0,
+                  "step": 0.63,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "0ef0f439-9766-4957-8931-a02ce1019bd1",
+                  "name": "Output",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "OUTPUT_PIN",
+                  "can_show_as": "OUTPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET"
+                  },
+                  "def": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET"
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                }
+              ],
+              "pos": { "x": 1129.0, "y": 1073.0 },
+              "contents_type": "Job",
+              "contents": { "type": "nos.sys.vulkan.GPUNode", "options": { "shader": "Shaders/DirectionalDof.frag" } },
+              "function_category": "Default Node",
+              "description": "1D depth-aware blur. CoC is computed per pixel from a linear view-space Z input. Chain two instances along (1,0) and (0,1) for a separable disc bokeh.",
+              "plugin_version": { "major": 1, "minor": 7, "patch": 0 }
+            },
+            {
+              "id": "deac982f-b51b-4ae0-b6c6-9b2998d3e5a9",
+              "name": "MaxRadius",
+              "class_name": "nos.internal.GraphInput",
+              "pins": [
+                {
+                  "id": "d5387b2e-f8c6-4b2e-8a42-a11eed779a1d",
+                  "name": "Output",
+                  "type_name": "float",
+                  "show_as": "OUTPUT_PIN",
+                  "can_show_as": "OUTPUT_PIN_ONLY",
+                  "visualizer": {
+                  },
+                  "data": 5.0,
+                  "min": 0.0,
+                  "max": 128.0,
+                  "def": 16.0,
+                  "step": 1.28,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "63f77504-73aa-4b89-8849-65e27649b272",
+                  "name": "Input",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 16.0,
+                  "referred_by": [
+                    "42554a0a-2d70-4ec4-a2ea-594ad71559f3"
+                  ],
+                  "min": 0.0,
+                  "max": 128.0,
+                  "def": 16.0,
+                  "step": 1.28,
+                  "meta_data_map": [
+                    { "key": "PinHidden", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                }
+              ],
+              "pos": { "x": 655.0, "y": 1250.0 },
+              "contents_type": "Job",
+              "contents": { "type": "" },
+              "function_category": "Default Node",
+              "plugin_version": { "major": 0, "minor": 0, "patch": 0 }
+            },
+            {
+              "id": "af576b2d-dde0-4d7b-86fc-37cb9f97b49e",
+              "name": "Directional DoF",
+              "class_name": "nos.filters.DirectionalDof",
+              "pins": [
+                {
+                  "id": "9e368dde-bb31-44d8-aaad-782e92fe2366",
+                  "name": "Input",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED",
+                    "filtering": "LINEAR"
+                  },
+                  "def": {
+                    "filtering": "LINEAR"
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "7e88a91a-1eca-4cc5-8dce-7c4aca61368d",
+                  "name": "Depth",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED"
+                  },
+                  "def": {
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "c1b814c4-e424-40a0-99d6-0437d948d1d7",
+                  "name": "FocusDistance",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 7.4,
+                  "min": 0.0,
+                  "max": 1000.0,
+                  "def": 5.0,
+                  "step": 10.0,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "78893474-3dfc-4a36-b897-77760ba19c8c",
+                  "name": "FocusRange",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 3.1,
+                  "min": 0.01,
+                  "max": 1000.0,
+                  "def": 2.0,
+                  "step": 9.9999,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "4f471215-bebf-49be-a6e4-909c394d1f1a",
+                  "name": "MaxRadius",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 5.0,
+                  "min": 0.0,
+                  "max": 128.0,
+                  "def": 16.0,
+                  "step": 1.28,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "05132381-cf95-4253-9fc2-e87f84b70dd8",
+                  "name": "MinRadius",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 0.0,
+                  "min": 0.0,
+                  "max": 8.0,
+                  "def": 0.5,
+                  "step": 0.08,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "2b52da00-b45d-41ae-a1ec-c88566879043",
+                  "name": "BackgroundIsFar",
+                  "type_name": "float",
+                  "show_as": "PROPERTY",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 1.0,
+                  "min": 0.0,
+                  "max": 1.0,
+                  "def": 1.0,
+                  "step": 0.01,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "ac684e31-1a90-462f-8b64-2b368a93b563",
+                  "name": "Direction",
+                  "type_name": "nos.fb.vec2",
+                  "show_as": "PROPERTY",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": { "x": 1.0, "y": 0.0 },
+                  "min": { "x": -1.0, "y": -1.0 },
+                  "max": { "x": 1.0, "y": 1.0 },
+                  "def": { "x": 1.0, "y": 0.0 },
+                  "step": 0.02,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "b8527f03-5c5c-4a41-b485-fa05e0f50cb1",
+                  "name": "SampleCount",
+                  "type_name": "float",
+                  "show_as": "PROPERTY",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 12.0,
+                  "min": 1.0,
+                  "max": 64.0,
+                  "def": 12.0,
+                  "step": 0.63,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "8f4d23a7-3b94-4a1c-ba14-d1ce47e92acd",
+                  "name": "Output",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "OUTPUT_PIN",
+                  "can_show_as": "OUTPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET"
+                  },
+                  "def": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED STORAGE RENDER_TARGET"
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                }
+              ],
+              "pos": { "x": 855.0, "y": 977.0 },
+              "contents_type": "Job",
+              "contents": { "type": "nos.sys.vulkan.GPUNode", "options": { "shader": "Shaders/DirectionalDof.frag" } },
+              "function_category": "Default Node",
+              "description": "1D depth-aware blur. CoC is computed per pixel from a linear view-space Z input. Chain two instances along (1,0) and (0,1) for a separable disc bokeh.",
+              "plugin_version": { "major": 1, "minor": 7, "patch": 0 }
+            },
+            {
+              "id": "8b497dab-5466-4d32-a440-125976e3a3ee",
+              "name": "Depth",
+              "class_name": "nos.internal.GraphInput",
+              "pins": [
+                {
+                  "id": "9587b7b1-8fc7-437b-9459-ee73f90de097",
+                  "name": "Output",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "OUTPUT_PIN",
+                  "can_show_as": "OUTPUT_PIN_ONLY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED"
+                  },
+                  "def": {
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "74a1bfd0-4f2d-447b-945c-8d0cb67a2120",
+                  "name": "Input",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED"
+                  },
+                  "referred_by": [
+                    "1950c2e6-a0f6-485b-8a02-bded8a2f6ed5"
+                  ],
+                  "def": {
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" },
+                    { "key": "PinHidden", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                }
+              ],
+              "pos": { "x": 655.0, "y": 1025.0 },
+              "contents_type": "Job",
+              "contents": { "type": "" },
+              "function_category": "Default Node",
+              "plugin_version": { "major": 0, "minor": 0, "patch": 0 }
+            },
+            {
+              "id": "9813ee9d-1f75-4554-9f9c-b9ecafc2e9fe",
+              "name": "FocusDistance",
+              "class_name": "nos.internal.GraphInput",
+              "pins": [
+                {
+                  "id": "7c60934b-ba19-4faf-9923-411511649cd0",
+                  "name": "Output",
+                  "type_name": "float",
+                  "show_as": "OUTPUT_PIN",
+                  "can_show_as": "OUTPUT_PIN_ONLY",
+                  "visualizer": {
+                  },
+                  "data": 7.4,
+                  "min": 0.0,
+                  "max": 1000.0,
+                  "def": 5.0,
+                  "step": 10.0,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "e709c7b4-9a59-4546-be53-0dc51abc5605",
+                  "name": "Input",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 5.0,
+                  "referred_by": [
+                    "e0b8f433-212f-48f6-ba4f-c8a194e1a707"
+                  ],
+                  "min": 0.0,
+                  "max": 1000.0,
+                  "def": 5.0,
+                  "step": 10.0,
+                  "meta_data_map": [
+                    { "key": "PinHidden", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                }
+              ],
+              "pos": { "x": 655.0, "y": 1100.0 },
+              "contents_type": "Job",
+              "contents": { "type": "" },
+              "function_category": "Default Node",
+              "plugin_version": { "major": 0, "minor": 0, "patch": 0 }
+            },
+            {
+              "id": "2c0861b9-e416-4741-b56d-8dfa81c49516",
+              "name": "FocusRange",
+              "class_name": "nos.internal.GraphInput",
+              "pins": [
+                {
+                  "id": "6a933bab-7bf6-4388-b990-abd1b9729e64",
+                  "name": "Output",
+                  "type_name": "float",
+                  "show_as": "OUTPUT_PIN",
+                  "can_show_as": "OUTPUT_PIN_ONLY",
+                  "visualizer": {
+                  },
+                  "data": 3.1,
+                  "min": 0.01,
+                  "max": 1000.0,
+                  "def": 2.0,
+                  "step": 9.9999,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "534a26e9-1ebd-4ed2-89fb-bdf5d34b6ec1",
+                  "name": "Input",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 2.0,
+                  "referred_by": [
+                    "68187c92-92f3-40d0-8b24-df6f33f9f649"
+                  ],
+                  "min": 0.01,
+                  "max": 1000.0,
+                  "def": 2.0,
+                  "step": 9.9999,
+                  "meta_data_map": [
+                    { "key": "PinHidden", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                }
+              ],
+              "pos": { "x": 655.0, "y": 1175.0 },
+              "contents_type": "Job",
+              "contents": { "type": "" },
+              "function_category": "Default Node",
+              "plugin_version": { "major": 0, "minor": 0, "patch": 0 }
+            },
+            {
+              "id": "3951aaae-16df-4b07-b1a9-b8b2a01b19c7",
+              "name": "MinRadius",
+              "class_name": "nos.internal.GraphInput",
+              "pins": [
+                {
+                  "id": "f0feee29-3782-49fe-a834-94e2b57916a8",
+                  "name": "Output",
+                  "type_name": "float",
+                  "show_as": "OUTPUT_PIN",
+                  "can_show_as": "OUTPUT_PIN_ONLY",
+                  "visualizer": {
+                  },
+                  "data": 0.0,
+                  "min": 0.0,
+                  "max": 8.0,
+                  "def": 0.5,
+                  "step": 0.08,
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "97561978-6da1-4a33-a6bc-c654008a8261",
+                  "name": "Input",
+                  "type_name": "float",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": 0.5,
+                  "referred_by": [
+                    "312c4450-a4ad-4690-ba3d-afcbc93da6eb"
+                  ],
+                  "min": 0.0,
+                  "max": 8.0,
+                  "def": 0.5,
+                  "step": 0.08,
+                  "meta_data_map": [
+                    { "key": "PinHidden", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                }
+              ],
+              "pos": { "x": 655.0, "y": 1325.0 },
+              "contents_type": "Job",
+              "contents": { "type": "" },
+              "function_category": "Default Node",
+              "plugin_version": { "major": 0, "minor": 0, "patch": 0 }
+            },
+            {
+              "id": "a1d16ddd-0144-4daa-97b2-e9b3b019c8c1",
+              "name": "Input",
+              "class_name": "nos.internal.GraphInput",
+              "pins": [
+                {
+                  "id": "c271ac23-2923-45c2-b262-b654455a93c3",
+                  "name": "Output",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "OUTPUT_PIN",
+                  "can_show_as": "OUTPUT_PIN_ONLY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED",
+                    "filtering": "LINEAR"
+                  },
+                  "def": {
+                    "filtering": "LINEAR"
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                },
+                {
+                  "id": "479248dc-200d-4a4d-87d2-f2c7c77f667f",
+                  "name": "Input",
+                  "type_name": "nos.sys.vulkan.Texture",
+                  "show_as": "INPUT_PIN",
+                  "can_show_as": "INPUT_PIN_OR_PROPERTY",
+                  "visualizer": {
+                  },
+                  "data": {
+                    "resolution": "HD",
+                    "width": 1920,
+                    "height": 1080,
+                    "format": "R16G16B16A16_SFLOAT",
+                    "usage": "TRANSFER_SRC TRANSFER_DST SAMPLED",
+                    "filtering": "LINEAR"
+                  },
+                  "referred_by": [
+                    "2be9d3ba-9386-43b0-ae1c-58168be2a289"
+                  ],
+                  "def": {
+                    "filtering": "LINEAR"
+                  },
+                  "advanced_property": true,
+                  "meta_data_map": [
+                    { "key": "AdvancedProperty", "value": "true" },
+                    { "key": "PinHidden", "value": "true" }
+                  ],
+                  "contents_type": "JobPin",
+                  "contents": { }
+                }
+              ],
+              "pos": { "x": 655.0, "y": 1400.0 },
+              "contents_type": "Job",
+              "contents": { "type": "" },
+              "function_category": "Default Node",
+              "plugin_version": { "major": 0, "minor": 0, "patch": 0 }
+            }
+          ], "connections": [
+            { "from": "8f4d23a7-3b94-4a1c-ba14-d1ce47e92acd", "to": "b1b03fce-6863-42e6-a78a-260743b5441d", "id": "83839676-0760-4699-ae80-c0a789e273d8" },
+            { "from": "f0feee29-3782-49fe-a834-94e2b57916a8", "to": "d77d3716-69f5-4c5d-a342-414dc11597fb", "id": "4c05135f-6001-4679-b39c-b248559ae56d" },
+            { "from": "9587b7b1-8fc7-437b-9459-ee73f90de097", "to": "14aab6c6-10ce-4a39-9c6f-8c5633fe59e2", "id": "231cdfe5-7ac7-4013-9d20-68d5af8509b7" },
+            { "from": "7c60934b-ba19-4faf-9923-411511649cd0", "to": "d6a91b7a-b576-487b-bd2c-89fee90a37d1", "id": "1cdaef73-876c-472a-97ff-04bf1f01348e" },
+            { "from": "c271ac23-2923-45c2-b262-b654455a93c3", "to": "9e368dde-bb31-44d8-aaad-782e92fe2366", "id": "231fc88c-a52e-48d0-a6ee-8c2fdfe3ef0d" },
+            { "from": "6a933bab-7bf6-4388-b990-abd1b9729e64", "to": "55bffdc3-e0fa-4c0f-9ead-5a3b96c232bf", "id": "7c1cae59-5834-420e-9d3d-e4767f6c3273" },
+            { "from": "d5387b2e-f8c6-4b2e-8a42-a11eed779a1d", "to": "bdc5ae5a-10cc-4c3c-b013-573a64bd8ec6", "id": "d74bdb3a-8c8c-4f82-8038-01a237e27a89" },
+            { "from": "0ef0f439-9766-4957-8931-a02ce1019bd1", "to": "2e4ec877-e014-49ae-ae1d-881a0e4d1ac5", "id": "353cc954-d098-417a-8331-357b879ba654" },
+            { "from": "9587b7b1-8fc7-437b-9459-ee73f90de097", "to": "7e88a91a-1eca-4cc5-8dce-7c4aca61368d", "id": "b126f4c4-d748-46f2-be51-ce1c778c0c4b" },
+            { "from": "7c60934b-ba19-4faf-9923-411511649cd0", "to": "c1b814c4-e424-40a0-99d6-0437d948d1d7", "id": "fc25a2f4-0af4-49ae-9052-133a76cfc044" },
+            { "from": "6a933bab-7bf6-4388-b990-abd1b9729e64", "to": "78893474-3dfc-4a36-b897-77760ba19c8c", "id": "f6ba18f8-0ef1-42db-a774-c4b02aa78fac" },
+            { "from": "d5387b2e-f8c6-4b2e-8a42-a11eed779a1d", "to": "4f471215-bebf-49be-a6e4-909c394d1f1a", "id": "afd9d7ff-f9e2-4a67-b874-2cfb2f870447" },
+            { "from": "f0feee29-3782-49fe-a834-94e2b57916a8", "to": "05132381-cf95-4253-9fc2-e87f84b70dd8", "id": "82919455-4a51-490a-8ab2-201952d2e126" }
+          ] },
+        "function_category": "Default Node",
+        "display_name": "Depth of Field",
+        "plugin_version": { "major": 0, "minor": 0, "patch": 0 }
+      }
+    }
+  ] }
diff --git a/Plugins/nosFilters/Config/DirectionalDof.nosdef b/Plugins/nosFilters/Config/DirectionalDof.nosdef
new file mode 100644
index 00000000..427e4385
--- /dev/null
+++ b/Plugins/nosFilters/Config/DirectionalDof.nosdef
@@ -0,0 +1,121 @@
+{
+	"nodes": [
+		{
+			"class_name": "DirectionalDof",
+			"menu_info": {
+				"category": "Filters",
+				"display_name": "Directional DoF"
+			},
+			"node": {
+				"class_name": "DirectionalDof",
+				"name": "Directional DoF",
+				"description": "1D depth-aware blur. CoC is computed per pixel from a linear view-space Z input. Chain two instances along (1,0) and (0,1) for a separable disc bokeh.",
+				"contents_type": "Job",
+				"contents": {
+					"type": "nos.sys.vulkan.GPUNode",
+					"options": {
+						"shader": "Shaders/DirectionalDof.frag"
+					}
+				},
+				"pins": [
+					{
+						"name": "Input",
+						"type_name": "nos.sys.vulkan.Texture",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": {
+							"filtering": "LINEAR"
+						}
+					},
+					{
+						"name": "Depth",
+						"type_name": "nos.sys.vulkan.Texture",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": {
+							"filtering": "NEAREST"
+						}
+					},
+					{
+						"name": "FocusDistance",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 5.0,
+						"min": 0.0,
+						"max": 1000.0
+					},
+					{
+						"name": "FocusRange",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 2.0,
+						"min": 0.01,
+						"max": 1000.0
+					},
+					{
+						"name": "MaxRadius",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 16.0,
+						"min": 0.0,
+						"max": 128.0
+					},
+					{
+						"name": "MinRadius",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0.5,
+						"min": 0.0,
+						"max": 8.0
+					},
+					{
+						"name": "BackgroundIsFar",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 1.0,
+						"min": 0.0,
+						"max": 1.0
+					},
+					{
+						"name": "Direction",
+						"type_name": "nos.fb.vec2",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": {
+							"x": 1.0,
+							"y": 0.0
+						},
+						"min": {
+							"x": -1.0,
+							"y": -1.0
+						},
+						"max": {
+							"x": 1.0,
+							"y": 1.0
+						}
+					},
+					{
+						"name": "SampleCount",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 12.0,
+						"min": 1.0,
+						"max": 64.0
+					},
+					{
+						"name": "Output",
+						"type_name": "nos.sys.vulkan.Texture",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_OR_PROPERTY"
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosFilters/Filters.noscfg b/Plugins/nosFilters/Filters.noscfg
index 072c6ce0..3660bb3f 100644
--- a/Plugins/nosFilters/Filters.noscfg
+++ b/Plugins/nosFilters/Filters.noscfg
@@ -2,7 +2,7 @@
     "info": {
         "id": {
             "name": "nos.filters",
-            "version": "1.7.0"
+            "version": "1.8.0"
         },
         "display_name": "Filters",
         "description": "Collection of image filters.",
@@ -27,6 +27,10 @@
         "Config/Diff.nosdef",
         "Config/GaussianBlur.nosdef",
         "Config/DirectionalBlur.nosdef",
+        "Config/DirectionalDof.nosdef",
+        "Config/DepthOfField.nosdef",
+        "Config/BokehDof.nosdef",
+        "Config/BokehShape.nosdef",
         "Config/KawaseLightStreak.nosdef",
         "Config/Kuwahara.nosdef",
         "Config/PremultiplyAlpha.nosdef",
diff --git a/Plugins/nosFilters/Shaders/BokehDof.frag b/Plugins/nosFilters/Shaders/BokehDof.frag
new file mode 100644
index 00000000..b365ddf2
--- /dev/null
+++ b/Plugins/nosFilters/Shaders/BokehDof.frag
@@ -0,0 +1,105 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+// Single-pass 2D bokeh depth-of-field with a kernel-texture shaping the bokeh.
+//
+// Computes a per-pixel circle of confusion (CoC) from a linear view-space Z
+// input, then gathers samples on a Vogel (golden-angle) disc within that CoC.
+// Each sample's contribution is weighted by BokehShape sampled at the same
+// unit-disc position, so the bokeh takes on the shape painted into BokehShape
+// (regular polygon, ring, custom artwork, etc.).
+
+#version 450
+
+#define MASK_THRESHOLD 0.001
+#define GOLDEN_ANGLE   2.39996322972865332
+
+layout(binding = 0) uniform sampler2D Input;
+layout(binding = 1) uniform sampler2D Depth;
+layout(binding = 2) uniform sampler2D BokehShape;
+layout(binding = 3) uniform BokehDofParams
+{
+    // Focus distance in the same units as the Depth input (linear view-space Z).
+    float FocusDistance;
+    // Distance from focus where CoC reaches MaxRadius (floored at 1e-4 in CocFromDepth).
+    float FocusRange;
+    // Maximum CoC radius in pixels; below MASK_THRESHOLD the shader passes Input through.
+    float MaxRadius;
+    // Skip the gather when CoC <= MinRadius (keeps focused regions crisp & cheap).
+    float MinRadius;
+    // Applies to depth <= 0 only: 0 = treat as focus plane (stays sharp); 1 = treat as far plane.
+    float BackgroundIsFar;
+    // Total Vogel-disc sample count, center tap included; truncated to an int, minimum 1.
+    float SampleCount;
+    // Rotate the kernel lookup (radians). Useful for animated highlights.
+    float KernelRotation;
+}
+Params;
+
+layout(location = 0) out vec4 rt;
+layout(location = 0) in vec2 uv;
+
+// Maps a linear depth Z to a circle-of-confusion radius in pixels, in [0, MaxRadius].
+float CocFromDepth(float Z)
+{
+    // Z <= 0 carries no depth: blend between the focus plane and a synthetic far plane.
+    float FarZ  = Params.FocusDistance + Params.FocusRange * 4.0;
+    float ViewZ = (Z <= 0.0) ? mix(Params.FocusDistance, FarZ, Params.BackgroundIsFar) : Z;
+    float Blur  = abs(ViewZ - Params.FocusDistance) / max(Params.FocusRange, 1e-4);
+    return clamp(Blur * Params.MaxRadius, 0.0, Params.MaxRadius);
+}
+
+// Fragment entry point: gathers a Vogel disc of taps scaled by the center CoC,
+// each weighted by the BokehShape kernel and a per-tap CoC test.
+void main()
+{
+    vec2 TexelSize = 1.0 / vec2(textureSize(Input, 0));
+
+    vec4  CenterColor = texture(Input, uv);
+    float CenterCoC   = CocFromDepth(texture(Depth, uv).r);
+
+    // In-focus pixel or blur disabled: pass the input through untouched.
+    if (CenterCoC <= Params.MinRadius || Params.MaxRadius < MASK_THRESHOLD)
+    {
+        rt = CenterColor;
+        return;
+    }
+
+    int   N    = int(max(1.0, Params.SampleCount));
+    float CosR = cos(Params.KernelRotation);
+    float SinR = sin(Params.KernelRotation);
+
+    // Vogel disc: golden-angle spiral with sqrt radius for uniform area density.
+    // Sample 0 is the center tap, weighted by the kernel's center texel.
+    // Explicit LOD 0 from here on: implicit derivatives are undefined after the
+    // divergent early return above and the `continue` inside the loop.
+    float Weight = textureLod(BokehShape, vec2(0.5), 0.0).r;
+    vec4  Accum  = CenterColor * Weight;
+
+    for (int i = 1; i < N; ++i)
+    {
+        float R    = sqrt(float(i) / float(N));           // unit-disc radius
+        float Th   = float(i) * GOLDEN_ANGLE;
+        vec2  Unit = vec2(cos(Th), sin(Th)) * R;          // unit disc position
+
+        // Rotated lookup into the bokeh kernel; skip taps the kernel masks out.
+        vec2 ShapeUv = vec2(Unit.x * CosR - Unit.y * SinR,
+                            Unit.x * SinR + Unit.y * CosR) * 0.5 + 0.5;
+        float WShape = textureLod(BokehShape, ShapeUv, 0.0).r;
+        if (WShape <= MASK_THRESHOLD)
+            continue;
+
+        vec2  Ofs    = Unit * CenterCoC * TexelSize;
+        vec4  Sample = textureLod(Input, uv + Ofs, 0.0);
+        float CocSmp = CocFromDepth(textureLod(Depth, uv + Ofs, 0.0).r);
+
+        // Per-sample CoC rejection prevents in-focus pixels bleeding outward.
+        // A sample contributes only if its own CoC is at least its distance from center.
+        float W = (R * CenterCoC <= CocSmp) ? WShape : 0.0;
+
+        Accum  += Sample * W;
+        Weight += W;
+    }
+
+    // If the kernel center is masked (e.g. a ring) and every tap was rejected,
+    // the sum carries no signal; keep the sharp center instead of writing black.
+    rt = Weight > MASK_THRESHOLD ? Accum / Weight : CenterColor;
+}
diff --git a/Plugins/nosFilters/Shaders/BokehShape.frag b/Plugins/nosFilters/Shaders/BokehShape.frag
new file mode 100644
index 00000000..cb963629
--- /dev/null
+++ b/Plugins/nosFilters/Shaders/BokehShape.frag
@@ -0,0 +1,77 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+// Procedural bokeh kernel generator.
+//
+// Produces a grayscale unit-disc mask shaped like a regular polygon aperture
+// (number of blades configurable) with optional roundness, rotation, soft edge
+// and brightened rim. Intended as input to a kernel-weighted DoF gather.
+//
+// Convention: image is treated as the [-1, 1] square; pixels outside the kernel shape
+// return 0; pixels inside return ~1 (up to 1 + RimBoost in the rim band), with a smooth edge
+// falloff over EdgeSoftness. The center stays at 1 as long as the falloff and rim band do not reach it.
+
+#version 450
+
+#define PI 3.14159265358979323846
+
+layout(location = 0) out vec4 rt;
+layout(location = 0) in vec2 uv;
+
+layout(binding = 1) uniform BokehShapeParams
+{
+    // Aperture blade count. Fewer than 3 = perfect circle (no polygon is formed).
+    float BladeCount;
+    // 0 = sharp polygon, 1 = perfect circle. Clamped to [0, 1]; blends the polygon edge toward the disc.
+    float Roundness;
+    // Rotation of the polygon (radians).
+    float Rotation;
+    // Soft falloff width at the edge, in [0, 1] of unit-disc radius (floored at 1e-4).
+    float EdgeSoftness;
+    // Extra brightness boost near the rim, [0, 1]. Mimics cat's-eye / specular bokeh.
+    float RimBoost;
+    // Width of the rim brightening band, in [0, 1] of radius (floored at 1e-4).
+    float RimWidth;
+}
+Params;
+
+// Fragment entry point: evaluates the aperture mask at this texel.
+void main()
+{
+    // Remap uv from [0,1] to the centered [-1,1] square; Dist is the radius there.
+    vec2  P    = uv * 2.0 - 1.0;
+    float Dist = length(P);
+
+    // Everything outside the unit disc is masked out.
+    if (Dist > 1.0)
+    {
+        rt = vec4(0.0);
+        return;
+    }
+
+    // Radius of the aperture edge along this texel's direction. Fewer than three
+    // blades cannot form a polygon, so the edge stays on the unit circle.
+    float EdgeDist = 1.0;
+    float Blades   = max(Params.BladeCount, 1.0);
+    if (Blades >= 3.0)
+    {
+        // Each blade spans Sector radians; Local is the angle from the nearest sector
+        // centerline, in [-HalfArc, +HalfArc]. Edge distance = cos(pi/N) / cos(Local).
+        float Sector  = 2.0 * PI / Blades;
+        float HalfArc = Sector * 0.5;
+        float Local   = mod(atan(P.y, P.x) - Params.Rotation + HalfArc, Sector) - HalfArc;
+        EdgeDist      = cos(HalfArc) / max(cos(Local), 1e-4);
+    }
+    // Roundness blends the polygon edge toward the circumscribed circle (radius 1).
+    EdgeDist = mix(EdgeDist, 1.0, clamp(Params.Roundness, 0.0, 1.0));
+
+    // Soft edge: 1 inside, 0 past the edge, smooth across EdgeSoftness.
+    float Feather  = max(Params.EdgeSoftness, 1e-4);
+    float Coverage = 1.0 - smoothstep(EdgeDist - Feather, EdgeDist, Dist);
+
+    // Rim brightening: a triangular band of width RimWidth just inside the edge.
+    float Band    = max(Params.RimWidth, 1e-4);
+    float BandPos = (Dist - (EdgeDist - Band)) / Band;     // 0 at inner edge of rim, 1 at outer
+    float Rim     = clamp(1.0 - abs(BandPos * 2.0 - 1.0), 0.0, 1.0);
+    Coverage     += Rim * Params.RimBoost * Coverage;
+
+    rt = vec4(vec3(Coverage), 1.0);
+}
diff --git a/Plugins/nosFilters/Shaders/DirectionalDof.frag b/Plugins/nosFilters/Shaders/DirectionalDof.frag
new file mode 100644
index 00000000..308cfcc7
--- /dev/null
+++ b/Plugins/nosFilters/Shaders/DirectionalDof.frag
@@ -0,0 +1,95 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+// Directional depth-of-field pass.
+// Computes circle-of-confusion (CoC) per pixel from a linear view-space Z input,
+// then does a 1D weighted gather along Direction. Chain two instances
+// (Direction = (1,0) and Direction = (0,1)) for a separable approximation of
+// disc bokeh; visually close to a gaussian bokeh and cheap.
+
+#version 450
+
+#define MASK_THRESHOLD 0.001
+
+layout(binding = 0) uniform sampler2D Input;
+layout(binding = 1) uniform sampler2D Depth;
+layout(binding = 2) uniform DirectionalDofParams
+{
+    // Focus distance in the same units as the Depth input (linear view-space Z).
+    float FocusDistance;
+    // Distance from focus where CoC reaches MaxRadius (floored at 1e-4 in CocFromDepth).
+    // Smaller value = sharper focus falloff; larger = gentler.
+    float FocusRange;
+    // Maximum CoC radius in pixels; below MASK_THRESHOLD the shader passes Input through.
+    float MaxRadius;
+    // Applies to depth <= 0 only: 0 = "no info, keep sharp"; 1 = treat zero depth as far.
+    float BackgroundIsFar;
+    vec2 Direction; // Blur axis; main() normalizes it, so only its direction matters.
+    // Pixels whose CoC is <= MinRadius are passed through unblurred; raise to skip tiny blurs.
+    float MinRadius;
+    // Sample count along the direction (one side; total taps = 2*N+1). Higher = smoother.
+    float SampleCount;
+}
+Params;
+
+layout(location = 0) out vec4 rt;
+layout(location = 0) in vec2 uv;
+
+// Converts a linear view-space depth into a circle-of-confusion radius in pixels.
+float CocFromDepth(float Z)
+{
+    // Z <= 0 means "no depth signal". BackgroundIsFar blends the substitute depth from
+    // the focus plane (0, stays sharp) to a synthetic far plane four FocusRanges behind
+    // it (1, fully blurred). Picking far avoids halos around empty regions.
+    float FarZ  = Params.FocusDistance + Params.FocusRange * 4.0;
+    float ViewZ = (Z <= 0.0) ? mix(Params.FocusDistance, FarZ, Params.BackgroundIsFar) : Z;
+    // CoC grows linearly with distance from the focus plane and saturates at MaxRadius.
+    float Blur = abs(ViewZ - Params.FocusDistance) / max(Params.FocusRange, 1e-4);
+    return clamp(Blur * Params.MaxRadius, 0.0, Params.MaxRadius);
+}
+
+// Fragment entry point: 1D depth-aware gather along Params.Direction.
+void main()
+{
+    vec2 TexelSize = 1.0 / vec2(textureSize(Input, 0));
+
+    vec4  CenterColor = texture(Input, uv);
+    float CenterCoC   = CocFromDepth(texture(Depth, uv).r);
+
+    // Pass through when the pixel is in focus, blur is disabled, or Direction is
+    // (near) zero: normalize() of a zero vector is undefined and would spread NaNs.
+    float DirLenSq = dot(Params.Direction, Params.Direction);
+    if (CenterCoC <= Params.MinRadius || Params.MaxRadius < MASK_THRESHOLD || DirLenSq < 1e-12)
+    {
+        rt = CenterColor;
+        return;
+    }
+
+    vec2  Dir   = Params.Direction * inversesqrt(DirLenSq);
+    int   N     = int(max(1.0, Params.SampleCount));
+    float Step  = CenterCoC / float(N); // tap spacing in pixels
+    const float Slack = 1e-3;           // pixels; absorbs rounding so taps on the CoC edge are kept
+
+    // Box-weighted average of up to 2*N+1 taps; for separable-2D this gives a soft disc.
+    vec4  Accum  = CenterColor;
+    float Weight = 1.0;
+
+    for (int i = 1; i <= N; ++i)
+    {
+        float T   = float(i) * Step; // distance of this tap pair from the center, in pixels
+        vec2  Ofs = Dir * T * TexelSize;
+
+        // Explicit LOD 0: implicit derivatives are undefined after the divergent return above.
+        // A tap contributes only if its own CoC reaches back to the center pixel (CoC >= T);
+        // this keeps in-focus fragments from bleeding outward.
+        vec4  SPos = textureLod(Input, uv + Ofs, 0.0);
+        float WPos = (T <= CocFromDepth(textureLod(Depth, uv + Ofs, 0.0).r) + Slack) ? 1.0 : 0.0;
+
+        vec4  SNeg = textureLod(Input, uv - Ofs, 0.0);
+        float WNeg = (T <= CocFromDepth(textureLod(Depth, uv - Ofs, 0.0).r) + Slack) ? 1.0 : 0.0;
+
+        Accum  += SPos * WPos + SNeg * WNeg;
+        Weight += WPos + WNeg;
+    }
+
+    // Weight >= 1.0 because the center tap is always included, so this cannot divide by zero.
+    rt = Accum / Weight;
+}
diff --git a/Plugins/nosGeometry/CMakeLists.txt b/Plugins/nosGeometry/CMakeLists.txt
new file mode 100644
index 00000000..82e8b4ed
--- /dev/null
+++ b/Plugins/nosGeometry/CMakeLists.txt
@@ -0,0 +1,33 @@
+# Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+# Vendored OpenFBX, used to read object transforms out of .fbx files. Built under a
+# plugin-unique target name so it never clashes with the "openFBX" target the zd plugins
+# create from their own copy; the TARGET guard skips re-definition if it already exists.
+if (NOT TARGET nosGeometry_openFBX)
+    add_library(nosGeometry_openFBX STATIC
+        External/openFBX/libdeflate.c
+        External/openFBX/ofbx.cpp)
+    target_include_directories(nosGeometry_openFBX PUBLIC "${CMAKE_CURRENT_SOURCE_DIR}/External/openFBX")
+    nos_group_targets("nosGeometry_openFBX" "External")
+endif()
+
+# nos.sys.track provides the CoordinateFrame type and the shared CoordinateFrameConv.h helpers used to
+# express FBX transforms in a frame convention that composes with nosTrack's Convert/Track Transform nodes.
+set(MODULE_DEPENDENCIES "nos.sys.track-1.1")
+set(dep_idx 0)
+foreach(module_name_version ${MODULE_DEPENDENCIES})
+    string(REPLACE "-" ";" module_name_version ${module_name_version})
+    list(GET module_name_version 0 module_name)
+    list(GET module_name_version 1 module_version)
+    nos_get_module("${module_name}" "${module_version}" DEP_${dep_idx})
+    list(APPEND MODULE_DEPENDENCIES_TARGETS ${DEP_${dep_idx}})
+    math(EXPR dep_idx "${dep_idx} + 1") # give each dependency its own DEP_<n> result variable
+endforeach()
+
+set(DEPENDENCIES ${NOS_PLUGIN_SDK_TARGET} nosGeometry_openFBX ${MODULE_DEPENDENCIES_TARGETS})
+set(INCLUDE_FOLDERS "")
+
+nos_add_plugin("nosGeometry" "${DEPENDENCIES}" "${INCLUDE_FOLDERS}")
+
+# Helpers need C++20; REQUIRED makes CMake fail instead of silently falling back to an older standard.
+set_target_properties("nosGeometry" PROPERTIES CXX_STANDARD 20 CXX_STANDARD_REQUIRED ON)
diff --git a/Plugins/nosGeometry/Config/ReadFBXTransform.nosdef b/Plugins/nosGeometry/Config/ReadFBXTransform.nosdef
new file mode 100644
index 00000000..8950b04b
--- /dev/null
+++ b/Plugins/nosGeometry/Config/ReadFBXTransform.nosdef
@@ -0,0 +1,78 @@
+{
+	"nodes": [
+		{
+			"class_name": "ReadFBXTransform",
+			"menu_info": {
+				"category": "Geometry",
+				"display_name": "Read FBX Transform",
+				"name_aliases": [ "FBX", "Load FBX", "FBX Transform", "FBX Reader" ]
+			},
+			"node": {
+				"class_name": "ReadFBXTransform",
+				"contents_type": "Job",
+				"description": "Reads an .fbx file and outputs the local and global transform of a\nselected object inside it. Pick the object from the 'Object' dropdown,\nwhich is populated with the names found in the file.",
+				"pins": [
+					{
+						"name": "Path",
+						"type_name": "string",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"visualizer": {
+							"type": "FILE_PICKER",
+							"file_extensions": [ "fbx" ],
+							"file_picker_type": "OPEN"
+						},
+						"description": "Path to the .fbx file to read."
+					},
+					{
+						"name": "Object",
+						"type_name": "string",
+						"show_as": "PROPERTY",
+						"can_show_as": "PROPERTY_ONLY",
+						"data": "",
+						"visualizer": {
+							"type": "COMBO_BOX",
+							"name": ""
+						},
+						"description": "Object inside the .fbx whose transform is reported.\nThe list is populated once the file is loaded."
+					},
+					{
+						"name": "SourceFrame",
+						"display_name": "Source Frame",
+						"type_name": "nos.sys.track.CoordinateFrame",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "RH_YUp_FwdNegZ_RightX",
+						"description": "Coordinate frame the .fbx is authored in. The output transforms are expressed in this frame; set Convert Transform's 'SourceFrame' to the same value."
+					},
+					{
+						"name": "LocalTransform",
+						"display_name": "Local Transform",
+						"type_name": "nos.fb.Transform",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"description": "Transform of the object relative to its parent."
+					},
+					{
+						"name": "GlobalTransform",
+						"display_name": "Global Transform",
+						"type_name": "nos.fb.Transform",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"description": "World transform of the object, accounting for its parent hierarchy."
+					},
+					{
+						"name": "IsLoaded",
+						"display_name": "Is Loaded",
+						"type_name": "bool",
+						"show_as": "PROPERTY",
+						"can_show_as": "OUTPUT_PIN_OR_PROPERTY",
+						"data": false,
+						"readonly": true,
+						"description": "True if a valid 'Path' was selected and the file could be loaded."
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosGeometry/External/openFBX/libdeflate.c b/Plugins/nosGeometry/External/openFBX/libdeflate.c
new file mode 100644
index 00000000..e421d791
--- /dev/null
+++ b/Plugins/nosGeometry/External/openFBX/libdeflate.c
@@ -0,0 +1,4193 @@
+// ofbx changes : removed unused code, single .h and .c
+/*
+ * Copyright 2016 Eric Biggers
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ *
+ * ---------------------------------------------------------------------------
+ *
+ * This is a highly optimized DEFLATE decompressor.  It is much faster than
+ * vanilla zlib, typically well over twice as fast, though results vary by CPU.
+ *
+ * Why this is faster than vanilla zlib:
+ *
+ * - Word accesses rather than byte accesses when reading input
+ * - Word accesses rather than byte accesses when copying matches
+ * - Faster Huffman decoding combined with various DEFLATE-specific tricks
+ * - Larger bitbuffer variable that doesn't need to be refilled as often
+ * - Other optimizations to remove unnecessary branches
+ * - Only full-buffer decompression is supported, so the code doesn't need to
+ *   support stopping and resuming decompression.
+ * - On x86_64, a version of the decompression routine is compiled with BMI2
+ *   instructions enabled and is used automatically at runtime when supported.
+ */
+
+/*
+ * lib_common.h - internal header included by all library code
+ */
+
+#ifndef LIB_LIB_COMMON_H
+#define LIB_LIB_COMMON_H
+
+#ifdef LIBDEFLATE_H
+ /*
+  * When building the library, LIBDEFLATEAPI needs to be defined properly before
+  * including libdeflate.h.
+  */
+#  error "lib_common.h must always be included before libdeflate.h"
+#endif
+
+#if defined(LIBDEFLATE_DLL) && (defined(_WIN32) || defined(__CYGWIN__))
+#  define LIBDEFLATE_EXPORT_SYM  __declspec(dllexport)
+#elif defined(__GNUC__)
+#  define LIBDEFLATE_EXPORT_SYM  __attribute__((visibility("default")))
+#else
+#  define LIBDEFLATE_EXPORT_SYM
+#endif
+
+/*
+ * On i386, gcc assumes that the stack is 16-byte aligned at function entry.
+ * However, some compilers (e.g. MSVC) and programming languages (e.g. Delphi)
+ * only guarantee 4-byte alignment when calling functions.  This is mainly an
+ * issue on Windows, but it has been seen on Linux too.  Work around this ABI
+ * incompatibility by realigning the stack pointer when entering libdeflate.
+ * This prevents crashes in SSE/AVX code.
+ */
+#if defined(__GNUC__) && defined(__i386__)
+#  define LIBDEFLATE_ALIGN_STACK  __attribute__((force_align_arg_pointer))
+#else
+#  define LIBDEFLATE_ALIGN_STACK
+#endif
+
+#define LIBDEFLATEAPI	LIBDEFLATE_EXPORT_SYM LIBDEFLATE_ALIGN_STACK
+
+/*
+ * common_defs.h
+ *
+ * Copyright 2016 Eric Biggers
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+#ifndef COMMON_DEFS_H
+#define COMMON_DEFS_H
+
+#include "libdeflate.h"
+
+#include <stdbool.h>
+#include <stddef.h>	/* for size_t */
+#include <stdint.h>
+#ifdef _MSC_VER
+#  include <intrin.h>	/* for _BitScan*() and other intrinsics */
+#  include <stdlib.h>	/* for _byteswap_*() */
+   /* Disable MSVC warnings that are expected. */
+   /* /W2 */
+#  pragma warning(disable : 4146) /* unary minus on unsigned type */
+   /* /W3 */
+#  pragma warning(disable : 4018) /* signed/unsigned mismatch */
+#  pragma warning(disable : 4244) /* possible loss of data */
+#  pragma warning(disable : 4267) /* possible loss of precision */
+#  pragma warning(disable : 4310) /* cast truncates constant value */
+   /* /W4 */
+#  pragma warning(disable : 4100) /* unreferenced formal parameter */
+#  pragma warning(disable : 4127) /* conditional expression is constant */
+#  pragma warning(disable : 4189) /* local variable initialized but not referenced */
+#  pragma warning(disable : 4232) /* nonstandard extension used */
+#  pragma warning(disable : 4245) /* conversion from 'int' to 'unsigned int' */
+#  pragma warning(disable : 4295) /* array too small to include terminating null */
+#endif
+#ifndef FREESTANDING
+#  include <string.h>	/* for memcpy() */
+#endif
+
+/* ========================================================================== */
+/*                             Target architecture                            */
+/* ========================================================================== */
+
+/* If possible, define a compiler-independent ARCH_* macro. */
+#undef ARCH_X86_64
+#undef ARCH_X86_32
+#undef ARCH_ARM64
+#undef ARCH_ARM32
+#ifdef _MSC_VER
+#  if defined(_M_X64)
+#    define ARCH_X86_64
+#  elif defined(_M_IX86)
+#    define ARCH_X86_32
+#  elif defined(_M_ARM64)
+#    define ARCH_ARM64
+#  elif defined(_M_ARM)
+#    define ARCH_ARM32
+#  endif
+#else
+#  if defined(__x86_64__)
+#    define ARCH_X86_64
+#  elif defined(__i386__)
+#    define ARCH_X86_32
+#  elif defined(__aarch64__)
+#    define ARCH_ARM64
+#  elif defined(__arm__)
+#    define ARCH_ARM32
+#  endif
+#endif
+
+/* ========================================================================== */
+/*                              Type definitions                              */
+/* ========================================================================== */
+
+/* Fixed-width integer types */
+typedef uint8_t u8;
+typedef uint16_t u16;
+typedef uint32_t u32;
+typedef uint64_t u64;
+typedef int8_t s8;
+typedef int16_t s16;
+typedef int32_t s32;
+typedef int64_t s64;
+
+/* ssize_t, if not available in <sys/types.h> */
+#ifdef _MSC_VER
+#  ifdef _WIN64
+     typedef long long ssize_t;
+#  else
+     typedef long ssize_t;
+#  endif
+#endif
+
+/*
+ * Word type of the target architecture.  Use 'size_t' instead of
+ * 'unsigned long' to account for platforms such as Windows that use 32-bit
+ * 'unsigned long' on 64-bit architectures.
+ */
+typedef size_t machine_word_t;
+
+/* Number of bytes in a word */
+#define WORDBYTES	((int)sizeof(machine_word_t))
+
+/* Number of bits in a word */
+#define WORDBITS	(8 * WORDBYTES)
+
+/* ========================================================================== */
+/*                         Optional compiler features                         */
+/* ========================================================================== */
+
+/* Compiler version checks.  Only use when absolutely necessary. */
+#if defined(__GNUC__) && !defined(__clang__) && !defined(__INTEL_COMPILER)
+#  define GCC_PREREQ(major, minor)		\
+	(__GNUC__ > (major) ||			\
+	 (__GNUC__ == (major) && __GNUC_MINOR__ >= (minor)))
+#else
+#  define GCC_PREREQ(major, minor)	0
+#endif
+#ifdef __clang__
+#  ifdef __apple_build_version__
+#    define CLANG_PREREQ(major, minor, apple_version)	\
+	(__apple_build_version__ >= (apple_version))
+#  else
+#    define CLANG_PREREQ(major, minor, apple_version)	\
+	(__clang_major__ > (major) ||			\
+	 (__clang_major__ == (major) && __clang_minor__ >= (minor)))
+#  endif
+#else
+#  define CLANG_PREREQ(major, minor, apple_version)	0
+#endif
+
+/*
+ * Macros to check for compiler support for attributes and builtins.  clang
+ * implements these macros, but gcc doesn't, so generally any use of one of
+ * these macros must also be combined with a gcc version check.
+ */
+#ifndef __has_attribute
+#  define __has_attribute(attribute)	0
+#endif
+#ifndef __has_builtin
+#  define __has_builtin(builtin)	0
+#endif
+
+/* inline - suggest that a function be inlined */
+#ifdef _MSC_VER
+#  define inline		__inline
+#endif /* else assume 'inline' is usable as-is */
+
+/* forceinline - force a function to be inlined, if possible */
+#if defined(__GNUC__) || __has_attribute(always_inline)
+#  define forceinline		inline __attribute__((always_inline))
+#elif defined(_MSC_VER)
+#  define forceinline		__forceinline
+#else
+#  define forceinline		inline
+#endif
+
+/* MAYBE_UNUSED - mark a function or variable as maybe unused */
+#if defined(__GNUC__) || __has_attribute(unused)
+#  define MAYBE_UNUSED		__attribute__((unused))
+#else
+#  define MAYBE_UNUSED
+#endif
+
+/*
+ * restrict - hint that writes only occur through the given pointer.
+ *
+ * Don't use MSVC's __restrict, since it has nonstandard behavior.
+ * Standard restrict is okay, if it is supported.
+ */
+#if !defined(__STDC_VERSION__) || (__STDC_VERSION__ < 201112L)
+#  if defined(__GNUC__) || defined(__clang__)
+#    define restrict		__restrict__
+#  else
+#    define restrict
+#  endif
+#endif /* else assume 'restrict' is usable as-is */
+
+/* likely(expr) - hint that an expression is usually true */
+#if defined(__GNUC__) || __has_builtin(__builtin_expect)
+#  define likely(expr)		__builtin_expect(!!(expr), 1)
+#else
+#  define likely(expr)		(expr)
+#endif
+
+/* unlikely(expr) - hint that an expression is usually false */
+#if defined(__GNUC__) || __has_builtin(__builtin_expect)
+#  define unlikely(expr)	__builtin_expect(!!(expr), 0)
+#else
+#  define unlikely(expr)	(expr)
+#endif
+
+/* prefetchr(addr) - prefetch into L1 cache for read */
+#undef prefetchr
+#if defined(__GNUC__) || __has_builtin(__builtin_prefetch)
+#  define prefetchr(addr)	__builtin_prefetch((addr), 0)
+#elif defined(_MSC_VER)
+#  if defined(ARCH_X86_32) || defined(ARCH_X86_64)
+#    define prefetchr(addr)	_mm_prefetch((addr), _MM_HINT_T0)
+#  elif defined(ARCH_ARM64)
+#    define prefetchr(addr)	__prefetch2((addr), 0x00 /* prfop=PLDL1KEEP */)
+#  elif defined(ARCH_ARM32)
+#    define prefetchr(addr)	__prefetch(addr)
+#  endif
+#endif
+#ifndef prefetchr
+#  define prefetchr(addr)
+#endif
+
+/* prefetchw(addr) - prefetch into L1 cache for write */
+#undef prefetchw
+#if defined(__GNUC__) || __has_builtin(__builtin_prefetch)
+#  define prefetchw(addr)	__builtin_prefetch((addr), 1)
+#elif defined(_MSC_VER)
+#  if defined(ARCH_X86_32) || defined(ARCH_X86_64)
+#    define prefetchw(addr)	_m_prefetchw(addr)
+#  elif defined(ARCH_ARM64)
+#    define prefetchw(addr)	__prefetch2((addr), 0x10 /* prfop=PSTL1KEEP */)
+#  elif defined(ARCH_ARM32)
+#    define prefetchw(addr)	__prefetchw(addr)
+#  endif
+#endif
+#ifndef prefetchw
+#  define prefetchw(addr)
+#endif
+
+/*
+ * _aligned_attribute(n) - declare that the annotated variable, or variables of
+ * the annotated type, must be aligned on n-byte boundaries.
+ */
+#undef _aligned_attribute
+#if defined(__GNUC__) || __has_attribute(aligned)
+#  define _aligned_attribute(n)	__attribute__((aligned(n)))
+#elif defined(_MSC_VER)
+#  define _aligned_attribute(n)	__declspec(align(n))
+#endif
+
+/*
+ * _target_attribute(attrs) - override the compilation target for a function.
+ *
+ * This accepts one or more comma-separated suffixes to the -m prefix jointly
+ * forming the name of a machine-dependent option.  On gcc-like compilers, this
+ * enables codegen for the given targets, including arbitrary compiler-generated
+ * code as well as the corresponding intrinsics.  On other compilers this macro
+ * expands to nothing, though MSVC allows intrinsics to be used anywhere anyway.
+ */
+#if GCC_PREREQ(4, 4) || __has_attribute(target)
+#  define _target_attribute(attrs)	__attribute__((target(attrs)))
+#  define COMPILER_SUPPORTS_TARGET_FUNCTION_ATTRIBUTE	1
+#else
+#  define _target_attribute(attrs)
+#  define COMPILER_SUPPORTS_TARGET_FUNCTION_ATTRIBUTE	0
+#endif
+
+/* ========================================================================== */
+/*                          Miscellaneous macros                              */
+/* ========================================================================== */
+
+#define ARRAY_LEN(A)		(sizeof(A) / sizeof((A)[0]))
+#define MIN(a, b)		((a) <= (b) ? (a) : (b))
+#define MAX(a, b)		((a) >= (b) ? (a) : (b))
+#define DIV_ROUND_UP(n, d)	(((n) + (d) - 1) / (d))
+#define STATIC_ASSERT(expr)	((void)sizeof(char[1 - 2 * !(expr)]))
+#define ALIGN(n, a)		(((n) + (a) - 1) & ~((a) - 1))
+#define ROUND_UP(n, d)		((d) * DIV_ROUND_UP((n), (d)))
+
+/* ========================================================================== */
+/*                           Endianness handling                              */
+/* ========================================================================== */
+
+/*
+ * CPU_IS_LITTLE_ENDIAN() - 1 if the CPU is little endian, or 0 if it is big
+ * endian.  When possible this is a compile-time macro that can be used in
+ * preprocessor conditionals.  As a fallback, a generic method is used that
+ * can't be used in preprocessor conditionals but should still be optimized out.
+ */
+#if defined(__BYTE_ORDER__) /* gcc v4.6+ and clang */
+#  define CPU_IS_LITTLE_ENDIAN()  (__BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__)
+#elif defined(_MSC_VER)
+#  define CPU_IS_LITTLE_ENDIAN()  true
+#else
+/* Runtime fallback: store 1 in a u32 and report whether the overlapping u8 sees it. */
+static forceinline bool CPU_IS_LITTLE_ENDIAN(void)
+{
+	union {
+		u32 word;
+		u8 first_byte;
+	} probe;
+	probe.word = 1;
+	return probe.first_byte != 0;
+}
+#endif
+
+/* bswap16(v) - return v with its two bytes exchanged */
+static forceinline u16 bswap16(u16 v)
+{
+#if GCC_PREREQ(4, 8) || __has_builtin(__builtin_bswap16)
+	return __builtin_bswap16(v);
+#elif defined(_MSC_VER)
+	return _byteswap_ushort(v);
+#else	/* portable fallback: swap the halves with two shifts */
+	return (u16)((v >> 8) | (v << 8));
+#endif
+}
+
+/* bswap32(v) - return v with its four bytes in reverse order */
+static forceinline u32 bswap32(u32 v)
+{
+#if GCC_PREREQ(4, 3) || __has_builtin(__builtin_bswap32)
+	return __builtin_bswap32(v);
+#elif defined(_MSC_VER)
+	return _byteswap_ulong(v);
+#else	/* portable fallback: shift each byte into place, then mask it */
+	return (v << 24) |
+	       ((v << 8) & 0x00FF0000) |
+	       ((v >> 8) & 0x0000FF00) |
+	       (v >> 24);
+#endif
+}
+
+/* bswap64(v) - return v with its eight bytes in reverse order */
+static forceinline u64 bswap64(u64 v)
+{
+#if GCC_PREREQ(4, 3) || __has_builtin(__builtin_bswap64)
+	return __builtin_bswap64(v);
+#elif defined(_MSC_VER)
+	return _byteswap_uint64(v);
+#else	/* portable fallback: shift each byte into place, then mask it */
+	return (v << 56) |
+	       ((v << 40) & 0x00FF000000000000) |
+	       ((v << 24) & 0x0000FF0000000000) |
+	       ((v << 8) & 0x000000FF00000000) |
+	       ((v >> 8) & 0x00000000FF000000) |
+	       ((v >> 24) & 0x0000000000FF0000) |
+	       ((v >> 40) & 0x000000000000FF00) |
+	       (v >> 56);
+#endif
+}
+
+#define le16_bswap(v) (CPU_IS_LITTLE_ENDIAN() ? (v) : bswap16(v))
+#define le32_bswap(v) (CPU_IS_LITTLE_ENDIAN() ? (v) : bswap32(v))
+#define le64_bswap(v) (CPU_IS_LITTLE_ENDIAN() ? (v) : bswap64(v))
+#define be16_bswap(v) (CPU_IS_LITTLE_ENDIAN() ? bswap16(v) : (v))
+#define be32_bswap(v) (CPU_IS_LITTLE_ENDIAN() ? bswap32(v) : (v))
+#define be64_bswap(v) (CPU_IS_LITTLE_ENDIAN() ? bswap64(v) : (v))
+
+/* ========================================================================== */
+/*                          Unaligned memory accesses                         */
+/* ========================================================================== */
+
+/*
+ * UNALIGNED_ACCESS_IS_FAST() - 1 if unaligned memory accesses can be performed
+ * efficiently on the target platform, otherwise 0.
+ */
+#if (defined(__GNUC__) || defined(__clang__)) && \
+	(defined(ARCH_X86_64) || defined(ARCH_X86_32) || \
+	 defined(__ARM_FEATURE_UNALIGNED) || defined(__powerpc64__) || \
+	 /*
+	  * For all compilation purposes, WebAssembly behaves like any other CPU
+	  * instruction set. Even though WebAssembly engine might be running on
+	  * top of different actual CPU architectures, the WebAssembly spec
+	  * itself permits unaligned access and it will be fast on most of those
+	  * platforms, and simulated at the engine level on others, so it's
+	  * worth treating it as a CPU architecture with fast unaligned access.
+	  */ defined(__wasm__))
+#  define UNALIGNED_ACCESS_IS_FAST	1
+#elif defined(_MSC_VER)
+#  define UNALIGNED_ACCESS_IS_FAST	1
+#else
+#  define UNALIGNED_ACCESS_IS_FAST	0
+#endif
+
+/*
+ * Implementing unaligned memory accesses using memcpy() is portable, and it
+ * usually gets optimized appropriately by modern compilers.  I.e., each
+ * memcpy() of 1, 2, 4, or WORDBYTES bytes gets compiled to a load or store
+ * instruction, not to an actual function call.
+ *
+ * We no longer use the "packed struct" approach to unaligned accesses, as that
+ * is nonstandard, has unclear semantics, and doesn't receive enough testing
+ * (see https://gcc.gnu.org/bugzilla/show_bug.cgi?id=94994).
+ *
+ * arm32 with __ARM_FEATURE_UNALIGNED in gcc 5 and earlier is a known exception
+ * where memcpy() generates inefficient code
+ * (https://gcc.gnu.org/bugzilla/show_bug.cgi?id=67366).  However, we no longer
+ * consider that one case important enough to maintain different code for.
+ * If you run into it, please just use a newer version of gcc (or use clang).
+ */
+
+#ifdef FREESTANDING
+#  define MEMCOPY	__builtin_memcpy
+#else
+#  define MEMCOPY	memcpy
+#endif
+
+/* Unaligned loads and stores without endianness conversion.  For a type T the
+ * macro emits load_T_unaligned(src) and store_T_unaligned(value, dst). */
+#define DEFINE_UNALIGNED_TYPE(type)				\
+static forceinline type						\
+load_##type##_unaligned(const void *src)			\
+{								\
+	type value;						\
+								\
+	MEMCOPY(&value, src, sizeof(type));			\
+	return value;						\
+}								\
+								\
+static forceinline void						\
+store_##type##_unaligned(type value, void *dst)			\
+{								\
+	MEMCOPY(dst, &value, sizeof(type));			\
+}
+
+DEFINE_UNALIGNED_TYPE(u16)
+DEFINE_UNALIGNED_TYPE(u32)
+DEFINE_UNALIGNED_TYPE(u64)
+DEFINE_UNALIGNED_TYPE(machine_word_t)
+
+#undef MEMCOPY
+
+#define load_word_unaligned	load_machine_word_t_unaligned
+#define store_word_unaligned	store_machine_word_t_unaligned
+
+/* Unaligned loads with endianness conversion */
+
+/* Read a little-endian u16 from p; p need not be aligned. */
+static forceinline u16 get_unaligned_le16(const u8 *p)
+{
+	if (!UNALIGNED_ACCESS_IS_FAST)	/* assemble from single bytes */
+		return (u16)(p[0] | ((u16)p[1] << 8));
+
+	return le16_bswap(load_u16_unaligned(p));
+}
+
+/* Read a big-endian u16 from p; p need not be aligned. */
+static forceinline u16 get_unaligned_be16(const u8 *p)
+{
+	if (!UNALIGNED_ACCESS_IS_FAST)	/* assemble from single bytes */
+		return (u16)(p[1] | ((u16)p[0] << 8));
+
+	return be16_bswap(load_u16_unaligned(p));
+}
+
+/* Read a little-endian u32 from p; p need not be aligned. */
+static forceinline u32 get_unaligned_le32(const u8 *p)
+{
+	if (!UNALIGNED_ACCESS_IS_FAST)	/* assemble from single bytes, lowest first */
+		return (u32)p[0] | ((u32)p[1] << 8) |
+		       ((u32)p[2] << 16) | ((u32)p[3] << 24);
+
+	return le32_bswap(load_u32_unaligned(p));
+}
+
+/* Read a big-endian u32 from p; p need not be aligned. */
+static forceinline u32 get_unaligned_be32(const u8 *p)
+{
+	if (!UNALIGNED_ACCESS_IS_FAST)	/* assemble from single bytes, lowest first */
+		return (u32)p[3] | ((u32)p[2] << 8) |
+		       ((u32)p[1] << 16) | ((u32)p[0] << 24);
+
+	return be32_bswap(load_u32_unaligned(p));
+}
+
+/* Read a little-endian u64 from p; p need not be aligned. */
+static forceinline u64 get_unaligned_le64(const u8 *p)
+{
+	if (!UNALIGNED_ACCESS_IS_FAST)	/* assemble from single bytes, lowest first */
+		return (u64)p[0] | ((u64)p[1] << 8) |
+		       ((u64)p[2] << 16) | ((u64)p[3] << 24) |
+		       ((u64)p[4] << 32) | ((u64)p[5] << 40) |
+		       ((u64)p[6] << 48) | ((u64)p[7] << 56);
+
+	return le64_bswap(load_u64_unaligned(p));
+}
+
+/* Read one little-endian machine word (32 or 64 bits wide) from p. */
+static forceinline machine_word_t get_unaligned_leword(const u8 *p)
+{
+	STATIC_ASSERT(WORDBITS == 32 || WORDBITS == 64);
+
+	if (WORDBITS != 32)
+		return get_unaligned_le64(p);
+	return get_unaligned_le32(p);
+}
+
+/* Unaligned stores with endianness conversion */
+
+/* Write v to p as a little-endian u16; p need not be aligned. */
+static forceinline void put_unaligned_le16(u16 v, u8 *p)
+{
+	if (UNALIGNED_ACCESS_IS_FAST) {
+		store_u16_unaligned(le16_bswap(v), p);
+		return;
+	}
+	p[0] = (u8)v;		/* least significant byte first */
+	p[1] = (u8)(v >> 8);
+}
+
+/* Write v to p as a big-endian u16; p need not be aligned. */
+static forceinline void put_unaligned_be16(u16 v, u8 *p)
+{
+	if (UNALIGNED_ACCESS_IS_FAST) {
+		store_u16_unaligned(be16_bswap(v), p);
+		return;
+	}
+	p[0] = (u8)(v >> 8);	/* most significant byte first */
+	p[1] = (u8)v;
+}
+
+/* Write v to p as a little-endian u32; p need not be aligned. */
+static forceinline void put_unaligned_le32(u32 v, u8 *p)
+{
+	if (UNALIGNED_ACCESS_IS_FAST) {
+		store_u32_unaligned(le32_bswap(v), p);
+		return;
+	}
+	p[0] = (u8)v;		/* least significant byte first */
+	p[1] = (u8)(v >> 8);
+	p[2] = (u8)(v >> 16);
+	p[3] = (u8)(v >> 24);
+}
+
+/* Write v to p as a big-endian u32; p need not be aligned. */
+static forceinline void put_unaligned_be32(u32 v, u8 *p)
+{
+	if (UNALIGNED_ACCESS_IS_FAST) {
+		store_u32_unaligned(be32_bswap(v), p);
+		return;
+	}
+	p[0] = (u8)(v >> 24);	/* most significant byte first */
+	p[1] = (u8)(v >> 16);
+	p[2] = (u8)(v >> 8);
+	p[3] = (u8)v;
+}
+
+/* Write v to p as a little-endian u64; p need not be aligned. */
+static forceinline void put_unaligned_le64(u64 v, u8 *p)
+{
+	if (UNALIGNED_ACCESS_IS_FAST) {
+		store_u64_unaligned(le64_bswap(v), p);
+		return;
+	}
+	p[0] = (u8)v;		/* least significant byte first */
+	p[1] = (u8)(v >> 8);
+	p[2] = (u8)(v >> 16);
+	p[3] = (u8)(v >> 24);
+	p[4] = (u8)(v >> 32);
+	p[5] = (u8)(v >> 40);
+	p[6] = (u8)(v >> 48);
+	p[7] = (u8)(v >> 56);
+}
+
+/* Write v to p as one little-endian machine word (32 or 64 bits wide). */
+static forceinline void put_unaligned_leword(machine_word_t v, u8 *p)
+{
+	STATIC_ASSERT(WORDBITS == 32 || WORDBITS == 64);
+	if (WORDBITS != 32)
+		put_unaligned_le64(v, p);
+	else
+		put_unaligned_le32(v, p);
+}
+
+/* ========================================================================== */
+/*                         Bit manipulation functions                         */
+/* ========================================================================== */
+
+/*
+ * Bit Scan Reverse (BSR) - find the 0-based index (relative to the least
+ * significant end) of the *most* significant 1 bit in the input value.  The
+ * input value must be nonzero!
+ */
+
+/* Index of the most significant set bit of a nonzero 32-bit value. */
+static forceinline unsigned bsr32(u32 v)
+{
+#if defined(__GNUC__) || __has_builtin(__builtin_clz)
+	return 31 - __builtin_clz(v);
+#elif defined(_MSC_VER)
+	unsigned long msb;
+
+	_BitScanReverse(&msb, v);
+	return msb;
+#else
+	unsigned msb = 0;
+	/* Count how many right shifts it takes until nothing is left above bit 0. */
+	for (v >>= 1; v != 0; v >>= 1)
+		msb++;
+	return msb;
+#endif
+}
+
+/* Index of the most significant set bit of a nonzero 64-bit value. */
+static forceinline unsigned bsr64(u64 v)
+{
+#if defined(__GNUC__) || __has_builtin(__builtin_clzll)
+	return 63 - __builtin_clzll(v);
+#elif defined(_MSC_VER) && defined(_WIN64)
+	unsigned long msb;
+
+	_BitScanReverse64(&msb, v);
+	return msb;
+#else
+	unsigned msb = 0;
+	/* Count how many right shifts it takes until nothing is left above bit 0. */
+	for (v >>= 1; v != 0; v >>= 1)
+		msb++;
+	return msb;
+#endif
+}
+
+/* Index of the most significant set bit of a nonzero machine word. */
+static forceinline unsigned bsrw(machine_word_t v)
+{
+	STATIC_ASSERT(WORDBITS == 32 || WORDBITS == 64);
+
+	if (WORDBITS != 32)
+		return bsr64(v);
+	return bsr32(v);
+}
+
+/*
+ * Bit Scan Forward (BSF) - find the 0-based index (relative to the least
+ * significant end) of the *least* significant 1 bit in the input value.  The
+ * input value must be nonzero!
+ */
+
+/* Index of the least significant set bit of a nonzero 32-bit value. */
+static forceinline unsigned bsf32(u32 v)
+{
+#if defined(__GNUC__) || __has_builtin(__builtin_ctz)
+	return __builtin_ctz(v);
+#elif defined(_MSC_VER)
+	unsigned long lsb;
+
+	_BitScanForward(&lsb, v);
+	return lsb;
+#else
+	unsigned lsb = 0;
+	/* Discard low zero bits one at a time; does not terminate for v == 0. */
+	for (; !(v & 1); v >>= 1)
+		lsb++;
+	return lsb;
+#endif
+}
+
+/* Index of the least significant set bit of a nonzero 64-bit value. */
+static forceinline unsigned bsf64(u64 v)
+{
+#if defined(__GNUC__) || __has_builtin(__builtin_ctzll)
+	return __builtin_ctzll(v);
+#elif defined(_MSC_VER) && defined(_WIN64)
+	unsigned long lsb;
+
+	_BitScanForward64(&lsb, v);
+	return lsb;
+#else
+	unsigned lsb = 0;
+	/* Discard low zero bits one at a time; does not terminate for v == 0. */
+	for (; !(v & 1); v >>= 1)
+		lsb++;
+	return lsb;
+#endif
+}
+
+/* Index of the least significant set bit of a nonzero machine word. */
+static forceinline unsigned bsfw(machine_word_t v)
+{
+	STATIC_ASSERT(WORDBITS == 32 || WORDBITS == 64);
+
+	if (WORDBITS != 32)
+		return bsf64(v);
+	return bsf32(v);
+}
+
+/*
+ * rbit32(v): reverse the bits in a 32-bit integer.  This doesn't have a
+ * fallback implementation; use '#ifdef rbit32' to check if this is available.
+ */
+#undef rbit32
+#if (defined(__GNUC__) || defined(__clang__)) && defined(ARCH_ARM32) && \
+	(__ARM_ARCH >= 7 || (__ARM_ARCH == 6 && defined(__ARM_ARCH_6T2__)))
+static forceinline u32	/* ARM32 variant, selected by the #if directly above */
+rbit32(u32 v)
+{
+	__asm__("rbit %0, %1" : "=r" (v) : "r" (v));	/* v is both the input and the output operand */
+	return v;	/* the bit-reversed value */
+}
+#define rbit32 rbit32
+#elif (defined(__GNUC__) || defined(__clang__)) && defined(ARCH_ARM64)
+static forceinline u32	/* ARM64 variant, selected by the #elif directly above */
+rbit32(u32 v)
+{
+	__asm__("rbit %w0, %w1" : "=r" (v) : "r" (v));	/* v is both the input and the output operand */
+	return v;	/* the bit-reversed value */
+}
+#define rbit32 rbit32
+#endif
+
+#endif /* COMMON_DEFS_H */
+
+
+typedef void *(*malloc_func_t)(size_t);
+typedef void (*free_func_t)(void *);
+
+extern malloc_func_t libdeflate_default_malloc_func;
+extern free_func_t libdeflate_default_free_func;
+
+void *libdeflate_aligned_malloc(malloc_func_t malloc_func,
+				size_t alignment, size_t size);
+void libdeflate_aligned_free(free_func_t free_func, void *ptr);
+
+#ifdef FREESTANDING
+/*
+ * With -ffreestanding, <string.h> may be missing, and we must provide
+ * implementations of memset(), memcpy(), memmove(), and memcmp().
+ * See https://gcc.gnu.org/onlinedocs/gcc/Standards.html
+ *
+ * Also, -ffreestanding disables interpreting calls to these functions as
+ * built-ins.  E.g., calling memcpy(&v, p, WORDBYTES) will make a function call,
+ * not be optimized to a single load instruction.  For performance reasons we
+ * don't want that.  So, declare these functions as macros that expand to the
+ * corresponding built-ins.  This approach is recommended in the gcc man page.
+ * We still need the actual function definitions in case gcc calls them.
+ */
+void *memset(void *s, int c, size_t n);
+#define memset(s, c, n)		__builtin_memset((s), (c), (n))
+
+void *memcpy(void *dest, const void *src, size_t n);
+#define memcpy(dest, src, n)	__builtin_memcpy((dest), (src), (n))
+
+void *memmove(void *dest, const void *src, size_t n);
+#define memmove(dest, src, n)	__builtin_memmove((dest), (src), (n))
+
+int memcmp(const void *s1, const void *s2, size_t n);
+#define memcmp(s1, s2, n)	__builtin_memcmp((s1), (s2), (n))
+
+#undef LIBDEFLATE_ENABLE_ASSERTIONS
+#else
+#include <string.h>
+#endif
+
+/*
+ * Runtime assertion support.  Don't enable this in production builds; it may
+ * hurt performance significantly.
+ */
+#ifdef LIBDEFLATE_ENABLE_ASSERTIONS
+void libdeflate_assertion_failed(const char *expr, const char *file, int line);
+#define ASSERT(expr) { if (unlikely(!(expr))) \
+	libdeflate_assertion_failed(#expr, __FILE__, __LINE__); }
+#else
+#define ASSERT(expr) (void)(expr)
+#endif
+
+#define CONCAT_IMPL(a, b)	a##b
+#define CONCAT(a, b)		CONCAT_IMPL(a, b)
+#define ADD_SUFFIX(name)	CONCAT(name, SUFFIX)
+
+#endif /* LIB_LIB_COMMON_H */
+
+/*
+ * deflate_constants.h - constants for the DEFLATE compression format
+ */
+
+#ifndef LIB_DEFLATE_CONSTANTS_H
+#define LIB_DEFLATE_CONSTANTS_H
+
+/* Valid block types  */
+#define DEFLATE_BLOCKTYPE_UNCOMPRESSED		0
+#define DEFLATE_BLOCKTYPE_STATIC_HUFFMAN	1
+#define DEFLATE_BLOCKTYPE_DYNAMIC_HUFFMAN	2
+
+/* Minimum and maximum supported match lengths (in bytes)  */
+#define DEFLATE_MIN_MATCH_LEN			3
+#define DEFLATE_MAX_MATCH_LEN			258
+
+/* Maximum supported match offset (in bytes) */
+#define DEFLATE_MAX_MATCH_OFFSET		32768
+
+/* log2 of DEFLATE_MAX_MATCH_OFFSET */
+#define DEFLATE_WINDOW_ORDER			15
+
+/* Number of symbols in each Huffman code.  Note: for the literal/length
+ * and offset codes, these are actually the maximum values; a given block
+ * might use fewer symbols.  */
+#define DEFLATE_NUM_PRECODE_SYMS		19
+#define DEFLATE_NUM_LITLEN_SYMS			288
+#define DEFLATE_NUM_OFFSET_SYMS			32
+
+/* The maximum number of symbols across all codes  */
+#define DEFLATE_MAX_NUM_SYMS			288
+
+/* Division of symbols in the literal/length code  */
+#define DEFLATE_NUM_LITERALS			256
+#define DEFLATE_END_OF_BLOCK			256
+#define DEFLATE_FIRST_LEN_SYM			257
+
+/* Maximum codeword length, in bits, within each Huffman code  */
+#define DEFLATE_MAX_PRE_CODEWORD_LEN		7
+#define DEFLATE_MAX_LITLEN_CODEWORD_LEN		15
+#define DEFLATE_MAX_OFFSET_CODEWORD_LEN		15
+
+/* The maximum codeword length across all codes  */
+#define DEFLATE_MAX_CODEWORD_LEN		15
+
+/* Maximum possible overrun when decoding codeword lengths  */
+#define DEFLATE_MAX_LENS_OVERRUN		137
+
+/*
+ * Maximum number of extra bits that may be required to represent a match
+ * length or offset.
+ */
+#define DEFLATE_MAX_EXTRA_LENGTH_BITS		5
+#define DEFLATE_MAX_EXTRA_OFFSET_BITS		13
+
+#endif /* LIB_DEFLATE_CONSTANTS_H */
+
+/*
+ * cpu_features_common.h - code shared by all lib/$arch/cpu_features.c
+ *
+ * Copyright 2020 Eric Biggers
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+#ifndef LIB_CPU_FEATURES_COMMON_H
+#define LIB_CPU_FEATURES_COMMON_H
+
+#if defined(TEST_SUPPORT__DO_NOT_USE) && !defined(FREESTANDING)
+   /* for strdup() and strtok_r() */
+#  undef _ANSI_SOURCE
+#  ifndef __APPLE__
+#    undef _GNU_SOURCE
+#    define _GNU_SOURCE
+#  endif
+#  include <stdio.h>
+#  include <stdlib.h>
+#  include <string.h>
+#endif
+
+struct cpu_feature {	/* one row of the feature table passed to disable_cpu_features_for_testing() */
+	u32 bit;	/* mask that is cleared from the feature word when this feature is disabled */
+	const char *name;	/* name compared against each token of LIBDEFLATE_DISABLE_CPU_FEATURES */
+};
+
+#if defined(TEST_SUPPORT__DO_NOT_USE) && !defined(FREESTANDING)
+/* Disable any features that are listed in $LIBDEFLATE_DISABLE_CPU_FEATURES (comma-separated names); aborts on an unknown name. */
+static inline void
+disable_cpu_features_for_testing(u32 *features,
+				 const struct cpu_feature *feature_table,
+				 size_t feature_table_length)
+{
+	char *env_value, *strbuf, *p, *saveptr = NULL;
+	size_t i;
+
+	env_value = getenv("LIBDEFLATE_DISABLE_CPU_FEATURES");
+	if (!env_value)
+		return;	/* variable not set: *features stays as it is */
+	strbuf = strdup(env_value);	/* strtok_r() writes into its input, so tokenize a private copy */
+	if (!strbuf)
+		abort();
+	p = strtok_r(strbuf, ",", &saveptr);
+	while (p) {
+		for (i = 0; i < feature_table_length; i++) {
+			if (strcmp(p, feature_table[i].name) == 0) {
+				*features &= ~feature_table[i].bit;	/* clear the matching feature */
+				break;
+			}
+		}
+		if (i == feature_table_length) {	/* loop ended without break: token is not in the table */
+			fprintf(stderr,
+				"unrecognized feature in LIBDEFLATE_DISABLE_CPU_FEATURES: \"%s\"\n",
+				p);
+			abort();
+		}
+		p = strtok_r(NULL, ",", &saveptr);
+	}
+	free(strbuf);
+}
+#else /* TEST_SUPPORT__DO_NOT_USE */
+static inline void
+disable_cpu_features_for_testing(u32 *features,
+				 const struct cpu_feature *feature_table,
+				 size_t feature_table_length)
+{	/* empty stub for non-test or FREESTANDING builds: *features is not modified */
+}
+#endif /* !TEST_SUPPORT__DO_NOT_USE */
+
+#endif /* LIB_CPU_FEATURES_COMMON_H */
+
+/*
+ * x86/cpu_features.h - feature detection for x86 CPUs
+ *
+ * Copyright 2016 Eric Biggers
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+#ifndef LIB_X86_CPU_FEATURES_H
+#define LIB_X86_CPU_FEATURES_H
+
+#define HAVE_DYNAMIC_X86_CPU_FEATURES	0	/* default; redefined to 1 below for x86 builds with a target attribute or MSVC */
+
+#if defined(ARCH_X86_32) || defined(ARCH_X86_64)
+
+#if COMPILER_SUPPORTS_TARGET_FUNCTION_ATTRIBUTE || defined(_MSC_VER)
+#  undef HAVE_DYNAMIC_X86_CPU_FEATURES
+#  define HAVE_DYNAMIC_X86_CPU_FEATURES	1	/* enables the runtime-queried variant of get_x86_cpu_features() */
+#endif /* COMPILER_SUPPORTS_TARGET_FUNCTION_ATTRIBUTE || _MSC_VER */
+
+#define X86_CPU_FEATURE_SSE2		0x00000001
+#define X86_CPU_FEATURE_PCLMUL		0x00000002
+#define X86_CPU_FEATURE_AVX		0x00000004
+#define X86_CPU_FEATURE_AVX2		0x00000008
+#define X86_CPU_FEATURE_BMI2		0x00000010
+/* HAVE_<X>(features): true if HAVE_<X>_NATIVE is set or the bit is present in 'features'; the *_NATIVE macros are defined further down, which works because macros expand at the point of use. */
+#define HAVE_SSE2(features)	(HAVE_SSE2_NATIVE     || ((features) & X86_CPU_FEATURE_SSE2))
+#define HAVE_PCLMUL(features)	(HAVE_PCLMUL_NATIVE   || ((features) & X86_CPU_FEATURE_PCLMUL))
+#define HAVE_AVX(features)	(HAVE_AVX_NATIVE      || ((features) & X86_CPU_FEATURE_AVX))
+#define HAVE_AVX2(features)	(HAVE_AVX2_NATIVE     || ((features) & X86_CPU_FEATURE_AVX2))
+#define HAVE_BMI2(features)	(HAVE_BMI2_NATIVE     || ((features) & X86_CPU_FEATURE_BMI2))
+
+#if HAVE_DYNAMIC_X86_CPU_FEATURES
+#define X86_CPU_FEATURES_KNOWN		0x80000000	/* NOTE(review): presumably set by the init routine so the word is nonzero once detection ran -- confirm */
+extern volatile u32 libdeflate_x86_cpu_features;	/* NOTE(review): volatile, not atomic; concurrent first calls may both run init -- confirm that is benign */
+/* Declared here, defined elsewhere: fills in libdeflate_x86_cpu_features. */
+void libdeflate_init_x86_cpu_features(void);
+/* Returns libdeflate_x86_cpu_features, calling the init routine first while the value is still 0. */
+static inline u32 get_x86_cpu_features(void)
+{
+	if (libdeflate_x86_cpu_features == 0)
+		libdeflate_init_x86_cpu_features();
+	return libdeflate_x86_cpu_features;
+}
+#else /* HAVE_DYNAMIC_X86_CPU_FEATURES */
+static inline u32 get_x86_cpu_features(void) { return 0; }	/* no runtime detection: reports an empty feature mask */
+#endif /* !HAVE_DYNAMIC_X86_CPU_FEATURES */
+
+/*
+ * Prior to gcc 4.9 (r200349) and clang 3.8 (r239883), x86 intrinsics not
+ * available in the main target couldn't be used in 'target' attribute
+ * functions.  Unfortunately clang has no feature test macro for this, so we
+ * have to check its version.
+ */
+#if HAVE_DYNAMIC_X86_CPU_FEATURES && \
+	(GCC_PREREQ(4, 9) || CLANG_PREREQ(3, 8, 7030000) || defined(_MSC_VER))
+#  define HAVE_TARGET_INTRINSICS	1	/* intrinsics beyond the main target may be used in target-attribute functions */
+#else /* no dynamic feature support, or the compiler is older than the versions tested above */
+#  define HAVE_TARGET_INTRINSICS	0
+#endif
+
+/* SSE2: NATIVE when __SSE2__ is defined, or under MSVC for x86-64 or _M_IX86_FP >= 2; INTRIN when native or target intrinsics work */
+#if defined(__SSE2__) || \
+	(defined(_MSC_VER) && \
+	 (defined(ARCH_X86_64) || (defined(_M_IX86_FP) && _M_IX86_FP >= 2)))
+#  define HAVE_SSE2_NATIVE	1
+#else
+#  define HAVE_SSE2_NATIVE	0
+#endif
+#define HAVE_SSE2_INTRIN	(HAVE_SSE2_NATIVE || HAVE_TARGET_INTRINSICS)
+
+/* PCLMUL: NATIVE via __PCLMUL__, or under MSVC when __AVX2__ is defined (presumably a stand-in, as no dedicated macro is tested -- confirm) */
+#if defined(__PCLMUL__) || (defined(_MSC_VER) && defined(__AVX2__))
+#  define HAVE_PCLMUL_NATIVE	1
+#else
+#  define HAVE_PCLMUL_NATIVE	0
+#endif
+#if HAVE_PCLMUL_NATIVE || (HAVE_TARGET_INTRINSICS && \
+			   (GCC_PREREQ(4, 4) || CLANG_PREREQ(3, 2, 0) || \
+			    defined(_MSC_VER)))
+#  define HAVE_PCLMUL_INTRIN	1	/* native, or target intrinsics plus a new-enough compiler */
+#else
+#  define HAVE_PCLMUL_INTRIN	0
+#endif
+
+/* AVX: NATIVE only when __AVX__ is defined; INTRIN when native, or target intrinsics plus GCC_PREREQ(4, 6), CLANG_PREREQ(3, 0, 0) or MSVC */
+#ifdef __AVX__
+#  define HAVE_AVX_NATIVE	1
+#else
+#  define HAVE_AVX_NATIVE	0
+#endif
+#if HAVE_AVX_NATIVE || (HAVE_TARGET_INTRINSICS && \
+			(GCC_PREREQ(4, 6) || CLANG_PREREQ(3, 0, 0) || \
+			 defined(_MSC_VER)))
+#  define HAVE_AVX_INTRIN	1
+#else
+#  define HAVE_AVX_INTRIN	0
+#endif
+
+/* AVX2: NATIVE only when __AVX2__ is defined; INTRIN when native, or target intrinsics plus GCC_PREREQ(4, 7), CLANG_PREREQ(3, 1, 0) or MSVC */
+#ifdef __AVX2__
+#  define HAVE_AVX2_NATIVE	1
+#else
+#  define HAVE_AVX2_NATIVE	0
+#endif
+#if HAVE_AVX2_NATIVE || (HAVE_TARGET_INTRINSICS && \
+			 (GCC_PREREQ(4, 7) || CLANG_PREREQ(3, 1, 0) || \
+			  defined(_MSC_VER)))
+#  define HAVE_AVX2_INTRIN	1
+#else
+#  define HAVE_AVX2_INTRIN	0
+#endif
+
+/* BMI2: NATIVE via __BMI2__, or under MSVC when __AVX2__ is defined (presumably a stand-in, as no dedicated macro is tested -- confirm) */
+#if defined(__BMI2__) || (defined(_MSC_VER) && defined(__AVX2__))
+#  define HAVE_BMI2_NATIVE	1
+#else
+#  define HAVE_BMI2_NATIVE	0
+#endif
+#if HAVE_BMI2_NATIVE || (HAVE_TARGET_INTRINSICS && \
+			 (GCC_PREREQ(4, 7) || CLANG_PREREQ(3, 1, 0) || \
+			  defined(_MSC_VER)))
+#  define HAVE_BMI2_INTRIN	1	/* native, or target intrinsics plus a new-enough compiler */
+#else
+#  define HAVE_BMI2_INTRIN	0
+#endif
+
+#endif /* ARCH_X86_32 || ARCH_X86_64 */
+
+#endif /* LIB_X86_CPU_FEATURES_H */
+
+
+/*
+ * If the expression passed to SAFETY_CHECK() evaluates to false, then the
+ * decompression routine immediately returns LIBDEFLATE_BAD_DATA, indicating the
+ * compressed data is invalid.
+ *
+ * Theoretically, these checks could be disabled for specialized applications
+ * where all input to the decompressor will be trusted.
+ */
+#if 0	/* change to 1 only if every input is trusted: expr is then still evaluated but its result is ignored */
+#  pragma message("UNSAFE DECOMPRESSION IS ENABLED. THIS MUST ONLY BE USED IF THE DECOMPRESSOR INPUT WILL ALWAYS BE TRUSTED!")
+#  define SAFETY_CHECK(expr)	(void)(expr)
+#else
+#  define SAFETY_CHECK(expr)	if (unlikely(!(expr))) return LIBDEFLATE_BAD_DATA	/* expands to a bare if: use only as a complete statement, never directly before an else */
+#endif
+
+/*****************************************************************************
+ *				Input bitstream                              *
+ *****************************************************************************/
+
+/*
+ * The state of the "input bitstream" consists of the following variables:
+ *
+ *	- in_next: a pointer to the next unread byte in the input buffer
+ *
+ *	- in_end: a pointer to just past the end of the input buffer
+ *
+ *	- bitbuf: a word-sized variable containing bits that have been read from
+ *		  the input buffer or from the implicit appended zero bytes
+ *
+ *	- bitsleft: the number of bits in 'bitbuf' available to be consumed.
+ *		    After REFILL_BITS_BRANCHLESS(), 'bitbuf' can actually
+ *		    contain more bits than this.  However, only the bits counted
+ *		    by 'bitsleft' can actually be consumed; the rest can only be
+ *		    used for preloading.
+ *
+ *		    As a micro-optimization, we allow bits 8 and higher of
+ *		    'bitsleft' to contain garbage.  When consuming the bits
+ *		    associated with a decode table entry, this allows us to do
+ *		    'bitsleft -= entry' instead of 'bitsleft -= (u8)entry'.
+ *		    On some CPUs, this helps reduce instruction dependencies.
+ *		    This does have the disadvantage that 'bitsleft' sometimes
+ *		    needs to be cast to 'u8', such as when it's used as a shift
+ *		    amount in REFILL_BITS_BRANCHLESS().  But that one happens
+ *		    for free since most CPUs ignore high bits in shift amounts.
+ *
+ *	- overread_count: the total number of implicit appended zero bytes that
+ *			  have been loaded into the bitbuffer, including any
+ *			  counted by 'bitsleft' and any already consumed
+ */
+
+/*
+ * The type for the bitbuffer variable ('bitbuf' described above).  For best
+ * performance, this should have size equal to a machine word.
+ *
+ * 64-bit platforms have a significant advantage: they get a bigger bitbuffer
+ * which they don't have to refill as often.
+ */
+typedef machine_word_t bitbuf_t;
+#define BITBUF_NBITS	(8 * (int)sizeof(bitbuf_t))	/* bit width of bitbuf_t, as a signed int */
+
+/* BITMASK(n) returns a bitmask of length 'n'; 'n' must be smaller than BITBUF_NBITS, since the shift is otherwise undefined. */
+#define BITMASK(n)	(((bitbuf_t)1 << (n)) - 1)
+
+/*
+ * MAX_BITSLEFT is the maximum number of consumable bits, i.e. the maximum value
+ * of '(u8)bitsleft'.  This is the size of the bitbuffer variable, minus 1 if
+ * the branchless refill method is being used (see REFILL_BITS_BRANCHLESS()).
+ */
+#define MAX_BITSLEFT	\
+	(UNALIGNED_ACCESS_IS_FAST ? BITBUF_NBITS - 1 : BITBUF_NBITS)	/* e.g. 63 or 64 with a 64-bit bitbuf_t */
+
+/*
+ * CONSUMABLE_NBITS is the minimum number of bits that are guaranteed to be
+ * consumable (counted in 'bitsleft') immediately after refilling the bitbuffer.
+ * Since only whole bytes can be added to 'bitsleft', the worst case is
+ * 'MAX_BITSLEFT - 7': the smallest amount where another byte doesn't fit.
+ */
+#define CONSUMABLE_NBITS	(MAX_BITSLEFT - 7)	/* e.g. 56 or 57 with a 64-bit bitbuf_t */
+
+/*
+ * FASTLOOP_PRELOADABLE_NBITS is the minimum number of bits that are guaranteed
+ * to be preloadable immediately after REFILL_BITS_IN_FASTLOOP().  (It is *not*
+ * guaranteed after REFILL_BITS(), since REFILL_BITS() falls back to a
+ * byte-at-a-time refill method near the end of input.)  This may exceed the
+ * number of consumable bits (counted by 'bitsleft').  Any bits not counted in
+ * 'bitsleft' can only be used for precomputation and cannot be consumed.
+ */
+#define FASTLOOP_PRELOADABLE_NBITS	\
+	(UNALIGNED_ACCESS_IS_FAST ? BITBUF_NBITS : CONSUMABLE_NBITS)	/* e.g. 64 or 57 with a 64-bit bitbuf_t */
+
+/*
+ * PRELOAD_SLACK is the minimum number of bits that are guaranteed to be
+ * preloadable but not consumable, following REFILL_BITS_IN_FASTLOOP() and any
+ * subsequent consumptions.  This is 1 bit if the branchless refill method is
+ * being used, and 0 bits otherwise.
+ */
+#define PRELOAD_SLACK	MAX(0, FASTLOOP_PRELOADABLE_NBITS - MAX_BITSLEFT)	/* 64-bit example: 64 - 63 = 1, or MAX(0, 57 - 64) = 0 */
+
+/*
+ * CAN_CONSUME(n) is true if it's guaranteed that if the bitbuffer has just been
+ * refilled, then it's always possible to consume 'n' bits from it.  'n' should
+ * be a compile-time constant, to enable compile-time evaluation.
+ */
+#define CAN_CONSUME(n)	(CONSUMABLE_NBITS >= (n))	/* limit is e.g. 56 or 57 for a 64-bit bitbuf_t, 24 or 25 for a 32-bit one */
+
+/*
+ * CAN_CONSUME_AND_THEN_PRELOAD(consume_nbits, preload_nbits) is true if it's
+ * guaranteed that after REFILL_BITS_IN_FASTLOOP(), it's always possible to
+ * consume 'consume_nbits' bits, then preload 'preload_nbits' bits.  The
+ * arguments should be compile-time constants to enable compile-time evaluation.
+ */
+#define CAN_CONSUME_AND_THEN_PRELOAD(consume_nbits, preload_nbits)	\
+	(CONSUMABLE_NBITS >= (consume_nbits) &&	/* consumed bits must be counted in bitsleft */ \
+	 FASTLOOP_PRELOADABLE_NBITS >= (consume_nbits) + (preload_nbits))	/* preloaded bits may lie beyond bitsleft */
+
+/*
+ * REFILL_BITS_BRANCHLESS() branchlessly refills the bitbuffer variable by
+ * reading the next word from the input buffer and updating 'in_next' and
+ * 'bitsleft' based on how many bits were refilled -- counting whole bytes only.
+ * This is much faster than reading a byte at a time, at least if the CPU is
+ * little endian and supports fast unaligned memory accesses.
+ *
+ * The simplest way of branchlessly updating 'bitsleft' would be:
+ *
+ *	bitsleft += (MAX_BITSLEFT - bitsleft) & ~7;
+ *
+ * To make it faster, we define MAX_BITSLEFT to be 'WORDBITS - 1' rather than
+ * WORDBITS, so that in binary it looks like 111111 or 11111.  Then, we update
+ * 'bitsleft' by just setting the bits above the low 3 bits:
+ *
+ *	bitsleft |= MAX_BITSLEFT & ~7;
+ *
+ * That compiles down to a single instruction like 'or $0x38, %rbp'.  Using
+ * 'MAX_BITSLEFT == WORDBITS - 1' also has the advantage that refills can be
+ * done when 'bitsleft == MAX_BITSLEFT' without invoking undefined behavior.
+ *
+ * The simplest way of branchlessly updating 'in_next' would be:
+ *
+ *	in_next += (MAX_BITSLEFT - bitsleft) >> 3;
+ *
+ * With 'MAX_BITSLEFT == WORDBITS - 1' we could use an XOR instead, though this
+ * isn't really better:
+ *
+ *	in_next += (MAX_BITSLEFT ^ bitsleft) >> 3;
+ *
+ * An alternative which can be marginally better is the following:
+ *
+ *	in_next += sizeof(bitbuf_t) - 1;
+ *	in_next -= (bitsleft >> 3) & 0x7;
+ *
+ * It seems this would increase the number of CPU instructions from 3 (sub, shr,
+ * add) to 4 (add, shr, and, sub).  However, if the CPU has a bitfield
+ * extraction instruction (e.g. arm's ubfx), it stays at 3, and is potentially
+ * more efficient because the length of the longest dependency chain decreases
+ * from 3 to 2.  This alternative also has the advantage that it ignores the
+ * high bits in 'bitsleft', so it is compatible with the micro-optimization we
+ * use where we let the high bits of 'bitsleft' contain garbage.
+ */
+#define REFILL_BITS_BRANCHLESS()					\
+do {	/* uses the bitbuf, bitsleft and in_next of the expansion site; loads a whole word at in_next */ \
+	bitbuf |= get_unaligned_leword(in_next) << (u8)bitsleft;	\
+	in_next += sizeof(bitbuf_t) - 1;	/* together with the next line: advance by ... */ \
+	in_next -= (bitsleft >> 3) & 0x7;	/* ... the number of whole bytes newly counted */ \
+	bitsleft |= MAX_BITSLEFT & ~7;	/* keep the low 3 bits, set every higher bit of the count */ \
+} while (0)
+
+/*
+ * REFILL_BITS() loads bits from the input buffer until the bitbuffer variable
+ * contains at least CONSUMABLE_NBITS consumable bits.
+ *
+ * This checks for the end of input, and it doesn't guarantee
+ * FASTLOOP_PRELOADABLE_NBITS, so it can't be used in the fastloop.
+ *
+ * If we would overread the input buffer, we just don't read anything, leaving
+ * the bits zeroed but marking them filled.  This simplifies the decompressor
+ * because it removes the need to always be able to distinguish between real
+ * overreads and overreads caused only by the decompressor's own lookahead.
+ *
+ * We do still keep track of the number of bytes that have been overread, for
+ * two reasons.  First, it allows us to determine the exact number of bytes that
+ * were consumed once the stream ends or an uncompressed block is reached.
+ * Second, it allows us to stop early if the overread amount gets so large (more
+ * than sizeof bitbuf) that it can only be caused by a real overread.  (The
+ * second part is arguably unneeded, since libdeflate is buffer-based; given
+ * infinite zeroes, it will eventually either completely fill the output buffer
+ * or return an error.  However, we do it to be slightly more friendly to the
+ * not-recommended use case of decompressing with an unknown output size.)
+ */
+#define REFILL_BITS()							\
+do {	/* with the default SAFETY_CHECK this may return LIBDEFLATE_BAD_DATA from the enclosing function */ \
+	if (UNALIGNED_ACCESS_IS_FAST &&					\
+	    likely(in_end - in_next >= sizeof(bitbuf_t))) {	/* NOTE(review): signed vs. unsigned compare; assumes in_next <= in_end */ \
+		REFILL_BITS_BRANCHLESS();				\
+	} else {	/* byte-at-a-time path, also used near the end of input */ \
+		while ((u8)bitsleft < CONSUMABLE_NBITS) {		\
+			if (likely(in_next != in_end)) {		\
+				bitbuf |= (bitbuf_t)*in_next++ <<	\
+					  (u8)bitsleft;			\
+			} else {	/* out of input: count an implicit zero byte instead of reading */ \
+				overread_count++;			\
+				SAFETY_CHECK(overread_count <=		\
+					     sizeof(bitbuf_t));		\
+			}						\
+			bitsleft += 8;					\
+		}							\
+	}								\
+} while (0)
+
+/*
+ * REFILL_BITS_IN_FASTLOOP() is like REFILL_BITS(), but it doesn't check for the
+ * end of the input.  It can only be used in the fastloop.
+ */
+#define REFILL_BITS_IN_FASTLOOP()					\
+do {	/* never tests in_end; presumably the fastloop bounds its input via FASTLOOP_MAX_BYTES_READ -- confirm */ \
+	STATIC_ASSERT(UNALIGNED_ACCESS_IS_FAST ||			\
+		      FASTLOOP_PRELOADABLE_NBITS == CONSUMABLE_NBITS);	\
+	if (UNALIGNED_ACCESS_IS_FAST) {					\
+		REFILL_BITS_BRANCHLESS();				\
+	} else {	/* same byte loop as REFILL_BITS(), minus the end-of-input handling */ \
+		while ((u8)bitsleft < CONSUMABLE_NBITS) {		\
+			bitbuf |= (bitbuf_t)*in_next++ << (u8)bitsleft;	\
+			bitsleft += 8;					\
+		}							\
+	}								\
+} while (0)
+
+/*
+ * This is the worst-case maximum number of output bytes that are written to
+ * during each iteration of the fastloop.  The worst case is 2 literals, then a
+ * match of length DEFLATE_MAX_MATCH_LEN.  Additionally, some slack space must
+ * be included for the intentional overrun in the match copy implementation.
+ */
+#define FASTLOOP_MAX_BYTES_WRITTEN	\
+	(2 + DEFLATE_MAX_MATCH_LEN + (5 * WORDBYTES) - 1)	/* 2 literals + longest match + slack for the match-copy overrun */
+
+/*
+ * This is the worst-case maximum number of input bytes that are read during
+ * each iteration of the fastloop.  To get this value, we first compute the
+ * greatest number of bits that can be refilled during a loop iteration.  The
+ * refill at the beginning can add at most MAX_BITSLEFT, and the amount that can
+ * be refilled later is no more than the maximum amount that can be consumed by
+ * 2 literals that don't need a subtable, then a match.  We convert this value
+ * to bytes, rounding up; this gives the maximum number of bytes that 'in_next'
+ * can be advanced.  Finally, we add sizeof(bitbuf_t) to account for
+ * REFILL_BITS_BRANCHLESS() reading a word past 'in_next'.
+ */
+#define FASTLOOP_MAX_BYTES_READ					\
+	(DIV_ROUND_UP(MAX_BITSLEFT + (2 * LITLEN_TABLEBITS) +	\
+		      LENGTH_MAXBITS + OFFSET_MAXBITS, 8) +	\
+	 sizeof(bitbuf_t))	/* LITLEN_TABLEBITS, LENGTH_MAXBITS and OFFSET_MAXBITS are defined further down; resolved when this macro is used */
+
+/*****************************************************************************
+ *                              Huffman decoding                             *
+ *****************************************************************************/
+
+/*
+ * The fastest way to decode Huffman-encoded data is basically to use a decode
+ * table that maps the next TABLEBITS bits of data to their symbol.  Each entry
+ * decode_table[i] maps to the symbol whose codeword is a prefix of 'i'.  A
+ * symbol with codeword length 'n' has '2**(TABLEBITS-n)' entries in the table.
+ *
+ * Ideally, TABLEBITS and the maximum codeword length would be the same; some
+ * compression formats are designed with this goal in mind.  Unfortunately, in
+ * DEFLATE, the maximum litlen and offset codeword lengths are 15 bits, which is
+ * too large for a practical TABLEBITS.  It's not *that* much larger, though, so
+ * the workaround is to use a single level of subtables.  In the main table,
+ * entries for prefixes of codewords longer than TABLEBITS contain a "pointer"
+ * to the appropriate subtable along with the number of bits it is indexed with.
+ *
+ * The most efficient way to allocate subtables is to allocate them dynamically
+ * after the main table.  The worst-case number of table entries needed,
+ * including subtables, is precomputable; see the ENOUGH constants below.
+ *
+ * A useful optimization is to store the codeword lengths in the decode table so
+ * that they don't have to be looked up by indexing a separate table that maps
+ * symbols to their codeword lengths.  We basically do this; however, for the
+ * litlen and offset codes we also implement some DEFLATE-specific optimizations
+ * that build in the consideration of the "extra bits" and the
+ * literal/length/end-of-block division.  For the exact decode table entry
+ * format we use, see the definitions of the *_decode_results[] arrays below.
+ */
+
+
+/*
+ * These are the TABLEBITS values we use for each of the DEFLATE Huffman codes,
+ * along with their corresponding ENOUGH values.
+ *
+ * For the precode, we use PRECODE_TABLEBITS == 7 since this is the maximum
+ * precode codeword length.  This avoids ever needing subtables.
+ *
+ * For the litlen and offset codes, we cannot realistically avoid ever needing
+ * subtables, since litlen and offset codewords can be up to 15 bits.  A higher
+ * TABLEBITS reduces the number of lookups that need a subtable, which increases
+ * performance; however, it increases memory usage and makes building the table
+ * take longer, which decreases performance.  We choose values that work well in
+ * practice, making subtables rarely needed without making the tables too large.
+ *
+ * Our choice of OFFSET_TABLEBITS == 8 is a bit low; without any special
+ * considerations, 9 would fit the trade-off curve better.  However, there is a
+ * performance benefit to using exactly 8 bits when it is a compile-time
+ * constant, as many CPUs can take the low byte more easily than the low 9 bits.
+ *
+ * zlib treats its equivalents of TABLEBITS as maximum values; whenever it
+ * builds a table, it caps the actual table_bits to the longest codeword.  This
+ * makes sense in theory, as there's no need for the table to be any larger than
+ * needed to support the longest codeword.  However, having the table bits be a
+ * compile-time constant is beneficial to the performance of the decode loop, so
+ * there is a trade-off.  libdeflate currently uses the dynamic table_bits
+ * strategy for the litlen table only, due to its larger maximum size.
+ * PRECODE_TABLEBITS and OFFSET_TABLEBITS are smaller, so going dynamic there
+ * isn't as useful, and OFFSET_TABLEBITS=8 is useful as mentioned above.
+ *
+ * Each TABLEBITS value has a corresponding ENOUGH value that gives the
+ * worst-case maximum number of decode table entries, including the main table
+ * and all subtables.  The ENOUGH value depends on three parameters:
+ *
+ *	(1) the maximum number of symbols in the code (DEFLATE_NUM_*_SYMS)
+ *	(2) the maximum number of main table bits (*_TABLEBITS)
+ *	(3) the maximum allowed codeword length (DEFLATE_MAX_*_CODEWORD_LEN)
+ *
+ * The ENOUGH values were computed using the utility program 'enough' from zlib.
+ */
+#define PRECODE_TABLEBITS	7	/* == DEFLATE_MAX_PRE_CODEWORD_LEN, so subtables are never needed */
+#define PRECODE_ENOUGH		128	/* enough 19 7 7: arguments are <num syms> <table bits> <max codeword len> */
+#define LITLEN_TABLEBITS	11	/* a maximum: the litlen table uses the dynamic table_bits strategy */
+#define LITLEN_ENOUGH		2342	/* enough 288 11 15	*/
+#define OFFSET_TABLEBITS	8	/* exactly one byte on purpose: the low byte is cheap to extract */
+#define OFFSET_ENOUGH		402	/* enough 32 8 15	*/
+
+/*
+ * make_decode_table_entry() creates a decode table entry for the given symbol
+ * by combining the static part 'decode_results[sym]' with the dynamic part
+ * 'len', which is the remaining codeword length (the codeword length for main
+ * table entries, or the codeword length minus TABLEBITS for subtable entries).
+ *
+ * In all cases, we add 'len' to each of the two low-order bytes to create the
+ * appropriately-formatted decode table entry.  See the definitions of the
+ * *_decode_results[] arrays below, where the entry format is described.
+ */
+static forceinline u32
+make_decode_table_entry(const u32 decode_results[], u32 sym, u32 len)
+{
+	return decode_results[sym] + (len << 8) + len;	/* adds 'len' at bit 8 and at bit 0 of the static part; 'sym' is not range-checked here */
+}
+
+/*
+ * Here is the format of our precode decode table entries.  Bits not explicitly
+ * described contain zeroes:
+ *
+ *	Bit 20-16:  presym
+ *	Bit 10-8:   codeword length [not used]
+ *	Bit 2-0:    codeword length
+ *
+ * The precode decode table never has subtables, since we use
+ * PRECODE_TABLEBITS == DEFLATE_MAX_PRE_CODEWORD_LEN.
+ *
+ * precode_decode_results[] contains the static part of the entry for each
+ * symbol.  make_decode_table_entry() produces the final entries.
+ */
+static const u32 precode_decode_results[] = {	/* indexed by precode symbol, 19 entries (0..18) */
+#define ENTRY(presym)	((u32)presym << 16)	/* symbol placed at bit 16; the length fields are added by make_decode_table_entry() */
+	ENTRY(0)   , ENTRY(1)   , ENTRY(2)   , ENTRY(3)   ,
+	ENTRY(4)   , ENTRY(5)   , ENTRY(6)   , ENTRY(7)   ,
+	ENTRY(8)   , ENTRY(9)   , ENTRY(10)  , ENTRY(11)  ,
+	ENTRY(12)  , ENTRY(13)  , ENTRY(14)  , ENTRY(15)  ,
+	ENTRY(16)  , ENTRY(17)  , ENTRY(18)  ,
+#undef ENTRY
+};
+
+/* Litlen and offset decode table entry flags */
+
+/* Indicates a literal entry in the litlen decode table */
+#define HUFFDEC_LITERAL			0x80000000	/* bit 31 */
+
+/* Indicates that HUFFDEC_SUBTABLE_POINTER or HUFFDEC_END_OF_BLOCK is set */
+#define HUFFDEC_EXCEPTIONAL		0x00008000	/* bit 15 */
+
+/* Indicates a subtable pointer entry in the litlen or offset decode table */
+#define HUFFDEC_SUBTABLE_POINTER	0x00004000	/* bit 14 */
+
+/* Indicates an end-of-block entry in the litlen decode table */
+#define HUFFDEC_END_OF_BLOCK		0x00002000	/* bit 13 */
+
+/* Maximum number of bits that can be consumed by decoding a match length */
+#define LENGTH_MAXBITS		(DEFLATE_MAX_LITLEN_CODEWORD_LEN + \
+				 DEFLATE_MAX_EXTRA_LENGTH_BITS)	/* 15 + 5 = 20 */
+#define LENGTH_MAXFASTBITS	(LITLEN_TABLEBITS /* no subtable needed */ + \
+				 DEFLATE_MAX_EXTRA_LENGTH_BITS)	/* 11 + 5 = 16 */
+
+/*
+ * Here is the format of our litlen decode table entries.  Bits not explicitly
+ * described contain zeroes:
+ *
+ *	Literals:
+ *		Bit 31:     1 (HUFFDEC_LITERAL)
+ *		Bit 23-16:  literal value
+ *		Bit 15:     0 (!HUFFDEC_EXCEPTIONAL)
+ *		Bit 14:     0 (!HUFFDEC_SUBTABLE_POINTER)
+ *		Bit 13:     0 (!HUFFDEC_END_OF_BLOCK)
+ *		Bit 11-8:   remaining codeword length [not used]
+ *		Bit 3-0:    remaining codeword length
+ *	Lengths:
+ *		Bit 31:     0 (!HUFFDEC_LITERAL)
+ *		Bit 24-16:  length base value
+ *		Bit 15:     0 (!HUFFDEC_EXCEPTIONAL)
+ *		Bit 14:     0 (!HUFFDEC_SUBTABLE_POINTER)
+ *		Bit 13:     0 (!HUFFDEC_END_OF_BLOCK)
+ *		Bit 11-8:   remaining codeword length
+ *		Bit 4-0:    remaining codeword length + number of extra bits
+ *	End of block:
+ *		Bit 31:     0 (!HUFFDEC_LITERAL)
+ *		Bit 15:     1 (HUFFDEC_EXCEPTIONAL)
+ *		Bit 14:     0 (!HUFFDEC_SUBTABLE_POINTER)
+ *		Bit 13:     1 (HUFFDEC_END_OF_BLOCK)
+ *		Bit 11-8:   remaining codeword length [not used]
+ *		Bit 3-0:    remaining codeword length
+ *	Subtable pointer:
+ *		Bit 31:     0 (!HUFFDEC_LITERAL)
+ *		Bit 30-16:  index of start of subtable
+ *		Bit 15:     1 (HUFFDEC_EXCEPTIONAL)
+ *		Bit 14:     1 (HUFFDEC_SUBTABLE_POINTER)
+ *		Bit 13:     0 (!HUFFDEC_END_OF_BLOCK)
+ *		Bit 11-8:   number of subtable bits
+ *		Bit 3-0:    number of main table bits
+ *
+ * This format has several desirable properties:
+ *
+ *	- The codeword length, length slot base, and number of extra length bits
+ *	  are all built in.  This eliminates the need to separately look up this
+ *	  information by indexing separate arrays by symbol or length slot.
+ *
+ *	- The HUFFDEC_* flags enable easily distinguishing between the different
+ *	  types of entries.  The HUFFDEC_LITERAL flag enables a fast path for
+ *	  literals; the high bit is used for this, as some CPUs can test the
+ *	  high bit more easily than other bits.  The HUFFDEC_EXCEPTIONAL flag
+ *	  makes it possible to detect the two unlikely cases (subtable pointer
+ *	  and end of block) in a single bit flag test.
+ *
+ *	- The low byte is the number of bits that need to be removed from the
+ *	  bitstream; this makes this value easily accessible, and it enables the
+ *	  micro-optimization of doing 'bitsleft -= entry' instead of
+ *	  'bitsleft -= (u8)entry'.  It also includes the number of extra bits,
+ *	  so they don't need to be removed separately.
+ *
+ *	- The flags in bits 15-13 are arranged to be 0 when the
+ *	  "remaining codeword length" in bits 11-8 is needed, making this value
+ *	  fairly easily accessible as well via a shift and downcast.
+ *
+ *	- Similarly, bits 13-12 are 0 when the "subtable bits" in bits 11-8 are
+ *	  needed, making it possible to extract this value with '& 0x3F' rather
+ *	  than '& 0xF'.  This value is only used as a shift amount, so this can
+ *	  save an 'and' instruction as the masking by 0x3F happens implicitly.
+ *
+ * litlen_decode_results[] contains the static part of the entry for each
+ * symbol.  make_decode_table_entry() produces the final entries.
+ */
+static const u32 litlen_decode_results[] = {
+
+	/* Literals: symbols 0..255, one entry each (index == symbol) */
+#define ENTRY(literal)	(HUFFDEC_LITERAL | ((u32)literal << 16))
+	ENTRY(0)   , ENTRY(1)   , ENTRY(2)   , ENTRY(3)   ,
+	ENTRY(4)   , ENTRY(5)   , ENTRY(6)   , ENTRY(7)   ,
+	ENTRY(8)   , ENTRY(9)   , ENTRY(10)  , ENTRY(11)  ,
+	ENTRY(12)  , ENTRY(13)  , ENTRY(14)  , ENTRY(15)  ,
+	ENTRY(16)  , ENTRY(17)  , ENTRY(18)  , ENTRY(19)  ,
+	ENTRY(20)  , ENTRY(21)  , ENTRY(22)  , ENTRY(23)  ,
+	ENTRY(24)  , ENTRY(25)  , ENTRY(26)  , ENTRY(27)  ,
+	ENTRY(28)  , ENTRY(29)  , ENTRY(30)  , ENTRY(31)  ,
+	ENTRY(32)  , ENTRY(33)  , ENTRY(34)  , ENTRY(35)  ,
+	ENTRY(36)  , ENTRY(37)  , ENTRY(38)  , ENTRY(39)  ,
+	ENTRY(40)  , ENTRY(41)  , ENTRY(42)  , ENTRY(43)  ,
+	ENTRY(44)  , ENTRY(45)  , ENTRY(46)  , ENTRY(47)  ,
+	ENTRY(48)  , ENTRY(49)  , ENTRY(50)  , ENTRY(51)  ,
+	ENTRY(52)  , ENTRY(53)  , ENTRY(54)  , ENTRY(55)  ,
+	ENTRY(56)  , ENTRY(57)  , ENTRY(58)  , ENTRY(59)  ,
+	ENTRY(60)  , ENTRY(61)  , ENTRY(62)  , ENTRY(63)  ,
+	ENTRY(64)  , ENTRY(65)  , ENTRY(66)  , ENTRY(67)  ,
+	ENTRY(68)  , ENTRY(69)  , ENTRY(70)  , ENTRY(71)  ,
+	ENTRY(72)  , ENTRY(73)  , ENTRY(74)  , ENTRY(75)  ,
+	ENTRY(76)  , ENTRY(77)  , ENTRY(78)  , ENTRY(79)  ,
+	ENTRY(80)  , ENTRY(81)  , ENTRY(82)  , ENTRY(83)  ,
+	ENTRY(84)  , ENTRY(85)  , ENTRY(86)  , ENTRY(87)  ,
+	ENTRY(88)  , ENTRY(89)  , ENTRY(90)  , ENTRY(91)  ,
+	ENTRY(92)  , ENTRY(93)  , ENTRY(94)  , ENTRY(95)  ,
+	ENTRY(96)  , ENTRY(97)  , ENTRY(98)  , ENTRY(99)  ,
+	ENTRY(100) , ENTRY(101) , ENTRY(102) , ENTRY(103) ,
+	ENTRY(104) , ENTRY(105) , ENTRY(106) , ENTRY(107) ,
+	ENTRY(108) , ENTRY(109) , ENTRY(110) , ENTRY(111) ,
+	ENTRY(112) , ENTRY(113) , ENTRY(114) , ENTRY(115) ,
+	ENTRY(116) , ENTRY(117) , ENTRY(118) , ENTRY(119) ,
+	ENTRY(120) , ENTRY(121) , ENTRY(122) , ENTRY(123) ,
+	ENTRY(124) , ENTRY(125) , ENTRY(126) , ENTRY(127) ,
+	ENTRY(128) , ENTRY(129) , ENTRY(130) , ENTRY(131) ,
+	ENTRY(132) , ENTRY(133) , ENTRY(134) , ENTRY(135) ,
+	ENTRY(136) , ENTRY(137) , ENTRY(138) , ENTRY(139) ,
+	ENTRY(140) , ENTRY(141) , ENTRY(142) , ENTRY(143) ,
+	ENTRY(144) , ENTRY(145) , ENTRY(146) , ENTRY(147) ,
+	ENTRY(148) , ENTRY(149) , ENTRY(150) , ENTRY(151) ,
+	ENTRY(152) , ENTRY(153) , ENTRY(154) , ENTRY(155) ,
+	ENTRY(156) , ENTRY(157) , ENTRY(158) , ENTRY(159) ,
+	ENTRY(160) , ENTRY(161) , ENTRY(162) , ENTRY(163) ,
+	ENTRY(164) , ENTRY(165) , ENTRY(166) , ENTRY(167) ,
+	ENTRY(168) , ENTRY(169) , ENTRY(170) , ENTRY(171) ,
+	ENTRY(172) , ENTRY(173) , ENTRY(174) , ENTRY(175) ,
+	ENTRY(176) , ENTRY(177) , ENTRY(178) , ENTRY(179) ,
+	ENTRY(180) , ENTRY(181) , ENTRY(182) , ENTRY(183) ,
+	ENTRY(184) , ENTRY(185) , ENTRY(186) , ENTRY(187) ,
+	ENTRY(188) , ENTRY(189) , ENTRY(190) , ENTRY(191) ,
+	ENTRY(192) , ENTRY(193) , ENTRY(194) , ENTRY(195) ,
+	ENTRY(196) , ENTRY(197) , ENTRY(198) , ENTRY(199) ,
+	ENTRY(200) , ENTRY(201) , ENTRY(202) , ENTRY(203) ,
+	ENTRY(204) , ENTRY(205) , ENTRY(206) , ENTRY(207) ,
+	ENTRY(208) , ENTRY(209) , ENTRY(210) , ENTRY(211) ,
+	ENTRY(212) , ENTRY(213) , ENTRY(214) , ENTRY(215) ,
+	ENTRY(216) , ENTRY(217) , ENTRY(218) , ENTRY(219) ,
+	ENTRY(220) , ENTRY(221) , ENTRY(222) , ENTRY(223) ,
+	ENTRY(224) , ENTRY(225) , ENTRY(226) , ENTRY(227) ,
+	ENTRY(228) , ENTRY(229) , ENTRY(230) , ENTRY(231) ,
+	ENTRY(232) , ENTRY(233) , ENTRY(234) , ENTRY(235) ,
+	ENTRY(236) , ENTRY(237) , ENTRY(238) , ENTRY(239) ,
+	ENTRY(240) , ENTRY(241) , ENTRY(242) , ENTRY(243) ,
+	ENTRY(244) , ENTRY(245) , ENTRY(246) , ENTRY(247) ,
+	ENTRY(248) , ENTRY(249) , ENTRY(250) , ENTRY(251) ,
+	ENTRY(252) , ENTRY(253) , ENTRY(254) , ENTRY(255) ,
+#undef ENTRY
+
+	/* End of block: symbol 256; has no value field, only the two flags */
+	HUFFDEC_EXCEPTIONAL | HUFFDEC_END_OF_BLOCK,
+
+	/* Lengths: symbols 257..287; the three trailing 258 entries are symbol 285 plus symbols 286-287, which RFC 1951 says never occur */
+#define ENTRY(length_base, num_extra_bits)	\
+	(((u32)(length_base) << 16) | (num_extra_bits))
+	ENTRY(3  , 0) , ENTRY(4  , 0) , ENTRY(5  , 0) , ENTRY(6  , 0),
+	ENTRY(7  , 0) , ENTRY(8  , 0) , ENTRY(9  , 0) , ENTRY(10 , 0),
+	ENTRY(11 , 1) , ENTRY(13 , 1) , ENTRY(15 , 1) , ENTRY(17 , 1),
+	ENTRY(19 , 2) , ENTRY(23 , 2) , ENTRY(27 , 2) , ENTRY(31 , 2),
+	ENTRY(35 , 3) , ENTRY(43 , 3) , ENTRY(51 , 3) , ENTRY(59 , 3),
+	ENTRY(67 , 4) , ENTRY(83 , 4) , ENTRY(99 , 4) , ENTRY(115, 4),
+	ENTRY(131, 5) , ENTRY(163, 5) , ENTRY(195, 5) , ENTRY(227, 5),
+	ENTRY(258, 0) , ENTRY(258, 0) , ENTRY(258, 0) ,
+#undef ENTRY
+};
+
+/* Upper bounds on the bits consumed by one match offset (codeword + extra bits) */
+#define OFFSET_MAXBITS		(DEFLATE_MAX_OFFSET_CODEWORD_LEN + \
+				 DEFLATE_MAX_EXTRA_OFFSET_BITS)
+#define OFFSET_MAXFASTBITS	(OFFSET_TABLEBITS /* no subtable needed */ + \
+				 DEFLATE_MAX_EXTRA_OFFSET_BITS)
+
+/*
+ * Here is the format of our offset decode table entries.  Bits not explicitly
+ * described contain zeroes:
+ *
+ *	Offsets:
+ *		Bit 31-16:  offset base value
+ *		Bit 15:     0 (!HUFFDEC_EXCEPTIONAL)
+ *		Bit 14:     0 (!HUFFDEC_SUBTABLE_POINTER)
+ *		Bit 11-8:   remaining codeword length
+ *		Bit 4-0:    remaining codeword length + number of extra bits
+ *	Subtable pointer:
+ *		Bit 31-16:  index of start of subtable
+ *		Bit 15:     1 (HUFFDEC_EXCEPTIONAL)
+ *		Bit 14:     1 (HUFFDEC_SUBTABLE_POINTER)
+ *		Bit 11-8:   number of subtable bits
+ *		Bit 3-0:    number of main table bits
+ *
+ * These work the same way as the length entries and subtable pointer entries in
+ * the litlen decode table; see litlen_decode_results[] above.
+ */
+static const u32 offset_decode_results[] = { /* indexed by offset symbol */
+#define ENTRY(offset_base, num_extra_bits)	\
+	(((u32)(offset_base) << 16) | (num_extra_bits))
+	ENTRY(1     , 0)  , ENTRY(2     , 0)  , ENTRY(3     , 0)  , ENTRY(4     , 0)  ,
+	ENTRY(5     , 1)  , ENTRY(7     , 1)  , ENTRY(9     , 2)  , ENTRY(13    , 2) ,
+	ENTRY(17    , 3)  , ENTRY(25    , 3)  , ENTRY(33    , 4)  , ENTRY(49    , 4)  ,
+	ENTRY(65    , 5)  , ENTRY(97    , 5)  , ENTRY(129   , 6)  , ENTRY(193   , 6)  ,
+	ENTRY(257   , 7)  , ENTRY(385   , 7)  , ENTRY(513   , 8)  , ENTRY(769   , 8)  ,
+	ENTRY(1025  , 9)  , ENTRY(1537  , 9)  , ENTRY(2049  , 10) , ENTRY(3073  , 10) ,
+	ENTRY(4097  , 11) , ENTRY(6145  , 11) , ENTRY(8193  , 12) , ENTRY(12289 , 12) ,
+	ENTRY(16385 , 13) , ENTRY(24577 , 13) , ENTRY(24577 , 13) , ENTRY(24577 , 13) , /* symbols 30 and 31 reuse symbol 29's entry */
+#undef ENTRY
+};
+
+/*
+ * The main DEFLATE decompressor structure.  Since libdeflate only supports
+ * full-buffer decompression, this structure doesn't store the entire
+ * decompression state, most of which is in stack variables.  Instead, this
+ * struct just contains the decode tables and some temporary arrays used for
+ * building them, as these are too large to comfortably allocate on the stack.
+ *
+ * Storing the decode tables in the decompressor struct also allows the decode
+ * tables for the static codes to be reused whenever two static Huffman blocks
+ * are decoded without an intervening dynamic block, even across streams.
+ */
+struct libdeflate_decompressor {
+
+	/*
+	 * The arrays aren't all needed at the same time.  'precode_lens' and
+	 * 'precode_decode_table' are unneeded after 'lens' has been filled.
+	 * Furthermore, 'lens' need not be retained after building the litlen
+	 * and offset decode tables.  In fact, 'lens' can be in union with
+	 * 'litlen_decode_table' provided that 'offset_decode_table' is separate
+	 * and is built first.
+	 */
+
+	union {
+		u8 precode_lens[DEFLATE_NUM_PRECODE_SYMS];
+
+		struct {
+			u8 lens[DEFLATE_NUM_LITLEN_SYMS +
+				DEFLATE_NUM_OFFSET_SYMS +
+				DEFLATE_MAX_LENS_OVERRUN];
+
+			u32 precode_decode_table[PRECODE_ENOUGH];
+		} l;
+
+		u32 litlen_decode_table[LITLEN_ENOUGH];
+	} u;
+
+	u32 offset_decode_table[OFFSET_ENOUGH];
+
+	/* used only during build_decode_table() */
+	u16 sorted_syms[DEFLATE_MAX_NUM_SYMS];
+
+	bool static_codes_loaded; /* set once the static-code tables are built; cleared by a dynamic block */
+	unsigned litlen_tablebits; /* main-table bits actually used for the litlen table */
+
+	/* The free() function for this struct, chosen at allocation time */
+	free_func_t free_func;
+};
+
+/*
+ * Build a table for fast decoding of symbols from a Huffman code.  As input,
+ * this function takes the codeword length of each symbol which may be used in
+ * the code.  As output, it produces a decode table for the canonical Huffman
+ * code described by the codeword lengths.  The decode table is built with the
+ * assumption that it will be indexed with "bit-reversed" codewords, where the
+ * low-order bit is the first bit of the codeword.  This format is used for all
+ * Huffman codes in DEFLATE.
+ *
+ * @decode_table
+ *	The array in which the decode table will be generated.  This array must
+ *	have sufficient length; see the definition of the ENOUGH numbers.
+ * @lens
+ *	An array which provides, for each symbol, the length of the
+ *	corresponding codeword in bits, or 0 if the symbol is unused.  This may
+ *	alias @decode_table, since nothing is written to @decode_table until all
+ *	@lens have been consumed.  All codeword lengths are assumed to be <=
+ *	@max_codeword_len but are otherwise considered untrusted.  If they do
+ *	not form a valid Huffman code, then the decode table is not built and
+ *	%false is returned.
+ * @num_syms
+ *	The number of symbols in the code, including all unused symbols.
+ * @decode_results
+ *	An array which gives the incomplete decode result for each symbol.  The
+ *	needed values in this array will be combined with codeword lengths to
+ *	make the final decode table entries using make_decode_table_entry().
+ * @table_bits
+ *	The log base-2 of the number of main table entries to use.
+ *	If @table_bits_ret != NULL, then @table_bits is treated as a maximum
+ *	value and it will be decreased if a smaller table would be sufficient.
+ * @max_codeword_len
+ *	The maximum allowed codeword length for this Huffman code.
+ *	Must be <= DEFLATE_MAX_CODEWORD_LEN.
+ * @sorted_syms
+ *	A temporary array of length @num_syms.
+ * @table_bits_ret
+ *	If non-NULL, dynamic table_bits is enabled and the table_bits actually
+ *	used is stored here.  It is written before the code is validated.
+ *
+ * Returns %true if successful; %false if the codeword lengths do not form a
+ * valid Huffman code.
+ */
+static bool
+build_decode_table(u32 decode_table[],
+		   const u8 lens[],
+		   const unsigned num_syms,
+		   const u32 decode_results[],
+		   unsigned table_bits,
+		   unsigned max_codeword_len,
+		   u16 *sorted_syms,
+		   unsigned *table_bits_ret)
+{
+	unsigned len_counts[DEFLATE_MAX_CODEWORD_LEN + 1];
+	unsigned offsets[DEFLATE_MAX_CODEWORD_LEN + 1];
+	unsigned sym;		/* current symbol */
+	unsigned codeword;	/* current codeword, bit-reversed */
+	unsigned len;		/* current codeword length in bits */
+	unsigned count;		/* num codewords remaining with this length */
+	u32 codespace_used;	/* codespace used out of '2^max_codeword_len' */
+	unsigned cur_table_end; /* end index of current table */
+	unsigned subtable_prefix; /* codeword prefix of current subtable */
+	unsigned subtable_start;  /* start index of current subtable */
+	unsigned subtable_bits;   /* log2 of current subtable length */
+
+	/* Count how many codewords have each length, including 0. */
+	for (len = 0; len <= max_codeword_len; len++)
+		len_counts[len] = 0;
+	for (sym = 0; sym < num_syms; sym++)
+		len_counts[lens[sym]]++;
+
+	/*
+	 * Determine the actual maximum codeword length that was used, and
+	 * decrease table_bits to it if allowed.
+	 */
+	while (max_codeword_len > 1 && len_counts[max_codeword_len] == 0)
+		max_codeword_len--;
+	if (table_bits_ret != NULL) {
+		table_bits = MIN(table_bits, max_codeword_len);
+		*table_bits_ret = table_bits;
+	}
+
+	/*
+	 * Sort the symbols primarily by increasing codeword length and
+	 * secondarily by increasing symbol value; or equivalently by their
+	 * codewords in lexicographic order, since a canonical code is assumed.
+	 *
+	 * For efficiency, also compute 'codespace_used' in the same pass over
+	 * 'len_counts[]' used to build 'offsets[]' for sorting.
+	 */
+
+	/* Ensure that 'codespace_used' cannot overflow. */
+	STATIC_ASSERT(sizeof(codespace_used) == 4);
+	STATIC_ASSERT(UINT32_MAX / (1U << (DEFLATE_MAX_CODEWORD_LEN - 1)) >=
+		      DEFLATE_MAX_NUM_SYMS);
+
+	offsets[0] = 0;
+	offsets[1] = len_counts[0];
+	codespace_used = 0;
+	for (len = 1; len < max_codeword_len; len++) {
+		offsets[len + 1] = offsets[len] + len_counts[len];
+		codespace_used = (codespace_used << 1) + len_counts[len];
+	}
+	codespace_used = (codespace_used << 1) + len_counts[len]; /* len == max_codeword_len */
+
+	for (sym = 0; sym < num_syms; sym++)
+		sorted_syms[offsets[lens[sym]]++] = sym;
+
+	sorted_syms += offsets[0]; /* Skip unused symbols (offsets[0] == their count) */
+
+	/* lens[] is done being used, so we can write to decode_table[] now. */
+
+	/*
+	 * Check whether the lengths form a complete code (exactly fills the
+	 * codespace), an incomplete code (doesn't fill the codespace), or an
+	 * overfull code (overflows the codespace).  A codeword of length 'n'
+	 * uses proportion '1/(2^n)' of the codespace.  An overfull code is
+	 * nonsensical, so is considered invalid.  An incomplete code is
+	 * considered valid only in two specific cases; see below.
+	 */
+
+	/* overfull code? */
+	if (unlikely(codespace_used > (1U << max_codeword_len)))
+		return false;
+
+	/* incomplete code? */
+	if (unlikely(codespace_used < (1U << max_codeword_len))) {
+		u32 entry;
+		unsigned i;
+
+		if (codespace_used == 0) {
+			/*
+			 * An empty code is allowed.  This can happen for the
+			 * offset code in DEFLATE, since a dynamic Huffman block
+			 * need not contain any matches.
+			 */
+
+			/* sym=0, len=1 (arbitrary) */
+			entry = make_decode_table_entry(decode_results, 0, 1);
+		} else {
+			/*
+			 * Allow codes with a single used symbol, with codeword
+			 * length 1.  The DEFLATE RFC is unclear regarding this
+			 * case.  What zlib's decompressor does is permit this
+			 * for the litlen and offset codes and assume the
+			 * codeword is '0' rather than '1'.  We do the same
+			 * except we allow this for precodes too, since there's
+			 * no convincing reason to treat the codes differently.
+			 * We also assign both codewords '0' and '1' to the
+			 * symbol to avoid having to handle '1' specially.
+			 */
+			if (codespace_used != (1U << (max_codeword_len - 1)) ||
+			    len_counts[1] != 1)
+				return false;
+			entry = make_decode_table_entry(decode_results,
+							*sorted_syms, 1);
+		}
+		/*
+		 * Note: the decode table still must be fully initialized, in
+		 * case the stream is malformed and contains bits from the part
+		 * of the codespace the incomplete code doesn't use.
+		 */
+		for (i = 0; i < (1U << table_bits); i++)
+			decode_table[i] = entry;
+		return true;
+	}
+
+	/*
+	 * The lengths form a complete code.  Now, enumerate the codewords in
+	 * lexicographic order and fill the decode table entries for each one.
+	 *
+	 * First, process all codewords with len <= table_bits.  Each one gets
+	 * '2^(table_bits-len)' direct entries in the table.
+	 *
+	 * Since DEFLATE uses bit-reversed codewords, these entries aren't
+	 * consecutive but rather are spaced '2^len' entries apart.  This makes
+	 * filling them naively somewhat awkward and inefficient, since strided
+	 * stores are less cache-friendly and preclude the use of word or
+	 * vector-at-a-time stores to fill multiple entries per instruction.
+	 *
+	 * To optimize this, we incrementally double the table size.  When
+	 * processing codewords with length 'len', the table is treated as
+	 * having only '2^len' entries, so each codeword uses just one entry.
+	 * Then, each time 'len' is incremented, the table size is doubled and
+	 * the first half is copied to the second half.  This significantly
+	 * improves performance over naively doing strided stores.
+	 *
+	 * Note that some entries copied for each table doubling may not have
+	 * been initialized yet, but it doesn't matter since they're guaranteed
+	 * to be initialized later (because the Huffman code is complete).
+	 */
+	codeword = 0;
+	len = 1;
+	while ((count = len_counts[len]) == 0)
+		len++;
+	cur_table_end = 1U << len;
+	while (len <= table_bits) {
+		/* Process all 'count' codewords with length 'len' bits. */
+		do {
+			unsigned bit;
+
+			/* Fill the first entry for the current codeword. */
+			decode_table[codeword] =
+				make_decode_table_entry(decode_results,
+							*sorted_syms++, len);
+
+			if (codeword == cur_table_end - 1) {
+				/* Last codeword (all 1's) */
+				for (; len < table_bits; len++) {
+					memcpy(&decode_table[cur_table_end],
+					       decode_table,
+					       cur_table_end *
+						sizeof(decode_table[0]));
+					cur_table_end <<= 1;
+				}
+				return true;
+			}
+			/*
+			 * To advance to the lexicographically next codeword in
+			 * the canonical code, the codeword must be incremented,
+			 * then 0's must be appended to the codeword as needed
+			 * to match the next codeword's length.
+			 *
+			 * Since the codeword is bit-reversed, appending 0's is
+			 * a no-op.  However, incrementing it is nontrivial.  To
+			 * do so efficiently, use the 'bsr' instruction to find
+			 * the last (highest order) 0 bit in the codeword, set
+			 * it, and clear any later (higher order) 1 bits.  But
+			 * 'bsr' actually finds the highest order 1 bit, so to
+			 * use it first flip all bits in the codeword by XOR'ing
+			 * it with (1U << len) - 1 == cur_table_end - 1.
+			 */
+			bit = 1U << bsr32(codeword ^ (cur_table_end - 1));
+			codeword &= bit - 1;
+			codeword |= bit;
+		} while (--count);
+
+		/* Advance to the next codeword length. */
+		do {
+			if (++len <= table_bits) {
+				memcpy(&decode_table[cur_table_end],
+				       decode_table,
+				       cur_table_end * sizeof(decode_table[0]));
+				cur_table_end <<= 1;
+			}
+		} while ((count = len_counts[len]) == 0);
+	}
+
+	/* Process codewords with len > table_bits.  These require subtables. */
+	cur_table_end = 1U << table_bits;
+	subtable_prefix = -1; /* no subtable yet; differs from any masked prefix */
+	subtable_start = 0;
+	for (;;) {
+		u32 entry;
+		unsigned i;
+		unsigned stride;
+		unsigned bit;
+
+		/*
+		 * Start a new subtable if the first 'table_bits' bits of the
+		 * codeword don't match the prefix of the current subtable.
+		 */
+		if ((codeword & ((1U << table_bits) - 1)) != subtable_prefix) {
+			subtable_prefix = (codeword & ((1U << table_bits) - 1));
+			subtable_start = cur_table_end;
+			/*
+			 * Calculate the subtable length.  If the codeword has
+			 * length 'table_bits + n', then the subtable needs
+			 * '2^n' entries.  But it may need more; if fewer than
+			 * '2^n' codewords of length 'table_bits + n' remain,
+			 * then the length will need to be incremented to bring
+			 * in longer codewords until the subtable can be
+			 * completely filled.  Note that because the Huffman
+			 * code is complete, it will always be possible to fill
+			 * the subtable eventually.
+			 */
+			subtable_bits = len - table_bits;
+			codespace_used = count;
+			while (codespace_used < (1U << subtable_bits)) {
+				subtable_bits++;
+				codespace_used = (codespace_used << 1) +
+					len_counts[table_bits + subtable_bits];
+			}
+			cur_table_end = subtable_start + (1U << subtable_bits);
+
+			/*
+			 * Create the entry that points from the main table to
+			 * the subtable.
+			 */
+			decode_table[subtable_prefix] =
+				((u32)subtable_start << 16) |
+				HUFFDEC_EXCEPTIONAL |
+				HUFFDEC_SUBTABLE_POINTER |
+				(subtable_bits << 8) | table_bits;
+		}
+
+		/* Fill the subtable entries for the current codeword. */
+		entry = make_decode_table_entry(decode_results, *sorted_syms++,
+						len - table_bits);
+		i = subtable_start + (codeword >> table_bits);
+		stride = 1U << (len - table_bits);
+		do {
+			decode_table[i] = entry;
+			i += stride;
+		} while (i < cur_table_end);
+
+		/* Advance to the next codeword. */
+		if (codeword == (1U << len) - 1) /* last codeword (all 1's)? */
+			return true;
+		bit = 1U << bsr32(codeword ^ ((1U << len) - 1));
+		codeword &= bit - 1;
+		codeword |= bit;
+		count--;
+		while (count == 0) /* move on to the next length that has codewords */
+			count = len_counts[++len];
+	}
+}
+
+/* Build the precode decode table in @d from the lengths in d->u.precode_lens. */
+static bool
+build_precode_decode_table(struct libdeflate_decompressor *d)
+{
+	/* When you change TABLEBITS, you must change ENOUGH, and vice versa! */
+	STATIC_ASSERT(PRECODE_TABLEBITS == 7 && PRECODE_ENOUGH == 128);
+
+	STATIC_ASSERT(ARRAY_LEN(precode_decode_results) ==
+		      DEFLATE_NUM_PRECODE_SYMS);
+
+	return build_decode_table(d->u.l.precode_decode_table,
+				  d->u.precode_lens,
+				  DEFLATE_NUM_PRECODE_SYMS,
+				  precode_decode_results,
+				  PRECODE_TABLEBITS,
+				  DEFLATE_MAX_PRE_CODEWORD_LEN,
+				  d->sorted_syms,
+				  NULL); /* no table_bits_ret: table_bits stays fixed */
+}
+
+/* Build the literal/length decode table from the first lens in d->u.l.lens. */
+static bool
+build_litlen_decode_table(struct libdeflate_decompressor *d,
+			  unsigned num_litlen_syms, unsigned num_offset_syms)
+{
+	/* When you change TABLEBITS, you must change ENOUGH, and vice versa! */
+	STATIC_ASSERT(LITLEN_TABLEBITS == 11 && LITLEN_ENOUGH == 2342);
+
+	STATIC_ASSERT(ARRAY_LEN(litlen_decode_results) ==
+		      DEFLATE_NUM_LITLEN_SYMS);
+	/* The table shares union 'u' with the lens; num_offset_syms is unused. */
+	return build_decode_table(d->u.litlen_decode_table,
+				  d->u.l.lens,
+				  num_litlen_syms,
+				  litlen_decode_results,
+				  LITLEN_TABLEBITS,
+				  DEFLATE_MAX_LITLEN_CODEWORD_LEN,
+				  d->sorted_syms,
+				  &d->litlen_tablebits); /* receives the table_bits used */
+}
+
+/* Build the offset decode table from the lens that follow the litlen lens. */
+static bool
+build_offset_decode_table(struct libdeflate_decompressor *d,
+			  unsigned num_litlen_syms, unsigned num_offset_syms)
+{
+	/* When you change TABLEBITS, you must change ENOUGH, and vice versa! */
+	STATIC_ASSERT(OFFSET_TABLEBITS == 8 && OFFSET_ENOUGH == 402);
+
+	STATIC_ASSERT(ARRAY_LEN(offset_decode_results) ==
+		      DEFLATE_NUM_OFFSET_SYMS);
+
+	return build_decode_table(d->offset_decode_table,
+				  d->u.l.lens + num_litlen_syms,
+				  num_offset_syms,
+				  offset_decode_results,
+				  OFFSET_TABLEBITS,
+				  DEFLATE_MAX_OFFSET_CODEWORD_LEN,
+				  d->sorted_syms,
+				  NULL); /* no table_bits_ret: table_bits stays fixed */
+}
+
+/*****************************************************************************
+ *                         Main decompression routine
+ *****************************************************************************/
+/* Pointer to a decompression routine; same parameters as FUNCNAME below. */
+typedef enum libdeflate_result (*decompress_func_t)
+	(struct libdeflate_decompressor * restrict d,
+	 const void * restrict in, size_t in_nbytes,
+	 void * restrict out, size_t out_nbytes_avail,
+	 size_t *actual_in_nbytes_ret, size_t *actual_out_nbytes_ret);
+/* Instantiate the template below with the default ATTRIBUTES and extractors. */
+#define FUNCNAME deflate_decompress_default
+#undef ATTRIBUTES
+#undef EXTRACT_VARBITS
+#undef EXTRACT_VARBITS8
+/*
+ * decompress_template.h
+ *
+ * Copyright 2016 Eric Biggers
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+/*
+ * The actual DEFLATE decompression routine, lifted out of deflate_decompress.c
+ * so it can be compiled multiple times with different target instruction sets.
+ * Each build names it via FUNCNAME; the optional macros below get defaults.
+ */
+
+#ifndef ATTRIBUTES
+#  define ATTRIBUTES
+#endif
+#ifndef EXTRACT_VARBITS
+#  define EXTRACT_VARBITS(word, count)	((word) & BITMASK(count))
+#endif
+#ifndef EXTRACT_VARBITS8
+#  define EXTRACT_VARBITS8(word, count)	((word) & BITMASK((u8)(count)))
+#endif
+
+static enum libdeflate_result ATTRIBUTES MAYBE_UNUSED
+FUNCNAME(struct libdeflate_decompressor * restrict d,
+	 const void * restrict in, size_t in_nbytes,
+	 void * restrict out, size_t out_nbytes_avail,
+	 size_t *actual_in_nbytes_ret, size_t *actual_out_nbytes_ret)
+{
+	u8 *out_next = out;
+	u8 * const out_end = out_next + out_nbytes_avail;
+	u8 * const out_fastloop_end =
+		out_end - MIN(out_nbytes_avail, FASTLOOP_MAX_BYTES_WRITTEN);
+
+	/* Input bitstream state; see deflate_decompress.c for documentation */
+	const u8 *in_next = in;
+	const u8 * const in_end = in_next + in_nbytes;
+	const u8 * const in_fastloop_end =
+		in_end - MIN(in_nbytes, FASTLOOP_MAX_BYTES_READ);
+	bitbuf_t bitbuf = 0;
+	bitbuf_t saved_bitbuf;
+	u32 bitsleft = 0;
+	size_t overread_count = 0;
+
+	bool is_final_block;
+	unsigned block_type;
+	unsigned num_litlen_syms;
+	unsigned num_offset_syms;
+	bitbuf_t litlen_tablemask;
+	u32 entry;
+
+next_block:
+	/* Starting to read the next block */
+	;
+
+	STATIC_ASSERT(CAN_CONSUME(1 + 2 + 5 + 5 + 4 + 3));
+	REFILL_BITS();
+
+	/* BFINAL: 1 bit */
+	is_final_block = bitbuf & BITMASK(1);
+
+	/* BTYPE: 2 bits */
+	block_type = (bitbuf >> 1) & BITMASK(2);
+
+	if (block_type == DEFLATE_BLOCKTYPE_DYNAMIC_HUFFMAN) {
+
+		/* Dynamic Huffman block */
+
+		/* The order in which precode lengths are stored */
+		static const u8 deflate_precode_lens_permutation[DEFLATE_NUM_PRECODE_SYMS] = {
+			16, 17, 18, 0, 8, 7, 9, 6, 10, 5, 11, 4, 12, 3, 13, 2, 14, 1, 15
+		};
+
+		unsigned num_explicit_precode_lens;
+		unsigned i;
+
+		/* Read the codeword length counts. */
+
+		STATIC_ASSERT(DEFLATE_NUM_LITLEN_SYMS == 257 + BITMASK(5));
+		num_litlen_syms = 257 + ((bitbuf >> 3) & BITMASK(5));
+
+		STATIC_ASSERT(DEFLATE_NUM_OFFSET_SYMS == 1 + BITMASK(5));
+		num_offset_syms = 1 + ((bitbuf >> 8) & BITMASK(5));
+
+		STATIC_ASSERT(DEFLATE_NUM_PRECODE_SYMS == 4 + BITMASK(4));
+		num_explicit_precode_lens = 4 + ((bitbuf >> 13) & BITMASK(4));
+
+		d->static_codes_loaded = false;
+
+		/*
+		 * Read the precode codeword lengths.
+		 *
+		 * A 64-bit bitbuffer is just one bit too small to hold the
+		 * maximum number of precode lens, so to minimize branches we
+		 * merge one len with the previous fields.
+		 */
+		STATIC_ASSERT(DEFLATE_MAX_PRE_CODEWORD_LEN == (1 << 3) - 1);
+		if (CAN_CONSUME(3 * (DEFLATE_NUM_PRECODE_SYMS - 1))) {
+			d->u.precode_lens[deflate_precode_lens_permutation[0]] =
+				(bitbuf >> 17) & BITMASK(3);
+			bitbuf >>= 20;
+			bitsleft -= 20;
+			REFILL_BITS();
+			i = 1;
+			do {
+				d->u.precode_lens[deflate_precode_lens_permutation[i]] =
+					bitbuf & BITMASK(3);
+				bitbuf >>= 3;
+				bitsleft -= 3;
+			} while (++i < num_explicit_precode_lens);
+		} else {
+			bitbuf >>= 17;
+			bitsleft -= 17;
+			i = 0;
+			do {
+				if ((u8)bitsleft < 3)
+					REFILL_BITS();
+				d->u.precode_lens[deflate_precode_lens_permutation[i]] =
+					bitbuf & BITMASK(3);
+				bitbuf >>= 3;
+				bitsleft -= 3;
+			} while (++i < num_explicit_precode_lens);
+		}
+		for (; i < DEFLATE_NUM_PRECODE_SYMS; i++)
+			d->u.precode_lens[deflate_precode_lens_permutation[i]] = 0;
+
+		/* Build the decode table for the precode. */
+		SAFETY_CHECK(build_precode_decode_table(d));
+
+		/* Decode the litlen and offset codeword lengths. */
+		i = 0;
+		do {
+			unsigned presym;
+			u8 rep_val;
+			unsigned rep_count;
+
+			if ((u8)bitsleft < DEFLATE_MAX_PRE_CODEWORD_LEN + 7)
+				REFILL_BITS();
+
+			/*
+			 * The code below assumes that the precode decode table
+			 * doesn't have any subtables.
+			 */
+			STATIC_ASSERT(PRECODE_TABLEBITS == DEFLATE_MAX_PRE_CODEWORD_LEN);
+
+			/* Decode the next precode symbol. */
+			entry = d->u.l.precode_decode_table[
+				bitbuf & BITMASK(DEFLATE_MAX_PRE_CODEWORD_LEN)];
+			bitbuf >>= (u8)entry;
+			bitsleft -= entry; /* optimization: subtract full entry */
+			presym = entry >> 16;
+
+			if (presym < 16) {
+				/* Explicit codeword length */
+				d->u.l.lens[i++] = presym;
+				continue;
+			}
+
+			/* Run-length encoded codeword lengths */
+
+			/*
+			 * Note: we don't need to immediately verify that the
+			 * repeat count doesn't overflow the number of elements,
+			 * since we've sized the lens array to have enough extra
+			 * space to allow for the worst-case overrun (138 zeroes
+			 * when only 1 length was remaining).
+			 *
+			 * In the case of the small repeat counts (presyms 16
+			 * and 17), it is fastest to always write the maximum
+			 * number of entries.  That gets rid of branches that
+			 * would otherwise be required.
+			 *
+			 * It is not just because of the numerical order that
+			 * our checks go in the order 'presym < 16', 'presym ==
+			 * 16', and 'presym == 17'.  For typical data this is
+			 * ordered from most frequent to least frequent case.
+			 */
+			STATIC_ASSERT(DEFLATE_MAX_LENS_OVERRUN == 138 - 1);
+
+			if (presym == 16) {
+				/* Repeat the previous length 3 - 6 times. */
+				SAFETY_CHECK(i != 0);
+				rep_val = d->u.l.lens[i - 1];
+				STATIC_ASSERT(3 + BITMASK(2) == 6);
+				rep_count = 3 + (bitbuf & BITMASK(2));
+				bitbuf >>= 2;
+				bitsleft -= 2;
+				d->u.l.lens[i + 0] = rep_val;
+				d->u.l.lens[i + 1] = rep_val;
+				d->u.l.lens[i + 2] = rep_val;
+				d->u.l.lens[i + 3] = rep_val;
+				d->u.l.lens[i + 4] = rep_val;
+				d->u.l.lens[i + 5] = rep_val;
+				i += rep_count;
+			} else if (presym == 17) {
+				/* Repeat zero 3 - 10 times. */
+				STATIC_ASSERT(3 + BITMASK(3) == 10);
+				rep_count = 3 + (bitbuf & BITMASK(3));
+				bitbuf >>= 3;
+				bitsleft -= 3;
+				d->u.l.lens[i + 0] = 0;
+				d->u.l.lens[i + 1] = 0;
+				d->u.l.lens[i + 2] = 0;
+				d->u.l.lens[i + 3] = 0;
+				d->u.l.lens[i + 4] = 0;
+				d->u.l.lens[i + 5] = 0;
+				d->u.l.lens[i + 6] = 0;
+				d->u.l.lens[i + 7] = 0;
+				d->u.l.lens[i + 8] = 0;
+				d->u.l.lens[i + 9] = 0;
+				i += rep_count;
+			} else {
+				/* Repeat zero 11 - 138 times. */
+				STATIC_ASSERT(11 + BITMASK(7) == 138);
+				rep_count = 11 + (bitbuf & BITMASK(7));
+				bitbuf >>= 7;
+				bitsleft -= 7;
+				memset(&d->u.l.lens[i], 0,
+				       rep_count * sizeof(d->u.l.lens[i]));
+				i += rep_count;
+			}
+		} while (i < num_litlen_syms + num_offset_syms);
+
+		/* Unnecessary, but check this for consistency with zlib. */
+		SAFETY_CHECK(i == num_litlen_syms + num_offset_syms);
+
+	} else if (block_type == DEFLATE_BLOCKTYPE_UNCOMPRESSED) {
+		u16 len, nlen;
+
+		/*
+		 * Uncompressed block: copy 'len' bytes literally from the input
+		 * buffer to the output buffer.
+		 */
+
+		bitsleft -= 3; /* for BTYPE and BFINAL */
+
+		/*
+		 * Align the bitstream to the next byte boundary.  This means
+		 * the next byte boundary as if we were reading a byte at a
+		 * time.  Therefore, we have to rewind 'in_next' by any bytes
+		 * that have been refilled but not actually consumed yet (not
+		 * counting overread bytes, which don't increment 'in_next').
+		 */
+		bitsleft = (u8)bitsleft;
+		SAFETY_CHECK(overread_count <= (bitsleft >> 3));
+		in_next -= (bitsleft >> 3) - overread_count;
+		overread_count = 0;
+		bitbuf = 0;
+		bitsleft = 0;
+
+		SAFETY_CHECK(in_end - in_next >= 4);
+		len = get_unaligned_le16(in_next);
+		nlen = get_unaligned_le16(in_next + 2);
+		in_next += 4;
+
+		SAFETY_CHECK(len == (u16)~nlen);
+		if (unlikely(len > out_end - out_next))
+			return LIBDEFLATE_INSUFFICIENT_SPACE;
+		SAFETY_CHECK(len <= in_end - in_next);
+
+		memcpy(out_next, in_next, len);
+		in_next += len;
+		out_next += len;
+
+		goto block_done;
+
+	} else {
+		unsigned i;
+
+		SAFETY_CHECK(block_type == DEFLATE_BLOCKTYPE_STATIC_HUFFMAN);
+
+		/*
+		 * Static Huffman block: build the decode tables for the static
+		 * codes.  Skip doing so if the tables are already set up from
+		 * an earlier static block; this speeds up decompression of
+		 * degenerate input of many empty or very short static blocks.
+		 *
+		 * Afterwards, the remainder is the same as decompressing a
+		 * dynamic Huffman block.
+		 */
+
+		bitbuf >>= 3; /* for BTYPE and BFINAL */
+		bitsleft -= 3;
+
+		if (d->static_codes_loaded)
+			goto have_decode_tables;
+
+		d->static_codes_loaded = true;
+
+		STATIC_ASSERT(DEFLATE_NUM_LITLEN_SYMS == 288);
+		STATIC_ASSERT(DEFLATE_NUM_OFFSET_SYMS == 32);
+
+		for (i = 0; i < 144; i++)
+			d->u.l.lens[i] = 8;
+		for (; i < 256; i++)
+			d->u.l.lens[i] = 9;
+		for (; i < 280; i++)
+			d->u.l.lens[i] = 7;
+		for (; i < 288; i++)
+			d->u.l.lens[i] = 8;
+
+		for (; i < 288 + 32; i++)
+			d->u.l.lens[i] = 5;
+
+		num_litlen_syms = 288;
+		num_offset_syms = 32;
+	}
+
+	/* Decompressing a Huffman block (either dynamic or static) */
+
+	SAFETY_CHECK(build_offset_decode_table(d, num_litlen_syms, num_offset_syms));
+	SAFETY_CHECK(build_litlen_decode_table(d, num_litlen_syms, num_offset_syms));
+have_decode_tables:
+	litlen_tablemask = BITMASK(d->litlen_tablebits);
+
+	/*
+	 * This is the "fastloop" for decoding literals and matches.  It does
+	 * bounds checks on in_next and out_next in the loop conditions so that
+	 * additional bounds checks aren't needed inside the loop body.
+	 *
+	 * To reduce latency, the bitbuffer is refilled and the next litlen
+	 * decode table entry is preloaded before each loop iteration.
+	 */
+	if (in_next >= in_fastloop_end || out_next >= out_fastloop_end)
+		goto generic_loop;
+	REFILL_BITS_IN_FASTLOOP();
+	entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+	do {
+		u32 length, offset, lit;
+		const u8 *src;
+		u8 *dst;
+
+		/*
+		 * Consume the bits for the litlen decode table entry.  Save the
+		 * original bitbuf for later, in case the extra match length
+		 * bits need to be extracted from it.
+		 */
+		saved_bitbuf = bitbuf;
+		bitbuf >>= (u8)entry;
+		bitsleft -= entry; /* optimization: subtract full entry */
+
+		/*
+		 * Begin by checking for a "fast" literal, i.e. a literal that
+		 * doesn't need a subtable.
+		 */
+		if (entry & HUFFDEC_LITERAL) {
+			/*
+			 * On 64-bit platforms, we decode up to 2 extra fast
+			 * literals in addition to the primary item, as this
+			 * increases performance and still leaves enough bits
+			 * remaining for what follows.  We could actually do 3,
+			 * assuming LITLEN_TABLEBITS=11, but that actually
+			 * decreases performance slightly (perhaps by messing
+			 * with the branch prediction of the conditional refill
+			 * that happens later while decoding the match offset).
+			 *
+			 * Note: the definitions of FASTLOOP_MAX_BYTES_WRITTEN
+			 * and FASTLOOP_MAX_BYTES_READ need to be updated if the
+			 * number of extra literals decoded here is changed.
+			 */
+			if (/* enough bits for 2 fast literals + length + offset preload? */
+			    CAN_CONSUME_AND_THEN_PRELOAD(2 * LITLEN_TABLEBITS +
+							 LENGTH_MAXBITS,
+							 OFFSET_TABLEBITS) &&
+			    /* enough bits for 2 fast literals + slow literal + litlen preload? */
+			    CAN_CONSUME_AND_THEN_PRELOAD(2 * LITLEN_TABLEBITS +
+							 DEFLATE_MAX_LITLEN_CODEWORD_LEN,
+							 LITLEN_TABLEBITS)) {
+				/* 1st extra fast literal */
+				lit = entry >> 16;
+				entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+				saved_bitbuf = bitbuf;
+				bitbuf >>= (u8)entry;
+				bitsleft -= entry;
+				*out_next++ = lit;
+				if (entry & HUFFDEC_LITERAL) {
+					/* 2nd extra fast literal */
+					lit = entry >> 16;
+					entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+					saved_bitbuf = bitbuf;
+					bitbuf >>= (u8)entry;
+					bitsleft -= entry;
+					*out_next++ = lit;
+					if (entry & HUFFDEC_LITERAL) {
+						/*
+						 * Another fast literal, but
+						 * this one is in lieu of the
+						 * primary item, so it doesn't
+						 * count as one of the extras.
+						 */
+						lit = entry >> 16;
+						entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+						REFILL_BITS_IN_FASTLOOP();
+						*out_next++ = lit;
+						continue;
+					}
+				}
+			} else {
+				/*
+				 * Decode a literal.  While doing so, preload
+				 * the next litlen decode table entry and refill
+				 * the bitbuffer.  To reduce latency, we've
+				 * arranged for there to be enough "preloadable"
+				 * bits remaining to do the table preload
+				 * independently of the refill.
+				 */
+				STATIC_ASSERT(CAN_CONSUME_AND_THEN_PRELOAD(
+						LITLEN_TABLEBITS, LITLEN_TABLEBITS));
+				lit = entry >> 16;
+				entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+				REFILL_BITS_IN_FASTLOOP();
+				*out_next++ = lit;
+				continue;
+			}
+		}
+
+		/*
+		 * It's not a literal entry, so it can be a length entry, a
+		 * subtable pointer entry, or an end-of-block entry.  Detect the
+		 * two unlikely cases by testing the HUFFDEC_EXCEPTIONAL flag.
+		 */
+		if (unlikely(entry & HUFFDEC_EXCEPTIONAL)) {
+			/* Subtable pointer or end-of-block entry */
+
+			if (unlikely(entry & HUFFDEC_END_OF_BLOCK))
+				goto block_done;
+
+			/*
+			 * A subtable is required.  Load and consume the
+			 * subtable entry.  The subtable entry can be of any
+			 * type: literal, length, or end-of-block.
+			 */
+			entry = d->u.litlen_decode_table[(entry >> 16) +
+				EXTRACT_VARBITS(bitbuf, (entry >> 8) & 0x3F)];
+			saved_bitbuf = bitbuf;
+			bitbuf >>= (u8)entry;
+			bitsleft -= entry;
+
+			/*
+			 * 32-bit platforms that use the byte-at-a-time refill
+			 * method have to do a refill here for there to always
+			 * be enough bits to decode a literal that requires a
+			 * subtable, then preload the next litlen decode table
+			 * entry; or to decode a match length that requires a
+			 * subtable, then preload the offset decode table entry.
+			 */
+			if (!CAN_CONSUME_AND_THEN_PRELOAD(DEFLATE_MAX_LITLEN_CODEWORD_LEN,
+							  LITLEN_TABLEBITS) ||
+			    !CAN_CONSUME_AND_THEN_PRELOAD(LENGTH_MAXBITS,
+							  OFFSET_TABLEBITS))
+				REFILL_BITS_IN_FASTLOOP();
+			if (entry & HUFFDEC_LITERAL) {
+				/* Decode a literal that required a subtable. */
+				lit = entry >> 16;
+				entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+				REFILL_BITS_IN_FASTLOOP();
+				*out_next++ = lit;
+				continue;
+			}
+			if (unlikely(entry & HUFFDEC_END_OF_BLOCK))
+				goto block_done;
+			/* Else, it's a length that required a subtable. */
+		}
+
+		/*
+		 * Decode the match length: the length base value associated
+		 * with the litlen symbol (which we extract from the decode
+		 * table entry), plus the extra length bits.  We don't need to
+		 * consume the extra length bits here, as they were included in
+		 * the bits consumed by the entry earlier.  We also don't need
+		 * to check for too-long matches here, as this is inside the
+		 * fastloop where it's already been verified that the output
+		 * buffer has enough space remaining to copy a max-length match.
+		 */
+		length = entry >> 16;
+		length += EXTRACT_VARBITS8(saved_bitbuf, entry) >> (u8)(entry >> 8);
+
+		/*
+		 * Decode the match offset.  There are enough "preloadable" bits
+		 * remaining to preload the offset decode table entry, but a
+		 * refill might be needed before consuming it.
+		 */
+		STATIC_ASSERT(CAN_CONSUME_AND_THEN_PRELOAD(LENGTH_MAXFASTBITS,
+							   OFFSET_TABLEBITS));
+		entry = d->offset_decode_table[bitbuf & BITMASK(OFFSET_TABLEBITS)];
+		if (CAN_CONSUME_AND_THEN_PRELOAD(OFFSET_MAXBITS,
+						 LITLEN_TABLEBITS)) {
+			/*
+			 * Decoding a match offset on a 64-bit platform.  We may
+			 * need to refill once, but then we can decode the whole
+			 * offset and preload the next litlen table entry.
+			 */
+			if (unlikely(entry & HUFFDEC_EXCEPTIONAL)) {
+				/* Offset codeword requires a subtable */
+				if (unlikely((u8)bitsleft < OFFSET_MAXBITS +
+					     LITLEN_TABLEBITS - PRELOAD_SLACK))
+					REFILL_BITS_IN_FASTLOOP();
+				bitbuf >>= OFFSET_TABLEBITS;
+				bitsleft -= OFFSET_TABLEBITS;
+				entry = d->offset_decode_table[(entry >> 16) +
+					EXTRACT_VARBITS(bitbuf, (entry >> 8) & 0x3F)];
+			} else if (unlikely((u8)bitsleft < OFFSET_MAXFASTBITS +
+					    LITLEN_TABLEBITS - PRELOAD_SLACK))
+				REFILL_BITS_IN_FASTLOOP();
+		} else {
+			/* Decoding a match offset on a 32-bit platform */
+			REFILL_BITS_IN_FASTLOOP();
+			if (unlikely(entry & HUFFDEC_EXCEPTIONAL)) {
+				/* Offset codeword requires a subtable */
+				bitbuf >>= OFFSET_TABLEBITS;
+				bitsleft -= OFFSET_TABLEBITS;
+				entry = d->offset_decode_table[(entry >> 16) +
+					EXTRACT_VARBITS(bitbuf, (entry >> 8) & 0x3F)];
+				REFILL_BITS_IN_FASTLOOP();
+				/* No further refill needed before extra bits */
+				STATIC_ASSERT(CAN_CONSUME(
+					OFFSET_MAXBITS - OFFSET_TABLEBITS));
+			} else {
+				/* No refill needed before extra bits */
+				STATIC_ASSERT(CAN_CONSUME(OFFSET_MAXFASTBITS));
+			}
+		}
+		saved_bitbuf = bitbuf;
+		bitbuf >>= (u8)entry;
+		bitsleft -= entry; /* optimization: subtract full entry */
+		offset = entry >> 16;
+		offset += EXTRACT_VARBITS8(saved_bitbuf, entry) >> (u8)(entry >> 8);
+
+		/* Validate the match offset; needed even in the fastloop. */
+		SAFETY_CHECK(offset <= out_next - (const u8 *)out);
+		src = out_next - offset;
+		dst = out_next;
+		out_next += length;
+
+		/*
+		 * Before starting to issue the instructions to copy the match,
+		 * refill the bitbuffer and preload the litlen decode table
+		 * entry for the next loop iteration.  This can increase
+		 * performance by allowing the latency of the match copy to
+		 * overlap with these other operations.  To further reduce
+		 * latency, we've arranged for there to be enough bits remaining
+		 * to do the table preload independently of the refill, except
+		 * on 32-bit platforms using the byte-at-a-time refill method.
+		 */
+		if (!CAN_CONSUME_AND_THEN_PRELOAD(
+			MAX(OFFSET_MAXBITS - OFFSET_TABLEBITS,
+			    OFFSET_MAXFASTBITS),
+			LITLEN_TABLEBITS) &&
+		    unlikely((u8)bitsleft < LITLEN_TABLEBITS - PRELOAD_SLACK))
+			REFILL_BITS_IN_FASTLOOP();
+		entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+		REFILL_BITS_IN_FASTLOOP();
+
+		/*
+		 * Copy the match.  On most CPUs the fastest method is a
+		 * word-at-a-time copy, unconditionally copying about 5 words
+		 * since this is enough for most matches without being too much.
+		 *
+		 * The normal word-at-a-time copy works for offset >= WORDBYTES,
+		 * which is most cases.  The case of offset == 1 is also common
+		 * and is worth optimizing for, since it is just RLE encoding of
+		 * the previous byte, which is the result of compressing long
+		 * runs of the same byte.
+		 *
+		 * Writing past the match 'length' is allowed here, since it's
+		 * been ensured there is enough output space left for a slight
+		 * overrun.  FASTLOOP_MAX_BYTES_WRITTEN needs to be updated if
+		 * the maximum possible overrun here is changed.
+		 */
+		if (UNALIGNED_ACCESS_IS_FAST && offset >= WORDBYTES) {
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += WORDBYTES;
+			dst += WORDBYTES;
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += WORDBYTES;
+			dst += WORDBYTES;
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += WORDBYTES;
+			dst += WORDBYTES;
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += WORDBYTES;
+			dst += WORDBYTES;
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += WORDBYTES;
+			dst += WORDBYTES;
+			while (dst < out_next) {
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += WORDBYTES;
+				dst += WORDBYTES;
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += WORDBYTES;
+				dst += WORDBYTES;
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += WORDBYTES;
+				dst += WORDBYTES;
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += WORDBYTES;
+				dst += WORDBYTES;
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += WORDBYTES;
+				dst += WORDBYTES;
+			}
+		} else if (UNALIGNED_ACCESS_IS_FAST && offset == 1) {
+			machine_word_t v;
+
+			/*
+			 * This part tends to get auto-vectorized, so keep it
+			 * copying a multiple of 16 bytes at a time.
+			 */
+			v = (machine_word_t)0x0101010101010101 * src[0];
+			store_word_unaligned(v, dst);
+			dst += WORDBYTES;
+			store_word_unaligned(v, dst);
+			dst += WORDBYTES;
+			store_word_unaligned(v, dst);
+			dst += WORDBYTES;
+			store_word_unaligned(v, dst);
+			dst += WORDBYTES;
+			while (dst < out_next) {
+				store_word_unaligned(v, dst);
+				dst += WORDBYTES;
+				store_word_unaligned(v, dst);
+				dst += WORDBYTES;
+				store_word_unaligned(v, dst);
+				dst += WORDBYTES;
+				store_word_unaligned(v, dst);
+				dst += WORDBYTES;
+			}
+		} else if (UNALIGNED_ACCESS_IS_FAST) {
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += offset;
+			dst += offset;
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += offset;
+			dst += offset;
+			do {
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += offset;
+				dst += offset;
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += offset;
+				dst += offset;
+			} while (dst < out_next);
+		} else {
+			*dst++ = *src++;
+			*dst++ = *src++;
+			do {
+				*dst++ = *src++;
+			} while (dst < out_next);
+		}
+	} while (in_next < in_fastloop_end && out_next < out_fastloop_end);
+
+	/*
+	 * This is the generic loop for decoding literals and matches.  This
+	 * handles cases where in_next and out_next are close to the end of
+	 * their respective buffers.  Usually this loop isn't performance-
+	 * critical, as most time is spent in the fastloop above instead.  We
+	 * therefore omit some optimizations here in favor of smaller code.
+	 */
+generic_loop:
+	for (;;) {
+		u32 length, offset;
+		const u8 *src;
+		u8 *dst;
+
+		REFILL_BITS();
+		entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+		saved_bitbuf = bitbuf;
+		bitbuf >>= (u8)entry;
+		bitsleft -= entry;
+		if (unlikely(entry & HUFFDEC_SUBTABLE_POINTER)) {
+			entry = d->u.litlen_decode_table[(entry >> 16) +
+					EXTRACT_VARBITS(bitbuf, (entry >> 8) & 0x3F)];
+			saved_bitbuf = bitbuf;
+			bitbuf >>= (u8)entry;
+			bitsleft -= entry;
+		}
+		length = entry >> 16;
+		if (entry & HUFFDEC_LITERAL) {
+			if (unlikely(out_next == out_end))
+				return LIBDEFLATE_INSUFFICIENT_SPACE;
+			*out_next++ = length;
+			continue;
+		}
+		if (unlikely(entry & HUFFDEC_END_OF_BLOCK))
+			goto block_done;
+		length += EXTRACT_VARBITS8(saved_bitbuf, entry) >> (u8)(entry >> 8);
+		if (unlikely(length > out_end - out_next))
+			return LIBDEFLATE_INSUFFICIENT_SPACE;
+
+		if (!CAN_CONSUME(LENGTH_MAXBITS + OFFSET_MAXBITS))
+			REFILL_BITS();
+		entry = d->offset_decode_table[bitbuf & BITMASK(OFFSET_TABLEBITS)];
+		if (unlikely(entry & HUFFDEC_EXCEPTIONAL)) {
+			bitbuf >>= OFFSET_TABLEBITS;
+			bitsleft -= OFFSET_TABLEBITS;
+			entry = d->offset_decode_table[(entry >> 16) +
+					EXTRACT_VARBITS(bitbuf, (entry >> 8) & 0x3F)];
+			if (!CAN_CONSUME(OFFSET_MAXBITS))
+				REFILL_BITS();
+		}
+		offset = entry >> 16;
+		offset += EXTRACT_VARBITS8(bitbuf, entry) >> (u8)(entry >> 8);
+		bitbuf >>= (u8)entry;
+		bitsleft -= entry;
+
+		SAFETY_CHECK(offset <= out_next - (const u8 *)out);
+		src = out_next - offset;
+		dst = out_next;
+		out_next += length;
+
+		STATIC_ASSERT(DEFLATE_MIN_MATCH_LEN == 3);
+		*dst++ = *src++;
+		*dst++ = *src++;
+		do {
+			*dst++ = *src++;
+		} while (dst < out_next);
+	}
+
+block_done:
+	/* Finished decoding a block */
+
+	if (!is_final_block)
+		goto next_block;
+
+	/* That was the last block. */
+
+	bitsleft = (u8)bitsleft;
+
+	/*
+	 * If any of the implicit appended zero bytes were consumed (not just
+	 * refilled) before hitting end of stream, then the data is bad.
+	 */
+	SAFETY_CHECK(overread_count <= (bitsleft >> 3));
+
+	/* Optionally return the actual number of bytes consumed. */
+	if (actual_in_nbytes_ret) {
+		/* Don't count bytes that were refilled but not consumed. */
+		in_next -= (bitsleft >> 3) - overread_count;
+
+		*actual_in_nbytes_ret = in_next - (u8 *)in;
+	}
+
+	/* Optionally return the actual number of bytes written. */
+	if (actual_out_nbytes_ret) {
+		*actual_out_nbytes_ret = out_next - (u8 *)out;
+	} else {
+		if (out_next != out_end)
+			return LIBDEFLATE_SHORT_OUTPUT;
+	}
+	return LIBDEFLATE_SUCCESS;
+}
+
+#undef FUNCNAME		/* undefined here so each can be defined afresh further down */
+#undef ATTRIBUTES	/* placed on the routine's declaration */
+#undef EXTRACT_VARBITS	/* bit-extraction helper used inside the routine */
+#undef EXTRACT_VARBITS8	/* as above; variant that takes a whole table entry as the count */
+
+
+/*
+ * Include architecture-specific implementation(s) if available.
+ *
+ * Any earlier definitions of DEFAULT_IMPL and arch_select_decompress_func are
+ * dropped first (presumably so that the architecture-specific section below
+ * can supply its own -- TODO confirm against the code that consumes them).
+ */
+#undef DEFAULT_IMPL
+#undef arch_select_decompress_func
+#if defined(ARCH_X86_32) || defined(ARCH_X86_64)
+#ifndef LIB_X86_DECOMPRESS_IMPL_H /* guard: process this section only once */
+#define LIB_X86_DECOMPRESS_IMPL_H
+
+/*
+ * BMI2 optimized version
+ *
+ * When HAVE_BMI2_INTRIN is true, the directives below set up FUNCNAME,
+ * ATTRIBUTES and the EXTRACT_VARBITS macros so that the decompression routine
+ * that follows is emitted under the name deflate_decompress_bmi2.  ATTRIBUTES
+ * is given the "bmi2" target attribute only when HAVE_BMI2_NATIVE is false;
+ * otherwise it is left undefined at this point.
+ *
+ * deflate_decompress_bmi2 is also defined as a macro expanding to its own
+ * name.  NOTE(review): presumably this lets later code test for the variant
+ * with #ifdef -- confirm against the dispatch code.
+ *
+ * FIXME: with MSVC, this isn't actually compiled with BMI2 code generation
+ * enabled yet.  That would require that this be moved to its own .c file.
+ */
+#if HAVE_BMI2_INTRIN
+#  define deflate_decompress_bmi2	deflate_decompress_bmi2
+#  define FUNCNAME			deflate_decompress_bmi2
+#  if !HAVE_BMI2_NATIVE
+#    define ATTRIBUTES			_target_attribute("bmi2")
+#  endif /* !HAVE_BMI2_NATIVE */
+   /*
+    * Even with __attribute__((target("bmi2"))), gcc doesn't reliably use the
+    * bzhi instruction for 'word & BITMASK(count)'.  So use the bzhi intrinsic
+    * explicitly.  EXTRACT_VARBITS() is equivalent to 'word & BITMASK(count)';
+    * EXTRACT_VARBITS8() is equivalent to 'word & BITMASK((u8)count)'.
+    * Nevertheless, their implementation using the bzhi intrinsic is identical,
+    * as the bzhi instruction truncates the count to 8 bits implicitly.
+    *
+    * clang is excluded by the check below, so with clang these two macros are
+    * left undefined here and the generic 'word & BITMASK(...)' fallbacks that
+    * precede the routine are used instead.  The 64-bit intrinsic is selected
+    * when ARCH_X86_64 is defined, the 32-bit one otherwise.
+    */
+#  ifndef __clang__
+#    include <immintrin.h>
+#    ifdef ARCH_X86_64
+#      define EXTRACT_VARBITS(word, count)  _bzhi_u64((word), (count))
+#      define EXTRACT_VARBITS8(word, count) _bzhi_u64((word), (count))
+#    else
+#      define EXTRACT_VARBITS(word, count)  _bzhi_u32((word), (count))
+#      define EXTRACT_VARBITS8(word, count) _bzhi_u32((word), (count))
+#    endif /* ARCH_X86_64 */
+#  endif /* !__clang__ */
+/*
+ * decompress_template.h
+ *
+ * Copyright 2016 Eric Biggers
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+/*
+ * This is the actual DEFLATE decompression routine, lifted out of
+ * deflate_decompress.c so that it can be compiled multiple times with different
+ * target instruction sets.
+ *
+ * Each instantiation may define the following macros beforehand; any that are
+ * still undefined at this point get the portable defaults below:
+ *
+ *   ATTRIBUTES        - extra tokens placed in the routine's declaration
+ *                       (default: nothing).
+ *   EXTRACT_VARBITS   - 'word' masked with BITMASK(count), i.e. the low
+ *                       'count' bits of 'word'.
+ *   EXTRACT_VARBITS8  - same, except that 'count' is first truncated to u8, so
+ *                       the routine can pass a whole decode table entry as
+ *                       'count' and only its low 8 bits are used.
+ *
+ * FUNCNAME is used as the name of the routine and has no default here, so it
+ * must already be defined when this point is reached.
+ */
+
+#ifndef ATTRIBUTES
+#  define ATTRIBUTES
+#endif
+#ifndef EXTRACT_VARBITS
+#  define EXTRACT_VARBITS(word, count)	((word) & BITMASK(count))
+#endif
+#ifndef EXTRACT_VARBITS8
+#  define EXTRACT_VARBITS8(word, count)	((word) & BITMASK((u8)(count)))
+#endif
+
+static enum libdeflate_result ATTRIBUTES MAYBE_UNUSED
+FUNCNAME(struct libdeflate_decompressor * restrict d,
+	 const void * restrict in, size_t in_nbytes,
+	 void * restrict out, size_t out_nbytes_avail,
+	 size_t *actual_in_nbytes_ret, size_t *actual_out_nbytes_ret)
+{
+	u8 *out_next = out;
+	u8 * const out_end = out_next + out_nbytes_avail;
+	u8 * const out_fastloop_end =
+		out_end - MIN(out_nbytes_avail, FASTLOOP_MAX_BYTES_WRITTEN);
+
+	/* Input bitstream state; see deflate_decompress.c for documentation */
+	const u8 *in_next = in;
+	const u8 * const in_end = in_next + in_nbytes;
+	const u8 * const in_fastloop_end =
+		in_end - MIN(in_nbytes, FASTLOOP_MAX_BYTES_READ);
+	bitbuf_t bitbuf = 0;
+	bitbuf_t saved_bitbuf;
+	u32 bitsleft = 0;
+	size_t overread_count = 0;
+
+	bool is_final_block;
+	unsigned block_type;
+	unsigned num_litlen_syms;
+	unsigned num_offset_syms;
+	bitbuf_t litlen_tablemask;
+	u32 entry;
+
+next_block:
+	/* Starting to read the next block */
+	;
+
+	STATIC_ASSERT(CAN_CONSUME(1 + 2 + 5 + 5 + 4 + 3));
+	REFILL_BITS();
+
+	/* BFINAL: 1 bit */
+	is_final_block = bitbuf & BITMASK(1);
+
+	/* BTYPE: 2 bits */
+	block_type = (bitbuf >> 1) & BITMASK(2);
+
+	if (block_type == DEFLATE_BLOCKTYPE_DYNAMIC_HUFFMAN) {
+
+		/* Dynamic Huffman block */
+
+		/* The order in which precode lengths are stored */
+		static const u8 deflate_precode_lens_permutation[DEFLATE_NUM_PRECODE_SYMS] = {
+			16, 17, 18, 0, 8, 7, 9, 6, 10, 5, 11, 4, 12, 3, 13, 2, 14, 1, 15
+		};
+
+		unsigned num_explicit_precode_lens;
+		unsigned i;
+
+		/* Read the codeword length counts. */
+
+		STATIC_ASSERT(DEFLATE_NUM_LITLEN_SYMS == 257 + BITMASK(5));
+		num_litlen_syms = 257 + ((bitbuf >> 3) & BITMASK(5));
+
+		STATIC_ASSERT(DEFLATE_NUM_OFFSET_SYMS == 1 + BITMASK(5));
+		num_offset_syms = 1 + ((bitbuf >> 8) & BITMASK(5));
+
+		STATIC_ASSERT(DEFLATE_NUM_PRECODE_SYMS == 4 + BITMASK(4));
+		num_explicit_precode_lens = 4 + ((bitbuf >> 13) & BITMASK(4));
+
+		d->static_codes_loaded = false;
+
+		/*
+		 * Read the precode codeword lengths.
+		 *
+		 * A 64-bit bitbuffer is just one bit too small to hold the
+		 * maximum number of precode lens, so to minimize branches we
+		 * merge one len with the previous fields.
+		 */
+		STATIC_ASSERT(DEFLATE_MAX_PRE_CODEWORD_LEN == (1 << 3) - 1);
+		if (CAN_CONSUME(3 * (DEFLATE_NUM_PRECODE_SYMS - 1))) {
+			d->u.precode_lens[deflate_precode_lens_permutation[0]] =
+				(bitbuf >> 17) & BITMASK(3);
+			bitbuf >>= 20;
+			bitsleft -= 20;
+			REFILL_BITS();
+			i = 1;
+			do {
+				d->u.precode_lens[deflate_precode_lens_permutation[i]] =
+					bitbuf & BITMASK(3);
+				bitbuf >>= 3;
+				bitsleft -= 3;
+			} while (++i < num_explicit_precode_lens);
+		} else {
+			bitbuf >>= 17;
+			bitsleft -= 17;
+			i = 0;
+			do {
+				if ((u8)bitsleft < 3)
+					REFILL_BITS();
+				d->u.precode_lens[deflate_precode_lens_permutation[i]] =
+					bitbuf & BITMASK(3);
+				bitbuf >>= 3;
+				bitsleft -= 3;
+			} while (++i < num_explicit_precode_lens);
+		}
+		for (; i < DEFLATE_NUM_PRECODE_SYMS; i++)
+			d->u.precode_lens[deflate_precode_lens_permutation[i]] = 0;
+
+		/* Build the decode table for the precode. */
+		SAFETY_CHECK(build_precode_decode_table(d));
+
+		/* Decode the litlen and offset codeword lengths. */
+		i = 0;
+		do {
+			unsigned presym;
+			u8 rep_val;
+			unsigned rep_count;
+
+			if ((u8)bitsleft < DEFLATE_MAX_PRE_CODEWORD_LEN + 7)
+				REFILL_BITS();
+
+			/*
+			 * The code below assumes that the precode decode table
+			 * doesn't have any subtables.
+			 */
+			STATIC_ASSERT(PRECODE_TABLEBITS == DEFLATE_MAX_PRE_CODEWORD_LEN);
+
+			/* Decode the next precode symbol. */
+			entry = d->u.l.precode_decode_table[
+				bitbuf & BITMASK(DEFLATE_MAX_PRE_CODEWORD_LEN)];
+			bitbuf >>= (u8)entry;
+			bitsleft -= entry; /* optimization: subtract full entry */
+			presym = entry >> 16;
+
+			if (presym < 16) {
+				/* Explicit codeword length */
+				d->u.l.lens[i++] = presym;
+				continue;
+			}
+
+			/* Run-length encoded codeword lengths */
+
+			/*
+			 * Note: we don't need to immediately verify that the
+			 * repeat count doesn't overflow the number of elements,
+			 * since we've sized the lens array to have enough extra
+			 * space to allow for the worst-case overrun (138 zeroes
+			 * when only 1 length was remaining).
+			 *
+			 * In the case of the small repeat counts (presyms 16
+			 * and 17), it is fastest to always write the maximum
+			 * number of entries.  That gets rid of branches that
+			 * would otherwise be required.
+			 *
+			 * It is not just because of the numerical order that
+			 * our checks go in the order 'presym < 16', 'presym ==
+			 * 16', and 'presym == 17'.  For typical data this is
+			 * ordered from most frequent to least frequent case.
+			 */
+			STATIC_ASSERT(DEFLATE_MAX_LENS_OVERRUN == 138 - 1);
+
+			if (presym == 16) {
+				/* Repeat the previous length 3 - 6 times. */
+				SAFETY_CHECK(i != 0);
+				rep_val = d->u.l.lens[i - 1];
+				STATIC_ASSERT(3 + BITMASK(2) == 6);
+				rep_count = 3 + (bitbuf & BITMASK(2));
+				bitbuf >>= 2;
+				bitsleft -= 2;
+				d->u.l.lens[i + 0] = rep_val;
+				d->u.l.lens[i + 1] = rep_val;
+				d->u.l.lens[i + 2] = rep_val;
+				d->u.l.lens[i + 3] = rep_val;
+				d->u.l.lens[i + 4] = rep_val;
+				d->u.l.lens[i + 5] = rep_val;
+				i += rep_count;
+			} else if (presym == 17) {
+				/* Repeat zero 3 - 10 times. */
+				STATIC_ASSERT(3 + BITMASK(3) == 10);
+				rep_count = 3 + (bitbuf & BITMASK(3));
+				bitbuf >>= 3;
+				bitsleft -= 3;
+				d->u.l.lens[i + 0] = 0;
+				d->u.l.lens[i + 1] = 0;
+				d->u.l.lens[i + 2] = 0;
+				d->u.l.lens[i + 3] = 0;
+				d->u.l.lens[i + 4] = 0;
+				d->u.l.lens[i + 5] = 0;
+				d->u.l.lens[i + 6] = 0;
+				d->u.l.lens[i + 7] = 0;
+				d->u.l.lens[i + 8] = 0;
+				d->u.l.lens[i + 9] = 0;
+				i += rep_count;
+			} else {
+				/* Repeat zero 11 - 138 times. */
+				STATIC_ASSERT(11 + BITMASK(7) == 138);
+				rep_count = 11 + (bitbuf & BITMASK(7));
+				bitbuf >>= 7;
+				bitsleft -= 7;
+				memset(&d->u.l.lens[i], 0,
+				       rep_count * sizeof(d->u.l.lens[i]));
+				i += rep_count;
+			}
+		} while (i < num_litlen_syms + num_offset_syms);
+
+		/* Unnecessary, but check this for consistency with zlib. */
+		SAFETY_CHECK(i == num_litlen_syms + num_offset_syms);
+
+	} else if (block_type == DEFLATE_BLOCKTYPE_UNCOMPRESSED) {
+		u16 len, nlen;
+
+		/*
+		 * Uncompressed block: copy 'len' bytes literally from the input
+		 * buffer to the output buffer.
+		 */
+
+		bitsleft -= 3; /* for BTYPE and BFINAL */
+
+		/*
+		 * Align the bitstream to the next byte boundary.  This means
+		 * the next byte boundary as if we were reading a byte at a
+		 * time.  Therefore, we have to rewind 'in_next' by any bytes
+		 * that have been refilled but not actually consumed yet (not
+		 * counting overread bytes, which don't increment 'in_next').
+		 */
+		bitsleft = (u8)bitsleft;
+		SAFETY_CHECK(overread_count <= (bitsleft >> 3));
+		in_next -= (bitsleft >> 3) - overread_count;
+		overread_count = 0;
+		bitbuf = 0;
+		bitsleft = 0;
+
+		SAFETY_CHECK(in_end - in_next >= 4);
+		len = get_unaligned_le16(in_next);
+		nlen = get_unaligned_le16(in_next + 2);
+		in_next += 4;
+
+		SAFETY_CHECK(len == (u16)~nlen);
+		if (unlikely(len > out_end - out_next))
+			return LIBDEFLATE_INSUFFICIENT_SPACE;
+		SAFETY_CHECK(len <= in_end - in_next);
+
+		memcpy(out_next, in_next, len);
+		in_next += len;
+		out_next += len;
+
+		goto block_done;
+
+	} else {
+		unsigned i;
+
+		SAFETY_CHECK(block_type == DEFLATE_BLOCKTYPE_STATIC_HUFFMAN);
+
+		/*
+		 * Static Huffman block: build the decode tables for the static
+		 * codes.  Skip doing so if the tables are already set up from
+		 * an earlier static block; this speeds up decompression of
+		 * degenerate input of many empty or very short static blocks.
+		 *
+		 * Afterwards, the remainder is the same as decompressing a
+		 * dynamic Huffman block.
+		 */
+
+		bitbuf >>= 3; /* for BTYPE and BFINAL */
+		bitsleft -= 3;
+
+		if (d->static_codes_loaded)
+			goto have_decode_tables;
+
+		d->static_codes_loaded = true;
+
+		STATIC_ASSERT(DEFLATE_NUM_LITLEN_SYMS == 288);
+		STATIC_ASSERT(DEFLATE_NUM_OFFSET_SYMS == 32);
+
+		for (i = 0; i < 144; i++)
+			d->u.l.lens[i] = 8;
+		for (; i < 256; i++)
+			d->u.l.lens[i] = 9;
+		for (; i < 280; i++)
+			d->u.l.lens[i] = 7;
+		for (; i < 288; i++)
+			d->u.l.lens[i] = 8;
+
+		for (; i < 288 + 32; i++)
+			d->u.l.lens[i] = 5;
+
+		num_litlen_syms = 288;
+		num_offset_syms = 32;
+	}
+
+	/* Decompressing a Huffman block (either dynamic or static) */
+
+	SAFETY_CHECK(build_offset_decode_table(d, num_litlen_syms, num_offset_syms));
+	SAFETY_CHECK(build_litlen_decode_table(d, num_litlen_syms, num_offset_syms));
+have_decode_tables:
+	litlen_tablemask = BITMASK(d->litlen_tablebits);
+
+	/*
+	 * This is the "fastloop" for decoding literals and matches.  It does
+	 * bounds checks on in_next and out_next in the loop conditions so that
+	 * additional bounds checks aren't needed inside the loop body.
+	 *
+	 * To reduce latency, the bitbuffer is refilled and the next litlen
+	 * decode table entry is preloaded before each loop iteration.
+	 */
+	if (in_next >= in_fastloop_end || out_next >= out_fastloop_end)
+		goto generic_loop;
+	REFILL_BITS_IN_FASTLOOP();
+	entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+	do {
+		u32 length, offset, lit;
+		const u8 *src;
+		u8 *dst;
+
+		/*
+		 * Consume the bits for the litlen decode table entry.  Save the
+		 * original bitbuf for later, in case the extra match length
+		 * bits need to be extracted from it.
+		 */
+		saved_bitbuf = bitbuf;
+		bitbuf >>= (u8)entry;
+		bitsleft -= entry; /* optimization: subtract full entry */
+
+		/*
+		 * Begin by checking for a "fast" literal, i.e. a literal that
+		 * doesn't need a subtable.
+		 */
+		if (entry & HUFFDEC_LITERAL) {
+			/*
+			 * On 64-bit platforms, we decode up to 2 extra fast
+			 * literals in addition to the primary item, as this
+			 * increases performance and still leaves enough bits
+			 * remaining for what follows.  We could actually do 3,
+			 * assuming LITLEN_TABLEBITS=11, but that actually
+			 * decreases performance slightly (perhaps by messing
+			 * with the branch prediction of the conditional refill
+			 * that happens later while decoding the match offset).
+			 *
+			 * Note: the definitions of FASTLOOP_MAX_BYTES_WRITTEN
+			 * and FASTLOOP_MAX_BYTES_READ need to be updated if the
+			 * number of extra literals decoded here is changed.
+			 */
+			if (/* enough bits for 2 fast literals + length + offset preload? */
+			    CAN_CONSUME_AND_THEN_PRELOAD(2 * LITLEN_TABLEBITS +
+							 LENGTH_MAXBITS,
+							 OFFSET_TABLEBITS) &&
+			    /* enough bits for 2 fast literals + slow literal + litlen preload? */
+			    CAN_CONSUME_AND_THEN_PRELOAD(2 * LITLEN_TABLEBITS +
+							 DEFLATE_MAX_LITLEN_CODEWORD_LEN,
+							 LITLEN_TABLEBITS)) {
+				/* 1st extra fast literal */
+				lit = entry >> 16;
+				entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+				saved_bitbuf = bitbuf;
+				bitbuf >>= (u8)entry;
+				bitsleft -= entry;
+				*out_next++ = lit;
+				if (entry & HUFFDEC_LITERAL) {
+					/* 2nd extra fast literal */
+					lit = entry >> 16;
+					entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+					saved_bitbuf = bitbuf;
+					bitbuf >>= (u8)entry;
+					bitsleft -= entry;
+					*out_next++ = lit;
+					if (entry & HUFFDEC_LITERAL) {
+						/*
+						 * Another fast literal, but
+						 * this one is in lieu of the
+						 * primary item, so it doesn't
+						 * count as one of the extras.
+						 */
+						lit = entry >> 16;
+						entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+						REFILL_BITS_IN_FASTLOOP();
+						*out_next++ = lit;
+						continue;
+					}
+				}
+			} else {
+				/*
+				 * Decode a literal.  While doing so, preload
+				 * the next litlen decode table entry and refill
+				 * the bitbuffer.  To reduce latency, we've
+				 * arranged for there to be enough "preloadable"
+				 * bits remaining to do the table preload
+				 * independently of the refill.
+				 */
+				STATIC_ASSERT(CAN_CONSUME_AND_THEN_PRELOAD(
+						LITLEN_TABLEBITS, LITLEN_TABLEBITS));
+				lit = entry >> 16;
+				entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+				REFILL_BITS_IN_FASTLOOP();
+				*out_next++ = lit;
+				continue;
+			}
+		}
+
+		/*
+		 * It's not a literal entry, so it can be a length entry, a
+		 * subtable pointer entry, or an end-of-block entry.  Detect the
+		 * two unlikely cases by testing the HUFFDEC_EXCEPTIONAL flag.
+		 */
+		if (unlikely(entry & HUFFDEC_EXCEPTIONAL)) {
+			/* Subtable pointer or end-of-block entry */
+
+			if (unlikely(entry & HUFFDEC_END_OF_BLOCK))
+				goto block_done;
+
+			/*
+			 * A subtable is required.  Load and consume the
+			 * subtable entry.  The subtable entry can be of any
+			 * type: literal, length, or end-of-block.
+			 */
+			entry = d->u.litlen_decode_table[(entry >> 16) +
+				EXTRACT_VARBITS(bitbuf, (entry >> 8) & 0x3F)];
+			saved_bitbuf = bitbuf;
+			bitbuf >>= (u8)entry;
+			bitsleft -= entry;
+
+			/*
+			 * 32-bit platforms that use the byte-at-a-time refill
+			 * method have to do a refill here for there to always
+			 * be enough bits to decode a literal that requires a
+			 * subtable, then preload the next litlen decode table
+			 * entry; or to decode a match length that requires a
+			 * subtable, then preload the offset decode table entry.
+			 */
+			if (!CAN_CONSUME_AND_THEN_PRELOAD(DEFLATE_MAX_LITLEN_CODEWORD_LEN,
+							  LITLEN_TABLEBITS) ||
+			    !CAN_CONSUME_AND_THEN_PRELOAD(LENGTH_MAXBITS,
+							  OFFSET_TABLEBITS))
+				REFILL_BITS_IN_FASTLOOP();
+			if (entry & HUFFDEC_LITERAL) {
+				/* Decode a literal that required a subtable. */
+				lit = entry >> 16;
+				entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+				REFILL_BITS_IN_FASTLOOP();
+				*out_next++ = lit;
+				continue;
+			}
+			if (unlikely(entry & HUFFDEC_END_OF_BLOCK))
+				goto block_done;
+			/* Else, it's a length that required a subtable. */
+		}
+
+		/*
+		 * Decode the match length: the length base value associated
+		 * with the litlen symbol (which we extract from the decode
+		 * table entry), plus the extra length bits.  We don't need to
+		 * consume the extra length bits here, as they were included in
+		 * the bits consumed by the entry earlier.  We also don't need
+		 * to check for too-long matches here, as this is inside the
+		 * fastloop where it's already been verified that the output
+		 * buffer has enough space remaining to copy a max-length match.
+		 */
+		length = entry >> 16;
+		length += EXTRACT_VARBITS8(saved_bitbuf, entry) >> (u8)(entry >> 8);
+
+		/*
+		 * Decode the match offset.  There are enough "preloadable" bits
+		 * remaining to preload the offset decode table entry, but a
+		 * refill might be needed before consuming it.
+		 */
+		STATIC_ASSERT(CAN_CONSUME_AND_THEN_PRELOAD(LENGTH_MAXFASTBITS,
+							   OFFSET_TABLEBITS));
+		entry = d->offset_decode_table[bitbuf & BITMASK(OFFSET_TABLEBITS)];
+		if (CAN_CONSUME_AND_THEN_PRELOAD(OFFSET_MAXBITS,
+						 LITLEN_TABLEBITS)) {
+			/*
+			 * Decoding a match offset on a 64-bit platform.  We may
+			 * need to refill once, but then we can decode the whole
+			 * offset and preload the next litlen table entry.
+			 */
+			if (unlikely(entry & HUFFDEC_EXCEPTIONAL)) {
+				/* Offset codeword requires a subtable */
+				if (unlikely((u8)bitsleft < OFFSET_MAXBITS +
+					     LITLEN_TABLEBITS - PRELOAD_SLACK))
+					REFILL_BITS_IN_FASTLOOP();
+				bitbuf >>= OFFSET_TABLEBITS;
+				bitsleft -= OFFSET_TABLEBITS;
+				entry = d->offset_decode_table[(entry >> 16) +
+					EXTRACT_VARBITS(bitbuf, (entry >> 8) & 0x3F)];
+			} else if (unlikely((u8)bitsleft < OFFSET_MAXFASTBITS +
+					    LITLEN_TABLEBITS - PRELOAD_SLACK))
+				REFILL_BITS_IN_FASTLOOP();
+		} else {
+			/* Decoding a match offset on a 32-bit platform */
+			REFILL_BITS_IN_FASTLOOP();
+			if (unlikely(entry & HUFFDEC_EXCEPTIONAL)) {
+				/* Offset codeword requires a subtable */
+				bitbuf >>= OFFSET_TABLEBITS;
+				bitsleft -= OFFSET_TABLEBITS;
+				entry = d->offset_decode_table[(entry >> 16) +
+					EXTRACT_VARBITS(bitbuf, (entry >> 8) & 0x3F)];
+				REFILL_BITS_IN_FASTLOOP();
+				/* No further refill needed before extra bits */
+				STATIC_ASSERT(CAN_CONSUME(
+					OFFSET_MAXBITS - OFFSET_TABLEBITS));
+			} else {
+				/* No refill needed before extra bits */
+				STATIC_ASSERT(CAN_CONSUME(OFFSET_MAXFASTBITS));
+			}
+		}
+		saved_bitbuf = bitbuf;
+		bitbuf >>= (u8)entry;
+		bitsleft -= entry; /* optimization: subtract full entry */
+		offset = entry >> 16;
+		offset += EXTRACT_VARBITS8(saved_bitbuf, entry) >> (u8)(entry >> 8);
+
+		/* Validate the match offset; needed even in the fastloop. */
+		SAFETY_CHECK(offset <= out_next - (const u8 *)out);
+		src = out_next - offset;
+		dst = out_next;
+		out_next += length;
+
+		/*
+		 * Before starting to issue the instructions to copy the match,
+		 * refill the bitbuffer and preload the litlen decode table
+		 * entry for the next loop iteration.  This can increase
+		 * performance by allowing the latency of the match copy to
+		 * overlap with these other operations.  To further reduce
+		 * latency, we've arranged for there to be enough bits remaining
+		 * to do the table preload independently of the refill, except
+		 * on 32-bit platforms using the byte-at-a-time refill method.
+		 */
+		if (!CAN_CONSUME_AND_THEN_PRELOAD(
+			MAX(OFFSET_MAXBITS - OFFSET_TABLEBITS,
+			    OFFSET_MAXFASTBITS),
+			LITLEN_TABLEBITS) &&
+		    unlikely((u8)bitsleft < LITLEN_TABLEBITS - PRELOAD_SLACK))
+			REFILL_BITS_IN_FASTLOOP();
+		entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+		REFILL_BITS_IN_FASTLOOP();
+
+		/*
+		 * Copy the match.  On most CPUs the fastest method is a
+		 * word-at-a-time copy, unconditionally copying about 5 words
+		 * since this is enough for most matches without being too much.
+		 *
+		 * The normal word-at-a-time copy works for offset >= WORDBYTES,
+		 * which is most cases.  The case of offset == 1 is also common
+		 * and is worth optimizing for, since it is just RLE encoding of
+		 * the previous byte, which is the result of compressing long
+		 * runs of the same byte.
+		 *
+		 * Writing past the match 'length' is allowed here, since it's
+		 * been ensured there is enough output space left for a slight
+		 * overrun.  FASTLOOP_MAX_BYTES_WRITTEN needs to be updated if
+		 * the maximum possible overrun here is changed.
+		 */
+		if (UNALIGNED_ACCESS_IS_FAST && offset >= WORDBYTES) {
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += WORDBYTES;
+			dst += WORDBYTES;
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += WORDBYTES;
+			dst += WORDBYTES;
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += WORDBYTES;
+			dst += WORDBYTES;
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += WORDBYTES;
+			dst += WORDBYTES;
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += WORDBYTES;
+			dst += WORDBYTES;
+			while (dst < out_next) {
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += WORDBYTES;
+				dst += WORDBYTES;
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += WORDBYTES;
+				dst += WORDBYTES;
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += WORDBYTES;
+				dst += WORDBYTES;
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += WORDBYTES;
+				dst += WORDBYTES;
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += WORDBYTES;
+				dst += WORDBYTES;
+			}
+		} else if (UNALIGNED_ACCESS_IS_FAST && offset == 1) {
+			machine_word_t v;
+
+			/*
+			 * This part tends to get auto-vectorized, so keep it
+			 * copying a multiple of 16 bytes at a time.
+			 */
+			v = (machine_word_t)0x0101010101010101 * src[0];
+			store_word_unaligned(v, dst);
+			dst += WORDBYTES;
+			store_word_unaligned(v, dst);
+			dst += WORDBYTES;
+			store_word_unaligned(v, dst);
+			dst += WORDBYTES;
+			store_word_unaligned(v, dst);
+			dst += WORDBYTES;
+			while (dst < out_next) {
+				store_word_unaligned(v, dst);
+				dst += WORDBYTES;
+				store_word_unaligned(v, dst);
+				dst += WORDBYTES;
+				store_word_unaligned(v, dst);
+				dst += WORDBYTES;
+				store_word_unaligned(v, dst);
+				dst += WORDBYTES;
+			}
+		} else if (UNALIGNED_ACCESS_IS_FAST) {
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += offset;
+			dst += offset;
+			store_word_unaligned(load_word_unaligned(src), dst);
+			src += offset;
+			dst += offset;
+			do {
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += offset;
+				dst += offset;
+				store_word_unaligned(load_word_unaligned(src), dst);
+				src += offset;
+				dst += offset;
+			} while (dst < out_next);
+		} else {
+			*dst++ = *src++;
+			*dst++ = *src++;
+			do {
+				*dst++ = *src++;
+			} while (dst < out_next);
+		}
+	} while (in_next < in_fastloop_end && out_next < out_fastloop_end);
+
+	/*
+	 * This is the generic loop for decoding literals and matches.  This
+	 * handles cases where in_next and out_next are close to the end of
+	 * their respective buffers.  Usually this loop isn't performance-
+	 * critical, as most time is spent in the fastloop above instead.  We
+	 * therefore omit some optimizations here in favor of smaller code.
+	 */
+generic_loop:
+	for (;;) {
+		u32 length, offset;
+		const u8 *src;
+		u8 *dst;
+
+		REFILL_BITS();
+		entry = d->u.litlen_decode_table[bitbuf & litlen_tablemask];
+		saved_bitbuf = bitbuf;
+		bitbuf >>= (u8)entry;
+		bitsleft -= entry;
+		if (unlikely(entry & HUFFDEC_SUBTABLE_POINTER)) {
+			entry = d->u.litlen_decode_table[(entry >> 16) +
+					EXTRACT_VARBITS(bitbuf, (entry >> 8) & 0x3F)];
+			saved_bitbuf = bitbuf;
+			bitbuf >>= (u8)entry;
+			bitsleft -= entry;
+		}
+		length = entry >> 16;
+		if (entry & HUFFDEC_LITERAL) {
+			if (unlikely(out_next == out_end))
+				return LIBDEFLATE_INSUFFICIENT_SPACE;
+			*out_next++ = length;
+			continue;
+		}
+		if (unlikely(entry & HUFFDEC_END_OF_BLOCK))
+			goto block_done;
+		length += EXTRACT_VARBITS8(saved_bitbuf, entry) >> (u8)(entry >> 8);
+		if (unlikely(length > out_end - out_next))
+			return LIBDEFLATE_INSUFFICIENT_SPACE;
+
+		if (!CAN_CONSUME(LENGTH_MAXBITS + OFFSET_MAXBITS))
+			REFILL_BITS();
+		entry = d->offset_decode_table[bitbuf & BITMASK(OFFSET_TABLEBITS)];
+		if (unlikely(entry & HUFFDEC_EXCEPTIONAL)) {
+			bitbuf >>= OFFSET_TABLEBITS;
+			bitsleft -= OFFSET_TABLEBITS;
+			entry = d->offset_decode_table[(entry >> 16) +
+					EXTRACT_VARBITS(bitbuf, (entry >> 8) & 0x3F)];
+			if (!CAN_CONSUME(OFFSET_MAXBITS))
+				REFILL_BITS();
+		}
+		offset = entry >> 16;
+		offset += EXTRACT_VARBITS8(bitbuf, entry) >> (u8)(entry >> 8);
+		bitbuf >>= (u8)entry;
+		bitsleft -= entry;
+
+		SAFETY_CHECK(offset <= out_next - (const u8 *)out);
+		src = out_next - offset;
+		dst = out_next;
+		out_next += length;
+
+		STATIC_ASSERT(DEFLATE_MIN_MATCH_LEN == 3);
+		*dst++ = *src++;
+		*dst++ = *src++;
+		do {
+			*dst++ = *src++;
+		} while (dst < out_next);
+	}
+
+block_done:
+	/* Finished decoding a block */
+
+	if (!is_final_block)
+		goto next_block;
+
+	/* That was the last block. */
+
+	bitsleft = (u8)bitsleft;
+
+	/*
+	 * If any of the implicit appended zero bytes were consumed (not just
+	 * refilled) before hitting end of stream, then the data is bad.
+	 */
+	SAFETY_CHECK(overread_count <= (bitsleft >> 3));
+
+	/* Optionally return the actual number of bytes consumed. */
+	if (actual_in_nbytes_ret) {
+		/* Don't count bytes that were refilled but not consumed. */
+		in_next -= (bitsleft >> 3) - overread_count;
+
+		*actual_in_nbytes_ret = in_next - (u8 *)in;
+	}
+
+	/* Optionally return the actual number of bytes written. */
+	if (actual_out_nbytes_ret) {
+		*actual_out_nbytes_ret = out_next - (u8 *)out;
+	} else {
+		if (out_next != out_end)
+			return LIBDEFLATE_SHORT_OUTPUT;
+	}
+	return LIBDEFLATE_SUCCESS;
+}
+
+#undef FUNCNAME
+#undef ATTRIBUTES
+#undef EXTRACT_VARBITS
+#undef EXTRACT_VARBITS8
+
+#endif /* HAVE_BMI2_INTRIN */
+
+#if defined(deflate_decompress_bmi2) && HAVE_BMI2_NATIVE
+#define DEFAULT_IMPL	deflate_decompress_bmi2
+#else
+/* Pick the BMI2 decompressor when it was compiled in and the CPU reports BMI2. */
+static inline decompress_func_t arch_select_decompress_func(void)
+{
+#ifdef deflate_decompress_bmi2
+	return HAVE_BMI2(get_x86_cpu_features()) ? deflate_decompress_bmi2 : NULL;
+#else
+	return NULL;	/* dispatch_decomp() then falls back to DEFAULT_IMPL */
+#endif
+}
+#define arch_select_decompress_func	arch_select_decompress_func
+#endif
+
+#endif /* LIB_X86_DECOMPRESS_IMPL_H */
+
+#endif
+
+#ifndef DEFAULT_IMPL
+#  define DEFAULT_IMPL deflate_decompress_default
+#endif
+
+#ifdef arch_select_decompress_func
+static enum libdeflate_result
+dispatch_decomp(struct libdeflate_decompressor *d,
+		const void *in, size_t in_nbytes,
+		void *out, size_t out_nbytes_avail,
+		size_t *actual_in_nbytes_ret, size_t *actual_out_nbytes_ret);
+
+/* Points at the dispatcher until the first call swaps in the real routine. */
+static volatile decompress_func_t decompress_impl = dispatch_decomp;
+
+/* Select the best implementation at runtime, cache it, and forward the call. */
+static enum libdeflate_result
+dispatch_decomp(struct libdeflate_decompressor *d,
+		const void *in, size_t in_nbytes,
+		void *out, size_t out_nbytes_avail,
+		size_t *actual_in_nbytes_ret, size_t *actual_out_nbytes_ret)
+{
+	decompress_func_t selected = arch_select_decompress_func();
+
+	if (selected == NULL)	/* no CPU-specific routine applies */
+		selected = DEFAULT_IMPL;
+	decompress_impl = selected;	/* later calls bypass this dispatcher */
+	return selected(d, in, in_nbytes, out, out_nbytes_avail,
+			actual_in_nbytes_ret, actual_out_nbytes_ret);
+}
+#else
+/* The best implementation is statically known, so call it directly. */
+#  define decompress_impl DEFAULT_IMPL
+#endif
+
+/*
+ * Main raw-DEFLATE decompression entry point; libdeflate.h documents the
+ * parameters and result codes.
+ *
+ * The decoding itself is the decompress_template.h code (FUNCNAME), which
+ * appears to be inlined earlier in this file.  This wrapper only forwards its
+ * arguments to decompress_impl: the runtime-dispatch pointer, or DEFAULT_IMPL.
+ */
+LIBDEFLATEAPI enum libdeflate_result
+libdeflate_deflate_decompress_ex(struct libdeflate_decompressor *d,
+				 const void *in, size_t in_nbytes,
+				 void *out, size_t out_nbytes_avail,
+				 size_t *actual_in_nbytes_ret,
+				 size_t *actual_out_nbytes_ret)
+{
+	return decompress_impl(d, in, in_nbytes, out, out_nbytes_avail,
+			       actual_in_nbytes_ret, actual_out_nbytes_ret);
+}
+
+/* Same as libdeflate_deflate_decompress_ex(), minus 'actual_in_nbytes_ret'. */
+LIBDEFLATEAPI enum libdeflate_result libdeflate_deflate_decompress(
+	struct libdeflate_decompressor *d, const void *in, size_t in_nbytes,
+	void *out, size_t out_nbytes_avail, size_t *actual_out_nbytes_ret)
+{
+	/* A NULL 'actual_in_nbytes_ret' means the consumed size is not reported. */
+	return libdeflate_deflate_decompress_ex(d, in, in_nbytes,
+						out, out_nbytes_avail,
+						NULL, actual_out_nbytes_ret);
+}
+
+/*
+ * Allocate a zero-initialized decompressor.  Allocator hooks left unset in
+ * 'options' fall back to the library defaults.
+ *
+ * Returns NULL if 'options' is NULL, if its sizeof_options does not match
+ * this build's struct size, or if the allocation fails.
+ */
+LIBDEFLATEAPI struct libdeflate_decompressor *
+libdeflate_alloc_decompressor_ex(const struct libdeflate_options *options)
+{
+	struct libdeflate_decompressor *d;
+
+	/*
+	 * A missing options struct is rejected rather than dereferenced.
+	 *
+	 * Note: if more fields are added to libdeflate_options, this code will
+	 * need to be updated to support both the old and new structs.
+	 */
+	if (options == NULL || options->sizeof_options != sizeof(*options))
+		return NULL;
+
+	d = (options->malloc_func ? options->malloc_func :
+	     libdeflate_default_malloc_func)(sizeof(*d));
+	if (d == NULL)
+		return NULL;
+
+	/*
+	 * Strictly, only 'static_codes_loaded' (must be false), 'free_func',
+	 * and the first half of the main portion of each decode table need
+	 * initializing; the latter merely keeps tools like valgrind quiet,
+	 * since build_decode_table() eventually initializes every entry.
+	 * For simplicity the whole decompressor is zeroed instead.
+	 */
+	memset(d, 0, sizeof(*d));
+	d->free_func = options->free_func ?
+		       options->free_func : libdeflate_default_free_func;
+	return d;
+}
+
+LIBDEFLATEAPI struct libdeflate_decompressor *
+libdeflate_alloc_decompressor(void)
+{
+	/* All-zero hooks make the _ex allocator fall back to the defaults. */
+	static const struct libdeflate_options stock_options = {
+		.sizeof_options = sizeof(stock_options) };
+	return libdeflate_alloc_decompressor_ex(&stock_options);
+}
+
+LIBDEFLATEAPI void
+libdeflate_free_decompressor(struct libdeflate_decompressor *d)
+{
+	if (d != NULL)	/* a NULL argument is accepted and ignored */
+		(*d->free_func)(d);	/* deallocator stored at allocation time */
+}
+
+
+/*
+ * utils.c - utility functions for libdeflate
+ *
+ * Copyright 2016 Eric Biggers
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+#ifdef FREESTANDING
+#  define malloc NULL
+#  define free NULL
+#else
+#  include <stdlib.h>
+#endif
+
+malloc_func_t libdeflate_default_malloc_func = malloc;	/* NULL if FREESTANDING */
+free_func_t libdeflate_default_free_func = free;	/* NULL if FREESTANDING */
+
+/* Allocate 'size' bytes aligned to 'alignment'; NULL on failure or overflow. */
+void *libdeflate_aligned_malloc(malloc_func_t malloc_func,
+				size_t alignment, size_t size)
+{
+	const size_t overhead = sizeof(void *) + alignment - 1;
+	void *raw, *ptr;
+
+	if (size > (size_t)-1 - overhead ||	/* padded request would wrap */
+	    (raw = (*malloc_func)(overhead + size)) == NULL)
+		return NULL;
+	ptr = (void *)ALIGN((uintptr_t)raw + sizeof(void *), alignment);
+	((void **)ptr)[-1] = raw;	/* read back by libdeflate_aligned_free() */
+	return ptr;
+}
+
+void libdeflate_aligned_free(free_func_t free_func, void *ptr)
+{
+	if (ptr != NULL)	/* like free(NULL): nothing to look up or release */
+		(*free_func)(((void **)ptr)[-1]); /* pointer stashed by aligned_malloc */
+}
+
+/* Replace the global default allocator used when options supply no hooks. */
+LIBDEFLATEAPI void libdeflate_set_memory_allocator(malloc_func_t malloc_func,
+						   free_func_t free_func)
+{
+	libdeflate_default_free_func = free_func;
+	libdeflate_default_malloc_func = malloc_func;
+}
+
+/*
+ * Implementations of libc functions for freestanding library builds.
+ * Normal library builds don't use these.  Not optimized yet; usually the
+ * compiler expands these functions and doesn't actually call them anyway.
+ */
+#ifdef FREESTANDING
+#undef memset
+void * __attribute__((weak))
+memset(void *s, int c, size_t n)
+{
+	u8 *cursor = s;
+
+	/* Byte-at-a-time fill; 'c' is converted to u8 by each store. */
+	while (n-- != 0)
+		*cursor++ = c;
+	return s;
+}
+
+#undef memcpy
+void * __attribute__((weak))
+memcpy(void *dest, const void *src, size_t n)
+{
+	u8 *to = dest;
+	const u8 *from = src;
+
+	/* Plain ascending byte copy. */
+	while (n-- != 0)
+		*to++ = *from++;
+	return dest;
+}
+
+#undef memmove
+void * __attribute__((weak))
+memmove(void *dest, const void *src, size_t n)
+{
+	u8 *to = dest;
+	const u8 *from = src;
+
+	/* Destination at or below source: defer to memcpy()'s ascending copy. */
+	if (from >= to)
+		return memcpy(to, from, n);
+	/* Otherwise copy from the last byte down to the first. */
+	while (n-- > 0)
+		to[n] = from[n];
+	return dest;
+}
+
+#undef memcmp
+int __attribute__((weak))
+memcmp(const void *s1, const void *s2, size_t n)
+{
+	const u8 *lhs = s1;
+	const u8 *rhs = s2;
+
+	/* Scan to the first differing byte; its difference is the result. */
+	for (; n != 0; n--, lhs++, rhs++) {
+		if (*lhs != *rhs)
+			return (int)*lhs - (int)*rhs;
+	}
+	return 0;
+}
+#endif /* FREESTANDING */
+
+#ifdef LIBDEFLATE_ENABLE_ASSERTIONS
+#include <stdio.h>
+#include <stdlib.h>
+/* Print the failed expression with its source location, then abort(). */
+void libdeflate_assertion_failed(const char *expr, const char *file, int line)
+{
+	fprintf(stderr, "Assertion failed: %s at %s:%d\n", expr, file, line);
+	abort();
+}
+#endif /* LIBDEFLATE_ENABLE_ASSERTIONS */
+
+/*
+ * x86/cpu_features.c - feature detection for x86 CPUs
+ *
+ * Copyright 2016 Eric Biggers
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+#if HAVE_DYNAMIC_X86_CPU_FEATURES
+
+/*
+ * With old GCC versions we have to manually save and restore the x86_32 PIC
+ * register (ebx).  See: https://gcc.gnu.org/bugzilla/show_bug.cgi?id=47602
+ */
+#if defined(ARCH_X86_32) && defined(__PIC__)
+#  define EBX_CONSTRAINT "=&r"
+#else
+#  define EBX_CONSTRAINT "=b"
+#endif
+
+/* Execute CPUID for (leaf, subleaf); EAX, EBX, ECX, EDX go to a, b, c, d. */
+static inline void
+cpuid(u32 leaf, u32 subleaf, u32 *a, u32 *b, u32 *c, u32 *d)
+{
+#ifdef _MSC_VER
+	int result[4];
+
+	__cpuidex(result, leaf, subleaf);
+	*a = result[0];
+	*b = result[1];
+	*c = result[2];
+	*d = result[3];
+#else /* GNU-style inline asm */
+	__asm__ volatile(".ifnc %%ebx, %1; mov  %%ebx, %1; .endif\n" /* save ebx unless %1 is ebx */
+			 "cpuid                                  \n"
+			 ".ifnc %%ebx, %1; xchg %%ebx, %1; .endif\n" /* restore ebx; result -> %1 */
+			 : "=a" (*a), EBX_CONSTRAINT (*b), "=c" (*c), "=d" (*d)
+			 : "a" (leaf), "c" (subleaf));
+#endif
+}
+
+/* Read extended control register 'index' (XGETBV); returns EDX:EAX as a u64. */
+static inline u64
+read_xcr(u32 index)
+{
+#ifdef _MSC_VER
+	return _xgetbv(index);
+#else
+	u32 d, a;
+
+	/*
+	 * Execute the "xgetbv" instruction.  Old versions of binutils do not
+	 * recognize this instruction, so list the raw bytes instead.
+	 *
+	 * This must be 'volatile' to prevent this code from being moved out
+	 * from under the check for OSXSAVE.
+	 */
+	__asm__ volatile(".byte 0x0f, 0x01, 0xd0" :
+			 "=d" (d), "=a" (a) : "c" (index));
+
+	return ((u64)d << 32) | a;	/* high half from edx, low half from eax */
+#endif
+}
+
+static const struct cpu_feature x86_cpu_feature_table[] = {
+	{X86_CPU_FEATURE_SSE2,		"sse2"},
+	{X86_CPU_FEATURE_PCLMUL,	"pclmul"},
+	{X86_CPU_FEATURE_AVX,		"avx"},
+	{X86_CPU_FEATURE_AVX2,		"avx2"},
+	{X86_CPU_FEATURE_BMI2,		"bmi2"},
+};	/* flag/name pairs handed to disable_cpu_features_for_testing() */
+
+volatile u32 libdeflate_x86_cpu_features = 0;	/* 0 until the init routine stores mask | X86_CPU_FEATURES_KNOWN */
+
+/* Initialize libdeflate_x86_cpu_features: probe CPUID (and XCR0 when the OS
+ * exposes it) and publish the supported-feature mask. */
+void libdeflate_init_x86_cpu_features(void)
+{
+	u32 max_leaf, eax, ebx, ecx, edx;
+	u32 features = 0;
+	int os_saves_ymm = 0;
+
+	/* Leaf 0: EAX reports the highest supported basic leaf. */
+	cpuid(0, 0, &max_leaf, &ebx, &ecx, &edx);
+
+	if (max_leaf >= 1) {
+		/* Leaf 1: processor info and feature bits. */
+		cpuid(1, 0, &eax, &ebx, &ecx, &edx);
+		if (edx & (1 << 26))
+			features |= X86_CPU_FEATURE_SSE2;
+		if (ecx & (1 << 1))
+			features |= X86_CPU_FEATURE_PCLMUL;
+		/* ECX bit 27 (OSXSAVE) gates XGETBV; XCR0 bits 1-2 = SSE+AVX state. */
+		if (ecx & (1 << 27))
+			os_saves_ymm = (read_xcr(0) & 0x6) == 0x6;
+		if ((ecx & (1 << 28)) && os_saves_ymm)
+			features |= X86_CPU_FEATURE_AVX;
+	}
+
+	if (max_leaf >= 7) {
+		/* Leaf 7, subleaf 0: extended features. */
+		cpuid(7, 0, &eax, &ebx, &ecx, &edx);
+		if ((ebx & (1 << 5)) && os_saves_ymm)
+			features |= X86_CPU_FEATURE_AVX2;
+		if (ebx & (1 << 8))
+			features |= X86_CPU_FEATURE_BMI2;
+	}
+
+	disable_cpu_features_for_testing(&features, x86_cpu_feature_table,
+					 ARRAY_LEN(x86_cpu_feature_table));
+
+	libdeflate_x86_cpu_features = features | X86_CPU_FEATURES_KNOWN;
+}
+
+#endif /* HAVE_DYNAMIC_X86_CPU_FEATURES */
diff --git a/Plugins/nosGeometry/External/openFBX/libdeflate.h b/Plugins/nosGeometry/External/openFBX/libdeflate.h
new file mode 100644
index 00000000..382d895d
--- /dev/null
+++ b/Plugins/nosGeometry/External/openFBX/libdeflate.h
@@ -0,0 +1,411 @@
+/*
+ * libdeflate.h - public header for libdeflate
+ */
+
+#ifndef LIBDEFLATE_H
+#define LIBDEFLATE_H
+
+#include <stddef.h>
+#include <stdint.h>
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+#define LIBDEFLATE_VERSION_MAJOR	1
+#define LIBDEFLATE_VERSION_MINOR	18
+#define LIBDEFLATE_VERSION_STRING	"1.18"
+
+/*
+ * Users of libdeflate.dll on Windows can define LIBDEFLATE_DLL to cause
+ * __declspec(dllimport) to be used.  This should be done when it's easy to do.
+ * Otherwise it's fine to skip it, since it is a very minor performance
+ * optimization that is irrelevant for most use cases of libdeflate.
+ */
+#ifndef LIBDEFLATEAPI
+#  if defined(LIBDEFLATE_DLL) && (defined(_WIN32) || defined(__CYGWIN__))
+#    define LIBDEFLATEAPI	__declspec(dllimport)
+#  else
+#    define LIBDEFLATEAPI
+#  endif
+#endif
+
+/* ========================================================================== */
+/*                             Compression                                    */
+/* ========================================================================== */
+
+struct libdeflate_compressor;
+struct libdeflate_options;
+
+/*
+ * libdeflate_alloc_compressor() allocates a new compressor that supports
+ * DEFLATE, zlib, and gzip compression.  'compression_level' is the compression
+ * level on a zlib-like scale but with a higher maximum value (1 = fastest, 6 =
+ * medium/default, 9 = slow, 12 = slowest).  Level 0 is also supported and means
+ * "no compression", specifically "create a valid stream, but only emit
+ * uncompressed blocks" (this will expand the data slightly).
+ *
+ * The return value is a pointer to the new compressor, or NULL if out of memory
+ * or if the compression level is invalid (i.e. outside the range [0, 12]).
+ *
+ * Note: for compression, the sliding window size is defined at compilation time
+ * to 32768, the largest size permissible in the DEFLATE format.  It cannot be
+ * changed at runtime.
+ *
+ * A single compressor is not safe to use by multiple threads concurrently.
+ * However, different threads may use different compressors concurrently.
+ */
+LIBDEFLATEAPI struct libdeflate_compressor *
+libdeflate_alloc_compressor(int compression_level);
+
+/*
+ * Like libdeflate_alloc_compressor(), but adds the 'options' argument.
+ */
+LIBDEFLATEAPI struct libdeflate_compressor *
+libdeflate_alloc_compressor_ex(int compression_level,
+			       const struct libdeflate_options *options);
+
+/*
+ * libdeflate_deflate_compress() performs raw DEFLATE compression on a buffer of
+ * data.  It attempts to compress 'in_nbytes' bytes of data located at 'in' and
+ * write the result to 'out', which has space for 'out_nbytes_avail' bytes.  The
+ * return value is the compressed size in bytes, or 0 if the data could not be
+ * compressed to 'out_nbytes_avail' bytes or fewer (but see note below).
+ *
+ * If compression is successful, then the output data is guaranteed to be a
+ * valid DEFLATE stream that decompresses to the input data.  No other
+ * guarantees are made about the output data.  Notably, different versions of
+ * libdeflate can produce different compressed data for the same uncompressed
+ * data, even at the same compression level.  Do ***NOT*** do things like
+ * writing tests that compare compressed data to a golden output, as this can
+ * break when libdeflate is updated.  (This property isn't specific to
+ * libdeflate; the same is true for zlib and other compression libraries too.)
+ */
+LIBDEFLATEAPI size_t
+libdeflate_deflate_compress(struct libdeflate_compressor *compressor,
+			    const void *in, size_t in_nbytes,
+			    void *out, size_t out_nbytes_avail);
+
+/*
+ * libdeflate_deflate_compress_bound() returns a worst-case upper bound on the
+ * number of bytes of compressed data that may be produced by compressing any
+ * buffer of length less than or equal to 'in_nbytes' using
+ * libdeflate_deflate_compress() with the specified compressor.  This bound will
+ * necessarily be a number greater than or equal to 'in_nbytes'.  It may be an
+ * overestimate of the true upper bound.  The return value is guaranteed to be
+ * the same for all invocations with the same compressor and same 'in_nbytes'.
+ *
+ * As a special case, 'compressor' may be NULL.  This causes the bound to be
+ * taken across *any* libdeflate_compressor that could ever be allocated with
+ * this build of the library, with any options.
+ *
+ * Note that this function is not necessary in many applications.  With
+ * block-based compression, it is usually preferable to separately store the
+ * uncompressed size of each block and to store any blocks that did not compress
+ * to less than their original size uncompressed.  In that scenario, there is no
+ * need to know the worst-case compressed size, since the maximum number of
+ * bytes of compressed data that may be used would always be one less than the
+ * input length.  You can just pass a buffer of that size to
+ * libdeflate_deflate_compress() and store the data uncompressed if
+ * libdeflate_deflate_compress() returns 0, indicating that the compressed data
+ * did not fit into the provided output buffer.
+ */
+LIBDEFLATEAPI size_t
+libdeflate_deflate_compress_bound(struct libdeflate_compressor *compressor,
+				  size_t in_nbytes);
+
+/*
+ * Like libdeflate_deflate_compress(), but uses the zlib wrapper format instead
+ * of raw DEFLATE.
+ */
+LIBDEFLATEAPI size_t
+libdeflate_zlib_compress(struct libdeflate_compressor *compressor,
+			 const void *in, size_t in_nbytes,
+			 void *out, size_t out_nbytes_avail);
+
+/*
+ * Like libdeflate_deflate_compress_bound(), but assumes the data will be
+ * compressed with libdeflate_zlib_compress() rather than with
+ * libdeflate_deflate_compress().
+ */
+LIBDEFLATEAPI size_t
+libdeflate_zlib_compress_bound(struct libdeflate_compressor *compressor,
+			       size_t in_nbytes);
+
+/*
+ * Like libdeflate_deflate_compress(), but uses the gzip wrapper format instead
+ * of raw DEFLATE.
+ */
+LIBDEFLATEAPI size_t
+libdeflate_gzip_compress(struct libdeflate_compressor *compressor,
+			 const void *in, size_t in_nbytes,
+			 void *out, size_t out_nbytes_avail);
+
+/*
+ * Like libdeflate_deflate_compress_bound(), but assumes the data will be
+ * compressed with libdeflate_gzip_compress() rather than with
+ * libdeflate_deflate_compress().
+ */
+LIBDEFLATEAPI size_t
+libdeflate_gzip_compress_bound(struct libdeflate_compressor *compressor,
+			       size_t in_nbytes);
+
+/*
+ * libdeflate_free_compressor() frees a compressor that was allocated with
+ * libdeflate_alloc_compressor().  If a NULL pointer is passed in, no action is
+ * taken.
+ */
+LIBDEFLATEAPI void
+libdeflate_free_compressor(struct libdeflate_compressor *compressor);
+
+/* ========================================================================== */
+/*                             Decompression                                  */
+/* ========================================================================== */
+
+struct libdeflate_decompressor;
+struct libdeflate_options;
+
+/*
+ * libdeflate_alloc_decompressor() allocates a new decompressor that can be used
+ * for DEFLATE, zlib, and gzip decompression.  The return value is a pointer to
+ * the new decompressor, or NULL if out of memory.
+ *
+ * This function takes no parameters, and the returned decompressor is valid for
+ * decompressing data that was compressed at any compression level and with any
+ * sliding window size.
+ *
+ * A single decompressor is not safe to use by multiple threads concurrently.
+ * However, different threads may use different decompressors concurrently.
+ */
+LIBDEFLATEAPI struct libdeflate_decompressor *
+libdeflate_alloc_decompressor(void);
+
+/*
+ * Like libdeflate_alloc_decompressor(), but adds the 'options' argument.
+ */
+LIBDEFLATEAPI struct libdeflate_decompressor *
+libdeflate_alloc_decompressor_ex(const struct libdeflate_options *options);
+
+/*
+ * Result of a call to libdeflate_deflate_decompress(),
+ * libdeflate_zlib_decompress(), libdeflate_gzip_decompress(), or an _ex variant.
+ */
+enum libdeflate_result {
+	/* Decompression was successful.  */
+	LIBDEFLATE_SUCCESS = 0,
+
+	/* Decompression failed because the compressed data was invalid,
+	 * corrupt, or otherwise unsupported.  */
+	LIBDEFLATE_BAD_DATA = 1,
+
+	/* A NULL 'actual_out_nbytes_ret' was provided, but the data would have
+	 * decompressed to fewer than 'out_nbytes_avail' bytes.  */
+	LIBDEFLATE_SHORT_OUTPUT = 2,
+
+	/* The data would have decompressed to more than 'out_nbytes_avail'
+	 * bytes.  */
+	LIBDEFLATE_INSUFFICIENT_SPACE = 3,
+};
+
+/*
+ * libdeflate_deflate_decompress() decompresses a DEFLATE stream from the buffer
+ * 'in' with compressed size up to 'in_nbytes' bytes.  The uncompressed data is
+ * written to 'out', a buffer with size 'out_nbytes_avail' bytes.  If
+ * decompression succeeds, then 0 (LIBDEFLATE_SUCCESS) is returned.  Otherwise,
+ * a nonzero result code such as LIBDEFLATE_BAD_DATA is returned, and the
+ * contents of the output buffer are undefined.
+ *
+ * Decompression stops at the end of the DEFLATE stream (as indicated by the
+ * BFINAL flag), even if it is actually shorter than 'in_nbytes' bytes.
+ *
+ * libdeflate_deflate_decompress() can be used in cases where the actual
+ * uncompressed size is known (recommended) or unknown (not recommended):
+ *
+ *   - If the actual uncompressed size is known, then pass the actual
+ *     uncompressed size as 'out_nbytes_avail' and pass NULL for
+ *     'actual_out_nbytes_ret'.  This makes libdeflate_deflate_decompress() fail
+ *     with LIBDEFLATE_SHORT_OUTPUT if the data decompressed to fewer than the
+ *     specified number of bytes.
+ *
+ *   - If the actual uncompressed size is unknown, then provide a non-NULL
+ *     'actual_out_nbytes_ret' and provide a buffer with some size
+ *     'out_nbytes_avail' that you think is large enough to hold all the
+ *     uncompressed data.  In this case, if the data decompresses to less than
+ *     or equal to 'out_nbytes_avail' bytes, then
+ *     libdeflate_deflate_decompress() will write the actual uncompressed size
+ *     to *actual_out_nbytes_ret and return 0 (LIBDEFLATE_SUCCESS).  Otherwise,
+ *     it will return LIBDEFLATE_INSUFFICIENT_SPACE if the provided buffer was
+ *     not large enough but no other problems were encountered, or another
+ *     nonzero result code if decompression failed for another reason.
+ */
+LIBDEFLATEAPI enum libdeflate_result
+libdeflate_deflate_decompress(struct libdeflate_decompressor *decompressor,
+			      const void *in, size_t in_nbytes,
+			      void *out, size_t out_nbytes_avail,
+			      size_t *actual_out_nbytes_ret);
+
+/*
+ * Like libdeflate_deflate_decompress(), but adds the 'actual_in_nbytes_ret'
+ * argument.  If decompression succeeds and 'actual_in_nbytes_ret' is not NULL,
+ * then the actual compressed size of the DEFLATE stream (aligned to the next
+ * byte boundary) is written to *actual_in_nbytes_ret.
+ */
+LIBDEFLATEAPI enum libdeflate_result
+libdeflate_deflate_decompress_ex(struct libdeflate_decompressor *decompressor,
+				 const void *in, size_t in_nbytes,
+				 void *out, size_t out_nbytes_avail,
+				 size_t *actual_in_nbytes_ret,
+				 size_t *actual_out_nbytes_ret);
+
+/*
+ * Like libdeflate_deflate_decompress(), but assumes the zlib wrapper format
+ * instead of raw DEFLATE.
+ *
+ * Decompression will stop at the end of the zlib stream, even if it is shorter
+ * than 'in_nbytes'.  If you need to know exactly where the zlib stream ended,
+ * use libdeflate_zlib_decompress_ex().
+ */
+LIBDEFLATEAPI enum libdeflate_result
+libdeflate_zlib_decompress(struct libdeflate_decompressor *decompressor,
+			   const void *in, size_t in_nbytes,
+			   void *out, size_t out_nbytes_avail,
+			   size_t *actual_out_nbytes_ret);
+
+/*
+ * Like libdeflate_zlib_decompress(), but adds the 'actual_in_nbytes_ret'
+ * argument.  If 'actual_in_nbytes_ret' is not NULL and the decompression
+ * succeeds (indicating that the first zlib-compressed stream in the input
+ * buffer was decompressed), then the actual number of input bytes consumed is
+ * written to *actual_in_nbytes_ret.
+ */
+LIBDEFLATEAPI enum libdeflate_result
+libdeflate_zlib_decompress_ex(struct libdeflate_decompressor *decompressor,
+			      const void *in, size_t in_nbytes,
+			      void *out, size_t out_nbytes_avail,
+			      size_t *actual_in_nbytes_ret,
+			      size_t *actual_out_nbytes_ret);
+
+/*
+ * Like libdeflate_deflate_decompress(), but assumes the gzip wrapper format
+ * instead of raw DEFLATE.
+ *
+ * If multiple gzip-compressed members are concatenated, then only the first
+ * will be decompressed.  Use libdeflate_gzip_decompress_ex() if you need
+ * multi-member support.
+ */
+LIBDEFLATEAPI enum libdeflate_result
+libdeflate_gzip_decompress(struct libdeflate_decompressor *decompressor,
+			   const void *in, size_t in_nbytes,
+			   void *out, size_t out_nbytes_avail,
+			   size_t *actual_out_nbytes_ret);
+
+/*
+ * Like libdeflate_gzip_decompress(), but adds the 'actual_in_nbytes_ret'
+ * argument.  If 'actual_in_nbytes_ret' is not NULL and the decompression
+ * succeeds (indicating that the first gzip-compressed member in the input
+ * buffer was decompressed), then the actual number of input bytes consumed is
+ * written to *actual_in_nbytes_ret.
+ */
+LIBDEFLATEAPI enum libdeflate_result
+libdeflate_gzip_decompress_ex(struct libdeflate_decompressor *decompressor,
+			      const void *in, size_t in_nbytes,
+			      void *out, size_t out_nbytes_avail,
+			      size_t *actual_in_nbytes_ret,
+			      size_t *actual_out_nbytes_ret);
+
+/*
+ * libdeflate_free_decompressor() frees a decompressor that was allocated with
+ * libdeflate_alloc_decompressor().  If a NULL pointer is passed in, no action
+ * is taken.
+ */
+LIBDEFLATEAPI void
+libdeflate_free_decompressor(struct libdeflate_decompressor *decompressor);
+
+/* ========================================================================== */
+/*                                Checksums                                   */
+/* ========================================================================== */
+
+/*
+ * libdeflate_adler32() updates a running Adler-32 checksum with 'len' bytes of
+ * data and returns the updated checksum.  When starting a new checksum, the
+ * required initial value for 'adler' is 1.  This value is also returned when
+ * 'buffer' is specified as NULL.
+ */
+LIBDEFLATEAPI uint32_t
+libdeflate_adler32(uint32_t adler, const void *buffer, size_t len);
+
+
+/*
+ * libdeflate_crc32() updates a running CRC-32 checksum with 'len' bytes of data
+ * and returns the updated checksum.  When starting a new checksum, the required
+ * initial value for 'crc' is 0.  This value is also returned when 'buffer' is
+ * specified as NULL.
+ */
+LIBDEFLATEAPI uint32_t
+libdeflate_crc32(uint32_t crc, const void *buffer, size_t len);
+
+/* ========================================================================== */
+/*                           Custom memory allocator                          */
+/* ========================================================================== */
+
+/*
+ * Install a custom memory allocator which libdeflate will use for all memory
+ * allocations by default.  'malloc_func' is a function that must behave like
+ * malloc(), and 'free_func' is a function that must behave like free().
+ *
+ * The per-(de)compressor custom memory allocator that can be specified in
+ * 'struct libdeflate_options' takes priority over this.
+ *
+ * This doesn't affect the free() function that will be used to free
+ * (de)compressors that were already in existence when this is called.
+ */
+LIBDEFLATEAPI void
+libdeflate_set_memory_allocator(void *(*malloc_func)(size_t),
+				void (*free_func)(void *));
+
+/*
+ * Advanced options.  This is the options structure that
+ * libdeflate_alloc_compressor_ex() and libdeflate_alloc_decompressor_ex()
+ * require.  Most users won't need this and should just use the non-"_ex"
+ * functions instead.  If you do need this, it should be initialized like this:
+ *
+ *	struct libdeflate_options options;
+ *
+ *	memset(&options, 0, sizeof(options));
+ *	options.sizeof_options = sizeof(options);
+ *	// Then set the fields that you need to override the defaults for.
+ */
+struct libdeflate_options {
+
+	/*
+	 * This field must be set to the struct size.  This field exists for
+	 * extensibility, so that fields can be appended to this struct in
+	 * future versions of libdeflate while still supporting old binaries.
+	 */
+	size_t sizeof_options;
+
+	/*
+	 * An optional custom memory allocator to use for this (de)compressor.
+	 * 'malloc_func' must be a function that behaves like malloc(), and
+	 * 'free_func' must be a function that behaves like free().
+	 *
+	 * This is useful in cases where a process might have multiple users of
+	 * libdeflate who want to use different memory allocators.  For example,
+	 * a library might want to use libdeflate with a custom memory allocator
+	 * without interfering with user code that might use libdeflate too.
+	 *
+	 * This takes priority over the "global" memory allocator (which by
+	 * default is malloc() and free(), but can be changed by
+	 * libdeflate_set_memory_allocator()).  Moreover, if every
+	 * (de)compressor is given a per-(de)compressor custom allocator, then
+	 * libdeflate will never call the "global" memory allocator.
+	 */
+	void *(*malloc_func)(size_t);
+	void (*free_func)(void *);
+};
+
+#ifdef __cplusplus
+}
+#endif
+
+#endif /* LIBDEFLATE_H */
diff --git a/Plugins/nosGeometry/External/openFBX/ofbx.cpp b/Plugins/nosGeometry/External/openFBX/ofbx.cpp
new file mode 100644
index 00000000..f14444e6
--- /dev/null
+++ b/Plugins/nosGeometry/External/openFBX/ofbx.cpp
@@ -0,0 +1,4102 @@
+#include "ofbx.h"
+#include "libdeflate.h"
+#include <cassert>
+#include <ctype.h>
+#include <inttypes.h>
+#include <math.h>
+#include <string.h>
+
+#if __cplusplus >= 202002L
+#include <bit> // for std::bit_cast (C++20 and later)
+#endif
+#include <cstdio>
+#include <map>
+#include <memory>
+#include <mutex>
+#include <numeric>
+#include <string>
+#include <unordered_map>
+#include <utility>
+#include <vector>
+
+namespace ofbx
+{
+
+// Maps a possibly negated index back to a plain index: non-negative input is
+// returned unchanged, negative input idx becomes -idx - 1 (the inverse of
+// codeIndex() with last == true).
+static int decodeIndex(int idx)
+{
+	if (idx >= 0) return idx;
+	return -idx - 1;
+}
+
+// Encodes an index: returned unchanged unless `last` is set, in which case it
+// is stored as the negative value -idx - 1.
+static int codeIndex(int idx, bool last)
+{
+	if (!last) return idx;
+	return -idx - 1;
+}
+
+// Appends one default-constructed element to `vec` and returns a reference to
+// that new last element.
+template <typename T>
+static T& emplace_back(std::vector<T>& vec) {
+	vec.emplace_back();
+	return vec[vec.size() - 1];
+}
+
+// Page-based bump allocator. Objects are placement-constructed inside large
+// fixed-size pages and are never released individually: destroying the
+// allocator deletes every page, without running the destructors of the
+// objects stored in them.
+struct Allocator {
+	struct Page {
+		struct {
+			Page* next = nullptr; // next page in the singly linked list
+			u32 offset = 0;       // bytes of `data` already handed out
+		} header;
+		u8 data[4096 * 1024 - 12];
+	};
+	Page* first = nullptr; // newest page; all allocations are served from it
+
+	~Allocator() {
+		for (Page* p = first; p != nullptr;) {
+			Page* next_page = p->header.next;
+			delete p;
+			p = next_page;
+		}
+	}
+
+	// Constructs a T from `args` inside the newest page and returns it.
+	// A fresh page is pushed to the front of the list when the object does
+	// not fit into the space left in the current one.
+	template <typename T, typename... Args> T* allocate(Args&&... args)
+	{
+		// The size limit is a compile-time fact, so check it at compile time
+		// instead of with an assert that vanishes in release builds.
+		static_assert(sizeof(T) <= sizeof(Page::data), "object does not fit into an allocator page");
+		if (!first) {
+			first = new Page;
+		}
+		Page* p = first;
+		// Round the write offset up to the alignment required by T.
+		if (p->header.offset % alignof(T) != 0) {
+			p->header.offset += alignof(T) - p->header.offset % alignof(T);
+		}
+
+		if (p->header.offset + sizeof(T) > sizeof(p->data)) {
+			p = new Page;
+			p->header.next = first;
+			first = p;
+		}
+		// Forward the arguments so rvalues are moved rather than copied.
+		T* res = new (p->data + p->header.offset) T(std::forward<Args>(args)...);
+		p->header.offset += sizeof(T);
+		return res;
+	}
+};
+
+
+// Plain record for one video entry: views of its filename, content and media
+// data, plus an optional property pointer for base64 content.
+// NOTE(review): the exact meaning of `content` vs `media` is decided by the
+// code that fills this struct — confirm there.
+struct Video
+{
+	IElementProperty* base64_property = nullptr;
+	DataView filename;
+	DataView content;
+	DataView media;
+	// Initialised so a default-constructed Video never carries an
+	// indeterminate flag.
+	bool is_base_64 = false;
+};
+
+
+// Carrier for the most recent error. Constructing an Error with a message
+// records that message in the static Error::s_message; the object itself
+// holds no state. s_message is a plain static, so none of this is thread-safe.
+struct Error
+{
+	// Leaves the previously recorded message untouched.
+	Error() {}
+
+	// Records `msg`. Only the pointer is stored, so `msg` must stay valid for
+	// as long as s_message may be read (e.g. a string literal).
+	Error(const char* msg)
+	{
+		s_message = msg;
+	}
+
+	// Format a message with printf-style arguments.
+	// The text goes into a static buffer: s_message only keeps a pointer, so
+	// a stack buffer would leave it dangling once this constructor returns.
+	// Output longer than the buffer is truncated by snprintf.
+	template <typename... Args>
+	Error(const char* fmt, Args... args)
+	{
+		static char buf[1024];
+		std::snprintf(buf, sizeof(buf), fmt, args...);
+		s_message = buf;
+	}
+
+	static const char* s_message;
+};
+
+
+const char* Error::s_message = "";
+
+
+// Result wrapper holding either a value of type T or an error flag.
+// In _DEBUG builds getValue() asserts that isError() has been called first.
+template <typename T> struct OptionalError
+{
+	// Error state. The Error argument is not read here; it only selects this
+	// overload. `value` is left without an initialiser.
+	OptionalError(Error)
+		: is_error(true)
+	{
+	}
+
+	// Success state holding a copy of `v`.
+	OptionalError(T v)
+		: value(v)
+		, is_error(false)
+	{
+	}
+
+	// Returns a copy of the stored value.
+	T getValue() const
+	{
+#ifdef _DEBUG
+		assert(error_checked);
+#endif
+		return value;
+	}
+
+	// Reports whether this result is an error (and, in _DEBUG builds, marks
+	// the result as checked).
+	bool isError()
+	{
+#ifdef _DEBUG
+		error_checked = true;
+#endif
+		return is_error;
+	}
+
+private:
+	T value;
+	bool is_error;
+#ifdef _DEBUG
+	bool error_checked = false;
+#endif
+};
+
+
+// Fixed-size header found at the start of a binary file. The struct is
+// packed to 1-byte alignment so that `version` follows the 23 preceding
+// bytes with no padding; tokenize() copies sizeof(Header) bytes straight
+// from the file buffer into it.
+#pragma pack(1)
+struct Header
+{
+	u8 magic[21];   // leading magic bytes (not inspected in the code visible here)
+	u8 reserved[2];
+	u32 version;    // format version; selects the 32- or 64-bit element offsets
+};
+#pragma pack()
+
+
+// Read position inside an in-memory byte buffer covering [begin, end).
+struct Cursor
+{
+	const u8* current; // next byte to be read
+	const u8* begin;   // first byte of the buffer
+	const u8* end;     // one past the last byte of the buffer
+};
+
+
+// Stores the components of `t` in elements 12, 13 and 14 of `mtx`.
+static void setTranslation(const DVec3& t, DMatrix* mtx)
+{
+	auto& m = mtx->m;
+	m[12] = t.x;
+	m[13] = t.y;
+	m[14] = t.z;
+}
+
+
+// Component-wise negation.
+static DVec3 operator-(const DVec3& v)
+{
+	DVec3 negated = {-v.x, -v.y, -v.z};
+	return negated;
+}
+
+
+// 4x4 matrix product. Element (i, j) lives at m[i + j * 4]; the result element
+// is the sum over k of lhs(i, k) * rhs(k, j).
+static DMatrix operator*(const DMatrix& lhs, const DMatrix& rhs)
+{
+	DMatrix product;
+	for (int flat = 0; flat < 16; ++flat)
+	{
+		const int i = flat % 4;
+		const int j = flat / 4;
+		double sum = 0;
+		for (int k = 0; k < 4; ++k)
+		{
+			sum += lhs.m[i + k * 4] * rhs.m[k + j * 4];
+		}
+		product.m[flat] = sum;
+	}
+	return product;
+}
+
+
+// Returns the 4x4 identity matrix.
+static DMatrix makeIdentity()
+{
+	return {
+		1, 0, 0, 0,
+		0, 1, 0, 0,
+		0, 0, 1, 0,
+		0, 0, 0, 1};
+}
+
+
+// Rotation about the X axis by `angle` radians.
+static DMatrix rotationX(double angle)
+{
+	const double c = cos(angle);
+	const double s = sin(angle);
+
+	DMatrix rot = makeIdentity();
+	rot.m[5] = c;
+	rot.m[6] = s;
+	rot.m[9] = -s;
+	rot.m[10] = c;
+	return rot;
+}
+
+
+// Rotation about the Y axis by `angle` radians.
+static DMatrix rotationY(double angle)
+{
+	const double c = cos(angle);
+	const double s = sin(angle);
+
+	DMatrix rot = makeIdentity();
+	rot.m[0] = c;
+	rot.m[2] = -s;
+	rot.m[8] = s;
+	rot.m[10] = c;
+	return rot;
+}
+
+
+// Rotation about the Z axis by `angle` radians.
+static DMatrix rotationZ(double angle)
+{
+	const double c = cos(angle);
+	const double s = sin(angle);
+
+	DMatrix rot = makeIdentity();
+	rot.m[0] = c;
+	rot.m[1] = s;
+	rot.m[4] = -s;
+	rot.m[5] = c;
+	return rot;
+}
+
+
+// Builds a rotation matrix from Euler angles given in degrees, combining the
+// per-axis rotations in the sequence selected by `order`. Unknown orders are
+// treated like EULER_XYZ. SPHERIC_XYZ is unsupported: it asserts, records an
+// error message and falls back to rx * ry * rz.
+static DMatrix getRotationMatrix(const DVec3& euler, RotationOrder order)
+{
+	const double TO_RAD = 3.1415926535897932384626433832795028 / 180.0;
+	const DMatrix rx = rotationX(euler.x * TO_RAD);
+	const DMatrix ry = rotationY(euler.y * TO_RAD);
+	const DMatrix rz = rotationZ(euler.z * TO_RAD);
+
+	switch (order)
+	{
+		case RotationOrder::EULER_XZY: return ry * rz * rx;
+		case RotationOrder::EULER_YXZ: return rz * rx * ry;
+		case RotationOrder::EULER_YZX: return rx * rz * ry;
+		case RotationOrder::EULER_ZXY: return ry * rx * rz;
+		case RotationOrder::EULER_ZYX: return rx * ry * rz;
+		case RotationOrder::SPHERIC_XYZ:
+			assert(false);
+			Error::s_message = "Unsupported rotation order.";
+			return rx * ry * rz;
+		case RotationOrder::EULER_XYZ:
+		default:
+			break;
+	}
+	return rz * ry * rx;
+}
+
+
+// Converts an FBX time value to seconds (46186158000 time units per second).
+double fbxTimeToSeconds(i64 value)
+{
+	return static_cast<double>(value) / 46186158000L;
+}
+
+
+// Converts seconds to an FBX time value (46186158000 time units per second),
+// truncating toward zero.
+i64 secondsToFbxTime(double value)
+{
+	return static_cast<i64>(value * 46186158000L);
+}
+
+
+// Scales every component of `v` by `f`.
+static DVec3 operator*(const DVec3& v, float f)
+{
+	DVec3 scaled = {v.x * f, v.y * f, v.z * f};
+	return scaled;
+}
+
+
+// Component-wise sum of two double-precision vectors.
+static DVec3 operator+(const DVec3& a, const DVec3& b)
+{
+	DVec3 sum = {a.x + b.x, a.y + b.y, a.z + b.z};
+	return sum;
+}
+
+// Component-wise sum of two single-precision vectors.
+static FVec3 operator+(const FVec3& a, const FVec3& b)
+{
+	FVec3 sum = {a.x + b.x, a.y + b.y, a.z + b.z};
+	return sum;
+}
+
+
+// Copies `source` into the fixed-size array `destination`, always leaving it
+// NUL-terminated. Returns true only when the whole string fit; returns false
+// (without touching `destination`) when `source` is null, and false after a
+// truncated copy.
+template <int SIZE> static bool copyString(char (&destination)[SIZE], const char* source)
+{
+	if (source == nullptr) return false;
+
+	int i = 0;
+	for (; source[i] != '\0' && i < SIZE - 1; ++i)
+	{
+		destination[i] = source[i];
+	}
+	destination[i] = 0;
+	return source[i] == '\0';
+}
+
+
+// Reads the view as an unsigned 64-bit integer: a raw byte copy for binary
+// data (the view must be exactly 8 bytes), a base-10 strtoull() parse
+// starting at `begin` for text data.
+u64 DataView::toU64() const
+{
+	static_assert(sizeof(unsigned long long) >= sizeof(u64), "can't use strtoull");
+	if (!is_binary) return strtoull((const char*)begin, nullptr, 10);
+
+	assert(end - begin == sizeof(u64));
+	u64 raw;
+	memcpy(&raw, begin, sizeof(raw));
+	return raw;
+}
+
+
+// Reads the view as a signed 64-bit integer: a raw byte copy for binary data
+// (the view must be exactly 8 bytes), an atoll() parse starting at `begin`
+// for text data.
+i64 DataView::toI64() const
+{
+	static_assert(sizeof(long long) >= sizeof(i64), "can't use atoll");
+	if (!is_binary) return atoll((const char*)begin);
+
+	assert(end - begin == sizeof(i64));
+	i64 raw;
+	memcpy(&raw, begin, sizeof(raw));
+	return raw;
+}
+
+
+// Reads the view as an int: a raw byte copy for binary data (the view must be
+// exactly sizeof(int) bytes), an atoi() parse starting at `begin` for text.
+int DataView::toInt() const
+{
+	if (!is_binary) return atoi((const char*)begin);
+
+	assert(end - begin == sizeof(int));
+	int raw;
+	memcpy(&raw, begin, sizeof(raw));
+	return raw;
+}
+
+
+// Reads the view as an unsigned 32-bit integer: a raw byte copy for binary
+// data (the view must be exactly 4 bytes); text is parsed with atoll() and
+// narrowed to u32.
+u32 DataView::toU32() const
+{
+	if (!is_binary) return (u32)atoll((const char*)begin);
+
+	assert(end - begin == sizeof(u32));
+	u32 raw;
+	memcpy(&raw, begin, sizeof(raw));
+	return raw;
+}
+
+// True when the view, read through toInt(), is non-zero.
+bool DataView::toBool() const
+{
+	const int as_int = toInt();
+	return as_int != 0;
+}
+
+
+// Reads the view as a double: a raw byte copy for binary data (the view must
+// be exactly 8 bytes), an atof() parse starting at `begin` for text.
+double DataView::toDouble() const
+{
+	if (!is_binary) return atof((const char*)begin);
+
+	assert(end - begin == sizeof(double));
+	double raw;
+	memcpy(&raw, begin, sizeof(raw));
+	return raw;
+}
+
+
+// Reads the view as a float: a raw byte copy for binary data (the view must
+// be exactly 4 bytes); text is parsed with atof() and narrowed to float.
+float DataView::toFloat() const
+{
+	if (!is_binary) return (float)atof((const char*)begin);
+
+	assert(end - begin == sizeof(float));
+	float raw;
+	memcpy(&raw, begin, sizeof(raw));
+	return raw;
+}
+
+
+// Compares the view with the NUL-terminated string `rhs`.
+// A view without data (begin == nullptr) equals only the empty string.
+// Otherwise the two are equal when every character of `rhs` matches and
+// `rhs` ends exactly where the view ends, or where the view holds a NUL byte
+// (an embedded NUL is treated as the end of the view's text).
+bool DataView::operator==(const char* rhs) const
+{
+	if (!begin) return !rhs[0];
+	const char* c = rhs;
+	const char* c2 = (const char*)begin;
+	const char* const view_end = (const char*)end;
+	while (*c && c2 != view_end)
+	{
+		if (*c != *c2) return false;
+		++c;
+		++c2;
+	}
+	// View exhausted: equal only if rhs is exhausted as well. c2 points one
+	// past the view here and must not be dereferenced; doing so made a view
+	// that is a proper prefix of rhs compare equal whenever the byte after
+	// the view happened to be NUL.
+	if (c2 == view_end) return *c == '\0';
+	// rhs ended first (the loop only stops early on *c == '\0'): equal when
+	// the view has a NUL at this position.
+	return *c2 == '\0';
+}
+
+
+struct Property;
+struct Element;
+
+template <typename T> static bool parseMemory(const Property& property, T* out, int max_size_bytes);
+template <typename T> static bool parseVecData(Property& property, std::vector<T>* out_vec);
+template <typename T> static bool parseVertexData(const Element& element, const char* name, const char* index_name, T& out, std::vector<struct ParseDataJob>& jobs);
+static bool parseDouble(Property& property, double* out);
+
+// One deferred parse task: `f` is called with `property` and the type-erased
+// output pointer `data` (see pushJob(), which fills all three).
+// NOTE(review): `error` is presumably set by whoever runs the job — confirm
+// at the call site.
+struct ParseDataJob {
+	using F = bool (*)(Property*, void*);
+	Property* property = nullptr;
+	void* data = nullptr;
+	bool error = false;
+	F f = nullptr; // initialised like the other members so a fresh job never holds a garbage function pointer
+};
+
+// Queues a job that will parse `prop` into the vector `data` via
+// parseVecData(). Both `prop` and `data` are captured by address, so they
+// must outlive the job. Always returns true.
+template <typename T> [[nodiscard]] bool pushJob(std::vector<ParseDataJob>& jobs, Property& prop, std::vector<T>& data) {
+	jobs.emplace_back();
+	ParseDataJob& queued = jobs.back();
+	queued.f = [](Property* p, void* out){ return parseVecData(*p, (std::vector<T>*)out); };
+	queued.data = (void*)&data;
+	queued.property = &prop;
+	return true;
+}
+
+// Concrete IElementProperty: one typed value of an Element, linked to the
+// element's following property through `next`.
+struct Property : IElementProperty
+{
+	Type getType() const override { return (Type)type; }
+	IElementProperty* getNext() const override { return next; }
+	DataView getValue() const override { return value; }
+
+	// Item count of an array-typed property. Binary values keep the count in
+	// their first bytes; text values use the `count` member.
+	int getCount() const override
+	{
+		assert(type == ARRAY_DOUBLE || type == ARRAY_INT || type == ARRAY_FLOAT || type == ARRAY_LONG);
+		if (!value.is_binary) return count;
+
+		int stored_count;
+		memcpy(&stored_count, value.begin, sizeof(stored_count));
+		return stored_count;
+	}
+
+	// Every getValues() overload defers to parseMemory(), passing `max_size`
+	// as its max_size_bytes argument.
+	bool getValues(double* values, int max_size) const override { return parseMemory(*this, values, max_size); }
+	bool getValues(float* values, int max_size) const override { return parseMemory(*this, values, max_size); }
+	bool getValues(u64* values, int max_size) const override { return parseMemory(*this, values, max_size); }
+	bool getValues(i64* values, int max_size) const override { return parseMemory(*this, values, max_size); }
+	bool getValues(int* values, int max_size) const override { return parseMemory(*this, values, max_size); }
+
+	int count = 0;            // item count for text arrays
+	u8 type = INTEGER;        // type code character
+	DataView value;           // bytes of the value inside the source buffer
+	Property* next = nullptr; // following property of the same element
+};
+
+// Concrete IElement: a tree node with an id, a linked list of properties and
+// first-child / next-sibling links.
+struct Element : IElement
+{
+	IElement* getFirstChild() const override { return child; }
+	IElement* getSibling() const override { return sibling; }
+	DataView getID() const override { return id; }
+	IElementProperty* getFirstProperty() const override { return first_property; }
+
+	// Returns the property at position `idx` in the list, or nullptr when the
+	// list is shorter. A non-positive `idx` yields the first property.
+	IElementProperty* getProperty(int idx) const
+	{
+		IElementProperty* prop = first_property;
+		int remaining = idx;
+		while (remaining > 0 && prop != nullptr)
+		{
+			prop = prop->getNext();
+			--remaining;
+		}
+		return prop;
+	}
+
+	DataView id;
+	Element* child = nullptr;
+	Element* sibling = nullptr;
+	Property* first_property = nullptr;
+};
+
+
+// Returns the first direct child of `element` whose id equals `id`, or
+// nullptr when there is none.
+static const Element* findChild(const Element& element, const char* id)
+{
+	for (const Element* it = element.child; it != nullptr; it = it->sibling)
+	{
+		if (it->id == id) return it;
+	}
+	return nullptr;
+}
+
+
+// Looks up the property entry called `name` on `obj`. The entry is searched
+// among the children of the object's "Properties70" element, or of
+// "Properties60" when the former is absent; an entry matches when its first
+// property equals `name`.
+// *is_p60 is set to true whenever "Properties70" is missing (even if
+// "Properties60" is missing too) and to false otherwise.
+// Returns the matching entry, or nullptr when nothing matches.
+static IElement* resolveProperty(const Object& obj, const char* name, bool* is_p60)
+{
+	const Element& owner = (const Element&)obj.element;
+
+	const Element* props = findChild(owner, "Properties70");
+	*is_p60 = (props == nullptr);
+	if (props == nullptr)
+	{
+		props = findChild(owner, "Properties60");
+		if (props == nullptr) return nullptr;
+	}
+
+	for (Element* entry = props->child; entry != nullptr; entry = entry->sibling)
+	{
+		if (entry->first_property && entry->first_property->value == name) return entry;
+	}
+	return nullptr;
+}
+
+
+// Returns the integer value of the property `name` on `object`, or
+// `default_value` when the property or its value slot is missing. The value
+// is the entry's property at index 3 (Properties60) or 4 (Properties70).
+static int resolveEnumProperty(const Object& object, const char* name, int default_value)
+{
+	bool legacy;
+	Element* entry = (Element*)resolveProperty(object, name, &legacy);
+	if (entry)
+	{
+		const int value_index = legacy ? 3 : 4;
+		if (Property* x = (Property*)entry->getProperty(value_index)) return x->value.toInt();
+	}
+	return default_value;
+}
+
+
+// Returns the three-component value of the property `name` on `object`, or
+// `default_value` when the property or any of its three value slots is
+// missing. The components are three consecutive properties of the entry,
+// starting at index 3 (Properties60) or 4 (Properties70).
+static DVec3 resolveVec3Property(const Object& object, const char* name, const DVec3& default_value)
+{
+	bool legacy;
+	Element* entry = (Element*)resolveProperty(object, name, &legacy);
+	if (!entry) return default_value;
+
+	Property* x = (Property*)entry->getProperty(legacy ? 3 : 4);
+	Property* y = x ? x->next : nullptr;
+	Property* z = y ? y->next : nullptr;
+	if (!z) return default_value;
+
+	DVec3 result = {x->value.toDouble(), y->value.toDouble(), z->value.toDouble()};
+	return result;
+}
+
+// True when `prop` is non-null and of type STRING.
+static bool isString(const Property* prop)
+{
+	return prop != nullptr && prop->getType() == Property::STRING;
+}
+
+
+// True when `prop` is non-null and of type LONG.
+static bool isLong(const Property* prop)
+{
+	return prop != nullptr && prop->getType() == Property::LONG;
+}
+
+// Inflates `in_size` bytes at `in` into the `out_size`-byte buffer `out`.
+// The first two input bytes are skipped and the rest is decoded as a raw
+// DEFLATE stream (presumably the skipped bytes are a zlib header — confirm
+// against the file format). Returns true on success; output shorter than
+// `out_size` is accepted because an actual-size out-parameter is supplied.
+static bool decompress(const u8* in, size_t in_size, u8* out, size_t out_size)
+{
+	// Without this guard `in_size - 2` below would wrap around to a huge value.
+	if (in_size < 2) return false;
+
+	auto dec = libdeflate_alloc_decompressor();
+	if (!dec) return false; // allocation failed
+
+	size_t dummy;
+	bool res = libdeflate_deflate_decompress(dec, in + 2, in_size - 2, out, out_size, &dummy) == LIBDEFLATE_SUCCESS;
+	libdeflate_free_decompressor(dec);
+	return res;
+}
+
+
+// Reads one T from the cursor and advances past it. Fails with
+// "Reading past the end" when fewer than sizeof(T) bytes remain.
+template <typename T> static OptionalError<T> read(Cursor* cursor)
+{
+	// Compare against the remaining byte count instead of forming
+	// current + sizeof(T), which may point outside the buffer.
+	if (cursor->end - cursor->current < (ptrdiff_t)sizeof(T)) return Error("Reading past the end");
+	// The buffer gives no alignment guarantee for T, so copy the bytes out
+	// rather than dereferencing a casted pointer.
+	T value;
+	memcpy(&value, cursor->current, sizeof(T));
+	cursor->current += sizeof(T);
+	return value;
+}
+
+
+// Reads a string prefixed by a one-byte length. The returned view points into
+// the cursor's buffer (nothing is copied) and the cursor is advanced past
+// the string. Fails when the length byte or the string would run past the
+// end of the buffer.
+static OptionalError<DataView> readShortString(Cursor* cursor)
+{
+	DataView value;
+	OptionalError<u8> length = read<u8>(cursor);
+	if (length.isError()) return Error();
+
+	// Check against the remaining byte count rather than forming a pointer
+	// that may lie outside the buffer.
+	if (cursor->end - cursor->current < (ptrdiff_t)length.getValue()) return Error("Reading past the end");
+	value.begin = cursor->current;
+	cursor->current += length.getValue();
+
+	value.end = cursor->current;
+
+	return value;
+}
+
+
+// Reads a string prefixed by a 32-bit length. The returned view points into
+// the cursor's buffer (nothing is copied) and the cursor is advanced past
+// the string. Fails when the length field or the string would run past the
+// end of the buffer.
+static OptionalError<DataView> readLongString(Cursor* cursor)
+{
+	DataView value;
+	OptionalError<u32> length = read<u32>(cursor);
+	if (length.isError()) return Error();
+
+	// Check against the remaining byte count: current + length could point
+	// far outside the buffer (and wrap around on 32-bit targets) for a
+	// corrupt length field.
+	const ptrdiff_t remaining = cursor->end - cursor->current;
+	if (remaining < 0 || (u64)remaining < length.getValue()) return Error("Reading past the end");
+	value.begin = cursor->current;
+	cursor->current += length.getValue();
+
+	value.end = cursor->current;
+
+	return value;
+}
+
+// 	Cheat sheet: //
+/*
+'S': Long string
+'Y': 16-bit signed integer
+'C': 1-bit boolean (1: true, 0: false), stored in the LSB of a 1-byte value
+'I': 32-bit signed integer
+'F': Single precision floating-point number
+'D': Double precision floating-point number
+'L': 64-bit signed integer
+'R': Binary data
+'b', 'f', 'd', 'l', 'c' and 'i': Arrays of binary data
+
+Src: https://code.blender.org/2013/08/fbx-binary-file-format-specification/
+*/
+
+// Reads one property of a binary element: a one-byte type code followed by a
+// payload whose size depends on the type. The new Property is allocated from
+// `allocator`, and its value covers the bytes after the type code up to the
+// end of the payload (for 'S' it is the string contents only). Fails on an
+// unknown type code or when the payload would run past the buffer end.
+static OptionalError<Property*> readProperty(Cursor* cursor, Allocator& allocator)
+{
+	if (cursor->current >= cursor->end) return Error("Reading past the end");
+
+	Property* prop = allocator.allocate<Property>();
+	prop->next = nullptr;
+	prop->type = *cursor->current;
+	++cursor->current;
+	prop->value.begin = cursor->current;
+
+	// Advances the cursor by `size` bytes, refusing to step past the end of
+	// the buffer (a truncated file must not yield a value view that extends
+	// beyond the data).
+	auto skipBytes = [cursor](u64 size) {
+		const ptrdiff_t remaining = cursor->end - cursor->current;
+		if (remaining < 0 || (u64)remaining < size) return false;
+		cursor->current += size;
+		return true;
+	};
+
+	switch (prop->type)
+	{
+		case 'S':
+		{
+			OptionalError<DataView> val = readLongString(cursor);
+			if (val.isError()) return Error();
+			prop->value = val.getValue();
+			break;
+		}
+		// Fixed-size scalars.
+		case 'Y': if (!skipBytes(2)) return Error("Reading past the end"); break;
+		case 'C': if (!skipBytes(1)) return Error("Reading past the end"); break;
+		case 'I': if (!skipBytes(4)) return Error("Reading past the end"); break;
+		case 'F': if (!skipBytes(4)) return Error("Reading past the end"); break;
+		case 'D': if (!skipBytes(8)) return Error("Reading past the end"); break;
+		case 'L': if (!skipBytes(8)) return Error("Reading past the end"); break;
+		case 'R':
+		{
+			// Raw binary blob: 32-bit length, then the bytes.
+			OptionalError<u32> len = read<u32>(cursor);
+			if (len.isError()) return Error();
+			if (!skipBytes(len.getValue())) return Error("Reading past the end");
+			break;
+		}
+		case 'b':
+		case 'c':
+		case 'f':
+		case 'd':
+		case 'l':
+		case 'i':
+		{
+			// Arrays: item count, encoding and stored byte length, followed
+			// by that many bytes of array data.
+			OptionalError<u32> length = read<u32>(cursor);
+			OptionalError<u32> encoding = read<u32>(cursor);
+			OptionalError<u32> comp_len = read<u32>(cursor);
+			if (length.isError() || encoding.isError() || comp_len.isError()) return Error();
+			if (!skipBytes(comp_len.getValue())) return Error("Reading past the end");
+			break;
+		}
+		default:
+		{
+			// Error only stores the pointer it is given, so the message
+			// buffer has to outlive this function.
+			static char str[32];
+			snprintf(str, sizeof(str), "Unknown property type: %c", prop->type);
+			return Error(str);
+		}
+	}
+	prop->value.end = cursor->current;
+	return prop;
+}
+
+// Reads an element header field, which is 64 bits wide for versions >= 7500
+// and 32 bits wide (widened to u64) for older versions.
+static OptionalError<u64> readElementOffset(Cursor* cursor, u32 version)
+{
+	if (version < 7500)
+	{
+		OptionalError<u32> narrow = read<u32>(cursor);
+		if (narrow.isError()) return Error();
+		return narrow.getValue();
+	}
+
+	OptionalError<u64> wide = read<u64>(cursor);
+	if (wide.isError()) return Error();
+	return wide.getValue();
+}
+
+
+// Reads one element record of a binary file, including its properties and,
+// recursively, its child elements.
+// Record layout as consumed here: end offset, property count, property list
+// length (each 32 or 64 bits wide depending on `version`), a short-string id,
+// the properties, then optional children followed by a block sentinel.
+// Returns the new Element, a successful nullptr for a record whose end offset
+// is 0, or an error when any read fails.
+static OptionalError<Element*> readElement(Cursor* cursor, u32 version, Allocator& allocator)
+{
+	OptionalError<u64> end_offset = readElementOffset(cursor, version);
+	if (end_offset.isError()) return Error();
+	// A zero end offset marks an empty record: there is no element to return.
+	if (end_offset.getValue() == 0) return nullptr;
+
+	OptionalError<u64> prop_count = readElementOffset(cursor, version);
+	// The property list length is read to advance the cursor; its value is
+	// only checked for a read error.
+	OptionalError<u64> prop_length = readElementOffset(cursor, version);
+	if (prop_count.isError() || prop_length.isError()) return Error();
+
+	OptionalError<DataView> id = readShortString(cursor);
+	if (id.isError()) return Error();
+
+	Element* element = allocator.allocate<Element>();
+	element->first_property = nullptr;
+	element->id = id.getValue();
+
+	element->child = nullptr;
+	element->sibling = nullptr;
+
+	// Append each property to the end of the element's property list.
+	Property** prop_link = &element->first_property;
+	for (u32 i = 0; i < prop_count.getValue(); ++i)
+	{
+		OptionalError<Property*> prop = readProperty(cursor, allocator);
+		if (prop.isError())
+		{
+			return Error();
+		}
+
+		*prop_link = prop.getValue();
+		prop_link = &(*prop_link)->next;
+	}
+
+	// The record ends right after its properties: no children, no sentinel.
+	if (cursor->current - cursor->begin >= (ptrdiff_t)end_offset.getValue()) return element;
+
+	// Size of the sentinel that closes a nested block; it depends on the
+	// width of the header fields.
+	int BLOCK_SENTINEL_LENGTH = version >= 7500 ? 25 : 13;
+
+	// Read children until only the sentinel is left before end_offset.
+	Element** link = &element->child;
+	while (cursor->current - cursor->begin < ((ptrdiff_t)end_offset.getValue() - BLOCK_SENTINEL_LENGTH))
+	{
+		OptionalError<Element*> child = readElement(cursor, version, allocator);
+		if (child.isError())
+		{
+			return Error();
+		}
+
+		*link = child.getValue();
+		// An empty child record ends the list early.
+		if (child.getValue() == 0) break;
+		link = &(*link)->sibling;
+	}
+
+	if (cursor->current + BLOCK_SENTINEL_LENGTH > cursor->end)
+	{
+		return Error("Reading past the end");
+	}
+
+	// Skip the sentinel.
+	cursor->current += BLOCK_SENTINEL_LENGTH;
+	return element;
+}
+
+
+// True when the cursor is at a line end: a '\n', or a '\r' that has a
+// following byte inside the buffer which is not '\n' (for "\r\n" only the
+// '\n' counts). The caller must ensure cursor.current is inside the buffer.
+static bool isEndLine(const Cursor& cursor)
+{
+	const u8 c = *cursor.current;
+	if (c == '\n') return true;
+	if (c != '\r') return false;
+
+	const u8* following = cursor.current + 1;
+	return following < cursor.end && *following != '\n';
+}
+
+
+// Advances over whitespace but stops at a line end (see isEndLine()) or at
+// the end of the buffer.
+static void skipInsignificantWhitespaces(Cursor* cursor)
+{
+	for (; cursor->current < cursor->end; ++cursor->current)
+	{
+		if (!isspace(*cursor->current)) break;
+		if (isEndLine(*cursor)) break;
+	}
+}
+
+
+// Advances to the next line end, steps over that one character (if the
+// buffer has not ended) and then skips insignificant whitespace.
+static void skipLine(Cursor* cursor)
+{
+	for (; cursor->current < cursor->end; ++cursor->current)
+	{
+		if (isEndLine(*cursor)) break;
+	}
+	if (cursor->current < cursor->end)
+	{
+		++cursor->current;
+	}
+	skipInsignificantWhitespaces(cursor);
+}
+
+
+// Skips all whitespace (line ends included) and then every consecutive line
+// that starts with ';'.
+static void skipWhitespaces(Cursor* cursor)
+{
+	for (; cursor->current < cursor->end; ++cursor->current)
+	{
+		if (!isspace(*cursor->current)) break;
+	}
+	for (;;)
+	{
+		if (cursor->current >= cursor->end) break;
+		if (*cursor->current != ';') break;
+		skipLine(cursor);
+	}
+}
+
+
+// True for characters allowed in a text token: alphanumerics, '_' and '-'.
+static bool isTextTokenChar(char c)
+{
+	// isalnum() is only defined for values representable as unsigned char
+	// (or EOF); a plain char holding a byte >= 0x80 may be negative.
+	return isalnum(static_cast<unsigned char>(c)) || c == '_' || c == '-';
+}
+
+
+// Consumes the longest run of token characters at the cursor and returns a
+// view of it (empty when the cursor is not at a token character).
+static DataView readTextToken(Cursor* cursor)
+{
+	const u8* const token_begin = cursor->current;
+	const u8* p = token_begin;
+	while (p < cursor->end && isTextTokenChar(*p)) ++p;
+	cursor->current = p;
+
+	DataView ret;
+	ret.begin = token_begin;
+	ret.end = p;
+	return ret;
+}
+
+
+// Consumes the exponent part of a number. On entry the cursor is at the
+// 'e'/'E'; an optional sign ('-' or '+') and the digits after it are skipped.
+static void skipTextExponent(Cursor* cursor)
+{
+	++cursor->current; // 'e' or 'E'
+	if (cursor->current < cursor->end && (*cursor->current == '-' || *cursor->current == '+')) ++cursor->current;
+	while (cursor->current < cursor->end && isdigit(*cursor->current)) ++cursor->current;
+}
+
+
+// Reads one property of a text-format element. The caller must ensure the
+// cursor is inside the buffer. Recognised forms, chosen by the first
+// character:
+//   "..."        string ('S'); the view excludes the quotes
+//   digit or '-' number: 'L' for plain integers, 'D' once a fraction or an
+//                exponent (e.g. 10.5e-013, 1e+006) is present
+//   T, Y, W, C   single-character property whose type is that character
+//   ,            empty property (type NONE); the comma is not consumed
+//   *N { a: .. } array: 'l', or 'd' if a '.' occurs in the data; `count` is
+//                the number of comma-separated items
+// Anything else asserts and yields an "Unknown error".
+static OptionalError<Property*> readTextProperty(Cursor* cursor, Allocator& allocator)
+{
+	Property* prop = allocator.allocate<Property>();
+	prop->value.is_binary = false;
+	prop->next = nullptr;
+	if (*cursor->current == '"')
+	{
+		prop->type = 'S';
+		++cursor->current;
+		prop->value.begin = cursor->current;
+		while (cursor->current < cursor->end && *cursor->current != '"')
+		{
+			++cursor->current;
+		}
+		prop->value.end = cursor->current;
+		if (cursor->current < cursor->end) ++cursor->current; // skip '"'
+		return prop;
+	}
+
+	if (isdigit(*cursor->current) || *cursor->current == '-')
+	{
+		prop->type = 'L';
+		prop->value.begin = cursor->current;
+		if (*cursor->current == '-') ++cursor->current;
+		while (cursor->current < cursor->end && isdigit(*cursor->current))
+		{
+			++cursor->current;
+		}
+		prop->value.end = cursor->current;
+
+		if (cursor->current < cursor->end && *cursor->current == '.')
+		{
+			prop->type = 'D';
+			++cursor->current;
+			while (cursor->current < cursor->end && isdigit(*cursor->current))
+			{
+				++cursor->current;
+			}
+			if (cursor->current < cursor->end && (*cursor->current == 'e' || *cursor->current == 'E'))
+			{
+				// 10.5e-013
+				skipTextExponent(cursor);
+			}
+
+			prop->value.end = cursor->current;
+		}
+		else if (cursor->current < cursor->end && (*cursor->current == 'e' || *cursor->current == 'E')) {
+			prop->type = 'D';
+			// 10e-013
+			skipTextExponent(cursor);
+			prop->value.end = cursor->current;
+		}
+		return prop;
+	}
+
+	if (*cursor->current == 'T' || *cursor->current == 'Y' || *cursor->current == 'W' || *cursor->current == 'C')
+	{
+		// Single-letter property; the letter itself becomes the type.
+		prop->type = *cursor->current;
+		prop->value.begin = cursor->current;
+		++cursor->current;
+		prop->value.end = cursor->current;
+		return prop;
+	}
+
+	if (*cursor->current == ',') {
+		// https://github.com/nem0/OpenFBX/issues/85
+		prop->type = IElementProperty::NONE;
+		prop->value.begin = cursor->current;
+		prop->value.end = cursor->current;
+		return prop;
+	}
+
+	if (*cursor->current == '*')
+	{
+		prop->type = 'l';
+		++cursor->current;
+		// Vertices: *10740 { a: 14.2760353088379,... }
+		while (cursor->current < cursor->end && *cursor->current != ':')
+		{
+			++cursor->current;
+		}
+		if (cursor->current < cursor->end) ++cursor->current; // skip ':'
+		skipInsignificantWhitespaces(cursor);
+		prop->value.begin = cursor->current;
+		prop->count = 0;
+		// is_any: a non-whitespace character has been seen since the last
+		// comma, i.e. the current item is not empty.
+		bool is_any = false;
+		while (cursor->current < cursor->end && *cursor->current != '}')
+		{
+			if (*cursor->current == ',')
+			{
+				if (is_any) ++prop->count;
+				is_any = false;
+			}
+			else if (!isspace(*cursor->current) && !isEndLine(*cursor))
+				is_any = true;
+			if (*cursor->current == '.') prop->type = 'd';
+			++cursor->current;
+		}
+		if (is_any) ++prop->count;
+		prop->value.end = cursor->current;
+		if (cursor->current < cursor->end) ++cursor->current; // skip '}'
+		return prop;
+	}
+
+	assert(false);
+	return Error("Unknown error");
+}
+
+
+// Reads one text-format element: `id:` followed by comma-separated
+// properties on the same line and an optional `{ ... }` block of child
+// elements, which are read recursively.
+// Fails when the id is not followed by ':', when the input ends right after
+// the ':', or when a property or child fails to parse.
+static OptionalError<Element*> readTextElement(Cursor* cursor, Allocator& allocator)
+{
+	DataView id = readTextToken(cursor);
+	if (cursor->current == cursor->end) return Error("Unexpected end of file");
+	if (*cursor->current != ':') return Error("Unexpected character");
+	++cursor->current;
+
+	skipInsignificantWhitespaces(cursor);
+	if (cursor->current == cursor->end) return Error("Unexpected end of file");
+
+	Element* element = allocator.allocate<Element>();
+	element->id = id;
+
+	// Properties run until the end of the line or the opening brace.
+	Property** prop_link = &element->first_property;
+	while (cursor->current < cursor->end && !isEndLine(*cursor) && *cursor->current != '{')
+	{
+		OptionalError<Property*> prop = readTextProperty(cursor, allocator);
+		if (prop.isError())
+		{
+			return Error();
+		}
+		if (cursor->current < cursor->end && *cursor->current == ',')
+		{
+			++cursor->current;
+			skipWhitespaces(cursor);
+		}
+		skipInsignificantWhitespaces(cursor);
+
+		*prop_link = prop.getValue();
+		prop_link = &(*prop_link)->next;
+	}
+
+	Element** link = &element->child;
+	// The property loop may have stopped at the end of the buffer, so check
+	// the bounds before looking at the current character.
+	if (cursor->current < cursor->end && *cursor->current == '{')
+	{
+		++cursor->current;
+		skipWhitespaces(cursor);
+		while (cursor->current < cursor->end && *cursor->current != '}')
+		{
+			OptionalError<Element*> child = readTextElement(cursor, allocator);
+			if (child.isError())
+			{
+				return Error();
+			}
+			skipWhitespaces(cursor);
+
+			*link = child.getValue();
+			link = &(*link)->sibling;
+		}
+		if (cursor->current < cursor->end) ++cursor->current; // skip '}'
+	}
+	return element;
+}
+
+
+// Tokenizes a text-format buffer into an element tree. The returned root is a
+// synthetic element without id or properties whose children are the
+// top-level elements. Lines starting with ';' and empty lines are skipped.
+static OptionalError<Element*> tokenizeText(const u8* data, size_t size, Allocator& allocator)
+{
+	Cursor cursor;
+	cursor.current = data;
+	cursor.begin = data;
+	cursor.end = data + size;
+
+	Element* root = allocator.allocate<Element>();
+	root->id.begin = nullptr;
+	root->id.end = nullptr;
+	root->first_property = nullptr;
+	root->sibling = nullptr;
+	root->child = nullptr;
+
+	// `tail` always points at the link where the next element gets attached.
+	Element** tail = &root->child;
+	while (cursor.current < cursor.end)
+	{
+		const u8 c = *cursor.current;
+		if (c == ';' || c == '\r' || c == '\n')
+		{
+			skipLine(&cursor);
+			continue;
+		}
+
+		OptionalError<Element*> child = readTextElement(&cursor, allocator);
+		if (child.isError())
+		{
+			return Error();
+		}
+		*tail = child.getValue();
+		if (*tail == nullptr) break;
+		tail = &(*tail)->sibling;
+	}
+
+	return root;
+}
+
+
+// Tokenizes a binary buffer into an element tree. The file version from the
+// header is written to `version`. The returned root is a synthetic element
+// without id or properties whose children are the top-level elements;
+// reading stops at the first empty record.
+// Fails with "Invalid header" when the buffer is shorter than the header,
+// or when an element fails to parse.
+static OptionalError<Element*> tokenize(const u8* data, size_t size, u32& version, Allocator& allocator) {
+	if (size < sizeof(Header)) return Error("Invalid header");
+
+	Cursor cursor;
+	cursor.begin = data;
+	cursor.current = data;
+	cursor.end = data + size;
+
+	// Copy the header out of the byte buffer on every language standard.
+	// Reading it through a pointer cast (which is all a pointer bit_cast
+	// amounts to) would access the raw bytes through an unrelated type.
+	Header header;
+	memcpy(&header, cursor.current, sizeof(Header));
+
+	cursor.current += sizeof(Header);
+	version = header.version;
+
+	Element* root = allocator.allocate<Element>();
+	root->first_property = nullptr;
+	root->id.begin = nullptr;
+	root->id.end = nullptr;
+	root->child = nullptr;
+	root->sibling = nullptr;
+
+	Element** element = &root->child;
+	for (;;)
+	{
+		OptionalError<Element*> child = readElement(&cursor, header.version, allocator);
+		if (child.isError())
+		{
+			return Error();
+		}
+
+		*element = child.getValue();
+		// A null element is the empty record that ends the top-level list.
+		if (!*element) return root;
+		element = &(*element)->sibling;
+	}
+}
+
+// Collects the "PropertyTemplate" elements found under
+// Definitions/ObjectType, keyed by the ObjectType's first property value
+// followed by the template's first property value.
+// The collected map is not used yet (see the TODO at the end).
+static void parseTemplates(const Element& root)
+{
+	const Element* defs = findChild(root, "Definitions");
+	if (!defs) return;
+
+	std::unordered_map<std::string, Element*> templates;
+	Element* def = defs->child;
+	while (def)
+	{
+		if (def->id == "ObjectType")
+		{
+			Element* subdef = def->child;
+			while (subdef)
+			{
+				// Both elements need a first property to build the key from.
+				if (subdef->id == "PropertyTemplate" && def->first_property && subdef->first_property)
+				{
+					DataView prop1 = def->first_property->value;
+					DataView prop2 = subdef->first_property->value;
+					std::string key((const char*)prop1.begin, prop1.end - prop1.begin);
+					// Append the template's own name; appending prop1 a
+					// second time gave every template of one ObjectType the
+					// same key.
+					key.append((const char*)prop2.begin, prop2.end - prop2.begin);
+					templates[key] = subdef;
+				}
+				subdef = subdef->sibling;
+			}
+		}
+		def = def->sibling;
+	}
+	// TODO
+}
+
+
+struct Scene;
+
+// How the entries of a vertex attribute correspond to the geometry.
+// GeometryDataImpl::postprocess() converts the other mappings to BY_POLYGON_VERTEX where it can.
+enum class VertexDataMapping {
+	BY_POLYGON_VERTEX, // target layout of the postprocess remapping
+	BY_POLYGON, // postprocess requires exactly one value per polygon for this mapping
+	BY_VERTEX // without own indices, the attribute is read through the position indices
+};
+
+// Owning storage for a two-component vertex attribute. Converts implicitly to the
+// non-owning Vec2Attributes view.
+struct Vec2AttributesImpl {
+	std::vector<Vec2> values;
+	std::vector<int> indices;
+	VertexDataMapping mapping;
+
+	// The reported count is the number of indices when indices exist, otherwise the number of values.
+	operator Vec2Attributes() const {
+		const size_t element_count = indices.empty() ? values.size() : indices.size();
+		return { values.data(), indices.data(), int(element_count) };
+	}
+};
+
+// Owning storage for a three-component vertex attribute. Converts implicitly to the
+// non-owning Vec3Attributes view, which additionally carries the raw value count.
+struct Vec3AttributesImpl {
+	std::vector<Vec3> values;
+	std::vector<int> indices;
+	VertexDataMapping mapping;
+
+	// The element count is the number of indices when indices exist, otherwise the number of values.
+	operator Vec3Attributes() const {
+		const size_t element_count = indices.empty() ? values.size() : indices.size();
+		const int values_count = int(values.size());
+		return { values.data(), indices.data(), int(element_count), values_count };
+	}
+};
+
+// Owning storage for a four-component vertex attribute. Converts implicitly to the
+// non-owning Vec4Attributes view.
+struct Vec4AttributesImpl {
+	std::vector<Vec4> values;
+	std::vector<int> indices;
+	VertexDataMapping mapping;
+
+	// The reported count is the number of indices when indices exist, otherwise the number of values.
+	operator Vec4Attributes() const {
+		const size_t element_count = indices.empty() ? values.size() : indices.size();
+		return { values.data(), indices.data(), int(element_count) };
+	}
+};
+
+// Polygons belonging to one partition of a geometry, plus the triangle statistics that
+// GeometryDataImpl::postprocess() accumulates for them.
+struct GeometryPartitionImpl {
+	std::vector<GeometryPartition::Polygon> polygons;
+	int max_polygon_triangles{0}; // largest (vertex count - 2) among the polygons
+	int triangles_count{0};       // sum of (vertex count - 2) over the polygons
+};
+
+// Concrete storage behind the GeometryData interface: owns positions, normals, tangents,
+// colors, UV sets and the polygon partitions derived from the per-polygon material list.
+struct GeometryDataImpl : GeometryData {
+	Vec3AttributesImpl positions;
+	Vec3AttributesImpl normals;
+	Vec3AttributesImpl tangents;
+	Vec4AttributesImpl colors;
+	Vec2AttributesImpl uvs[Geometry::s_uvs_max];
+	std::vector<GeometryPartitionImpl> partitions;
+
+	// One partition index per polygon; when empty, postprocess() builds a single partition.
+	std::vector<int> materials;
+
+	// Converts an owning attribute into its public view. A non-empty BY_VERTEX attribute
+	// without an index buffer of its own borrows the position indices.
+	template <typename T, typename S>
+	T patchAttributes(const S& attr) const {
+		T res = attr;
+		if (!attr.values.empty() && attr.mapping == VertexDataMapping::BY_VERTEX && attr.indices.empty()) {
+			res.indices = positions.indices.data();
+		}
+		return res;
+	}
+
+	Vec3Attributes getPositions() const override { return positions; }
+	Vec3Attributes getNormals() const override { return patchAttributes<Vec3Attributes>(normals); }
+	// Returns an empty view for a UV set index outside [0, Geometry::s_uvs_max).
+	Vec2Attributes getUVs(int index) const override {
+		if (index < 0 || index >= Geometry::s_uvs_max) return Vec2AttributesImpl{};
+		return patchAttributes<Vec2Attributes>(uvs[index]);
+	}
+	Vec4Attributes getColors() const override { return patchAttributes<Vec4Attributes>(colors); }
+	Vec3Attributes getTangents() const override { return patchAttributes<Vec3Attributes>(tangents); }
+	int getPartitionCount() const override { return (int)partitions.size(); }
+
+	// Returns an empty partition ({nullptr, 0, 0, 0}) for an out-of-range index.
+	GeometryPartition getPartition(int index) const override {
+		if (index < 0 || index >= (int)partitions.size()) return {nullptr, 0, 0, 0};
+		const GeometryPartitionImpl& partition = partitions[index];
+		return {
+			partition.polygons.data(),
+			int(partition.polygons.size()),
+			partition.max_polygon_triangles,
+			partition.triangles_count
+		};
+	}
+
+	// Converts one attribute to BY_POLYGON_VERTEX mapping where needed.
+	// Returns false for unsupported or invalid input; the attribute is left unmodified then.
+	template <typename T>
+	bool postprocess(T& attr) {
+		if (attr.values.empty()) return true;
+		if (attr.mapping == VertexDataMapping::BY_VERTEX && !attr.indices.empty()) {
+			if (positions.indices.empty()) return false; // not supported
+
+			std::vector<int> remapped(positions.indices.size());
+			for (size_t i = 0; i < remapped.size(); ++i) {
+				const int vertex = decodeIndex(positions.indices[i]);
+				// A position index without a matching attribute index means inconsistent input.
+				if (vertex < 0 || (size_t)vertex >= attr.indices.size()) return false; // invalid
+				remapped[i] = attr.indices[vertex];
+			}
+			// Commit only after the whole remap succeeded.
+			attr.mapping = VertexDataMapping::BY_POLYGON_VERTEX;
+			attr.indices.swap(remapped);
+		}
+		else if (attr.mapping == VertexDataMapping::BY_POLYGON) {
+			if (!attr.indices.empty()) return false; // not supported
+			if (partitions.size() != 1) return false; // not supported
+			if (partitions[0].polygons.size() != attr.values.size()) return false; // invalid
+
+			// Every polygon vertex refers to the value of the polygon it belongs to.
+			std::vector<int> remapped(positions.indices.size());
+			for (int i = 0, c = (int)partitions[0].polygons.size(); i < c; ++i) {
+				const GeometryPartition::Polygon& polygon = partitions[0].polygons[i];
+				for (int j = polygon.from_vertex; j < polygon.from_vertex + polygon.vertex_count; ++j) {
+					remapped[j] = i;
+				}
+			}
+			attr.mapping = VertexDataMapping::BY_POLYGON_VERTEX;
+			attr.indices.swap(remapped);
+		}
+		return true;
+	}
+
+	// Splits the position index stream into polygons (a negative index marks the last vertex
+	// of a polygon and is decoded in place as -index - 1), groups the polygons into
+	// partitions, then converts the remaining attributes.
+	// Returns false when the material list does not cover every polygon or holds a negative entry.
+	bool postprocess() {
+		if (materials.empty()) {
+			GeometryPartitionImpl& partition = emplace_back(partitions);
+			int polygon_count = 0;
+			for (int i : positions.indices) {
+				if (i < 0) ++polygon_count;
+			}
+			partition.polygons.reserve(polygon_count);
+			int polygon_start = 0;
+			int max_polygon_triangles = 0;
+			int total_triangles = 0;
+			int* indices = positions.indices.data();
+			for (int i = 0, c = (int)positions.indices.size(); i < c; ++i) {
+				if (indices[i] < 0) {
+					int vertex_count = i - polygon_start + 1;
+					// Polygons with fewer than three vertices are dropped; their end marker stays encoded.
+					if (vertex_count > 2) {
+						partition.polygons.push_back({polygon_start, vertex_count});
+						indices[i] = -indices[i] - 1;
+						int triangles = vertex_count - 2;
+						total_triangles += triangles;
+						if (triangles > max_polygon_triangles) max_polygon_triangles = triangles;
+					}
+					polygon_start = i + 1;
+				}
+			}
+			partition.max_polygon_triangles = max_polygon_triangles;
+			partition.triangles_count = total_triangles;
+		}
+		else {
+			int max_partition = 0;
+			for (int m : materials) {
+				if (m > max_partition) max_partition = m;
+			}
+			partitions.resize(max_partition + 1);
+
+			size_t polygon_idx = 0;
+			int* indices = positions.indices.data();
+			int num_polygon_vertices = 0;
+			int polygon_start = 0;
+			for (int i = 0, c = (int)positions.indices.size(); i < c; ++i) {
+				++num_polygon_vertices;
+				if (indices[i] < 0) {
+					// Guard against a material list shorter than the polygon list and against
+					// negative entries; either would index out of bounds below.
+					if (polygon_idx >= materials.size()) return false; // invalid
+					const int material_index = materials[polygon_idx];
+					if (material_index < 0) return false; // invalid
+
+					GeometryPartitionImpl& partition = partitions[material_index];
+					partition.polygons.push_back({polygon_start, num_polygon_vertices});
+
+					int triangles = num_polygon_vertices - 2;
+					partition.triangles_count += triangles;
+					if (triangles > partition.max_polygon_triangles) partition.max_polygon_triangles = triangles;
+
+					indices[i] = -indices[i] - 1;
+
+					polygon_start = i + 1;
+					++polygon_idx;
+					num_polygon_vertices = 0;
+				}
+			}
+		}
+
+		// The per-attribute results are intentionally not propagated: an attribute that cannot
+		// be converted keeps its original mapping and does not fail the whole geometry.
+		postprocess(normals);
+		postprocess(tangents);
+		for (Vec2AttributesImpl& uv : uvs) postprocess(uv);
+		postprocess(colors);
+
+		return true;
+	}
+};
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+Mesh::Mesh(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+// Geometry object that also is its own GeometryData storage (via GeometryDataImpl).
+struct GeometryImpl : Geometry, GeometryDataImpl {
+	GeometryImpl(const Scene& _scene, const IElement& _element) : Geometry(_scene, _element) {}
+
+	Type getType() const override { return Type::GEOMETRY; }
+
+	// The vertex data lives in the GeometryDataImpl base of this very object.
+	const GeometryData& getGeometryData() const override { return *this; }
+
+	const Skin* getSkin() const override { return skin; }
+	const BlendShape* getBlendShape() const override { return blendShape; }
+
+	// Deformers attached to this geometry; null until something assigns them.
+	const Skin* skin = nullptr;
+	const BlendShape* blendShape = nullptr;
+};
+
+// Mesh node. Vertex data comes from the linked GeometryImpl when there is one, otherwise
+// from the geometry data embedded in the mesh itself.
+struct MeshImpl : Mesh
+{
+	MeshImpl(const Scene& _scene, const IElement& _element)
+		: Mesh(_scene, _element)
+	{
+		is_node = true;
+	}
+
+
+	// Builds the geometric transform from the GeometricTranslation / GeometricRotation /
+	// GeometricScaling properties (defaults: no translation, no rotation, unit scale).
+	DMatrix getGeometricMatrix() const override
+	{
+		DVec3 translation = resolveVec3Property(*this, "GeometricTranslation", {0, 0, 0});
+		DVec3 rotation = resolveVec3Property(*this, "GeometricRotation", {0, 0, 0});
+		DVec3 scale = resolveVec3Property(*this, "GeometricScaling", {1, 1, 1});
+
+		DMatrix scale_mtx = makeIdentity();
+		// NOTE(review): the float casts narrow the scale before it is stored; confirm whether
+		// that precision loss is intended.
+		scale_mtx.m[0] = (float)scale.x;
+		scale_mtx.m[5] = (float)scale.y;
+		scale_mtx.m[10] = (float)scale.z;
+		DMatrix mtx = getRotationMatrix(rotation, RotationOrder::EULER_XYZ);
+		setTranslation(translation, &mtx);
+
+		return scale_mtx * mtx;
+	}
+
+	Type getType() const override { return Type::MESH; }
+
+	const Pose* getPose() const override { return pose; }
+	const Geometry* getGeometry() const override { return geometry; }
+	// Returns nullptr for an index outside [0, getMaterialCount()).
+	const Material* getMaterial(int index) const override
+	{
+		if (index < 0 || index >= (int)materials.size()) return nullptr;
+		return materials[index];
+	}
+	int getMaterialCount() const override { return (int)materials.size(); }
+
+	const GeometryData& getGeometryData() const override { return geometry ? static_cast<const GeometryData&>(*geometry) : geometry_data; }
+	const Skin* getSkin() const override { return geometry ? geometry->getSkin() : skin; }
+	const BlendShape* getBlendShape() const override { return geometry ? geometry->getBlendShape() : blendShape; }
+
+	const Pose* pose = nullptr;
+	const GeometryImpl* geometry = nullptr;
+	std::vector<const Material*> materials;
+	const Skin* skin = nullptr;
+	const BlendShape* blendShape = nullptr;
+
+	// old formats do not use Geometry nodes but embed vertex data directly in Mesh
+	GeometryDataImpl geometry_data;
+};
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+Material::Material(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Material object holding the texture slots, colors and scalar factors exposed by Material.
+// Every field has a defined (zero / null) initial value, so a getter never returns an
+// indeterminate value when a property was not assigned.
+// NOTE(review): zero is a neutral placeholder, not necessarily the format's documented
+// default for each property - confirm whether specific defaults are wanted.
+struct MaterialImpl : Material
+{
+	MaterialImpl(const Scene& _scene, const IElement& _element)
+		: Material(_scene, _element)
+	{
+	}
+
+	Type getType() const override { return Type::MATERIAL; }
+
+	const Texture* getTexture(Texture::TextureType type) const override { return textures[type]; }
+	Color getDiffuseColor() const override { return diffuse_color; }
+	Color getSpecularColor() const override { return specular_color; }
+	Color getReflectionColor() const override { return reflection_color; }
+	Color getAmbientColor() const override { return ambient_color; }
+	Color getEmissiveColor() const override { return emissive_color; }
+
+	double getDiffuseFactor() const override { return diffuse_factor; }
+	double getSpecularFactor() const override { return specular_factor; }
+	double getReflectionFactor() const override { return reflection_factor; }
+	double getShininess() const override { return shininess; }
+	double getShininessExponent() const override { return shininess_exponent; }
+	double getAmbientFactor() const override { return ambient_factor; }
+	double getBumpFactor() const override { return bump_factor; }
+	double getEmissiveFactor() const override { return emissive_factor; }
+
+	// One slot per Texture::TextureType; all slots start out null.
+	const Texture* textures[Texture::TextureType::COUNT] = {};
+	Color diffuse_color = {};
+	Color specular_color = {};
+	Color reflection_color = {};
+	Color ambient_color = {};
+	Color emissive_color = {};
+
+	double diffuse_factor = 0.0;
+	double specular_factor = 0.0;
+	double reflection_factor = 0.0;
+	double shininess = 0.0;
+	double shininess_exponent = 0.0;
+	double ambient_factor = 0.0;
+	double bump_factor = 0.0;
+	double emissive_factor = 0.0;
+};
+
+
+// Object reported as Type::LIMB_NODE; marked as a node on construction.
+struct LimbNodeImpl : Object
+{
+	LimbNodeImpl(const Scene& _scene, const IElement& _element) : Object(_scene, _element) { is_node = true; }
+
+	Type getType() const override { return Type::LIMB_NODE; }
+};
+
+
+// Object reported as Type::NULL_NODE; marked as a node on construction.
+struct NullImpl : Object
+{
+	NullImpl(const Scene& _scene, const IElement& _element) : Object(_scene, _element) { is_node = true; }
+
+	Type getType() const override { return Type::NULL_NODE; }
+};
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+NodeAttribute::NodeAttribute(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// NodeAttribute object that stores the attribute type as a view into the source data.
+struct NodeAttributeImpl : NodeAttribute
+{
+	NodeAttributeImpl(const Scene& _scene, const IElement& _element) : NodeAttribute(_scene, _element) {}
+
+	Type getType() const override { return Type::NODE_ATTRIBUTE; }
+
+	// Returns the stored view unchanged.
+	DataView getAttributeType() const override { return attribute_type; }
+
+	DataView attribute_type;
+};
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+Geometry::Geometry(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+Shape::Shape(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Blend-shape target: owns the vertex, normal and index arrays exposed through Shape.
+struct ShapeImpl : Shape {
+	std::vector<Vec3> vertices;
+	std::vector<Vec3> normals;
+	std::vector<int> indices;
+
+	ShapeImpl(const Scene& _scene, const IElement& _element)
+		: Shape(_scene, _element)
+	{}
+
+	bool postprocess(GeometryImpl& geom, Allocator& allocator);
+
+	Type getType() const override { return Type::SHAPE; }
+	int getVertexCount() const override { return (int)vertices.size(); }
+	int getIndexCount() const override { return (int)indices.size(); }
+	// All three array getters return nullptr when the array is empty; indexing element 0 of
+	// an empty vector would be undefined behavior.
+	const Vec3* getVertices() const override { return vertices.empty() ? nullptr : vertices.data(); }
+	const Vec3* getNormals() const override { return normals.empty() ? nullptr : normals.data(); }
+	const int* getIndices() const override { return indices.empty() ? nullptr : indices.data(); }
+};
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+Cluster::Cluster(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Skin cluster: the indices and weights read from its element, two transform matrices
+// and the linked object.
+struct ClusterImpl : Cluster
+{
+	ClusterImpl(const Scene& _scene, const IElement& _element)
+		: Cluster(_scene, _element)
+	{
+	}
+
+	// The array getters return nullptr for an empty array; indexing element 0 of an empty
+	// vector would be undefined behavior.
+	const int* getIndices() const override { return indices.empty() ? nullptr : indices.data(); }
+	int getIndicesCount() const override { return (int)indices.size(); }
+	const double* getWeights() const override { return weights.empty() ? nullptr : weights.data(); }
+	int getWeightsCount() const override { return (int)weights.size(); }
+	DMatrix getTransformMatrix() const override { return transform_matrix; }
+	DMatrix getTransformLinkMatrix() const override { return transform_link_matrix; }
+	Object* getLink() const override { return link; }
+
+	// Parses the "Indexes" and "Weights" children of the cluster element.
+	// Returns false when the cluster has no skin, when the skin is linked to neither a
+	// geometry nor a mesh, or when either array fails to parse.
+	bool postprocess() {
+		assert(skin);
+		// The assert vanishes in release builds; fail cleanly instead of dereferencing null.
+		if (!skin) return false;
+
+		// The owner itself is not needed here, only the fact that one exists.
+		if (!skin->resolveObjectLinkReverse(Object::Type::GEOMETRY)
+			&& !skin->resolveObjectLinkReverse(Object::Type::MESH))
+		{
+			return false;
+		}
+
+		const Element* indexes = findChild((const Element&)element, "Indexes");
+		if (indexes && indexes->first_property)
+		{
+			if (!parseVecData(*indexes->first_property, &indices)) return false;
+		}
+
+		const Element* weights_el = findChild((const Element&)element, "Weights");
+		if (weights_el && weights_el->first_property)
+		{
+			if (!parseVecData(*weights_el->first_property, &weights)) return false;
+		}
+
+		return true;
+	}
+
+
+	Object* link = nullptr;
+	Skin* skin = nullptr;
+	std::vector<int> indices;
+	std::vector<double> weights;
+	DMatrix transform_matrix;
+	DMatrix transform_link_matrix;
+	Type getType() const override { return Type::CLUSTER; }
+};
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+AnimationStack::AnimationStack(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+AnimationLayer::AnimationLayer(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+AnimationCurve::AnimationCurve(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+AnimationCurveNode::AnimationCurveNode(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Animation stack; its layers are looked up through the object's links.
+struct AnimationStackImpl : AnimationStack
+{
+	AnimationStackImpl(const Scene& _scene, const IElement& _element) : AnimationStack(_scene, _element) {}
+
+	Type getType() const override { return Type::ANIMATION_STACK; }
+
+	// Resolves the index-th AnimationLayer link of this stack.
+	const AnimationLayer* getLayer(int index) const override
+	{
+		const AnimationLayer* layer = resolveObjectLink<AnimationLayer>(index);
+		return layer;
+	}
+};
+
+
+// Animation curve stored as two arrays: key times and key values.
+struct AnimationCurveImpl : AnimationCurve
+{
+	AnimationCurveImpl(const Scene& _scene, const IElement& _element)
+		: AnimationCurve(_scene, _element)
+	{
+	}
+
+	// The key count is taken from the time array.
+	int getKeyCount() const override { return (int)times.size(); }
+	// Both array getters return nullptr for an empty array; indexing element 0 of an empty
+	// vector would be undefined behavior.
+	const i64* getKeyTime() const override { return times.empty() ? nullptr : times.data(); }
+	const float* getKeyValue() const override { return values.empty() ? nullptr : values.data(); }
+
+	std::vector<i64> times;
+	std::vector<float> values;
+	Type getType() const override { return Type::ANIMATION_CURVE; }
+};
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+Skin::Skin(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Skin deformer: a list of clusters.
+struct SkinImpl : Skin
+{
+	SkinImpl(const Scene& _scene, const IElement& _element)
+		: Skin(_scene, _element)
+	{
+	}
+
+	int getClusterCount() const override { return (int)clusters.size(); }
+	// Returns nullptr for an index outside [0, getClusterCount()).
+	const Cluster* getCluster(int idx) const override
+	{
+		if (idx < 0 || idx >= (int)clusters.size()) return nullptr;
+		return clusters[idx];
+	}
+
+	Type getType() const override { return Type::SKIN; }
+
+	std::vector<Cluster*> clusters;
+};
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+BlendShapeChannel::BlendShapeChannel(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Blend-shape channel: a deform percentage, optional full weights and the target shapes.
+struct BlendShapeChannelImpl : BlendShapeChannel
+{
+	BlendShapeChannelImpl(const Scene& _scene, const IElement& _element)
+		: BlendShapeChannel(_scene, _element)
+	{
+	}
+
+	double getDeformPercent() const override { return deformPercent; }
+	int getShapeCount() const override { return (int)shapes.size(); }
+	// Returns nullptr for an index outside [0, getShapeCount()).
+	const Shape* getShape(int idx) const override
+	{
+		if (idx < 0 || idx >= (int)shapes.size()) return nullptr;
+		return shapes[idx];
+	}
+
+	Type getType() const override { return Type::BLEND_SHAPE_CHANNEL; }
+
+	// Parses "DeformPercent" and "FullWeights" from the channel element, then post-processes
+	// every shape against the geometry the owning blend shape is linked to.
+	// Returns false when there is no owning blend shape, no linked geometry, a parse failure,
+	// or a shape that is null or fails its own postprocess.
+	bool postprocess(Allocator& allocator) {
+		assert(blendShape);
+		// The assert vanishes in release builds; fail cleanly instead of dereferencing null.
+		if (!blendShape) return false;
+
+		GeometryImpl* geom = (GeometryImpl*)blendShape->resolveObjectLinkReverse(Object::Type::GEOMETRY);
+		if (!geom) return false;
+
+		const Element* deform_percent_el = findChild((const Element&)element, "DeformPercent");
+		if (deform_percent_el && deform_percent_el->first_property)
+		{
+			if (!parseDouble(*deform_percent_el->first_property, &deformPercent)) return false;
+		}
+
+		const Element* full_weights_el = findChild((const Element&)element, "FullWeights");
+		if (full_weights_el && full_weights_el->first_property)
+		{
+			if (!parseVecData(*full_weights_el->first_property, &fullWeights)) return false;
+		}
+
+		for (Shape* entry : shapes)
+		{
+			ShapeImpl* shape = (ShapeImpl*)entry;
+			if (!shape || !shape->postprocess(*geom, allocator)) return false;
+		}
+
+		return true;
+	}
+
+
+	BlendShape* blendShape = nullptr;
+	double deformPercent = 0;
+	std::vector<double> fullWeights;
+	std::vector<Shape*> shapes;
+};
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+BlendShape::BlendShape(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Blend-shape deformer: a list of channels.
+struct BlendShapeImpl : BlendShape
+{
+	BlendShapeImpl(const Scene& _scene, const IElement& _element)
+		: BlendShape(_scene, _element)
+	{
+	}
+
+	int getBlendShapeChannelCount() const override { return (int)blendShapeChannels.size(); }
+	// Returns nullptr for an index outside [0, getBlendShapeChannelCount()).
+	const BlendShapeChannel* getBlendShapeChannel(int idx) const override
+	{
+		if (idx < 0 || idx >= (int)blendShapeChannels.size()) return nullptr;
+		return blendShapeChannels[idx];
+	}
+
+	Type getType() const override { return Type::BLEND_SHAPE; }
+
+	std::vector<BlendShapeChannel*> blendShapeChannels;
+};
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+Texture::Texture(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Forwards the scene and source element to the Object base; nothing else is set up here.
+Pose::Pose(const Scene& _scene, const IElement& _element) : Object(_scene, _element) {}
+
+
+// Pose entry: a matrix plus the node it applies to. The node is identified by `node_id`
+// and resolved to an object pointer in postprocess().
+struct PoseImpl : Pose
+{
+	PoseImpl(const Scene& _scene, const IElement& _element)
+		: Pose(_scene, _element)
+	{}
+
+	bool postprocess(Scene& scene);
+	DMatrix getMatrix() const override { return matrix; }
+	const Object* getNode() const override { return node; }
+	Type getType() const override { return Type::POSE; }
+
+	// Value-initialized so that getMatrix() and postprocess() never read indeterminate data
+	// when nothing assigned these fields.
+	// NOTE(review): an all-zero matrix is only a deterministic placeholder - confirm whether
+	// identity would be the better default.
+	DMatrix matrix = {};
+	Object* node = nullptr;
+	u64 node_id = 0;
+};
+
+
+// Texture object: views of the file name, the relative file name and the media name.
+struct TextureImpl : Texture
+{
+	TextureImpl(const Scene& _scene, const IElement& _element) : Texture(_scene, _element) {}
+
+	Type getType() const override { return Type::TEXTURE; }
+
+	DataView getFileName() const override { return filename; }
+	DataView getRelativeFileName() const override { return relative_filename; }
+	// Defined out of line.
+	DataView getEmbeddedData() const override;
+
+	DataView media;
+	DataView filename;
+	DataView relative_filename;
+};
+
+// Light object. Every property has an in-class default; the getters return the stored values.
+struct LightImpl : Light
+{
+	LightImpl(const Scene& _scene, const IElement& _element) : Light(_scene, _element) {}
+
+	// Stored light properties
+	//-------------------------------------------------------------------------
+	LightType lightType = LightType::POINT;
+	bool castLight = true;
+	Color color = {1, 1, 1}; // RGB
+	double intensity = 100.0;
+
+	double innerAngle = 0.0;
+	double outerAngle = 45.0;
+
+	double fog = 50;
+
+	DecayType decayType = DecayType::QUADRATIC;
+	double decayStart = 1.0;
+
+	bool enableNearAttenuation = false;
+	double nearAttenuationStart = 0.0;
+	double nearAttenuationEnd = 0.0;
+
+	bool enableFarAttenuation = false;
+	double farAttenuationStart = 0.0;
+	double farAttenuationEnd = 0.0;
+
+	const Texture* shadowTexture = nullptr;
+	bool castShadows = true;
+	Color shadowColor = {0, 0, 0};
+
+	// Identity
+	Type getType() const override { return Type::LIGHT; }
+	LightType getLightType() const override { return lightType; }
+
+	bool doesCastLight() const override { return castLight; }
+
+	// The three draw-* queries are not backed by stored data yet (WIP) and always report false.
+	bool doesDrawVolumetricLight() const override { return false; }
+	bool doesDrawGroundProjection() const override { return false; }
+	bool doesDrawFrontFacingVolumetricLight() const override { return false; }
+
+	// Emission
+	Color getColor() const override { return color; }
+	double getIntensity() const override { return intensity; }
+	double getInnerAngle() const override { return innerAngle; }
+	double getOuterAngle() const override { return outerAngle; }
+
+	double getFog() const override { return fog; }
+
+	// Decay
+	DecayType getDecayType() const override { return decayType; }
+	double getDecayStart() const override { return decayStart; }
+
+	// Near attenuation
+	bool doesEnableNearAttenuation() const override { return enableNearAttenuation; }
+	double getNearAttenuationStart() const override { return nearAttenuationStart; }
+	double getNearAttenuationEnd() const override { return nearAttenuationEnd; }
+
+	// Far attenuation
+	bool doesEnableFarAttenuation() const override { return enableFarAttenuation; }
+	double getFarAttenuationStart() const override { return farAttenuationStart; }
+	double getFarAttenuationEnd() const override { return farAttenuationEnd; }
+
+	// Shadows
+	const Texture* getShadowTexture() const override { return shadowTexture; }
+	bool doesCastShadows() const override { return castShadows; }
+	Color getShadowColor() const override { return shadowColor; }
+};
+
+// Pi as a single-precision value; used by CameraImpl::CalculateFOV to convert radians to degrees.
+// NOTE(review): this is a mutable, non-const float - confirm whether a const double was intended.
+static float OFBX_PI = 3.14159265358979323846f;
+// Camera object. Every property has an in-class default; CalculateFOV() derives the field
+// of view (in degrees) from the film size and focal length according to the aperture mode.
+struct CameraImpl : public Camera
+{
+	CameraImpl(const Scene& _scene, const IElement& _element) : Camera(_scene, _element) {}
+
+	ProjectionType projectionType = ProjectionType::PERSPECTIVE;
+	ApertureMode apertureMode = ApertureMode::HORIZONTAL; // selects the film dimension used for the FOV
+
+	double filmHeight = 36.0;
+	double filmWidth = 24.0;
+
+	double aspectHeight = 1.0;
+	double aspectWidth = 1.0;
+
+	double nearPlane = 0.1;
+	double farPlane = 1000.0;
+	bool autoComputeClipPanes = true;
+
+	GateFit gateFit = GateFit::HORIZONTAL;
+	double filmAspectRatio = 1.0;
+	double focalLength = 50.0;
+	double focusDistance = 50.0;
+
+	DVec3 backgroundColor = {0, 0, 0};
+	DVec3 interestPosition = {0, 0, 0};
+
+	double fieldOfView = 60.0;
+
+	Type getType() const override { return Type::CAMERA; }
+	ProjectionType getProjectionType() const override { return projectionType; }
+	ApertureMode getApertureMode() const override { return apertureMode; }
+
+	double getFilmHeight() const override { return filmHeight; }
+	double getFilmWidth() const override { return filmWidth; }
+
+	double getAspectHeight() const override { return aspectHeight; }
+	double getAspectWidth() const override { return aspectWidth; }
+
+	double getNearPlane() const override { return nearPlane; }
+	double getFarPlane() const override { return farPlane; }
+	bool doesAutoComputeClipPanes() const override { return autoComputeClipPanes; }
+
+	GateFit getGateFit() const override { return gateFit; }
+	double getFilmAspectRatio() const override { return filmAspectRatio; }
+	double getFocalLength() const override { return focalLength; }
+	double getFocusDistance() const override { return focusDistance; }
+
+	DVec3 getBackgroundColor() const override { return backgroundColor; }
+	DVec3 getInterestPosition() const override { return interestPosition; }
+
+	// Recomputes fieldOfView as 2 * atan(aperture / (2 * focalLength)) in degrees, where
+	// the aperture is the film width (HORIZONTAL), the film height (VERTICAL and FOCALLENGTH)
+	// or the film diagonal (HORIZANDVERT). Any other mode yields 60 degrees.
+	void CalculateFOV()
+	{
+		double aperture = 0.0;
+		switch (apertureMode)
+		{
+			case Camera::ApertureMode::HORIZONTAL:
+				aperture = filmWidth;
+				break;
+			case Camera::ApertureMode::VERTICAL:
+			case Camera::ApertureMode::FOCALLENGTH: // treated the same as VERTICAL
+				aperture = filmHeight;
+				break;
+			case Camera::ApertureMode::HORIZANDVERT:
+				aperture = sqrt(filmWidth * filmWidth + filmHeight * filmHeight);
+				break;
+			default:
+				fieldOfView =  60.0;
+				return;
+		}
+		fieldOfView =  2.0 * atan(aperture / (2.0 * focalLength)) * 180.0 / OFBX_PI;
+	}
+};
+
+// Root object of the scene: named "RootNode", marked as a node, reported as Type::ROOT.
+struct Root : Object
+{
+	Root(const Scene& _scene, const IElement& _element) : Object(_scene, _element)
+	{
+		is_node = true;
+		copyString(name, "RootNode");
+	}
+
+	Type getType() const override { return Type::ROOT; }
+};
+
+
+// IScene implementation: holds the element tree, the objects built from it and the typed
+// lookup lists that the accessors below expose.
+struct Scene : IScene
+{
+	// One connection record: the two object ids, the optional property names on either
+	// side, and which combination of object/property the record describes.
+	struct Connection
+	{
+		enum Type
+		{
+			OBJECT_OBJECT,
+			OBJECT_PROPERTY,
+			PROPERTY_OBJECT,
+			PROPERTY_PROPERTY,
+		};
+
+		Type type = OBJECT_OBJECT;
+		u64 from_object = 0;
+		u64 to_object = 0;
+		DataView from_property;
+		DataView to_property;
+	};
+
+	// Pairs a source element with the object created for it.
+	struct ObjectPair
+	{
+		const Element* element;
+		Object* object;
+	};
+
+
+	// --- counts ---------------------------------------------------------------
+	int getAnimationStackCount() const override { return (int)m_animation_stacks.size(); }
+	int getGeometryCount() const override { return (int)m_geometries.size(); }
+	int getMeshCount() const override { return (int)m_meshes.size(); }
+	int getCameraCount() const override { return (int)m_cameras.size(); }
+	int getLightCount() const override { return (int)m_lights.size(); }
+	int getAllObjectCount() const override { return (int)m_all_objects.size(); }
+	int getEmbeddedDataCount() const override { return (int)m_videos.size(); }
+
+	// --- scene-wide data --------------------------------------------------------
+	float getSceneFrameRate() const override { return m_scene_frame_rate; }
+	const GlobalSettings* getGlobalSettings() const override { return &m_settings; }
+	const IElement* getRootElement() const override { return m_root_element; }
+	const Object* getRoot() const override { return m_root; }
+
+	// Returns nullptr when the scene holds no objects.
+	const Object* const* getAllObjects() const override
+	{
+		if (m_all_objects.empty()) return nullptr;
+		return m_all_objects.data();
+	}
+
+	// --- embedded data (unchecked index) ----------------------------------------
+	DataView getEmbeddedData(int index) const override { return m_videos[index].content; }
+	bool isEmbeddedBase64(int index) const override { return m_videos[index].is_base_64; }
+	const IElementProperty* getEmbeddedBase64Data(int index) const override { return m_videos[index].base64_property; }
+	DataView getEmbeddedFilename(int index) const override { return m_videos[index].filename; }
+
+	// --- indexed lookups (index validity is only asserted) ----------------------
+	const AnimationStack* getAnimationStack(int index) const override
+	{
+		assert(index >= 0 && index < (int)m_animation_stacks.size());
+		return m_animation_stacks[index];
+	}
+
+	const Mesh* getMesh(int index) const override
+	{
+		assert(index >= 0 && index < (int)m_meshes.size());
+		return m_meshes[index];
+	}
+
+	const Geometry* getGeometry(int index) const override
+	{
+		assert(index >= 0 && index < (int)m_geometries.size());
+		return m_geometries[index];
+	}
+
+	const Camera* getCamera(int index) const override
+	{
+		assert(index >= 0 && index < (int)m_cameras.size());
+		return m_cameras[index];
+	}
+
+	const Light* getLight(int index) const override
+	{
+		assert(index >= 0 && index < (int)m_lights.size());
+		return m_lights[index];
+	}
+
+	// Returns the first take whose name equals `name`, or nullptr when none matches.
+	const TakeInfo* getTakeInfo(const char* name) const override
+	{
+		for (size_t i = 0; i < m_take_infos.size(); ++i)
+		{
+			const TakeInfo& candidate = m_take_infos[i];
+			if (candidate.name == name) return &candidate;
+		}
+		return nullptr;
+	}
+
+	// --- lifetime ---------------------------------------------------------------
+	void destroy() override { delete this; }
+
+	// Runs the destructor of every registered object explicitly; the objects are not deleted here.
+	~Scene() override {
+		for (size_t i = 0; i < m_all_objects.size(); ++i) {
+			m_all_objects[i]->~Object();
+		}
+	}
+
+	bool finalize();
+
+	Element* m_root_element = nullptr;
+	Root* m_root = nullptr;
+	float m_scene_frame_rate = -1;
+	GlobalSettings m_settings;
+
+	std::unordered_map<std::string, u64> m_fake_ids;
+	std::unordered_map<u64, ObjectPair> m_object_map;
+	std::vector<Object*> m_all_objects;
+	std::vector<Mesh*> m_meshes;
+	std::vector<Geometry*> m_geometries;
+	std::vector<AnimationStack*> m_animation_stacks;
+	std::vector<Camera*> m_cameras;
+	std::vector<Light*> m_lights;
+	std::vector<Connection> m_connections;
+	std::vector<u8> m_data;
+	std::vector<TakeInfo> m_take_infos;
+	std::vector<Video> m_videos;
+	Allocator m_allocator;
+	u32 version = 0;
+};
+
+// Binds the object to its scene and source element and derives its name.
+// For scene versions below 6200 the name is the first property when that property is a
+// string; otherwise it is the second property when one exists; otherwise the name is empty.
+Object::Object(const Scene& scene, const IElement& element)
+	: scene(scene)
+	, element(element)
+	, is_node(false)
+	, node_attribute(nullptr)
+{
+	Element& source = (Element&)element;
+	auto* first = source.first_property;
+
+	// Pick the property that carries the name, if any.
+	decltype(first) name_property = nullptr;
+	if (first && scene.version < 6200 && isString(first)) {
+		name_property = first;
+	}
+	else if (first && first->next) {
+		name_property = first->next;
+	}
+
+	if (name_property) {
+		name_property->value.toString(name);
+	}
+	else {
+		name[0] = '\0';
+	}
+}
+
+// Returns the content of the first scene video whose media name is byte-identical to this
+// texture's media name. Returns `media` itself when it has no data, and an empty view when
+// no video matches.
+DataView TextureImpl::getEmbeddedData() const {
+	if (!media.begin) return media;
+
+	const auto media_length = media.end - media.begin;
+	for (const Video& video : scene.m_videos) {
+		const auto video_length = video.media.end - video.media.begin;
+		const bool same_name = video_length == media_length
+			&& memcmp(video.media.begin, media.begin, (size_t)video_length) == 0;
+		if (same_name) return video.content;
+	}
+	return {};
+}
+
+
+// Resolves `node_id` to the object registered in the scene's object map and, when that
+// object is a mesh, registers this pose on it. Always returns true; an unknown id simply
+// leaves `node` null.
+bool PoseImpl::postprocess(Scene& scene) {
+	// Use find() rather than operator[]: operator[] would insert an empty entry into the
+	// object map for every id that is not present.
+	const auto found = scene.m_object_map.find(node_id);
+	node = (found != scene.m_object_map.end()) ? found->second.object : nullptr;
+	if (node && node->getType() == Object::Type::MESH) {
+		static_cast<MeshImpl*>(node)->pose = this;
+	}
+	return true;
+}
+
+
+// Curve node: up to three curves (one per component), the bone they drive and per-component
+// default values used when a component has no curve.
+struct AnimationCurveNodeImpl : AnimationCurveNode
+{
+	// Reads the default values from the "d|X", "d|Y" and "d|Z" properties (fifth property of
+	// each); components without such a property default to 0.
+	AnimationCurveNodeImpl(const Scene& _scene, const IElement& _element)
+		: AnimationCurveNode(_scene, _element)
+	{
+		default_values[0] = default_values[1] = default_values[2] =  0;
+		bool is_p60;
+		Element* dx = static_cast<Element*>(resolveProperty(*this, "d|X", &is_p60));
+		Element* dy = static_cast<Element*>(resolveProperty(*this, "d|Y", &is_p60));
+		Element* dz = static_cast<Element*>(resolveProperty(*this, "d|Z", &is_p60));
+
+		if (dx) {
+			Property* x = (Property*)dx->getProperty(4);
+			if (x) default_values[0] = (float)x->value.toDouble();
+		}
+		if (dy) {
+			Property* y = (Property*)dy->getProperty(4);
+			if (y) default_values[1] = (float)y->value.toDouble();
+		}
+		if (dz) {
+			Property* z = (Property*)dz->getProperty(4);
+			if (z) default_values[2] = (float)z->value.toDouble();
+		}
+	}
+
+
+	const Object* getBone() const override
+	{
+		return bone;
+	}
+
+	DataView getBoneLinkProperty() const override { return bone_link_property; }
+
+	// idx must be 0, 1 or 2 (asserted only).
+	const AnimationCurve* getCurve(int idx) const override {
+		assert(idx >= 0 && idx < 3);
+		return curves[idx].curve;
+	}
+
+
+	// Samples the three components at `time` (seconds). A component without a curve, or
+	// whose curve has no keys, yields its default value. The time is clamped to the curve's
+	// key range and the value is linearly interpolated between the neighbouring keys.
+	DVec3 getNodeLocalTransform(double time) const override
+	{
+		i64 fbx_time = secondsToFbxTime(time);
+
+		auto getCoord = [&](const Curve& curve, i64 fbx_time, int idx) {
+			if (!curve.curve) return default_values[idx];
+
+			// Check the key count before touching the arrays: an empty curve has nothing to read.
+			int count = curve.curve->getKeyCount();
+			if (count <= 0) return default_values[idx];
+
+			const i64* times = curve.curve->getKeyTime();
+			const float* values = curve.curve->getKeyValue();
+			if (!times || !values) return default_values[idx];
+
+			if (fbx_time < times[0]) fbx_time = times[0];
+			if (fbx_time > times[count - 1]) fbx_time = times[count - 1];
+			for (int i = 1; i < count; ++i)
+			{
+				if (times[i] >= fbx_time)
+				{
+					const i64 span = times[i] - times[i - 1];
+					// Two keys at the same time would give 0/0 below; take the earlier key's value.
+					if (span == 0) return values[i - 1];
+					float t = float(double(fbx_time - times[i - 1]) / double(span));
+					return values[i - 1] * (1 - t) + values[i] * t;
+				}
+			}
+			return values[0];
+		};
+
+		return {getCoord(curves[0], fbx_time, 0), getCoord(curves[1], fbx_time, 1), getCoord(curves[2], fbx_time, 2)};
+	}
+
+
+	// One component's curve together with the connection it came from.
+	struct Curve
+	{
+		const AnimationCurve* curve = nullptr;
+		const Scene::Connection* connection = nullptr;
+	};
+
+
+	Curve curves[3];
+	Object* bone = nullptr;
+	DataView bone_link_property;
+	Type getType() const override { return Type::ANIMATION_CURVE_NODE; }
+	float default_values[3];
+	enum Mode
+	{
+		TRANSLATION,
+		ROTATION,
+		SCALE
+	} mode = TRANSLATION;
+};
+
+
+// Animation layer: an ordered list of curve nodes, searchable by index or by bone/property.
+struct AnimationLayerImpl : AnimationLayer
+{
+	AnimationLayerImpl(const Scene& _scene, const IElement& _element) : AnimationLayer(_scene, _element) {}
+
+	Type getType() const override { return Type::ANIMATION_LAYER; }
+
+	// Returns nullptr for an index outside the list.
+	const AnimationCurveNode* getCurveNode(int index) const override
+	{
+		const bool in_range = index >= 0 && index < (int)curve_nodes.size();
+		return in_range ? curve_nodes[index] : nullptr;
+	}
+
+	// Returns the first curve node that has a link property equal to `prop` and drives
+	// `bone`, or nullptr when there is none.
+	const AnimationCurveNode* getCurveNode(const Object& bone, const char* prop) const override
+	{
+		for (size_t i = 0; i < curve_nodes.size(); ++i)
+		{
+			const AnimationCurveNodeImpl* candidate = curve_nodes[i];
+			if (!candidate->bone_link_property.begin) continue;
+			if (!(candidate->bone_link_property == prop)) continue;
+			if (candidate->bone != &bone) continue;
+			return candidate;
+		}
+		return nullptr;
+	}
+
+	std::vector<AnimationCurveNodeImpl*> curve_nodes;
+};
+
+/*
+	DEBUGGING ONLY (but I'm not your boss, so do what you want)
+	- maps the contents of the given node for viewing in the debugger
+	
+	std::map<std::string, ofbx::IElementProperty*, std::less<>> allProperties;
+	mapProperties(element, allProperties);
+*/
+// Debug helper: walks every descendant of `parent` depth-first and inserts one
+// entry per element into `propMap`. The key is the text of the element's first
+// property value, or of the element ID when it has no property; the mapped
+// value is the first property pointer (null when there is none).
+// std::map::insert keeps the existing entry when a key repeats.
+// NOTE(review): the key is written into a 32-byte buffer, so longer names are
+// presumably truncated by DataView::toString - confirm.
+void mapProperties(const ofbx::IElement& parent, std::map<std::string, ofbx::IElementProperty*, std::less<>>& propMap)
+{
+	for (const ofbx::IElement* element = parent.getFirstChild(); element; element = element->getSibling())
+	{
+		ofbx::IElementProperty* prop = element->getFirstProperty();
+
+		char key[32];
+		if (prop)
+			prop->getValue().toString(key);
+		else
+			element->getID().toString(key);
+
+		propMap.insert({key, prop});
+
+		if (element->getFirstChild()) mapProperties(*element, propMap);
+	}
+}
+
+
+// Appends a Video entry to scene.m_videos for a "Video" element. The element
+// is ignored unless its second property is a string, it has a "Content" child
+// with a first property, and a "Filename" child whose first property is a
+// string. Content that is not of BINARY type is flagged as base64: the
+// property following the first content property is kept and the content view
+// is left empty.
+void parseVideo(Scene& scene, const Element& element, Allocator& allocator)
+{
+	const Property* name_property = element.first_property;
+	if (!name_property || !name_property->next) return;
+	const Property* media_property = name_property->next;
+	if (media_property->getType() != IElementProperty::STRING) return;
+
+	const Element* content_element = findChild(element, "Content");
+	if (!content_element) return;
+	const Property* content_property = content_element->first_property;
+	if (!content_property) return;
+	const bool is_base64 = content_property->getType() != IElementProperty::BINARY;
+
+	const Element* filename_element = findChild(element, "Filename");
+	if (!filename_element) return;
+	const Property* filename_property = filename_element->first_property;
+	if (!filename_property) return;
+	if (filename_property->getType() != IElementProperty::STRING) return;
+
+	Video video;
+	video.is_base_64 = is_base64;
+	if (is_base64)
+	{
+		video.base64_property = content_property->next;
+		video.content = DataView{};
+	}
+	else
+	{
+		video.base64_property = nullptr;
+		video.content = content_property->value;
+	}
+	video.filename = filename_property->value;
+	video.media = media_property->value;
+	scene.m_videos.push_back(video);
+}
+
+// Queues decoding of the material indices found in the "LayerElementMaterial"
+// child of `element` into geom.materials. Returns true when the layer is
+// absent, when a ByPolygon/IndexToDirect index array was queued, or when the
+// mapping is "AllSame"; returns false for incomplete or unsupported layers.
+static bool parseGeometryMaterials(GeometryDataImpl& geom, const Element& element, std::vector<ParseDataJob> &jobs)
+{
+	const Element* layer = findChild(element, "LayerElementMaterial");
+	if (!layer) return true;
+
+	const Element* mapping = findChild(*layer, "MappingInformationType");
+	const Element* reference = findChild(*layer, "ReferenceInformationType");
+	if (!mapping || !reference) return false;
+	if (!mapping->first_property || !reference->first_property) return false;
+
+	const bool per_polygon_indexed =
+		mapping->first_property->value == "ByPolygon" && reference->first_property->value == "IndexToDirect";
+	if (!per_polygon_indexed)
+	{
+		// The only other accepted layout is a single material for the whole geometry.
+		if (mapping->first_property->value != "AllSame") return false;
+		return true;
+	}
+
+	const Element* indices = findChild(*layer, "Materials");
+	if (!indices || !indices->first_property) return false;
+	return pushJob(jobs, *indices->first_property, geom.materials);
+}
+
+// Visits every "LayerElementUV" sibling under `element` and queues its UV data
+// into geom.uvs[index], where index is the layer's first property (0 when the
+// layer has none). Layers whose index falls outside [0, Geometry::s_uvs_max)
+// are skipped. Returns false as soon as one layer fails to parse.
+static bool parseGeometryUVs(GeometryDataImpl& geom, const Element& element, std::vector<ParseDataJob> &jobs) {
+	for (const Element* layer = findChild(element, "LayerElementUV"); layer;) {
+		int uv_index = 0;
+		if (layer->first_property) uv_index = layer->first_property->getValue().toInt();
+
+		const bool slot_exists = uv_index >= 0 && uv_index < Geometry::s_uvs_max;
+		if (slot_exists) {
+			Vec2AttributesImpl& target = geom.uvs[uv_index];
+			if (!parseVertexData(*layer, "UV", "UVIndex", target, jobs)) return false;
+		}
+
+		// Step to the next sibling that is also a UV layer.
+		layer = layer->sibling;
+		while (layer && layer->id != "LayerElementUV") layer = layer->sibling;
+	}
+	return true;
+}
+
+// Queues tangent data into geom.tangents. Accepts both spellings of the layer
+// ("LayerElementTangents" first, then "LayerElementTangent") and of the data
+// arrays ("Tangents"/"TangentsIndex" when a "Tangents" child exists, otherwise
+// "Tangent"/"TangentIndex"). A geometry without a tangent layer is valid.
+static bool parseGeometryTangents(GeometryDataImpl& geom, const Element& element, std::vector<ParseDataJob> &jobs) {
+	const Element* layer = findChild(element, "LayerElementTangents");
+	if (!layer) {
+		layer = findChild(element, "LayerElementTangent");
+		if (!layer) return true;
+	}
+
+	const bool plural_names = findChild(*layer, "Tangents") != nullptr;
+	const char* data_name = plural_names ? "Tangents" : "Tangent";
+	const char* index_name = plural_names ? "TangentsIndex" : "TangentIndex";
+	return parseVertexData(*layer, data_name, index_name, geom.tangents, jobs);
+}
+
+// Queues vertex colours from the "LayerElementColor" child into geom.colors.
+// A geometry without that layer is valid and yields true.
+static bool parseGeometryColors(GeometryDataImpl& geom, const Element& element, std::vector<ParseDataJob> &jobs) {
+	if (const Element* layer = findChild(element, "LayerElementColor")) {
+		return parseVertexData(*layer, "Colors", "ColorIndex", geom.colors, jobs);
+	}
+	return true;
+}
+
+// Queues normals from the "LayerElementNormal" child into geom.normals.
+// A geometry without that layer is valid and yields true.
+static bool parseGeometryNormals(GeometryDataImpl& geom, const Element& element, std::vector<ParseDataJob> &jobs) {
+	if (const Element* layer = findChild(element, "LayerElementNormal")) {
+		return parseVertexData(*layer, "Normals", "NormalsIndex", geom.normals, jobs);
+	}
+	return true;
+}
+
+// Allocates a MeshImpl for `element` and queues decoding jobs for its inline
+// geometry. An element without properties is an error; an element without a
+// "Vertices" array yields a mesh with no geometry queued. Positions, polygon
+// indices, materials, UVs, tangents, colours and normals are queued in that order.
+struct OptionalError<Object*> parseMesh(const Scene& scene, const Element& element, std::vector<ParseDataJob> &jobs, Allocator& allocator) {
+	MeshImpl* mesh = allocator.allocate<MeshImpl>(scene, element);
+
+	if (!element.first_property) return Error("Invalid mesh");
+
+	const Element* vertices_element = findChild(element, "Vertices");
+	const bool has_vertices = vertices_element && vertices_element->first_property;
+	if (!has_vertices) return mesh;
+
+	const Element* polys_element = findChild(element, "PolygonVertexIndex");
+	const bool has_polys = polys_element && polys_element->first_property;
+	if (!has_polys) return Error("Indices missing");
+
+	auto& geometry = mesh->geometry_data;
+	if (!pushJob(jobs, *vertices_element->first_property, geometry.positions.values)) return Error("Invalid vertices");
+	if (!pushJob(jobs, *polys_element->first_property, geometry.positions.indices)) return Error("Invalid vertices");
+
+	if (!parseGeometryMaterials(geometry, element, jobs)) return Error("Invalid materials");
+
+	// Short-circuit evaluation stops at the first attribute layer that fails.
+	const bool attributes_ok = parseGeometryUVs(geometry, element, jobs)
+		&& parseGeometryTangents(geometry, element, jobs)
+		&& parseGeometryColors(geometry, element, jobs)
+		&& parseGeometryNormals(geometry, element, jobs);
+	if (!attributes_ok) return Error("Invalid vertex attributes");
+
+	return mesh;
+}
+
+// Allocates a TextureImpl for `element` and copies the first property value of
+// its "FileName", "Media" and "RelativeFilename" children, when present, into
+// the matching fields.
+struct OptionalError<Object*> parseTexture(const Scene& scene, const Element& element, Allocator& allocator)
+{
+	TextureImpl* texture = allocator.allocate<TextureImpl>(scene, element);
+
+	// Copies the first property value of the named child into `out`; does nothing
+	// when the child or its property is missing.
+	auto copyChildValue = [&element](const char* child_name, auto& out) {
+		const Element* child = findChild(element, child_name);
+		if (child && child->first_property) out = child->first_property->value;
+	};
+
+	copyChildValue("FileName", texture->filename);
+	copyChildValue("Media", texture->media);
+	copyChildValue("RelativeFilename", texture->relative_filename);
+	return texture;
+}
+
+// Allocates a LightImpl for `element`, fills it from the "P" records of the
+// element's "Properties70" child and appends it to scene.m_lights.
+// Recognised records: Color, ShadowColor, CastShadows, InnerAngle, OuterAngle
+// and Intensity, whose value(s) start at property index 4. A record too short
+// to carry its value(s) leaves the corresponding field untouched.
+struct OptionalError<Object*> parseLight(Scene& scene, const Element& element, Allocator& allocator)
+{
+	LightImpl* light = allocator.allocate<LightImpl>(scene, element);
+
+	light->lightType = static_cast<Light::LightType>(resolveEnumProperty(*light, "LightType", (int)Light::LightType::POINT));
+
+	// Reads `count` consecutive properties of `record`, starting at `first_idx`,
+	// as doubles. All-or-nothing: returns false when any of them is missing.
+	// NOTE(review): getProperty is presumed to return null past the end of the
+	// record - confirm.
+	auto readDoubles = [](const Element& record, int first_idx, int count, double* out) -> bool {
+		for (int i = 0; i < count; ++i)
+		{
+			auto* value = record.getProperty(first_idx + i);
+			if (!value) return false;
+			out[i] = value->getValue().toDouble();
+		}
+		return true;
+	};
+
+	const Element* prop = findChild(element, "Properties70");
+	if (prop) prop = prop->child;
+
+	double v[3];
+	for (; prop; prop = prop->sibling)
+	{
+		if (!(prop->id == "P") || !prop->first_property) continue;
+		const auto& name = prop->first_property->value;
+
+		if (name == "Color")
+		{
+			if (readDoubles(*prop, 4, 3, v))
+			{
+				light->color.r = (float)v[0];
+				light->color.g = (float)v[1];
+				light->color.b = (float)v[2];
+			}
+		}
+		else if (name == "ShadowColor")
+		{
+			if (readDoubles(*prop, 4, 3, v))
+			{
+				light->shadowColor.r = (float)v[0];
+				light->shadowColor.g = (float)v[1];
+				light->shadowColor.b = (float)v[2];
+			}
+		}
+		else if (name == "CastShadows")
+		{
+			if (auto* flag = prop->getProperty(4)) light->castShadows = flag->getValue().toBool();
+		}
+		else if (name == "InnerAngle")
+		{
+			if (readDoubles(*prop, 4, 1, v)) light->innerAngle = (float)v[0];
+		}
+		else if (name == "OuterAngle")
+		{
+			if (readDoubles(*prop, 4, 1, v)) light->outerAngle = (float)v[0];
+		}
+		else if (name == "Intensity")
+		{
+			if (readDoubles(*prop, 4, 1, v)) light->intensity = (float)v[0];
+		}
+	}
+
+	scene.m_lights.push_back(light);
+	return light;
+}
+
+// Allocates a CameraImpl for `element`, resolves its enum properties, fills
+// the remaining fields from the "P" records of the element's "Properties70"
+// child, calls CalculateFOV() and appends the camera to scene.m_cameras.
+// Record values start at property index 4. A record too short to carry its
+// value(s) leaves the corresponding field untouched.
+struct OptionalError<Object*> parseCamera(Scene& scene, const Element& element, Allocator& allocator)
+{
+	CameraImpl* camera = allocator.allocate<CameraImpl>(scene, element);
+
+	camera->projectionType = static_cast<Camera::ProjectionType>(resolveEnumProperty(*camera, "ProjectionType", (int)Camera::ProjectionType::PERSPECTIVE));
+	camera->apertureMode = static_cast<Camera::ApertureMode>(resolveEnumProperty(*camera, "ApertureMode", (int)Camera::ApertureMode::HORIZANDVERT));
+	camera->gateFit = static_cast<Camera::GateFit>(resolveEnumProperty(*camera, "GateFit", (int)Camera::GateFit::HORIZONTAL));
+
+	// Reads `count` consecutive properties of `record`, starting at `first_idx`,
+	// as doubles. All-or-nothing: returns false when any of them is missing.
+	// NOTE(review): getProperty is presumed to return null past the end of the
+	// record - confirm.
+	auto readDoubles = [](const Element& record, int first_idx, int count, double* out) -> bool {
+		for (int i = 0; i < count; ++i)
+		{
+			auto* value = record.getProperty(first_idx + i);
+			if (!value) return false;
+			out[i] = value->getValue().toDouble();
+		}
+		return true;
+	};
+
+	const Element* prop = findChild(element, "Properties70");
+	if (prop) prop = prop->child;
+
+	double v[3];
+	for (; prop; prop = prop->sibling)
+	{
+		if (!(prop->id == "P") || !prop->first_property) continue;
+		const auto& name = prop->first_property->value;
+
+		if (name == "InterestPosition")
+		{
+			if (readDoubles(*prop, 4, 3, v))
+			{
+				camera->interestPosition.x = (float)v[0];
+				camera->interestPosition.y = (float)v[1];
+				camera->interestPosition.z = (float)v[2];
+			}
+		}
+		else if (name == "BackgroundColor")
+		{
+			if (readDoubles(*prop, 4, 3, v))
+			{
+				camera->backgroundColor.x = (float)v[0];
+				camera->backgroundColor.y = (float)v[1];
+				camera->backgroundColor.z = (float)v[2];
+			}
+		}
+		else if (name == "FocalLength")
+		{
+			if (readDoubles(*prop, 4, 1, v)) camera->focalLength = v[0];
+		}
+		else if (name == "FocusDistance")
+		{
+			if (readDoubles(*prop, 4, 1, v)) camera->focusDistance = v[0];
+		}
+		else if (name == "FilmAspectRatio")
+		{
+			if (readDoubles(*prop, 4, 1, v)) camera->filmAspectRatio = v[0];
+		}
+		else if (name == "FilmWidth")
+		{
+			if (readDoubles(*prop, 4, 1, v)) camera->filmWidth = v[0];
+		}
+		else if (name == "FilmHeight")
+		{
+			if (readDoubles(*prop, 4, 1, v)) camera->filmHeight = v[0];
+		}
+		else if (name == "AspectHeight")
+		{
+			if (readDoubles(*prop, 4, 1, v)) camera->aspectHeight = v[0];
+		}
+		else if (name == "AspectWidth")
+		{
+			if (readDoubles(*prop, 4, 1, v)) camera->aspectWidth = v[0];
+		}
+		else if (name == "AutoComputeClipPanes")
+		{
+			if (auto* flag = prop->getProperty(4)) camera->autoComputeClipPanes = flag->getValue().toBool();
+		}
+		else if (name == "NearPlane")
+		{
+			if (readDoubles(*prop, 4, 1, v)) camera->nearPlane = v[0];
+		}
+		else if (name == "FarPlane")
+		{
+			if (readDoubles(*prop, 4, 1, v)) camera->farPlane = v[0];
+		}
+	}
+
+	camera->CalculateFOV();
+	scene.m_cameras.push_back(camera);
+	return camera;
+}
+
+// Looks up the object ID referenced by `property` without modifying `scene`.
+// Numeric properties are converted directly. String properties are resolved
+// through scene.m_fake_ids, except the name "Scene", which maps to ID 0 just
+// as in the non-const overload. Returns false (leaving *out untouched) when
+// `property` is null or names an object that has no ID yet.
+static bool toObjectID(const Scene& scene, const Property* property, u64* out) {
+	if (!property) return false;
+
+	if (!isString(property)) {
+		*out = property->value.toU64();
+		return true;
+	}
+
+	if (property->value == "Scene") {
+		// ID 0 is the root; report success instead of a bare `return 0` (== false).
+		*out = 0;
+		return true;
+	}
+
+	std::string tmp((const char*)property->value.begin, property->value.end - property->value.begin);
+	auto iter = scene.m_fake_ids.find(tmp);
+	if (iter == scene.m_fake_ids.end()) return false;
+
+	*out = iter->second;
+	return true;
+}
+
+
+// Returns the object ID referenced by `property`, creating one when needed.
+// Numeric properties are converted directly. For string properties "Scene"
+// maps to 0 and any other name is looked up in scene.m_fake_ids; an unknown
+// name is registered with the next free ID (map size + 1, since 0 is reserved
+// for the root).
+static u64 toObjectID(Scene& scene, const Property* property) {
+	if (!isString(property)) return property->value.toU64();
+	if (property->value == "Scene") return 0;
+
+	const char* text = (const char*)property->value.begin;
+	std::string name(text, property->value.end - property->value.begin);
+
+	const auto known = scene.m_fake_ids.find(name);
+	if (known != scene.m_fake_ids.end()) return known->second;
+
+	// The lookup above failed, so the insertion succeeds and the new map size equals fresh_id.
+	const auto fresh_id = scene.m_fake_ids.size() + 1; // ID 0 is reserved for root
+	scene.m_fake_ids.emplace(std::move(name), fresh_id);
+	return fresh_id;
+}
+
+// Allocates a PoseImpl for `element`. When a "PoseNode" child exists, its
+// "Matrix" (if present) is decoded into pose->matrix and the object referenced
+// by its "Node" child is stored in pose->node_id. Returns an error when the
+// matrix cannot be decoded.
+struct OptionalError<Object*> parsePose(Scene& scene, const Element& element, Allocator& allocator)
+{
+	PoseImpl* pose = allocator.allocate<PoseImpl>(scene, element);
+	const Element* pose_node = findChild(element, "PoseNode");
+	if (pose_node) {
+		const Element* node = findChild(*pose_node, "Node");
+		const Element* matrix = findChild(*pose_node, "Matrix");
+
+		if (matrix && matrix->first_property) {
+			if (!matrix->first_property->getValues(&pose->matrix.m[0], sizeof(pose->matrix))) {
+				return Error("Failed to parse pose");
+			}
+		}
+		// A malformed PoseNode may lack the "Node" child or its property;
+		// node_id is left untouched then, as it is when there is no PoseNode.
+		if (node && node->first_property) {
+			pose->node_id = toObjectID(scene, node->first_property);
+		}
+	}
+	return pose;
+}
+
+// Allocates a ClusterImpl for `element` and decodes its optional
+// "TransformLink" and "Transform" matrices. A matrix that is present but
+// cannot be decoded is an error; a missing one is left as constructed.
+static OptionalError<Object*> parseCluster(const Scene& scene, const Element& element, Allocator& allocator)
+{
+	ClusterImpl* obj = allocator.allocate<ClusterImpl>(scene, element);
+
+	const Element* link = findChild(element, "TransformLink");
+	const bool has_link = link && link->first_property;
+	if (has_link && !link->first_property->getValues(&obj->transform_link_matrix.m[0], sizeof(obj->transform_link_matrix)))
+	{
+		return Error("Failed to parse TransformLink");
+	}
+
+	const Element* transform = findChild(element, "Transform");
+	const bool has_transform = transform && transform->first_property;
+	if (has_transform && !transform->first_property->getValues(&obj->transform_matrix.m[0], sizeof(obj->transform_matrix)))
+	{
+		return Error("Failed to parse Transform");
+	}
+
+	return obj;
+}
+
+
+// Allocates a NodeAttributeImpl for `element` and records the first property
+// value of its "TypeFlags" child, when present, as the attribute type.
+static OptionalError<Object*> parseNodeAttribute(const Scene& scene, const Element& element, Allocator& allocator)
+{
+	NodeAttributeImpl* obj = allocator.allocate<NodeAttributeImpl>(scene, element);
+
+	const Element* type_flags = findChild(element, "TypeFlags");
+	const bool has_flags = type_flags && type_flags->first_property;
+	if (!has_flags) return obj;
+
+	obj->attribute_type = type_flags->first_property->value;
+	return obj;
+}
+
+
+// Allocates a MaterialImpl for `element` and fills it from the element's
+// property table. "Properties70" tables use "P" records with values starting
+// at property index 4; otherwise "Properties60" is used, with "Property"
+// records and values starting at index 3. The diffuse colour defaults to
+// white. A record too short to carry its value(s) leaves the field untouched.
+static OptionalError<Object*> parseMaterial(const Scene& scene, const Element& element, Allocator& allocator)
+{
+	MaterialImpl* material = allocator.allocate<MaterialImpl>(scene, element);
+	const char* property_id = "P";
+	int property_offset = 4;
+	const Element* prop = findChild(element, "Properties70");
+	if (!prop) {
+		property_id = "Property";
+		property_offset = 3;
+		prop = findChild(element, "Properties60");
+	}
+	material->diffuse_color = {1, 1, 1};
+	if (prop) prop = prop->child;
+
+	// Reads `count` consecutive properties of `record`, starting at `first_idx`,
+	// as doubles. All-or-nothing: returns false when any of them is missing.
+	// NOTE(review): getProperty is presumed to return null past the end of the
+	// record - confirm.
+	auto readDoubles = [](const Element& record, int first_idx, int count, double* out) -> bool {
+		for (int i = 0; i < count; ++i)
+		{
+			auto* value = record.getProperty(first_idx + i);
+			if (!value) return false;
+			out[i] = value->getValue().toDouble();
+		}
+		return true;
+	};
+
+	double v[3];
+	for (; prop; prop = prop->sibling)
+	{
+		if (!(prop->id == property_id) || !prop->first_property) continue;
+		const auto& name = prop->first_property->value;
+
+		if (name == "DiffuseColor")
+		{
+			if (readDoubles(*prop, property_offset, 3, v))
+			{
+				material->diffuse_color.r = (float)v[0];
+				material->diffuse_color.g = (float)v[1];
+				material->diffuse_color.b = (float)v[2];
+			}
+		}
+		else if (name == "SpecularColor")
+		{
+			if (readDoubles(*prop, property_offset, 3, v))
+			{
+				material->specular_color.r = (float)v[0];
+				material->specular_color.g = (float)v[1];
+				material->specular_color.b = (float)v[2];
+			}
+		}
+		else if (name == "Shininess")
+		{
+			if (readDoubles(*prop, property_offset, 1, v)) material->shininess = (float)v[0];
+		}
+		else if (name == "ShininessExponent")
+		{
+			if (readDoubles(*prop, property_offset, 1, v)) material->shininess_exponent = (float)v[0];
+		}
+		else if (name == "ReflectionColor")
+		{
+			if (readDoubles(*prop, property_offset, 3, v))
+			{
+				material->reflection_color.r = (float)v[0];
+				material->reflection_color.g = (float)v[1];
+				material->reflection_color.b = (float)v[2];
+			}
+		}
+		else if (name == "AmbientColor")
+		{
+			if (readDoubles(*prop, property_offset, 3, v))
+			{
+				material->ambient_color.r = (float)v[0];
+				material->ambient_color.g = (float)v[1];
+				material->ambient_color.b = (float)v[2];
+			}
+		}
+		else if (name == "EmissiveColor")
+		{
+			if (readDoubles(*prop, property_offset, 3, v))
+			{
+				material->emissive_color.r = (float)v[0];
+				material->emissive_color.g = (float)v[1];
+				material->emissive_color.b = (float)v[2];
+			}
+		}
+		else if (name == "ReflectionFactor")
+		{
+			if (readDoubles(*prop, property_offset, 1, v)) material->reflection_factor = (float)v[0];
+		}
+		else if (name == "BumpFactor")
+		{
+			if (readDoubles(*prop, property_offset, 1, v)) material->bump_factor = (float)v[0];
+		}
+		else if (name == "AmbientFactor")
+		{
+			if (readDoubles(*prop, property_offset, 1, v)) material->ambient_factor = (float)v[0];
+		}
+		else if (name == "DiffuseFactor")
+		{
+			if (readDoubles(*prop, property_offset, 1, v)) material->diffuse_factor = (float)v[0];
+		}
+		else if (name == "SpecularFactor")
+		{
+			if (readDoubles(*prop, property_offset, 1, v)) material->specular_factor = (float)v[0];
+		}
+		else if (name == "EmissiveFactor")
+		{
+			if (readDoubles(*prop, property_offset, 1, v)) material->emissive_factor = (float)v[0];
+		}
+	}
+	return material;
+}
+
+template <typename T> const char* fromString(const char* str, const char* end, T* val);
+// Stores the integer at the start of `str` (parsed with atoi, which does not
+// look at `end`) in *val and returns the position just past the next ',' in
+// [str, end), or the position where scanning stopped when there is none.
+template <> const char* fromString<int>(const char* str, const char* end, int* val)
+{
+	*val = atoi(str);
+	const char* cursor = str;
+	for (; cursor < end; ++cursor)
+	{
+		if (*cursor == ',') return cursor + 1; // resume after the separator
+	}
+	return cursor;
+}
+
+
+// Stores the unsigned integer at the start of `str` (parsed base 10 with
+// strtoull, which does not look at `end`) in *val and returns the position
+// just past the next ',' in [str, end), or where scanning stopped.
+template <> const char* fromString<u64>(const char* str, const char* end, u64* val)
+{
+	*val = strtoull(str, nullptr, 10);
+	const char* cursor = str;
+	for (; cursor < end; ++cursor)
+	{
+		if (*cursor == ',') return cursor + 1; // resume after the separator
+	}
+	return cursor;
+}
+
+
+// Stores the signed integer at the start of `str` (parsed with atoll, which
+// does not look at `end`) in *val and returns the position just past the next
+// ',' in [str, end), or where scanning stopped.
+template <> const char* fromString<i64>(const char* str, const char* end, i64* val)
+{
+	*val = atoll(str);
+	const char* cursor = str;
+	for (; cursor < end; ++cursor)
+	{
+		if (*cursor == ',') return cursor + 1; // resume after the separator
+	}
+	return cursor;
+}
+
+
+// Stores the number at the start of `str` (parsed with atof, which does not
+// look at `end`) in *val and returns the position just past the next ',' in
+// [str, end), or where scanning stopped.
+template <> const char* fromString<double>(const char* str, const char* end, double* val)
+{
+	*val = atof(str);
+	const char* cursor = str;
+	for (; cursor < end; ++cursor)
+	{
+		if (*cursor == ',') return cursor + 1; // resume after the separator
+	}
+	return cursor;
+}
+
+
+// Stores the number at the start of `str` (parsed with atof and narrowed to
+// float) in *val and returns the position just past the next ',' in
+// [str, end), or where scanning stopped.
+template <> const char* fromString<float>(const char* str, const char* end, float* val)
+{
+	*val = (float)atof(str);
+	const char* cursor = str;
+	for (; cursor < end; ++cursor)
+	{
+		if (*cursor == ',') return cursor + 1; // resume after the separator
+	}
+	return cursor;
+}
+
+
+// Parses up to `count` comma-separated numbers from [str, end) into val[0..].
+// Stops early once the cursor reaches `end`; entries not reached are left
+// untouched. Returns the position after the last consumed separator or value.
+const char* fromString(const char* str, const char* end, double* val, int count)
+{
+	const char* cursor = str;
+	for (int parsed = 0; parsed < count; ++parsed)
+	{
+		val[parsed] = atof(cursor);
+		for (; cursor < end && *cursor != ','; ++cursor) {}
+		if (cursor < end) ++cursor; // skip ','
+
+		if (cursor == end) break;
+	}
+	return cursor;
+}
+
+// Parses up to `count` comma-separated numbers from [str, end) into val[0..],
+// narrowing each to float. Stops early once the cursor reaches `end`; entries
+// not reached are left untouched. Returns the position after the last consumed
+// separator or value.
+const char* fromString(const char* str, const char* end, float* val, int count)
+{
+	const char* cursor = str;
+	for (int parsed = 0; parsed < count; ++parsed)
+	{
+		val[parsed] = (float)atof(cursor);
+		for (; cursor < end && *cursor != ','; ++cursor) {}
+		if (cursor < end) ++cursor; // skip ','
+
+		if (cursor == end) break;
+	}
+	return cursor;
+}
+
+// Vector and matrix specializations: each forwards to the counted scalar
+// overload, starting at the first component and reading 2, 3, 4 or 16 values.
+template <> const char* fromString<DVec2>(const char* str, const char* end, DVec2* val)
+{
+	auto* first_component = &val->x;
+	return fromString(str, end, first_component, 2);
+}
+
+template <> const char* fromString<FVec2>(const char* str, const char* end, FVec2* val)
+{
+	auto* first_component = &val->x;
+	return fromString(str, end, first_component, 2);
+}
+
+template <> const char* fromString<FVec3>(const char* str, const char* end, FVec3* val)
+{
+	auto* first_component = &val->x;
+	return fromString(str, end, first_component, 3);
+}
+
+template <> const char* fromString<DVec3>(const char* str, const char* end, DVec3* val)
+{
+	auto* first_component = &val->x;
+	return fromString(str, end, first_component, 3);
+}
+
+template <> const char* fromString<DVec4>(const char* str, const char* end, DVec4* val)
+{
+	auto* first_component = &val->x;
+	return fromString(str, end, first_component, 4);
+}
+
+template <> const char* fromString<FVec4>(const char* str, const char* end, FVec4* val)
+{
+	auto* first_component = &val->x;
+	return fromString(str, end, first_component, 4);
+}
+
+template <> const char* fromString<DMatrix>(const char* str, const char* end, DMatrix* val)
+{
+	auto* first_cell = &val->m[0];
+	return fromString(str, end, first_cell, 16);
+}
+
+
+// Parses the comma-separated text of `property` into out[0..]. `max_size_bytes`
+// is the capacity of `out` in bytes; returns false when the text holds more
+// values than fit, true once the whole text has been consumed.
+template <typename T> static bool parseMemoryText(const Property& property, T* out, int max_size_bytes) {
+	const char* const text_end = (const char*)property.value.end;
+	const int capacity = max_size_bytes / sizeof(T);
+	int written = 0;
+	for (const char* cursor = (const char*)property.value.begin; cursor < text_end; ++written) {
+		if (written >= capacity) return false;
+		T parsed;
+		cursor = fromString<T>(cursor, text_end, &parsed);
+		out[written] = parsed;
+	}
+	return true;
+}
+
+// Gathers a chain of scalar binary properties (types 'L', 'D', 'F' or 'I',
+// linked through `next`) into out[0..]. Each T is assembled from
+// sizeof(T) / elem_size consecutive properties, all of which must have the
+// type of the first one. Returns false for an unsupported type, when sizeof(T)
+// is not a multiple of the scalar size, when the chain ends in the middle of a
+// T, or when it holds more values than `max_size_bytes` allows.
+template <typename T> static bool parseMemoryLinked(const Property& property, T* out, int max_size_bytes) {
+	assert(out);
+	assert(property.value.is_binary);
+
+	int elem_size = 1;
+	switch (property.type) {
+		case 'L':
+		case 'D': elem_size = 8; break;
+		case 'F':
+		case 'I': elem_size = 4; break;
+		default: return false;
+	}
+
+	if (sizeof(T) % elem_size != 0) return false;
+
+	const int max_count = max_size_bytes / sizeof(T);
+	int count = 0;
+	for (const Property* p = &property; p; ++count) {
+		if (count == max_count) return false;
+
+		T assembled;
+		for (u32 part = 0; part < sizeof(T) / elem_size; ++part) {
+			if (!p || p->type != property.type) return false;
+
+			memcpy((u8*)&assembled + elem_size * part, p->value.begin, elem_size);
+			p = p->next;
+		}
+		out[count] = assembled;
+	}
+
+	return true;
+}
+
+template <typename T> struct TElemType; // Maps a value type to its scalar component type; only the types listed below are supported.
+template <> struct TElemType<float> { using Type = float; };
+template <> struct TElemType<double> { using Type = double; };
+template <> struct TElemType<int> { using Type = int; };
+template <> struct TElemType<i64> { using Type = i64; };
+template <> struct TElemType<u64> { using Type = u64; };
+template <> struct TElemType<DVec2> { using Type = double; }; // vector types map to the type of one component
+template <> struct TElemType<DVec3> { using Type = double; };
+template <> struct TElemType<DVec4> { using Type = double; };
+template <> struct TElemType<FVec2> { using Type = float; };
+template <> struct TElemType<FVec3> { using Type = float; };
+template <> struct TElemType<FVec4> { using Type = float; };
+
+template <typename T> bool typeMatch(u8 type); // True when property type code `type` stores scalars of type T, either as a single value or as an array.
+template <> bool typeMatch<int>(u8 type) { return type == Property::INTEGER || type == Property::ARRAY_INT; }
+template <> bool typeMatch<float>(u8 type) { return type == Property::FLOAT || type == Property::ARRAY_FLOAT; }
+template <> bool typeMatch<double>(u8 type) { return type == Property::DOUBLE || type == Property::ARRAY_DOUBLE; }
+template <> bool typeMatch<u64>(u8 type) { return type == Property::LONG || type == Property::ARRAY_LONG; } // u64 and i64 both accept the LONG codes
+template <> bool typeMatch<i64>(u8 type) { return type == Property::LONG || type == Property::ARRAY_LONG; }
+
+// Decodes the values of `property` into the caller-provided buffer `out` of
+// `max_size_bytes` bytes.
+//  - A property with zero values succeeds without touching `out`.
+//  - Text properties are delegated to parseMemoryText.
+//  - Scalar binary chains ('L', 'D', 'F', 'I') are delegated to parseMemoryLinked.
+//  - Binary arrays ('l', 'd', 'f', 'i') must fill the buffer exactly. The
+//    encoding is read at byte offset 4 and the payload length at offset 8; the
+//    payload starts at offset 12. Encoding 0 is copied verbatim, encoding 1 is
+//    passed to decompress().
+// Returns false on a type mismatch, a size mismatch, an unknown encoding or a
+// payload that does not fit inside the property.
+template <typename T>
+static bool parseMemory(const Property& property, T* out, int max_size_bytes) {
+	assert(out);
+	const u32 count = property.getCount();
+	if (count == 0) return true;
+
+	if (!property.value.is_binary) return parseMemoryText(property, out, max_size_bytes);
+
+	if (!typeMatch<typename TElemType<T>::Type>(property.type))
+		return false;
+	int elem_size = 1;
+	switch (property.type) {
+		case 'l': elem_size = 8; break;
+		case 'd': elem_size = 8; break;
+		case 'f': elem_size = 4; break;
+		case 'i': elem_size = 4; break;
+		case 'L':
+		case 'D':
+		case 'F':
+		case 'I':
+			return parseMemoryLinked(property, out, max_size_bytes);
+		default: return false;
+	}
+	if (count * elem_size != max_size_bytes) return false;
+	if (sizeof(T) % elem_size != 0) return false;
+
+	const u8* data = property.value.begin + sizeof(u32) * 3;
+	if (data > property.value.end) return false;
+
+	// Header fields are copied out with memcpy: the byte buffer gives no
+	// alignment guarantee for a direct u32 load.
+	u32 enc = 0;
+	u32 len = 0;
+	memcpy(&enc, property.value.begin + 4, sizeof(enc));
+	memcpy(&len, property.value.begin + 8, sizeof(len));
+
+	// The payload, raw or compressed, must lie entirely inside the property.
+	if (size_t(len) > size_t(property.value.end - data)) return false;
+
+	if (enc == 0) {
+		if ((int)len > max_size_bytes) return false;
+		memcpy(out, data, len);
+		return true;
+	}
+	else if (enc == 1) {
+		if (int(elem_size * count) > max_size_bytes) return false;
+		return decompress(data, len, (u8*)out, elem_size * count);
+	}
+
+	return false;
+}
+
+// Replaces the contents of *out with every comma-separated value found in the
+// text of `property`.
+template <typename T> static void parseTextArray(const Property& property, std::vector<T>* out)
+{
+	out->clear();
+	const char* const text_end = (const char*)property.value.end;
+	const char* cursor = (const char*)property.value.begin;
+	while (cursor < text_end)
+	{
+		T parsed;
+		cursor = fromString<T>(cursor, text_end, &parsed);
+		out->push_back(parsed);
+	}
+}
+
+// Appends to *out the values stored as a chain of scalar binary properties
+// (types 'L', 'D', 'F' or 'I', linked through `next`). Each T is assembled
+// from sizeof(T) / elem_size consecutive properties of the same type as the
+// first. Returns false for an unsupported type, when sizeof(T) is not a
+// multiple of the scalar size, or when the chain ends in the middle of a T.
+// Values appended before a failure stay in *out.
+template <typename T> static bool parseBinaryArrayLinked(const Property& property, std::vector<T>* out)
+{
+	assert(out);
+	assert(property.value.is_binary);
+
+	int elem_size = 1;
+	switch (property.type)
+	{
+		case 'L':
+		case 'D': elem_size = 8; break;
+		case 'F':
+		case 'I': elem_size = 4; break;
+		default: return false;
+	}
+
+	if (sizeof(T) % elem_size != 0) return false;
+
+	for (const Property* p = &property; p;) {
+		T assembled;
+		for (u32 part = 0; part < sizeof(T) / elem_size; ++part) {
+			if (!p || p->type != property.type) return false;
+
+			memcpy((u8*)&assembled + elem_size * part, p->value.begin, elem_size);
+			p = p->next;
+		}
+		out->push_back(assembled);
+	}
+
+	return true;
+}
+
+// Decodes `property` into *out. Text properties go through parseTextArray and
+// always succeed. Binary properties must match T's scalar type: scalar chains
+// ('L', 'D', 'F', 'I') go through parseBinaryArrayLinked, arrays
+// ('l', 'd', 'f', 'i') size the vector from the value count and are decoded
+// by parseMemory.
+template <typename T> static bool parseArray(const Property& property, std::vector<T>* out) {
+	assert(out);
+	if (!property.value.is_binary) {
+		parseTextArray(property, out);
+		return true;
+	}
+
+	if (!typeMatch<typename TElemType<T>::Type>(property.type)) return false;
+
+	int elem_size = 1;
+	switch (property.type)
+	{
+		case 'l':
+		case 'd': elem_size = 8; break;
+		case 'f':
+		case 'i': elem_size = 4; break;
+		case 'L':
+		case 'D':
+		case 'F':
+		case 'I':
+			return parseBinaryArrayLinked(property, out);
+		default: return false;
+	}
+
+	const u32 count = property.getCount();
+	out->resize(count * elem_size / sizeof(T));
+	if (count == 0) return true;
+
+	const int byte_capacity = int(sizeof((*out)[0]) * out->size());
+	return parseMemory(property, out->data(), byte_capacity);
+}
+
+// Decodes `property` into *out_vec, converting between float and double
+// storage when the file's scalar type differs from T's component type.
+// Text properties and binary properties of the matching scalar type are
+// decoded directly. Otherwise the raw float/double scalars are read into a
+// temporary and converted one by one; only whole elements are produced, so
+// trailing scalars that do not fill a complete T are dropped. Returns false
+// for any other property type or when decoding fails.
+template <typename T> static bool parseVecData(Property& property, std::vector<T>* out_vec) {
+	using ElemType = typename TElemType<T>::Type;
+	assert(out_vec);
+	if (!property.value.is_binary) {
+		parseTextArray(property, out_vec);
+		return true;
+	}
+
+	if (typeMatch<ElemType>(property.type)) return parseArray(property, out_vec);
+
+	// Reads the property as scalars of the sample's type and converts them to ElemType.
+	auto convertFrom = [&property, out_vec](auto stored_sample) -> bool {
+		using Stored = decltype(stored_sample);
+		std::vector<Stored> raw;
+		if (!parseArray(property, &raw)) return false;
+
+		const int scalars_per_elem = sizeof((*out_vec)[0]) / sizeof(ElemType);
+		out_vec->resize(raw.size() / scalars_per_elem);
+
+		// Bound the copy by the destination size: raw.size() may not be a
+		// multiple of scalars_per_elem, and writing all of it would overrun out_vec.
+		const int scalar_total = (int)out_vec->size() * scalars_per_elem;
+		ElemType* dst = (ElemType*)out_vec->data();
+		for (int i = 0; i < scalar_total; ++i) {
+			dst[i] = static_cast<ElemType>(raw[i]);
+		}
+		return true;
+	};
+
+	if (property.type == 'f' || property.type == 'F') return convertFrom(float());
+	if (property.type == 'd' || property.type == 'D') return convertFrom(double());
+
+	return false;
+}
+
+// Queues decoding of one vertex-attribute layer. `name` is the child holding
+// the values and `index_name` the child holding the optional index array.
+// "MappingInformationType", when present, must be ByPolygonVertex, ByPolygon,
+// ByVertice or ByVertex and is stored in out.mapping.
+// "ReferenceInformationType", when present, must be IndexToDirect (indices are
+// queued if the index child exists) or Direct. Returns false when the data
+// child is missing, a type is unsupported, or a job cannot be queued.
+template <typename T> static bool parseVertexData(const Element& element, const char* name, const char* index_name, T& out, std::vector<ParseDataJob>& jobs) {
+	const Element* data_element = findChild(element, name);
+	if (!data_element || !data_element->first_property) return false;
+
+	const Element* mapping_element = findChild(element, "MappingInformationType");
+	const Element* reference_element = findChild(element, "ReferenceInformationType");
+
+	if (mapping_element && mapping_element->first_property) {
+		auto& mapping = mapping_element->first_property->value;
+		if (mapping == "ByPolygonVertex") {
+			out.mapping = VertexDataMapping::BY_POLYGON_VERTEX;
+		} else if (mapping == "ByPolygon") {
+			out.mapping = VertexDataMapping::BY_POLYGON;
+		} else if (mapping == "ByVertice" || mapping == "ByVertex") {
+			out.mapping = VertexDataMapping::BY_VERTEX;
+		} else {
+			return false;
+		}
+	}
+
+	if (reference_element && reference_element->first_property) {
+		auto& reference = reference_element->first_property->value;
+		if (reference == "IndexToDirect") {
+			const Element* indices_element = findChild(element, index_name);
+			const bool has_indices = indices_element && indices_element->first_property;
+			if (has_indices && !pushJob(jobs, *indices_element->first_property, out.indices)) return false;
+		} else if (reference != "Direct") {
+			return false;
+		}
+	}
+
+	return pushJob(jobs, *data_element->first_property, out.values);
+}
+
+// Reads a single number from `property` into *out. Text properties are parsed
+// with fromString<double>. Binary properties must be of type 'D' (copied as a
+// double) or 'F' (read as a float and widened); any other binary type fails.
+static bool parseDouble(Property& property, double* out)
+{
+	assert(out);
+	if (!property.value.is_binary)
+	{
+		fromString<double>((const char*)property.value.begin, (const char*)property.value.end, out);
+		return true;
+	}
+
+	const u8* data = property.value.begin;
+	switch (property.type)
+	{
+		case 'D':
+		{
+			if (data > property.value.end) return false;
+			memcpy(out, data, sizeof(double));
+			return true;
+		}
+		case 'F':
+		{
+			if (data > property.value.end) return false;
+			// The payload is a 4-byte float: decode it as one, then widen.
+			// Copying its bytes straight into the double would produce garbage.
+			float narrow = 0.0f;
+			memcpy(&narrow, data, sizeof(narrow));
+			*out = narrow;
+			return true;
+		}
+		default: return false;
+	}
+}
+
+// Allocates an AnimationCurveImpl for `element` and loads its key times from
+// "KeyTime" and key values from "KeyValueFloat". Either child may be absent,
+// but the resulting arrays must have the same length; otherwise, or when an
+// array cannot be decoded, an error is returned.
+static OptionalError<Object*> parseAnimationCurve(const Scene& scene, const Element& element, Allocator& allocator)
+{
+	AnimationCurveImpl* curve = allocator.allocate<AnimationCurveImpl>(scene, element);
+
+	const Element* times = findChild(element, "KeyTime");
+	const Element* values = findChild(element, "KeyValueFloat");
+
+	if (times && times->first_property)
+	{
+		curve->times.resize(times->first_property->getCount());
+		// data() is valid on an empty vector, unlike &times[0].
+		if (!times->first_property->getValues(curve->times.data(), (int)curve->times.size() * sizeof(curve->times[0])))
+		{
+			return Error("Invalid animation curve");
+		}
+	}
+
+	if (values && values->first_property)
+	{
+		curve->values.resize(values->first_property->getCount());
+		if (!values->first_property->getValues(curve->values.data(), (int)curve->values.size() * sizeof(curve->values[0])))
+		{
+			return Error("Invalid animation curve");
+		}
+	}
+
+	if (curve->times.size() != curve->values.size()) return Error("Invalid animation curve");
+
+	return curve;
+}
+
+// Queues the data-parsing jobs for a mesh "Geometry" element into `jobs`,
+// targeting the attribute arrays of `geom`.
+// A geometry without a "Vertices" array is returned untouched; one that has
+// vertices but no "PolygonVertexIndex" array is an error. `allocator` is not
+// used by this function.
+static OptionalError<Object*> parseGeometry(const Element& element, GeometryImpl& geom, std::vector<ParseDataJob> &jobs, Allocator& allocator) {
+	assert(element.first_property);
+
+	const Element* const verts = findChild(element, "Vertices");
+	const bool has_vertices = verts != nullptr && verts->first_property != nullptr;
+	if (!has_vertices) return &geom;
+
+	const Element* const polys = findChild(element, "PolygonVertexIndex");
+	const bool has_polys = polys != nullptr && polys->first_property != nullptr;
+	if (!has_polys) return Error("Indices missing");
+
+	// Positions first: values from "Vertices", indices from "PolygonVertexIndex".
+	const bool positions_ok = pushJob(jobs, *verts->first_property, geom.positions.values)
+		&& pushJob(jobs, *polys->first_property, geom.positions.indices);
+	if (!positions_ok) return Error("Invalid vertices");
+
+	if (!parseGeometryMaterials(geom, element, jobs)) return Error("Invalid materials");
+
+	// The remaining attribute layers share one error message; the && chain
+	// stops at the first failure, exactly like sequential checks would.
+	const bool attributes_ok = parseGeometryUVs(geom, element, jobs)
+		&& parseGeometryTangents(geom, element, jobs)
+		&& parseGeometryColors(geom, element, jobs)
+		&& parseGeometryNormals(geom, element, jobs);
+	if (!attributes_ok) return Error("Invalid vertex attributes");
+
+	return &geom;
+}
+
+
+// Loads this shape's "Vertices", "Indexes" and (optional) "Normals" arrays
+// from its element into `vertices`, `indices` and `normals`.
+// Returns false when vertices or indexes are missing or any array fails to
+// parse. `geom` and `allocator` are not used by this function.
+bool ShapeImpl::postprocess(GeometryImpl& geom, Allocator& allocator) {
+	const Element& self = (const Element&)element;
+	const Element* vertices_element = findChild(self, "Vertices");
+	const Element* normals_element = findChild(self, "Normals");
+	const Element* indexes_element = findChild(self, "Indexes");
+	if (!vertices_element || !vertices_element->first_property ||
+		!indexes_element || !indexes_element->first_property)
+	{
+		return false;
+	}
+
+	if (!parseVecData(*vertices_element->first_property, &vertices)) return false;
+
+	// Normals are optional. A "Normals" element without a property is treated
+	// like a missing one instead of dereferencing a null property.
+	const bool has_normals = normals_element && normals_element->first_property;
+	if (has_normals && !parseVecData(*normals_element->first_property, &normals)) return false;
+
+	if (!parseVecData(*indexes_element->first_property, &indices)) return false;
+
+	return true;
+}
+
+// Reads every child of the root "Connections" element into scene.m_connections.
+// Each connection starts with a string kind followed by its arguments:
+//   "OO": from object, to object
+//   "OP": from object, to object, to property
+//   "PO": from object, from property, to object
+//   "PP": from object, from property, to object, to property
+// Returns false (with Error::s_message set) on a malformed or unsupported
+// connection. A missing "Connections" element is not an error.
+static bool parseConnections(const Element& root, Scene& scene)
+{
+	const Element* connections = findChild(root, "Connections");
+	if (!connections) return true;
+
+	scene.m_connections.reserve(1024);
+	for (const Element* connection = connections->child; connection; connection = connection->sibling)
+	{
+		Property* kind = connection->first_property;
+		if (!isString(kind) || !kind->next || !kind->next->next)
+		{
+			Error::s_message = "Invalid connection";
+			return false;
+		}
+
+		// arg1 and arg2 are guaranteed by the check above; arg3 and arg4 are
+		// only required by some connection kinds and may be null.
+		Property* arg1 = kind->next;
+		Property* arg2 = arg1->next;
+		Property* arg3 = arg2->next;
+		Property* arg4 = arg3 ? arg3->next : nullptr;
+
+		Scene::Connection c;
+		c.from_object = toObjectID(scene, arg1);
+		if (kind->value == "OO")
+		{
+			c.type = Scene::Connection::OBJECT_OBJECT;
+			c.to_object = toObjectID(scene, arg2);
+		}
+		else if (kind->value == "OP")
+		{
+			if (!arg3)
+			{
+				Error::s_message = "Invalid connection";
+				return false;
+			}
+			c.type = Scene::Connection::OBJECT_PROPERTY;
+			c.to_object = toObjectID(scene, arg2);
+			c.to_property = arg3->value;
+		}
+		else if (kind->value == "PO")
+		{
+			if (!arg3)
+			{
+				Error::s_message = "Invalid connection";
+				return false;
+			}
+			c.type = Scene::Connection::PROPERTY_OBJECT;
+			c.from_property = arg2->value;
+			c.to_object = toObjectID(scene, arg3);
+		}
+		else if (kind->value == "PP")
+		{
+			// Both trailing arguments must exist. Checking only the last one
+			// would dereference a null arg3 on a truncated connection.
+			if (!arg3 || !arg4)
+			{
+				Error::s_message = "Invalid connection";
+				return false;
+			}
+			c.type = Scene::Connection::PROPERTY_PROPERTY;
+			c.from_property = arg2->value;
+			c.to_object = toObjectID(scene, arg3);
+			c.to_property = arg4->value;
+		}
+		else
+		{
+			assert(false);
+			Error::s_message = "Not supported";
+			return false;
+		}
+		scene.m_connections.push_back(c);
+	}
+	return true;
+}
+
+
+// Reads every "Take" child of the root "Takes" element into scene.m_take_infos.
+// A take needs a string name; "FileName", "LocalTime" and "ReferenceTime" are
+// optional but must be well-formed when present. On malformed input the reason
+// is stored in Error::s_message and false is returned. A missing "Takes"
+// element is not an error.
+static bool parseTakes(Scene& scene)
+{
+	const Element* const takes_root = findChild((const Element&)*scene.getRootElement(), "Takes");
+	if (takes_root == nullptr) return true;
+
+	for (const Element* entry = takes_root->child; entry != nullptr; entry = entry->sibling)
+	{
+		// Children other than "Take" are skipped.
+		if (!(entry->id == "Take")) continue;
+
+		if (!isString(entry->first_property))
+		{
+			Error::s_message = "Invalid name in take";
+			return false;
+		}
+
+		TakeInfo info;
+		info.name = entry->first_property->value;
+
+		if (const Element* file_elem = findChild(*entry, "FileName"))
+		{
+			if (!isString(file_elem->first_property))
+			{
+				Error::s_message = "Invalid filename in take";
+				return false;
+			}
+			info.filename = file_elem->first_property->value;
+		}
+
+		if (const Element* local_elem = findChild(*entry, "LocalTime"))
+		{
+			// Two consecutive long properties: start and end of the range.
+			Property* const from = local_elem->first_property;
+			if (!isLong(from) || !isLong(from->next))
+			{
+				Error::s_message = "Invalid local time in take";
+				return false;
+			}
+			info.local_time_from = fbxTimeToSeconds(from->value.toI64());
+			info.local_time_to = fbxTimeToSeconds(from->next->value.toI64());
+		}
+
+		if (const Element* reference_elem = findChild(*entry, "ReferenceTime"))
+		{
+			Property* const from = reference_elem->first_property;
+			if (!isLong(from) || !isLong(from->next))
+			{
+				Error::s_message = "Invalid reference time in take";
+				return false;
+			}
+			info.reference_time_from = fbxTimeToSeconds(from->value.toI64());
+			info.reference_time_to = fbxTimeToSeconds(from->next->value.toI64());
+		}
+
+		scene.m_take_infos.push_back(info);
+	}
+
+	return true;
+}
+
+
+// Maps a FrameRate time mode to frames per second.
+// FrameRate_CUSTOM yields `custom_frame_rate`; a value that matches none of
+// the listed modes yields -1.
+static float getFramerateFromTimeMode(FrameRate time_mode, float custom_frame_rate)
+{
+	float fps = -1;
+	switch (time_mode)
+	{
+		case FrameRate_DEFAULT: fps = 14; break;
+		case FrameRate_120: fps = 120; break;
+		case FrameRate_100: fps = 100; break;
+		case FrameRate_60: fps = 60; break;
+		case FrameRate_50: fps = 50; break;
+		case FrameRate_48: fps = 48; break;
+		case FrameRate_30:
+		case FrameRate_30_DROP: fps = 30; break;
+		case FrameRate_NTSC_DROP_FRAME:
+		case FrameRate_NTSC_FULL_FRAME: fps = 29.9700262f; break;
+		case FrameRate_PAL: fps = 25; break;
+		case FrameRate_CINEMA: fps = 24; break;
+		case FrameRate_1000: fps = 1000; break;
+		case FrameRate_CINEMA_ND: fps = 23.976f; break;
+		case FrameRate_CUSTOM: fps = custom_frame_rate; break;
+	}
+	return fps;
+}
+
+
+// Copies the values found under "GlobalSettings" into scene->m_settings and
+// refreshes scene->m_scene_frame_rate.
+// Properties are read from "Properties70", falling back to "Properties60".
+// The value of each entry is taken from property index 3 for scene versions
+// <= 6100 and from index 4 otherwise. Does nothing when the settings element
+// or both property lists are missing.
+static void parseGlobalSettings(const Element& root, Scene* scene)
+{
+	const Element* settings = findChild(root, "GlobalSettings");
+	if (!settings) return;
+
+	const Element* props = findChild(*settings, "Properties70");
+	if (!props) props = findChild(*settings, "Properties60");
+	if (!props) return;
+
+	const int value_index = scene->version <= 6100 ? 3 : 4;
+	auto& out = scene->m_settings;
+
+	for (Element* node = props->child; node; node = node->sibling) {
+		if (!node->first_property) continue;
+
+		// When the entry is called `name` and carries a value property, stores
+		// that value in `value` and returns true; otherwise returns false.
+		DataView value;
+		auto fetch = [&](const char* name) -> bool {
+			if (!(node->first_property->value == name)) return false;
+			IElementProperty* prop = node->getProperty(value_index);
+			if (!prop) return false;
+			value = prop->getValue();
+			return true;
+		};
+
+		if (fetch("UpAxis")) out.UpAxis = (UpVector)value.toInt();
+		if (fetch("UpAxisSign")) out.UpAxisSign = (int)value.toInt();
+		if (fetch("FrontAxis")) out.FrontAxis = (int)value.toInt();
+		if (fetch("FrontAxisSign")) out.FrontAxisSign = (int)value.toInt();
+		if (fetch("CoordAxis")) out.CoordAxis = (CoordSystem)value.toInt();
+		if (fetch("CoordAxisSign")) out.CoordAxisSign = (int)value.toInt();
+		if (fetch("OriginalUpAxis")) out.OriginalUpAxis = (int)value.toInt();
+		if (fetch("OriginalUpAxisSign")) out.OriginalUpAxisSign = (int)value.toInt();
+		if (fetch("UnitScaleFactor")) out.UnitScaleFactor = (float)value.toDouble();
+		if (fetch("OriginalUnitScaleFactor")) out.OriginalUnitScaleFactor = (float)value.toDouble();
+		if (fetch("TimeSpanStart")) out.TimeSpanStart = fbxTimeToSeconds((u64)value.toU64());
+		if (fetch("TimeSpanStop")) out.TimeSpanStop = fbxTimeToSeconds((u64)value.toU64());
+		if (fetch("TimeMode")) out.TimeMode = (FrameRate)value.toInt();
+		if (fetch("CustomFrameRate")) out.CustomFrameRate = (float)value.toDouble();
+
+		// Recomputed per entry (not once after the loop) so the frame rate is
+		// only touched when at least one settings entry was visited.
+		scene->m_scene_frame_rate = getFramerateFromTimeMode(out.TimeMode, out.CustomFrameRate);
+	}
+}
+
+// Default JobProcessor: runs `fn` on the calling thread once for each of the
+// `count` jobs stored back to back at `data`, `size` bytes apart. The second
+// (user pointer) argument is ignored.
+void sync_job_processor(JobFunction fn, void*, void* data, u32 size, u32 count) {
+	u8* cursor = (u8*)data;
+	for (u32 remaining = count; remaining != 0; --remaining, cursor += size) {
+		fn(cursor);
+	}
+}
+
+// Builds the scene's objects from the root "Objects" element and links them
+// using the connections already stored in scene.m_connections.
+//
+// Steps, in order:
+//   1. register every child of "Objects" in scene.m_object_map by object ID;
+//   2. create one Object per registered element according to its element id
+//      and the LoadFlags bits in `flags`, queueing array parsing into `jobs`;
+//   3. run the queued parse jobs through `job_processor`;
+//   4. walk the connections and wire children to parents;
+//   5. unless IGNORE_GEOMETRY is set, run the postprocess step of the objects.
+//
+// `job_processor` may be null, in which case sync_job_processor is used;
+// `job_user_ptr` is forwarded to it unchanged.
+// Returns false on failure, usually with Error::s_message set. Returns true
+// without creating anything when the file has no "Objects" element.
+static bool parseObjects(const Element& root, Scene& scene, u16 flags, Allocator& allocator, JobProcessor job_processor, void* job_user_ptr) {
+	if (!job_processor) job_processor = &sync_job_processor;
+
+	// NOTE(review): ignore_skin, ignore_bones and ignore_pivots are decoded here
+	// but not referenced anywhere else in this function.
+	const bool ignore_geometry = (flags & (u16)LoadFlags::IGNORE_GEOMETRY) != 0;
+	const bool ignore_blend_shapes = (flags & (u16)LoadFlags::IGNORE_BLEND_SHAPES) != 0;
+	const bool ignore_cameras = (flags & (u16)LoadFlags::IGNORE_CAMERAS) != 0;
+	const bool ignore_lights = (flags & (u16)LoadFlags::IGNORE_LIGHTS) != 0;
+	const bool ignore_textures = (flags & (u16)LoadFlags::IGNORE_TEXTURES) != 0;
+	const bool ignore_skin = (flags & (u16)LoadFlags::IGNORE_SKIN) != 0;
+	const bool ignore_bones = (flags & (u16)LoadFlags::IGNORE_BONES) != 0;
+	const bool ignore_pivots = (flags & (u16)LoadFlags::IGNORE_PIVOTS) != 0;
+	const bool ignore_animations = (flags & (u16)LoadFlags::IGNORE_ANIMATIONS) != 0;
+	const bool ignore_materials = (flags & (u16)LoadFlags::IGNORE_MATERIALS) != 0;
+	const bool ignore_poses = (flags & (u16)LoadFlags::IGNORE_POSES) != 0;
+	const bool ignore_videos = (flags & (u16)LoadFlags::IGNORE_VIDEOS) != 0;
+	const bool ignore_limbs = (flags & (u16)LoadFlags::IGNORE_LIMBS) != 0;
+	const bool ignore_meshes = (flags & (u16)LoadFlags::IGNORE_MESHES) != 0;
+	const bool ignore_models = (flags & (u16)LoadFlags::IGNORE_MODELS) != 0;
+
+	const Element* objs = findChild(root, "Objects");
+	if (!objs) return true;
+
+	// The root object is registered under ID 0.
+	scene.m_root = allocator.allocate<Root>(scene, root);
+	scene.m_root->id = 0;
+	scene.m_object_map[0] = {&root, scene.m_root};
+
+	// Step 1: register each element that has a first property; the object
+	// itself is created in step 2.
+	const Element* object = objs->child;
+	while (object)
+	{
+		if (object->first_property) {
+			if (!isLong(object->first_property) && !isString(object->first_property))
+			{
+				Error::s_message = "Invalid ID";
+				return false;
+			}
+
+			u64 id = toObjectID(scene, object->first_property);
+			scene.m_object_map[id] = {object, nullptr};
+		}
+		object = object->sibling;
+	}
+
+	std::vector<ParseDataJob> jobs;
+
+	// Step 2: `iter` is a copy of the map entry, so results are written back
+	// through scene.m_object_map[iter.first] at the end of each iteration.
+	for (auto iter : scene.m_object_map)
+	{
+		OptionalError<Object*> obj = nullptr;
+
+		if (iter.second.object == scene.m_root) continue;
+
+		if (iter.second.element->id == "Geometry" && !ignore_geometry)
+		{
+			// The last property of the element selects Mesh or Shape.
+			Property* last_prop = iter.second.element->first_property;
+			while (last_prop->next) last_prop = last_prop->next;
+			if (last_prop && last_prop->value == "Mesh")
+			{
+				// NOTE(review): the result of parseGeometry is discarded, so an
+				// error it reports does not abort loading here.
+				GeometryImpl* geom = allocator.allocate<GeometryImpl>(scene, *iter.second.element);
+				parseGeometry(*iter.second.element, *geom, jobs, allocator);
+				obj = geom;
+				scene.m_geometries.push_back(geom);
+			}
+			else if (last_prop && last_prop->value == "Shape")
+			{
+				obj = allocator.allocate<ShapeImpl>(scene, *iter.second.element);
+			}
+		}
+		else if (iter.second.element->id == "Material" && !ignore_materials)
+		{
+			obj = parseMaterial(scene, *iter.second.element, allocator);
+		}
+		else if (iter.second.element->id == "AnimationStack" && !ignore_animations)
+		{
+			obj = allocator.allocate<AnimationStackImpl>(scene, *iter.second.element);
+			if (!obj.isError())
+			{
+				AnimationStackImpl* stack = (AnimationStackImpl*)obj.getValue();
+				scene.m_animation_stacks.push_back(stack);
+			}
+		}
+		else if (iter.second.element->id == "AnimationLayer" && !ignore_animations)
+		{
+			obj = allocator.allocate<AnimationLayerImpl>(scene, *iter.second.element);
+		}
+		else if (iter.second.element->id == "AnimationCurve" && !ignore_animations)
+		{
+			obj = parseAnimationCurve(scene, *iter.second.element, allocator);
+		}
+		else if (iter.second.element->id == "AnimationCurveNode" && !ignore_animations)
+		{
+			obj = allocator.allocate<AnimationCurveNodeImpl>(scene, *iter.second.element);
+		}
+		// All deformers (Cluster and Skin included) are gated on
+		// IGNORE_BLEND_SHAPES by this condition.
+		else if (iter.second.element->id == "Deformer" && !ignore_blend_shapes)
+		{
+			// The class name is read from property 2, falling back to property 1.
+			IElementProperty* class_prop = iter.second.element->getProperty(2);
+			if (!class_prop) class_prop = iter.second.element->getProperty(1);
+
+			if (class_prop)
+			{
+				if (class_prop->getValue() == "Cluster")
+					obj = parseCluster(scene, *iter.second.element, allocator);
+				else if (class_prop->getValue() == "Skin")
+					obj = allocator.allocate<SkinImpl>(scene, *iter.second.element);
+				else if (class_prop->getValue() == "BlendShape" && !ignore_blend_shapes)
+					obj = allocator.allocate<BlendShapeImpl>(scene, *iter.second.element);
+				else if (class_prop->getValue() == "BlendShapeChannel" && !ignore_blend_shapes)
+					obj = allocator.allocate<BlendShapeChannelImpl>(scene, *iter.second.element);
+			}
+		}
+		else if (iter.second.element->id == "NodeAttribute")
+		{
+			Property* last_prop = iter.second.element->first_property;
+			while (last_prop->next) last_prop = last_prop->next;
+			// NOTE(review): the loop above already dereferences last_prop, so it
+			// is non-null here and the else branch below looks unreachable.
+			if (last_prop)
+			{
+				if (last_prop->value == "Light" && !ignore_lights)
+				{
+					obj = parseLight(scene, *iter.second.element, allocator);
+				}
+				else if (last_prop->value == "Camera" && !ignore_cameras)
+				{
+					obj = parseCamera(scene, *iter.second.element, allocator);
+				}
+			}
+			else
+			{
+				obj = parseNodeAttribute(scene, *iter.second.element, allocator);
+			}
+		}
+		else if (iter.second.element->id == "Model" && !ignore_models)
+		{
+			IElementProperty* class_prop = iter.second.element->getProperty(2);
+			if (!class_prop) class_prop = iter.second.element->getProperty(1);
+
+			if (class_prop)
+			{
+				if (class_prop->getValue() == "Mesh" && !ignore_meshes)
+				{
+					obj = parseMesh(scene, *iter.second.element, jobs, allocator);
+					if (!obj.isError()) {
+						Mesh* mesh = (Mesh*)obj.getValue();
+						scene.m_meshes.push_back(mesh);
+						obj = mesh;
+					}
+				}
+				else if (class_prop->getValue() == "LimbNode" && !ignore_limbs)
+					obj = allocator.allocate<LimbNodeImpl>(scene, *iter.second.element);
+				else
+					// Any other model class (including Mesh/LimbNode when ignored)
+					// becomes a NullImpl node.
+					obj = allocator.allocate<NullImpl>(scene, *iter.second.element);
+			}
+		}
+		else if (iter.second.element->id == "Texture" && !ignore_textures)
+		{
+			obj = parseTexture(scene, *iter.second.element, allocator);
+		}
+		else if (iter.second.element->id == "Video" && !ignore_videos)
+		{
+			// The result is not assigned to obj, so no object is registered for
+			// a Video element in the map or in m_all_objects.
+			parseVideo(scene, *iter.second.element, allocator);
+		}
+		else if (iter.second.element->id == "Pose" && !ignore_poses)
+		{
+			obj = parsePose(scene, *iter.second.element, allocator);
+		}
+
+		if (obj.isError()) return false;
+
+		scene.m_object_map[iter.first].object = obj.getValue();
+		if (obj.getValue())
+		{
+			scene.m_all_objects.push_back(obj.getValue());
+			obj.getValue()->id = iter.first;
+		}
+	}
+
+	// Step 3: run every queued parse job, then check each one for failure.
+	if (!jobs.empty()) {
+		(*job_processor)([](void* ptr){
+			ParseDataJob* job = (ParseDataJob*)ptr;
+			job->error = !job->f(job->property, job->data);
+		}, job_user_ptr, &jobs[0], (u32)sizeof(jobs[0]), (u32)jobs.size());
+
+		for (const ParseDataJob& job : jobs) {
+			if (job.error) {
+				Error::s_message = "Failed to parse data";
+				return false;
+			}
+		}
+	}
+
+	// Step 4: link objects. For each connection, to_object is treated as the
+	// parent and from_object as the child; property-to-property connections
+	// are skipped. operator[] inserts an empty entry for IDs not yet in the map.
+	for (const Scene::Connection& con : scene.m_connections)
+	{
+		if (con.type == Scene::Connection::PROPERTY_PROPERTY) continue;
+
+		Object* parent = scene.m_object_map[con.to_object].object;
+		Object* child = scene.m_object_map[con.from_object].object;
+		if (!child) continue;
+		if (!parent) continue;
+
+		// Links decided by the type of the child.
+		switch (child->getType())
+		{
+			case Object::Type::NODE_ATTRIBUTE:
+				if (parent->node_attribute)
+				{
+					Error::s_message = "Invalid node attribute";
+					return false;
+				}
+				parent->node_attribute = (NodeAttribute*)child;
+				break;
+			case Object::Type::ANIMATION_CURVE_NODE:
+				if (parent->isNode())
+				{
+					AnimationCurveNodeImpl* node = (AnimationCurveNodeImpl*)child;
+					node->bone = parent;
+					node->bone_link_property = con.to_property;
+				}
+				break;
+			default: break;
+		}
+
+		// Links decided by the type of the parent.
+		switch (parent->getType())
+		{
+			case Object::Type::MESH:
+			{
+				MeshImpl* mesh = (MeshImpl*)parent;
+				if (child->getType() == Object::Type::SKIN)
+					mesh->skin = (Skin*)child;
+				else if (child->getType() == Object::Type::BLEND_SHAPE)
+					mesh->blendShape = (BlendShape*)child;
+
+				switch (child->getType())
+				{
+					case Object::Type::GEOMETRY:
+						// A mesh may be connected to only one geometry.
+						if (mesh->geometry)
+						{
+							Error::s_message = "Invalid mesh";
+							return false;
+						}
+						mesh->geometry = (GeometryImpl*)child;
+						break;
+					case Object::Type::MATERIAL: mesh->materials.push_back((Material*)child); break;
+					default: break;
+				}
+				break;
+			}
+			case Object::Type::SKIN:
+			{
+				SkinImpl* skin = (SkinImpl*)parent;
+				if (child->getType() == Object::Type::CLUSTER)
+				{
+					ClusterImpl* cluster = (ClusterImpl*)child;
+					skin->clusters.push_back(cluster);
+					// A cluster may belong to only one skin.
+					if (cluster->skin)
+					{
+						Error::s_message = "Invalid cluster";
+						return false;
+					}
+					cluster->skin = skin;
+				}
+				break;
+			}
+			case Object::Type::BLEND_SHAPE:
+			{
+				BlendShapeImpl* blendShape = (BlendShapeImpl*)parent;
+				if (child->getType() == Object::Type::BLEND_SHAPE_CHANNEL)
+				{
+					BlendShapeChannelImpl* blendShapeChannel = (BlendShapeChannelImpl*)child;
+					blendShape->blendShapeChannels.push_back(blendShapeChannel);
+					// A channel may belong to only one blend shape.
+					if (blendShapeChannel->blendShape)
+					{
+						Error::s_message = "Invalid blend shape";
+						return false;
+					}
+					blendShapeChannel->blendShape = blendShape;
+				}
+				break;
+			}
+			case Object::Type::BLEND_SHAPE_CHANNEL:
+			{
+				BlendShapeChannelImpl* blendShapeChannel = (BlendShapeChannelImpl*)parent;
+				if (child->getType() == Object::Type::SHAPE)
+				{
+					ShapeImpl* shape = (ShapeImpl*)child;
+					blendShapeChannel->shapes.push_back(shape);
+				}
+				break;
+			}
+			case Object::Type::MATERIAL:
+			{
+				MaterialImpl* mat = (MaterialImpl*)parent;
+				if (child->getType() == Object::Type::TEXTURE)
+				{
+					// The target property name selects the texture slot;
+					// unrecognised property names are ignored.
+					Texture::TextureType type = Texture::COUNT;
+					if (con.to_property == "NormalMap")
+						type = Texture::NORMAL;
+					else if (con.to_property == "DiffuseColor")
+						type = Texture::DIFFUSE;
+					else if (con.to_property == "SpecularColor")
+						type = Texture::SPECULAR;
+					else if (con.to_property == "ShininessExponent")
+						type = Texture::SHININESS;
+					else if (con.to_property == "EmissiveColor")
+						type = Texture::EMISSIVE;
+					else if (con.to_property == "AmbientColor")
+						type = Texture::AMBIENT;
+					else if (con.to_property == "ReflectionFactor")
+						type = Texture::REFLECTION;
+					if (type == Texture::COUNT) break;
+
+					if (mat->textures[type])
+					{
+						break; // This may happen for some models (eg. 2 normal maps in use)
+					}
+
+					mat->textures[type] = (Texture*)child;
+				}
+				break;
+			}
+			case Object::Type::GEOMETRY:
+			{
+				GeometryImpl* geom = (GeometryImpl*)parent;
+				if (child->getType() == Object::Type::SKIN)
+					geom->skin = (Skin*)child;
+				else if (child->getType() == Object::Type::BLEND_SHAPE)
+					geom->blendShape = (BlendShape*)child;
+				break;
+			}
+			case Object::Type::CLUSTER:
+			{
+				ClusterImpl* cluster = (ClusterImpl*)parent;
+				if (child->getType() == Object::Type::LIMB_NODE || child->getType() == Object::Type::MESH || child->getType() == Object::Type::NULL_NODE)
+				{
+					// Linking the same node again is accepted; a different one is
+					// an error.
+					if (cluster->link && cluster->link != child)
+					{
+						Error::s_message = "Invalid cluster";
+						return false;
+					}
+
+					cluster->link = child;
+				}
+				break;
+			}
+			case Object::Type::ANIMATION_LAYER:
+			{
+				if (child->getType() == Object::Type::ANIMATION_CURVE_NODE)
+				{
+					((AnimationLayerImpl*)parent)->curve_nodes.push_back((AnimationCurveNodeImpl*)child);
+				}
+			}
+			break;
+			case Object::Type::ANIMATION_CURVE_NODE:
+			{
+				AnimationCurveNodeImpl* node = (AnimationCurveNodeImpl*)parent;
+				if (child->getType() == Object::Type::ANIMATION_CURVE)
+				{
+					// "d|X", "d|Y" and "d|Z" select curve slots 0, 1 and 2; any
+					// other property name leaves the node unchanged.
+					char tmp[32];
+					con.to_property.toString(tmp);
+					if (strcmp(tmp, "d|X") == 0)
+					{
+						node->curves[0].connection = &con;
+						node->curves[0].curve = (AnimationCurve*)child;
+					}
+					else if (strcmp(tmp, "d|Y") == 0)
+					{
+						node->curves[1].connection = &con;
+						node->curves[1].curve = (AnimationCurve*)child;
+					}
+					else if (strcmp(tmp, "d|Z") == 0)
+					{
+						node->curves[2].connection = &con;
+						node->curves[2].curve = (AnimationCurve*)child;
+					}
+				}
+				break;
+			}
+			default: break;
+		}
+	}
+
+
+	// Step 5: postprocessing. The whole step, including blend shape channels
+	// and poses, is skipped when IGNORE_GEOMETRY is set.
+	if (!ignore_geometry) {
+		struct PostprocessJob {
+			Object* obj;
+			bool error = false;
+		};
+		std::vector<PostprocessJob> postprocess_jobs;
+		for (auto iter : scene.m_object_map)
+		{
+			Object* obj = iter.second.object;
+			if (!obj) continue;
+			switch (obj->getType()) {
+				// Clusters, geometries and meshes are queued for job_processor.
+				case Object::Type::CLUSTER:
+				case Object::Type::GEOMETRY:
+				case Object::Type::MESH:
+					postprocess_jobs.push_back({obj});
+					break;
+				// Blend shape channels and poses are postprocessed inline.
+				case Object::Type::BLEND_SHAPE_CHANNEL:
+					if (!((BlendShapeChannelImpl*)iter.second.object)->postprocess(scene.m_allocator)) {
+						Error::s_message = "Failed to postprocess blend shape channel";
+						return false;
+					}
+					break;
+				case Object::Type::POSE:
+					if (!((PoseImpl*)iter.second.object)->postprocess(scene)) {
+						Error::s_message = "Failed to postprocess pose";
+						return false;
+					}
+					break;
+				default: break;
+			}
+		}
+
+		if (!postprocess_jobs.empty()) {
+			(*job_processor)([](void* ptr){
+				PostprocessJob* job = (PostprocessJob*)ptr;
+				switch (job->obj->getType()) {
+					case Object::Type::CLUSTER: job->error = !((ClusterImpl*)job->obj)->postprocess(); break;
+					case Object::Type::GEOMETRY: job->error = !((GeometryImpl*)job->obj)->postprocess(); break;
+					case Object::Type::MESH: job->error = !((MeshImpl*)job->obj)->geometry_data.postprocess(); break;
+					default: break;
+				}
+			}, job_user_ptr, &postprocess_jobs[0], (u32)sizeof(postprocess_jobs[0]), (u32)postprocess_jobs.size());
+			for (const PostprocessJob& job : postprocess_jobs) if (job.error) {
+				Error::s_message = "Failed to postprocess object";
+				return false;
+			}
+		}
+	}
+
+	return true;
+}
+
+
+// Returns this object's "RotationOrder" property, resolved through
+// resolveEnumProperty, as a RotationOrder.
+RotationOrder Object::getRotationOrder() const
+{
+	// This assumes that the default rotation order is EULER_XYZ.
+	return (RotationOrder) resolveEnumProperty(*this, "RotationOrder", (int) RotationOrder::EULER_XYZ);
+}
+
+
+// Returns this object's "RotationOffset" property via resolveVec3Property;
+// {0, 0, 0} is passed as the third argument (presumably the fallback used when
+// the property is absent).
+DVec3 Object::getRotationOffset() const
+{
+	return resolveVec3Property(*this, "RotationOffset", {0, 0, 0});
+}
+
+
+// Returns this object's "RotationPivot" property via resolveVec3Property;
+// {0, 0, 0} is passed as the third argument (presumably the fallback used when
+// the property is absent).
+DVec3 Object::getRotationPivot() const
+{
+	return resolveVec3Property(*this, "RotationPivot", {0, 0, 0});
+}
+
+
+// Returns this object's "PostRotation" property via resolveVec3Property;
+// {0, 0, 0} is passed as the third argument (presumably the fallback used when
+// the property is absent).
+DVec3 Object::getPostRotation() const
+{
+	return resolveVec3Property(*this, "PostRotation", {0, 0, 0});
+}
+
+
+// Returns this object's "ScalingOffset" property via resolveVec3Property;
+// {0, 0, 0} is passed as the third argument (presumably the fallback used when
+// the property is absent).
+DVec3 Object::getScalingOffset() const
+{
+	return resolveVec3Property(*this, "ScalingOffset", {0, 0, 0});
+}
+
+
+// Returns this object's "ScalingPivot" property via resolveVec3Property;
+// {0, 0, 0} is passed as the third argument (presumably the fallback used when
+// the property is absent).
+DVec3 Object::getScalingPivot() const
+{
+	return resolveVec3Property(*this, "ScalingPivot", {0, 0, 0});
+}
+
+
+// Convenience overload: evaluates the local matrix for the given translation
+// and rotation, using this object's own local scaling (getLocalScaling()).
+DMatrix Object::evalLocal(const DVec3& translation, const DVec3& rotation) const
+{
+	return evalLocal(translation, rotation, getLocalScaling());
+}
+
+
+// Composes the local matrix for the given translation, rotation and scaling,
+// combined with this object's pre/post rotation, rotation offset/pivot and
+// scaling offset/pivot properties. The factor order follows the Autodesk
+// formula linked above the return statement.
+DMatrix Object::evalLocal(const DVec3& translation, const DVec3& rotation, const DVec3& scaling) const
+{
+	// Identity matrix with only its translation part set to `offset`.
+	const auto translationOf = [](const DVec3& offset) {
+		DMatrix result = makeIdentity();
+		setTranslation(offset, &result);
+		return result;
+	};
+
+	const DVec3 rot_pivot = getRotationPivot();
+	const DVec3 scale_pivot = getScalingPivot();
+
+	// Scale: identity with the diagonal replaced by the scaling factors.
+	DMatrix scale = makeIdentity();
+	scale.m[0] = scaling.x;
+	scale.m[5] = scaling.y;
+	scale.m[10] = scaling.z;
+
+	DMatrix move = translationOf(translation);
+
+	// Rotations: the animated rotation uses the object's own rotation order,
+	// pre-rotation uses XYZ and the inverse post-rotation uses ZYX.
+	DMatrix rot = getRotationMatrix(rotation, getRotationOrder());
+	DMatrix rot_pre = getRotationMatrix(getPreRotation(), RotationOrder::EULER_XYZ);
+	DMatrix rot_post_inv = getRotationMatrix(-getPostRotation(), RotationOrder::EULER_ZYX);
+
+	DMatrix rot_offset = translationOf(getRotationOffset());
+	DMatrix rot_pivot_m = translationOf(rot_pivot);
+	DMatrix rot_pivot_inv = translationOf(-rot_pivot);
+
+	DMatrix scale_offset = translationOf(getScalingOffset());
+	DMatrix scale_pivot_m = translationOf(scale_pivot);
+	DMatrix scale_pivot_inv = translationOf(-scale_pivot);
+
+	// http://help.autodesk.com/view/FBX/2017/ENU/?guid=__files_GUID_10CDD63C_79C1_4F2D_BB28_AD2BE65A02ED_htm
+	return move * rot_offset * rot_pivot_m * rot_pre * rot * rot_post_inv * rot_pivot_inv * scale_offset * scale_pivot_m * scale * scale_pivot_inv;
+}
+
+
+// Returns this object's "Lcl Translation" property via resolveVec3Property;
+// {0, 0, 0} is passed as the third argument (presumably the fallback used when
+// the property is absent).
+DVec3 Object::getLocalTranslation() const
+{
+	return resolveVec3Property(*this, "Lcl Translation", {0, 0, 0});
+}
+
+
+// Returns this object's "PreRotation" property via resolveVec3Property;
+// {0, 0, 0} is passed as the third argument (presumably the fallback used when
+// the property is absent).
+DVec3 Object::getPreRotation() const
+{
+	return resolveVec3Property(*this, "PreRotation", {0, 0, 0});
+}
+
+
+// Returns this object's "Lcl Rotation" property via resolveVec3Property;
+// {0, 0, 0} is passed as the third argument (presumably the fallback used when
+// the property is absent).
+DVec3 Object::getLocalRotation() const
+{
+	return resolveVec3Property(*this, "Lcl Rotation", {0, 0, 0});
+}
+
+
+// Returns this object's "Lcl Scaling" property via resolveVec3Property;
+// {1, 1, 1} (unit scale) is passed as the third argument (presumably the
+// fallback used when the property is absent).
+DVec3 Object::getLocalScaling() const
+{
+	return resolveVec3Property(*this, "Lcl Scaling", {1, 1, 1});
+}
+
+
+// Returns the object's local matrix (from its local translation and rotation)
+// pre-multiplied by the global transform of each ancestor, found by recursing
+// through getParent(). An object without a parent returns its local matrix.
+DMatrix Object::getGlobalTransform() const
+{
+	DMatrix local = evalLocal(getLocalTranslation(), getLocalRotation());
+
+	const Object* parent = getParent();
+	if (parent == nullptr) return local;
+
+	return parent->getGlobalTransform() * local;
+}
+
+
+// Returns the local matrix evaluated from this object's own local
+// translation, rotation and scaling properties.
+DMatrix Object::getLocalTransform() const
+{
+	return evalLocal(getLocalTranslation(), getLocalRotation(), getLocalScaling());
+}
+
+
+// Returns the first object of type `type` that this object is connected *to*
+// (this object is the connection's from_object), or nullptr when there is
+// none or when this object's ID cannot be resolved. Connections whose target
+// is ID 0 are ignored.
+Object* Object::resolveObjectLinkReverse(Object::Type type) const
+{
+	u64 id;
+	if (!toObjectID(scene, ((Element&)element).first_property, &id)) return nullptr;
+	for (auto& connection : scene.m_connections)
+	{
+		if (connection.from_object != id || connection.to_object == 0) continue;
+
+		// A connection may name an ID that was never registered in the object
+		// map; dereferencing end() would be undefined behaviour.
+		const auto found = scene.m_object_map.find(connection.to_object);
+		if (found == scene.m_object_map.end()) continue;
+
+		Object* obj = found->second.object;
+		if (obj && obj->getType() == type) return obj;
+	}
+	return nullptr;
+}
+
+
+// Returns the scene this object holds a reference to.
+const IScene& Object::getScene() const
+{
+	return scene;
+}
+
+
+// Returns the idx-th (0-based) existing object connected *to* this object
+// (this object is the connection's to_object), or nullptr when there are
+// fewer than idx + 1 such objects. Connections whose source is ID 0 are
+// ignored.
+Object* Object::resolveObjectLink(int idx) const
+{
+	// The toObjectID result is deliberately not checked here: on failure `id`
+	// stays 0, so the lookup falls back to connections targeting ID 0.
+	// NOTE(review): this looks like what lets the root object, registered under
+	// ID 0, list its children - confirm before making this strict.
+	u64 id = 0;
+	toObjectID(scene, ((Element&)element).first_property, &id);
+	for (auto& connection : scene.m_connections)
+	{
+		if (connection.to_object != id || connection.from_object == 0) continue;
+
+		// A connection may name an ID that was never registered in the object
+		// map; dereferencing end() would be undefined behaviour.
+		const auto found = scene.m_object_map.find(connection.from_object);
+		if (found == scene.m_object_map.end()) continue;
+
+		Object* obj = found->second.object;
+		if (obj)
+		{
+			if (idx == 0) return obj;
+			--idx;
+		}
+	}
+	return nullptr;
+}
+
+
+// Returns the idx-th (0-based) object of type `type` connected *to* this
+// object, optionally restricted to connections whose target property equals
+// `property` (pass nullptr to accept any). Returns nullptr when no such object
+// exists or when this object's ID cannot be resolved. Connections whose source
+// is ID 0 are ignored.
+Object* Object::resolveObjectLink(Object::Type type, const char* property, int idx) const
+{
+	u64 id;
+	if (!toObjectID(scene, ((Element&)element).first_property, &id)) return nullptr;
+	for (auto& connection : scene.m_connections)
+	{
+		if (connection.to_object != id || connection.from_object == 0) continue;
+
+		// A connection may name an ID that was never registered in the object
+		// map; dereferencing end() would be undefined behaviour.
+		const auto found = scene.m_object_map.find(connection.from_object);
+		if (found == scene.m_object_map.end()) continue;
+
+		Object* obj = found->second.object;
+		if (!obj || obj->getType() != type) continue;
+
+		if (property == nullptr || connection.to_property == property)
+		{
+			if (idx == 0) return obj;
+			--idx;
+		}
+	}
+	return nullptr;
+}
+
+
+// Establishes the node hierarchy after all objects have been created:
+//   1. for every object-to-object connection whose target is a node, the
+//      target becomes the parent of the source object;
+//   2. every object gets its depth (number of ancestors) assigned.
+// Returns false with "Cyclic node hierarchy" when a parent chain loops.
+bool Scene::finalize() {
+	for (const Connection& connection : m_connections) {
+		if (connection.type != Connection::OBJECT_OBJECT) continue;
+
+		// IDs that were never registered (for instance when the file has
+		// connections but no "Objects" element) must not be dereferenced.
+		const auto to_it = m_object_map.find(connection.to_object);
+		const auto from_it = m_object_map.find(connection.from_object);
+		if (to_it == m_object_map.end() || from_it == m_object_map.end()) continue;
+
+		Object* to_obj = to_it->second.object;
+		Object* from_obj = from_it->second.object;
+		if (!from_obj) continue;
+		if (!to_obj) continue;
+		if (!to_obj->is_node) continue;
+		from_obj->parent = to_obj;
+	}
+
+	// An acyclic chain can visit each object in m_all_objects once, plus the
+	// root object, which is not stored in that list.
+	const size_t max_chain_length = m_all_objects.size() + 1;
+
+	for (Object* object : m_all_objects) {
+		// 0xffFFffFF marks a depth that has not been computed yet.
+		if (object->depth != 0xffFFffFF) continue;
+		if (object->parent == object) {
+			Error::s_message = "Cyclic node hierarchy";
+			return false;
+		}
+		if (!object->parent) {
+			object->depth = 0;
+			continue;
+		}
+
+		object->depth = 0;
+
+		size_t steps = 0;
+		Object* parent = object->parent;
+		while (parent) {
+			// The length bound also catches a cycle further up the chain that
+			// does not pass through `object`; without it this loop would never
+			// terminate on such input.
+			if (parent == object || ++steps > max_chain_length) {
+				Error::s_message = "Cyclic node hierarchy";
+				return false;
+			}
+			++object->depth;
+			parent = parent->parent;
+		}
+
+		// Propagate the depths up the now-verified chain so the ancestors are
+		// not recomputed.
+		Object* p = object->parent;
+		Object* child = object;
+		while (p) {
+			p->depth = child->depth - 1;
+			child = p;
+			p = p->parent;
+		}
+	}
+	return true;
+}
+
+// Parses an FBX file held in memory and returns the resulting scene, or
+// nullptr on failure; getError() returns the last stored error message.
+//
+// data, size     - file contents; they are copied into the scene.
+// flags          - bitwise OR of LoadFlags values, passed on to parseObjects.
+// job_processor  - optional callback used to run parsing jobs; forwarded to
+//                  parseObjects together with job_user_ptr.
+//
+// Input starting with "Kaydara FBX Binary" is tokenized as binary FBX (minimum
+// version 6100); anything else is tokenized as text FBX.
+IScene* load(const u8* data, int size, u16 flags, JobProcessor job_processor, void* job_user_ptr)
+{
+	if (!data || size < 0)
+	{
+		Error::s_message = "Invalid input data";
+		return nullptr;
+	}
+
+	std::unique_ptr<Scene> scene(new Scene());
+	scene->m_data.resize(size);
+	// data() rather than &m_data[0]: indexing an empty vector is undefined.
+	u8* const buffer = scene->m_data.data();
+	if (size > 0) memcpy(buffer, data, size);
+
+	const bool is_binary = size >= 18 && strncmp((const char*)data, "Kaydara FBX Binary", 18) == 0;
+	OptionalError<Element*> root(nullptr);
+	if (is_binary) {
+		// Initialised so the version check below never reads an indeterminate
+		// value if the tokenizer bails out before storing the version.
+		u32 version = 0;
+		root = tokenize(buffer, size, version, scene->m_allocator);
+		scene->version = version;
+		if (version < 6100)
+		{
+			Error::s_message = "Unsupported FBX file format version. Minimum supported version is 6.1";
+			return nullptr;
+		}
+		if (root.isError())
+		{
+			// NOTE(review): this resets the stored error message before
+			// failing - confirm that dropping the tokenizer's diagnostic is
+			// intended.
+			Error::s_message = "";
+			return nullptr;
+		}
+	}
+	else {
+		root = tokenizeText(buffer, size, scene->m_allocator);
+		if (root.isError()) return nullptr;
+		const ofbx::Element* header = findChild(*root.getValue(), "FBXHeaderExtension");
+		if (header) {
+			// The header may lack an "FBXVersion" child; the scene version is
+			// then left at its existing value.
+			const ofbx::Element* version_elem = findChild(*header, "FBXVersion");
+			if (version_elem && version_elem->first_property) {
+				scene->version = version_elem->first_property->getValue().toU32();
+			}
+		}
+	}
+
+	scene->m_root_element = root.getValue();
+	assert(scene->m_root_element);
+
+	// Connections and takes are parsed before the objects: parseObjects links
+	// the objects through scene->m_connections.
+	// if (parseTemplates(*root.getValue()).isError()) return nullptr;
+	if (!parseConnections(*root.getValue(), *scene.get())) return nullptr;
+	if (!parseTakes(*scene.get())) return nullptr;
+	if (!parseObjects(*root.getValue(), *scene.get(), flags, scene->m_allocator, job_processor, job_user_ptr)) return nullptr;
+	parseGlobalSettings(*root.getValue(), scene.get());
+	if (!scene->finalize()) return nullptr;
+
+	return scene.release();
+}
+
+
+// Returns the most recently stored error message (Error::s_message).
+const char* getError()
+{
+	return Error::s_message;
+}
+
+
+} // namespace ofbx
diff --git a/Plugins/nosGeometry/External/openFBX/ofbx.h b/Plugins/nosGeometry/External/openFBX/ofbx.h
new file mode 100644
index 00000000..c1394b24
--- /dev/null
+++ b/Plugins/nosGeometry/External/openFBX/ofbx.h
@@ -0,0 +1,804 @@
+#pragma once
+
+
+namespace ofbx
+{
+
+
+typedef unsigned char u8;
+typedef unsigned short u16;
+typedef unsigned int u32;
+#ifdef _WIN32 // `long` is 32 bits wide on Windows, so the 64-bit aliases use `long long` there
+	typedef long long i64;
+	typedef unsigned long long u64;
+#else
+	typedef long i64;
+	typedef unsigned long u64;
+#endif
+
+static_assert(sizeof(u8) == 1, "u8 is not 1 byte");
+static_assert(sizeof(u16) == 2, "u16 is not 2 bytes"); // LoadFlags is backed by u16 and uses bit 15
+static_assert(sizeof(u32) == 4, "u32 is not 4 bytes");
+static_assert(sizeof(u64) == 8, "u64 is not 8 bytes");
+static_assert(sizeof(i64) == 8, "i64 is not 8 bytes");
+
+using JobFunction = void (*)(void*); // callback taking one opaque pointer
+using JobProcessor = void (*)(JobFunction, void*, void*, u32, u32); // optional hook passed to load(); argument meanings are not stated in this header - TODO confirm in ofbx.cpp
+
+// Bit flags for load() (passed as u16). Ignoring certain nodes only stops them from being processed, not tokenised (i.e. they will still be in the tree).
+enum class LoadFlags : u16
+{
+	NONE = 0,
+	UNUSED = 1 << 0, // can be reused
+	IGNORE_GEOMETRY = 1 << 1,
+	IGNORE_BLEND_SHAPES = 1 << 2,
+	IGNORE_CAMERAS = 1 << 3,
+	IGNORE_LIGHTS = 1 << 4,
+	IGNORE_TEXTURES = 1 << 5,
+	IGNORE_SKIN = 1 << 6,
+	IGNORE_BONES = 1 << 7,
+	IGNORE_PIVOTS = 1 << 8,
+	IGNORE_ANIMATIONS = 1 << 9,
+	IGNORE_MATERIALS = 1 << 10,
+	IGNORE_POSES = 1 << 11,
+	IGNORE_VIDEOS = 1 << 12,
+	IGNORE_LIMBS = 1 << 13,
+	IGNORE_MESHES = 1 << 14,
+	IGNORE_MODELS = 1 << 15, // highest bit of the u16 backing type
+};
+
+constexpr LoadFlags operator|(LoadFlags lhs, LoadFlags rhs) // bitwise union of two flag sets
+{
+	return static_cast<LoadFlags>(static_cast<u16>(lhs) | static_cast<u16>(rhs));
+}
+
+constexpr LoadFlags& operator|=(LoadFlags& lhs, LoadFlags rhs) // adds the bits of rhs to lhs and returns lhs
+{
+	return lhs = lhs | rhs;
+}
+
+struct DVec2 { double x, y; }; // double-precision value types
+struct DVec3 { double x, y, z; };
+struct DVec4 { double x, y, z, w; };
+struct DMatrix { double m[16]; /* last 4 are translation */ };
+struct DQuat{ double x, y, z, w; };
+
+struct FVec2 { float x, y; }; // single-precision counterparts of the types above
+struct FVec3 { float x, y, z; };
+struct FVec4 { float x, y, z, w; };
+struct FMatrix { float m[16]; };
+struct FQuat{ float x, y, z, w; };
+
+#define OFBX_SINGLE_PRECISION // always defined here, so the #else branch is only reachable by removing this line
+#ifdef OFBX_SINGLE_PRECISION
+	// use floats for vertices, normals, uvs, ...
+	using Vec2 = FVec2;
+	using Vec3 = FVec3;
+	using Vec4 = FVec4;
+	using Matrix = FMatrix;
+	using Quat = FQuat;
+#else
+	// use doubles for vertices, normals, uvs, ...
+	using Vec2 = DVec2;
+	using Vec3 = DVec3;
+	using Vec4 = DVec4;
+	using Matrix = DMatrix;
+	using Quat = DQuat;
+#endif
+
+struct Color
+{
+	float r, g, b;
+};
+
+// View over the byte range [begin, end); the struct has no destructor and never frees the bytes.
+struct DataView
+{
+	const u8* begin = nullptr;
+	const u8* end = nullptr;
+	bool is_binary = true;
+
+	bool operator!=(const char* rhs) const { return !(*this == rhs); }
+	bool operator==(const char* rhs) const;
+
+	u64 toU64() const;
+	i64 toI64() const;
+	int toInt() const;
+	u32 toU32() const;
+	bool toBool() const;
+	double toDouble() const;
+	float toFloat() const;
+
+	// Copies the viewed bytes into `out` as a NUL-terminated string, truncating to
+	// N - 1 characters when the view is longer than the buffer.
+	template <int N>
+	void toString(char(&out)[N]) const
+	{
+		int written = 0;
+		const int capacity = N - 1; // the last slot is reserved for the terminator
+		for (const u8* src = begin; src != end && written < capacity; ++src)
+		{
+			out[written++] = (char)*src;
+		}
+		out[written] = '\0';
+	}
+};
+
+// Abstract accessor for one element property; getNext() presumably yields the following property of the same element.
+struct IElementProperty
+{
+	enum Type : unsigned char // every enumerator is the character code of a one-letter type tag
+	{
+		LONG = 'L',
+		INTEGER = 'I',
+		STRING = 'S',
+		FLOAT = 'F',
+		DOUBLE = 'D',
+		ARRAY_DOUBLE = 'd',
+		ARRAY_INT = 'i',
+		ARRAY_LONG = 'l',
+		ARRAY_FLOAT = 'f',
+		BINARY = 'R',
+		NONE = ' '
+	};
+	virtual ~IElementProperty() {}
+	virtual Type getType() const = 0;
+	virtual IElementProperty* getNext() const = 0;
+	virtual DataView getValue() const = 0;
+	virtual int getCount() const = 0;
+	virtual bool getValues(double* values, int max_size) const = 0; // one overload per supported element type
+	virtual bool getValues(int* values, int max_size) const = 0;
+	virtual bool getValues(float* values, int max_size) const = 0;
+	virtual bool getValues(u64* values, int max_size) const = 0;
+	virtual bool getValues(i64* values, int max_size) const = 0;
+};
+
+// Abstract node of the element tree: exposes its first child, its sibling, an ID and its first property.
+struct IElement
+{
+    virtual ~IElement() = default;
+	virtual IElement* getFirstChild() const = 0;
+	virtual IElement* getSibling() const = 0;
+	virtual DataView getID() const = 0;
+	virtual IElementProperty* getFirstProperty() const = 0;
+};
+
+// Rotation order values returned by Object::getRotationOrder().
+enum class RotationOrder
+{
+	EULER_XYZ,
+	EULER_XZY,
+	EULER_YZX,
+	EULER_YXZ,
+	EULER_ZXY,
+	EULER_ZYX,
+	SPHERIC_XYZ // Currently unsupported. Treated as EULER_XYZ.
+};
+
+
+struct AnimationCurveNode;
+struct AnimationLayer;
+struct Scene;
+struct IScene;
+
+// Abstract base of the scene object types below; concrete kinds identify themselves through getType().
+struct Object
+{
+	enum class Type
+	{
+		ROOT,
+		GEOMETRY,
+		SHAPE,
+		MATERIAL,
+		MESH,
+		TEXTURE,
+		LIMB_NODE,
+		NULL_NODE,
+		CAMERA,
+		LIGHT,
+		NODE_ATTRIBUTE,
+		CLUSTER,
+		SKIN,
+		BLEND_SHAPE,
+		BLEND_SHAPE_CHANNEL,
+		ANIMATION_STACK,
+		ANIMATION_LAYER,
+		ANIMATION_CURVE,
+		ANIMATION_CURVE_NODE,
+		POSE
+	};
+
+	Object(const Scene& _scene, const IElement& _element);
+
+	virtual ~Object() {}
+	virtual Type getType() const = 0;
+
+	const IScene& getScene() const;
+	Object* resolveObjectLink(int idx) const;
+	Object* resolveObjectLink(Type type, const char* property, int idx) const;
+	Object* resolveObjectLinkReverse(Type type) const;
+	Object* getParent() const { return parent; }
+
+	RotationOrder getRotationOrder() const;
+	DVec3 getRotationOffset() const;
+	DVec3 getRotationPivot() const;
+	DVec3 getPostRotation() const;
+	DVec3 getScalingOffset() const;
+	DVec3 getScalingPivot() const;
+	DVec3 getPreRotation() const;
+	DVec3 getLocalTranslation() const;
+	DVec3 getLocalRotation() const;
+	DVec3 getLocalScaling() const;
+	DMatrix getGlobalTransform() const;
+	DMatrix getLocalTransform() const;
+	DMatrix evalLocal(const DVec3& translation, const DVec3& rotation) const;
+	DMatrix evalLocal(const DVec3& translation, const DVec3& rotation, const DVec3& scaling) const;
+	bool isNode() const { return is_node; }
+
+	// Typed overload: forwards T::s_type with a null property name, so T must declare a static s_type.
+	template <typename T> T* resolveObjectLink(int idx) const
+	{
+		return static_cast<T*>(resolveObjectLink(T::s_type, nullptr, idx));
+	}
+
+	u64 id;
+	u32 depth = 0xffFFffFF;
+	Object* parent = nullptr;
+	char name[128];
+	const IElement& element;
+	const Object* node_attribute; // no in-class initializer; presumably set by the constructor in ofbx.cpp - TODO confirm
+
+protected:
+	friend struct Scene;
+	bool is_node; // no in-class initializer; read through isNode()
+	const Scene& scene;
+};
+
+// Abstract interface for Type::POSE objects.
+struct Pose : Object {
+	static const Type s_type = Type::POSE;
+	Pose(const Scene& _scene, const IElement& _element);
+
+	virtual DMatrix getMatrix() const = 0;
+	virtual const Object* getNode() const = 0;
+};
+
+// Abstract interface for Type::TEXTURE objects; TextureType is the selector taken by Material::getTexture().
+struct Texture : Object
+{
+	enum TextureType
+	{
+		DIFFUSE,
+		NORMAL,
+		SPECULAR,
+        SHININESS,
+        AMBIENT,
+        EMISSIVE,
+        REFLECTION,
+		COUNT
+	};
+
+	static const Type s_type = Type::TEXTURE;
+
+	Texture(const Scene& _scene, const IElement& _element);
+	virtual DataView getFileName() const = 0;
+	virtual DataView getRelativeFileName() const = 0;
+	virtual DataView getEmbeddedData() const = 0;
+};
+// Abstract interface for light objects; every accessor below is pure virtual.
+struct Light : Object
+{
+	static const Type s_type = Type::LIGHT; // declared like the sibling types so Object::resolveObjectLink<Light>() can be instantiated
+
+	enum class LightType
+	{
+		POINT,
+		DIRECTIONAL,
+		SPOT,
+		AREA,
+		VOLUME,
+		COUNT
+	};
+
+	enum class DecayType
+	{
+		NO_DECAY,
+		LINEAR,
+		QUADRATIC,
+		CUBIC,
+		COUNT
+	};
+
+	Light(const Scene& _scene, const IElement& _element)
+		: Object(_scene, _element)
+	{
+	}
+
+	// Light type
+	virtual LightType getLightType() const = 0;
+
+	// Light properties
+	virtual bool doesCastLight() const = 0;
+	virtual bool doesDrawVolumetricLight() const = 0;
+	virtual bool doesDrawGroundProjection() const = 0;
+	virtual bool doesDrawFrontFacingVolumetricLight() const = 0;
+	virtual Color getColor() const = 0;
+	virtual double getIntensity() const = 0;
+	virtual double getInnerAngle() const = 0;
+	virtual double getOuterAngle() const = 0;
+	virtual double getFog() const = 0;
+	virtual DecayType getDecayType() const = 0;
+	virtual double getDecayStart() const = 0;
+
+	// Near attenuation
+	virtual bool doesEnableNearAttenuation() const = 0;
+	virtual double getNearAttenuationStart() const = 0;
+	virtual double getNearAttenuationEnd() const = 0;
+
+	// Far attenuation
+	virtual bool doesEnableFarAttenuation() const = 0;
+	virtual double getFarAttenuationStart() const = 0;
+	virtual double getFarAttenuationEnd() const = 0;
+
+	// Shadows
+	virtual const Texture* getShadowTexture() const = 0;
+	virtual bool doesCastShadows() const = 0;
+	virtual Color getShadowColor() const = 0;
+};
+
+struct Camera : Object // abstract interface for Type::CAMERA objects
+{
+	enum class ProjectionType
+	{
+		PERSPECTIVE,
+		ORTHOGRAPHIC,
+		COUNT
+	};
+
+	enum class ApertureMode // Used to determine how to calculate the FOV
+	{
+		HORIZANDVERT,
+		HORIZONTAL,
+		VERTICAL,
+		FOCALLENGTH,
+		COUNT
+	};
+
+	enum class GateFit
+	{
+		NONE,
+		VERTICAL,
+		HORIZONTAL,
+		FILL,
+		OVERSCAN,
+		STRETCH,
+		COUNT
+	};
+
+	static const Type s_type = Type::CAMERA;
+
+	Camera(const Scene& _scene, const IElement& _element)
+		: Object(_scene, _element)
+	{
+	}
+
+	virtual Type getType() const { return Type::CAMERA; } // implements Object::getType() for all cameras
+	virtual ProjectionType getProjectionType() const = 0;
+	virtual ApertureMode getApertureMode() const = 0;
+
+	virtual double getFilmHeight() const = 0;
+	virtual double getFilmWidth() const = 0;
+
+	virtual double getAspectHeight() const = 0;
+	virtual double getAspectWidth() const = 0;
+
+	virtual double getNearPlane() const = 0;
+	virtual double getFarPlane() const = 0;
+	virtual bool doesAutoComputeClipPanes() const = 0; // NOTE(review): "Panes" looks like a typo for "Planes"; renaming would break implementers
+
+	virtual GateFit getGateFit() const = 0;
+	virtual double getFilmAspectRatio() const = 0;
+	virtual double getFocalLength() const = 0;
+	virtual double getFocusDistance() const = 0;
+
+	virtual DVec3 getBackgroundColor() const = 0;
+	virtual DVec3 getInterestPosition() const = 0;
+};
+
+struct Material : Object // abstract interface for Type::MATERIAL objects
+{
+	static const Type s_type = Type::MATERIAL;
+
+	Material(const Scene& _scene, const IElement& _element);
+
+	virtual Color getDiffuseColor() const = 0;
+	virtual Color getSpecularColor() const = 0;
+    virtual Color getReflectionColor() const = 0;
+    virtual Color getAmbientColor() const = 0;
+    virtual Color getEmissiveColor() const = 0;
+
+    virtual double getDiffuseFactor() const = 0;
+    virtual double getSpecularFactor() const = 0;
+    virtual double getReflectionFactor() const = 0;
+    virtual double getShininess() const = 0;
+    virtual double getShininessExponent() const = 0;
+    virtual double getAmbientFactor() const = 0;
+    virtual double getBumpFactor() const = 0;
+    virtual double getEmissiveFactor() const = 0;
+
+	virtual const Texture* getTexture(Texture::TextureType type) const = 0; // one texture pointer per TextureType slot
+};
+
+// Abstract interface for Type::CLUSTER objects: index/weight arrays, two matrices and a linked object.
+struct Cluster : Object
+{
+	static const Type s_type = Type::CLUSTER;
+
+	Cluster(const Scene& _scene, const IElement& _element);
+
+	virtual const int* getIndices() const = 0;
+	virtual int getIndicesCount() const = 0;
+	virtual const double* getWeights() const = 0;
+	virtual int getWeightsCount() const = 0;
+	virtual DMatrix getTransformMatrix() const = 0;
+	virtual DMatrix getTransformLinkMatrix() const = 0;
+	virtual const Object* getLink() const = 0;
+};
+
+// Abstract interface for Type::SKIN objects: an indexed collection of Cluster objects.
+struct Skin : Object
+{
+	static const Type s_type = Type::SKIN;
+
+	Skin(const Scene& _scene, const IElement& _element);
+
+	virtual int getClusterCount() const = 0;
+	virtual const Cluster* getCluster(int idx) const = 0;
+};
+
+// Abstract interface for Type::BLEND_SHAPE_CHANNEL objects: a deform percentage plus an indexed list of Shape objects.
+struct BlendShapeChannel : Object
+{
+	static const Type s_type = Type::BLEND_SHAPE_CHANNEL;
+
+	BlendShapeChannel(const Scene& _scene, const IElement& _element);
+
+	virtual double getDeformPercent() const = 0;
+	virtual int getShapeCount() const = 0;
+	virtual const struct Shape* getShape(int idx) const = 0;
+};
+
+// Abstract interface for Type::BLEND_SHAPE objects: an indexed collection of BlendShapeChannel objects.
+struct BlendShape : Object
+{
+	static const Type s_type = Type::BLEND_SHAPE;
+
+	BlendShape(const Scene& _scene, const IElement& _element);
+
+	virtual int getBlendShapeChannelCount() const = 0;
+	virtual const BlendShapeChannel* getBlendShapeChannel(int idx) const = 0;
+};
+
+// Abstract interface for Type::NODE_ATTRIBUTE objects.
+struct NodeAttribute : Object
+{
+	static const Type s_type = Type::NODE_ATTRIBUTE;
+
+	NodeAttribute(const Scene& _scene, const IElement& _element);
+
+	virtual DataView getAttributeType() const = 0;
+};
+
+
+struct Vec2Attributes { // Vec2 attribute array with an optional index array
+	const Vec2* values = nullptr;
+	const int* indices = nullptr;
+	int count = 0;
+
+	const Vec2& get(int i) const { return indices ? values[indices[i]] : values[i]; } // goes through `indices` when it is non-null; no bounds check
+};
+
+struct Vec3Attributes { // Vec3 attribute array with an optional index array
+	const Vec3* values = nullptr;
+	const int* indices = nullptr;
+	int count = 0;
+	int values_count = 0;
+
+	const Vec3& get(int i) const { return indices ? values[indices[i]] : values[i]; } // goes through `indices` when it is non-null; no bounds check
+};
+
+struct Vec4Attributes { // Vec4 attribute array with an optional index array
+	const Vec4* values = nullptr;
+	const int* indices = nullptr;
+	int count = 0;
+
+	const Vec4& get(int i) const { return indices ? values[indices[i]] : values[i]; } // goes through `indices` when it is non-null; no bounds check
+};
+
+// subset of polygons with same material; all members are const, so instances cannot be assigned to
+struct GeometryPartition {
+	struct Polygon {
+		const int from_vertex; // index into VecNAttributes::indices
+		const int vertex_count;
+	};
+	const Polygon* polygons;
+	const int polygon_count;
+	const int max_polygon_triangles; // max triangles in single polygon, can be used for preallocation
+	const int triangles_count; // number of triangles after polygon triangulation, can be used for preallocation
+};
+
+struct GeometryData {
+	virtual ~GeometryData() {}
+	// Attribute arrays are returned by value as small view structs (pointers plus counts).
+	virtual Vec3Attributes getPositions() const = 0;
+	virtual Vec3Attributes getNormals() const = 0;
+	virtual Vec2Attributes getUVs(int index = 0) const = 0;
+	virtual Vec4Attributes getColors() const = 0;
+	virtual Vec3Attributes getTangents() const = 0;
+	virtual int getPartitionCount() const = 0;
+	virtual GeometryPartition getPartition(int partition_index) const = 0;
+};
+
+// Abstract interface for Type::GEOMETRY objects: geometry data plus optional skin and blend shape.
+struct Geometry : Object {
+	static const Type s_type = Type::GEOMETRY;
+	static const int s_uvs_max = 4;
+
+	Geometry(const Scene& _scene, const IElement& _element);
+
+	virtual const GeometryData& getGeometryData() const = 0;
+	virtual const Skin* getSkin() const = 0;
+	virtual const BlendShape* getBlendShape() const = 0;
+};
+
+// Abstract interface for Type::SHAPE objects: vertex, index and normal arrays.
+struct Shape : Object
+{
+	static const Type s_type = Type::SHAPE;
+
+	Shape(const Scene& _scene, const IElement& _element);
+
+	virtual const Vec3* getVertices() const = 0;
+	virtual int getVertexCount() const = 0;
+
+	virtual const int* getIndices() const = 0;
+	virtual int getIndexCount() const = 0;
+
+	virtual const Vec3* getNormals() const = 0; // no separate count accessor is declared for normals
+};
+
+// Abstract interface for Type::MESH objects: pose, geometry, materials and deformers of one mesh.
+struct Mesh : Object {
+	static const Type s_type = Type::MESH;
+
+	Mesh(const Scene& _scene, const IElement& _element);
+
+	virtual const Pose* getPose() const = 0;
+	virtual const Geometry* getGeometry() const = 0;
+	virtual DMatrix getGeometricMatrix() const = 0;
+	virtual const Material* getMaterial(int idx) const = 0;
+	virtual int getMaterialCount() const = 0;
+	// this will use data from `Geometry` if available and from `Mesh` otherwise
+	virtual const GeometryData& getGeometryData() const = 0;
+	virtual const Skin* getSkin() const = 0;
+	virtual const BlendShape* getBlendShape() const = 0;
+};
+
+// Abstract interface for Type::ANIMATION_STACK objects: indexed access to AnimationLayer objects.
+struct AnimationStack : Object
+{
+	static const Type s_type = Type::ANIMATION_STACK;
+
+	AnimationStack(const Scene& _scene, const IElement& _element);
+	virtual const AnimationLayer* getLayer(int index) const = 0;
+};
+
+// Abstract interface for Type::ANIMATION_LAYER objects: curve nodes by index or by (bone, property).
+struct AnimationLayer : Object
+{
+	static const Type s_type = Type::ANIMATION_LAYER;
+
+	AnimationLayer(const Scene& _scene, const IElement& _element);
+
+	virtual const AnimationCurveNode* getCurveNode(int index) const = 0;
+	virtual const AnimationCurveNode* getCurveNode(const Object& bone, const char* property) const = 0;
+};
+
+// Abstract interface for Type::ANIMATION_CURVE objects: key times (i64) and key values (float) with one shared count.
+struct AnimationCurve : Object
+{
+	static const Type s_type = Type::ANIMATION_CURVE;
+
+	AnimationCurve(const Scene& _scene, const IElement& _element);
+
+	virtual int getKeyCount() const = 0;
+	virtual const i64* getKeyTime() const = 0;
+	virtual const float* getKeyValue() const = 0;
+};
+
+// Abstract interface for Type::ANIMATION_CURVE_NODE objects: curves attached to a bone property.
+struct AnimationCurveNode : Object
+{
+	static const Type s_type = Type::ANIMATION_CURVE_NODE;
+
+	AnimationCurveNode(const Scene& _scene, const IElement& _element);
+
+	virtual DataView getBoneLinkProperty() const = 0;
+	virtual const AnimationCurve* getCurve(int idx) const = 0; // valid range of idx is not stated here - TODO confirm in ofbx.cpp
+	virtual DVec3 getNodeLocalTransform(double time) const = 0;
+	virtual const Object* getBone() const = 0;
+};
+
+// Plain record describing one take, as returned by IScene::getTakeInfo().
+struct TakeInfo
+{
+	DataView name;
+	DataView filename;
+	double local_time_from;
+	double local_time_to;
+	double reference_time_from;
+	double reference_time_to;
+};
+
+
+// Specifies which canonical axis represents up in the system (typically Y or Z).
+enum UpVector
+{
+	UpVector_AxisX = 0,
+	UpVector_AxisY = 1,
+	UpVector_AxisZ = 2
+};
+
+
+// Specifies the third vector of the system.
+enum CoordSystem
+{
+	CoordSystem_RightHanded = 0,
+	CoordSystem_LeftHanded = 1
+};
+
+
+// http://docs.autodesk.com/FBX/2014/ENU/FBX-SDK-Documentation/index.html?url=cpp_ref/class_fbx_time.html,topicNumber=cpp_ref_class_fbx_time_html29087af6-8c2c-4e9d-aede-7dc5a1c2436c,hash=a837590fd5310ff5df56ffcf7c394787e
+enum FrameRate
+{
+	FrameRate_DEFAULT = 0,
+	FrameRate_120 = 1,
+	FrameRate_100 = 2,
+	FrameRate_60 = 3,
+	FrameRate_50 = 4,
+	FrameRate_48 = 5,
+	FrameRate_30 = 6,
+	FrameRate_30_DROP = 7,
+	FrameRate_NTSC_DROP_FRAME = 8,
+	FrameRate_NTSC_FULL_FRAME = 9,
+	FrameRate_PAL = 10,
+	FrameRate_CINEMA = 11,
+	FrameRate_1000 = 12,
+	FrameRate_CINEMA_ND = 13,
+	FrameRate_CUSTOM = 14,
+};
+
+
+struct GlobalSettings // scene-wide settings; every field carries an in-class default
+{
+	UpVector UpAxis = UpVector_AxisY;
+	int UpAxisSign = 1;
+	// this seems to be 1-2 in Autodesk (odd/even parity), and 0-2 in Blender (axis as in UpAxis)
+	// I recommend to ignore FrontAxis and use just UpVector
+	int FrontAxis = 1; // see the caveat above
+	int FrontAxisSign = 1;
+	CoordSystem CoordAxis = CoordSystem_RightHanded;
+	int CoordAxisSign = 1;
+	int OriginalUpAxis = 0;
+	int OriginalUpAxisSign = 1;
+	float UnitScaleFactor = 1;
+	float OriginalUnitScaleFactor = 1;
+	double TimeSpanStart = 0L;
+	double TimeSpanStop = 0L;
+	FrameRate TimeMode = FrameRate_DEFAULT;
+	float CustomFrameRate = -1.0f;
+};
+
+// Abstract scene returned by load(). The destructor is protected, so a scene is released with destroy(), not delete.
+struct IScene
+{
+	virtual void destroy() = 0;
+
+	// Root Node
+	virtual const IElement* getRootElement() const = 0;
+	virtual const Object* getRoot() const = 0;
+
+	// Meshes
+	virtual int getMeshCount() const = 0;
+	virtual const Mesh* getMesh(int index) const = 0;
+
+	// Geometry
+	virtual int getGeometryCount() const = 0;
+	virtual const Geometry* getGeometry(int index) const = 0;
+
+	// Animations
+	virtual int getAnimationStackCount() const = 0;
+	virtual const AnimationStack* getAnimationStack(int index) const = 0;
+
+	// Cameras
+	virtual int getCameraCount() const = 0;
+	virtual const Camera* getCamera(int index) const = 0;
+
+	// Lights
+	virtual int getLightCount() const = 0;
+	virtual const Light* getLight(int index) const = 0;
+
+	// Scene Objects (Everything in scene)
+	virtual const Object* const* getAllObjects() const = 0;
+	virtual int getAllObjectCount() const = 0;
+
+	// Embedded files/Data
+	virtual int getEmbeddedDataCount() const = 0;
+	virtual DataView getEmbeddedData(int index) const = 0;
+	virtual DataView getEmbeddedFilename(int index) const = 0;
+	virtual bool isEmbeddedBase64(int index) const = 0;
+	// data are encoded in returned property and all ->next properties
+	virtual const IElementProperty* getEmbeddedBase64Data(int index) const = 0;
+
+	// Scene Misc
+	virtual const TakeInfo* getTakeInfo(const char* name) const = 0;
+	virtual float getSceneFrameRate() const = 0;
+	virtual const GlobalSettings* getGlobalSettings() const = 0;
+
+protected:
+	virtual ~IScene() {}
+};
+
+
+IScene* load(const u8* data, int size, u16 flags, JobProcessor job_processor = nullptr, void* job_user_ptr = nullptr); // flags: LoadFlags bits as u16; the scene is released with IScene::destroy()
+const char* getError(); // error text for a failed load()
+double fbxTimeToSeconds(i64 value);
+i64 secondsToFbxTime(double value);
+
+// TODO nonconvex
+// Triangulates one polygon as a fan anchored at its first vertex.
+//   geom        - not read by this implementation.
+//   polygon     - vertex range to split; fewer than 3 vertices produce no output.
+//   tri_indices - receives 3 indices per triangle (3 * (vertex_count - 2) values in total);
+//                 the caller provides the storage.
+// Returns the number of indices written.
+inline u32 triangulate(const GeometryData& geom, const GeometryPartition::Polygon& polygon, int* tri_indices) {
+	static_cast<void>(geom); // part of the signature only
+
+	const int first = polygon.from_vertex;
+	const int corners = polygon.vertex_count;
+	if (corners < 3) return 0;
+
+	// Triangle k is (first, first + 1 + k, first + 2 + k): a triangle gives (0, 1, 2) and a
+	// quad gives (0, 1, 2), (0, 2, 3), both relative to `first`.
+	const int triangle_count = corners - 2;
+	int* out = tri_indices;
+	for (int k = 0; k < triangle_count; ++k) {
+		out[0] = first;
+		out[1] = first + 1 + k;
+		out[2] = first + 2 + k;
+		out += 3;
+	}
+
+	return 3 * triangle_count;
+}
+
+
+} // namespace ofbx
+
+#ifdef OFBX_DEFAULT_DELETER
+#include <memory>
+
+// std::unique_ptr<ofbx::IScene> support: IScene's destructor is protected, so the scene is
+// released through IScene::destroy() instead of delete.
+template <> struct ::std::default_delete<ofbx::IScene>
+{
+	default_delete() = default;
+	template <class U> constexpr default_delete(default_delete<U>) noexcept {}
+	void operator()(ofbx::IScene* scene) const noexcept
+	{
+		if (!scene) return; // null pointers are ignored
+		scene->destroy();
+	}
+};
+#endif
diff --git a/Plugins/nosGeometry/External/openFBX/readme.txt b/Plugins/nosGeometry/External/openFBX/readme.txt
new file mode 100644
index 00000000..f0077b47
--- /dev/null
+++ b/Plugins/nosGeometry/External/openFBX/readme.txt
@@ -0,0 +1 @@
+https://github.com/nem0/OpenFBX
\ No newline at end of file
diff --git a/Plugins/nosGeometry/Geometry.noscfg b/Plugins/nosGeometry/Geometry.noscfg
new file mode 100644
index 00000000..e1e7bcaf
--- /dev/null
+++ b/Plugins/nosGeometry/Geometry.noscfg
@@ -0,0 +1,23 @@
+{
+    "info": {
+        "id": {
+            "name": "nos.geometry",
+            "version": "0.1.0"
+        },
+        "display_name": "Geometry",
+        "description": "Nodes for reading 3D assets (FBX) and 3D geometry operations.",
+        "category": "Geometry",
+        "dependencies": [
+            {
+                "name": "nos.sys.track",
+                "version": "1.1"
+            }
+        ]
+    },
+    "binary_path": "Binaries/nosGeometry",
+    "node_definitions": [
+        "Config/ReadFBXTransform.nosdef"
+    ],
+    "defaults": [],
+    "custom_types": []
+}
\ No newline at end of file
diff --git a/Plugins/nosGeometry/Source/PluginMain.cpp b/Plugins/nosGeometry/Source/PluginMain.cpp
new file mode 100644
index 00000000..bf50b6e1
--- /dev/null
+++ b/Plugins/nosGeometry/Source/PluginMain.cpp
@@ -0,0 +1,31 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/PluginAPI.h>
+#include <Nodos/PluginHelpers.hpp>
+#include <Nodos/Helpers.hpp>
+
+NOS_INIT()
+NOS_BEGIN_IMPORT_DEPS()
+NOS_END_IMPORT_DEPS()
+
+namespace nos::geometry
+{
+nosResult RegisterReadFBXTransform(nosNodeFunctions*);
+}
+// Reports the single node class of this plugin and, when an output array is supplied, fills slot 0.
+nosResult NOSAPI_CALL ExportNodeFunctions(size_t* outCount, nosNodeFunctions** outFunctions)
+{
+    *outCount = 1;
+    // Without an output array only the count is reported.
+    return outFunctions ? nos::geometry::RegisterReadFBXTransform(outFunctions[0])
+                        : NOS_RESULT_SUCCESS;
+}
+
+extern "C"
+{
+NOSAPI_ATTR nosResult NOSAPI_CALL nosExportPlugin(nosPluginFunctions* out) // fills the plugin function table with the node-export callback
+{
+	out->ExportNodeFunctions = ExportNodeFunctions;
+	return NOS_RESULT_SUCCESS;
+}
+}
diff --git a/Plugins/nosGeometry/Source/ReadFBXTransform.cpp b/Plugins/nosGeometry/Source/ReadFBXTransform.cpp
new file mode 100644
index 00000000..9c8df2e9
--- /dev/null
+++ b/Plugins/nosGeometry/Source/ReadFBXTransform.cpp
@@ -0,0 +1,240 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/PluginHelpers.hpp>
+#include <Nodos/Helpers.hpp>
+
+// Framework builtins (nos.fb.Transform / nos.fb.vec3d)
+#include <Builtins_generated.h>
+
+#include <glm/glm.hpp>
+
+// Shared CoordinateFrame enum + Euler conversion helpers (nos.sys.track).
+#include <nosSysTrack/CoordinateFrameConv.h>
+
+// Vendored FBX reader
+#include <ofbx.h>
+
+#include <cstdint>
+#include <filesystem>
+#include <fstream>
+#include <string>
+#include <unordered_map>
+#include <unordered_set>
+#include <vector>
+
+namespace nos::geometry
+{
+NOS_REGISTER_NAME(Path)
+NOS_REGISTER_NAME(Object)
+NOS_REGISTER_NAME(SourceFrame)
+NOS_REGISTER_NAME(LocalTransform)
+NOS_REGISTER_NAME(GlobalTransform)
+NOS_REGISTER_NAME(IsLoaded)
+
+namespace conv = nos::track::convention;
+using Frame = nos::sys::track::CoordinateFrame;
+
+// Frame-independent decomposition of an FBX object's transform. Rotation is kept
+// as a matrix so it can be re-expressed in whatever CoordinateFrame the user picks
+// without re-reading the file.
+struct RawTransform
+{
+	glm::dvec3 Translation{0.0}; // defaults describe the identity transform
+	glm::dmat3 Rotation{1.0};    // columns are the scale-normalized basis axes (see DecomposeMatrix)
+	glm::dvec3 Scale{1.0};
+};
+
+struct ObjectTransforms // both transforms of one FBX node, stored per combo-box label
+{
+	RawTransform Local;  // decomposed ofbx::Object::getLocalTransform()
+	RawTransform Global; // decomposed ofbx::Object::getGlobalTransform()
+};
+
+// Decompose an openFBX 4x4 (column-major double[16]) into translation, a normalized
+// right-handed rotation matrix, and per-axis scale. A mirrored basis is reported as a
+// negative X scale so the reflection does not end up inside Rotation (and the Euler angles).
+static RawTransform DecomposeMatrix(ofbx::DMatrix const& m)
+{
+	glm::dmat4 gm(1.0);
+	for (int i = 0; i < 16; ++i)
+		gm[i / 4][i % 4] = m.m[i];
+	glm::dvec3 const axisX(gm[0]), axisY(gm[1]), axisZ(gm[2]);
+	RawTransform out;
+	out.Translation = glm::dvec3(gm[3]);
+	// Negative triple product => left-handed (mirrored) basis: carry the flip on the X scale.
+	double const mirror = glm::dot(glm::cross(axisX, axisY), axisZ) < 0.0 ? -1.0 : 1.0;
+	out.Scale = glm::dvec3(mirror * glm::length(axisX), glm::length(axisY), glm::length(axisZ));
+	out.Rotation = glm::dmat3( // zero-length axes fall back to the matching identity column
+		out.Scale.x != 0.0 ? axisX / out.Scale.x : glm::dvec3(1, 0, 0),
+		out.Scale.y != 0.0 ? axisY / out.Scale.y : glm::dvec3(0, 1, 0),
+		out.Scale.z != 0.0 ? axisZ / out.Scale.z : glm::dvec3(0, 0, 1));
+	return out;
+}
+
+// Converts a decomposed transform into a nos.fb.Transform. The rotation is emitted as
+// Euler angles in `frame`'s convention so it composes with the Convert Transform node.
+static fb::Transform ToTransform(RawTransform const& t, Frame frame)
+{
+	glm::dvec3 const angles = conv::MatToEuler(frame, t.Rotation);
+	fb::vec3d const position(t.Translation.x, t.Translation.y, t.Translation.z);
+	fb::vec3d const rotation(angles.x, angles.y, angles.z);
+	fb::vec3d const scale(t.Scale.x, t.Scale.y, t.Scale.z);
+	return fb::Transform(position, rotation, scale);
+}
+// Node context for nos.geometry.ReadFBXTransform: parses the FBX file named by the Path pin,
+// lists its scene nodes in the Object combo box and publishes the selected node's local and
+// global transforms using the Euler convention of the SourceFrame pin.
+struct ReadFBXTransformContext : NodeContext
+{
+	// Combo-box labels in display order and their resolved (raw) transforms.
+	std::vector<std::string> ObjectLabels;
+	std::unordered_map<std::string, ObjectTransforms> Transforms;
+	// Per-node unique name of the string list backing the Object combo box.
+	std::string ComboListName;
+	// Object the user last selected; preferred when (re)loading a file.
+	std::string DesiredSelection;
+	// Coordinate frame the user declared the file is authored in.
+	Frame CurrentFrame = Frame::RH_YUp_FwdNegZ_RightX;
+	bool Loaded = false;
+
+	ReadFBXTransformContext(nosFbNodePtr node) : NodeContext(node)
+	{
+		ComboListName = "nos.geometry.FBXObjects." + std::string(NodeId);
+		SetPinVisualizer(NSN_Object, {.type = nos::fb::VisualizerType::COMBO_BOX, .name = ComboListName});
+
+		// Restore saved path / selection / frame.
+		std::string path;
+		if (auto* pins = node->pins())
+			for (auto const* pin : *pins)
+			{
+				if (!pin->name() || !pin->data() || !pin->data()->size())
+					continue;
+				// Compared as std::string: this file never includes <cstring>, so strcmp is not guaranteed to be declared.
+				std::string const name = pin->name()->c_str();
+				if (name == "Path")
+					path = reinterpret_cast<const char*>(pin->data()->data());
+				else if (name == "Object")
+					DesiredSelection = reinterpret_cast<const char*>(pin->data()->data());
+				else if (name == "SourceFrame")
+					CurrentFrame = static_cast<Frame>(*reinterpret_cast<const uint8_t*>(pin->data()->data()));
+			}
+		if (!path.empty())
+			LoadFbx(path);
+	}
+
+	void OnPinValueChanged(nos::Name pinName, uuid const& pinId, nosBuffer value) override // reacts to Path, Object and SourceFrame edits
+	{
+		if (pinName == NSN_Path)
+		{
+			LoadFbx(value.Data ? reinterpret_cast<const char*>(value.Data) : "");
+		}
+		else if (pinName == NSN_Object)
+		{
+			DesiredSelection = value.Data ? reinterpret_cast<const char*>(value.Data) : "";
+			UpdateOutputs(DesiredSelection);
+		}
+		else if (pinName == NSN_SourceFrame)
+		{
+			if (value.Data)
+				CurrentFrame = static_cast<Frame>(*reinterpret_cast<const uint8_t*>(value.Data));
+			UpdateOutputs(DesiredSelection);
+		}
+	}
+
+	// (Re)loads `path`: rebuilds the combo-box list and the per-object transform table, then
+	// publishes the selected object's transforms. Every failure path reports through Finish(false, ...).
+	void LoadFbx(std::string const& path)
+	{
+		ObjectLabels.clear();
+		Transforms.clear();
+		UpdateStringList(ComboListName, {});
+
+		std::error_code ec;
+		if (path.empty() || !std::filesystem::exists(path, ec))
+			return Finish(false, path.empty() ? "No FBX file selected" : "FBX file not found");
+
+		std::ifstream file(std::filesystem::path(path), std::ios::binary);
+		std::vector<ofbx::u8> content((std::istreambuf_iterator<char>(file)), std::istreambuf_iterator<char>());
+		if (content.empty())
+			return Finish(false, "Failed to read FBX file");
+		// ofbx::load takes the byte count as `int`; reject sizes the cast below would truncate.
+		if (content.size() > static_cast<std::size_t>(INT32_MAX))
+			return Finish(false, "FBX file is too large");
+
+		// We only need the scene graph / transforms, so skip the heavy payloads.
+		auto flags = ofbx::LoadFlags::IGNORE_GEOMETRY | ofbx::LoadFlags::IGNORE_BLEND_SHAPES |
+					 ofbx::LoadFlags::IGNORE_TEXTURES | ofbx::LoadFlags::IGNORE_SKIN |
+					 ofbx::LoadFlags::IGNORE_MATERIALS | ofbx::LoadFlags::IGNORE_ANIMATIONS |
+					 ofbx::LoadFlags::IGNORE_VIDEOS | ofbx::LoadFlags::IGNORE_POSES;
+
+		ofbx::IScene* scene = ofbx::load(content.data(), static_cast<int>(content.size()), static_cast<ofbx::u16>(flags));
+		if (!scene)
+		{
+			nosEngine.LogE("ReadFBXTransform: failed to parse '%s': %s", path.c_str(), ofbx::getError());
+			return Finish(false, "Failed to parse FBX");
+		}
+		// Destroys the scene on every exit path, including exceptions thrown while filling the tables.
+		struct SceneGuard { ofbx::IScene* Scene; ~SceneGuard() { Scene->destroy(); } } sceneGuard{scene};
+
+		std::unordered_set<std::string> usedLabels;
+		int count = scene->getAllObjectCount();
+		ofbx::Object const* const* objects = scene->getAllObjects();
+		for (int i = 0; i < count; ++i)
+		{
+			ofbx::Object const* obj = objects[i];
+			if (!obj || !obj->isNode())
+				continue;
+
+			// Duplicate names get a " (2)", " (3)", ... suffix so every combo-box entry is unique.
+			std::string base = (obj->name[0] != '\0') ? obj->name : "(unnamed)";
+			std::string label = base;
+			for (int suffix = 2; usedLabels.count(label); ++suffix)
+				label = base + " (" + std::to_string(suffix) + ")";
+			usedLabels.insert(label);
+
+			ObjectTransforms t;
+			t.Local = DecomposeMatrix(obj->getLocalTransform());
+			t.Global = DecomposeMatrix(obj->getGlobalTransform());
+
+			Transforms.emplace(label, t);
+			ObjectLabels.push_back(std::move(label));
+		}
+
+		if (ObjectLabels.empty())
+			return Finish(false, "No objects found in FBX");
+
+		UpdateStringList(ComboListName, ObjectLabels);
+
+		// Keep the previous selection if it still exists, otherwise pick the first.
+		std::string selection = Transforms.count(DesiredSelection) ? DesiredSelection : ObjectLabels.front();
+		DesiredSelection = selection;
+		SetPinValue(NSN_Object, selection.c_str());
+		UpdateOutputs(selection);
+
+		Finish(true, "Loaded " + std::to_string(ObjectLabels.size()) + " object(s)");
+	}
+
+	void UpdateOutputs(std::string const& selection) // publishes both transforms of `selection`; unknown labels leave the pins untouched
+	{
+		auto it = Transforms.find(selection);
+		if (it == Transforms.end())
+			return;
+		SetPinValue(NSN_LocalTransform, nos::Buffer::From(ToTransform(it->second.Local, CurrentFrame)));
+		SetPinValue(NSN_GlobalTransform, nos::Buffer::From(ToTransform(it->second.Global, CurrentFrame)));
+	}
+
+	void Finish(bool ok, std::string const& message) // records the load result on the IsLoaded pin and the node status line
+	{
+		Loaded = ok;
+		SetPinValue(NSN_IsLoaded, nos::Buffer::From(Loaded));
+		SetNodeStatusMessage(message, ok ? fb::NodeStatusMessageType::INFO : fb::NodeStatusMessageType::WARNING);
+	}
+};
+
+nosResult RegisterReadFBXTransform(nosNodeFunctions* fn) // binds ReadFBXTransformContext to the "nos.geometry.ReadFBXTransform" node class
+{
+	NOS_BIND_NODE_CLASS(NOS_NAME("nos.geometry.ReadFBXTransform"), ReadFBXTransformContext, fn);
+	return NOS_RESULT_SUCCESS;
+}
+
+} // namespace nos::geometry
diff --git a/Plugins/nosMath/CMakeLists.txt b/Plugins/nosMath/CMakeLists.txt
index ee9ef718..bcbf2b2f 100644
--- a/Plugins/nosMath/CMakeLists.txt
+++ b/Plugins/nosMath/CMakeLists.txt
@@ -6,6 +6,10 @@ add_library(tinyexpr_cpp STATIC ${TINYEXPR_SOURCES})
 target_include_directories(tinyexpr_cpp PUBLIC External/tinyexpr-cpp)
 nos_group_targets("tinyexpr_cpp" "External")
 
-set(DEPENDENCIES ${NOS_PLUGIN_SDK_TARGET} tinyexpr_cpp)
+set(GENERATED_OUTPUT_DIR "${CMAKE_CURRENT_BINARY_DIR}/Generated")
+nos_generate_flatbuffers("${CMAKE_CURRENT_SOURCE_DIR}/Config" "${GENERATED_OUTPUT_DIR}" "cpp" "${NOS_SDK_DIR}/Types" nosMath_generated)
 
-nos_add_plugin("nosMath" "${DEPENDENCIES}" "")
+set(DEPENDENCIES ${NOS_PLUGIN_SDK_TARGET} tinyexpr_cpp nosMath_generated)
+set(INCLUDE_FOLDERS "${GENERATED_OUTPUT_DIR}")
+
+nos_add_plugin("nosMath" "${DEPENDENCIES}" "${INCLUDE_FOLDERS}")
diff --git a/Plugins/nosMath/Config/EulerToQuaternion.nosdef b/Plugins/nosMath/Config/EulerToQuaternion.nosdef
new file mode 100644
index 00000000..fa40e5d7
--- /dev/null
+++ b/Plugins/nosMath/Config/EulerToQuaternion.nosdef
@@ -0,0 +1,38 @@
+{
+	"nodes": [
+		{
+			"class_name": "EulerToQuaternion",
+			"menu_info": {
+				"category": "Math|Linear Algebra",
+				"display_name": "Euler To Quaternion"
+			},
+			"node": {
+				"class_name": "EulerToQuaternion",
+				"contents_type": "Job",
+				"description": "Converts an Euler-angle rotation (degrees) to a unit quaternion (x, y, z, w). The Order pin selects the intrinsic rotation order applied to the components of the input vec3 (e.g. ZYX means R = Rz(rot.z) * Ry(rot.y) * Rx(rot.x)). Default ZYX matches the FreeD/Track convention.",
+				"pins": [
+					{
+						"name": "Euler",
+						"type_name": "nos.fb.vec3d",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					},
+					{
+						"name": "Order",
+						"type_name": "nos.math.EulerOrder",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "ZYX",
+						"description": "Euler intrinsic rotation order applied to the (rot.x, rot.y, rot.z) components."
+					},
+					{
+						"name": "Quaternion",
+						"type_name": "nos.fb.vec4d",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY"
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosMath/Config/Math.fbs b/Plugins/nosMath/Config/Math.fbs
new file mode 100644
index 00000000..84c79eeb
--- /dev/null
+++ b/Plugins/nosMath/Config/Math.fbs
@@ -0,0 +1,10 @@
+namespace nos.math;
+
+enum EulerOrder : ubyte { // Intrinsic Euler rotation order; type of the "Order" pin on EulerToQuaternion / QuaternionToEuler.
+	ZYX = 0, // default value of both Order pins
+	XYZ = 1,
+	YXZ = 2,
+	YZX = 3,
+	ZXY = 4,
+	XZY = 5,
+}
diff --git a/Plugins/nosMath/Config/QuaternionMultiply.nosdef b/Plugins/nosMath/Config/QuaternionMultiply.nosdef
new file mode 100644
index 00000000..fc162b41
--- /dev/null
+++ b/Plugins/nosMath/Config/QuaternionMultiply.nosdef
@@ -0,0 +1,36 @@
+{
+	"nodes": [
+		{
+			"class_name": "QuaternionMultiply",
+			"menu_info": {
+				"category": "Math|Linear Algebra",
+				"display_name": "Quaternion Multiply"
+			},
+			"node": {
+				"class_name": "QuaternionMultiply",
+				"contents_type": "Job",
+				"description": "Hamilton product of two unit quaternions: Result = A * B (each as (x, y, z, w)). Composing rotations: A * B applies B first, then A. To rotate (conjugate) a quaternion Q by R, compute R * Q * conjugate(R).",
+				"pins": [
+					{
+						"name": "A",
+						"type_name": "nos.fb.vec4d",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					},
+					{
+						"name": "B",
+						"type_name": "nos.fb.vec4d",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					},
+					{
+						"name": "Result",
+						"type_name": "nos.fb.vec4d",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY"
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosMath/Config/QuaternionToEuler.nosdef b/Plugins/nosMath/Config/QuaternionToEuler.nosdef
new file mode 100644
index 00000000..d08ffc7a
--- /dev/null
+++ b/Plugins/nosMath/Config/QuaternionToEuler.nosdef
@@ -0,0 +1,38 @@
+{
+	"nodes": [
+		{
+			"class_name": "QuaternionToEuler",
+			"menu_info": {
+				"category": "Math|Linear Algebra",
+				"display_name": "Quaternion To Euler"
+			},
+			"node": {
+				"class_name": "QuaternionToEuler",
+				"contents_type": "Job",
+				"description": "Converts a unit quaternion (x, y, z, w) to Euler angles (degrees). The Order pin selects the intrinsic rotation order extracted (e.g. ZYX yields rot.z = first rotation about Z, rot.y about Y, rot.x about X). Inverse of EulerToQuaternion when the same Order is used on both ends.",
+				"pins": [
+					{
+						"name": "Quaternion",
+						"type_name": "nos.fb.vec4d",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					},
+					{
+						"name": "Order",
+						"type_name": "nos.math.EulerOrder",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "ZYX",
+						"description": "Euler intrinsic rotation order extracted into the (rot.x, rot.y, rot.z) output components."
+					},
+					{
+						"name": "Euler",
+						"type_name": "nos.fb.vec3d",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY"
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosMath/Math.noscfg b/Plugins/nosMath/Math.noscfg
index de4791ee..5417aca6 100644
--- a/Plugins/nosMath/Math.noscfg
+++ b/Plugins/nosMath/Math.noscfg
@@ -14,7 +14,9 @@
       }
     ]
   },
-  "custom_types": [],
+  "custom_types": [
+    "Config/Math.fbs"
+  ],
   "node_definitions": [
     "Config/Math.nosdef",
     "Config/Eval.nosdef",
@@ -25,7 +27,10 @@
     "Config/Random.nosdef",
     "Config/Lerp.nosdef",
     "Config/Vec3ToVec4.nosdef",
-    "Config/EmbedMat3ToMat4.nosdef"
+    "Config/EmbedMat3ToMat4.nosdef",
+    "Config/EulerToQuaternion.nosdef",
+    "Config/QuaternionToEuler.nosdef",
+    "Config/QuaternionMultiply.nosdef"
   ],
   "binary_path": "Binaries/nosMath",
   "third_party_software": [
diff --git a/Plugins/nosMath/Source/EulerToQuaternion.cpp b/Plugins/nosMath/Source/EulerToQuaternion.cpp
new file mode 100644
index 00000000..94440a60
--- /dev/null
+++ b/Plugins/nosMath/Source/EulerToQuaternion.cpp
@@ -0,0 +1,97 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/PluginHelpers.hpp>
+#include <Math_generated.h>
+#include <glm/glm.hpp>
+#include <glm/gtc/quaternion.hpp>
+#include <glm/gtx/euler_angles.hpp>
+
+namespace nos::math
+{
+
+// Composes the homogeneous rotation matrix for a set of Euler angles (radians) in the requested intrinsic order.
+// angles.x, angles.y and angles.z are always the rotations about X, Y and Z; only the multiplication order varies.
+// Example: ZYX gives Rz(angles.z) * Ry(angles.y) * Rx(angles.x). An out-of-range order yields the identity matrix.
+static glm::dmat4 EulerToMat(EulerOrder order, glm::dvec3 const& angles)
+{
+	switch (order)
+	{
+	case EulerOrder::ZYX: return glm::eulerAngleZYX<double>(angles.z, angles.y, angles.x);
+	case EulerOrder::XYZ: return glm::eulerAngleXYZ<double>(angles.x, angles.y, angles.z);
+	case EulerOrder::YXZ: return glm::eulerAngleYXZ<double>(angles.y, angles.x, angles.z);
+	case EulerOrder::YZX: return glm::eulerAngleYZX<double>(angles.y, angles.z, angles.x);
+	case EulerOrder::ZXY: return glm::eulerAngleZXY<double>(angles.z, angles.x, angles.y);
+	case EulerOrder::XZY: return glm::eulerAngleXZY<double>(angles.x, angles.z, angles.y);
+	}
+	return glm::dmat4(1.0);
+}
+
+static void MatToEuler(EulerOrder order, glm::dmat4 const& rotation, glm::dvec3& angles) // mirrors EulerToMat; `angles` (radians) stays untouched for an out-of-range order
+{
+	switch (order)
+	{
+	case EulerOrder::ZYX: glm::extractEulerAngleZYX(rotation, angles.z, angles.y, angles.x); return;
+	case EulerOrder::XYZ: glm::extractEulerAngleXYZ(rotation, angles.x, angles.y, angles.z); return;
+	case EulerOrder::YXZ: glm::extractEulerAngleYXZ(rotation, angles.y, angles.x, angles.z); return;
+	case EulerOrder::YZX: glm::extractEulerAngleYZX(rotation, angles.y, angles.z, angles.x); return;
+	case EulerOrder::ZXY: glm::extractEulerAngleZXY(rotation, angles.z, angles.x, angles.y); return;
+	case EulerOrder::XZY: glm::extractEulerAngleXZY(rotation, angles.x, angles.z, angles.y); return;
+	}
+}
+
+struct EulerToQuaternionNodeContext : NodeContext
+{
+	using NodeContext::NodeContext;
+
+	nosResult ExecuteNode(nosNodeExecuteParams* execParams) override
+	{
+		nos::NodeExecuteParams pins(execParams);
+		auto* eulerDeg = pins.GetPinData<fb::vec3d>(NOS_NAME("Euler"));
+		auto* rotationOrder = pins.GetPinData<EulerOrder>(NOS_NAME("Order"));
+		auto* quatOut = pins.GetPinData<fb::vec4d>(NOS_NAME("Quaternion"));
+		// The Euler pin is converted from degrees here; EulerToMat expects radians.
+		const glm::dvec3 eulerRad = glm::radians(glm::dvec3(eulerDeg->x(), eulerDeg->y(), eulerDeg->z()));
+		const glm::dquat rotation(EulerToMat(*rotationOrder, eulerRad));
+
+		quatOut->mutate_x(rotation.x);
+		quatOut->mutate_y(rotation.y);
+		quatOut->mutate_z(rotation.z);
+		quatOut->mutate_w(rotation.w);
+		return NOS_RESULT_SUCCESS;
+	}
+};
+
+void RegisterEulerToQuaternion(nosNodeFunctions* fn) // Binds EulerToQuaternionNodeContext to the "nos.math.EulerToQuaternion" node class.
+{
+	NOS_BIND_NODE_CLASS(NOS_NAME("nos.math.EulerToQuaternion"), EulerToQuaternionNodeContext, fn)
+}
+
+struct QuaternionToEulerNodeContext : NodeContext // Quaternion pin (x, y, z, w) + Order -> Euler pin in degrees
+{
+	using NodeContext::NodeContext;
+
+	nosResult ExecuteNode(nosNodeExecuteParams* execParams) override
+	{
+		nos::NodeExecuteParams params(execParams);
+		auto* in = params.GetPinData<fb::vec4d>(NOS_NAME("Quaternion"));
+		auto* order = params.GetPinData<EulerOrder>(NOS_NAME("Order"));
+		auto* out = params.GetPinData<fb::vec3d>(NOS_NAME("Euler"));
+		// mat4_cast only yields a rotation for unit quaternions, so normalize first (GLM maps zero length to identity).
+		glm::dquat q = glm::normalize(glm::dquat(in->w(), in->x(), in->y(), in->z()));
+		glm::dmat4 m = glm::mat4_cast(q);
+		glm::dvec3 r(0.0); // stays zero when Order is outside the enum, because MatToEuler then writes nothing
+		MatToEuler(*order, m, r);
+
+		out->mutate_x(glm::degrees(r.x));
+		out->mutate_y(glm::degrees(r.y));
+		out->mutate_z(glm::degrees(r.z));
+		return NOS_RESULT_SUCCESS;
+	}
+};
+
+void RegisterQuaternionToEuler(nosNodeFunctions* fn) // Binds QuaternionToEulerNodeContext to the "nos.math.QuaternionToEuler" node class.
+{
+	NOS_BIND_NODE_CLASS(NOS_NAME("nos.math.QuaternionToEuler"), QuaternionToEulerNodeContext, fn)
+}
+
+}  // namespace nos::math
diff --git a/Plugins/nosMath/Source/Math.cpp b/Plugins/nosMath/Source/Math.cpp
index c307f2cf..1893cc8e 100644
--- a/Plugins/nosMath/Source/Math.cpp
+++ b/Plugins/nosMath/Source/Math.cpp
@@ -104,6 +104,9 @@ enum class MathNodeTypes : int {
 	Or,
 	Not,
 	Random,
+	EulerToQuaternion,
+	QuaternionToEuler,
+	QuaternionMultiply,
 	Count
 };
 
@@ -168,6 +171,9 @@ void RegisterAnd(nosNodeFunctions*);
 void RegisterOr(nosNodeFunctions*);
 void RegisterNot(nosNodeFunctions*);
 void RegisterRandom(nosNodeFunctions*);
+void RegisterEulerToQuaternion(nosNodeFunctions*);
+void RegisterQuaternionToEuler(nosNodeFunctions*);
+void RegisterQuaternionMultiply(nosNodeFunctions*);
 
 nosResult NOSAPI_CALL ExportNodeFunctions(size_t* outCount, nosNodeFunctions** outList)
 {
@@ -281,6 +287,18 @@ nosResult NOSAPI_CALL ExportNodeFunctions(size_t* outCount, nosNodeFunctions** o
 			RegisterRandom(node);
 			break;
 		}
+		case MathNodeTypes::EulerToQuaternion: {
+			RegisterEulerToQuaternion(node);
+			break;
+		}
+		case MathNodeTypes::QuaternionToEuler: {
+			RegisterQuaternionToEuler(node);
+			break;
+		}
+		case MathNodeTypes::QuaternionMultiply: {
+			RegisterQuaternionMultiply(node);
+			break;
+		}
 		default:
 			break;
 		}
diff --git a/Plugins/nosMath/Source/QuaternionMultiply.cpp b/Plugins/nosMath/Source/QuaternionMultiply.cpp
new file mode 100644
index 00000000..395b4843
--- /dev/null
+++ b/Plugins/nosMath/Source/QuaternionMultiply.cpp
@@ -0,0 +1,39 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/PluginHelpers.hpp>
+#include <Math_generated.h>
+#include <glm/glm.hpp>
+#include <glm/gtc/quaternion.hpp>
+
+namespace nos::math
+{
+
+struct QuaternionMultiplyNodeContext : NodeContext
+{
+	using NodeContext::NodeContext;
+
+	nosResult ExecuteNode(nosNodeExecuteParams* execParams) override
+	{
+		nos::NodeExecuteParams pins(execParams);
+		auto* lhs = pins.GetPinData<fb::vec4d>(NOS_NAME("A"));
+		auto* rhs = pins.GetPinData<fb::vec4d>(NOS_NAME("B"));
+		auto* result = pins.GetPinData<fb::vec4d>(NOS_NAME("Result"));
+
+		// Result = A * B; each glm::dquat below is built with the w component passed first.
+		const glm::dquat product = glm::dquat(lhs->w(), lhs->x(), lhs->y(), lhs->z())
+		                         * glm::dquat(rhs->w(), rhs->x(), rhs->y(), rhs->z());
+
+		result->mutate_x(product.x);
+		result->mutate_y(product.y);
+		result->mutate_z(product.z);
+		result->mutate_w(product.w);
+		return NOS_RESULT_SUCCESS;
+	}
+};
+
+void RegisterQuaternionMultiply(nosNodeFunctions* fn) // Binds QuaternionMultiplyNodeContext to the "nos.math.QuaternionMultiply" node class.
+{
+	NOS_BIND_NODE_CLASS(NOS_NAME("nos.math.QuaternionMultiply"), QuaternionMultiplyNodeContext, fn)
+}
+
+}  // namespace nos::math
diff --git a/Plugins/nosTrack/CHANGES.md b/Plugins/nosTrack/CHANGES.md
new file mode 100644
index 00000000..ec713c45
--- /dev/null
+++ b/Plugins/nosTrack/CHANGES.md
@@ -0,0 +1,57 @@
+# Record Track (COLMAP) Node
+
+## Summary
+
+A new node, "Record Track (COLMAP)", has been added to the `nosTrack` plugin. It records incoming camera tracking data per frame and exports it in COLMAP's text format (`cameras.txt` + `images.txt`).
+
+## Files Changed
+
+### New files
+- `Source/RecordTrackCOLMAP.cpp` — Node implementation
+- `Config/RecordTrackCOLMAP.nosdef` — Node definition (pins, functions, metadata)
+
+### Modified files
+- `Source/TrackMain.cpp` — Added `RecordTrackCOLMAP` to the `TrackNode` enum and `ExportNodeFunctions` switch
+- `Track.noscfg` — Added `Config/RecordTrackCOLMAP.nosdef` to `node_definitions`
+
+## Node Design
+
+### Pins
+| Pin | Type | Direction | Description |
+|-----|------|-----------|-------------|
+| Track | `nos.sys.track.Track` | Input | Incoming tracking data |
+| Track Out | `nos.sys.track.Track` | Output (only) | Pass-through of input |
+| Output Directory | `string` | Property | Folder picker for output |
+| Image Resolution | `nos.fb.vec2u` | Property | Width/height (default 1920x1080) |
+| Record | `bool` | Property | Mirrors Record/Stop functions |
+| Frame Count | `uint` | Output (only) | Frames in buffer |
+
+### Functions
+| Function | Behavior |
+|----------|----------|
+| Record | Validates folder is empty, clears buffer, starts recording. Orphaned while recording. |
+| Stop | Stops recording (does NOT save). Orphaned while idle. |
+| Save | Writes `cameras.txt` + `images.txt` to disk. Does not clear buffer. |
+| Clear | Clears frame buffer and resets count. |
+| Open Folder | Opens output directory in explorer (Windows) or xdg-open (Linux). |
+
+### State Management
+- Record pin and functions are kept in sync bidirectionally. A `SyncingRecordPin` bool guard prevents re-entrant loops between pin changes and function calls.
+- Function orphan states: Record/Stop toggle via `SetNodeOrphanState` using a `Name -> UUID` map built in constructor.
+- Status messages show recording state + frame count, and persist error messages (e.g., "Target folder is not empty") via `LastError` until user changes the output directory.
+- Non-empty folder check: Recording fails with a FAILURE status if the target folder already has files.
+
+### COLMAP Output Format
+- `cameras.txt`: One OPENCV camera per frame — `fx, fy, cx, cy, k1, k2, p1, p2` derived from Track FOV, sensor size, pixel aspect ratio, lens distortion.
+- `images.txt`: Per-frame pose — Euler angles converted to quaternion (world-to-camera), translation as `t = -R * C`.
+
+## Known Review Points
+- Euler-to-quaternion convention: The Track's rotation fields (roll/tilt/pan) are passed through `glm::quat(eulerRadians)` then inverted for COLMAP's world-to-camera convention. May need validation against actual tracker output.
+- One camera per frame: Each frame gets its own camera entry. This handles zoom/FOV changes but may be unusual for COLMAP workflows with constant intrinsics.
+- No `points3D.txt`: COLMAP expects this file too (can be empty). Not currently written.
+- `std::system()` for Open Folder: Works but is a simple shell call. Could be replaced with platform APIs if needed.
+
+## Build
+```
+./nodos dev build -p Project13 --target nosTrack
+```
diff --git a/Plugins/nosTrack/CMakeLists.txt b/Plugins/nosTrack/CMakeLists.txt
index 26c05e2b..af2df47c 100644
--- a/Plugins/nosTrack/CMakeLists.txt
+++ b/Plugins/nosTrack/CMakeLists.txt
@@ -1,6 +1,6 @@
 # Copyright MediaZ Teknoloji A.S. All Rights Reserved.
 
-set(MODULE_DEPENDENCIES "nos.sys.track-1.0")
+set(MODULE_DEPENDENCIES "nos.sys.track-1.1")
 set(dep_idx 0)
 foreach(module_name_version ${MODULE_DEPENDENCIES})
     # module_name_version: <MODULE_NAME>-<MODULE_VERSION>
@@ -13,4 +13,7 @@ endforeach()
 
 list(APPEND MODULE_DEPENDENCIES_TARGETS ${NOS_PLUGIN_SDK_TARGET})
 
+nos_generate_flatbuffers("${CMAKE_CURRENT_SOURCE_DIR}/Config" "${CMAKE_CURRENT_SOURCE_DIR}/Source" "cpp" "" nosTrack_generated)
+list(APPEND MODULE_DEPENDENCIES_TARGETS nosTrack_generated)
+
 nos_add_plugin("nosTrack" "${MODULE_DEPENDENCIES_TARGETS}" "${CMAKE_CURRENT_LIST_DIR}/External/asio/asio/include")
diff --git a/Plugins/nosTrack/Config/ConvertTransform.nosdef b/Plugins/nosTrack/Config/ConvertTransform.nosdef
new file mode 100644
index 00000000..aea8e1b7
--- /dev/null
+++ b/Plugins/nosTrack/Config/ConvertTransform.nosdef
@@ -0,0 +1,56 @@
+{
+	"nodes": [
+		{
+			"class_name": "ConvertTransform",
+			"menu_info": {
+				"category": "Track|Coordinate System",
+				"display_name": "Convert Transform"
+			},
+			"node": {
+				"class_name": "ConvertTransform",
+				"contents_type": "Job",
+				"description": "Converts a Transform between coordinate frames.\nThe Source and Target enums select axis assignments, handedness, and the Euler convention used for the rotation field.\nPosition: basis-changed (Source -> Target), then multiplied by WorldScale (e.g. 0.01 for cm -> m, 100 for m -> cm).\nRotation: built in the source Euler convention, conjugated by the basis-change matrix, re-extracted in the target convention.\nScale: axis factors are reordered to follow the basis change.",
+				"pins": [
+					{
+						"name": "In",
+						"type_name": "nos.fb.Transform",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					},
+					{
+						"name": "SourceFrame",
+						"display_name": "Source Frame",
+						"type_name": "nos.sys.track.CoordinateFrame",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "LH_ZUp_FwdX_RightY",
+						"description": "Coordinate system convention of the input Transform."
+					},
+					{
+						"name": "TargetFrame",
+						"display_name": "Target Frame",
+						"type_name": "nos.sys.track.CoordinateFrame",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "RH_YUp_FwdNegZ_RightX",
+						"description": "Coordinate system convention of the output Transform."
+					},
+					{
+						"name": "WorldScale",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 1.0,
+						"description": "Uniform scale applied only to the output position after the basis change. Use to convert linear units (e.g. 0.01 for cm -> m, 100 for m -> cm). Does not affect rotation or the Transform's own scale."
+					},
+					{
+						"name": "Out",
+						"type_name": "nos.fb.Transform",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_OR_PROPERTY"
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosTrack/Config/PlaybackMode.fbs b/Plugins/nosTrack/Config/PlaybackMode.fbs
new file mode 100644
index 00000000..c0d1d952
--- /dev/null
+++ b/Plugins/nosTrack/Config/PlaybackMode.fbs
@@ -0,0 +1,9 @@
+namespace nos.track;
+
+// Selects how PlaybackTrackCOLMAP indexes into the recorded frames (type of the node's "Mode" pin).
+enum PlaybackTrackMode : uint
+{
+    FrameIndex = 0,  // Use the InFrameIndex pin as a 0-based offset. Default value of the Mode pin.
+    Timecode = 1,    // Look up by Timecode string from timecodes.txt.
+    FrameNumber = 2, // Look up by FrameNumber column from timecodes.txt.
+}
diff --git a/Plugins/nosTrack/Config/PlaybackTrackCOLMAP.nosdef b/Plugins/nosTrack/Config/PlaybackTrackCOLMAP.nosdef
new file mode 100644
index 00000000..7f1604f2
--- /dev/null
+++ b/Plugins/nosTrack/Config/PlaybackTrackCOLMAP.nosdef
@@ -0,0 +1,107 @@
+{
+	"nodes": [
+		{
+			"class_name": "PlaybackTrackCOLMAP",
+			"menu_info": {
+				"category": "nosTrack",
+				"display_name": "Playback Track (COLMAP)",
+				"name_aliases": [ "colmap", "import camera", "playback camera" ]
+			},
+			"node": {
+				"class_name": "PlaybackTrackCOLMAP",
+				"display_name": "Playback Track (COLMAP)",
+				"contents_type": "Job",
+				"always_execute": true,
+				"description": "Loads camera track from COLMAP-spec cameras.txt + images.txt.\nReads world-to-camera poses in the COLMAP frame (RH, +X right, +Y down, +Z forward) and converts to the chosen TargetFrame.\nWhen an extras.txt sidecar is present, original Euler/FOV/sensor metadata is restored verbatim (no quaternion round-trip drift).",
+				"pins": [
+					{
+						"name": "InputDirectory",
+						"display_name": "Input Directory",
+						"type_name": "string",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"visualizer": { "type": "FOLDER_PICKER" },
+						"description": "Directory with cameras.txt + images.txt (and optional timecodes.txt / extras.txt sidecars)."
+					},
+					{
+						"name": "TargetFrame",
+						"display_name": "Target Frame",
+						"type_name": "nos.sys.track.CoordinateFrame",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "LH_ZUp_FwdX_RightY",
+						"description": "Coordinate frame of the produced Track.\nCOLMAP poses are converted into this frame.\nDefault matches FreeD / UE convention."
+					},
+					{
+						"name": "Mode",
+						"display_name": "Mode",
+						"type_name": "nos.track.PlaybackTrackMode",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "FrameIndex",
+						"description": "Selects how to index frames.\nFrameIndex uses InFrameIndex.\nTimecode / FrameNumber look up via timecodes.txt sidecar.\nThe unused index pin becomes PASSIVE."
+					},
+					{
+						"name": "InFrameIndex",
+						"display_name": "Frame Index",
+						"type_name": "uint",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0,
+						"description": "0-based frame index. Used when Mode=FrameIndex."
+					},
+					{
+						"name": "InTimecode",
+						"display_name": "Timecode",
+						"type_name": "string",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"description": "Timecode string (HH:MM:SS:FF) to look up. Used when Mode=Timecode. Requires timecodes.txt."
+					},
+					{
+						"name": "InFrameNumber",
+						"display_name": "Frame Number",
+						"type_name": "uint",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0,
+						"description": "Absolute frame number to look up. Used when Mode=FrameNumber. Requires timecodes.txt."
+					},
+					{
+						"name": "OutFrameIndex",
+						"display_name": "Frame Index",
+						"type_name": "uint",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"data": 0,
+						"description": "Current playback frame index."
+					},
+					{
+						"name": "FrameCount",
+						"display_name": "Frame Count",
+						"type_name": "uint",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"data": 0,
+						"description": "Total frames loaded."
+					},
+					{
+						"name": "Track",
+						"type_name": "nos.sys.track.Track",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"description": "Track for the current frame, expressed in the TargetFrame convention."
+					}
+				],
+				"functions": [
+					{
+						"class_name": "PlaybackTrackCOLMAP_OpenFolder",
+						"display_name": "Open Folder",
+						"contents_type": "Job",
+						"pins": []
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosTrack/Config/RecordTrackCOLMAP.nosdef b/Plugins/nosTrack/Config/RecordTrackCOLMAP.nosdef
new file mode 100644
index 00000000..c26f52cb
--- /dev/null
+++ b/Plugins/nosTrack/Config/RecordTrackCOLMAP.nosdef
@@ -0,0 +1,120 @@
+{
+	"nodes": [
+		{
+			"class_name": "RecordTrackCOLMAP",
+			"menu_info": {
+				"category": "nosTrack",
+				"display_name": "Record Track (COLMAP)",
+				"name_aliases": [ "colmap", "export camera", "record camera" ]
+			},
+			"node": {
+				"class_name": "RecordTrackCOLMAP",
+				"display_name": "Record Track (COLMAP)",
+				"contents_type": "Job",
+				"always_execute": true,
+				"description": "Records camera track data each frame while Record is true.\nOn falling edge (after MinOffFrames debounce) writes COLMAP-spec cameras.txt + images.txt and clears the buffer.\nIntrinsics come from FOV/sensor/distortion. Extrinsics are written as world-to-camera in the COLMAP frame (RH, +X right, +Y down, +Z forward).\nSet SourceFrame to match the convention of the connected Track.",
+				"pins": [
+					{
+						"name": "Timecode",
+						"display_name": "Timecode",
+						"type_name": "string",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"description": "Optional SMPTE timecode (HH:MM:SS:FF). Written to timecodes.txt sidecar when non-empty."
+					},
+					{
+						"name": "FrameNumber",
+						"display_name": "Frame Number",
+						"type_name": "uint",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 0,
+						"description": "Optional absolute frame number paired with Timecode. Written to timecodes.txt sidecar."
+					},
+					{
+						"name": "OutputDirectory",
+						"display_name": "Output Directory",
+						"type_name": "string",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"visualizer": { "type": "FOLDER_PICKER" },
+						"description": "Where cameras.txt and images.txt are written when recording stops. Must be empty to start recording."
+					},
+					{
+						"name": "ImageResolution",
+						"display_name": "Image Resolution",
+						"type_name": "nos.fb.vec2u",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": {
+							"x": 1920,
+							"y": 1080
+						},
+						"description": "Image WIDTH/HEIGHT in pixels. Used to compute focal length and principal point for cameras.txt."
+					},
+					{
+						"name": "SourceFrame",
+						"display_name": "Source Frame",
+						"type_name": "nos.sys.track.CoordinateFrame",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "LH_ZUp_FwdX_RightY",
+						"description": "Coordinate frame of the connected Track.\nUsed to convert location and rotation into the COLMAP frame before writing.\nDefault matches FreeD / UE convention."
+					},
+					{
+						"name": "Record",
+						"type_name": "bool",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": false,
+						"description": "Drives recording.\nRising edge: clear buffer and start.\nFalling edge (after MinOffFrames): stop and write files.\nFails to start if OutputDirectory is non-empty."
+					},
+					{
+						"name": "MinOffFrames",
+						"display_name": "Min Off Frames",
+						"type_name": "uint",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 1,
+						"min": "1",
+						"description": "Debounce: minimum consecutive Record=false frames before stopping. Default 1 = stop immediately. Use 5-15 to ride out short upstream glitches (e.g. SDI bit flips on a camera-derived flag)."
+					},
+					{
+						"name": "RecordingFrame",
+						"display_name": "Recording Frame",
+						"type_name": "uint",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"data": 0,
+						"description": "Current recording frame index. 0 when not recording."
+					},
+					{
+						"name": "FrameCount",
+						"display_name": "Frame Count",
+						"type_name": "uint",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"data": 0,
+						"description": "Frames in the buffer."
+					},
+					{
+						"name": "InTrack",
+						"display_name": "Track",
+						"type_name": "nos.sys.track.Track",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"description": "Camera track to record. Interpreted in the SourceFrame convention (location, rotation Euler, FOV, sensor, lens distortion)."
+					},
+					{
+						"name": "OutTrack",
+						"display_name": "Track",
+						"type_name": "nos.sys.track.Track",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"description": "Pass-through of InTrack."
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosTrack/Config/TrackTransform.nosdef b/Plugins/nosTrack/Config/TrackTransform.nosdef
new file mode 100644
index 00000000..cb198734
--- /dev/null
+++ b/Plugins/nosTrack/Config/TrackTransform.nosdef
@@ -0,0 +1,54 @@
+{
+	"nodes": [
+		{
+			"class_name": "TrackTransform",
+			"menu_info": {
+				"category": "Track|Coordinate System",
+				"display_name": "Track Transform"
+			},
+			"node": {
+				"class_name": "TrackTransform",
+				"contents_type": "Job",
+				"description": "Transforms a Track between coordinate frames.\nThe Source and Target enums select axis assignments, handedness, and the Euler convention used for the rotation field.\nLocation: basis-changed (Source -> Target), then multiplied by WorldScale (e.g. 0.01 for cm -> m, 100 for m -> cm).\nRotation: built in the source Euler convention, conjugated by the basis-change matrix, re-extracted in the target convention.\nOther Track fields (fov, focus, sensor_size, lens_distortion, ...) pass through unchanged.",
+				"pins": [
+					{
+						"name": "In",
+						"type_name": "nos.sys.track.Track",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					},
+					{
+						"name": "Source",
+						"type_name": "nos.sys.track.CoordinateFrame",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "LH_ZUp_FwdX_RightY",
+						"description": "Coordinate system convention of the input Track."
+					},
+					{
+						"name": "Target",
+						"type_name": "nos.sys.track.CoordinateFrame",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "RH_YUp_FwdNegZ_RightX",
+						"description": "Coordinate system convention of the output Track."
+					},
+					{
+						"name": "WorldScale",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 1.0,
+						"description": "Uniform scale applied only to the output location after the basis change. Use to convert linear units (e.g. 0.01 for cm -> m, 100 for m -> cm). Does not affect rotation, fov, sensor size, focus, or lens distortion."
+					},
+					{
+						"name": "Out",
+						"type_name": "nos.sys.track.Track",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_OR_PROPERTY"
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosTrack/Source/ConvertTransform.cpp b/Plugins/nosTrack/Source/ConvertTransform.cpp
new file mode 100644
index 00000000..463a9666
--- /dev/null
+++ b/Plugins/nosTrack/Source/ConvertTransform.cpp
@@ -0,0 +1,59 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/Helpers.hpp>
+#include <Builtins_generated.h>
+#include <glm/glm.hpp>
+
+#include <cmath>
+
+#include <nosSysTrack/CoordinateFrameConv.h>
+
+namespace nos::track
+{
+
+void RegisterConvertTransform(nosNodeFunctions* funcs)
+{
+	funcs->ClassName = NOS_NAME("ConvertTransform");
+	funcs->ExecuteNode = [](void*, nosNodeExecuteParams* params) {
+		auto pinData = GetPinValues(params);
+		auto pinIds = GetPinIds(params);
+
+		// nos.fb.Transform is a struct type, so the "In" pin data is read directly as the struct's bytes.
+		auto* input = static_cast<nos::fb::Transform*>(pinData[NOS_NAME("In")]);
+		auto srcFrame = *static_cast<convention::Frame*>(pinData[NOS_NAME("SourceFrame")]);
+		auto dstFrame = *static_cast<convention::Frame*>(pinData[NOS_NAME("TargetFrame")]);
+		const double unitScale = *static_cast<float*>(pinData[NOS_NAME("WorldScale")]);
+
+		const glm::dmat3 srcBasis = convention::BasisMatrix(srcFrame);
+		const glm::dmat3 dstBasis = convention::BasisMatrix(dstFrame);
+		const glm::dmat3 toTarget = dstBasis * glm::inverse(srcBasis);
+
+		// Position: re-express in the target basis, then apply the uniform WorldScale (unit conversion).
+		const auto& inPos = input->position();
+		const glm::dvec3 posOut = toTarget * glm::dvec3(inPos.x(), inPos.y(), inPos.z()) * unitScale;
+
+		// Rotation: assemble the matrix with the source Euler convention, conjugate it by the basis change
+		// (toTarget is orthogonal, so its transpose is its inverse) and read the angles back for the target.
+		const auto& inRot = input->rotation();
+		const glm::dmat3 rotSrc = convention::EulerToMat(srcFrame, glm::dvec3(inRot.x(), inRot.y(), inRot.z()));
+		glm::dmat3 rotDst = toTarget * rotSrc * glm::transpose(toTarget);
+		const glm::dvec3 rotOut = convention::MatToEuler(dstFrame, rotDst);
+
+		// Scale: toTarget is a signed axis permutation, so its element-wise absolute value only reorders the factors.
+		const auto& inScale = input->scale();
+		glm::dmat3 axisShuffle(0.0);
+		for (int col = 0; col < 3; ++col)
+			for (int row = 0; row < 3; ++row)
+				axisShuffle[col][row] = std::abs(toTarget[col][row]);
+		const glm::dvec3 scaleOut = axisShuffle * glm::dvec3(inScale.x(), inScale.y(), inScale.z());
+
+		nos::fb::Transform converted(
+			nos::fb::vec3d(posOut.x, posOut.y, posOut.z),
+			nos::fb::vec3d(rotOut.x, rotOut.y, rotOut.z),
+			nos::fb::vec3d(scaleOut.x, scaleOut.y, scaleOut.z));
+
+		return nosEngine.SetPinValue(pinIds[NOS_NAME("Out")], nos::Buffer::From(converted));
+	};
+}
+
+}  // namespace nos::track
diff --git a/Plugins/nosTrack/Source/PlaybackTrackCOLMAP.cpp b/Plugins/nosTrack/Source/PlaybackTrackCOLMAP.cpp
new file mode 100644
index 00000000..b72e8ea6
--- /dev/null
+++ b/Plugins/nosTrack/Source/PlaybackTrackCOLMAP.cpp
@@ -0,0 +1,568 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/PluginHelpers.hpp>
+#include "nosSysTrack/Track_generated.h"
+#include "PlaybackMode_generated.h"
+
+#include <glm/glm.hpp>
+#include <glm/gtc/quaternion.hpp>
+
+#include <fstream>
+#include <filesystem>
+#include <vector>
+#include <cmath>
+#include <sstream>
+#include <string>
+#include <algorithm>
+#include <unordered_map>
+
+#include <nosSysTrack/CoordinateFrameConv.h>
+
+namespace nos::track
+{
+
+// Pin names of the PlaybackTrackCOLMAP node. Each one is registered under a
+// Playback_-prefixed identifier and referenced below as NSN_Playback_<Pin>.
+NOS_REGISTER_NAME_SPACED(Playback_InputDirectory, "InputDirectory");
+NOS_REGISTER_NAME_SPACED(Playback_TargetFrame, "TargetFrame");
+NOS_REGISTER_NAME_SPACED(Playback_Mode, "Mode");
+NOS_REGISTER_NAME_SPACED(Playback_InFrameIndex, "InFrameIndex");
+NOS_REGISTER_NAME_SPACED(Playback_InTimecode, "InTimecode");
+NOS_REGISTER_NAME_SPACED(Playback_InFrameNumber, "InFrameNumber");
+NOS_REGISTER_NAME_SPACED(Playback_OutFrameIndex, "OutFrameIndex");
+NOS_REGISTER_NAME_SPACED(Playback_FrameCount, "FrameCount");
+
+// NOTE(review): presumably pairs with the "PlaybackTrackCOLMAP_OpenFolder"
+// function name exposed by GetFunctions -- confirm against the node definition.
+NOS_REGISTER_NAME(PlaybackTrackCOLMAP_OpenFolder);
+
+// One camera row as read from cameras.txt by ParseCamerasTxt.
+struct COLMAPCamera
+{
+	uint32_t Id{0};
+	std::string Model;
+	uint32_t Width{0};
+	uint32_t Height{0};
+	// Focal lengths and principal point, as stored in the PARAMS columns.
+	float Fx{0.0f};
+	float Fy{0.0f};
+	float Cx{0.0f};
+	float Cy{0.0f};
+	// Distortion coefficients; stay zero for models that do not carry them.
+	float K1{0.0f};
+	float K2{0.0f};
+	float P1{0.0f};
+	float P2{0.0f};
+};
+
+// One pose row as read from the first line of an images.txt record.
+struct COLMAPImage
+{
+	uint32_t Id{0};
+	// R_w2c in COLMAP camera frame.
+	glm::quat Q{1, 0, 0, 0};
+	// t = -R_w2c * camera_world_position (COLMAP world frame).
+	glm::vec3 T{0};
+	uint32_t CameraId{0};
+};
+
+// One row of the timecodes.txt sidecar; Timecode is empty when the file stored "-".
+struct TimecodeEntry
+{
+	std::string Timecode;
+	uint32_t FrameNumber{0};
+};
+
+// One row of the extras.txt sidecar. Present is only set for rows that
+// parsed completely; default-constructed entries mark "no extras for this image".
+struct ExtrasEntry
+{
+	bool Present{false};
+	float Zoom{0.0f};
+	float Focus{0.0f};
+	float FocusDistance{0.0f};
+	float RenderRatio{0.0f};
+	float NodalOffset{0.0f};
+	float DistortionScale{0.0f};
+	float SensorWmm{0.0f};
+	float SensorHmm{0.0f};
+	float RotX{0.0f};
+	float RotY{0.0f};
+	float RotZ{0.0f};
+};
+
+struct PlaybackTrackCOLMAPContext : NodeContext
+{
+	// Value of the InputDirectory pin; LoadFromDirectory reads cameras.txt and
+	// images.txt (plus optional sidecars) from here.
+	std::string InputDir;
+	// Value of the TargetFrame pin; poses are converted into this convention on load.
+	convention::Frame TargetFrame = convention::Frame::LH_ZUp_FwdX_RightY;
+	// Value of the Mode pin; selects which input ResolveFrameIndex uses.
+	PlaybackTrackMode Mode = PlaybackTrackMode::FrameIndex;
+	// Latest values of the InFrameIndex / InTimecode / InFrameNumber pins.
+	uint32_t FrameIndex = 0;
+	std::string InTimecode;
+	uint32_t InFrameNumber = 0;
+	// Non-empty when the last load failed; UpdateStatus reports it as FAILURE.
+	std::string LastError;
+	// One Track per image, in ascending image-id order (ParseImagesTxt sorts by id).
+	std::vector<sys::track::TTrack> Frames;
+	std::vector<TimecodeEntry> Timecodes; // empty or same size as Frames
+	// Lookups from timecode string / frame number to an index into Frames,
+	// filled by ParseTimecodesTxt.
+	std::unordered_map<std::string, uint32_t> TimecodeToIndex;
+	std::unordered_map<uint32_t, uint32_t> FrameNumberToIndex;
+	// Index of the frame most recently output; mirrored to the OutFrameIndex pin.
+	uint32_t CurrentFrame = 0;
+
+	// Feeds every pin value stored in the node definition through
+	// OnPinValueChanged so the context starts in sync with the serialized
+	// pins, then refreshes the mode-dependent orphan states and the status.
+	PlaybackTrackCOLMAPContext(nosFbNodePtr node) : NodeContext(node)
+	{
+		if (const auto* storedPins = node->pins())
+		{
+			for (auto* storedPin : *storedPins)
+			{
+				auto storedName = nos::Name(storedPin->name()->c_str());
+				if (!flatbuffers::IsFieldPresent(storedPin, fb::Pin::VT_DATA))
+					continue;
+				const auto* bytes = storedPin->data();
+				nosBuffer stored = {.Data = (void*)bytes->data(), .Size = bytes->size()};
+				OnPinValueChanged(storedName, *storedPin->id(), stored);
+			}
+		}
+		ApplyModeOrphanStates();
+		UpdateStatus();
+	}
+
+	// Caches the new pin value. A change of InputDirectory or TargetFrame
+	// triggers a reload (when a directory is set); a change of Mode refreshes
+	// which of the three index inputs is active.
+	void OnPinValueChanged(nos::Name pinName, uuid const& pinId, nosBuffer val) override
+	{
+		if (pinName == NSN_Playback_InputDirectory)
+		{
+			InputDir = InterpretPinValue<const char>(val.Data);
+			LastError.clear();
+			if (InputDir.empty())
+				UpdateStatus();
+			else
+				LoadFromDirectory();
+			return;
+		}
+		if (pinName == NSN_Playback_TargetFrame)
+		{
+			TargetFrame = *static_cast<const convention::Frame*>(val.Data);
+			if (!InputDir.empty())
+				LoadFromDirectory();
+			return;
+		}
+		if (pinName == NSN_Playback_Mode)
+		{
+			Mode = *static_cast<const PlaybackTrackMode*>(val.Data);
+			ApplyModeOrphanStates();
+			return;
+		}
+		if (pinName == NSN_Playback_InFrameIndex)
+		{
+			FrameIndex = *static_cast<const uint32_t*>(val.Data);
+			return;
+		}
+		if (pinName == NSN_Playback_InTimecode)
+		{
+			InTimecode = InterpretPinValue<const char>(val.Data);
+			return;
+		}
+		if (pinName == NSN_Playback_InFrameNumber)
+			InFrameNumber = *static_cast<const uint32_t*>(val.Data);
+	}
+
+	// Marks the index input that matches the current Mode as ACTIVE and the
+	// other two as PASSIVE.
+	void ApplyModeOrphanStates()
+	{
+		const auto orphanStateFor = [this](PlaybackTrackMode wanted) {
+			if (Mode == wanted)
+				return fb::PinOrphanStateType::ACTIVE;
+			return fb::PinOrphanStateType::PASSIVE;
+		};
+		SetPinOrphanState(NSN_Playback_InFrameIndex, orphanStateFor(PlaybackTrackMode::FrameIndex));
+		SetPinOrphanState(NSN_Playback_InTimecode, orphanStateFor(PlaybackTrackMode::Timecode));
+		SetPinOrphanState(NSN_Playback_InFrameNumber, orphanStateFor(PlaybackTrackMode::FrameNumber));
+	}
+
+	// Publishes the number of loaded frames on the FrameCount pin.
+	void UpdateFrameCountPin()
+	{
+		auto loadedFrames = static_cast<uint32_t>(Frames.size());
+		nosBuffer payload{.Data = &loadedFrames, .Size = sizeof(loadedFrames)};
+		SetPinValue(NSN_Playback_FrameCount, payload);
+	}
+
+	// Publishes CurrentFrame on the OutFrameIndex pin.
+	void UpdateFrameIndexPin()
+	{
+		nosBuffer payload{.Data = &CurrentFrame, .Size = sizeof(CurrentFrame)};
+		SetPinValue(NSN_Playback_OutFrameIndex, payload);
+	}
+
+	void UpdateStatus()
+	{
+		if (!LastError.empty())
+			SetNodeStatusMessage(LastError, fb::NodeStatusMessageType::FAILURE);
+		else if (InputDir.empty())
+			SetNodeStatusMessage("Set input directory", fb::NodeStatusMessageType::WARNING);
+		else if (Frames.empty())
+			SetNodeStatusMessage("No data loaded", fb::NodeStatusMessageType::WARNING);
+		else
+			SetNodeStatusMessage("Loaded (" + std::to_string(Frames.size()) + " frames)", fb::NodeStatusMessageType::INFO);
+	}
+
+	// --- Parsing ---
+
+	// Loads cameras.txt / images.txt (plus the optional timecodes.txt and
+	// extras.txt sidecars) from InputDir and rebuilds Frames in TargetFrame.
+	//
+	// Returns false, with LastError set and the status refreshed, when the
+	// directory is unset, a required file is missing or cannot be opened, or
+	// images.txt yields no images. All of those checks run before any state is
+	// cleared, so a failed load leaves the previously loaded frames in place.
+	bool LoadFromDirectory()
+	{
+		if (InputDir.empty())
+		{
+			LastError = "Set input directory";
+			UpdateStatus();
+			return false;
+		}
+
+		std::filesystem::path dir = nos::Utf8ToPath(InputDir);
+		auto camerasPath = dir / "cameras.txt";
+		auto imagesPath = dir / "images.txt";
+
+		if (!std::filesystem::exists(camerasPath))
+		{
+			LastError = "cameras.txt not found";
+			UpdateStatus();
+			return false;
+		}
+		if (!std::filesystem::exists(imagesPath))
+		{
+			LastError = "images.txt not found";
+			UpdateStatus();
+			return false;
+		}
+
+		std::unordered_map<uint32_t, COLMAPCamera> cameras;
+		if (!ParseCamerasTxt(camerasPath, cameras))
+			return false;
+
+		std::vector<COLMAPImage> images;
+		if (!ParseImagesTxt(imagesPath, images))
+			return false;
+
+		if (images.empty())
+		{
+			LastError = "No images found in images.txt";
+			UpdateStatus();
+			return false;
+		}
+
+		Frames.clear();
+		Frames.reserve(images.size());
+		Timecodes.clear();
+		// The lookup tables are otherwise only rebuilt by ParseTimecodesTxt. Drop
+		// them here so a directory without timecodes.txt cannot resolve against
+		// indices left over from a previously loaded (possibly longer) recording.
+		TimecodeToIndex.clear();
+		FrameNumberToIndex.clear();
+
+		auto timecodesPath = dir / "timecodes.txt";
+		if (std::filesystem::exists(timecodesPath))
+			ParseTimecodesTxt(timecodesPath, images.size());
+
+		std::vector<ExtrasEntry> extras;
+		auto extrasPath = dir / "extras.txt";
+		if (std::filesystem::exists(extrasPath))
+			ParseExtrasTxt(extrasPath, images.size(), extras);
+
+		// Inverse of RecordTrackCOLMAP::WriteImagesTxt:
+		//   images.txt holds R_w2c in COLMAP frame, t = -R_w2c * pos_colmap.
+		//   pos_colmap = -R_c2w_colmap * t   (R_c2w_colmap = R_w2c^T)
+		//   pos_target = M^-1 * pos_colmap
+		//   R_c2w_target = M^-1 * R_c2w_colmap * M
+		//   Track.rotation = MatToEuler(TargetFrame, R_c2w_target)
+		const glm::dmat3 Minv = convention::BasisChangeFromColmap(TargetFrame);
+		const glm::dmat3 M = glm::inverse(Minv);
+
+		for (size_t i = 0; i < images.size(); ++i)
+		{
+			auto& img = images[i];
+			sys::track::TTrack trackData{};
+			auto camIt = cameras.find(img.CameraId);
+			// Sidecars are matched by position: entry i belongs to IMAGE_ID i + 1.
+			const ExtrasEntry* ex = (i < extras.size() && extras[i].Present) ? &extras[i] : nullptr;
+
+			glm::dmat3 R_w2c = glm::dmat3(glm::mat3_cast(img.Q));
+			glm::dmat3 R_c2w_colmap = glm::transpose(R_w2c);
+			glm::dvec3 pos_colmap = -R_c2w_colmap * glm::dvec3(img.T);
+
+			glm::dvec3 pos_target = Minv * pos_colmap;
+			glm::vec3 locF((float)pos_target.x, (float)pos_target.y, (float)pos_target.z);
+			trackData.location = reinterpret_cast<nos::fb::vec3&>(locF);
+
+			// Rotation: prefer the original Euler from extras (avoids quaternion-
+			// to-Euler ambiguity near gimbal lock); fall back to extracting from
+			// the COLMAP rotation matrix when no extras sidecar exists.
+			if (ex)
+			{
+				glm::vec3 euler(ex->RotX, ex->RotY, ex->RotZ);
+				trackData.rotation = reinterpret_cast<nos::fb::vec3&>(euler);
+			}
+			else
+			{
+				glm::dmat3 R_c2w_target = Minv * R_c2w_colmap * M;
+				glm::dvec3 eulerD = convention::MatToEuler(TargetFrame, R_c2w_target);
+				glm::vec3 eulerF((float)eulerD.x, (float)eulerD.y, (float)eulerD.z);
+				trackData.rotation = reinterpret_cast<nos::fb::vec3&>(eulerF);
+			}
+
+			if (camIt != cameras.end())
+			{
+				auto& cam = camIt->second;
+				if (cam.Fx > 0)
+					trackData.fov = glm::degrees(2.0f * std::atan(cam.Width * 0.5f / cam.Fx));
+				if (cam.Fx > 0 && cam.Fy > 0)
+					trackData.pixel_aspect_ratio = cam.Fx / cam.Fy;
+				trackData.lens_distortion.mutable_k1k2() = nos::fb::vec2(cam.K1, cam.K2);
+
+				// sensor_size: COLMAP only stores pixel dims, but Track expects mm.
+				// Use the extras value when present; otherwise fall back to pixels
+				// (matches pre-extras behaviour).
+				glm::vec2 sensorMm(0);
+				if (ex && ex->SensorWmm > 0 && ex->SensorHmm > 0)
+				{
+					sensorMm = {ex->SensorWmm, ex->SensorHmm};
+					trackData.sensor_size = nos::fb::vec2(sensorMm.x, sensorMm.y);
+				}
+				else
+				{
+					trackData.sensor_size = nos::fb::vec2(cam.Width, cam.Height);
+				}
+
+				// center_shift: invert the (cx, cy) encoding written by record.
+				// Needs sensor_size in mm to be meaningful, so only reconstructed
+				// when extras provided it.
+				if (sensorMm.x > 0 && cam.Width > 0 && sensorMm.y > 0 && cam.Height > 0)
+				{
+					glm::vec2 shift{
+						(cam.Cx - cam.Width * 0.5f) * sensorMm.x / cam.Width,
+						(cam.Cy - cam.Height * 0.5f) * sensorMm.y / cam.Height};
+					trackData.lens_distortion.mutable_center_shift() = reinterpret_cast<nos::fb::vec2&>(shift);
+				}
+			}
+
+			if (ex)
+			{
+				trackData.zoom = ex->Zoom;
+				trackData.focus = ex->Focus;
+				trackData.focus_distance = ex->FocusDistance;
+				trackData.render_ratio = ex->RenderRatio;
+				trackData.nodal_offset = ex->NodalOffset;
+				trackData.lens_distortion.mutate_distortion_scale(ex->DistortionScale);
+			}
+
+			Frames.push_back(std::move(trackData));
+		}
+
+		CurrentFrame = 0;
+		LastError.clear();
+		UpdateFrameCountPin();
+		UpdateFrameIndexPin();
+		UpdateStatus();
+		nosEngine.LogI("PlaybackTrackCOLMAP: Loaded %zu frames from %s", Frames.size(), InputDir.c_str());
+		return true;
+	}
+
+	// Parses a COLMAP cameras.txt into `cameras`, keyed by CAMERA_ID.
+	//
+	// Supported models: OPENCV, PINHOLE, SIMPLE_PINHOLE, SIMPLE_RADIAL and
+	// RADIAL. Any other model is logged and read as if it were PINHOLE.
+	// Comment lines (leading '#') and blank lines are ignored; a line whose
+	// CAMERA_ID / MODEL / WIDTH / HEIGHT columns do not parse is logged and
+	// skipped instead of being stored as a bogus camera.
+	//
+	// Returns false (with LastError set) only when the file cannot be opened.
+	bool ParseCamerasTxt(const std::filesystem::path& path, std::unordered_map<uint32_t, COLMAPCamera>& cameras)
+	{
+		std::ifstream file(path);
+		if (!file.is_open())
+		{
+			LastError = "Cannot open cameras.txt";
+			UpdateStatus();
+			return false;
+		}
+
+		std::string line;
+		while (std::getline(file, line))
+		{
+			// Also treats whitespace-only lines (e.g. a lone '\r' from CRLF files) as blank.
+			if (line.find_first_not_of(" \t\r\n") == std::string::npos || line[0] == '#')
+				continue;
+			std::istringstream ss(line);
+			COLMAPCamera cam;
+			ss >> cam.Id >> cam.Model >> cam.Width >> cam.Height;
+			if (ss.fail())
+			{
+				nosEngine.LogW("PlaybackTrackCOLMAP: Skipping malformed cameras.txt line: %s", line.c_str());
+				continue;
+			}
+			if (cam.Model == "OPENCV")
+				ss >> cam.Fx >> cam.Fy >> cam.Cx >> cam.Cy >> cam.K1 >> cam.K2 >> cam.P1 >> cam.P2;
+			else if (cam.Model == "PINHOLE")
+				ss >> cam.Fx >> cam.Fy >> cam.Cx >> cam.Cy;
+			else if (cam.Model == "SIMPLE_PINHOLE")
+			{
+				// Single shared focal length.
+				float f = 0.0f;
+				ss >> f >> cam.Cx >> cam.Cy;
+				cam.Fx = cam.Fy = f;
+			}
+			else if (cam.Model == "SIMPLE_RADIAL")
+			{
+				float f = 0.0f;
+				ss >> f >> cam.Cx >> cam.Cy >> cam.K1;
+				cam.Fx = cam.Fy = f;
+			}
+			else if (cam.Model == "RADIAL")
+			{
+				float f = 0.0f;
+				ss >> f >> cam.Cx >> cam.Cy >> cam.K1 >> cam.K2;
+				cam.Fx = cam.Fy = f;
+			}
+			else
+			{
+				nosEngine.LogW("PlaybackTrackCOLMAP: Unsupported camera model '%s', treating as PINHOLE", cam.Model.c_str());
+				ss >> cam.Fx >> cam.Fy >> cam.Cx >> cam.Cy;
+			}
+			cameras[cam.Id] = cam;
+		}
+		return true;
+	}
+
+	// Parses a COLMAP images.txt into `images`, sorted by ascending IMAGE_ID.
+	//
+	// Each record is two lines: the pose line
+	// (IMAGE_ID QW QX QY QZ TX TY TZ CAMERA_ID NAME) followed by a POINTS2D
+	// line that is read and discarded. Comment lines (leading '#') and blank
+	// lines between records are ignored. A pose line whose numeric columns do
+	// not parse is logged and dropped rather than stored as a garbage pose; the
+	// NAME column is not used and therefore not required.
+	//
+	// Returns false (with LastError set) only when the file cannot be opened.
+	bool ParseImagesTxt(const std::filesystem::path& path, std::vector<COLMAPImage>& images)
+	{
+		std::ifstream file(path);
+		if (!file.is_open())
+		{
+			LastError = "Cannot open images.txt";
+			UpdateStatus();
+			return false;
+		}
+
+		std::string line;
+		while (std::getline(file, line))
+		{
+			// Also treats whitespace-only lines (e.g. a lone '\r' from CRLF files) as blank.
+			if (line.find_first_not_of(" \t\r\n") == std::string::npos || line[0] == '#')
+				continue;
+			std::istringstream ss(line);
+			COLMAPImage img;
+			float qw = 0.0f, qx = 0.0f, qy = 0.0f, qz = 0.0f;
+			ss >> img.Id >> qw >> qx >> qy >> qz
+			   >> img.T.x >> img.T.y >> img.T.z
+			   >> img.CameraId;
+			if (ss.fail())
+			{
+				nosEngine.LogW("PlaybackTrackCOLMAP: Skipping malformed images.txt line: %s", line.c_str());
+			}
+			else
+			{
+				img.Q = glm::quat(qw, qx, qy, qz);
+				images.push_back(img);
+			}
+			// Skip POINTS2D line
+			std::getline(file, line);
+		}
+
+		std::sort(images.begin(), images.end(), [](auto& a, auto& b) { return a.Id < b.Id; });
+		return true;
+	}
+
+	// Reads the extras.txt sidecar into `outExtras`, resized to `expectedCount`.
+	// Slot i receives the row whose id is i + 1; slots with no (fully parsed)
+	// row keep a default entry with Present == false. Leaves `outExtras`
+	// untouched when the file cannot be opened.
+	void ParseExtrasTxt(const std::filesystem::path& path, size_t expectedCount, std::vector<ExtrasEntry>& outExtras)
+	{
+		std::ifstream input(path);
+		if (!input.is_open())
+			return;
+
+		std::unordered_map<uint32_t, ExtrasEntry> rowsById;
+		for (std::string row; std::getline(input, row);)
+		{
+			if (row.empty() || row[0] == '#')
+				continue;
+			std::istringstream columns(row);
+			uint32_t imageId = 0;
+			ExtrasEntry entry;
+			columns >> imageId >> entry.Zoom >> entry.Focus >> entry.FocusDistance >> entry.RenderRatio
+			        >> entry.NodalOffset >> entry.DistortionScale
+			        >> entry.SensorWmm >> entry.SensorHmm
+			        >> entry.RotX >> entry.RotY >> entry.RotZ;
+			// Incomplete rows are dropped entirely.
+			if (columns.fail())
+				continue;
+			entry.Present = true;
+			rowsById[imageId] = entry;
+		}
+
+		outExtras.assign(expectedCount, ExtrasEntry{});
+		for (size_t slot = 0; slot < expectedCount; ++slot)
+		{
+			const auto match = rowsById.find(uint32_t(slot + 1));
+			if (match != rowsById.end())
+				outExtras[slot] = match->second;
+		}
+	}
+
+	// Reads the timecodes.txt sidecar and rebuilds Timecodes, TimecodeToIndex
+	// and FrameNumberToIndex. Slot i receives the row whose id is i + 1.
+	//
+	// Only rows with all three columns (IMAGE_ID TIMECODE FRAME_NUMBER) are
+	// accepted. This also rejects the single-value delta-seconds line the
+	// recorder writes before the entries, which would otherwise be stored as a
+	// bogus entry. A TIMECODE of "-" means "no timecode" and is stored empty.
+	//
+	// Does nothing when the file cannot be opened.
+	void ParseTimecodesTxt(const std::filesystem::path& path, size_t expectedCount)
+	{
+		std::ifstream file(path);
+		if (!file.is_open())
+			return;
+		std::unordered_map<uint32_t, TimecodeEntry> byId;
+		std::string line;
+		while (std::getline(file, line))
+		{
+			if (line.empty() || line[0] == '#')
+				continue;
+			std::istringstream ss(line);
+			uint32_t id = 0;
+			TimecodeEntry e;
+			ss >> id >> e.Timecode >> e.FrameNumber;
+			if (ss.fail())
+				continue;
+			if (e.Timecode == "-")
+				e.Timecode.clear();
+			byId[id] = std::move(e);
+		}
+		Timecodes.assign(expectedCount, TimecodeEntry{});
+		TimecodeToIndex.clear();
+		FrameNumberToIndex.clear();
+		for (size_t i = 0; i < expectedCount; ++i)
+		{
+			auto it = byId.find(uint32_t(i + 1));
+			if (it == byId.end())
+				continue;
+			Timecodes[i] = it->second;
+			// emplace keeps the first index when a timecode / frame number repeats.
+			if (!Timecodes[i].Timecode.empty())
+				TimecodeToIndex.emplace(Timecodes[i].Timecode, uint32_t(i));
+			FrameNumberToIndex.emplace(Timecodes[i].FrameNumber, uint32_t(i));
+		}
+	}
+
+	// --- Execution ---
+
+	// Picks the frame to output according to Mode.
+	//
+	// Timecode / FrameNumber: looks the current input up in the matching
+	// table and fails when there is no entry (or the entry points past the
+	// loaded frames). FrameIndex (and any unknown mode): clamps FrameIndex to
+	// the last loaded frame.
+	//
+	// Returns true and writes `outIdx` (always a valid index into Frames) on
+	// success; returns false and leaves `outIdx` untouched otherwise,
+	// including when no frames are loaded.
+	bool ResolveFrameIndex(uint32_t& outIdx)
+	{
+		const uint32_t frameCount = (uint32_t)Frames.size();
+		// Guards the `frameCount - 1` clamp below against unsigned wrap-around.
+		if (frameCount == 0)
+			return false;
+
+		switch (Mode)
+		{
+		case PlaybackTrackMode::Timecode:
+		{
+			auto it = TimecodeToIndex.find(InTimecode);
+			if (it == TimecodeToIndex.end() || it->second >= frameCount)
+				return false;
+			outIdx = it->second;
+			return true;
+		}
+		case PlaybackTrackMode::FrameNumber:
+		{
+			auto it = FrameNumberToIndex.find(InFrameNumber);
+			if (it == FrameNumberToIndex.end() || it->second >= frameCount)
+				return false;
+			outIdx = it->second;
+			return true;
+		}
+		case PlaybackTrackMode::FrameIndex:
+		default:
+			outIdx = FrameIndex < frameCount ? FrameIndex : frameCount - 1;
+			return true;
+		}
+	}
+
+	// Outputs the selected frame on the Track pin. With nothing loaded a
+	// default-constructed Track is emitted instead. When the current input
+	// cannot be resolved, the previously output frame is repeated (or frame 0
+	// if that index is no longer valid).
+	nosResult ExecuteNode(nosNodeExecuteParams* params) override
+	{
+		const auto publishTrack = [this](sys::track::TTrack& track) {
+			auto packed = nos::Buffer::From(track);
+			SetPinValue(NOS_NAME("Track"), {.Data = packed.Data(), .Size = packed.Size()});
+		};
+
+		if (Frames.empty())
+		{
+			sys::track::TTrack blank{};
+			publishTrack(blank);
+			return NOS_RESULT_SUCCESS;
+		}
+
+		uint32_t selected = 0;
+		const bool resolved = ResolveFrameIndex(selected);
+		if (!resolved)
+		{
+			const bool previousStillValid = CurrentFrame < (uint32_t)Frames.size();
+			selected = previousStillValid ? CurrentFrame : 0;
+		}
+		CurrentFrame = selected;
+
+		publishTrack(Frames[selected]);
+		UpdateFrameIndexPin();
+
+		return NOS_RESULT_SUCCESS;
+	}
+
+	// Reports the node functions of this class. Always writes the function
+	// count; fills `names` / `fns` only when both arrays are provided.
+	//
+	// The single function, "PlaybackTrackCOLMAP_OpenFolder", opens InputDir in
+	// the platform file browser. It fails when InputDir is unset or does not
+	// exist; the exit status of the launched command is not checked.
+	static nosResult GetFunctions(size_t* count, nosName* names, nosPfnNodeFunctionExecute* fns)
+	{
+		*count = 1;
+		if (!names || !fns)
+			return NOS_RESULT_SUCCESS;
+
+		names[0] = NOS_NAME_STATIC("PlaybackTrackCOLMAP_OpenFolder");
+		fns[0] = [](void* ctx, nosFunctionExecuteParams*) {
+			auto* self = static_cast<PlaybackTrackCOLMAPContext*>(ctx);
+			if (self->InputDir.empty())
+			{
+				nosEngine.LogW("PlaybackTrackCOLMAP: Input directory not set");
+				return NOS_RESULT_FAILED;
+			}
+			std::filesystem::path dir = nos::Utf8ToPath(self->InputDir);
+			if (!std::filesystem::exists(dir))
+			{
+				nosEngine.LogW("PlaybackTrackCOLMAP: Directory does not exist: %s", self->InputDir.c_str());
+				return NOS_RESULT_FAILED;
+			}
+			const std::string dirUtf8 = nos::PathToUtf8(dir);
+			// TODO: Replace std::system with platform APIs (ShellExecuteW / posix_spawnp)
+#if defined(_WIN32)
+			// '"' cannot appear in a Windows path, so plain double quoting is enough here.
+			std::string cmd = "explorer \"" + dirUtf8 + "\"";
+#else
+			// std::system runs the command through the shell. Inside double quotes
+			// the shell still expands $, backticks and backslashes, so wrap the path
+			// in single quotes and spell each embedded ' as '\'' instead.
+			std::string quotedDir = "'";
+			for (const char ch : dirUtf8)
+			{
+				if (ch == '\'')
+					quotedDir += "'\\''";
+				else
+					quotedDir += ch;
+			}
+			quotedDir += "'";
+#if defined(__APPLE__)
+			std::string cmd = "open " + quotedDir;
+#else
+			std::string cmd = "xdg-open " + quotedDir;
+#endif
+#endif
+			std::system(cmd.c_str());
+			return NOS_RESULT_SUCCESS;
+		};
+
+		return NOS_RESULT_SUCCESS;
+	}
+};
+
+// Binds PlaybackTrackCOLMAPContext to the "PlaybackTrackCOLMAP" node class in `fn`.
+void RegisterPlaybackTrackCOLMAP(nosNodeFunctions* fn)
+{
+	NOS_BIND_NODE_CLASS(NOS_NAME("PlaybackTrackCOLMAP"), PlaybackTrackCOLMAPContext, fn);
+}
+
+} // namespace nos::track
diff --git a/Plugins/nosTrack/Source/RecordTrackCOLMAP.cpp b/Plugins/nosTrack/Source/RecordTrackCOLMAP.cpp
new file mode 100644
index 00000000..33305432
--- /dev/null
+++ b/Plugins/nosTrack/Source/RecordTrackCOLMAP.cpp
@@ -0,0 +1,463 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/PluginHelpers.hpp>
+#include "nosSysTrack/Track_generated.h"
+
+#include <glm/glm.hpp>
+#include <glm/gtc/quaternion.hpp>
+
+#include <fstream>
+#include <filesystem>
+#include <vector>
+#include <cmath>
+#include <iomanip>
+
+#include <nosSysTrack/CoordinateFrameConv.h>
+
+namespace nos::track
+{
+
+// Pin names of the RecordTrackCOLMAP node, referenced below as NSN_<Pin>.
+NOS_REGISTER_NAME(OutputDirectory);
+NOS_REGISTER_NAME(ImageResolution);
+NOS_REGISTER_NAME(SourceFrame);
+NOS_REGISTER_NAME(Record);
+NOS_REGISTER_NAME(MinOffFrames);
+NOS_REGISTER_NAME(FrameCount);
+NOS_REGISTER_NAME(RecordingFrame);
+
+// Snapshot of one incoming Track sample plus its timecode information,
+// buffered while recording and written out by the Write*Txt methods.
+struct RecordedFrame
+{
+	glm::vec3 Location;
+	glm::vec3 Rotation; // Euler degrees in the SourceFrame's convention.
+	float FOV; // Degrees (converted with glm::radians in ComputeFocalLengthPixels).
+	float Zoom;
+	float Focus;
+	float RenderRatio;
+	glm::vec2 SensorSize; // Written to extras.txt as SENSOR_W_MM / SENSOR_H_MM.
+	float PixelAspectRatio;
+	float NodalOffset;
+	float FocusDistance;
+	float K1;
+	float K2;
+	glm::vec2 CenterShift; // Same units as SensorSize; see WriteCamerasTxt.
+	float DistortionScale;
+	std::string Timecode; // Empty when the Timecode pin carried no data.
+	uint32_t FrameNumber;
+};
+
+struct RecordTrackCOLMAPContext : NodeContext
+{
+	// Value of the OutputDirectory pin; the files are written here when recording stops.
+	std::string OutputDir;
+	// Value of the ImageResolution pin; used as WIDTH/HEIGHT in cameras.txt.
+	nosVec2u ImageResolution = {1920, 1080};
+	// Value of the SourceFrame pin; convention of the incoming location/rotation.
+	convention::Frame SourceFrame = convention::Frame::LH_ZUp_FwdX_RightY;
+	// True between StartRecording and StopRecording.
+	bool Recording = false;
+	// Consecutive executions with Record == false while recording (stop debounce).
+	uint32_t ConsecutiveOffFrames = 0;
+	// Record pin value seen on the previous execution, for rising-edge detection.
+	bool LastRequestRecord = false;
+	// Non-empty when recording could not start; UpdateStatus reports it as FAILURE.
+	std::string LastError;
+	// Samples buffered since recording started.
+	std::vector<RecordedFrame> Frames;
+	nosVec2u DeltaSeconds{}; // {numerator, denominator}; 0/0 if not in fixed-step mode
+
+	// Feeds every pin value stored in the node definition through
+	// OnPinValueChanged so the context starts in sync with the serialized
+	// pins, then publishes the initial status message.
+	RecordTrackCOLMAPContext(nosFbNodePtr node) : NodeContext(node)
+	{
+		if (const auto* storedPins = node->pins())
+		{
+			for (auto* storedPin : *storedPins)
+			{
+				auto storedName = nos::Name(storedPin->name()->c_str());
+				if (!flatbuffers::IsFieldPresent(storedPin, fb::Pin::VT_DATA))
+					continue;
+				const auto* bytes = storedPin->data();
+				nosBuffer stored = {.Data = (void*)bytes->data(), .Size = bytes->size()};
+				OnPinValueChanged(storedName, *storedPin->id(), stored);
+			}
+		}
+		UpdateStatus();
+	}
+
+	// Begins a new recording with an empty frame buffer. Returns false, with
+	// LastError set, when CanStartRecording rejects the current output directory.
+	bool StartRecording()
+	{
+		std::string refusal;
+		const bool allowed = CanStartRecording(refusal);
+		if (allowed)
+		{
+			LastError.clear();
+			Frames.clear();
+			Recording = true;
+			ConsecutiveOffFrames = 0;
+			UpdateFrameCountPin();
+			UpdateRecordingFramePin();
+			UpdateStatus();
+			nosEngine.LogI("RecordTrackCOLMAP: Recording started");
+			return true;
+		}
+
+		LastError = std::move(refusal);
+		UpdateStatus();
+		return false;
+	}
+
+	// Ends the recording: writes the buffered frames (if any) to OutputDir,
+	// then empties the buffer and refreshes the output pins and status.
+	void StopRecording()
+	{
+		Recording = false;
+		const size_t buffered = Frames.size();
+		nosEngine.LogI("RecordTrackCOLMAP: Recording stopped (%zu frames in buffer)", buffered);
+		if (buffered != 0)
+			WriteFiles();
+		Frames.clear();
+		UpdateFrameCountPin();
+		UpdateRecordingFramePin();
+		UpdateStatus();
+	}
+
+	// Caches the OutputDirectory, ImageResolution and SourceFrame pin values.
+	// A new output directory also clears the last error and refreshes the status.
+	void OnPinValueChanged(nos::Name pinName, uuid const& pinId, nosBuffer val) override
+	{
+		if (pinName == NSN_OutputDirectory)
+		{
+			OutputDir = InterpretPinValue<const char>(val.Data);
+			LastError.clear();
+			UpdateStatus();
+			return;
+		}
+		if (pinName == NSN_ImageResolution)
+		{
+			ImageResolution = *static_cast<const nosVec2u*>(val.Data);
+			return;
+		}
+		if (pinName == NSN_SourceFrame)
+			SourceFrame = *static_cast<const convention::Frame*>(val.Data);
+	}
+
+	// Checks whether a recording may start. Fails, describing the reason in
+	// `outError`, when no output directory is set, when the directory already
+	// exists and is not empty, or when querying the filesystem throws.
+	bool CanStartRecording(std::string& outError)
+	{
+		if (OutputDir.empty())
+		{
+			outError = "Set output directory";
+			return false;
+		}
+
+		const std::filesystem::path target = nos::Utf8ToPath(OutputDir);
+		try
+		{
+			const bool occupied = std::filesystem::exists(target) && !std::filesystem::is_empty(target);
+			if (occupied)
+			{
+				outError = "Target folder is not empty";
+				return false;
+			}
+		}
+		catch (std::filesystem::filesystem_error& fsError)
+		{
+			nosEngine.LogE("RecordTrackCOLMAP: %s", fsError.what());
+			outError = fsError.what();
+			return false;
+		}
+		return true;
+	}
+
+	// Publishes the number of buffered frames on the FrameCount pin.
+	void UpdateFrameCountPin()
+	{
+		auto bufferedFrames = static_cast<uint32_t>(Frames.size());
+		nosBuffer payload{.Data = &bufferedFrames, .Size = sizeof(bufferedFrames)};
+		SetPinValue(NSN_FrameCount, payload);
+	}
+
+	// Publishes the number of frames recorded so far on the RecordingFrame
+	// pin, or 0 while not recording.
+	void UpdateRecordingFramePin()
+	{
+		uint32_t recordingFrame = 0;
+		if (Recording)
+			recordingFrame = static_cast<uint32_t>(Frames.size());
+		nosBuffer payload{.Data = &recordingFrame, .Size = sizeof(recordingFrame)};
+		SetPinValue(NSN_RecordingFrame, payload);
+	}
+
+	void UpdateStatus()
+	{
+		if (!LastError.empty())
+			SetNodeStatusMessage(LastError, fb::NodeStatusMessageType::FAILURE);
+		else if (OutputDir.empty())
+			SetNodeStatusMessage("Set output directory", fb::NodeStatusMessageType::WARNING);
+		else if (Recording)
+			SetNodeStatusMessage("Recording (" + std::to_string(Frames.size()) + " frames)", fb::NodeStatusMessageType::INFO);
+		else
+			SetNodeStatusMessage("Idle", fb::NodeStatusMessageType::INFO);
+	}
+
+	// Per-execution entry point:
+	//   1. remembers the fixed-step delta (written to timecodes.txt later),
+	//   2. forwards InTrack to OutTrack unchanged,
+	//   3. updates the recording state from the Record pin (debounced stop),
+	//   4. while recording, appends the current Track sample to Frames.
+	//
+	// Missing pin data is tolerated: an absent Record pin reads as false, an
+	// absent MinOffFrames as 0, an absent FrameNumber as 0, and no sample is
+	// captured when InTrack carries no data. Always returns NOS_RESULT_SUCCESS.
+	nosResult ExecuteNode(nosNodeExecuteParams* params) override
+	{
+		nos::NodeExecuteParams execParams(params);
+
+		if (params->TimingInfo.TimingMode == NOS_EXECUTION_TIMING_MODE_FIXED_STEP)
+			DeltaSeconds = params->TimingInfo.FixedStepTiming.DeltaSeconds;
+
+		// Pass through Track input to output
+		nosBuffer trackBuf{};
+		for (size_t i = 0; i < params->PinCount; ++i)
+		{
+			if (params->Pins[i].Name == NOS_NAME("InTrack"))
+			{
+				trackBuf = {.Data = (void*)params->Pins[i].Data->Data, .Size = params->Pins[i].Data->Size};
+				break;
+			}
+		}
+		SetPinValue(NOS_NAME("OutTrack"), trackBuf);
+
+		// Drive recording state from the Record pin, with off-state debouncing to
+		// ride out brief glitches in the upstream signal (e.g. SDI bit flips on a
+		// camera-derived recording flag). Start happens immediately on a rising
+		// edge; stop only after MinOffFrames consecutive false frames.
+		const auto* recordPin = execParams.GetPinData<bool>(NSN_Record);
+		const auto* minOffFramesPin = execParams.GetPinData<uint32_t>(NSN_MinOffFrames);
+		const bool requestRecord = recordPin && *recordPin;
+		const uint32_t minOffFrames = minOffFramesPin ? *minOffFramesPin : 0u;
+
+		const bool risingEdge = requestRecord && !LastRequestRecord;
+		LastRequestRecord = requestRecord;
+
+		if (risingEdge && !Recording)
+			StartRecording();
+
+		if (Recording)
+		{
+			if (requestRecord)
+				ConsecutiveOffFrames = 0;
+			else if (++ConsecutiveOffFrames >= std::max(1u, minOffFrames))
+				StopRecording();
+		}
+
+		if (!Recording)
+			return NOS_RESULT_SUCCESS;
+
+		// GetRoot reads the root offset straight from the buffer, so it must not
+		// be handed a null / empty buffer (InTrack missing or without data).
+		if (!trackBuf.Data || trackBuf.Size == 0)
+			return NOS_RESULT_SUCCESS;
+		auto* trackData = flatbuffers::GetRoot<sys::track::Track>(trackBuf.Data);
+		if (!trackData)
+			return NOS_RESULT_SUCCESS;
+
+		// Value-initialised so fields whose source is absent stay zero.
+		RecordedFrame frame{};
+		if (const char* tc = execParams.GetPinData<const char>(NOS_NAME_STATIC("Timecode")))
+			frame.Timecode = tc;
+		if (const auto* frameNumber = execParams.GetPinData<uint32_t>(NOS_NAME_STATIC("FrameNumber")))
+			frame.FrameNumber = *frameNumber;
+		if (auto* loc = trackData->location())
+			frame.Location = {loc->x(), loc->y(), loc->z()};
+		if (auto* rot = trackData->rotation())
+			frame.Rotation = {rot->x(), rot->y(), rot->z()};
+		frame.FOV = trackData->fov();
+		frame.Zoom = trackData->zoom();
+		frame.Focus = trackData->focus();
+		frame.RenderRatio = trackData->render_ratio();
+		if (auto* ss = trackData->sensor_size())
+			frame.SensorSize = {ss->x(), ss->y()};
+		frame.PixelAspectRatio = trackData->pixel_aspect_ratio();
+		frame.NodalOffset = trackData->nodal_offset();
+		frame.FocusDistance = trackData->focus_distance();
+		if (auto* ld = trackData->lens_distortion())
+		{
+			frame.K1 = ld->k1k2().x();
+			frame.K2 = ld->k1k2().y();
+			frame.CenterShift = {ld->center_shift().x(), ld->center_shift().y()};
+			frame.DistortionScale = ld->distortion_scale();
+		}
+		Frames.push_back(frame);
+
+		UpdateFrameCountPin();
+		UpdateRecordingFramePin();
+		UpdateStatus();
+
+		return NOS_RESULT_SUCCESS;
+	}
+
+	// Writes cameras.txt, images.txt, timecodes.txt and extras.txt for the
+	// buffered frames into OutputDir, creating the directory when needed.
+	// Logs and returns without writing when the directory is unset, there are
+	// no frames, or the directory cannot be created.
+	void WriteFiles()
+	{
+		if (OutputDir.empty())
+		{
+			nosEngine.LogE("RecordTrackCOLMAP: Output directory is empty");
+			return;
+		}
+		if (Frames.empty())
+		{
+			nosEngine.LogW("RecordTrackCOLMAP: No frames recorded");
+			return;
+		}
+
+		const std::filesystem::path target = nos::Utf8ToPath(OutputDir);
+		try
+		{
+			const bool alreadyThere = std::filesystem::exists(target);
+			if (!alreadyThere)
+				std::filesystem::create_directories(target);
+		}
+		catch (std::filesystem::filesystem_error& fsError)
+		{
+			nosEngine.LogE("RecordTrackCOLMAP: %s", fsError.what());
+			return;
+		}
+
+		WriteCamerasTxt(target);
+		WriteImagesTxt(target);
+		WriteTimecodesTxt(target);
+		WriteExtrasTxt(target);
+		nosEngine.LogI("RecordTrackCOLMAP: Saved %zu frames to %s", Frames.size(), OutputDir.c_str());
+	}
+
+	// Writes extras.txt: a sidecar for Track fields that don't fit COLMAP's
+	// standard cameras.txt / images.txt format. Rows are keyed by IMAGE_ID
+	// (1-based frame position) so they pair 1:1 with images.txt.
+	void WriteExtrasTxt(const std::filesystem::path& outDir)
+	{
+		const auto extrasPath = outDir / "extras.txt";
+		std::ofstream out(extrasPath);
+		if (!out.is_open())
+		{
+			nosEngine.LogE("RecordTrackCOLMAP: Cannot open %s", nos::PathToUtf8(extrasPath).c_str());
+			return;
+		}
+
+		const char* frameName = "Unknown";
+		if (SourceFrame == convention::Frame::LH_ZUp_FwdX_RightY)
+			frameName = "LH_ZUp_FwdX_RightY";
+		else if (SourceFrame == convention::Frame::RH_YUp_FwdNegZ_RightX)
+			frameName = "RH_YUp_FwdNegZ_RightX";
+
+		out << std::setprecision(12);
+		out << "# Nodos Track sidecar paired with images.txt by IMAGE_ID.\n"
+		    << "# Carries fields that don't fit COLMAP's cameras.txt/images.txt:\n"
+		    << "#   - sensor_size in mm (cameras.txt only stores pixel WIDTH/HEIGHT)\n"
+		    << "#   - original Euler rotation in degrees (avoids quaternion round-trip drift)\n"
+		    << "#   - nodos-only fields with no COLMAP equivalent\n";
+		out << "# SourceFrame: " << frameName << " (Euler convention used for ROT_X, ROT_Y, ROT_Z below).\n";
+		out << "# IMAGE_ID, ZOOM, FOCUS, FOCUS_DISTANCE, RENDER_RATIO, NODAL_OFFSET, DISTORTION_SCALE, SENSOR_W_MM, SENSOR_H_MM, ROT_X, ROT_Y, ROT_Z\n";
+		out << "# Number of entries: " << Frames.size() << "\n";
+
+		size_t imageId = 1;
+		for (const auto& recorded : Frames)
+		{
+			out << imageId << " "
+			    << recorded.Zoom << " "
+			    << recorded.Focus << " "
+			    << recorded.FocusDistance << " "
+			    << recorded.RenderRatio << " "
+			    << recorded.NodalOffset << " "
+			    << recorded.DistortionScale << " "
+			    << recorded.SensorSize.x << " " << recorded.SensorSize.y << " "
+			    << recorded.Rotation.x << " " << recorded.Rotation.y << " " << recorded.Rotation.z << "\n";
+			++imageId;
+		}
+	}
+
+	// Writes timecodes.txt: the per-frame delta seconds on the first data
+	// line, then one "IMAGE_ID TIMECODE FRAME_NUMBER" row per frame ("-" stands
+	// for an empty timecode). The file is skipped entirely when no frame
+	// carried a timecode or a non-zero frame number -- keeps the output minimal
+	// when the upstream graph isn't producing TC.
+	void WriteTimecodesTxt(const std::filesystem::path& outDir)
+	{
+		bool hasTimecodeData = false;
+		for (size_t i = 0; i < Frames.size() && !hasTimecodeData; ++i)
+			hasTimecodeData = !Frames[i].Timecode.empty() || Frames[i].FrameNumber != 0;
+		if (!hasTimecodeData)
+			return;
+
+		const auto timecodesPath = outDir / "timecodes.txt";
+		std::ofstream out(timecodesPath);
+		if (!out.is_open())
+		{
+			nosEngine.LogE("RecordTrackCOLMAP: Cannot open %s", nos::PathToUtf8(timecodesPath).c_str());
+			return;
+		}
+
+		double deltaSeconds = 0.0;
+		if (DeltaSeconds.y != 0)
+			deltaSeconds = (double)DeltaSeconds.x / (double)DeltaSeconds.y;
+
+		out << "# Timecode sidecar paired with images.txt by IMAGE_ID.\n"
+		    << "# First non-comment line: per-frame delta seconds (0 if recording wasn't in fixed-step timing).\n"
+		    << "# IMAGE_ID, TIMECODE, FRAME_NUMBER\n";
+		out << "# Number of entries: " << Frames.size() << "\n";
+		out << std::setprecision(12) << deltaSeconds << "\n";
+
+		size_t imageId = 1;
+		for (const auto& recorded : Frames)
+		{
+			out << imageId << " ";
+			if (recorded.Timecode.empty())
+				out << "-";
+			else
+				out << recorded.Timecode;
+			out << " " << recorded.FrameNumber << "\n";
+			++imageId;
+		}
+	}
+
+	// Focal length in pixels derived from the frame's FOV (degrees) and the
+	// image width. Falls back to the image width itself when FOV is not positive.
+	float ComputeFocalLengthPixels(const RecordedFrame& frame) const
+	{
+		const bool fovUnusable = frame.FOV <= 0.0f;
+		if (fovUnusable)
+			return static_cast<float>(ImageResolution.x);
+
+		const float halfWidth = ImageResolution.x * 0.5f;
+		const float halfFovRad = glm::radians(frame.FOV) * 0.5f;
+		return halfWidth / std::tan(halfFovRad);
+	}
+
+	// Writes cameras.txt with one OPENCV camera per recorded frame
+	// (CAMERA_ID = 1-based frame position), so per-frame changes of FOV,
+	// principal point and k1/k2 are preserved. p1/p2 are always written as 0.
+	void WriteCamerasTxt(const std::filesystem::path& outDir)
+	{
+		const auto camerasPath = outDir / "cameras.txt";
+		std::ofstream out(camerasPath);
+		if (!out.is_open())
+		{
+			nosEngine.LogE("RecordTrackCOLMAP: Cannot open %s", nos::PathToUtf8(camerasPath).c_str());
+			return;
+		}
+
+		out << std::setprecision(12);
+		out << "# COLMAP camera intrinsics. Standard format (colmap.github.io/format.html).\n"
+		    << "# OPENCV model: PARAMS = fx, fy, cx, cy, k1, k2, p1, p2 (pixels).\n"
+		    << "# Camera list with one line of data per camera:\n"
+		    << "# CAMERA_ID, MODEL, WIDTH, HEIGHT, PARAMS[]\n";
+		out << "# Number of cameras: " << Frames.size() << "\n";
+
+		size_t cameraId = 1;
+		for (const auto& recorded : Frames)
+		{
+			const float fx = ComputeFocalLengthPixels(recorded);
+			const float fy = recorded.PixelAspectRatio > 0.0f ? fx / recorded.PixelAspectRatio : fx;
+
+			// center_shift is in the same units as sensor_size (mm); convert to
+			// pixel offset on the principal point. See TrackToView.cpp:30 for the
+			// canonical centerShift / sensorSize relationship.
+			float cx = ImageResolution.x * 0.5f;
+			float cy = ImageResolution.y * 0.5f;
+			if (recorded.SensorSize.x > 0.0f)
+				cx += recorded.CenterShift.x * ImageResolution.x / recorded.SensorSize.x;
+			if (recorded.SensorSize.y > 0.0f)
+				cy += recorded.CenterShift.y * ImageResolution.y / recorded.SensorSize.y;
+
+			out << cameraId << " OPENCV " << ImageResolution.x << " " << ImageResolution.y << " "
+			    << fx << " " << fy << " " << cx << " " << cy << " "
+			    << recorded.K1 << " " << recorded.K2 << " 0 0\n";
+			++cameraId;
+		}
+	}
+
+	// Writes images.txt: one pose record per recorded frame, converted from
+	// SourceFrame into the COLMAP frame. IMAGE_ID and CAMERA_ID are both the
+	// 1-based frame position; NAME is frame_<zero-padded 0-based index>.png.
+	// Every pose line is followed by an empty POINTS2D line.
+	void WriteImagesTxt(const std::filesystem::path& outDir)
+	{
+		const auto imagesPath = outDir / "images.txt";
+		std::ofstream out(imagesPath);
+		if (!out.is_open())
+		{
+			nosEngine.LogE("RecordTrackCOLMAP: Cannot open %s", nos::PathToUtf8(imagesPath).c_str());
+			return;
+		}
+
+		out << std::setprecision(12);
+		out << "# COLMAP poses. Standard format (colmap.github.io/format.html).\n"
+		    << "# Frame: RH, +X right, +Y down, +Z forward (camera looks along +Z).\n"
+		    << "# (QW, QX, QY, QZ) is the world-to-camera rotation R_w2c.\n"
+		    << "# (TX, TY, TZ) is the world-to-camera translation: t = -R_w2c * camera_world_position.\n"
+		    << "# Recover camera position in the COLMAP world frame as: C = -R_w2c^T * t.\n"
+		    << "# Image list with two lines of data per image:\n"
+		    << "# IMAGE_ID, QW, QX, QY, QZ, TX, TY, TZ, CAMERA_ID, NAME\n"
+		    << "# POINTS2D[] as (X, Y, POINT3D_ID)\n";
+		out << "# Number of images: " << Frames.size() << "\n";
+
+		// toColmap maps the SourceFrame to the COLMAP frame. Used to convert both
+		// the source-frame R_c2w and the source-frame camera position into COLMAP.
+		const glm::dmat3 toColmap = convention::BasisChangeToColmap(SourceFrame);
+		const glm::dmat3 fromColmap = glm::inverse(toColmap);
+
+		size_t index = 0;
+		for (const auto& recorded : Frames)
+		{
+			const size_t imageId = index + 1;
+
+			// Build R_c2w in the source frame, then conjugate by the basis change
+			// to land in the COLMAP frame. Likewise frame the position.
+			const glm::dmat3 R_c2w_src = convention::EulerToMat(SourceFrame, glm::dvec3(recorded.Rotation));
+			const glm::dmat3 R_c2w_colmap = toColmap * R_c2w_src * fromColmap;
+			const glm::dvec3 pos_colmap = toColmap * glm::dvec3(recorded.Location);
+
+			const glm::dmat3 R_w2c = glm::transpose(R_c2w_colmap);
+			const glm::dquat q_w2c = glm::quat_cast(R_w2c);
+			const glm::dvec3 t = -R_w2c * pos_colmap;
+
+			out << imageId << " "
+			    << q_w2c.w << " " << q_w2c.x << " " << q_w2c.y << " " << q_w2c.z << " "
+			    << t.x << " " << t.y << " " << t.z << " "
+			    << imageId << " "
+			    << "frame_" << std::setfill('0') << std::setw(6) << index << ".png\n";
+			// Empty points line (required by COLMAP format)
+			out << "\n";
+			++index;
+		}
+	}
+};
+
+// Binds RecordTrackCOLMAPContext to the "RecordTrackCOLMAP" node class in `fn`.
+void RegisterRecordTrackCOLMAP(nosNodeFunctions* fn)
+{
+	NOS_BIND_NODE_CLASS(NOS_NAME("RecordTrackCOLMAP"), RecordTrackCOLMAPContext, fn);
+}
+
+} // namespace nos::track
diff --git a/Plugins/nosTrack/Source/TrackMain.cpp b/Plugins/nosTrack/Source/TrackMain.cpp
index c330165d..3ecb9cb0 100644
--- a/Plugins/nosTrack/Source/TrackMain.cpp
+++ b/Plugins/nosTrack/Source/TrackMain.cpp
@@ -15,12 +15,20 @@ enum TrackNode : int
 	FreeD,
 	UserTrack,
 	AddTrack,
+	RecordTrackCOLMAP,
+	PlaybackTrackCOLMAP,
+	TrackTransform,
+	ConvertTransform,
 	Count
 };
 
 void RegisterFreeDNode(nosNodeFunctions* functions);
 void RegisterController(nosNodeFunctions* functions);
 void RegisterAddTrack(nosNodeFunctions*);
+void RegisterRecordTrackCOLMAP(nosNodeFunctions*);
+void RegisterPlaybackTrackCOLMAP(nosNodeFunctions*);
+void RegisterTrackTransform(nosNodeFunctions*);
+void RegisterConvertTransform(nosNodeFunctions*);
 
 nosResult NOSAPI_CALL ExportNodeFunctions(size_t* outSize, nosNodeFunctions** outList)
 {
@@ -40,7 +48,19 @@ nosResult NOSAPI_CALL ExportNodeFunctions(size_t* outSize, nosNodeFunctions** ou
 			RegisterController(node);
 			break;
 		case TrackNode::AddTrack:
-			RegisterAddTrack(node); 
+			RegisterAddTrack(node);
+			break;
+		case TrackNode::RecordTrackCOLMAP:
+			RegisterRecordTrackCOLMAP(node);
+			break;
+		case TrackNode::PlaybackTrackCOLMAP:
+			RegisterPlaybackTrackCOLMAP(node);
+			break;
+		case TrackNode::TrackTransform:
+			RegisterTrackTransform(node);
+			break;
+		case TrackNode::ConvertTransform:
+			RegisterConvertTransform(node);
 			break;
 		}
 	}
diff --git a/Plugins/nosTrack/Source/TrackTransform.cpp b/Plugins/nosTrack/Source/TrackTransform.cpp
new file mode 100644
index 00000000..1f32f973
--- /dev/null
+++ b/Plugins/nosTrack/Source/TrackTransform.cpp
@@ -0,0 +1,53 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/Helpers.hpp>
+#include <nosSysTrack/Track_generated.h>
+#include <glm/glm.hpp>
+
+#include <nosSysTrack/CoordinateFrameConv.h>
+
+namespace nos::track
+{
+
+// Registers the TrackTransform node: re-expresses a Track's location and rotation, given in
+// the Source coordinate frame, in the Target frame; location is also scaled by WorldScale.
+void RegisterTrackTransform(nosNodeFunctions* funcs)
+{
+	funcs->ClassName = NOS_NAME("TrackTransform");
+	funcs->ExecuteNode = [](void*, nosNodeExecuteParams* params) {
+		auto pins = GetPinValues(params);
+		auto ids = GetPinIds(params);
+		const auto* inTrack = flatbuffers::GetRoot<nos::sys::track::Track>(pins[NOS_NAME("In")]);
+		auto source = *static_cast<convention::Frame*>(pins[NOS_NAME("Source")]);
+		auto target = *static_cast<convention::Frame*>(pins[NOS_NAME("Target")]);
+		float worldScale = *static_cast<float*>(pins[NOS_NAME("WorldScale")]);
+
+		// Read location/rotation from the unpacked copy below: the table accessors
+		// location()/rotation() return pointers and are null when the field is absent.
+		nos::sys::track::TTrack out;
+		inTrack->UnPackTo(&out);
+
+		const glm::dmat3 M = convention::BasisMatrix(target) * glm::inverse(convention::BasisMatrix(source));
+
+		// Location: basis change, then uniform world-scale. Fields not written below
+		// (fov, focus, sensor_size, lens_distortion, ...) are copied through unchanged.
+		glm::dvec3 loc(out.location.x(), out.location.y(), out.location.z());
+		glm::dvec3 outLoc = M * loc * static_cast<double>(worldScale);
+		out.location.mutate_x(static_cast<float>(outLoc.x));
+		out.location.mutate_y(static_cast<float>(outLoc.y));
+		out.location.mutate_z(static_cast<float>(outLoc.z));
+
+		// Rotation: build in source frame, conjugate by M, extract in target frame.
+		// inverse(M) rather than transpose(M): the two only agree when M is orthonormal.
+		glm::dvec3 rotSrc(out.rotation.x(), out.rotation.y(), out.rotation.z());
+		glm::dmat3 R_tgt = M * convention::EulerToMat(source, rotSrc) * glm::inverse(M);
+		glm::dvec3 outRotDeg = convention::MatToEuler(target, R_tgt);
+		out.rotation.mutate_x(static_cast<float>(outRotDeg.x));
+		out.rotation.mutate_y(static_cast<float>(outRotDeg.y));
+		out.rotation.mutate_z(static_cast<float>(outRotDeg.z));
+
+		return nosEngine.SetPinValue(ids[NOS_NAME("Out")], nos::Buffer::From(out));
+	};
+}
+
+}  // namespace nos::track
diff --git a/Plugins/nosTrack/Track.noscfg b/Plugins/nosTrack/Track.noscfg
index 861423c0..28abf5cf 100644
--- a/Plugins/nosTrack/Track.noscfg
+++ b/Plugins/nosTrack/Track.noscfg
@@ -2,21 +2,28 @@
 	"info": {
 		"id": {
 			"name": "nos.track",
-			"version": "1.10.0"
+			"version": "1.11.0"
 		},
 		"display_name": "Track",
 		"category": "Virtual Studio",
 		"dependencies": [
 			{
 				"name": "nos.sys.track",
-				"version": "1.0"
+				"version": "1.1"
 			}
 		]
 	},
 	"node_definitions": [
 		"Config/FreeD.nosdef",
 		"Config/UserTrack.nosdef",
-		"Config/AddTrack.nosdef"
+		"Config/AddTrack.nosdef",
+		"Config/RecordTrackCOLMAP.nosdef",
+		"Config/PlaybackTrackCOLMAP.nosdef",
+		"Config/TrackTransform.nosdef",
+		"Config/ConvertTransform.nosdef"
+	],
+	"custom_types": [
+		"Config/PlaybackMode.fbs"
 	],
 	"defaults": [
 		"Config/Defaults.json"
diff --git a/Plugins/nosUtilities/.nospub b/Plugins/nosUtilities/.nospub
index 609d521e..9883f1c9 100644
--- a/Plugins/nosUtilities/.nospub
+++ b/Plugins/nosUtilities/.nospub
@@ -4,6 +4,7 @@
         "*.noscfg",
         "Include/**",
         "Assets/**",
+        "Fonts/**",
         "Shaders/*.{hlsl,glsl,frag,vert,spv,comp}",
         "Binaries/*.{dll,dylib,so}"
     ],
diff --git a/Plugins/nosUtilities/CMakeLists.txt b/Plugins/nosUtilities/CMakeLists.txt
index 62db52c7..54c5910b 100644
--- a/Plugins/nosUtilities/CMakeLists.txt
+++ b/Plugins/nosUtilities/CMakeLists.txt
@@ -12,5 +12,17 @@ foreach(module_name_version ${MODULE_DEPENDENCIES})
     list(APPEND MODULE_DEPENDENCIES_TARGETS ${DEP_${dep_idx}})
 endforeach()
 
-list(APPEND DEPENDENCIES stb nosUtilities_generated ${NOS_PLUGIN_SDK_TARGET} ${MODULE_DEPENDENCIES_TARGETS})
-nos_add_plugin("nosUtilities" "${DEPENDENCIES}" "")
\ No newline at end of file
+# FreeType is vendored as a submodule and built with no external dependencies
+# so the text rendering node has a self-contained font rasterizer.
+if (NOT TARGET freetype) # add the vendored copy only when no `freetype` target exists yet
+    set(FT_DISABLE_ZLIB ON CACHE BOOL "" FORCE)
+    set(FT_DISABLE_BZIP2 ON CACHE BOOL "" FORCE)
+    set(FT_DISABLE_PNG ON CACHE BOOL "" FORCE)
+    set(FT_DISABLE_HARFBUZZ ON CACHE BOOL "" FORCE)
+    set(FT_DISABLE_BROTLI ON CACHE BOOL "" FORCE)
+    add_subdirectory(External/freetype EXCLUDE_FROM_ALL) # EXCLUDE_FROM_ALL: its targets build only when something depends on them
+    nos_group_targets("freetype" "External")
+endif()
+
+list(APPEND DEPENDENCIES stb freetype nosUtilities_generated ${NOS_PLUGIN_SDK_TARGET} ${MODULE_DEPENDENCIES_TARGETS})
+nos_add_plugin("nosUtilities" "${DEPENDENCIES}" "")
diff --git a/Plugins/nosUtilities/Config/ChannelViewer.fbs b/Plugins/nosUtilities/Config/ChannelViewer.fbs
index b5de7eb1..7042da21 100644
--- a/Plugins/nosUtilities/Config/ChannelViewer.fbs
+++ b/Plugins/nosUtilities/Config/ChannelViewer.fbs
@@ -9,9 +9,3 @@ enum ChannelViewerChannels : uint {
   Cb = 5,
   Cr = 6
 }
-
-enum ChannelViewerFormats : uint {
-  Rec_601 = 0,
-  Rec_709 = 1,
-  Rec_2020 = 2
-}
diff --git a/Plugins/nosUtilities/Config/ChannelViewer.nosdef b/Plugins/nosUtilities/Config/ChannelViewer.nosdef
index 4a002d10..2722cba5 100644
--- a/Plugins/nosUtilities/Config/ChannelViewer.nosdef
+++ b/Plugins/nosUtilities/Config/ChannelViewer.nosdef
@@ -31,10 +31,10 @@
 					},
 					{
 						"name": "Format",
-						"type_name": "nos.utilities.ChannelViewerFormats",
+						"type_name": "nos.mediaio.ColorSpace",
 						"show_as": "PROPERTY",
 						"can_show_as": "PROPERTY_ONLY",
-						"data": "Rec_709",
+						"data": "REC709",
 						"description": "Sets the input texture color space,\nRequired for correct YCbCr conversion"
 					},
 					{
diff --git a/Plugins/nosUtilities/Config/MultiBoundedQueue.nosdef b/Plugins/nosUtilities/Config/MultiBoundedQueue.nosdef
new file mode 100644
index 00000000..df1ef4c8
--- /dev/null
+++ b/Plugins/nosUtilities/Config/MultiBoundedQueue.nosdef
@@ -0,0 +1,56 @@
+{
+	"nodes": [
+		{
+			"class_name": "MultiBoundedQueue",
+			"menu_info": {
+				"category": "Utilities",
+				"display_name": "Multi Bounded Queue",
+				"name_aliases": [ "data structure", "algorithm", "circular", "multi", "fifo" ]
+			},
+			"node": {
+				"class_name": "MultiBoundedQueue",
+				"display_name": "Multi Bounded Queue",
+				"contents_type": "Job",
+				"description": "Bounded FIFO queue with one or more independent input/output channel pairs sharing a single bound. Right-click the node to add a channel, right-click an Input_X or Output_X pin to remove its channel.",
+				"pins": [
+					{
+						"name": "Thread",
+						"type_name": "nos.exe",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_ONLY"
+					},
+					{
+						"name": "Size",
+						"type_name": "uint",
+						"data": 2,
+						"max": 120,
+						"min": 1,
+						"show_as": "PROPERTY",
+						"can_show_as": "PROPERTY_ONLY"
+					},
+					{
+						"name": "Alignment",
+						"description": "Used for creating memory-aligned buffers in memory",
+						"type_name": "uint",
+						"def": 0,
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					},
+					{
+						"name": "Input_A",
+						"type_name": "nos.Generic",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_ONLY"
+					},
+					{
+						"name": "Output_A",
+						"type_name": "nos.Generic",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"live": true
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosUtilities/Config/MultiLiveOut.nosdef b/Plugins/nosUtilities/Config/MultiLiveOut.nosdef
new file mode 100644
index 00000000..36997973
--- /dev/null
+++ b/Plugins/nosUtilities/Config/MultiLiveOut.nosdef
@@ -0,0 +1,30 @@
+{
+	"nodes": [
+		{
+			"class_name": "MultiLiveOut",
+			"menu_info": {
+				"category": "Scheduling",
+				"display_name": "Multi Live Out"
+			},
+			"node": {
+				"class_name": "MultiLiveOut",
+				"contents_type": "Job",
+				"pins": [
+					{
+						"name": "Input_0",
+						"type_name": "nos.Generic",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_ONLY"
+					},
+					{
+						"name": "Output_0",
+						"type_name": "nos.Generic",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"live": true
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosUtilities/Config/MultiRingBuffer.nosdef b/Plugins/nosUtilities/Config/MultiRingBuffer.nosdef
new file mode 100644
index 00000000..3fa2c4c3
--- /dev/null
+++ b/Plugins/nosUtilities/Config/MultiRingBuffer.nosdef
@@ -0,0 +1,74 @@
+{
+	"nodes": [
+		{
+			"class_name": "MultiRingBuffer",
+			"menu_info": {
+				"category": "Utilities",
+				"display_name": "Multi Ring Buffer",
+				"name_aliases": [ "data structure", "algorithm", "circular", "multi" ]
+			},
+			"node": {
+				"class_name": "MultiRingBuffer",
+				"display_name": "Multi Ring Buffer",
+				"contents_type": "Job",
+				"description": "Ring buffer with one or more independent input/output channel pairs sharing a single ring size. Right-click the node to add a channel, right-click an Input_X or Output_X pin to remove its channel.",
+				"pins": [
+					{
+						"name": "Thread",
+						"type_name": "nos.exe",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_ONLY"
+					},
+					{
+						"name": "Size",
+						"type_name": "uint",
+						"data": 2,
+						"max": 120,
+						"min": 1,
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					},
+					{
+						"name": "Spare",
+						"type_name": "uint",
+						"data": 0,
+						"max": 119,
+						"min": 0,
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					},
+					{
+						"name": "Alignment",
+						"description": "Used for creating memory-aligned buffers in memory",
+						"type_name": "uint",
+						"def": 0,
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					},
+					{
+						"name": "Input_A",
+						"type_name": "nos.Generic",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_ONLY"
+					},
+					{
+						"name": "Output_A",
+						"type_name": "nos.Generic",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"live": true
+					},
+					{
+						"name": "RepeatWhenFilling",
+						"display_name": "Repeat When Filling",
+						"type_name": "bool",
+						"description": "Serves the last value while the buffer is being filled instead of waiting & resets the ring on restart",
+						"def": true,
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY"
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosUtilities/Config/ScheduleRequest.nosdef b/Plugins/nosUtilities/Config/ScheduleRequest.nosdef
new file mode 100644
index 00000000..59042dbe
--- /dev/null
+++ b/Plugins/nosUtilities/Config/ScheduleRequest.nosdef
@@ -0,0 +1,58 @@
+{
+	"nodes": [
+		{
+			"class_name": "ScheduleRequest",
+			"menu_info": {
+				"category": "Execution",
+				"display_name": "Schedule Request",
+				"name_aliases": [ "schedule", "on demand", "request" ]
+			},
+			"node": {
+				"class_name": "ScheduleRequest",
+				"display_name": "Schedule Request",
+				"contents_type": "Job",
+				"description": "Drives an on-demand path. Each execution, and each path start, queues another\nschedule request so the path feeding Trigger keeps running. Wire the resource you\nwant scheduled into Sink.",
+				"pins": [
+					{
+						"name": "Trigger",
+						"type_name": "nos.exe",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_ONLY"
+					},
+					{
+						"name": "Sink",
+						"type_name": "nos.Generic",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_ONLY"
+					},
+					{
+						"name": "DeltaSeconds",
+						"display_name": "Delta Seconds",
+						"description": "Target time between path runs, as a rational x/y seconds. Default 1/60.",
+						"type_name": "nos.fb.vec2u",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": { "x": 1, "y": 60 }
+					},
+					{
+						"name": "Importance",
+						"description": "Conflicting paths are controlled by the node of higher importance.",
+						"type_name": "uint",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 1
+					},
+					{
+						"name": "TryAgainOnFailure",
+						"display_name": "Try Again On Failure",
+						"description": "If enabled, the request is retried when a node on the path returns an error.",
+						"type_name": "bool",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": true
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosUtilities/Config/TextRender.fbs b/Plugins/nosUtilities/Config/TextRender.fbs
new file mode 100644
index 00000000..8bfe4e6f
--- /dev/null
+++ b/Plugins/nosUtilities/Config/TextRender.fbs
@@ -0,0 +1,15 @@
+namespace nos.utilities;
+
+enum TextHAlign : uint // value type of the TextRender "HorizontalAlign" pin (horizontal anchor of the text block)
+{
+    LEFT   = 0,
+    CENTER = 1,
+    RIGHT  = 2,
+}
+
+enum TextVAlign : uint // value type of the TextRender "VerticalAlign" pin (vertical anchor of the text block)
+{
+    TOP    = 0,
+    MIDDLE = 1,
+    BOTTOM = 2,
+}
diff --git a/Plugins/nosUtilities/Config/TextRender.nosdef b/Plugins/nosUtilities/Config/TextRender.nosdef
new file mode 100644
index 00000000..5ad61bde
--- /dev/null
+++ b/Plugins/nosUtilities/Config/TextRender.nosdef
@@ -0,0 +1,275 @@
+{
+	"nodes": [
+		{
+			"class_name": "TextRender",
+			"menu_info": {
+				"category": "Utilities",
+				"display_name": "Text Render",
+				"name_aliases": [ "text", "font", "label", "caption", "subtitle", "string to texture" ]
+			},
+			"node": {
+				"class_name": "TextRender",
+				"contents_type": "Job",
+				"description": "Renders text into a texture using a signed distance field font atlas.\nSupports multi-line text, word wrapping, outline, drop shadow and a text-box background.",
+				"pins": [
+					{
+						"name": "Text",
+						"type_name": "string",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": "Text",
+						"description": "Text to render. Newlines and word wrapping are honored."
+					},
+					{
+						"name": "FontSize",
+						"display_name": "Font Size",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Font" }
+						],
+						"data": 64.0,
+						"min": 1.0,
+						"description": "Glyph height in pixels."
+					},
+					{
+						"name": "Color",
+						"type_name": "nos.fb.vec4",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"visualizer": {
+							"type": "COLOR_PICKER"
+						},
+						"data": {
+							"x": 1,
+							"y": 1,
+							"z": 1,
+							"w": 1
+						},
+						"description": "Fill color of the text."
+					},
+					{
+						"name": "Opacity",
+						"type_name": "float",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"data": 1.0,
+						"min": 0.0,
+						"max": 1.0,
+						"description": "Global opacity multiplier applied to text, outline, shadow and background."
+					},
+					{
+						"name": "StrokeColor",
+						"display_name": "Stroke Color",
+						"type_name": "nos.fb.vec4",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Outline" }
+						],
+						"visualizer": {
+							"type": "COLOR_PICKER"
+						},
+						"data": {
+							"x": 0,
+							"y": 0,
+							"z": 0,
+							"w": 1
+						},
+						"description": "Outline color. Only drawn when Stroke Width is greater than 0."
+					},
+					{
+						"name": "StrokeWidth",
+						"display_name": "Stroke Width",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Outline" }
+						],
+						"data": 0.0,
+						"min": 0.0,
+						"description": "Outline thickness in pixels. 0 disables the outline."
+					},
+					{
+						"name": "ShadowColor",
+						"display_name": "Shadow Color",
+						"type_name": "nos.fb.vec4",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Shadow" }
+						],
+						"visualizer": {
+							"type": "COLOR_PICKER"
+						},
+						"data": {
+							"x": 0,
+							"y": 0,
+							"z": 0,
+							"w": 0
+						},
+						"description": "Drop shadow color. Alpha 0 disables the shadow."
+					},
+					{
+						"name": "ShadowOffset",
+						"display_name": "Shadow Offset",
+						"type_name": "nos.fb.vec2",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Shadow" }
+						],
+						"data": {
+							"x": 3,
+							"y": 3
+						},
+						"description": "Drop shadow offset in pixels (x right, y down)."
+					},
+					{
+						"name": "ShadowSoftness",
+						"display_name": "Shadow Softness",
+						"type_name": "float",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Shadow" }
+						],
+						"data": 3.0,
+						"min": 0.0,
+						"description": "Drop shadow edge blur in pixels."
+					},
+					{
+						"name": "BackgroundColor",
+						"display_name": "Background Color",
+						"type_name": "nos.fb.vec4",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Background" }
+						],
+						"visualizer": {
+							"type": "COLOR_PICKER"
+						},
+						"data": {
+							"x": 0,
+							"y": 0,
+							"z": 0,
+							"w": 0.6
+						},
+						"description": "Color of the box drawn behind the text block.\nAlpha 0 disables the box; the frame stays transparent."
+					},
+					{
+						"name": "BackgroundPadding",
+						"display_name": "Background Padding",
+						"type_name": "nos.fb.vec2",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Background" }
+						],
+						"data": {
+							"x": 20,
+							"y": 10
+						},
+						"description": "Padding in pixels between the text and the background box edges."
+					},
+					{
+						"name": "HorizontalAlign",
+						"display_name": "Horizontal Align",
+						"type_name": "nos.utilities.TextHAlign",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_OUTPUT_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Layout" }
+						],
+						"data": "CENTER",
+						"description": "Horizontal anchor of the text block within the output."
+					},
+					{
+						"name": "VerticalAlign",
+						"display_name": "Vertical Align",
+						"type_name": "nos.utilities.TextVAlign",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_OUTPUT_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Layout" }
+						],
+						"data": "BOTTOM",
+						"description": "Vertical anchor of the text block within the output."
+					},
+					{
+						"name": "Position",
+						"type_name": "nos.fb.vec2",
+						"show_as": "INPUT_PIN",
+						"can_show_as": "INPUT_PIN_OR_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Layout" }
+						],
+						"data": {
+							"x": 0,
+							"y": -50
+						},
+						"description": "Extra offset in pixels applied on top of the alignment anchor."
+					},
+					{
+						"name": "Resolution",
+						"type_name": "nos.fb.vec2u",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_OUTPUT_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Layout" }
+						],
+						"data": {
+							"x": 1920,
+							"y": 1080
+						},
+						"description": "Output texture resolution.",
+						"visualizer": {
+							"type": "NAMED_VALUE",
+							"name": "nos.mediaio.ResolutionVisualizer"
+						}
+					},
+					{
+						"name": "WrapWidth",
+						"display_name": "Wrap Width",
+						"type_name": "uint",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_OUTPUT_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Layout" }
+						],
+						"data": 0,
+						"description": "Word-wrap width in characters.\n0 wraps to the output texture width."
+					},
+					{
+						"name": "Font",
+						"type_name": "string",
+						"show_as": "PROPERTY",
+						"can_show_as": "INPUT_OUTPUT_PROPERTY",
+						"meta_data_map": [
+							{ "key": "Category", "value": "Font" }
+						],
+						"data": "",
+						"description": "Path to a .ttf/.otf font file.\nLeave empty to use the bundled Roboto Mono font.",
+						"visualizer": {
+							"type": "FILE_PICKER",
+							"file_extensions": [ "ttf", "otf" ],
+							"file_picker_type": "OPEN"
+						}
+					},
+					{
+						"name": "Output",
+						"type_name": "nos.sys.vulkan.Texture",
+						"show_as": "OUTPUT_PIN",
+						"can_show_as": "OUTPUT_PIN_ONLY",
+						"data": {
+							"unscaled": true
+						}
+					}
+				]
+			}
+		}
+	]
+}
diff --git a/Plugins/nosUtilities/External/freetype b/Plugins/nosUtilities/External/freetype
new file mode 160000
index 00000000..7e0e56f8
--- /dev/null
+++ b/Plugins/nosUtilities/External/freetype
@@ -0,0 +1 @@
+Subproject commit 7e0e56f84fd53cf38378d33c8fc8f92d12ab9ac6
diff --git a/Plugins/nosUtilities/Fonts/LICENSE-RobotoMono.txt b/Plugins/nosUtilities/Fonts/LICENSE-RobotoMono.txt
new file mode 100644
index 00000000..8e7df338
--- /dev/null
+++ b/Plugins/nosUtilities/Fonts/LICENSE-RobotoMono.txt
@@ -0,0 +1,93 @@
+Copyright 2015 The Roboto Mono Project Authors (https://github.com/googlefonts/robotomono)
+
+This Font Software is licensed under the SIL Open Font License, Version 1.1.
+This license is copied below, and is also available with a FAQ at:
+https://openfontlicense.org
+
+
+-----------------------------------------------------------
+SIL OPEN FONT LICENSE Version 1.1 - 26 February 2007
+-----------------------------------------------------------
+
+PREAMBLE
+The goals of the Open Font License (OFL) are to stimulate worldwide
+development of collaborative font projects, to support the font creation
+efforts of academic and linguistic communities, and to provide a free and
+open framework in which fonts may be shared and improved in partnership
+with others.
+
+The OFL allows the licensed fonts to be used, studied, modified and
+redistributed freely as long as they are not sold by themselves. The
+fonts, including any derivative works, can be bundled, embedded, 
+redistributed and/or sold with any software provided that any reserved
+names are not used by derivative works. The fonts and derivatives,
+however, cannot be released under any other type of license. The
+requirement for fonts to remain under this license does not apply
+to any document created using the fonts or their derivatives.
+
+DEFINITIONS
+"Font Software" refers to the set of files released by the Copyright
+Holder(s) under this license and clearly marked as such. This may
+include source files, build scripts and documentation.
+
+"Reserved Font Name" refers to any names specified as such after the
+copyright statement(s).
+
+"Original Version" refers to the collection of Font Software components as
+distributed by the Copyright Holder(s).
+
+"Modified Version" refers to any derivative made by adding to, deleting,
+or substituting -- in part or in whole -- any of the components of the
+Original Version, by changing formats or by porting the Font Software to a
+new environment.
+
+"Author" refers to any designer, engineer, programmer, technical
+writer or other person who contributed to the Font Software.
+
+PERMISSION & CONDITIONS
+Permission is hereby granted, free of charge, to any person obtaining
+a copy of the Font Software, to use, study, copy, merge, embed, modify,
+redistribute, and sell modified and unmodified copies of the Font
+Software, subject to the following conditions:
+
+1) Neither the Font Software nor any of its individual components,
+in Original or Modified Versions, may be sold by itself.
+
+2) Original or Modified Versions of the Font Software may be bundled,
+redistributed and/or sold with any software, provided that each copy
+contains the above copyright notice and this license. These can be
+included either as stand-alone text files, human-readable headers or
+in the appropriate machine-readable metadata fields within text or
+binary files as long as those fields can be easily viewed by the user.
+
+3) No Modified Version of the Font Software may use the Reserved Font
+Name(s) unless explicit written permission is granted by the corresponding
+Copyright Holder. This restriction only applies to the primary font name as
+presented to the users.
+
+4) The name(s) of the Copyright Holder(s) or the Author(s) of the Font
+Software shall not be used to promote, endorse or advertise any
+Modified Version, except to acknowledge the contribution(s) of the
+Copyright Holder(s) and the Author(s) or with their explicit written
+permission.
+
+5) The Font Software, modified or unmodified, in part or in whole,
+must be distributed entirely under this license, and must not be
+distributed under any other license. The requirement for fonts to
+remain under this license does not apply to any document created
+using the Font Software.
+
+TERMINATION
+This license becomes null and void if any of the above conditions are
+not met.
+
+DISCLAIMER
+THE FONT SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO ANY WARRANTIES OF
+MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT
+OF COPYRIGHT, PATENT, TRADEMARK, OR OTHER RIGHT. IN NO EVENT SHALL THE
+COPYRIGHT HOLDER BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+INCLUDING ANY GENERAL, SPECIAL, INDIRECT, INCIDENTAL, OR CONSEQUENTIAL
+DAMAGES, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+FROM, OUT OF THE USE OR INABILITY TO USE THE FONT SOFTWARE OR FROM
+OTHER DEALINGS IN THE FONT SOFTWARE.
diff --git a/Plugins/nosUtilities/Fonts/RobotoMono-Regular.ttf b/Plugins/nosUtilities/Fonts/RobotoMono-Regular.ttf
new file mode 100644
index 00000000..f21d1d71
Binary files /dev/null and b/Plugins/nosUtilities/Fonts/RobotoMono-Regular.ttf differ
diff --git a/Plugins/nosUtilities/Shaders/TextBox.frag b/Plugins/nosUtilities/Shaders/TextBox.frag
new file mode 100644
index 00000000..c7d7e0a5
--- /dev/null
+++ b/Plugins/nosUtilities/Shaders/TextBox.frag
@@ -0,0 +1,19 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#version 450
+#extension GL_EXT_scalar_block_layout : enable
+
+layout(binding = 0, std430) uniform UBO
+{
+    vec2 Offset;
+    vec2 Size;
+    vec4 BoxColor;
+} ubo;
+
+layout(location = 0) in vec2 uv;
+layout(location = 0) out vec4 rt;
+
+void main()
+{
+    rt = ubo.BoxColor; // flat fill: every fragment of the quad gets BoxColor; uv, Offset and Size are not read here
+}
diff --git a/Plugins/nosUtilities/Shaders/TextBox.vert b/Plugins/nosUtilities/Shaders/TextBox.vert
new file mode 100644
index 00000000..2b2ac902
--- /dev/null
+++ b/Plugins/nosUtilities/Shaders/TextBox.vert
@@ -0,0 +1,29 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#version 450
+#extension GL_EXT_scalar_block_layout : enable
+
+layout(location = 0) out vec2 uv;
+
+layout(binding = 0, std430) uniform UBO
+{
+    vec2 Offset;   // box top-left in 0..1 output coords (y down)
+    vec2 Size;     // box size in 0..1 output coords
+    vec4 BoxColor;
+} ubo;
+
+const vec2 pos[6] =
+    vec2[6](
+        vec2(0.0, +1.0),
+        vec2(+1.0, +1.0),
+        vec2(0.0, 0.0),
+        vec2(0.0, 0.0),
+        vec2(+1.0, +1.0),
+        vec2(+1.0, 0.0));
+
+void main()
+{
+    vec2 corner = pos[gl_VertexIndex]; // unit-quad corner of this vertex, also forwarded as uv
+    uv = corner;
+    gl_Position = vec4((corner * ubo.Size * 2) + vec2(-1, -1) + ubo.Offset * 2, 0.0, 1.0); // 0..1 coords -> -1..1
+}
diff --git a/Plugins/nosUtilities/Shaders/TextGlyph.frag b/Plugins/nosUtilities/Shaders/TextGlyph.frag
new file mode 100644
index 00000000..3b2246c0
--- /dev/null
+++ b/Plugins/nosUtilities/Shaders/TextGlyph.frag
@@ -0,0 +1,42 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#version 450
+#extension GL_EXT_scalar_block_layout : enable
+
+layout(binding = 1) uniform sampler2D Atlas;
+
+layout(binding = 0, std430) uniform UBO
+{
+    vec2 Offset;
+    vec2 Size;
+    vec4 AtlasRect;   // xy = atlas uv min, zw = atlas uv extent
+    vec4 FillColor;
+    vec4 StrokeColor;
+    float StrokeWidth; // outline thickness in output pixels (0 = none)
+    float Softness;    // extra edge blur in output pixels (drop shadow)
+    float PxRange;     // output pixels spanned by one full signed-distance unit
+} ubo;
+
+layout(location = 0) in vec2 uv;
+layout(location = 0) out vec4 rt;
+
+void main()
+{
+    // uv (0,0) is the glyph top-left, matching the top-down atlas bitmaps.
+    vec2 atlasUv = ubo.AtlasRect.xy + uv * ubo.AtlasRect.zw;
+    float sd = texture(Atlas, atlasUv).r; // signed distance, 0.5 = glyph edge
+
+    float distPx = (sd - 0.5) * ubo.PxRange; // signed distance, output pixels
+    float aa = 0.75 + ubo.Softness;          // half-width of the edge ramp, output pixels
+
+    // StrokeWidth 0 means "no outline": ungated, the stroke would still tint the anti-aliased fill edge.
+    float fillA = smoothstep(-aa, aa, distPx);
+    float outerA = ubo.StrokeWidth > 0.0 ? smoothstep(-aa, aa, distPx + ubo.StrokeWidth) : 0.0;
+
+    // Composite the fill over the stroke (stroke spans the whole silhouette).
+    float fa = ubo.FillColor.a * fillA;
+    float sa = ubo.StrokeColor.a * outerA;
+    float outA = fa + sa * (1.0 - fa);
+    vec3 outRGB = (ubo.FillColor.rgb * fa + ubo.StrokeColor.rgb * sa * (1.0 - fa)) / max(outA, 1e-5);
+    rt = vec4(outRGB, outA); // straight (non-premultiplied) colour: rgb was divided by outA above
+}
diff --git a/Plugins/nosUtilities/Shaders/TextGlyph.vert b/Plugins/nosUtilities/Shaders/TextGlyph.vert
new file mode 100644
index 00000000..284e6cba
--- /dev/null
+++ b/Plugins/nosUtilities/Shaders/TextGlyph.vert
@@ -0,0 +1,34 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#version 450
+#extension GL_EXT_scalar_block_layout : enable
+
+layout(location = 0) out vec2 uv;
+
+layout(binding = 0, std430) uniform UBO
+{
+    vec2 Offset;     // glyph quad top-left in 0..1 output coords (y down)
+    vec2 Size;       // glyph quad size in 0..1 output coords
+    vec4 AtlasRect;  // xy = atlas uv min, zw = atlas uv extent
+    vec4 FillColor;
+    vec4 StrokeColor;
+    float StrokeWidth;
+    float Softness;
+    float PxRange;
+} ubo;
+
+const vec2 pos[6] =
+    vec2[6](
+        vec2(0.0, +1.0),
+        vec2(+1.0, +1.0),
+        vec2(0.0, 0.0),
+        vec2(0.0, 0.0),
+        vec2(+1.0, +1.0),
+        vec2(+1.0, 0.0));
+
+void main()
+{
+    vec2 corner = pos[gl_VertexIndex]; // unit-quad corner of this vertex, also forwarded as uv
+    uv = corner;
+    gl_Position = vec4((corner * ubo.Size * 2) + vec2(-1, -1) + ubo.Offset * 2, 0.0, 1.0); // 0..1 coords -> -1..1
+}
diff --git a/Plugins/nosUtilities/Source/ChannelViewer.cpp b/Plugins/nosUtilities/Source/ChannelViewer.cpp
index a0d88f67..4fcc2e96 100644
--- a/Plugins/nosUtilities/Source/ChannelViewer.cpp
+++ b/Plugins/nosUtilities/Source/ChannelViewer.cpp
@@ -13,6 +13,41 @@ NOS_REGISTER_NAME_SPACED(Nos_Utilities_ChannelViewer, "nos.utilities.ChannelView
 
 namespace nos::utilities
 {
+static nosResult MigrateNode(nosFbNodePtr nodePtr, nosBuffer* outBuffer) // Moves legacy "Format" pins to nos.mediaio.ColorSpace.
+{
+	fb::TNode tNode;
+	nodePtr->UnPackTo(&tNode); // work on a mutable copy of the serialized node
+	bool migrated = false;
+	for (auto& pin : tNode.pins)
+	{
+		if (!pin || pin->name != "Format")
+			continue;
+		bool legacyType = pin->type_name == "nos.utilities.ChannelViewerFormats" ||
+		                  pin->type_name == "nos.fb.ChannelViewerFormats";
+		const char* newValue = nullptr; // stays null when the stored value is not one of the legacy names
+		if (!pin->data.empty())
+		{
+			std::string_view oldValue(reinterpret_cast<const char*>(pin->data.data()), pin->data.size() - 1); // drops the last byte; presumably the trailing NUL - TODO confirm
+			if (oldValue == "Rec_601") newValue = "REC601";
+			else if (oldValue == "Rec_709") newValue = "REC709";
+			else if (oldValue == "Rec_2020") newValue = "REC2020";
+		}
+		if (!legacyType && !newValue) // neither the type nor the value is legacy: leave the pin alone
+			continue;
+		pin->type_name = "nos.mediaio.ColorSpace";
+		if (newValue)
+		{
+			std::string s = newValue;
+			pin->data = std::vector<uint8_t>(s.c_str(), s.c_str() + s.size() + 1); // +1 keeps the terminating NUL in the pin data
+		}
+		migrated = true;
+	}
+	if (!migrated)
+		return NOS_RESULT_SUCCESS; // outBuffer is left untouched when nothing changed
+	*outBuffer = EngineBuffer::CopyFrom(tNode).Release();
+	return NOS_RESULT_SUCCESS;
+}
+
 static nosResult ExecuteNode(void* ctx, nosNodeExecuteParams* pins)
 {
 	auto values = GetPinValues(pins);
@@ -25,7 +60,8 @@ static nosResult ExecuteNode(void* ctx, nosNodeExecuteParams* pins)
 	glm::vec4 val{};
 	val[channel & 3] = 1;
 
-	constexpr glm::vec3 coeffs[3] = {{.299f, .587f, .114f}, {.2126f, .7152f, .0722f}, {.2627f, .678f, .0593f}};
+	// Indexed by nos.mediaio.ColorSpace: REC709=0, REC601=1, REC2020=2
+	constexpr glm::vec3 coeffs[3] = {{.2126f, .7152f, .0722f}, {.299f, .587f, .114f}, {.2627f, .678f, .0593f}};
 
 	glm::vec4 multipliers = glm::vec4(coeffs[format], channel > 3);
 	std::vector bindings = {
@@ -51,6 +87,7 @@ nosResult RegisterChannelViewer(nosNodeFunctions* out)
 {
 	out->ClassName = NSN_Nos_Utilities_ChannelViewer;
 	out->ExecuteNode = ExecuteNode;
+	out->MigrateNode = MigrateNode;
 
 	fs::path root = nosEngine.Module->RootFolderPath;
 	auto chViewerPath = (root / "Shaders" / "ChannelViewer.frag").generic_string();
diff --git a/Plugins/nosUtilities/Source/MultiBoundedQueue.cpp b/Plugins/nosUtilities/Source/MultiBoundedQueue.cpp
new file mode 100644
index 00000000..9f433574
--- /dev/null
+++ b/Plugins/nosUtilities/Source/MultiBoundedQueue.cpp
@@ -0,0 +1,608 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#pragma once
+
+#include <set>
+
+#include <Nodos/PluginHelpers.hpp>
+
+// External
+#include <glm/glm.hpp>
+#include <nosVulkanSubsystem/Helpers.hpp>
+
+#include "MultiRing.h"
+#include "Ring.h"
+#include "nosUtil/Stopwatch.hpp"
+
+namespace nos::utilities
+{
+
+struct MultiBoundedQueueNodeContext : NodeContext
+{
+	static constexpr std::string_view CHANNEL_LETTERS = "ABCDEFGHIJKLMNOPQRSTUVWXYZ";
+
+	enum MenuCommandType : uint8_t
+	{
+		ADD_CHANNEL = 0,
+		REMOVE_CHANNEL = 1,
+	};
+
+	struct MenuCommand
+	{
+		MenuCommandType Type;
+		uint8_t Letter;
+		MenuCommand(uint32_t cmd)
+		{
+			Type = static_cast<MenuCommandType>(cmd & 0xFF);
+			Letter = static_cast<uint8_t>((cmd >> 8) & 0xFF);
+		}
+		MenuCommand(MenuCommandType type, uint8_t letter) : Type(type), Letter(letter) {}
+		operator uint32_t() const { return (Letter << 8) | Type; }
+	};
+
+	struct Channel
+	{
+		char Letter;
+		nos::Name InputName;
+		nos::Name OutputName;
+		uuid InputId{};
+		uuid OutputId{};
+		nos::TypeInfo TypeInfo;
+		MultiRing::Channel* RingChannel = nullptr;
+		std::atomic_bool IsOutLive = false;
+		bool NeedsRecreation = false;
+
+		Channel(char letter)
+			: Letter(letter),
+			  InputName((std::string("Input_") + letter).c_str()),
+			  OutputName((std::string("Output_") + letter).c_str()),
+			  TypeInfo(NSN_Generic)
+		{
+		}
+	};
+
+	std::map<char, std::unique_ptr<Channel>> Channels;
+	std::unordered_map<uuid, char> PinIdToLetter;
+	MultiRing Ring;
+	// Channels popped since the last SendScheduleRequest. One producer run
+	// pushes one slot per live channel, so we must only schedule again once
+	// every live channel has been popped — otherwise schedule requests pile
+	// up by a factor of N (channels) per consumer tick.
+	std::set<char> PoppedSinceLastSchedule;
+
+	std::optional<uint32_t> RequestedRingSize = std::nullopt;
+
+	std::string GetName() const { return "MultiBoundedQueue"; }
+
+	static std::optional<char> ParseLetter(std::string_view pinName)
+	{
+		// A channel pin name ends in '_' followed by exactly one character in 'A'..'Z'; that character is the result.
+		const auto underscore = pinName.rfind('_');
+		const bool oneCharSuffix = underscore != std::string_view::npos && underscore + 2 == pinName.size();
+		if (!oneCharSuffix)
+			return std::nullopt;
+		const char letter = pinName.back();
+		return ('A' <= letter && letter <= 'Z') ? std::optional<char>(letter) : std::nullopt;
+	}
+
+	static bool IsInputPin(std::string_view pinName) { return pinName.starts_with("Input_"); }
+	static bool IsOutputPin(std::string_view pinName) { return pinName.starts_with("Output_"); }
+
+	MultiBoundedQueueNodeContext(nosFbNodePtr node) : NodeContext(node)
+	{
+		std::vector<uuid> pinsToUnorphan;
+		for (auto* pin : *node->pins())
+		{
+			auto pinNameSv = pin->name()->string_view();
+			if (!IsInputPin(pinNameSv) && !IsOutputPin(pinNameSv))
+				continue;
+			auto letter = ParseLetter(pinNameSv);
+			if (!letter)
+				continue;
+
+			auto& channel = Channels[*letter];
+			if (!channel)
+				channel = std::make_unique<Channel>(*letter);
+
+			if (IsInputPin(pinNameSv))
+				channel->InputId = uuid(*pin->id());
+			else
+			{
+				channel->OutputId = uuid(*pin->id());
+				channel->IsOutLive = pin->live();
+			}
+			PinIdToLetter[uuid(*pin->id())] = *letter;
+
+			nos::Name typeName(pin->type_name()->c_str());
+			if (typeName != NSN_Generic && channel->TypeInfo->TypeName == NSN_Generic)
+				channel->TypeInfo = nos::TypeInfo(typeName);
+
+			if (auto orphanState = pin->orphan_state())
+				if (orphanState->type() == fb::PinOrphanStateType::ORPHAN)
+					pinsToUnorphan.push_back(uuid(*pin->id()));
+		}
+
+		for (auto& [_, ch] : Channels)
+			InitChannel(*ch);
+
+		for (auto const& pinId : pinsToUnorphan)
+			SetPinOrphanState(pinId, fb::PinOrphanStateType::ACTIVE);
+
+		AddPinValueWatcher(NSN_Size, [this](nos::Buffer const& newSize, std::optional<nos::Buffer> oldVal) {
+			uint32_t size = *newSize.As<uint32_t>();
+			if (oldVal && oldVal == newSize)
+				return;
+			RequestRingResize(size);
+		});
+		AddPinValueWatcher(NSN_Alignment, [this](nos::Buffer const& newAlignment, std::optional<nos::Buffer> oldVal) {
+			bool any = false;
+			for (auto& [_, ch] : Channels)
+			{
+				if (!ch->RingChannel)
+					continue;
+				if (ch->RingChannel->ResInterface->CheckNewResource(NSN_Alignment, newAlignment, oldVal))
+				{
+					nosEngine.SendPathRestart(ch->InputId);
+					ch->NeedsRecreation = true;
+					any = true;
+				}
+			}
+			if (any)
+			{
+				Ring.Stop();
+				PoppedSinceLastSchedule.clear();
+			}
+		});
+	}
+
+	~MultiBoundedQueueNodeContext() override { Ring.Stop(); }
+
+	void InitChannel(Channel& ch)
+	{
+		std::shared_ptr<ResourceInterface> resource;
+		if (ch.TypeInfo->TypeName == NOS_NAME(sys::vulkan::Buffer::GetFullyQualifiedName()))
+			resource = std::make_shared<GPUBufferResource>();
+		else if (ch.TypeInfo->TypeName == NOS_NAME(sys::vulkan::Texture::GetFullyQualifiedName()))
+			resource = std::make_shared<GPUTextureResource>();
+		else
+			resource = std::make_shared<CPUTrivialResource>();
+
+		ch.RingChannel = &Ring.AddChannel(ch.Letter, std::move(resource), &ch);
+	}
+
+	Channel* GetChannelByPinId(uuid const& id)
+	{
+		auto it = PinIdToLetter.find(id);
+		if (it == PinIdToLetter.end())
+			return nullptr;
+		auto chIt = Channels.find(it->second);
+		return chIt != Channels.end() ? chIt->second.get() : nullptr;
+	}
+
+	void RequestRingResize(uint32_t size) // Stops the ring and requests a path restart so a new size can be applied.
+	{
+		if (size == 0)
+		{
+			nosEngine.LogW((GetName() + " size cannot be 0").c_str());
+			return;
+		}
+		if (Ring.Size == size && (!RequestedRingSize.has_value() || *RequestedRingSize == size)) // ring already has this size and no different size is pending
+			return;
+		for (auto& [_, ch] : Channels)
+		{
+			if (!ch->RingChannel)
+				continue;
+			nosPathCommand ringSizeChange{.Event = NOS_RING_SIZE_CHANGE, .RingSize = size};
+			nosEngine.SendPathCommand(ch->InputId, ringSizeChange); // one command per channel, addressed by its input pin
+		}
+		Ring.Stop();
+		PoppedSinceLastSchedule.clear();
+		SendPathRestart();
+		RequestedRingSize = size; // read by OnPathStart, which performs the actual ResizeAll
+	}
+
+	void SendPathRestart()
+	{
+		for (auto& [_, ch] : Channels)
+			nosEngine.SendPathRestart(ch->InputId);
+	}
+
+	void OnPinValueChanged(nos::Name pinName, uuid const& pinId, nosBuffer value) override
+	{
+		auto sv = pinName.AsString();
+		if (!IsInputPin(sv))
+			return;
+		auto* ch = GetChannelByPinId(pinId);
+		if (!ch || !ch->RingChannel)
+			return;
+		if (ch->RingChannel->ResInterface->CheckNewResource(NSN_Input, value, std::nullopt))
+		{
+			nosEngine.SendPathRestart(ch->InputId);
+			Ring.Stop();
+			PoppedSinceLastSchedule.clear();
+			ch->NeedsRecreation = true;
+		}
+	}
+
+	nosResult OnResolvePinDataTypes(nosResolvePinDataTypesParams* params) override
+	{
+		auto pinNameStr = nos::Name(params->InstigatorPinName).AsString();
+		auto letter = ParseLetter(pinNameStr);
+		if (!letter)
+			return NOS_RESULT_FAILED;
+		auto chIt = Channels.find(*letter);
+		if (chIt == Channels.end())
+			return NOS_RESULT_FAILED;
+		auto& ch = *chIt->second;
+		if (ch.TypeInfo->TypeName != NSN_Generic)
+			return NOS_RESULT_FAILED;
+		ch.TypeInfo = nos::TypeInfo(params->IncomingTypeName);
+		if (ch.RingChannel)
+		{
+			Ring.Stop();
+			PoppedSinceLastSchedule.clear();
+			Ring.RemoveChannel(*letter);
+			ch.RingChannel = nullptr;
+		}
+		for (size_t i = 0; i < params->PinCount; i++)
+		{
+			auto& pinInfo = params->Pins[i];
+			if (pinInfo.Id == ch.InputId || pinInfo.Id == ch.OutputId)
+				pinInfo.OutResolvedTypeName = ch.TypeInfo->TypeName;
+		}
+		return NOS_RESULT_SUCCESS;
+	}
+
+	void OnPinUpdated(const nosPinUpdate*) override
+	{
+		for (auto& [_, ch] : Channels)
+			if (!ch->RingChannel)
+				InitChannel(*ch);
+	}
+
+	void OnNodeUpdated(nosNodeUpdate const* update) override
+	{
+		if (update->Type == NOS_NODE_UPDATE_PIN_DELETED)
+		{
+			auto it = PinIdToLetter.find(update->PinDeleted);
+			if (it == PinIdToLetter.end())
+				return;
+			char letter = it->second;
+			PinIdToLetter.erase(it);
+			auto chIt = Channels.find(letter);
+			if (chIt == Channels.end())
+				return;
+			auto& ch = *chIt->second;
+			bool inputAlive = PinIdToLetter.contains(ch.InputId);
+			bool outputAlive = PinIdToLetter.contains(ch.OutputId);
+			if (!inputAlive && !outputAlive)
+			{
+				if (ch.RingChannel)
+				{
+					Ring.RemoveChannel(letter);
+					ch.RingChannel = nullptr;
+				}
+				Channels.erase(chIt);
+			}
+		}
+		else if (update->Type == NOS_NODE_UPDATE_PIN_CREATED)
+		{
+			auto* pin = update->PinCreated;
+			auto sv = pin->name()->string_view();
+			if (!IsInputPin(sv) && !IsOutputPin(sv))
+				return;
+			auto letter = ParseLetter(sv);
+			if (!letter)
+				return;
+			auto& chPtr = Channels[*letter];
+			if (!chPtr)
+				chPtr = std::make_unique<Channel>(*letter);
+			if (IsInputPin(sv))
+				chPtr->InputId = uuid(*pin->id());
+			else
+			{
+				chPtr->OutputId = uuid(*pin->id());
+				chPtr->IsOutLive = pin->live();
+			}
+			PinIdToLetter[uuid(*pin->id())] = *letter;
+			if (!chPtr->RingChannel)
+				InitChannel(*chPtr);
+		}
+	}
+
+	// Producer step: gathers every channel that has usable input and pushes one slot per gathered channel as one batch.
+	nosResult ExecuteNode(nosNodeExecuteParams* params) override
+	{
+		if (Channels.empty() || Ring.Exit)
+			return NOS_RESULT_FAILED;
+
+		NodeExecuteParams pins(params);
+		uint32_t requestedSize = *pins.GetPinData<uint32_t>(NSN_Size);
+
+		struct Gathered
+		{
+			Channel* NodeCh;
+			MultiRing::Channel* RingCh;
+			void* Input;
+		};
+		std::vector<Gathered> gathered;
+		gathered.reserve(Channels.size());
+		std::vector<MultiRing::Channel*> wantedRings; // kept index-aligned with `gathered`
+		wantedRings.reserve(Channels.size());
+
+		uint32_t maxRequired = requestedSize; // largest ring size any gathered channel asks for
+		for (auto& [_, ch] : Channels)
+		{
+			if (!ch->RingChannel || ch->RingChannel->Resources.empty() || !ch->TypeInfo)
+				continue;
+			auto it = pins.find(ch->InputName);
+			if (it == pins.end())
+				continue;
+			void* input = ch->RingChannel->ResInterface->GetPinInfo(it->second, false);
+			if (!input)
+				continue;
+			auto [required, unusedSecond] = ch->RingChannel->ResInterface->GetRequiredRingSize(input, requestedSize); // not `_`: redeclaring the loop header's `_` here is ill-formed before C++26
+			if (required > maxRequired)
+				maxRequired = required;
+			gathered.push_back({ch.get(), ch->RingChannel, input});
+			wantedRings.push_back(ch->RingChannel);
+		}
+		if (gathered.empty())
+		{
+			SendScheduleRequest(0);
+			return NOS_RESULT_FAILED;
+		}
+
+		if (Ring.Size != maxRequired) // resize first; RequestRingResize stops the ring and restarts the path
+		{
+			RequestRingResize(maxRequired);
+			return NOS_RESULT_FAILED;
+		}
+
+		std::vector<MultiRing::SlotPair> slots; // filled in the order of wantedRings, so slots[i] belongs to gathered[i]
+		if (!Ring.BeginPushSubset(100, wantedRings, slots))
+			return Ring.Exit ? NOS_RESULT_FAILED : NOS_RESULT_PENDING; // a plain timeout is reported as pending
+
+		for (size_t i = 0; i < gathered.size(); ++i)
+		{
+			auto& g = gathered[i];
+			auto* slot = slots[i].second;
+			g.RingCh->ResInterface->Push(slot, g.Input, params, NOS_NAME_STATIC("MultiBoundedQueue"), false);
+			if (!g.NodeCh->IsOutLive)
+			{
+				ChangePinLiveness(g.NodeCh->OutputName, true);
+				g.NodeCh->IsOutLive = true;
+			}
+		}
+
+		Ring.EndPushAll(slots);
+		return NOS_RESULT_SUCCESS;
+	}
+
+	nosResult CopyFrom(nosCopyInfo* cpy) override
+	{
+		auto* ch = GetChannelByPinId(cpy->ID);
+		if (!ch || !ch->RingChannel || Ring.Exit)
+			return NOS_RESULT_FAILED;
+		if (!ch->IsOutLive)
+			return NOS_RESULT_SUCCESS;
+
+		ResourceInterface::ResourceBase* slot;
+		{
+			ScopedProfilerEvent _({.Name = "Wait For Filled Slot"});
+			slot = Ring.BeginPop(*ch->RingChannel, 100);
+		}
+		if (!slot)
+			return Ring.Exit ? NOS_RESULT_FAILED : NOS_RESULT_PENDING;
+
+		// Propagate the slot resource's descriptor onto the output pin before
+		// Copy reads cpy->PinData as the destination — otherwise the GPU copy
+		// targets the stale (default-sized) output descriptor.
+		nos::Buffer outPinVal;
+		if (ch->RingChannel->ResInterface->BeginCopyFrom(slot, *cpy->PinData, outPinVal))
+			nosEngine.SetPinValueByName(NodeId, ch->OutputName, outPinVal);
+
+		ch->RingChannel->ResInterface->Copy(slot, cpy, NodeId);
+
+		cpy->CopyFromOptions.ShouldSetSourceFrameNumber = true;
+		cpy->FrameNumber = slot->FrameNumber;
+
+		Ring.EndPop(*ch->RingChannel, slot);
+
+		PoppedSinceLastSchedule.insert(ch->Letter);
+		size_t liveCount = 0;
+		for (auto& [_, c] : Channels)
+			if (c->IsOutLive)
+				++liveCount;
+		if (PoppedSinceLastSchedule.size() >= liveCount)
+		{
+			SendScheduleRequest(1);
+			PoppedSinceLastSchedule.clear();
+		}
+		return NOS_RESULT_SUCCESS;
+	}
+
+	void OnEndFrame(uuid const& pinId, nosEndFrameCause cause) override // Marks a channel's output non-live after a failed frame.
+	{
+		if (cause != NOS_END_FRAME_FAILED)
+			return;
+		auto* ch = GetChannelByPinId(pinId);
+		if (!ch)
+			return;
+		if (pinId == ch->OutputId) // a failure reported for the channel's own output pin is ignored
+			return;
+		if (!ch->IsOutLive) // already non-live: nothing to change
+			return;
+		ChangePinLiveness(ch->OutputName, false);
+		ch->IsOutLive = false;
+	}
+
+	void SendScheduleRequest(uint32_t count, bool reset = false) const
+	{
+		nosScheduleNodeParams schedule{.NodeId = NodeId, .AddScheduleCount = count, .Reset = reset};
+		nosEngine.ScheduleNode(&schedule);
+	}
+
+	void OnPathCommand(const nosPathCommand* command) override
+	{
+		switch (command->Event)
+		{
+		case NOS_RING_SIZE_CHANGE:
+			if (command->RingSize == 0)
+				return;
+			RequestedRingSize = command->RingSize;
+			nosEngine.SetPinValue(*GetPinId(NSN_Size), nos::Buffer::From(command->RingSize));
+			break;
+		default: return;
+		}
+	}
+
+	void OnPathStop() override
+	{
+		Ring.Stop();
+		PoppedSinceLastSchedule.clear();
+	}
+
+	void OnPathStart() override // Applies a pending resize/recreation, restarts the ring and schedules the initial runs.
+	{
+		if (Channels.empty())
+			return;
+
+		PoppedSinceLastSchedule.clear();
+
+		Ring.ResetAll(false); // fill=false: every queued read slot goes back to its write pool
+
+		if (RequestedRingSize)
+		{
+			Ring.ResizeAll(*RequestedRingSize);
+			for (auto& [_, ch] : Channels)
+				ch->NeedsRecreation = false; // ResizeAll reallocated every ring channel, so no separate recreation is needed
+			RequestedRingSize = std::nullopt;
+		}
+		for (auto& [_, ch] : Channels)
+		{
+			if (ch->NeedsRecreation && ch->RingChannel)
+			{
+				Ring.RecreateChannelResources(*ch->RingChannel);
+				ch->NeedsRecreation = false;
+			}
+		}
+
+		size_t totalSchedule = 0; // largest number of free write slots over all channels
+		for (auto& [_, ch] : Channels)
+		{
+			if (!ch->RingChannel)
+				continue;
+			if (ch->RingChannel->Resources.empty())
+			{
+				totalSchedule = std::max<size_t>(totalSchedule, 1); // still request at least one run for a channel without resources
+				continue;
+			}
+			auto emptySlotCount = Ring.WritePoolSize(*ch->RingChannel);
+			totalSchedule = std::max(totalSchedule, emptySlotCount);
+			ch->RingChannel->ResInterface->OnPathStart();
+		}
+		Ring.Start();
+		if (totalSchedule > 0)
+		{
+			nosScheduleNodeParams schedule{.NodeId = NodeId, .AddScheduleCount = (uint32_t)totalSchedule};
+			nosEngine.ScheduleNode(&schedule);
+		}
+	}
+
+	void OnNodeMenuRequested(nosContextMenuRequestPtr request) override
+	{
+		flatbuffers::FlatBufferBuilder fbb;
+		std::vector items = {
+			nos::CreateContextMenuItemDirect(fbb, "Add Channel", MenuCommand(ADD_CHANNEL, 0))};
+		HandleEvent(CreateAppEvent(fbb, app::CreateAppContextMenuUpdateDirect(
+											fbb, request->item_id(), request->pos(), request->instigator(), &items)));
+	}
+
+	void OnPinMenuRequested(nos::Name pinName, nosContextMenuRequestPtr request) override
+	{
+		auto sv = pinName.AsString();
+		if (!IsInputPin(sv) && !IsOutputPin(sv))
+			return;
+		auto letter = ParseLetter(sv);
+		if (!letter)
+			return;
+		if (Channels.size() <= 1)
+			return;
+		flatbuffers::FlatBufferBuilder fbb;
+		std::vector items = {nos::CreateContextMenuItemDirect(
+			fbb, "Remove Channel", MenuCommand(REMOVE_CHANNEL, static_cast<uint8_t>(*letter)))};
+		HandleEvent(CreateAppEvent(fbb, app::CreateAppContextMenuUpdateDirect(
+											fbb, request->item_id(), request->pos(), request->instigator(), &items)));
+	}
+
+	void OnMenuCommand(uuid const& itemID, uint32_t cmd) override
+	{
+		auto command = MenuCommand(cmd);
+		switch (command.Type)
+		{
+		case ADD_CHANNEL:
+		{
+			char newLetter = 0;
+			for (char c : CHANNEL_LETTERS)
+			{
+				if (!Channels.contains(c))
+				{
+					newLetter = c;
+					break;
+				}
+			}
+			if (newLetter == 0)
+			{
+				SetNodeStatusMessage("Maximum number of channels reached", fb::NodeStatusMessageType::WARNING);
+				return;
+			}
+
+			fb::TPin inPin;
+			inPin.id = uuid(nosEngine.GenerateID());
+			inPin.name = std::string("Input_") + newLetter;
+			inPin.type_name = "nos.Generic";
+			inPin.show_as = fb::ShowAs::INPUT_PIN;
+			inPin.can_show_as = fb::CanShowAs::INPUT_PIN_ONLY;
+
+			fb::TPin outPin;
+			outPin.id = uuid(nosEngine.GenerateID());
+			outPin.name = std::string("Output_") + newLetter;
+			outPin.type_name = "nos.Generic";
+			outPin.show_as = fb::ShowAs::OUTPUT_PIN;
+			outPin.can_show_as = fb::CanShowAs::OUTPUT_PIN_ONLY;
+			outPin.live = true;
+
+			nos::TPartialNodeUpdate update;
+			update.node_id = NodeId;
+			update.pins_to_add.emplace_back(std::make_unique<fb::TPin>(std::move(inPin)));
+			update.pins_to_add.emplace_back(std::make_unique<fb::TPin>(std::move(outPin)));
+			flatbuffers::FlatBufferBuilder fbb;
+			HandleEvent(CreateAppEvent(fbb, nos::CreatePartialNodeUpdate(fbb, &update)));
+			break;
+		}
+		case REMOVE_CHANNEL:
+		{
+			char letter = static_cast<char>(command.Letter);
+			auto it = Channels.find(letter);
+			if (it == Channels.end())
+				return;
+			auto& ch = *it->second;
+			nos::TPartialNodeUpdate update;
+			update.node_id = NodeId;
+			update.pins_to_delete = {ch.InputId, ch.OutputId};
+			flatbuffers::FlatBufferBuilder fbb;
+			HandleEvent(CreateAppEvent(fbb, nos::CreatePartialNodeUpdate(fbb, &update)));
+			break;
+		}
+		}
+	}
+};
+
+nosResult RegisterMultiBoundedQueue(nosNodeFunctions* functions)
+{
+	NOS_BIND_NODE_CLASS(NOS_NAME("MultiBoundedQueue"), MultiBoundedQueueNodeContext, functions)
+	return NOS_RESULT_SUCCESS;
+}
+
+} // namespace nos::utilities
diff --git a/Plugins/nosUtilities/Source/MultiLiveOut.cpp b/Plugins/nosUtilities/Source/MultiLiveOut.cpp
new file mode 100644
index 00000000..c4d08d88
--- /dev/null
+++ b/Plugins/nosUtilities/Source/MultiLiveOut.cpp
@@ -0,0 +1,189 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/PluginHelpers.hpp>
+
+namespace nos::utilities
+{
+
+struct MultiLiveOutNode : NodeContext
+{
+	MultiLiveOutNode(nosFbNodePtr node) : NodeContext(node)
+	{
+		for (auto* pin : *node->pins())
+		{
+			SetPinOrphanState(*pin->id(), nos::fb::PinOrphanStateType::ACTIVE);
+			auto index = GetPinIndex(pin->name()->string_view());
+			if (!index)
+			{
+				nosEngine.LogE("Failed to parse index from pin name: %s", pin->name()->c_str());
+				continue;
+			}
+			if (pin->show_as() == nosFbShowAs::OUTPUT_PIN)
+				IndexToPairs[*index].second = uuid(*pin->id());
+			else
+				IndexToPairs[*index].first = uuid(*pin->id());
+		}
+	}
+
+	void OnNodeUpdated(nosNodeUpdate const* update) override
+	{
+		if (update->Type == NOS_NODE_UPDATE_PIN_CREATED)
+		{
+			auto* pin = update->PinCreated;
+			auto index = GetPinIndex(pin->name()->string_view());
+			if (!index)
+				return;
+			if (pin->show_as() == nosFbShowAs::OUTPUT_PIN)
+				IndexToPairs[*index].second = uuid(*pin->id());
+			else
+				IndexToPairs[*index].first = uuid(*pin->id());
+		}
+		else if (update->Type == NOS_NODE_UPDATE_PIN_DELETED)
+		{
+			for (auto it = IndexToPairs.begin(); it != IndexToPairs.end(); ++it)
+			{
+				if (it->second.first == update->PinDeleted || it->second.second == update->PinDeleted)
+				{
+					IndexToPairs.erase(it);
+					break;
+				}
+			}
+		}
+	}
+
+	void OnMenuRequested(nosContextMenuRequestPtr request) override
+	{
+		flatbuffers::FlatBufferBuilder fbb;
+		std::vector<flatbuffers::Offset<nos::ContextMenuItem>> items;
+		if (*request->item_id() == NodeId)
+			items.push_back(nos::CreateContextMenuItemDirect(fbb, "Add New Pair", 1));
+		else
+		{
+			auto* pin = GetPin(*request->item_id());
+			if (!pin)
+				return;
+			if (pin->Name == NOS_NAME("Input_0") || pin->Name == NOS_NAME("Output_0"))
+				return;
+			items.push_back(nos::CreateContextMenuItemDirect(fbb, "Remove Pair", 1));
+		}
+		HandleEvent(CreateAppEvent(
+			fbb, CreateAppContextMenuUpdate(
+				fbb, request->item_id(), request->pos(), request->instigator(), fbb.CreateVector(items))));
+	}
+
+	// Handles both menu commands: "Add New Pair" when the item is the node, "Remove Pair" when it is one of its pins.
+	void OnMenuCommand(uuid const& itemID, uint32_t cmd) override
+	{
+		flatbuffers::FlatBufferBuilder fbb;
+		if (itemID == NodeId)
+		{
+			// Reuse the smallest non-negative index that has no pair yet.
+			int index = 0;
+			while (IndexToPairs.contains(index))
+				++index;
+			fb::TPin outPin;
+			outPin.id = uuid(nosEngine.GenerateID());
+			outPin.name = "Output_" + std::to_string(index);
+			outPin.type_name = NOS_NAME("nos.Generic");
+			outPin.live = true;
+			outPin.show_as = fb::ShowAs::OUTPUT_PIN;
+			outPin.can_show_as = fb::CanShowAs::OUTPUT_PIN_ONLY;
+
+			fb::TPin inPin;
+			inPin.id = uuid(nosEngine.GenerateID());
+			inPin.name = "Input_" + std::to_string(index);
+			inPin.type_name = NOS_NAME("nos.Generic");
+			inPin.show_as = fb::ShowAs::INPUT_PIN;
+			inPin.can_show_as = fb::CanShowAs::INPUT_PIN_ONLY;
+
+			// Record the ids before the pins are moved into the update; reading them afterwards is a use-after-move.
+			IndexToPairs[index] = {uuid(inPin.id), uuid(outPin.id)};
+			nos::TPartialNodeUpdate update;
+			update.node_id = NodeId;
+			update.pins_to_add.emplace_back(std::make_unique<fb::TPin>(std::move(outPin)));
+			update.pins_to_add.emplace_back(std::make_unique<fb::TPin>(std::move(inPin)));
+			HandleEvent(CreateAppEvent(fbb, nos::CreatePartialNodeUpdate(fbb, &update)));
+		}
+		else
+		{
+			auto* pin = GetPin(itemID);
+			if (!pin)
+				return;
+			auto index = GetPinIndex(pin->Name.AsString());
+			if (!index)
+			{
+				nosEngine.LogE("Failed to parse index from pin name: %s", pin->Name.AsCStr());
+				return;
+			}
+			nos::TPartialNodeUpdate update;
+			update.node_id = NodeId;
+			update.pins_to_delete = {IndexToPairs[*index].first, IndexToPairs[*index].second}; // delete both pins of the pair
+			HandleEvent(CreateAppEvent(fbb, nos::CreatePartialNodeUpdate(fbb, &update)));
+			IndexToPairs.erase(*index);
+		}
+	}
+
+	nosResult OnResolvePinDataTypes(nosResolvePinDataTypesParams* params) override
+	{
+		auto pinName = nos::Name(params->InstigatorPinName).AsString();
+		auto index = GetPinIndex(pinName);
+		if (!index.has_value())
+		{
+			strcpy(params->OutErrorMessage, "Failed to parse pin index from pin name.");
+			return NOS_RESULT_FAILED;
+		}
+		auto const& [firstId, secondId] = IndexToPairs[*index];
+		for (size_t i = 0; i < params->PinCount; i++)
+		{
+			auto& pin = params->Pins[i];
+			if (pin.Id == firstId || pin.Id == secondId)
+				pin.OutResolvedTypeName = params->IncomingTypeName;
+			else
+				pin.OutResolvedTypeName = NOS_NAME("nos.Generic");
+		}
+		return NOS_RESULT_SUCCESS;
+	}
+
+	std::optional<int32_t> GetPinIndex(std::string_view pinName) const // Parses the integer that follows the last '_' of a pin name.
+	{
+		auto indexPos = pinName.find_last_of('_');
+		if (indexPos == std::string::npos)
+			return std::nullopt; // no '_' at all: returns empty without logging
+		try
+		{
+			return std::stoi(std::string(pinName.substr(indexPos + 1))); // stoi stops at the first non-digit, so a suffix like "3x" yields 3
+		}
+		catch (...) // stoi throws when there is no leading number or the value is out of range
+		{
+			nosEngine.LogE("Failed to parse index from pin name: %s", std::string(pinName).c_str());
+			return std::nullopt;
+		}
+	}
+
+	nosResult ExecuteNode(nosNodeExecuteParams* params) override // Copies each pair's input pin data to its output pin.
+	{
+		for (auto const& [_, idPair] : IndexToPairs)
+		{
+			for (size_t i = 0; i < params->PinCount; ++i)
+			{
+				auto& pin = params->Pins[i];
+				if (pin.Id == idPair.first && pin.Data) // idPair.first is the input pin id, idPair.second the output pin id
+				{
+					nosEngine.SetPinValue(idPair.second, *pin.Data);
+					break; // the input pin of this pair was found; move on to the next pair
+				}
+			}
+		}
+		return NOS_RESULT_SUCCESS;
+	}
+
+	std::unordered_map<int32_t, std::pair<nos::uuid, nos::uuid>> IndexToPairs;
+};
+
+nosResult RegisterMultiLiveOut(nosNodeFunctions* fn)
+{
+	NOS_BIND_NODE_CLASS(NOS_NAME("MultiLiveOut"), MultiLiveOutNode, fn)
+	return NOS_RESULT_SUCCESS;
+}
+
+} // namespace nos::utilities
diff --git a/Plugins/nosUtilities/Source/MultiRing.h b/Plugins/nosUtilities/Source/MultiRing.h
new file mode 100644
index 00000000..c2d0ba14
--- /dev/null
+++ b/Plugins/nosUtilities/Source/MultiRing.h
@@ -0,0 +1,256 @@
+/*
+ * Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+ */
+
+#pragma once
+
+#include "Ring.h"
+
+namespace nos
+{
+
+// Ring that holds N independent channels under a single mutex / CV pair.
+// Each channel still owns its own slot pools and Resources, but every push,
+// pop, resize and reset goes through the shared synchronization, so an
+// N-channel batch push is a single lock acquisition, not N.
+struct MultiRing
+{
+	struct Channel
+	{
+		std::shared_ptr<ResourceInterface> ResInterface;
+		std::vector<rc<ResourceInterface::ResourceBase>> Resources;
+		std::deque<ResourceInterface::ResourceBase*> WritePool;
+		std::deque<ResourceInterface::ResourceBase*> ReadPool;
+		void* UserData = nullptr;
+	};
+
+	std::map<char, std::unique_ptr<Channel>> Channels;
+	std::mutex Mutex;
+	std::condition_variable WriteCV;
+	std::condition_variable ReadCV;
+	std::atomic_bool Exit = true;
+	uint32_t Size = 0;
+
+	~MultiRing() { Stop(); }
+
+	void Stop()
+	{
+		{
+			std::unique_lock lock(Mutex);
+			Exit = true;
+		}
+		WriteCV.notify_all();
+		ReadCV.notify_all();
+	}
+
+	void Start()
+	{
+		std::unique_lock lock(Mutex);
+		Exit = false;
+	}
+
+	void AllocateChannelResourcesUnlocked(Channel& ch) // Rebuilds ch with Size fresh resources; takes no lock itself (callers in this struct hold Mutex).
+	{
+		ch.WritePool.clear();
+		ch.ReadPool.clear();
+		ch.Resources.clear();
+		for (uint32_t i = 0; i < Size; ++i)
+		{
+			auto res = ch.ResInterface->CreateResource();
+			if (!res)
+			{
+				nosEngine.LogE("Failed to create resource for multi ring buffer.");
+				ch.Resources.clear(); // drop the partial allocation so the channel is left with no resources
+				ch.WritePool.clear();
+				ch.ReadPool.clear();
+				Exit = true; // same flag Stop() sets; the condition variables are not notified here
+				return;
+			}
+			ch.Resources.push_back(res);
+			ch.WritePool.push_back(res.get()); // every new slot starts out in the write pool
+		}
+	}
+
+	Channel& AddChannel(char key, std::shared_ptr<ResourceInterface> resInterface, void* userData = nullptr)
+	{
+		std::unique_lock lock(Mutex);
+		auto& ch = Channels[key];
+		if (!ch)
+			ch = std::make_unique<Channel>();
+		ch->ResInterface = std::move(resInterface);
+		ch->UserData = userData;
+		if (Size == 0)
+			Size = 1;
+		AllocateChannelResourcesUnlocked(*ch);
+		return *ch;
+	}
+
+	void RemoveChannel(char key)
+	{
+		std::unique_lock lock(Mutex);
+		Channels.erase(key);
+	}
+
+	void RecreateChannelResources(Channel& ch)
+	{
+		std::unique_lock lock(Mutex);
+		AllocateChannelResourcesUnlocked(ch);
+	}
+
+	void ResizeAll(uint32_t newSize)
+	{
+		std::unique_lock lock(Mutex);
+		Size = newSize;
+		for (auto& [_, ch] : Channels)
+			AllocateChannelResourcesUnlocked(*ch);
+	}
+
+	bool AreAllChannelsValid()
+	{
+		std::unique_lock lock(Mutex);
+		if (Channels.empty())
+			return false;
+		for (auto& [_, ch] : Channels)
+			if (ch->Resources.empty())
+				return false;
+		return true;
+	}
+
+	// Move slots between pools for every channel. fill=false: read→write.
+	void ResetAll(bool fill)
+	{
+		std::unique_lock lock(Mutex);
+		for (auto& [_, ch] : Channels)
+		{
+			auto& from = fill ? ch->WritePool : ch->ReadPool;
+			auto& to = fill ? ch->ReadPool : ch->WritePool;
+			while (!from.empty())
+			{
+				auto* slot = from.front();
+				from.pop_front();
+				ch->ResInterface->Reset(slot);
+				to.push_back(slot);
+			}
+		}
+	}
+
+	// If this channel is full and its read pool is non-empty, hand one slot back to the write pool and wake any
+	// producer waiting on WriteCV, as EndPop and CancelPushAll do (notifying while holding the lock is permitted).
+	void MoveOneReadToWriteIfFull(Channel& ch)
+	{
+		std::unique_lock lock(Mutex);
+		if (ch.ReadPool.size() != ch.Resources.size() || ch.ReadPool.empty())
+			return;
+		ch.WritePool.push_back(ch.ReadPool.front());
+		ch.ReadPool.pop_front();
+		WriteCV.notify_all();
+	}
+
+	bool IsFull(Channel const& ch)
+	{
+		std::unique_lock lock(Mutex);
+		return ch.ReadPool.size() == ch.Resources.size();
+	}
+
+	bool IsEmpty(Channel const& ch)
+	{
+		std::unique_lock lock(Mutex);
+		return ch.ReadPool.empty();
+	}
+
+	size_t WritePoolSize(Channel const& ch)
+	{
+		std::unique_lock lock(Mutex);
+		return ch.WritePool.size();
+	}
+
+	size_t ReadPoolSize(Channel const& ch)
+	{
+		std::unique_lock lock(Mutex);
+		return ch.ReadPool.size();
+	}
+
+	using SlotPair = std::pair<Channel*, ResourceInterface::ResourceBase*>;
+
+	// Atomically pop one slot from each requested channel's WritePool.
+	// Waits until every requested channel has at least one slot, or
+	// timeout/exit. The caller-supplied list typically excludes channels
+	// that don't have valid input data this frame.
+	bool BeginPushSubset(uint64_t timeoutMs,
+						 std::vector<Channel*> const& wanted,
+						 std::vector<SlotPair>& outSlots)
+	{
+		std::unique_lock lock(Mutex);
+		auto pred = [&] {
+			if (Exit)
+				return true;
+			if (wanted.empty())
+				return false;
+			for (auto* ch : wanted)
+				if (ch->WritePool.empty())
+					return false;
+			return true;
+		};
+		if (!WriteCV.wait_for(lock, std::chrono::milliseconds(timeoutMs), pred))
+			return false;
+		if (Exit)
+			return false;
+		outSlots.clear();
+		outSlots.reserve(wanted.size());
+		for (auto* ch : wanted)
+		{
+			auto* slot = ch->WritePool.front();
+			ch->WritePool.pop_front();
+			outSlots.emplace_back(ch, slot);
+		}
+		return true;
+	}
+
+	void EndPushAll(std::vector<SlotPair> const& slots)
+	{
+		{
+			std::unique_lock lock(Mutex);
+			for (auto& [ch, slot] : slots)
+				ch->ReadPool.push_back(slot);
+		}
+		ReadCV.notify_all();
+	}
+
+	void CancelPushAll(std::vector<SlotPair> const& slots)
+	{
+		{
+			std::unique_lock lock(Mutex);
+			for (auto& [ch, slot] : slots)
+			{
+				slot->FrameNumber = 0;
+				ch->WritePool.push_front(slot);
+			}
+		}
+		WriteCV.notify_all();
+	}
+
+	ResourceInterface::ResourceBase* BeginPop(Channel& ch, uint64_t timeoutMs)
+	{
+		std::unique_lock lock(Mutex);
+		if (!ReadCV.wait_for(lock, std::chrono::milliseconds(timeoutMs),
+							 [&] { return !ch.ReadPool.empty() || Exit; }))
+			return nullptr;
+		if (Exit)
+			return nullptr;
+		auto* slot = ch.ReadPool.front();
+		ch.ReadPool.pop_front();
+		return slot;
+	}
+
+	void EndPop(Channel& ch, ResourceInterface::ResourceBase* slot)
+	{
+		{
+			std::unique_lock lock(Mutex);
+			slot->FrameNumber = 0;
+			ch.WritePool.push_back(slot);
+		}
+		WriteCV.notify_all();
+	}
+};
+
+} // namespace nos
diff --git a/Plugins/nosUtilities/Source/MultiRingBuffer.cpp b/Plugins/nosUtilities/Source/MultiRingBuffer.cpp
new file mode 100644
index 00000000..2c446299
--- /dev/null
+++ b/Plugins/nosUtilities/Source/MultiRingBuffer.cpp
@@ -0,0 +1,731 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#pragma once
+
+#include <set>
+
+#include <Nodos/PluginHelpers.hpp>
+
+// External
+#include <glm/glm.hpp>
+#include <nosVulkanSubsystem/Helpers.hpp>
+
+#include "MultiRing.h"
+#include "Ring.h"
+#include "nosUtil/Stopwatch.hpp"
+
+namespace nos::utilities
+{
+
+struct MultiRingBufferNodeContext : NodeContext
+{
+	using RingMode = RingNodeBase::RingMode;
+	using OnRestartType = RingNodeBase::OnRestartType;
+
+	static constexpr std::string_view CHANNEL_LETTERS = "ABCDEFGHIJKLMNOPQRSTUVWXYZ";
+
+	enum MenuCommandType : uint8_t
+	{
+		ADD_CHANNEL = 0,    // node menu: append a new channel
+		REMOVE_CHANNEL = 1, // pin menu: delete the channel encoded in Letter
+	};
+
+	// Packed context-menu command: bits 0-7 carry the action type, bits 8-15 the channel letter.
+	struct MenuCommand
+	{
+		MenuCommandType Type;
+		uint8_t Letter;
+		MenuCommand(uint32_t cmd)
+			: Type(static_cast<MenuCommandType>(cmd & 0xFF)),
+			  Letter(static_cast<uint8_t>((cmd >> 8) & 0xFF))
+		{}
+		MenuCommand(MenuCommandType type, uint8_t letter) : Type(type), Letter(letter) {}
+		operator uint32_t() const { return (static_cast<uint32_t>(Letter) << 8) | Type; }
+	};
+
+	struct Channel
+	{
+		char Letter; // channel id; also the suffix of both pin names
+		nos::Name InputName; // "Input_<Letter>"
+		nos::Name OutputName; // "Output_<Letter>"
+		uuid InputId{};
+		uuid OutputId{};
+		nos::TypeInfo TypeInfo; // starts as NSN_Generic until a concrete pin type is known
+		MultiRing::Channel* RingChannel = nullptr; // points at the channel returned by Ring.AddChannel
+		std::atomic_bool IsOutLive = false; // liveness last applied to (or read from) the output pin
+		ResourceInterface::ResourceBase* LastPopped = nullptr; // slot handed out by the latest CopyFrom, not yet EndPop'ed
+		bool NeedsRecreation = false; // set when CheckNewResource reports a change; consumed in OnPathStart
+		std::size_t RemainingRepeatableCount = 0; // CopyFrom calls that may still repeat the pin value; set in OnPathStart
+
+		Channel(char letter)
+			: Letter(letter),
+			  InputName((std::string("Input_") + letter).c_str()),
+			  OutputName((std::string("Output_") + letter).c_str()),
+			  TypeInfo(NSN_Generic)
+		{
+		}
+	};
+
+	std::map<char, std::unique_ptr<Channel>> Channels; // keyed by channel letter
+	std::unordered_map<uuid, char> PinIdToLetter; // input and output pin ids -> channel letter
+	MultiRing Ring;
+	// Channels popped since the last SendScheduleRequest. One producer run
+	// pushes one slot per live channel, so we must only schedule again once
+	// every live channel has been popped — otherwise schedule requests pile
+	// up by a factor of N (channels) per consumer tick.
+	std::set<char> PoppedSinceLastSchedule;
+
+	OnRestartType OnRestart = OnRestartType::WAIT_UNTIL_FULL;
+	std::optional<uint32_t> RequestedRingSize = std::nullopt; // pending size; applied and cleared in OnPathStart
+	std::atomic<RingMode> Mode = RingMode::CONSUME;
+	std::condition_variable ModeCV; // notified by ExecuteNode when Mode leaves FILL
+	std::mutex ModeMutex; // held by CopyFrom while it waits on ModeCV
+	std::atomic_bool RepeatWhenFilling = false; // mirrors the "RepeatWhenFilling" pin
+
+	std::string GetName() const { return std::string("MultiRingBuffer"); } // prefix for this node's log messages
+
+	// Returns the channel letter of a pin name ending in "_<A-Z>"; nullopt for any other name.
+	static std::optional<char> ParseLetter(std::string_view pinName)
+	{
+		auto const underscore = pinName.rfind('_');
+		bool const hasOneCharSuffix = underscore != std::string_view::npos && underscore + 2 == pinName.size();
+		if (!hasOneCharSuffix)
+			return std::nullopt;
+		char const letter = pinName.back();
+		return (letter >= 'A' && letter <= 'Z') ? std::optional<char>(letter) : std::nullopt;
+	}
+
+	static bool IsInputPin(std::string_view pinName) { return pinName.starts_with(std::string_view("Input_")); } // channel input pins
+	static bool IsOutputPin(std::string_view pinName) { return pinName.starts_with(std::string_view("Output_")); } // channel output pins
+
+	MultiRingBufferNodeContext(nosFbNodePtr node) : NodeContext(node)
+	{
+		std::vector<uuid> pinsToUnorphan;
+		for (auto* pin : *node->pins()) // rebuild channel bookkeeping from the pins the node already has
+		{
+			auto pinNameSv = pin->name()->string_view();
+			if (!IsInputPin(pinNameSv) && !IsOutputPin(pinNameSv))
+				continue;
+			auto letter = ParseLetter(pinNameSv);
+			if (!letter)
+				continue;
+
+			auto& channel = Channels[*letter]; // default-inserts an empty entry the first time a letter is seen
+			if (!channel)
+				channel = std::make_unique<Channel>(*letter);
+
+			if (IsInputPin(pinNameSv))
+				channel->InputId = uuid(*pin->id());
+			else
+			{
+				channel->OutputId = uuid(*pin->id());
+				channel->IsOutLive = pin->live();
+			}
+			PinIdToLetter[uuid(*pin->id())] = *letter;
+
+			nos::Name typeName(pin->type_name()->c_str());
+			if (typeName != NSN_Generic && channel->TypeInfo->TypeName == NSN_Generic) // first concrete pin type wins
+				channel->TypeInfo = nos::TypeInfo(typeName);
+
+			if (auto orphanState = pin->orphan_state())
+				if (orphanState->type() == fb::PinOrphanStateType::ORPHAN)
+					pinsToUnorphan.push_back(uuid(*pin->id()));
+		}
+
+		for (auto& [_, ch] : Channels) // create one ring channel per discovered letter
+			InitChannel(*ch);
+
+		for (auto const& pinId : pinsToUnorphan) // orphaned channel pins are switched back to ACTIVE
+			SetPinOrphanState(pinId, fb::PinOrphanStateType::ACTIVE);
+
+		AddPinValueWatcher(NSN_Size, [this](nos::Buffer const& newSize, std::optional<nos::Buffer> oldVal) {
+			uint32_t size = *newSize.As<uint32_t>();
+			if (oldVal && oldVal == newSize) // value did not change
+				return;
+			RequestRingResize(size);
+		});
+		AddPinValueWatcher(NSN_Alignment, [this](nos::Buffer const& newAlignment, std::optional<nos::Buffer> oldVal) {
+			bool any = false; // true once at least one channel reports that its resources must change
+			for (auto& [_, ch] : Channels)
+			{
+				if (!ch->RingChannel)
+					continue;
+				if (ch->RingChannel->ResInterface->CheckNewResource(NSN_Alignment, newAlignment, oldVal))
+				{
+					nosEngine.SendPathRestart(ch->InputId);
+					ch->NeedsRecreation = true; // picked up by OnPathStart
+					any = true;
+				}
+			}
+			if (any)
+			{
+				Ring.Stop();
+				PoppedSinceLastSchedule.clear();
+			}
+		});
+		AddPinValueWatcher(NOS_NAME_STATIC("RepeatWhenFilling"),
+						   [this](nos::Buffer const& newVal, std::optional<nos::Buffer> oldVal) {
+							   RepeatWhenFilling = *newVal.As<bool>();
+						   });
+	}
+
+	~MultiRingBufferNodeContext() override
+	{
+		for (auto& [_, ch] : Channels)
+			NOS_SOFT_CHECK(ch->LastPopped == nullptr); // OnPathStop hands popped slots back, so none is expected here
+		Ring.Stop();
+	}
+
+	// Adds a ring channel for `ch`, choosing the resource implementation from the channel's type.
+	void InitChannel(Channel& ch)
+	{
+		std::shared_ptr<ResourceInterface> backing;
+		if (ch.TypeInfo->TypeName == NOS_NAME(sys::vulkan::Buffer::GetFullyQualifiedName()))
+			backing = std::make_shared<GPUBufferResource>();
+		else if (ch.TypeInfo->TypeName == NOS_NAME(sys::vulkan::Texture::GetFullyQualifiedName()))
+			backing = std::make_shared<GPUTextureResource>();
+		else
+			backing = std::make_shared<CPUTrivialResource>(); // every other type, Generic included
+		ch.RingChannel = &Ring.AddChannel(ch.Letter, std::move(backing), &ch);
+	}
+
+	// Maps a pin id to its channel; nullptr when the pin or its channel is unknown.
+	Channel* GetChannelByPinId(uuid const& id)
+	{
+		if (auto letterIt = PinIdToLetter.find(id); letterIt != PinIdToLetter.end())
+			if (auto channelIt = Channels.find(letterIt->second); channelIt != Channels.end())
+				return channelIt->second.get();
+		return nullptr;
+	}
+
+	// Sets the output pin value from the channel's first ring resource (GPU buffer / texture only).
+	void SeedOutputPin(Channel& ch)
+	{
+		bool const hasResources = ch.RingChannel && !ch.RingChannel->Resources.empty();
+		auto* firstSlot = hasResources ? ch.RingChannel->Resources[0].get() : nullptr;
+		if (!firstSlot)
+			return;
+		if (ch.TypeInfo->TypeName == NOS_NAME(sys::vulkan::Buffer::GetFullyQualifiedName()))
+		{
+			if (auto* gpuBuffer = ResourceInterface::GetResource<GPUBufferResource>(firstSlot))
+				nosEngine.SetPinValueByName(NodeId, ch.OutputName, gpuBuffer->VkRes.ToPinData());
+			return;
+		}
+		if (!(ch.TypeInfo->TypeName == NOS_NAME(sys::vulkan::Texture::GetFullyQualifiedName())))
+			return; // other channel types are not seeded
+		if (auto* gpuTexture = ResourceInterface::GetResource<GPUTextureResource>(firstSlot))
+		{
+			sys::vulkan::TTexture texDef = vkss::ConvertTextureInfo(gpuTexture->VkRes);
+			texDef.unscaled = true;
+			nosEngine.SetPinValueByName(NodeId, ch.OutputName, nos::Buffer::From(texDef));
+		}
+	}
+
+	// Announces `size` to every channel's input path, stops the ring, restarts the paths and
+	// records the size in RequestedRingSize. A size of 0 is rejected with a warning.
+	void RequestRingResize(uint32_t size)
+	{
+		if (size == 0)
+		{
+			nosEngine.LogW((GetName() + " size cannot be 0").c_str());
+			return;
+		}
+		bool const pendingAgrees = RequestedRingSize.value_or(size) == size;
+		if (Ring.Size == size && pendingAgrees)
+			return; // nothing to change
+		nosPathCommand ringSizeChange{.Event = NOS_RING_SIZE_CHANGE, .RingSize = size};
+		for (auto& [_, channel] : Channels)
+			if (channel->RingChannel)
+				nosEngine.SendPathCommand(channel->InputId, ringSizeChange);
+		Ring.Stop();
+		PoppedSinceLastSchedule.clear();
+		SendPathRestart();
+		RequestedRingSize = size;
+	}
+
+	void SendPathRestart()
+	{
+		for (auto const& entry : Channels) // one restart request per channel input pin
+			nosEngine.SendPathRestart(entry.second->InputId);
+	}
+
+	// For channel input pins: asks the channel's resource interface whether the new value needs
+	// different resources and, if so, restarts the path, stops the ring and flags recreation.
+	void OnPinValueChanged(nos::Name pinName, uuid const& pinId, nosBuffer value) override
+	{
+		if (!IsInputPin(pinName.AsString()))
+			return;
+		auto* channel = GetChannelByPinId(pinId);
+		if (!channel || !channel->RingChannel)
+			return;
+		if (!channel->RingChannel->ResInterface->CheckNewResource(NSN_Input, value, std::nullopt))
+			return;
+		nosEngine.SendPathRestart(channel->InputId);
+		Ring.Stop();
+		PoppedSinceLastSchedule.clear();
+		channel->NeedsRecreation = true;
+	}
+
+	nosResult OnResolvePinDataTypes(nosResolvePinDataTypesParams* params) override
+	{
+		auto pinNameStr = nos::Name(params->InstigatorPinName).AsString();
+		auto letter = ParseLetter(pinNameStr);
+		if (!letter)
+			return NOS_RESULT_FAILED;
+		auto chIt = Channels.find(*letter);
+		if (chIt == Channels.end())
+			return NOS_RESULT_FAILED;
+		auto& ch = *chIt->second;
+		if (ch.TypeInfo->TypeName != NSN_Generic) // only a still-generic channel can be resolved
+			return NOS_RESULT_FAILED;
+		ch.TypeInfo = nos::TypeInfo(params->IncomingTypeName);
+		// Drop the Generic-fallback ring channel so OnPinUpdated re-inits with the resolved type.
+		if (ch.RingChannel)
+		{
+			Ring.Stop();
+			PoppedSinceLastSchedule.clear();
+			Ring.RemoveChannel(*letter);
+			ch.RingChannel = nullptr;
+		}
+		for (size_t i = 0; i < params->PinCount; i++)
+		{
+			auto& pinInfo = params->Pins[i];
+			if (pinInfo.Id == ch.InputId || pinInfo.Id == ch.OutputId) // both pins of the channel resolve to the same type
+				pinInfo.OutResolvedTypeName = ch.TypeInfo->TypeName;
+		}
+		return NOS_RESULT_SUCCESS;
+	}
+
+	void OnPinUpdated(const nosPinUpdate*) override
+	{
+		for (auto const& entry : Channels) // create the ring channel of every channel that lacks one
+			if (Channel& channel = *entry.second; channel.RingChannel == nullptr)
+				InitChannel(channel);
+	}
+
+	// Keeps the channel bookkeeping in sync with pins deleted from or created on the node.
+	void OnNodeUpdated(nosNodeUpdate const* update) override
+	{
+		if (update->Type == NOS_NODE_UPDATE_PIN_DELETED)
+		{
+			auto it = PinIdToLetter.find(update->PinDeleted);
+			if (it == PinIdToLetter.end())
+				return;
+			char letter = it->second;
+			PinIdToLetter.erase(it);
+			auto chIt = Channels.find(letter);
+			if (chIt == Channels.end())
+				return;
+			auto& ch = *chIt->second;
+			// The channel goes away only once both of its pins have been deleted.
+			if (!PinIdToLetter.contains(ch.InputId) && !PinIdToLetter.contains(ch.OutputId))
+			{
+				if (ch.RingChannel)
+					Ring.RemoveChannel(letter);
+				// Forget the letter as well: a stale entry would make CopyFrom count the
+				// deleted channel as popped and send its schedule request one pop early.
+				PoppedSinceLastSchedule.erase(letter);
+				Channels.erase(chIt);
+			}
+		}
+		else if (update->Type == NOS_NODE_UPDATE_PIN_CREATED)
+		{
+			auto* pin = update->PinCreated;
+			auto sv = pin->name()->string_view();
+			if (!IsInputPin(sv) && !IsOutputPin(sv))
+				return;
+			auto letter = ParseLetter(sv);
+			if (!letter)
+				return;
+			auto& chPtr = Channels[*letter]; // default-inserts an empty entry for a new letter
+			if (!chPtr)
+				chPtr = std::make_unique<Channel>(*letter);
+			if (IsInputPin(sv))
+				chPtr->InputId = uuid(*pin->id());
+			else
+			{
+				chPtr->OutputId = uuid(*pin->id());
+				chPtr->IsOutLive = pin->live();
+			}
+			PinIdToLetter[uuid(*pin->id())] = *letter;
+			if (!chPtr->RingChannel) // the first pin of a channel creates its ring channel
+				InitChannel(*chPtr);
+		}
+	}
+
+	// Producer step: pushes one slot for every channel that has valid input, all under one claim.
+	nosResult ExecuteNode(nosNodeExecuteParams* params) override
+	{
+		if (Channels.empty() || Ring.Exit)
+			return NOS_RESULT_FAILED;
+
+		NodeExecuteParams pins(params);
+		uint32_t requestedSize = *pins.GetPinData<uint32_t>(NSN_Size);
+
+		struct Gathered
+		{
+			Channel* NodeCh;
+			MultiRing::Channel* RingCh;
+			void* Input;
+		};
+		std::vector<Gathered> gathered; // channels taking part in this push, in Channels order
+		gathered.reserve(Channels.size());
+		std::vector<MultiRing::Channel*> wantedRings; // same order as `gathered`
+		wantedRings.reserve(Channels.size());
+
+		uint32_t maxRequired = requestedSize;
+		std::string adjustMessage;
+		for (auto& [_, ch] : Channels)
+		{
+			if (!ch->RingChannel || ch->RingChannel->Resources.empty() || !ch->TypeInfo)
+				continue;
+			auto it = pins.find(ch->InputName);
+			if (it == pins.end())
+				continue;
+			void* input = ch->RingChannel->ResInterface->GetPinInfo(it->second, true);
+			if (!input)
+				continue;
+			auto [required, message] = ch->RingChannel->ResInterface->GetRequiredRingSize(input, requestedSize);
+			if (required > maxRequired) // the largest requirement across channels wins
+			{
+				maxRequired = required;
+				adjustMessage = message;
+			}
+			gathered.push_back({ch.get(), ch->RingChannel, input});
+			wantedRings.push_back(ch->RingChannel);
+		}
+		if (gathered.empty())
+		{
+			SendScheduleRequest(0);
+			return NOS_RESULT_FAILED;
+		}
+
+		bool effectiveSizeAdjusted = maxRequired != requestedSize;
+		ClearNodeStatusMessages();
+		if (effectiveSizeAdjusted)
+			SetNodeStatusMessage(adjustMessage, fb::NodeStatusMessageType::WARNING);
+
+		if (Ring.Size != maxRequired) // resize first; this run pushes nothing
+		{
+			RequestRingResize(maxRequired);
+			if (effectiveSizeAdjusted)
+				nosEngine.LogW("%s", adjustMessage.c_str());
+			return NOS_RESULT_FAILED;
+		}
+
+		std::vector<MultiRing::SlotPair> slots;
+		if (!Ring.BeginPushSubset(100, wantedRings, slots))
+			return Ring.Exit ? NOS_RESULT_FAILED : NOS_RESULT_PENDING;
+
+		// Push outside the lock — Vulkan command recording can be slow.
+		for (size_t i = 0; i < gathered.size(); ++i)
+		{
+			auto& g = gathered[i];
+			auto* slot = slots[i].second; // slots[i] belongs to wantedRings[i], i.e. to gathered[i]
+			g.RingCh->ResInterface->Push(slot, g.Input, params,
+										 NOS_NAME_STATIC("MultiRingBuffer"), true);
+			if (!g.NodeCh->IsOutLive)
+			{
+				ChangePinLiveness(g.NodeCh->OutputName, true);
+				g.NodeCh->IsOutLive = true;
+			}
+		}
+
+		Ring.EndPushAll(slots);
+
+		if (Mode == RingMode::FILL)
+		{
+			bool isFillComplete = true; // true when no pushed channel has a free write slot left
+			for (auto* rc : wantedRings)
+				isFillComplete = isFillComplete && Ring.WritePoolSize(*rc) == 0;
+			if (isFillComplete)
+			{
+				// Change Mode under ModeMutex: CopyFrom checks its wait predicate while holding
+				// it, so an unlocked store + notify could land between check and wait and be lost.
+				std::lock_guard modeLock(ModeMutex);
+				Mode = RingMode::CONSUME;
+				ModeCV.notify_all();
+			}
+		}
+
+		return NOS_RESULT_SUCCESS;
+	}
+
+	nosResult CopyFrom(nosCopyInfo* cpy) override
+	{
+		auto* ch = GetChannelByPinId(cpy->ID);
+		if (!ch || !ch->RingChannel || Ring.Exit)
+			return NOS_RESULT_FAILED;
+		if (!ch->IsOutLive) // output not live: succeed without popping anything
+			return NOS_RESULT_SUCCESS;
+
+		// EndPop the previous frame's slot before popping a new one. We can't
+		// rely on OnEndFrame: the engine only fires it on the path's primary
+		// source pin, so live secondary outputs (e.g. a second channel feeding
+		// the same consumer) never receive it. By the time the consumer asks
+		// for the next frame on this pin, it's done with the previous one.
+		if (ch->LastPopped)
+		{
+			Ring.EndPop(*ch->RingChannel, ch->LastPopped);
+			ch->LastPopped = nullptr;
+		}
+
+		if (OnRestart == OnRestartType::WAIT_UNTIL_FULL && RepeatWhenFilling)
+		{
+			if (ch->RemainingRepeatableCount > 0) // budget set in OnPathStart
+			{
+				ch->RingChannel->ResInterface->OnRepeatPinValue(cpy);
+				ch->RemainingRepeatableCount--;
+				return NOS_RESULT_SUCCESS;
+			}
+		}
+		else if (Mode == RingMode::FILL)
+		{
+			std::unique_lock lock(ModeMutex);
+			if (!ModeCV.wait_for(lock, std::chrono::milliseconds(100),
+								 [this] { return Mode != RingMode::FILL; }))
+				return NOS_RESULT_PENDING; // still filling after 100 ms
+		}
+
+		ResourceInterface::ResourceBase* slot;
+		{
+			ScopedProfilerEvent _({.Name = "Wait For Filled Slot"});
+			slot = Ring.BeginPop(*ch->RingChannel, 100);
+		}
+		if (!slot)
+			return Ring.Exit ? NOS_RESULT_FAILED : NOS_RESULT_PENDING;
+
+		nos::Buffer outPinVal;
+		bool changePinValue = ch->RingChannel->ResInterface->BeginCopyFrom(slot, *cpy->PinData, outPinVal);
+		if (changePinValue)
+			nosEngine.SetPinValueByName(NodeId, ch->OutputName, outPinVal);
+
+		ch->RingChannel->ResInterface->WaitForDownloadToEnd(slot, "MultiRingBuffer", NodeName.AsString(), cpy);
+
+		cpy->CopyFromOptions.ShouldSetSourceFrameNumber = true;
+		cpy->FrameNumber = slot->FrameNumber;
+
+		ch->LastPopped = slot; // handed back by the next CopyFrom on this channel or by OnPathStop
+
+		PoppedSinceLastSchedule.insert(ch->Letter);
+		size_t liveCount = 0; // number of channels whose output is currently live
+		for (auto& [_, c] : Channels)
+			if (c->IsOutLive)
+				++liveCount;
+		if (PoppedSinceLastSchedule.size() >= liveCount) // every live channel popped: schedule one producer run
+		{
+			SendScheduleRequest(1);
+			PoppedSinceLastSchedule.clear();
+		}
+		return NOS_RESULT_SUCCESS;
+	}
+
+	// On a failed frame reported for a channel pin other than its output, marks the channel's
+	// output as not live. Slots are not released here: EndPop happens at the start of the next
+	// CopyFrom for the channel, because OnEndFrame is unreliable for secondary live outputs.
+	void OnEndFrame(uuid const& pinId, nosEndFrameCause cause) override
+	{
+		if (cause != NOS_END_FRAME_FAILED)
+			return;
+
+		auto* channel = GetChannelByPinId(pinId);
+		if (!channel)
+			return;
+		if (pinId == channel->OutputId) // failures reported on the output pin are ignored
+			return;
+		if (!channel->IsOutLive) // already marked not live
+			return;
+		// ExecuteNode turns the output live again after its next push.
+		ChangePinLiveness(channel->OutputName, false);
+		channel->IsOutLive = false;
+	}
+
+	void SendScheduleRequest(uint32_t count, bool reset = false) const
+	{
+		nosScheduleNodeParams request{.NodeId = NodeId, .AddScheduleCount = count, .Reset = reset};
+		nosEngine.ScheduleNode(&request); // passes `count` and `reset` to the engine for this node
+	}
+
+	// Handles NOS_RING_SIZE_CHANGE: records a non-zero requested size and writes it to the Size
+	// pin. Every other path event is ignored.
+	void OnPathCommand(const nosPathCommand* command) override
+	{
+		if (command->Event != NOS_RING_SIZE_CHANGE)
+			return;
+		auto const newSize = command->RingSize;
+		if (newSize == 0)
+			return;
+		RequestedRingSize = newSize;
+		// NOTE(review): the GetPinId result is dereferenced unchecked; assumes the Size pin exists.
+		nosEngine.SetPinValue(*GetPinId(NSN_Size), nos::Buffer::From(newSize));
+	}
+
+	// Arms FILL mode when configured to wait until full, hands back held slots, stops the ring.
+	void OnPathStop() override
+	{
+		if (OnRestart == OnRestartType::WAIT_UNTIL_FULL)
+			Mode = RingMode::FILL;
+		for (auto& [letter, channel] : Channels)
+		{
+			if (!channel->LastPopped || !channel->RingChannel)
+				continue;
+			Ring.EndPop(*channel->RingChannel, channel->LastPopped);
+			channel->LastPopped = nullptr;
+		}
+		Ring.Stop();
+		PoppedSinceLastSchedule.clear();
+	}
+
+	void OnPathStart() override
+	{
+		if (Channels.empty())
+			return;
+
+		PoppedSinceLastSchedule.clear();
+
+		if (OnRestart == OnRestartType::RESET || RepeatWhenFilling)
+			Ring.ResetAll(false);
+		else
+		{
+			for (auto& [_, ch] : Channels)
+				if (ch->RingChannel)
+					Ring.MoveOneReadToWriteIfFull(*ch->RingChannel);
+		}
+
+		if (RequestedRingSize) // apply a pending resize; per-channel recreation flags are dropped with it
+		{
+			Ring.ResizeAll(*RequestedRingSize);
+			for (auto& [_, ch] : Channels)
+				ch->NeedsRecreation = false;
+			RequestedRingSize = std::nullopt;
+		}
+		for (auto& [_, ch] : Channels)
+		{
+			if (ch->NeedsRecreation && ch->RingChannel)
+			{
+				Ring.RecreateChannelResources(*ch->RingChannel);
+				ch->NeedsRecreation = false;
+			}
+		}
+
+		size_t totalSchedule = 0; // largest number of free write slots over all channels
+		for (auto& [_, ch] : Channels)
+		{
+			if (!ch->RingChannel)
+				continue;
+			if (ch->RingChannel->Resources.empty())
+			{
+				totalSchedule = std::max<size_t>(totalSchedule, 1); // no resources yet: still ask for one run
+				continue;
+			}
+			auto emptySlotCount = Ring.WritePoolSize(*ch->RingChannel);
+			if (RepeatWhenFilling)
+				ch->RemainingRepeatableCount = std::max(emptySlotCount, (size_t)1) - 1; // free slots minus one, never below zero
+			totalSchedule = std::max(totalSchedule, emptySlotCount);
+			ch->RingChannel->ResInterface->OnPathStart();
+			SeedOutputPin(*ch);
+		}
+		Ring.Start();
+		if (totalSchedule > 0)
+		{
+			nosScheduleNodeParams schedule{.NodeId = NodeId, .AddScheduleCount = (uint32_t)totalSchedule};
+			nosEngine.ScheduleNode(&schedule);
+		}
+	}
+
+	void OnNodeMenuRequested(nosContextMenuRequestPtr request) override
+	{
+		flatbuffers::FlatBufferBuilder builder; // node menu holds a single "Add Channel" entry
+		std::vector items = {nos::CreateContextMenuItemDirect(builder, "Add Channel", MenuCommand(ADD_CHANNEL, 0))};
+		auto menuUpdate = app::CreateAppContextMenuUpdateDirect(
+			builder, request->item_id(), request->pos(), request->instigator(), &items);
+		HandleEvent(CreateAppEvent(builder, menuUpdate));
+	}
+
+	// Offers "Remove Channel" on channel pins (Input_<letter> / Output_<letter>), unless only one
+	// channel is left.
+	void OnPinMenuRequested(nos::Name pinName, nosContextMenuRequestPtr request) override
+	{
+		auto const name = pinName.AsString();
+		bool const isChannelPin = IsInputPin(name) || IsOutputPin(name);
+		auto const letter = isChannelPin ? ParseLetter(name) : std::nullopt;
+		if (!letter || Channels.size() <= 1)
+			return;
+		flatbuffers::FlatBufferBuilder builder;
+		uint32_t const removeCommand = MenuCommand(REMOVE_CHANNEL, static_cast<uint8_t>(*letter));
+		std::vector items = {nos::CreateContextMenuItemDirect(builder, "Remove Channel", removeCommand)};
+		auto menuUpdate = app::CreateAppContextMenuUpdateDirect(
+			builder, request->item_id(), request->pos(), request->instigator(), &items);
+		HandleEvent(CreateAppEvent(builder, menuUpdate));
+	}
+
+	// Executes a context-menu command: ADD_CHANNEL adds an Input_/Output_ pin pair for the first
+	// unused letter, REMOVE_CHANNEL deletes both pins of the channel encoded in the command.
+	void OnMenuCommand(uuid const& itemID, uint32_t cmd) override
+	{
+		MenuCommand const command(cmd);
+		switch (command.Type)
+		{
+		case ADD_CHANNEL:
+		{
+			// First letter of CHANNEL_LETTERS that no existing channel uses.
+			std::optional<char> freeLetter;
+			for (char candidate : CHANNEL_LETTERS)
+				if (!freeLetter && !Channels.contains(candidate))
+					freeLetter = candidate;
+			if (!freeLetter)
+			{
+				SetNodeStatusMessage("Maximum number of channels reached", fb::NodeStatusMessageType::WARNING);
+				return;
+			}
+			std::string const suffix(1, *freeLetter);
+
+			auto inPin = std::make_unique<fb::TPin>();
+			inPin->id = uuid(nosEngine.GenerateID());
+			inPin->name = "Input_" + suffix;
+			inPin->type_name = "nos.Generic";
+			inPin->show_as = fb::ShowAs::INPUT_PIN;
+			inPin->can_show_as = fb::CanShowAs::INPUT_PIN_ONLY;
+
+			auto outPin = std::make_unique<fb::TPin>();
+			outPin->id = uuid(nosEngine.GenerateID());
+			outPin->name = "Output_" + suffix;
+			outPin->type_name = "nos.Generic";
+			outPin->show_as = fb::ShowAs::OUTPUT_PIN;
+			outPin->can_show_as = fb::CanShowAs::OUTPUT_PIN_ONLY;
+			outPin->live = true;
+
+			nos::TPartialNodeUpdate update;
+			update.node_id = NodeId;
+			update.pins_to_add.push_back(std::move(inPin));
+			update.pins_to_add.push_back(std::move(outPin));
+			flatbuffers::FlatBufferBuilder builder;
+			HandleEvent(CreateAppEvent(builder, nos::CreatePartialNodeUpdate(builder, &update)));
+			break;
+		}
+		case REMOVE_CHANNEL:
+		{
+			char const letter = static_cast<char>(command.Letter);
+			auto const found = Channels.find(letter);
+			if (found == Channels.end())
+				return;
+			// Both pins are deleted in a single partial node update.
+			auto& channel = *found->second;
+			nos::TPartialNodeUpdate update;
+			update.node_id = NodeId;
+			update.pins_to_delete = {channel.InputId, channel.OutputId};
+			flatbuffers::FlatBufferBuilder builder;
+			HandleEvent(CreateAppEvent(builder, nos::CreatePartialNodeUpdate(builder, &update)));
+			break;
+		}
+		}
+	}
+};
+
+nosResult RegisterMultiRingBuffer(nosNodeFunctions* functions)
+{
+	NOS_BIND_NODE_CLASS(NOS_NAME("MultiRingBuffer"), MultiRingBufferNodeContext, functions) // presumably fills `functions` for the "MultiRingBuffer" class; macro body not visible here
+	return NOS_RESULT_SUCCESS;
+}
+
+} // namespace nos::utilities
diff --git a/Plugins/nosUtilities/Source/ScheduleRequest.cpp b/Plugins/nosUtilities/Source/ScheduleRequest.cpp
new file mode 100644
index 00000000..4b21f93b
--- /dev/null
+++ b/Plugins/nosUtilities/Source/ScheduleRequest.cpp
@@ -0,0 +1,80 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/PluginHelpers.hpp>
+
+namespace nos::utilities
+{
+
+// Drives an on-demand path: each execution (and each path start) queues another
+// schedule request, so the path feeding the Trigger pin keeps running. Wire the
+// thing you want scheduled into Sink. Ported from nos.flow (dev branch).
+struct ScheduleRequestNode : NodeContext
+{
+	bool TryAgainOnFailure = true; // re-schedule when a frame ends with NOS_END_FRAME_FAILED
+	nosVec2u DeltaSeconds = { 1, 60 }; // reported through GetScheduleInfo
+	uint32_t Importance = 1; // reported through GetScheduleInfo
+
+	// Seeds the cached settings from the data already stored on the node's pins.
+	ScheduleRequestNode(nosFbNodePtr node) : NodeContext(node)
+	{
+		auto const* pins = node->pins();
+		if (!pins)
+			return;
+		for (auto const* pin : *pins)
+			if (auto const* bytes = pin->data(); bytes && bytes->size())
+				ReadPin(nos::Name(pin->name()->c_str()), bytes->data());
+	}
+
+	// Updates the cached setting called `name` from `data`, read as that setting's value type.
+	// Any other name is ignored.
+	void ReadPin(nos::Name name, const void* data)
+	{
+		if (name == NOS_NAME("DeltaSeconds"))
+			DeltaSeconds = *static_cast<const nosVec2u*>(data);
+		else if (name == NOS_NAME("Importance"))
+			Importance = *static_cast<const uint32_t*>(data);
+		else if (name == NOS_NAME("TryAgainOnFailure"))
+			TryAgainOnFailure = *static_cast<const bool*>(data);
+	}
+
+	void OnPinValueChanged(nos::Name pinName, uuid const& pinId, nosBuffer value) override { ReadPin(pinName, value.Data); }
+
+	// Declares the node as on-demand scheduled, using the cached DeltaSeconds and Importance.
+	void GetScheduleInfo(nosScheduleInfo* info) override
+	{
+		info->Type = NOS_SCHEDULE_TYPE_ON_DEMAND;
+		info->DeltaSeconds = DeltaSeconds;
+		info->Importance = Importance;
+	}
+
+	// Queues one more schedule request for this node.
+	void ScheduleOnce()
+	{
+		nosScheduleNodeParams request{ .NodeId = NodeId, .AddScheduleCount = 1, .Reset = false };
+		nosEngine.ScheduleNode(&request);
+	}
+
+	// Every execution immediately queues the next one.
+	nosResult ExecuteNode(nosNodeExecuteParams* params) override
+	{
+		ScheduleOnce();
+		return NOS_RESULT_SUCCESS;
+	}
+
+	void OnPathStart() override { ScheduleOnce(); }
+
+	// Queues another request after a failed frame when TryAgainOnFailure is set.
+	void OnEndFrame(uuid const& pinId, nosEndFrameCause cause) override
+	{
+		if (cause == NOS_END_FRAME_FAILED && TryAgainOnFailure)
+			ScheduleOnce();
+	}
+};
+
+nosResult RegisterScheduleRequest(nosNodeFunctions* fn)
+{
+	NOS_BIND_NODE_CLASS(NOS_NAME("ScheduleRequest"), ScheduleRequestNode, fn); // presumably fills `fn` for the "ScheduleRequest" class; macro body not visible here
+	return NOS_RESULT_SUCCESS;
+}
+
+} // namespace nos::utilities
diff --git a/Plugins/nosUtilities/Source/Sink.cpp b/Plugins/nosUtilities/Source/Sink.cpp
index 043982f3..28294d7e 100644
--- a/Plugins/nosUtilities/Source/Sink.cpp
+++ b/Plugins/nosUtilities/Source/Sink.cpp
@@ -5,6 +5,7 @@
 
 // stl
 #include <chrono>
+#include <list>
 #include <nosUtil/Stopwatch.hpp>
 
 #include "Sink_generated.h"
@@ -18,6 +19,33 @@ constexpr uint64_t VULKAN_TIMEOUT_BEFORE_LEAK =
 
 struct SinkNode : NodeContext
 {
+	enum MenuCommandType : uint8_t
+	{
+		ADD_INPUT = 0,    // node menu: append a new sink input pin
+		REMOVE_INPUT = 1, // pin menu: delete the dynamic input at InputIndex
+	};
+
+	// Packed context-menu command: bits 0-7 carry the action type, bits 8-15 the input index.
+	struct MenuCommand
+	{
+		MenuCommandType Type;
+		uint8_t InputIndex;
+		MenuCommand(uint32_t cmd)
+			: Type(static_cast<MenuCommandType>(cmd & 0xFF)), InputIndex(static_cast<uint8_t>((cmd >> 8) & 0xFF))
+		{}
+		MenuCommand(MenuCommandType type, uint8_t inputIndex) : Type(type), InputIndex(inputIndex) {}
+		operator uint32_t() const { return (static_cast<uint32_t>(InputIndex) << 8) | Type; }
+	};
+
+	// Pin names treated as built-in; input pins with any other name are tracked as dynamic inputs.
+	static const std::unordered_set<std::string_view>& StaticPinNames()
+	{
+		using NameSet = std::unordered_set<std::string_view>;
+		static const NameSet kStaticNames{"InExe", "Sink Input", "Sink FPS", "HasGPUWork", "GPUFrameBuffering",
+										  "AcceptsRepeat", "SinkMode", "LatencyBudget"};
+		return kStaticNames;
+	}
+
 	std::mutex Mutex;
 	std::atomic<bool> ShouldStop = false;
 	std::atomic<float> Fps = 1000.0f / 60.0f;
@@ -31,9 +59,27 @@ struct SinkNode : NodeContext
 	std::optional<std::vector<nosGPUEvent>> GPUFrameSyncEvents = std::nullopt;
 	size_t GPUFrameBuffering = 1;
 	uint64_t CurrentGPUEventIndex = 0;
+	std::vector<uuid> DynamicInputs;
 
 
 	SinkNode(nosFbNodePtr inNode) : NodeContext(inNode) {
+		std::list<uuid> pinsToUnorphan;
+		for (auto i = 0; i < inNode->pins()->size(); i++)
+		{
+			auto pin = inNode->pins()->Get(i);
+			if (pin->show_as() != fb::ShowAs::INPUT_PIN)
+				continue;
+			if (StaticPinNames().contains(pin->name()->string_view()))
+				continue;
+			DynamicInputs.push_back(*pin->id());
+			if (auto orphanState = pin->orphan_state())
+			{
+				if (orphanState->type() == fb::PinOrphanStateType::ORPHAN)
+					pinsToUnorphan.push_back(*pin->id());
+			}
+		}
+		for (auto const& pinId : pinsToUnorphan)
+			SetPinOrphanState(pinId, fb::PinOrphanStateType::ACTIVE);
 		AddPinValueWatcher(NOS_NAME("HasGPUWork"),
 						   [this](nosBuffer const& newVal, std::optional<nos::Buffer> oldValue) {
 							   bool hasGpuWork = *static_cast<bool*>(newVal.Data);
@@ -255,6 +301,93 @@ struct SinkNode : NodeContext
 		}
 	}
 
+	// Node context menu: a single "Add Sink" entry that issues ADD_INPUT.
+	void OnNodeMenuRequested(nosContextMenuRequestPtr request) override
+	{
+		flatbuffers::FlatBufferBuilder builder;
+		uint32_t const addCommand = MenuCommand(ADD_INPUT, 0); // the index is not read for ADD_INPUT
+		std::vector items = {nos::CreateContextMenuItemDirect(builder, "Add Sink", addCommand, nullptr)};
+		auto menuUpdate = app::CreateAppContextMenuUpdateDirect(
+			builder, request->item_id(), request->pos(), request->instigator(), &items);
+		HandleEvent(CreateAppEvent(builder, menuUpdate));
+	}
+
+	// Offers "Remove Input" on dynamic input pins. The pin's index in DynamicInputs travels in the
+	// 8-bit InputIndex field of the command, so a pin whose index does not fit gets no menu entry.
+	void OnPinMenuRequested(nos::Name pinName, nosContextMenuRequestPtr request) override
+	{
+		if (StaticPinNames().contains(pinName.AsString()))
+			return;
+		auto pinId = GetPinId(pinName);
+		if (!pinId)
+			return;
+		auto it = std::find(DynamicInputs.begin(), DynamicInputs.end(), *pinId);
+		auto index = std::distance(DynamicInputs.begin(), it);
+		if (it == DynamicInputs.end() || index > 0xFF) // not a dynamic input, or the index would wrap in uint8_t
+			return;
+		uint32_t cmd = MenuCommand(REMOVE_INPUT, static_cast<uint8_t>(index));
+		flatbuffers::FlatBufferBuilder fbb;
+		std::vector items = {nos::CreateContextMenuItemDirect(fbb, "Remove Input", cmd, nullptr)};
+		HandleEvent(CreateAppEvent(fbb, app::CreateAppContextMenuUpdateDirect(
+			fbb, request->item_id(), request->pos(), request->instigator(), &items)));
+	}
+
+	// Executes a context-menu command: ADD_INPUT appends a generic "Sink Input <n>" input pin,
+	// REMOVE_INPUT deletes the dynamic input stored at the encoded index.
+	void OnMenuCommand(uuid const& itemID, uint32_t cmd) override
+	{
+		MenuCommand const command(cmd);
+		switch (command.Type)
+		{
+		case ADD_INPUT:
+		{
+			// Smallest n >= 2 for which no pin named "Sink Input <n>" exists yet.
+			size_t suffix = 2;
+			std::string pinName = "Sink Input " + std::to_string(suffix);
+			while (GetPinId(nos::Name(pinName)))
+				pinName = "Sink Input " + std::to_string(++suffix);
+
+			flatbuffers::FlatBufferBuilder builder;
+			uuid pinId = nosEngine.GenerateID();
+			std::vector pins = {fb::CreatePinDirect(builder, &pinId, pinName.c_str(), "nos.Generic",
+													fb::ShowAs::INPUT_PIN, fb::CanShowAs::INPUT_PIN_ONLY)};
+			auto nodeUpdate = CreatePartialNodeUpdateDirect(builder, &NodeId, ClearFlags::NONE, 0, &pins);
+			HandleEvent(CreateAppEvent(builder, nodeUpdate));
+			break;
+		}
+		case REMOVE_INPUT:
+		{
+			if (command.InputIndex >= DynamicInputs.size())
+				return; // the index does not refer to a tracked dynamic input
+
+			auto pinId = DynamicInputs[command.InputIndex];
+			flatbuffers::FlatBufferBuilder builder;
+			std::vector pinsToRemove = {pinId};
+			auto nodeUpdate = CreatePartialNodeUpdateDirect(builder, &NodeId, ClearFlags::NONE, &pinsToRemove);
+			HandleEvent(CreateAppEvent(builder, nodeUpdate));
+			break;
+		}
+		}
+	}
+
+
+	// Keeps DynamicInputs in sync with the node: forgets deleted pins and appends newly created
+	// input pins whose name is not one of the static pin names.
+	void OnNodeUpdated(nosNodeUpdate const* update) override
+	{
+		if (update->Type == NOS_NODE_UPDATE_PIN_DELETED)
+		{
+			std::erase_if(DynamicInputs, [&](auto tracked) { return tracked == update->PinDeleted; });
+			return;
+		}
+		if (update->Type != NOS_NODE_UPDATE_PIN_CREATED)
+			return;
+		auto* created = update->PinCreated;
+		bool const isInput = created->show_as() == fb::ShowAs::INPUT_PIN;
+		if (isInput && !StaticPinNames().contains(created->name()->string_view()))
+			DynamicInputs.push_back(*created->id());
+	}
+
 	void GetScheduleInfo(nosScheduleInfo* info) override
 	{
 		info->Type = NOS_SCHEDULE_TYPE_ON_DEMAND;
diff --git a/Plugins/nosUtilities/Source/TextRender.cpp b/Plugins/nosUtilities/Source/TextRender.cpp
new file mode 100644
index 00000000..37548680
--- /dev/null
+++ b/Plugins/nosUtilities/Source/TextRender.cpp
@@ -0,0 +1,699 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+
+#include <Nodos/PluginHelpers.hpp>
+#include <nosVulkanSubsystem/Helpers.hpp>
+
+#include <algorithm>
+#include <array>
+#include <cstring>
+#include <filesystem>
+#include <optional>
+#include <string>
+#include <vector>
+
+#include <ft2build.h>
+#include FT_FREETYPE_H
+#include FT_MODULE_H
+
+namespace nos::utilities
+{
+namespace fs = std::filesystem;
+
+NOS_REGISTER_NAME(TextRender) // node class name; bound and used as the shaders' associated class in this file
+NOS_REGISTER_NAME(TextGlyph_Pass) // pass and shader keys registered in RegisterTextRender
+NOS_REGISTER_NAME(TextGlyph_Frag)
+NOS_REGISTER_NAME(TextGlyph_Vert)
+NOS_REGISTER_NAME(TextBox_Pass)
+NOS_REGISTER_NAME(TextBox_Frag)
+NOS_REGISTER_NAME(TextBox_Vert)
+
+NOS_REGISTER_NAME(Text) // names looked up in the execute params by ExecuteNode
+NOS_REGISTER_NAME(FontSize)
+NOS_REGISTER_NAME(Color)
+NOS_REGISTER_NAME(Opacity)
+NOS_REGISTER_NAME(StrokeColor) // also a shader binding name in DrawGlyph
+NOS_REGISTER_NAME(StrokeWidth) // also a shader binding name in DrawGlyph
+NOS_REGISTER_NAME(ShadowColor)
+NOS_REGISTER_NAME(ShadowOffset)
+NOS_REGISTER_NAME(ShadowSoftness)
+NOS_REGISTER_NAME(BackgroundColor)
+NOS_REGISTER_NAME(BackgroundPadding)
+NOS_REGISTER_NAME(HorizontalAlign)
+NOS_REGISTER_NAME(VerticalAlign)
+NOS_REGISTER_NAME(Position)
+NOS_REGISTER_NAME(Resolution)
+NOS_REGISTER_NAME(WrapWidth)
+NOS_REGISTER_NAME(Font)
+NOS_REGISTER_NAME(Output)
+
+NOS_REGISTER_NAME(Offset) // shader binding names used by DrawBox / DrawGlyph
+NOS_REGISTER_NAME(Size)
+NOS_REGISTER_NAME(AtlasRect)
+NOS_REGISTER_NAME(FillColor)
+NOS_REGISTER_NAME(Softness)
+NOS_REGISTER_NAME(PxRange)
+NOS_REGISTER_NAME(Atlas)
+NOS_REGISTER_NAME(BoxColor)
+
+// ASCII printable range packed into the SDF atlas; characters outside it have no glyph.
+constexpr uint32_t FIRST_CHAR = 32; // ' '
+constexpr uint32_t LAST_CHAR = 126; // '~'
+constexpr uint32_t GLYPH_COUNT = LAST_CHAR - FIRST_CHAR + 1;
+// Reference pixel size the atlas is rasterized at; layout scales by FontSize / REF_PIXEL_SIZE.
+constexpr float REF_PIXEL_SIZE = 72.0f;
+// SDF spread in reference pixels: how far signed-distance data extends from the
+// glyph edge. Caps the usable outline thickness and shadow softness.
+constexpr int SDF_SPREAD = 16;
+constexpr int ATLAS_WIDTH = 1024; // fixed atlas width in pixels; the height follows from shelf packing
+constexpr int ATLAS_PADDING = 2; // empty pixels kept between packed glyphs and along the atlas border
+// Upper bound on laid-out glyphs per execution (each is drawn once, plus once more when a shadow is enabled).
+constexpr size_t MAX_DRAWN_GLYPHS = 8192;
+
+struct Glyph // metrics and atlas placement of one atlas character, filled by BuildAtlas
+{
+	int AtlasX = 0, AtlasY = 0; // top-left in atlas pixels
+	int Width = 0, Height = 0;  // bitmap size in reference pixels
+	float BearingLeft = 0;      // pen-origin to bitmap left, reference pixels
+	float BearingTop = 0;       // baseline to bitmap top, reference pixels
+	float Advance = 0;          // horizontal advance, reference pixels
+	bool HasBitmap = false; // false when no SDF bitmap was produced (e.g. space): the glyph only advances the pen
+};
+
+struct TextRenderNode : NodeContext
+{
+	FT_Library Library = nullptr;
+	nosResourceShareInfo AtlasTex{};
+
+	std::array<Glyph, GLYPH_COUNT> Glyphs{};
+	int AtlasW = 0, AtlasH = 0;
+	float RefLineHeight = REF_PIXEL_SIZE * 1.2f;
+	float RefAscender = REF_PIXEL_SIZE;
+
+	// Resolved font path of the last atlas build attempt (the bundled font's path when the Font pin is empty); unset until the first attempt.
+	std::optional<std::string> BuiltFontPath;
+	bool AtlasValid = false;
+
+	TextRenderNode(nosFbNodePtr node) : NodeContext(node) // sets up FreeType and the SDF renderer spread
+	{
+		if (FT_Init_FreeType(&Library)) // on failure Library stays null and BuildAtlas refuses to run
+		{
+			Library = nullptr;
+			nosEngine.LogE("TextRender: failed to initialize FreeType");
+			return;
+		}
+		if (FT_Int spread = SDF_SPREAD; FT_Property_Set(Library, "sdf", "spread", &spread)) // ExecuteNode derives pxRange from SDF_SPREAD
+			nosEngine.LogE("TextRender: could not set the SDF spread; glyph edges, outlines and shadows may render incorrectly");
+	}
+
+	~TextRenderNode() override
+	{
+		DestroyAtlas(); // release the atlas texture first, then the FreeType library
+		if (Library != nullptr)
+			FT_Done_FreeType(Library);
+	}
+
+	void DestroyAtlas()
+	{
+		AtlasValid = false; // ExecuteNode skips all glyph drawing until a build succeeds again
+		if (AtlasTex.Memory.Handle != 0)
+			nosVulkan->DestroyResource(&AtlasTex);
+		AtlasTex = nosResourceShareInfo{};
+	}
+
+	std::string ResolveFontPath(const char* fontPin) const
+	{
+		if (fontPin != nullptr && *fontPin != '\0') // a non-empty Font pin value is used verbatim
+			return std::string(fontPin);
+		const fs::path moduleRoot = nosEngine.Module->RootFolderPath; // otherwise fall back to the bundled font
+		return (moduleRoot / "Fonts" / "RobotoMono-Regular.ttf").generic_string();
+	}
+
+	// Rasterizes the printable ASCII range [FIRST_CHAR, LAST_CHAR] of the font at `fontPath`
+	// into a single-channel SDF atlas at REF_PIXEL_SIZE and uploads it as the new AtlasTex.
+	// Returns true on success. The previous atlas is destroyed only right before the upload,
+	// so a font that cannot be opened or sized leaves the current atlas in place.
+	bool BuildAtlas(const std::string& fontPath)
+	{
+		if (!Library)
+			return false;
+
+		FT_Face face = nullptr;
+		if (FT_New_Face(Library, fontPath.c_str(), 0, &face))
+		{
+			nosEngine.LogE("TextRender: could not open font '%s'", fontPath.c_str());
+			return false;
+		}
+		// Sizing can fail (e.g. for faces with fixed sizes only); do not rasterize at an unknown size.
+		if (FT_Set_Pixel_Sizes(face, 0, static_cast<FT_UInt>(REF_PIXEL_SIZE)))
+		{
+			FT_Done_Face(face);
+			nosEngine.LogE("TextRender: could not size font '%s' for the atlas", fontPath.c_str());
+			return false;
+		}
+
+		const float lineHeight = float(face->size->metrics.height >> 6); // 26.6 fixed point -> whole pixels
+		const float ascender = float(face->size->metrics.ascender >> 6);
+		RefLineHeight = lineHeight > 0.0f ? lineHeight : REF_PIXEL_SIZE * 1.2f;
+		RefAscender = ascender > 0.0f ? ascender : REF_PIXEL_SIZE;
+
+		struct Raster
+		{
+			std::vector<uint8_t> Pixels;
+			int W = 0, H = 0;
+		};
+		std::array<Raster, GLYPH_COUNT> rasters{};
+		std::array<Glyph, GLYPH_COUNT> glyphs{};
+
+		for (uint32_t i = 0; i < GLYPH_COUNT; ++i)
+		{
+			Glyph& g = glyphs[i];
+			if (FT_Load_Char(face, FIRST_CHAR + i, FT_LOAD_DEFAULT))
+				continue;
+			FT_GlyphSlot slot = face->glyph;
+			g.Advance = float(slot->advance.x >> 6);
+
+			if (FT_Render_Glyph(slot, FT_RENDER_MODE_SDF))
+				continue; // whitespace / empty outline: advance is still valid
+
+			const FT_Bitmap& bm = slot->bitmap;
+			if (bm.width == 0 || bm.rows == 0)
+				continue;
+
+			g.Width = int(bm.width);
+			g.Height = int(bm.rows);
+			g.BearingLeft = float(slot->bitmap_left);
+			g.BearingTop = float(slot->bitmap_top);
+			g.HasBitmap = true;
+
+			Raster& r = rasters[i];
+			r.W = int(bm.width);
+			r.H = int(bm.rows);
+			r.Pixels.resize(size_t(r.W) * r.H);
+			const int pitch = bm.pitch;
+			for (int row = 0; row < r.H; ++row)
+			{
+				const uint8_t* src = bm.buffer + size_t(row) * (pitch < 0 ? -pitch : pitch);
+				std::memcpy(r.Pixels.data() + size_t(row) * r.W, src, r.W);
+			}
+		}
+		FT_Done_Face(face);
+
+		// Shelf-pack the glyph bitmaps into a fixed-width atlas.
+		int x = ATLAS_PADDING, y = ATLAS_PADDING, shelfH = 0;
+		for (uint32_t i = 0; i < GLYPH_COUNT; ++i)
+		{
+			Glyph& g = glyphs[i];
+			if (!g.HasBitmap)
+				continue;
+			if (x + g.Width + ATLAS_PADDING > ATLAS_WIDTH)
+			{
+				x = ATLAS_PADDING;
+				y += shelfH + ATLAS_PADDING;
+				shelfH = 0;
+			}
+			g.AtlasX = x;
+			g.AtlasY = y;
+			x += g.Width + ATLAS_PADDING;
+			shelfH = std::max(shelfH, g.Height);
+		}
+		const int atlasW = ATLAS_WIDTH;
+		const int atlasH = y + shelfH + ATLAS_PADDING;
+
+		std::vector<uint8_t> pixels(size_t(atlasW) * atlasH, 0);
+		for (uint32_t i = 0; i < GLYPH_COUNT; ++i)
+		{
+			const Glyph& g = glyphs[i];
+			const Raster& r = rasters[i];
+			if (!g.HasBitmap)
+				continue;
+			for (int row = 0; row < r.H; ++row)
+				std::memcpy(pixels.data() + size_t(g.AtlasY + row) * atlasW + g.AtlasX, r.Pixels.data() + size_t(row) * r.W, r.W);
+		}
+
+		DestroyAtlas();
+
+		nosResourceShareInfo atlas{};
+		atlas.Info.Type = NOS_RESOURCE_TYPE_TEXTURE;
+		atlas.Info.Texture = {.Width = uint32_t(atlasW), .Height = uint32_t(atlasH), .Format = NOS_FORMAT_R8_UNORM};
+		auto cmd = vkss::BeginCmd(NOS_NAME("TextRenderAtlasUpload"), NodeId);
+		nosResult res = nosVulkan->ImageLoad(
+			cmd, pixels.data(), nosVec2u{uint32_t(atlasW), uint32_t(atlasH)}, NOS_FORMAT_R8_UNORM, &atlas, "TextRenderAtlas");
+		vkss::EndCmd(cmd, NOS_TRUE, nullptr);
+		if (res != NOS_RESULT_SUCCESS)
+		{
+			nosEngine.LogE("TextRender: failed to upload font atlas");
+			return false;
+		}
+
+		atlas.Info.Texture.Filter = NOS_TEXTURE_FILTER_LINEAR;
+		AtlasTex = atlas;
+		AtlasW = atlasW;
+		AtlasH = atlasH;
+		Glyphs = glyphs;
+		AtlasValid = true;
+		return true;
+	}
+
+	void EnsureAtlas(const char* fontPin) // builds the atlas when the resolved font path changes
+	{
+		std::string path = ResolveFontPath(fontPin); // an empty pin resolves to the bundled font
+		if (BuiltFontPath && *BuiltFontPath == path)
+			return; // one attempt per path: a font that failed to load is not re-opened and re-logged on every execution
+		BuiltFontPath = path;
+		if (BuildAtlas(path))
+			ClearNodeStatusMessages();
+		else
+			SetNodeStatusMessage("Could not load font.", fb::NodeStatusMessageType::FAILURE);
+	}
+
+	const Glyph* GlyphFor(char c) const
+	{
+		// Widen through uint8_t so the range test sees the byte value 0..255.
+		const uint32_t code = static_cast<uint8_t>(c);
+		const bool inAtlas = FIRST_CHAR <= code && code <= LAST_CHAR;
+		return inAtlas ? &Glyphs[code - FIRST_CHAR] : nullptr;
+	}
+
+	// One laid-out glyph produced by LayoutText: index into Glyphs plus its pen origin on the line.
+	struct Placed
+	{
+		uint32_t GlyphIndex; // character code minus FIRST_CHAR
+		float PenX; // pen x at the glyph origin, in output pixels from the line start (alignment offset not applied)
+		int Line; // zero-based line number; also indexes the lineWidths filled by LayoutText
+	};
+
+	// Greedy word-wrap layout in output-pixel space. Honors '\n' and breaks words wider than
+	// maxWidth character by character; characters outside the atlas range are skipped.
+	//   text: NUL-terminated input. scale: reference-to-output pixel factor. maxWidth: wrap limit.
+	//   out: drawable glyphs are appended here, at most MAX_DRAWN_GLYPHS in total.
+	//   lineWidths: expected empty; receives one width per line, measured to the end of the line's
+	//   last glyph so trailing whitespace cannot skew centered/right-aligned lines or the box.
+	void LayoutText(const char* text, float scale, float maxWidth,
+					std::vector<Placed>& out, std::vector<float>& lineWidths) const
+	{
+		const Glyph* spaceGlyph = GlyphFor(' ');
+		const float spaceAdvance = (spaceGlyph ? spaceGlyph->Advance : REF_PIXEL_SIZE * 0.3f) * scale;
+
+		int line = 0;
+		float penX = 0.0f;
+		float inkEnd = 0.0f; // pen x right after the last glyph placed on the current line
+		lineWidths.push_back(0.0f);
+
+		auto newLine = [&] {
+			lineWidths[line] = inkEnd;
+			++line;
+			penX = inkEnd = 0.0f;
+			lineWidths.push_back(0.0f);
+		};
+		auto placeChar = [&](char c) {
+			const Glyph* g = GlyphFor(c);
+			if (!g)
+				return;
+			auto idx = uint32_t(uint8_t(c)) - FIRST_CHAR;
+			if (g->HasBitmap && out.size() < MAX_DRAWN_GLYPHS)
+				out.push_back({idx, penX, line});
+			penX += g->Advance * scale;
+			inkEnd = penX;
+		};
+
+		std::string word;
+		auto wordWidth = [&](const std::string& w) {
+			float width = 0.0f;
+			for (char c : w)
+				if (const Glyph* g = GlyphFor(c))
+					width += g->Advance * scale;
+			return width;
+		};
+		auto flushWord = [&] {
+			if (word.empty())
+				return;
+			float ww = wordWidth(word);
+			if (ww > maxWidth)
+			{
+				// Word does not fit on any line: hard-break per character.
+				for (char c : word)
+				{
+					const Glyph* g = GlyphFor(c);
+					float adv = g ? g->Advance * scale : 0.0f;
+					if (penX > 0.0f && penX + adv > maxWidth)
+						newLine();
+					placeChar(c);
+				}
+			}
+			else
+			{
+				if (penX > 0.0f && penX + ww > maxWidth)
+					newLine();
+				for (char c : word)
+					placeChar(c);
+			}
+			word.clear();
+		};
+
+		for (const char* p = text; *p; ++p)
+		{
+			char c = *p;
+			if (c == '\n')
+			{
+				flushWord();
+				newLine();
+			}
+			else if (c == ' ' || c == '\t')
+			{
+				// Whitespace only moves the pen (and is dropped at a line start); inkEnd stays put.
+				flushWord();
+				float adv = (c == '\t') ? spaceAdvance * 4.0f : spaceAdvance;
+				if (penX > 0.0f)
+					penX += adv;
+			}
+			else
+				word.push_back(c);
+		}
+		flushWord();
+		lineWidths[line] = inkEnd;
+	}
+
+	// Draws a flat-colored rectangle (the text-box background) into `tex` with the TextBox pass; x/y/w/h are in output pixels.
+	void DrawBox(nosCmd cmd,
+				 const nosResourceShareInfo& tex,
+				 float outW,
+				 float outH,
+				 float x,
+				 float y,
+				 float w,
+				 float h,
+				 nosVec4 boxColor)
+	{
+		nosVec2 offset{x / outW, y / outH}; // rectangle origin as a fraction of the output size
+		nosVec2 size{w / outW, h / outH}; // rectangle extent as a fraction of the output size
+		std::array bindings = {vkss::ShaderBinding(NSN_Offset, offset),
+							   vkss::ShaderBinding(NSN_Size, size),
+							   vkss::ShaderBinding(NSN_BoxColor, boxColor)};
+		nosVertexData vertexData{
+			.DepthFunc = NOS_DEPTH_FUNCTION_ALWAYS,
+			.DepthWrite = NOS_FALSE,
+			.DepthTest = NOS_FALSE,
+		};
+		nosRunPassParams pass{.Key = NSN_TextBox_Pass,
+							  .Bindings = bindings.data(),
+							  .BindingCount = uint32_t(bindings.size()),
+							  .Output = tex,
+							  .Vertices = vertexData,
+							  .Wireframe = NOS_FALSE,
+							  .Benchmark = NOS_FALSE,
+							  .DoNotClear = NOS_TRUE}; // DoNotClear: the pass draws on top of what is already in tex
+		nosVulkan->RunPass(cmd, &pass);
+	}
+
+	// Draws one glyph quad into `tex` with the TextGlyph pass, sampling AtlasTex. Used for both the shadow and the
+	// fill/stroke pass: the shadow passes the shadow color as the fill with a softened edge. Rect values are output pixels.
+	void DrawGlyph(nosCmd cmd,
+				   const nosResourceShareInfo& tex,
+				   float outW,
+				   float outH,
+				   float glyphLeft,
+				   float glyphTop,
+				   float glyphW,
+				   float glyphH,
+				   nosVec4 atlasRect,
+				   nosVec4 fillColor,
+				   nosVec4 strokeColor,
+				   float strokeWidth,
+				   float softness,
+				   float pxRange)
+	{
+		nosVec2 offset{glyphLeft / outW, glyphTop / outH}; // quad origin as a fraction of the output size
+		nosVec2 size{glyphW / outW, glyphH / outH}; // quad extent as a fraction of the output size
+		std::array bindings = {vkss::ShaderBinding(NSN_Offset, offset),
+							   vkss::ShaderBinding(NSN_Size, size),
+							   vkss::ShaderBinding(NSN_AtlasRect, atlasRect),
+							   vkss::ShaderBinding(NSN_FillColor, fillColor),
+							   vkss::ShaderBinding(NSN_StrokeColor, strokeColor),
+							   vkss::ShaderBinding(NSN_StrokeWidth, strokeWidth),
+							   vkss::ShaderBinding(NSN_Softness, softness),
+							   vkss::ShaderBinding(NSN_PxRange, pxRange),
+							   vkss::ShaderBinding(NSN_Atlas, AtlasTex)};
+		nosVertexData vertexData{
+			.DepthFunc = NOS_DEPTH_FUNCTION_ALWAYS,
+			.DepthWrite = NOS_FALSE,
+			.DepthTest = NOS_FALSE,
+		};
+		nosRunPassParams pass{.Key = NSN_TextGlyph_Pass,
+							  .Bindings = bindings.data(),
+							  .BindingCount = uint32_t(bindings.size()),
+							  .Output = tex,
+							  .Vertices = vertexData,
+							  .Wireframe = NOS_FALSE,
+							  .Benchmark = NOS_FALSE,
+							  .DoNotClear = NOS_TRUE}; // DoNotClear: glyphs accumulate on top of what is already in tex
+		nosVulkan->RunPass(cmd, &pass);
+	}
+
+	nosResult ExecuteNode(nosNodeExecuteParams* rawParams) override
+	{
+		NodeExecuteParams args(rawParams);
+		// Renders the Text pin into the Output texture: background box, drop shadows, then fill + outline.
+		const char* fontPin = args.GetPinData<const char>(NSN_Font);
+		EnsureAtlas(fontPin);
+
+		auto resolution = *reinterpret_cast<nosVec2u*>(args[NSN_Resolution].Data->Data);
+		if (resolution.x == 0 || resolution.y == 0)
+			return NOS_RESULT_SUCCESS;
+
+		// Resize the output texture to match the requested resolution.
+		auto tex = vkss::DeserializeTextureInfo(args[NSN_Output].Data->Data);
+		if (tex.Info.Texture.Width != resolution.x || tex.Info.Texture.Height != resolution.y)
+		{
+			auto resized = tex;
+			resized.Memory = {};
+			resized.Info.Texture.Width = resolution.x;
+			resized.Info.Texture.Height = resolution.y;
+			auto texFb = vkss::ConvertTextureInfo(resized);
+			texFb.unscaled = true;
+			auto buf = nos::Buffer::From(texFb);
+			nosEngine.SetPinValue(args[NSN_Output].Id, {.Data = buf.Data(), .Size = buf.Size()});
+			tex = vkss::DeserializeTextureInfo(args[NSN_Output].Data->Data);
+		}
+		if (tex.Memory.Handle == 0) // no texture memory to draw into
+			return NOS_RESULT_SUCCESS;
+
+		const char* text = args.GetPinData<const char>(NSN_Text);
+		float fontSize = *reinterpret_cast<float*>(args[NSN_FontSize].Data->Data);
+		float opacity = std::clamp(*reinterpret_cast<float*>(args[NSN_Opacity].Data->Data), 0.0f, 1.0f);
+		auto textColor = *reinterpret_cast<nosVec4*>(args[NSN_Color].Data->Data);
+		auto strokeColor = *reinterpret_cast<nosVec4*>(args[NSN_StrokeColor].Data->Data);
+		float strokeWidthPin = *reinterpret_cast<float*>(args[NSN_StrokeWidth].Data->Data);
+		auto shadowColor = *reinterpret_cast<nosVec4*>(args[NSN_ShadowColor].Data->Data);
+		auto shadowOffset = *reinterpret_cast<nosVec2*>(args[NSN_ShadowOffset].Data->Data);
+		float shadowSoftnessPin = *reinterpret_cast<float*>(args[NSN_ShadowSoftness].Data->Data);
+		auto boxColor = *reinterpret_cast<nosVec4*>(args[NSN_BackgroundColor].Data->Data);
+		auto boxPadding = *reinterpret_cast<nosVec2*>(args[NSN_BackgroundPadding].Data->Data);
+		auto hAlign = *reinterpret_cast<uint32_t*>(args[NSN_HorizontalAlign].Data->Data);
+		auto vAlign = *reinterpret_cast<uint32_t*>(args[NSN_VerticalAlign].Data->Data);
+		auto position = *reinterpret_cast<nosVec2*>(args[NSN_Position].Data->Data);
+		auto wrapWidthChars = *reinterpret_cast<uint32_t*>(args[NSN_WrapWidth].Data->Data);
+
+		// Global opacity folds into every color's alpha.
+		textColor.w *= opacity;
+		strokeColor.w *= opacity;
+		shadowColor.w *= opacity;
+		boxColor.w *= opacity;
+
+		// The frame outside the text box stays transparent.
+		auto cmd = vkss::BeginCmd(NOS_NAME("TextRender"), NodeId);
+		nosVulkan->Clear(cmd, &tex, nosVec4{0.0f, 0.0f, 0.0f, 0.0f});
+
+		if (AtlasValid && text && text[0] != '\0' && fontSize > 0.0f)
+		{
+			const float outW = float(tex.Info.Texture.Width);
+			const float outH = float(tex.Info.Texture.Height);
+			const float scale = fontSize / REF_PIXEL_SIZE;
+			const float lineHeight = RefLineHeight * scale;
+			const float ascender = RefAscender * scale;
+			const float pxRange = 2.0f * float(SDF_SPREAD) * scale;
+			// The SDF only carries data within SDF_SPREAD reference pixels of the
+			// glyph edge, which bounds outline thickness and shadow softness.
+			const float effectLimit = float(SDF_SPREAD) * scale;
+			const float strokeWidth = std::clamp(strokeWidthPin, 0.0f, effectLimit);
+			const float shadowSoftness = std::clamp(shadowSoftnessPin, 0.0f, effectLimit);
+
+			// WrapWidth is in characters; 0 falls back to the texture width.
+			// The character cell width is the font's space advance, which is
+			// exact for monospace fonts and approximate for proportional ones.
+			float wrapWidth = outW;
+			if (wrapWidthChars > 0)
+			{
+				const Glyph* space = GlyphFor(' ');
+				const float charWidth = (space ? space->Advance : REF_PIXEL_SIZE * 0.6f) * scale;
+				wrapWidth = float(wrapWidthChars) * charWidth;
+			}
+
+			std::vector<Placed> placed;
+			std::vector<float> lineWidths;
+			LayoutText(text, scale, wrapWidth, placed, lineWidths);
+
+			const uint32_t numLines = uint32_t(lineWidths.size());
+			const float blockHeight = lineHeight * float(numLines);
+
+			float vBase = 0.0f;
+			if (vAlign == 1) // MIDDLE
+				vBase = (outH - blockHeight) * 0.5f;
+			else if (vAlign == 2) // BOTTOM
+				vBase = outH - blockHeight;
+			const float vOffset = vBase + position.y;
+
+			// Per-line horizontal anchor offset (alignment + position nudge).
+			std::vector<float> hOffsets(numLines);
+			for (uint32_t i = 0; i < numLines; ++i)
+			{
+				float off = 0.0f;
+				if (hAlign == 1) // CENTER
+					off = (outW - lineWidths[i]) * 0.5f;
+				else if (hAlign == 2) // RIGHT
+					off = outW - lineWidths[i];
+				hOffsets[i] = off + position.x;
+			}
+
+			// Text-block bounds for the background box, seeded from the first non-empty line (not the frame edges) so text nudged off-frame keeps a tight box.
+			float blockLeft = 0.0f, blockRight = 0.0f;
+			bool anyLine = false;
+			for (uint32_t i = 0; i < numLines; ++i)
+			{
+				if (lineWidths[i] <= 0.0f)
+					continue;
+				blockLeft = anyLine ? std::min(blockLeft, hOffsets[i]) : hOffsets[i];
+				blockRight = anyLine ? std::max(blockRight, hOffsets[i] + lineWidths[i]) : hOffsets[i] + lineWidths[i];
+				anyLine = true;
+			}
+
+			// Background box, behind everything.
+			if (anyLine && boxColor.w > 0.0f)
+				DrawBox(cmd,
+						tex,
+						outW,
+						outH,
+						blockLeft - boxPadding.x,
+						vOffset - boxPadding.y,
+						(blockRight - blockLeft) + 2.0f * boxPadding.x,
+						blockHeight + 2.0f * boxPadding.y,
+						boxColor);
+
+			auto glyphRect = [&](const Placed& gp, float& left, float& top, float& w, float& h) {
+				const Glyph& g = Glyphs[gp.GlyphIndex];
+				const float baseline = vOffset + ascender + float(gp.Line) * lineHeight;
+				left = hOffsets[gp.Line] + gp.PenX + g.BearingLeft * scale;
+				top = baseline - g.BearingTop * scale;
+				w = float(g.Width) * scale;
+				h = float(g.Height) * scale;
+			};
+			auto atlasRectOf = [&](const Placed& gp) {
+				const Glyph& g = Glyphs[gp.GlyphIndex];
+				return nosVec4{float(g.AtlasX) / float(AtlasW),
+							   float(g.AtlasY) / float(AtlasH),
+							   float(g.Width) / float(AtlasW),
+							   float(g.Height) / float(AtlasH)};
+			};
+
+			// Drop shadow: all shadows first so no glyph fill is tinted by a
+			// neighbouring glyph's shadow.
+			if (shadowColor.w > 0.0f)
+			{
+				nosVec4 noStroke{0.0f, 0.0f, 0.0f, 0.0f};
+				for (const Placed& gp : placed)
+				{
+					float left, top, w, h;
+					glyphRect(gp, left, top, w, h);
+					DrawGlyph(cmd,
+							  tex,
+							  outW,
+							  outH,
+							  left + shadowOffset.x,
+							  top + shadowOffset.y,
+							  w,
+							  h,
+							  atlasRectOf(gp),
+							  shadowColor,
+							  noStroke,
+							  0.0f,
+							  shadowSoftness,
+							  pxRange);
+				}
+			}
+
+			// Fill + outline.
+			for (const Placed& gp : placed)
+			{
+				float left, top, w, h;
+				glyphRect(gp, left, top, w, h);
+				DrawGlyph(cmd,
+						  tex,
+						  outW,
+						  outH,
+						  left,
+						  top,
+						  w,
+						  h,
+						  atlasRectOf(gp),
+						  textColor,
+						  strokeColor,
+						  strokeWidth,
+						  0.0f,
+						  pxRange);
+			}
+		}
+
+		vkss::EndCmd(cmd, NOS_FALSE, nullptr);
+		return NOS_RESULT_SUCCESS;
+	}
+};
+
+// Registers <root>/Shaders/<baseName>.frag and .vert under the given keys, both associated
+// with the TextRender node class, and returns the result of nosVulkan->RegisterShaders.
+static nosResult RegisterShaderPair(const fs::path& root, const char* baseName, nosName fragKey, nosName vertKey)
+{
+	const fs::path shaderDir = root / "Shaders";
+	const std::string fragFile = (shaderDir / (std::string(baseName) + ".frag")).generic_string(); // the infos below hold c_str() pointers
+	const std::string vertFile = (shaderDir / (std::string(baseName) + ".vert")).generic_string();
+	std::array shaderInfos = {
+		nosShaderInfo{.ShaderName = fragKey,
+					  .Source = {.Stage = NOS_SHADER_STAGE_FRAG, .GLSLPath = fragFile.c_str()},
+					  .AssociatedNodeClassName = NSN_TextRender},
+		nosShaderInfo{.ShaderName = vertKey,
+					  .Source = {.Stage = NOS_SHADER_STAGE_VERT, .GLSLPath = vertFile.c_str()},
+					  .AssociatedNodeClassName = NSN_TextRender},
+	};
+	return nosVulkan->RegisterShaders(shaderInfos.size(), shaderInfos.data());
+}
+
+nosResult RegisterTextRender(nosNodeFunctions* fn)
+{
+	NOS_BIND_NODE_CLASS(NSN_TextRender, TextRenderNode, fn);
+
+	// Shaders are registered first; the first failing pair aborts registration with its result.
+	const fs::path pluginRoot = nosEngine.Module->RootFolderPath;
+	nosResult shaderResult = RegisterShaderPair(pluginRoot, "TextGlyph", NSN_TextGlyph_Frag, NSN_TextGlyph_Vert);
+	if (shaderResult == NOS_RESULT_SUCCESS)
+		shaderResult = RegisterShaderPair(pluginRoot, "TextBox", NSN_TextBox_Frag, NSN_TextBox_Vert);
+	if (shaderResult != NOS_RESULT_SUCCESS)
+		return shaderResult;
+
+	std::array passInfos = {
+		nosPassInfo{
+			.Key = NSN_TextGlyph_Pass,
+			.Shader = NSN_TextGlyph_Frag,
+			.VertexShader = NSN_TextGlyph_Vert,
+			.MultiSample = 1,
+			.Blend = NOS_BLEND_MODE_ALPHA_BLENDING,
+		},
+		nosPassInfo{
+			.Key = NSN_TextBox_Pass,
+			.Shader = NSN_TextBox_Frag,
+			.VertexShader = NSN_TextBox_Vert,
+			.MultiSample = 1,
+			.Blend = NOS_BLEND_MODE_ALPHA_BLENDING,
+		},
+	};
+	return nosVulkan->RegisterPasses(passInfos.size(), passInfos.data());
+}
+
+} // namespace nos::utilities
diff --git a/Plugins/nosUtilities/Source/UtilitiesMain.cpp b/Plugins/nosUtilities/Source/UtilitiesMain.cpp
index c3d3e24a..ad07f07c 100644
--- a/Plugins/nosUtilities/Source/UtilitiesMain.cpp
+++ b/Plugins/nosUtilities/Source/UtilitiesMain.cpp
@@ -41,7 +41,9 @@ enum Utilities : int
 	PropagateExecution,
 	UploadBufferProvider,
 	BoundedQueue,
+	MultiBoundedQueue,
 	RingBuffer,
+	MultiRingBuffer,
 	Host,
 	DeinterlacedBoundedTextureQueue,
 	DeinterlacedBufferRing,
@@ -57,6 +59,9 @@ enum Utilities : int
 	GridOutputLayout,
 	LoadCubeLUT,
 	RepeatingJunction,
+	MultiLiveOut,
+	TextRender,
+	ScheduleRequest,
 	Count
 };
 
@@ -75,7 +80,9 @@ nosResult RegisterSink(nosNodeFunctions*);
 nosResult RegisterPropagateExecution(nosNodeFunctions*);
 nosResult RegisterUploadBufferProvider(nosNodeFunctions*);
 nosResult RegisterBoundedQueue(nosNodeFunctions*);
+nosResult RegisterMultiBoundedQueue(nosNodeFunctions*);
 nosResult RegisterRingBuffer(nosNodeFunctions*);
+nosResult RegisterMultiRingBuffer(nosNodeFunctions*);
 nosResult RegisterHost(nosNodeFunctions*);
 nosResult RegisterPin2Json(nosNodeFunctions*);
 nosResult RegisterJson2Pin(nosNodeFunctions*);
@@ -93,6 +100,9 @@ nosResult RegisterFreeOutputLayout(nosNodeFunctions*);
 nosResult RegisterGridOutputLayout(nosNodeFunctions*);
 nosResult RegisterLoadCubeLUT(nosNodeFunctions*);
 nosResult RegisterRepeatingJunction(nosNodeFunctions*);
+nosResult RegisterMultiLiveOut(nosNodeFunctions*);
+nosResult RegisterTextRender(nosNodeFunctions*);
+nosResult RegisterScheduleRequest(nosNodeFunctions*);
 
 nosResult NOSAPI_CALL ExportNodeFunctions(size_t* outSize, nosNodeFunctions** outList)
 {
@@ -129,7 +139,9 @@ nosResult NOSAPI_CALL ExportNodeFunctions(size_t* outSize, nosNodeFunctions** ou
 			GEN_CASE_NODE(PropagateExecution)
 			GEN_CASE_NODE(UploadBufferProvider)
 			GEN_CASE_NODE(BoundedQueue)
+			GEN_CASE_NODE(MultiBoundedQueue)
 			GEN_CASE_NODE(RingBuffer)
+			GEN_CASE_NODE(MultiRingBuffer)
 			GEN_CASE_NODE(Host)
 			GEN_CASE_NODE(DeinterlacedBoundedTextureQueue)
 			GEN_CASE_NODE(DeinterlacedBufferRing)
@@ -145,6 +157,9 @@ nosResult NOSAPI_CALL ExportNodeFunctions(size_t* outSize, nosNodeFunctions** ou
 			GEN_CASE_NODE(GridOutputLayout)
 			GEN_CASE_NODE(LoadCubeLUT)
 			GEN_CASE_NODE(RepeatingJunction)
+			GEN_CASE_NODE(MultiLiveOut)
+			GEN_CASE_NODE(TextRender)
+			GEN_CASE_NODE(ScheduleRequest)
 		}
 	}
 	return NOS_RESULT_SUCCESS;
@@ -163,7 +178,7 @@ NOSAPI_ATTR nosResult NOSAPI_CALL nosExportPlugin(nosPluginFunctions* out)
 		}
 		// clang-format off
 		outRenamedFrom[0] = NOS_NAME("nos.fb.ChannelViewerChannels"); outRenamedTo[0] = NOS_NAME("nos.utilities.ChannelViewerChannels");
-		outRenamedFrom[1] = NOS_NAME("nos.fb.ChannelViewerFormats"); outRenamedTo[1] = NOS_NAME("nos.utilities.ChannelViewerFormats");
+		outRenamedFrom[1] = NOS_NAME("nos.fb.ChannelViewerFormats"); outRenamedTo[1] = NOS_NAME("nos.mediaio.ColorSpace");
 		outRenamedFrom[2] = NOS_NAME("nos.fb.GradientKind"); outRenamedTo[2] = NOS_NAME("nos.utilities.GradientKind");
 		outRenamedFrom[3] = NOS_NAME("nos.fb.BlendMode"); outRenamedTo[3] = NOS_NAME("nos.utilities.BlendMode");
 		outRenamedFrom[4] = NOS_NAME("nos.fb.ResizeMethod"); outRenamedTo[4] = NOS_NAME("nos.utilities.ResizeMethod");
diff --git a/Plugins/nosUtilities/Utilities.noscfg b/Plugins/nosUtilities/Utilities.noscfg
index 79883ae9..50864c54 100644
--- a/Plugins/nosUtilities/Utilities.noscfg
+++ b/Plugins/nosUtilities/Utilities.noscfg
@@ -2,7 +2,7 @@
 	"info": {
 		"id": {
 			"name": "nos.utilities",
-			"version": "3.14.8"
+			"version": "3.15.0"
 		},
 		"description": "Various utility nodes.",
 		"display_name": "Utilities",
@@ -43,7 +43,9 @@
 		"Config/UploadBufferProvider.nosdef",
 		"Config/TimedFunctionSignaller.nosdef",
 		"Config/RingBuffer.nosdef",
+		"Config/MultiRingBuffer.nosdef",
 		"Config/BoundedQueue.nosdef",
+		"Config/MultiBoundedQueue.nosdef",
 		"Config/Host.nosdef",
 		"Config/AutoResize.nosdef",
 		"Config/ExecDepend.nosdef",
@@ -63,7 +65,10 @@
 		"Config/CalculateDispatchSize.nosdef",
 		"Config/YADIF.nosdef",
 		"Config/YADIFWithAutoDispatchSize.nosdef",
-		"Config/RepeatingJunction.nosdef"
+		"Config/RepeatingJunction.nosdef",
+		"Config/MultiLiveOut.nosdef",
+		"Config/TextRender.nosdef",
+		"Config/ScheduleRequest.nosdef"
 	],
 	"custom_types": [
 		"Config/Merge.fbs",
@@ -73,7 +78,8 @@
 		"Config/TextureSwitcher.fbs",
 		"Config/ChannelViewer.fbs",
 		"Config/Sink.fbs",
-		"Config/Layout.fbs"
+		"Config/Layout.fbs",
+		"Config/TextRender.fbs"
 	],
 	"defaults": [
 		"Config/Defaults.json"
diff --git a/Subsystems/nosTrackSubsystem/Config/Track.fbs b/Subsystems/nosTrackSubsystem/Config/Track.fbs
index e1dcce23..f36f2818 100644
--- a/Subsystems/nosTrackSubsystem/Config/Track.fbs
+++ b/Subsystems/nosTrackSubsystem/Config/Track.fbs
@@ -42,3 +42,18 @@ enum RotationSystem : uint {
   RPT = 4,
   PRT = 5,
 }
+
+// World coordinate frame convention used by a Track endpoint. Encodes axis
+// assignments to world-semantic directions (forward, right, up), the implied
+// handedness, and the Euler convention for the Track.rotation field (degrees; see EulerToMat in CoordinateFrameConv.h).
+enum CoordinateFrame : ubyte {
+    // Left-handed, Z-up. +X forward, +Y right, +Z up.
+    // Rotation: rot.x = roll (X), rot.y = pitch (Y), rot.z = yaw (Z),
+    // intrinsic ZYX => R = Rz(yaw) * Ry(pitch) * Rx(roll). Pitch and roll follow this frame's own sign convention; EulerToMat negates both when it uses standard right-handed formulas.
+    LH_ZUp_FwdX_RightY = 0,
+
+    // Right-handed, Y-up. +X right, +Y up, -Z forward.
+    // Rotation: rot.x = pitch (X), rot.y = yaw (Y), rot.z = roll (Z),
+    // intrinsic YXZ => R = Ry(yaw) * Rx(pitch) * Rz(roll).
+    RH_YUp_FwdNegZ_RightX = 1,
+}
diff --git a/Subsystems/nosTrackSubsystem/Include/nosSysTrack/CoordinateFrameConv.h b/Subsystems/nosTrackSubsystem/Include/nosSysTrack/CoordinateFrameConv.h
new file mode 100644
index 00000000..76c35186
--- /dev/null
+++ b/Subsystems/nosTrackSubsystem/Include/nosSysTrack/CoordinateFrameConv.h
@@ -0,0 +1,106 @@
+// Copyright MediaZ Teknoloji A.S. All Rights Reserved.
+// Frame-conversion helpers for nos.sys.track.CoordinateFrame, shared by the
+// Track nodes (TrackTransform / RecordTrackCOLMAP / PlaybackTrackCOLMAP /
+// ConvertTransform) and by transform producers such as nos.geometry's FBX
+// reader. Encodes per-frame Euler conventions and basis-change matrices to the
+// COLMAP camera/world frame.
+#pragma once
+
+#include <nosSysTrack/Track_generated.h>
+
+#ifndef GLM_ENABLE_EXPERIMENTAL
+#define GLM_ENABLE_EXPERIMENTAL
+#endif
+#include <glm/glm.hpp>
+#include <glm/gtx/euler_angles.hpp>
+
+namespace nos::track::convention
+{
+
+using Frame = sys::track::CoordinateFrame;
+
+// Basis matrix S for a CoordinateFrame: maps semantic (forward, right, up)
+// to engine coords (vx, vy, vz). v_engine = S * (forward, right, up).
+// det(S) > 0 for left-handed frames, < 0 for right-handed (with this ordering).
+inline glm::dmat3 BasisMatrix(Frame frame)
+{
+	switch (frame)
+	{
+	case Frame::LH_ZUp_FwdX_RightY:
+		// vx = forward, vy = right, vz = up.
+		return glm::dmat3(1.0);
+	case Frame::RH_YUp_FwdNegZ_RightX:
+		// vx = right, vy = up, vz = -forward.
+		return glm::dmat3(
+			glm::dvec3( 0.0,  0.0, -1.0),  // column 0 = S * (1,0,0): forward maps to -Z
+			glm::dvec3( 1.0,  0.0,  0.0),  // column 1 = S * (0,1,0): right maps to +X
+			glm::dvec3( 0.0,  1.0,  0.0)); // column 2 = S * (0,0,1): up maps to +Y
+	}
+	return glm::dmat3(1.0); // values not listed in the switch fall back to identity
+}
+
+// COLMAP camera/world frame: X right, Y down, Z forward (RH).
+// Provided as a basis matrix in the same (forward, right, up) convention so
+// it can be combined with BasisMatrix to build cross-frame conversions.
+inline glm::dmat3 ColmapBasisMatrix()
+{
+	return glm::dmat3(
+		glm::dvec3( 0.0,  0.0,  1.0),  // column 0: forward -> +Z
+		glm::dvec3( 1.0,  0.0,  0.0),  // column 1: right -> +X
+		glm::dvec3( 0.0, -1.0,  0.0)); // column 2: up -> -Y (Y is down)
+}
+
+// Build R_c2w in `frame` from Track.rotation Euler degrees (degRot uses that frame's rot.x/rot.y/rot.z layout).
+inline glm::dmat3 EulerToMat(Frame frame, glm::dvec3 const& degRot)
+{
+	glm::dvec3 r = glm::radians(degRot);
+	switch (frame)
+	{
+	case Frame::LH_ZUp_FwdX_RightY:
+		// FRotator: rot.x = roll, rot.y = pitch, rot.z = yaw, intrinsic ZYX.
+		// UE sign convention has +pitch = look up and +roll = bank right via
+		// LH-rule rotations, equivalent to standard-RH Rz(yaw) * Ry(-pitch) * Rx(-roll).
+		return glm::dmat3(glm::eulerAngleZYX<double>(r.z, -r.y, -r.x));
+	case Frame::RH_YUp_FwdNegZ_RightX:
+		// rot.x = pitch, rot.y = yaw, rot.z = roll, intrinsic YXZ:
+		// R = Ry(yaw) * Rx(pitch) * Rz(roll), all standard-RH formulas.
+		return glm::dmat3(glm::eulerAngleYXZ<double>(r.y, r.x, r.z));
+	}
+	return glm::dmat3(1.0); // values not listed in the switch yield the identity rotation
+}
+
+// Inverse of EulerToMat: extract Euler angles, in degrees, in `frame`'s convention.
+// Output is packed into the (rot.x, rot.y, rot.z) Track layout for that frame.
+inline glm::dvec3 MatToEuler(Frame frame, glm::dmat3 const& R)
+{
+	glm::dmat4 M(R); // the glm extract helpers below are fed a 4x4 matrix
+	double a = 0.0, b = 0.0, c = 0.0;
+	switch (frame)
+	{
+	case Frame::LH_ZUp_FwdX_RightY:
+		glm::extractEulerAngleZYX(M, a, b, c);  // a=yaw, b=-pitch, c=-roll (EulerToMat negated pitch and roll)
+		// Negate pitch and roll back to UE sign convention; pack as (roll, pitch, yaw).
+		return glm::degrees(glm::dvec3(-c, -b, a));
+	case Frame::RH_YUp_FwdNegZ_RightX:
+		glm::extractEulerAngleYXZ(M, a, b, c);  // a=yaw, b=pitch, c=roll
+		// Pack as (pitch, yaw, roll).
+		return glm::degrees(glm::dvec3(b, a, c));
+	}
+	return glm::dvec3(0.0); // values not listed in the switch yield zero angles
+}
+
+// Basis-change M from `frame` to COLMAP frame: M = S_colmap * S_frame^-1.
+// For a vector:           v_colmap = M * v_frame.
+// For a rotation matrix:  R_colmap = M * R_frame * M^-1.
+inline glm::dmat3 BasisChangeToColmap(Frame frame)
+{
+	return ColmapBasisMatrix() * glm::inverse(BasisMatrix(frame)); // frame coords -> semantic (fwd, right, up) -> COLMAP coords
+}
+
+// Inverse of BasisChangeToColmap: M^-1 = S_frame * S_colmap^-1, so v_frame = M^-1 * v_colmap.
+inline glm::dmat3 BasisChangeFromColmap(Frame frame)
+{
+	return BasisMatrix(frame) * glm::inverse(ColmapBasisMatrix()); // COLMAP coords -> semantic (fwd, right, up) -> frame coords
+}
+
+}  // namespace nos::track::convention
diff --git a/Subsystems/nosTrackSubsystem/nosTrackSubsystem.nossys b/Subsystems/nosTrackSubsystem/nosTrackSubsystem.nossys
index d2f6b9cb..625fd3fe 100644
--- a/Subsystems/nosTrackSubsystem/nosTrackSubsystem.nossys
+++ b/Subsystems/nosTrackSubsystem/nosTrackSubsystem.nossys
@@ -2,7 +2,7 @@
 	"info": {
 		"id": {
 			"name": "nos.sys.track",
-			"version": "1.0.0"
+			"version": "1.1.0"
 		},
 		"display_name": "Track Subsystem",
 		"dependencies": [