Asset API updates, parallel blake3, inline AABB extender, IO policies, runtime tuning, mesh loaders & writers by AnastaZIuk · Pull Request #1000 · Devsh-Graphics-Programming/Nabla

AnastaZIuk · 2026-02-14T06:54:51Z

No description provided.

devshgraphicsprogramming · 2026-02-17T16:11:57Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+double stlNormalizeColorComponentToUnit(double value)
+{
+	if (!std::isfinite(value))
+		return 0.0;
+	if (value > 1.0)
+		value /= 255.0;
+	return std::clamp(value, 0.0, 1.0);
+}

-	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, "endsolid ", context->fileOffset, 9);
+uint16_t stlPackViscamColorFromB8G8R8A8(const uint32_t color)
+{
+	const void* src[4] = { &color, nullptr, nullptr, nullptr };
+	uint16_t packed = 0u;
+	convertColor<EF_B8G8R8A8_UNORM, EF_A1R5G5B5_UNORM_PACK16>(src, &packed, 0u, 0u);
+	packed |= 0x8000u;
+	return packed;
+}

-		context->fileOffset += success.getBytesProcessed();
-	}
+const ICPUPolygonGeometry::SDataView* stlFindColorView(const ICPUPolygonGeometry* geom, const size_t vertexCount)
+{
+	if (!geom)
+		return nullptr;

+	const auto& auxViews = geom->getAuxAttributeViews();
+	const ICPUPolygonGeometry::SDataView* fallback = nullptr;
+	for (const auto& view : auxViews)
 	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, headerTxt, context->fileOffset, sizeof(headerTxt) - 1);
-
-		context->fileOffset += success.getBytesProcessed();
+		if (!view || view.getElementCount() != vertexCount)
+			continue;
+		const uint32_t channels = getFormatChannelCount(view.composed.format);
+		if (channels < 3u)
+			continue;
+		if (view.composed.format == EF_B8G8R8A8_UNORM)
+			return &view;
+		if (!fallback)
+			fallback = &view;
 	}
+	return fallback;
+}

+bool stlDecodeColorB8G8R8A8(const ICPUPolygonGeometry::SDataView& colorView, const uint32_t ix, uint32_t& outColor)
+{
+	if (colorView.composed.format == EF_B8G8R8A8_UNORM && colorView.composed.getStride() == sizeof(uint32_t))
 	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, name.c_str(), context->fileOffset, name.size());
-
-		context->fileOffset += success.getBytesProcessed();
+		const auto* const ptr = reinterpret_cast<const uint8_t*>(colorView.getPointer());
+		if (!ptr)
+			return false;
+		std::memcpy(&outColor, ptr + static_cast<size_t>(ix) * sizeof(uint32_t), sizeof(outColor));
+		return true;
 	}

+	hlsl::float64_t4 decoded = {};
+	if (!colorView.decodeElement(ix, decoded))
+		return false;
+	const double rgbaUnit[4] = {
+		stlNormalizeColorComponentToUnit(decoded.x),
+		stlNormalizeColorComponentToUnit(decoded.y),
+		stlNormalizeColorComponentToUnit(decoded.z),
+		stlNormalizeColorComponentToUnit(decoded.w)
+	};
+	encodePixels<EF_B8G8R8A8_UNORM, double>(&outColor, rgbaUnit);
 	return true;
 }

-void CSTLMeshWriter::getVectorAsStringLine(const core::vectorSIMDf& v, std::string& s) const
+void stlDecodeColorUnitRGBAFromB8G8R8A8(const uint32_t color, double (&out)[4])
 {
-    std::ostringstream tmp;
-    tmp << v.X << " " << v.Y << " " << v.Z << "\n";
-    s = std::string(tmp.str().c_str());
+	const void* src[4] = { &color, nullptr, nullptr, nullptr };
+	decodePixels<EF_B8G8R8A8_UNORM, double>(src, out, 0u, 0u);
 }

-void CSTLMeshWriter::writeFaceText(
-		const core::vectorSIMDf& v1,
-		const core::vectorSIMDf& v2,
-		const core::vectorSIMDf& v3,
-		SContext* context)
+bool writeMeshBinary(const asset::ICPUPolygonGeometry* geom, SContext* context)
 {
-	core::vectorSIMDf vertex1 = v3;
-	core::vectorSIMDf vertex2 = v2;
-	core::vectorSIMDf vertex3 = v1;
-	core::vectorSIMDf normal = core::plane3dSIMDf(vertex1, vertex2, vertex3).getNormal();
-	std::string tmp;
+	if (!geom || !context || !context->writeContext.outputFile)
+		return false;

-	auto flipVectors = [&]()
-	{
-		vertex1.X = -vertex1.X;
-		vertex2.X = -vertex2.X;
-		vertex3.X = -vertex3.X;
-		normal = core::plane3dSIMDf(vertex1, vertex2, vertex3).getNormal();
-	};
-
-	if (!(context->writeContext.params.flags & E_WRITER_FLAGS::EWF_MESH_IS_RIGHT_HANDED))
-		flipVectors();
-
-	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, "facet normal ", context->fileOffset, 13);
+	const auto& posView = geom->getPositionView();
+	if (!posView)
+		return false;

-		context->fileOffset += success.getBytesProcessed();
-	}
+	const bool flipHandedness = !(context->writeContext.params.flags & E_WRITER_FLAGS::EWF_MESH_IS_RIGHT_HANDED);
+	const size_t vertexCount = posView.getElementCount();
+	if (vertexCount == 0ull)
+		return false;

-	getVectorAsStringLine(normal, tmp);
+	core::vector<uint32_t> indexData;
+	const uint32_t* indices = nullptr;
+	uint32_t facenum = 0u;
+	if (!decodeTriangleIndices(geom, posView, indexData, indices, facenum))
+		return false;

-	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, tmp.c_str(), context->fileOffset, tmp.size());
+	const size_t outputSize = stl_writer_detail::BinaryPrefixBytes + static_cast<size_t>(facenum) * stl_writer_detail::BinaryTriangleRecordBytes;
+	std::unique_ptr<uint8_t[]> output(new (std::nothrow) uint8_t[outputSize]);
+	if (!output)
+		return false;
+	uint8_t* dst = output.get();

-		context->fileOffset += success.getBytesProcessed();
-	}
+	std::memset(dst, 0, stl_writer_detail::BinaryHeaderBytes);
+	dst += stl_writer_detail::BinaryHeaderBytes;
+
+	std::memcpy(dst, &facenum, sizeof(facenum));
+	dst += sizeof(facenum);
+
+	const auto& normalView = geom->getNormalView();
+	const bool hasNormals = static_cast<bool>(normalView);
+	const auto* const colorView = stlFindColorView(geom, vertexCount);
+	const hlsl::float32_t3* const tightPositions = getTightFloat3View(posView);
+	const hlsl::float32_t3* const tightNormals = hasNormals ? getTightFloat3View(normalView) : nullptr;
+	const float handednessSign = flipHandedness ? -1.f : 1.f;

+	auto decodePosition = [&](const uint32_t ix, hlsl::float32_t3& out)->bool
 	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, "  outer loop\n", context->fileOffset, 13);
+		if (tightPositions)
+		{
+			out = tightPositions[ix];
+			return true;
+		}
+		return posView.decodeElement(ix, out);
+	};

-		context->fileOffset += success.getBytesProcessed();
-	}
+	auto decodeNormal = [&](const uint32_t ix, hlsl::float32_t3& out)->bool
+	{
+		if (!hasNormals)
+			return false;
+		if (tightNormals)
+		{
+			out = tightNormals[ix];
+			return true;
+		}
+		return normalView.decodeElement(ix, out);
+	};
+	auto computeFaceColor = [&](const uint32_t i0, const uint32_t i1, const uint32_t i2, uint16_t& outColor)->bool
+	{
+		outColor = 0u;
+		if (!colorView)
+			return true;
+		uint32_t c0 = 0u, c1 = 0u, c2 = 0u;
+		if (!stlDecodeColorB8G8R8A8(*colorView, i0, c0))
+			return false;
+		if (!stlDecodeColorB8G8R8A8(*colorView, i1, c1))
+			return false;
+		if (!stlDecodeColorB8G8R8A8(*colorView, i2, c2))
+			return false;
+		double rgba0[4] = {};
+		double rgba1[4] = {};
+		double rgba2[4] = {};
+		stlDecodeColorUnitRGBAFromB8G8R8A8(c0, rgba0);
+		stlDecodeColorUnitRGBAFromB8G8R8A8(c1, rgba1);
+		stlDecodeColorUnitRGBAFromB8G8R8A8(c2, rgba2);
+		const double rgbaAvg[4] = {
+			(rgba0[0] + rgba1[0] + rgba2[0]) / 3.0,
+			(rgba0[1] + rgba1[1] + rgba2[1]) / 3.0,
+			(rgba0[2] + rgba1[2] + rgba2[2]) / 3.0,
+			1.0
+		};
+		uint32_t avgColor = 0u;
+		encodePixels<EF_B8G8R8A8_UNORM, double>(&avgColor, rgbaAvg);
+		outColor = stlPackViscamColorFromB8G8R8A8(avgColor);
+		return true;
+	};
+	auto writeRecord = [&dst](const float nx, const float ny, const float nz, const float v1x, const float v1y, const float v1z, const float v2x, const float v2y, const float v2z, const float v3x, const float v3y, const float v3z, const uint16_t attribute)->void
+	{
+		const float payload[stl_writer_detail::BinaryTriangleFloatCount] = {
+			nx, ny, nz,
+			v1x, v1y, v1z,
+			v2x, v2y, v2z,
+			v3x, v3y, v3z
+		};
+		std::memcpy(dst, payload, stl_writer_detail::BinaryTriangleFloatBytes);
+		dst += stl_writer_detail::BinaryTriangleFloatBytes;
+		std::memcpy(dst, &attribute, stl_writer_detail::BinaryTriangleAttributeBytes);
+		dst += stl_writer_detail::BinaryTriangleAttributeBytes;
+	};

+	const bool hasFastTightPath = (indices == nullptr) && (tightPositions != nullptr) && (!hasNormals || (tightNormals != nullptr));
+	if (hasFastTightPath && hasNormals)
 	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, "    vertex ", context->fileOffset, 11);
+		bool allFastNormalsNonZero = true;
+		const size_t normalCount = static_cast<size_t>(facenum) * 3ull;
+		for (size_t i = 0ull; i < normalCount; ++i)
+		{
+			const auto& n = tightNormals[i];
+			if (n.x == 0.f && n.y == 0.f && n.z == 0.f)
+			{
+				allFastNormalsNonZero = false;
+				break;
+			}
+		}

-		context->fileOffset += success.getBytesProcessed();
+		const hlsl::float32_t3* posTri = tightPositions;
+		const hlsl::float32_t3* nrmTri = tightNormals;
+		if (allFastNormalsNonZero)
+		{
+			for (uint32_t primIx = 0u; primIx < facenum; ++primIx, posTri += 3u, nrmTri += 3u)
+			{
+				uint16_t faceColor = 0u;
+				if (!computeFaceColor(primIx * 3u + 0u, primIx * 3u + 1u, primIx * 3u + 2u, faceColor))
+					return false;
+
+				const hlsl::float32_t3 vertex1 = posTri[2u];
+				const hlsl::float32_t3 vertex2 = posTri[1u];
+				const hlsl::float32_t3 vertex3 = posTri[0u];
+				const float vertex1x = vertex1.x * handednessSign;
+				const float vertex2x = vertex2.x * handednessSign;
+				const float vertex3x = vertex3.x * handednessSign;
+
+				hlsl::float32_t3 attrNormal = nrmTri[0u];
+				if (flipHandedness)
+					attrNormal.x = -attrNormal.x;
+
+				writeRecord(
+					attrNormal.x, attrNormal.y, attrNormal.z,
+					vertex1x, vertex1.y, vertex1.z,
+					vertex2x, vertex2.y, vertex2.z,
+					vertex3x, vertex3.y, vertex3.z,
+					faceColor);
+			}
+		}
+		else
+		{
+			for (uint32_t primIx = 0u; primIx < facenum; ++primIx, posTri += 3u, nrmTri += 3u)
+			{
+				uint16_t faceColor = 0u;
+				if (!computeFaceColor(primIx * 3u + 0u, primIx * 3u + 1u, primIx * 3u + 2u, faceColor))
+					return false;
+
+				const hlsl::float32_t3 vertex1 = posTri[2u];
+				const hlsl::float32_t3 vertex2 = posTri[1u];
+				const hlsl::float32_t3 vertex3 = posTri[0u];
+				const float vertex1x = vertex1.x * handednessSign;
+				const float vertex2x = vertex2.x * handednessSign;
+				const float vertex3x = vertex3.x * handednessSign;
+
+				float normalX = 0.f;
+				float normalY = 0.f;
+				float normalZ = 0.f;
+				hlsl::float32_t3 attrNormal = nrmTri[0u];
+				if (attrNormal.x == 0.f && attrNormal.y == 0.f && attrNormal.z == 0.f)
+					attrNormal = nrmTri[1u];
+				if (attrNormal.x == 0.f && attrNormal.y == 0.f && attrNormal.z == 0.f)
+					attrNormal = nrmTri[2u];
+				if (!(attrNormal.x == 0.f && attrNormal.y == 0.f && attrNormal.z == 0.f))
+				{
+					if (flipHandedness)
+						attrNormal.x = -attrNormal.x;
+					normalX = attrNormal.x;
+					normalY = attrNormal.y;
+					normalZ = attrNormal.z;
+				}
+
+				if (normalX == 0.f && normalY == 0.f && normalZ == 0.f)
+				{
+					const float edge21x = vertex2x - vertex1x;
+					const float edge21y = vertex2.y - vertex1.y;
+					const float edge21z = vertex2.z - vertex1.z;
+					const float edge31x = vertex3x - vertex1x;
+					const float edge31y = vertex3.y - vertex1.y;
+					const float edge31z = vertex3.z - vertex1.z;
+
+					normalX = edge21y * edge31z - edge21z * edge31y;
+					normalY = edge21z * edge31x - edge21x * edge31z;
+					normalZ = edge21x * edge31y - edge21y * edge31x;
+					const float planeNormalLen2 = normalX * normalX + normalY * normalY + normalZ * normalZ;
+					if (planeNormalLen2 > 0.f)
+					{
+						const float invLen = 1.f / std::sqrt(planeNormalLen2);
+						normalX *= invLen;
+						normalY *= invLen;
+						normalZ *= invLen;
+					}
+				}
+
+				writeRecord(
+					normalX, normalY, normalZ,
+					vertex1x, vertex1.y, vertex1.z,
+					vertex2x, vertex2.y, vertex2.z,
+					vertex3x, vertex3.y, vertex3.z,
+					faceColor);
+			}
+		}
+	}
+	else if (hasFastTightPath)
+	{
+		const hlsl::float32_t3* posTri = tightPositions;
+		for (uint32_t primIx = 0u; primIx < facenum; ++primIx, posTri += 3u)
+		{
+			uint16_t faceColor = 0u;
+			if (!computeFaceColor(primIx * 3u + 0u, primIx * 3u + 1u, primIx * 3u + 2u, faceColor))
+				return false;
+
+			const hlsl::float32_t3 vertex1 = posTri[2u];
+			const hlsl::float32_t3 vertex2 = posTri[1u];
+			const hlsl::float32_t3 vertex3 = posTri[0u];
+			const float vertex1x = vertex1.x * handednessSign;
+			const float vertex2x = vertex2.x * handednessSign;
+			const float vertex3x = vertex3.x * handednessSign;
+
+			const float edge21x = vertex2x - vertex1x;
+			const float edge21y = vertex2.y - vertex1.y;
+			const float edge21z = vertex2.z - vertex1.z;
+			const float edge31x = vertex3x - vertex1x;
+			const float edge31y = vertex3.y - vertex1.y;
+			const float edge31z = vertex3.z - vertex1.z;
+
+			float normalX = edge21y * edge31z - edge21z * edge31y;
+			float normalY = edge21z * edge31x - edge21x * edge31z;
+			float normalZ = edge21x * edge31y - edge21y * edge31x;
+			const float planeNormalLen2 = normalX * normalX + normalY * normalY + normalZ * normalZ;
+			if (planeNormalLen2 > 0.f)
+			{
+				const float invLen = 1.f / std::sqrt(planeNormalLen2);
+				normalX *= invLen;
+				normalY *= invLen;
+				normalZ *= invLen;
+			}
+
+			writeRecord(
+				normalX, normalY, normalZ,
+				vertex1x, vertex1.y, vertex1.z,
+				vertex2x, vertex2.y, vertex2.z,
+				vertex3x, vertex3.y, vertex3.z,
+				faceColor);
+		}
+	}
+	else
+	{
+		for (uint32_t primIx = 0u; primIx < facenum; ++primIx)
+		{
+			const uint32_t i0 = indices ? indices[primIx * 3u + 0u] : (primIx * 3u + 0u);
+			const uint32_t i1 = indices ? indices[primIx * 3u + 1u] : (primIx * 3u + 1u);
+			const uint32_t i2 = indices ? indices[primIx * 3u + 2u] : (primIx * 3u + 2u);
+			if (i0 >= vertexCount || i1 >= vertexCount || i2 >= vertexCount)
+				return false;
+			uint16_t faceColor = 0u;
+			if (!computeFaceColor(i0, i1, i2, faceColor))
+				return false;
+
+			hlsl::float32_t3 p0 = {};
+			hlsl::float32_t3 p1 = {};
+			hlsl::float32_t3 p2 = {};
+			if (!decodePosition(i0, p0) || !decodePosition(i1, p1) || !decodePosition(i2, p2))
+				return false;
+
+			hlsl::float32_t3 vertex1 = p2;
+			hlsl::float32_t3 vertex2 = p1;
+			hlsl::float32_t3 vertex3 = p0;
+
+			if (flipHandedness)
+			{
+				vertex1.x = -vertex1.x;
+				vertex2.x = -vertex2.x;
+				vertex3.x = -vertex3.x;
+			}
+
+			const hlsl::float32_t3 planeNormal = hlsl::cross(vertex2 - vertex1, vertex3 - vertex1);
+			const float planeNormalLen2 = hlsl::dot(planeNormal, planeNormal);
+			hlsl::float32_t3 normal = hlsl::float32_t3(0.f, 0.f, 0.f);
+			if (!hasNormals)
+			{
+				if (planeNormalLen2 > 0.f)
+					normal = hlsl::normalize(planeNormal);
+			}
+
+			if (hasNormals)
+			{
+				hlsl::float32_t3 n0 = {};
+				if (!decodeNormal(i0, n0))
+					return false;
+
+				hlsl::float32_t3 attrNormal = n0;
+				if (hlsl::dot(attrNormal, attrNormal) <= 0.f)
+				{
+					hlsl::float32_t3 n1 = {};
+					if (!decodeNormal(i1, n1))
+						return false;
+					attrNormal = n1;
+				}
+				if (hlsl::dot(attrNormal, attrNormal) <= 0.f)
+				{
+					hlsl::float32_t3 n2 = {};
+					if (!decodeNormal(i2, n2))
+						return false;
+					attrNormal = n2;
+				}
+
+				if (hlsl::dot(attrNormal, attrNormal) > 0.f)
+				{
+					if (flipHandedness)
+						attrNormal.x = -attrNormal.x;
+					if (planeNormalLen2 > 0.f && hlsl::dot(attrNormal, planeNormal) < 0.f)
+						attrNormal = -attrNormal;
+					normal = attrNormal;
+				}
+				else if (planeNormalLen2 > 0.f)
+				{
+					normal = hlsl::normalize(planeNormal);
+				}
+			}
+
+			writeRecord(
+				normal.x, normal.y, normal.z,
+				vertex1.x, vertex1.y, vertex1.z,
+				vertex2.x, vertex2.y, vertex2.z,
+				vertex3.x, vertex3.y, vertex3.z,
+				faceColor);
+		}
 	}

-	getVectorAsStringLine(vertex1, tmp);
+	const bool writeOk = writeFileWithPolicy(context->writeContext.outputFile, context->ioPlan, output.get(), outputSize, &context->writeTelemetry);
+	if (writeOk)
+		context->fileOffset += outputSize;
+	return writeOk;
+}

-	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, tmp.c_str(), context->fileOffset, tmp.size());
+bool writeMeshASCII(const asset::ICPUPolygonGeometry* geom, SContext* context)
+{
+	if (!geom)
+		return false;

-		context->fileOffset += success.getBytesProcessed();
-	}
+	const auto* indexing = geom->getIndexingCallback();
+	if (!indexing || indexing->degree() != 3u)
+		return false;

-	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, "    vertex ", context->fileOffset, 11);
+	const auto& posView = geom->getPositionView();
+	if (!posView)
+		return false;
+	const auto& normalView = geom->getNormalView();
+	const bool flipHandedness = !(context->writeContext.params.flags & E_WRITER_FLAGS::EWF_MESH_IS_RIGHT_HANDED);

-		context->fileOffset += success.getBytesProcessed();
-	}
+	const std::string name = context->writeContext.outputFile->getFileName().filename().replace_extension().string();
+	const std::string_view solidName = name.empty() ? std::string_view(stl_writer_detail::AsciiDefaultName) : std::string_view(name);

-	getVectorAsStringLine(vertex2, tmp);
+	if (!writeBytes(context, stl_writer_detail::AsciiSolidPrefix, sizeof(stl_writer_detail::AsciiSolidPrefix) - 1ull))
+		return false;

-	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, tmp.c_str(), context->fileOffset, tmp.size());
+	if (!writeBytes(context, solidName.data(), solidName.size()))
+		return false;

-		context->fileOffset += success.getBytesProcessed();
-	}
+	if (!writeBytes(context, "\n", sizeof("\n") - 1ull))
+		return false;

+	const uint32_t faceCount = static_cast<uint32_t>(geom->getPrimitiveCount());
+	for (uint32_t primIx = 0u; primIx < faceCount; ++primIx)
 	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, "    vertex ", context->fileOffset, 11);
-
-		context->fileOffset += success.getBytesProcessed();
+		core::vectorSIMDf v0;
+		core::vectorSIMDf v1;
+		core::vectorSIMDf v2;
+		uint32_t idx[3] = {};
+		if (!decodeTriangle(geom, indexing, posView, primIx, v0, v1, v2, idx))
+			return false;
+		if (!writeFaceText(v0, v1, v2, idx, normalView, flipHandedness, context))
+			return false;
+		if (!writeBytes(context, "\n", sizeof("\n") - 1ull))
+			return false;
 	}

-	getVectorAsStringLine(vertex3, tmp);
+	if (!writeBytes(context, stl_writer_detail::AsciiEndSolidPrefix, sizeof(stl_writer_detail::AsciiEndSolidPrefix) - 1ull))
+		return false;

-	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, tmp.c_str(), context->fileOffset, tmp.size());
+	if (!writeBytes(context, solidName.data(), solidName.size()))
+		return false;

-		context->fileOffset += success.getBytesProcessed();
-	}
+	return true;
+}

-	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, "  endloop\n", context->fileOffset, 10);
+bool writeFaceText(
+		const core::vectorSIMDf& v1,
+		const core::vectorSIMDf& v2,
+		const core::vectorSIMDf& v3,
+		const uint32_t* idx,
+		const asset::ICPUPolygonGeometry::SDataView& normalView,
+		const bool flipHandedness,
+		SContext* context)
+{
+	core::vectorSIMDf vertex1 = v3;
+	core::vectorSIMDf vertex2 = v2;
+	core::vectorSIMDf vertex3 = v1;

-		context->fileOffset += success.getBytesProcessed();
+	if (flipHandedness)
+	{
+		vertex1.X = -vertex1.X;
+		vertex2.X = -vertex2.X;
+		vertex3.X = -vertex3.X;
 	}

+	core::vectorSIMDf normal = core::plane3dSIMDf(vertex1, vertex2, vertex3).getNormal();
+	core::vectorSIMDf attrNormal;
+	if (decodeTriangleNormal(normalView, idx, attrNormal))
 	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, "endfacet\n", context->fileOffset, 9);
-
-		context->fileOffset += success.getBytesProcessed();
+		if (flipHandedness)
+			attrNormal.X = -attrNormal.X;
+		if (core::dot(attrNormal, normal).X < 0.f)
+			attrNormal = -attrNormal;
+		normal = attrNormal;
 	}
+
+	std::array<char, stl_writer_detail::AsciiFaceTextMaxBytes> faceText = {};
+	char* cursor = faceText.data();
+	char* const end = faceText.data() + faceText.size();
+	if (!appendLiteral(cursor, end, "facet normal ", sizeof("facet normal ") - 1ull))
+		return false;
+	if (!appendVectorAsAsciiLine(cursor, end, normal))
+		return false;
+	if (!appendLiteral(cursor, end, "  outer loop\n", sizeof("  outer loop\n") - 1ull))
+		return false;
+	if (!appendLiteral(cursor, end, "    vertex ", sizeof("    vertex ") - 1ull))
+		return false;
+	if (!appendVectorAsAsciiLine(cursor, end, vertex1))
+		return false;
+	if (!appendLiteral(cursor, end, "    vertex ", sizeof("    vertex ") - 1ull))
+		return false;
+	if (!appendVectorAsAsciiLine(cursor, end, vertex2))
+		return false;
+	if (!appendLiteral(cursor, end, "    vertex ", sizeof("    vertex ") - 1ull))
+		return false;
+	if (!appendVectorAsAsciiLine(cursor, end, vertex3))
+		return false;
+	if (!appendLiteral(cursor, end, "  endloop\n", sizeof("  endloop\n") - 1ull))
+		return false;
+	if (!appendLiteral(cursor, end, "endfacet\n", sizeof("endfacet\n") - 1ull))
+		return false;
+
+	return writeBytes(context, faceText.data(), static_cast<size_t>(cursor - faceText.data()));
+}
+
 }


Fun fact: when dealing with mesh LDR colors, they're supposed to be sRGB.

Whenever they were UNORM before, that was wrong,

at least when the semantics were clear that they were RGB per-vertex colors.

devshgraphicsprogramming · 2026-02-17T16:13:17Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+	core::vector<uint32_t> indexData;
+	const uint32_t* indices = nullptr;
+	uint32_t facenum = 0u;
+	if (!decodeTriangleIndices(geom, posView, indexData, indices, facenum))
+		return false;


Make this a common utility for all polygon geometry writers?

devshgraphicsprogramming · 2026-02-17T16:14:44Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+	const size_t outputSize = stl_writer_detail::BinaryPrefixBytes + static_cast<size_t>(facenum) * stl_writer_detail::BinaryTriangleRecordBytes;
+	std::unique_ptr<uint8_t[]> output(new (std::nothrow) uint8_t[outputSize]);
+	if (!output)
+		return false;
+	uint8_t* dst = output.get();


Does allocating this separate output buffer make sense if the output file is memory-mapped anyway?

devshgraphicsprogramming · 2026-02-17T16:16:32Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+	auto computeFaceColor = [&](const uint32_t i0, const uint32_t i1, const uint32_t i2, uint16_t& outColor)->bool
+	{
+		outColor = 0u;
+		if (!colorView)
+			return true;
+		uint32_t c0 = 0u, c1 = 0u, c2 = 0u;
+		if (!stlDecodeColorB8G8R8A8(*colorView, i0, c0))
+			return false;
+		if (!stlDecodeColorB8G8R8A8(*colorView, i1, c1))
+			return false;
+		if (!stlDecodeColorB8G8R8A8(*colorView, i2, c2))
+			return false;
+		double rgba0[4] = {};
+		double rgba1[4] = {};
+		double rgba2[4] = {};
+		stlDecodeColorUnitRGBAFromB8G8R8A8(c0, rgba0);
+		stlDecodeColorUnitRGBAFromB8G8R8A8(c1, rgba1);
+		stlDecodeColorUnitRGBAFromB8G8R8A8(c2, rgba2);
+		const double rgbaAvg[4] = {
+			(rgba0[0] + rgba1[0] + rgba2[0]) / 3.0,
+			(rgba0[1] + rgba1[1] + rgba2[1]) / 3.0,
+			(rgba0[2] + rgba1[2] + rgba2[2]) / 3.0,
+			1.0
+		};
+		uint32_t avgColor = 0u;
+		encodePixels<EF_B8G8R8A8_UNORM, double>(&avgColor, rgbaAvg);
+		outColor = stlPackViscamColorFromB8G8R8A8(avgColor);
+		return true;
+	};


I think you need better sRGB handling.

devshgraphicsprogramming · 2026-02-17T16:17:10Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+		outColor = stlPackViscamColorFromB8G8R8A8(avgColor);
+		return true;
+	};
+	auto writeRecord = [&dst](const float nx, const float ny, const float nz, const float v1x, const float v1y, const float v1z, const float v2x, const float v2y, const float v2z, const float v3x, const float v3y, const float v3z, const uint16_t attribute)->void


Why are we passing these as individual scalars and not as hlsl::float32_t3?

devshgraphicsprogramming · 2026-02-17T16:17:56Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+				const hlsl::float32_t3 vertex1 = posTri[2u];
+				const hlsl::float32_t3 vertex2 = posTri[1u];
+				const hlsl::float32_t3 vertex3 = posTri[0u];
+				const float vertex1x = vertex1.x * handednessSign;
+				const float vertex2x = vertex2.x * handednessSign;
+				const float vertex3x = vertex3.x * handednessSign;
+
+				float normalX = 0.f;
+				float normalY = 0.f;
+				float normalZ = 0.f;
+				hlsl::float32_t3 attrNormal = nrmTri[0u];
+				if (attrNormal.x == 0.f && attrNormal.y == 0.f && attrNormal.z == 0.f)
+					attrNormal = nrmTri[1u];
+				if (attrNormal.x == 0.f && attrNormal.y == 0.f && attrNormal.z == 0.f)
+					attrNormal = nrmTri[2u];
+				if (!(attrNormal.x == 0.f && attrNormal.y == 0.f && attrNormal.z == 0.f))
+				{
+					if (flipHandedness)
+						attrNormal.x = -attrNormal.x;
+					normalX = attrNormal.x;
+					normalY = attrNormal.y;
+					normalZ = attrNormal.z;
+				}
+
+				if (normalX == 0.f && normalY == 0.f && normalZ == 0.f)
+				{
+					const float edge21x = vertex2x - vertex1x;
+					const float edge21y = vertex2.y - vertex1.y;
+					const float edge21z = vertex2.z - vertex1.z;
+					const float edge31x = vertex3x - vertex1x;
+					const float edge31y = vertex3.y - vertex1.y;
+					const float edge31z = vertex3.z - vertex1.z;
+
+					normalX = edge21y * edge31z - edge21z * edge31y;
+					normalY = edge21z * edge31x - edge21x * edge31z;
+					normalZ = edge21x * edge31y - edge21y * edge31x;
+					const float planeNormalLen2 = normalX * normalX + normalY * normalY + normalZ * normalZ;
+					if (planeNormalLen2 > 0.f)
+					{
+						const float invLen = 1.f / std::sqrt(planeNormalLen2);
+						normalX *= invLen;
+						normalY *= invLen;
+						normalZ *= invLen;
+					}
+				}


The code could be so much smaller if you used vector types and the HLSL library.

devshgraphicsprogramming · 2026-02-17T16:18:07Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+					if (planeNormalLen2 > 0.f)
+					{
+						const float invLen = 1.f / std::sqrt(planeNormalLen2);
+						normalX *= invLen;
+						normalY *= invLen;
+						normalZ *= invLen;
+					}


It's okay to write NaN in this case.

devshgraphicsprogramming · 2026-02-17T16:18:16Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+			if (planeNormalLen2 > 0.f)
+			{
+				const float invLen = 1.f / std::sqrt(planeNormalLen2);
+				normalX *= invLen;
+				normalY *= invLen;
+				normalZ *= invLen;
+			}


NaN is okay.

devshgraphicsprogramming · 2026-02-17T16:18:38Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+			hlsl::float32_t3 p0 = {};
+			hlsl::float32_t3 p1 = {};
+			hlsl::float32_t3 p2 = {};
+			if (!decodePosition(i0, p0) || !decodePosition(i1, p1) || !decodePosition(i2, p2))
+				return false;
+
+			hlsl::float32_t3 vertex1 = p2;
+			hlsl::float32_t3 vertex2 = p1;
+			hlsl::float32_t3 vertex3 = p0;
+
+			if (flipHandedness)
+			{
+				vertex1.x = -vertex1.x;
+				vertex2.x = -vertex2.x;
+				vertex3.x = -vertex3.x;
+			}


Use arrays instead of separate values.

devshgraphicsprogramming · 2026-02-17T16:18:58Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+			hlsl::float32_t3 normal = hlsl::float32_t3(0.f, 0.f, 0.f);
+			if (!hasNormals)
+			{
+				if (planeNormalLen2 > 0.f)


NaN is okay

devshgraphicsprogramming · 2026-02-17T16:19:20Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+			if (hasNormals)
+			{
+				hlsl::float32_t3 n0 = {};
+				if (!decodeNormal(i0, n0))
+					return false;
+
+				hlsl::float32_t3 attrNormal = n0;
+				if (hlsl::dot(attrNormal, attrNormal) <= 0.f)
+				{
+					hlsl::float32_t3 n1 = {};
+					if (!decodeNormal(i1, n1))
+						return false;
+					attrNormal = n1;
+				}
+				if (hlsl::dot(attrNormal, attrNormal) <= 0.f)
+				{
+					hlsl::float32_t3 n2 = {};
+					if (!decodeNormal(i2, n2))
+						return false;
+					attrNormal = n2;
+				}
+
+				if (hlsl::dot(attrNormal, attrNormal) > 0.f)
+				{
+					if (flipHandedness)
+						attrNormal.x = -attrNormal.x;
+					if (planeNormalLen2 > 0.f && hlsl::dot(attrNormal, planeNormal) < 0.f)
+						attrNormal = -attrNormal;
+					normal = attrNormal;
+				}
+				else if (planeNormalLen2 > 0.f)
+				{
+					normal = hlsl::normalize(planeNormal);
+				}
+			}


What's all this code?

devshgraphicsprogramming · 2026-02-17T16:19:43Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+bool writeFaceText(
+		const core::vectorSIMDf& v1,
+		const core::vectorSIMDf& v2,
+		const core::vectorSIMDf& v3,
+		const uint32_t* idx,
+		const asset::ICPUPolygonGeometry::SDataView& normalView,
+		const bool flipHandedness,
+		SContext* context)
+{
+	core::vectorSIMDf vertex1 = v3;
+	core::vectorSIMDf vertex2 = v2;
+	core::vectorSIMDf vertex3 = v1;

-		context->fileOffset += success.getBytesProcessed();
+	if (flipHandedness)
+	{
+		vertex1.X = -vertex1.X;
+		vertex2.X = -vertex2.X;
+		vertex3.X = -vertex3.X;
 	}

+	core::vectorSIMDf normal = core::plane3dSIMDf(vertex1, vertex2, vertex3).getNormal();
+	core::vectorSIMDf attrNormal;
+	if (decodeTriangleNormal(normalView, idx, attrNormal))
 	{
-		system::IFile::success_t success;;
-		context->writeContext.outputFile->write(success, "endfacet\n", context->fileOffset, 9);
-
-		context->fileOffset += success.getBytesProcessed();
+		if (flipHandedness)
+			attrNormal.X = -attrNormal.X;
+		if (core::dot(attrNormal, normal).X < 0.f)
+			attrNormal = -attrNormal;
+		normal = attrNormal;
 	}


Get rid of the old vector types (core::vectorSIMDf).

devshgraphicsprogramming · 2026-02-17T16:19:50Z

src/nbl/asset/interchange/CSTLMeshWriter.cpp

+		core::vectorSIMDf v0;
+		core::vectorSIMDf v1;
+		core::vectorSIMDf v2;


devshgraphicsprogramming · 2026-02-17T16:24:33Z

src/nbl/asset/interchange/COBJMeshWriter.cpp

+constexpr size_t ApproxObjBytesPerVertex = 96ull;
+constexpr size_t ApproxObjBytesPerFace = 48ull;
+constexpr size_t MaxUInt32Chars = 10ull;
+constexpr size_t MaxFloatFixed6Chars = 48ull;
+constexpr size_t MaxIndexTokenBytes = MaxUInt32Chars * 3ull + 2ull;


Express these with sizeof so we know where the values come from and which assumptions they rely on.

devshgraphicsprogramming · 2026-02-17T16:25:16Z

src/nbl/asset/interchange/COBJMeshWriter.cpp

+bool decodeVec4(const ICPUPolygonGeometry::SDataView& view, const size_t ix, hlsl::float64_t4& out)
+{
+	out = hlsl::float64_t4(0.0, 0.0, 0.0, 0.0);
+	return view.decodeElement(ix, out);
+}
+
+char* appendUIntToBuffer(char* dst, char* const end, const uint32_t value)
+{
+	if (!dst || dst >= end)
+		return end;
+
+	const auto result = std::to_chars(dst, end, value);
+	if (result.ec == std::errc())
+		return result.ptr;
+
+	const int written = std::snprintf(dst, static_cast<size_t>(end - dst), "%u", value);
+	if (written <= 0)
+		return dst;
+	const size_t writeLen = static_cast<size_t>(written);
+	return (writeLen < static_cast<size_t>(end - dst)) ? (dst + writeLen) : end;
+}


Factor this out into a common utility?

devshgraphicsprogramming · 2026-02-17T16:26:28Z

src/nbl/asset/interchange/COBJMeshWriter.cpp

+void appendVec3Line(std::string& out, const char* prefix, const size_t prefixSize, const float x, const float y, const float z)
+{
+	const size_t oldSize = out.size();
+	out.resize(oldSize + prefixSize + (3ull * MaxFloatFixed6Chars) + 3ull);
+	char* const lineBegin = out.data() + oldSize;
+	char* cursor = lineBegin;
+	char* const lineEnd = out.data() + out.size();
+
+	std::memcpy(cursor, prefix, prefixSize);
+	cursor += prefixSize;
+
+	cursor = appendFloatFixed6ToBuffer(cursor, lineEnd, x);
+	if (cursor < lineEnd)
+		*(cursor++) = ' ';
+	cursor = appendFloatFixed6ToBuffer(cursor, lineEnd, y);
+	if (cursor < lineEnd)
+		*(cursor++) = ' ';
+	cursor = appendFloatFixed6ToBuffer(cursor, lineEnd, z);
+	if (cursor < lineEnd)
+		*(cursor++) = '\n';
+
+	out.resize(oldSize + static_cast<size_t>(cursor - lineBegin));
+}
+
+void appendVec2Line(std::string& out, const char* prefix, const size_t prefixSize, const float x, const float y)
+{
+	const size_t oldSize = out.size();
+	out.resize(oldSize + prefixSize + (2ull * MaxFloatFixed6Chars) + 2ull);
+	char* const lineBegin = out.data() + oldSize;
+	char* cursor = lineBegin;
+	char* const lineEnd = out.data() + out.size();
+
+	std::memcpy(cursor, prefix, prefixSize);
+	cursor += prefixSize;
+
+	cursor = appendFloatFixed6ToBuffer(cursor, lineEnd, x);
+	if (cursor < lineEnd)
+		*(cursor++) = ' ';
+	cursor = appendFloatFixed6ToBuffer(cursor, lineEnd, y);
+	if (cursor < lineEnd)
+		*(cursor++) = '\n';
+
+	out.resize(oldSize + static_cast<size_t>(cursor - lineBegin));
+}
+
+void appendFaceLine(std::string& out, const std::string& storage, const core::vector<SIndexStringRef>& refs, const uint32_t i0, const uint32_t i1, const uint32_t i2)
+{
+	const auto& ref0 = refs[i0];
+	const auto& ref1 = refs[i1];
+	const auto& ref2 = refs[i2];
+	const size_t oldSize = out.size();
+	const size_t lineSize = 2ull + static_cast<size_t>(ref0.length) + 1ull + static_cast<size_t>(ref1.length) + 1ull + static_cast<size_t>(ref2.length) + 1ull;
+	out.resize(oldSize + lineSize);
+	char* cursor = out.data() + oldSize;
+	*(cursor++) = 'f';
+	*(cursor++) = ' ';
+	std::memcpy(cursor, storage.data() + ref0.offset, ref0.length);
+	cursor += ref0.length;
+	*(cursor++) = ' ';
+	std::memcpy(cursor, storage.data() + ref1.offset, ref1.length);
+	cursor += ref1.length;
+	*(cursor++) = ' ';
+	std::memcpy(cursor, storage.data() + ref2.offset, ref2.length);
+	cursor += ref2.length;
+	*(cursor++) = '\n';
+}


Why not take hlsl::float32_tN and hlsl::uint32_t3 instead of individual scalar arguments?

Also, the `out` string state you keep passing around could really be wrapped up in a context struct with methods.

devshgraphicsprogramming · 2026-02-17T16:31:29Z

src/nbl/asset/interchange/COBJMeshWriter.cpp

+	const auto* geom = IAsset::castDown<const ICPUPolygonGeometry>(_params.rootAsset);
+	if (!geom || !geom->valid())
+		return false;
+


By the way, the OBJ writer should be an ICPUScene writer.

devshgraphicsprogramming · 2026-02-17T16:53:14Z