modelpack · rishi-jat · Mar 26, 2026 · Copilot · Mar 26, 2026 · gemini-code-assist
diff --git a/tools/hf_to_arch.py b/tools/hf_to_arch.py
@@ -0,0 +1,59 @@
+#!/usr/bin/env python3
+"""Convert HuggingFace config.json to architecture_config format."""
+
+import json
+import sys
+
+
+REQUIRED_MAPPINGS = {
+    "numLayers": "num_hidden_layers",
+    "hiddenSize": "hidden_size",
+    "numAttentionHeads": "num_attention_heads",
+}
+
+
+def convert_hf_config(hf_config: dict) -> dict:
+    """Convert HuggingFace config to architecture_config format."""
+    arch_config = {"type": "transformer"}
+
+    for arch_key, hf_key in REQUIRED_MAPPINGS.items():
+        if hf_key not in hf_config:
+            raise ValueError(f"missing required field: {hf_key}")
+        value = hf_config[hf_key]
+        if not isinstance(value, int) or isinstance(value, bool):
-        if not isinstance(value, int) or isinstance(value, bool):
+        if type(value) is not int:
-        if not isinstance(value, int) or isinstance(value, bool):
+        if type(value) is not int:
+            raise ValueError(f"field {hf_key} must be an integer, got {type(value).__name__}")
+        if value < 1:
+            raise ValueError(f"field {hf_key} must be >= 1, got {value}")
+        arch_config[arch_key] = value
+
+    return arch_config
+
+
+def main():
+    if len(sys.argv) != 2:
+        print(f"usage: {sys.argv[0]} <config.json>", file=sys.stderr)
+        sys.exit(1)
+
+    config_path = sys.argv[1]
-    if len(sys.argv) != 2:
-        print(f"usage: {sys.argv[0]} <config.json>", file=sys.stderr)
-        sys.exit(1)
-
-    config_path = sys.argv[1]
+    parser = argparse.ArgumentParser(description="Convert HuggingFace config.json to architecture_config format.")
+    parser.add_argument("config_path", help="Path to the HuggingFace config.json file.")
+    args = parser.parse_args()
+
+    config_path = args.config_path
-    if len(sys.argv) != 2:
-        print(f"usage: {sys.argv[0]} <config.json>", file=sys.stderr)
-        sys.exit(1)
-
-    config_path = sys.argv[1]
+    parser = argparse.ArgumentParser(description="Convert HuggingFace config.json to architecture_config format.")
+    parser.add_argument("config_path", help="Path to the HuggingFace config.json file.")
+    args = parser.parse_args()
+
+    config_path = args.config_path
+
+    try:
+        with open(config_path, "r") as f:
-        with open(config_path, "r") as f:
+        with open(config_path, "r", encoding="utf-8") as f:
-        with open(config_path, "r") as f:
+        with open(config_path, "r", encoding="utf-8") as f:
+            hf_config = json.load(f)
+    except FileNotFoundError:
+        print(f"error: file not found: {config_path}", file=sys.stderr)
+        sys.exit(1)
+    except json.JSONDecodeError as e:
+        print(f"error: invalid JSON: {e}", file=sys.stderr)
+        sys.exit(1)
+
+    try:
+        arch_config = convert_hf_config(hf_config)
+    except ValueError as e:
+        print(f"error: {e}", file=sys.stderr)
+        sys.exit(1)
+
+    print(json.dumps(arch_config, indent=2, sort_keys=True))
+
+
+if __name__ == "__main__":
+    main()
diff --git a/tools/hf_to_arch_test.py b/tools/hf_to_arch_test.py
@@ -0,0 +1,146 @@
+#!/usr/bin/env python3
+"""Tests for hf_to_arch.py"""
+
+import json
+import subprocess
+import sys
+import tempfile
+import os
+
+SCRIPT_PATH = os.path.join(os.path.dirname(__file__), "hf_to_arch.py")
+
+
+def run_script(config_content: str) -> tuple:
+    """Run hf_to_arch.py with given config content, return (exitcode, stdout, stderr)."""
+    with tempfile.NamedTemporaryFile(mode="w", suffix=".json", delete=False) as f:
+        f.write(config_content)
+        f.flush()
+        temp_path = f.name
+
+    try:
+        result = subprocess.run(
+            [sys.executable, SCRIPT_PATH, temp_path],
+            capture_output=True,
+            text=True,
+        )
+        return result.returncode, result.stdout, result.stderr
+    finally:
+        os.unlink(temp_path)
+
+
+def test_valid_config():
+    """Valid HuggingFace config produces correct output."""
+    config = json.dumps({
+        "num_hidden_layers": 32,
+        "hidden_size": 4096,
+        "num_attention_heads": 32,
+        "vocab_size": 32000,
+    })
+
+    exitcode, stdout, stderr = run_script(config)
+
+    assert exitcode == 0, f"expected exit 0, got {exitcode}: {stderr}"
+    output = json.loads(stdout)
+    assert output == {
+        "type": "transformer",
+        "numLayers": 32,
+        "hiddenSize": 4096,
+        "numAttentionHeads": 32,
+    }, f"unexpected output: {output}"
+    print("PASS: test_valid_config")
+
+
+def test_missing_field():
+    """Missing required field produces error."""
+    config = json.dumps({
+        "num_hidden_layers": 32,
+        "hidden_size": 4096,
+    })
+
+    exitcode, stdout, stderr = run_script(config)
+
+    assert exitcode != 0, "expected non-zero exit for missing field"
+    assert "num_attention_heads" in stderr, f"error should mention missing field: {stderr}"
+    print("PASS: test_missing_field")
+
+
+def test_invalid_json():
+    """Invalid JSON produces error."""
+    exitcode, stdout, stderr = run_script("not valid json {")
+
+    assert exitcode != 0, "expected non-zero exit for invalid JSON"
+    assert "invalid JSON" in stderr.lower() or "json" in stderr.lower(), f"error should mention JSON: {stderr}"
+    print("PASS: test_invalid_json")
+
+
+def test_file_not_found():
+    """Non-existent file produces error."""
+    result = subprocess.run(
+        [sys.executable, SCRIPT_PATH, "/nonexistent/path/config.json"],
+        capture_output=True,
+        text=True,
+    )
+
+    assert result.returncode != 0, "expected non-zero exit for missing file"
+    assert "not found" in result.stderr.lower(), f"error should mention file not found: {result.stderr}"
+    print("PASS: test_file_not_found")
+
+
+def test_invalid_field_type():
+    """Non-integer field produces error."""
+    config = json.dumps({
+        "num_hidden_layers": "32",
+        "hidden_size": 4096,
+        "num_attention_heads": 32,
+    })
+
+    exitcode, stdout, stderr = run_script(config)
+
+    assert exitcode != 0, "expected non-zero exit for invalid type"
+    assert "integer" in stderr.lower(), f"error should mention type: {stderr}"
+    print("PASS: test_invalid_field_type")
+
+
+def test_zero_value():
+    """Zero value produces error."""
+    config = json.dumps({
+        "num_hidden_layers": 0,
+        "hidden_size": 4096,
+        "num_attention_heads": 32,
+    })
+
+    exitcode, stdout, stderr = run_script(config)
+
+    assert exitcode != 0, "expected non-zero exit for zero value"
+    assert ">= 1" in stderr, f"error should mention minimum: {stderr}"
+    print("PASS: test_zero_value")
+
+
+def test_bool_value():
+    """Boolean value produces error."""
+    config = json.dumps({
+        "num_hidden_layers": True,
+        "hidden_size": 4096,
+        "num_attention_heads": 32,
+    })
+
+    exitcode, stdout, stderr = run_script(config)
+
+    assert exitcode != 0, "expected non-zero exit for bool value"
+    assert "integer" in stderr.lower(), f"error should mention type: {stderr}"
+    print("PASS: test_bool_value")
+
+
+def main():
+    test_valid_config()
+    test_missing_field()
+    test_invalid_json()
+    test_file_not_found()
+    test_invalid_field_type()
+    test_zero_value()
+    test_bool_value()
+    print("\nAll tests passed.")
+
+
+if __name__ == "__main__":
+    main()
-def main():
-    test_valid_config()
-    test_missing_field()
-    test_invalid_json()
-    test_file_not_found()
-    test_invalid_field_type()
-    test_zero_value()
-    test_bool_value()
-    print("\nAll tests passed.")
-
-
-if __name__ == "__main__":
-    main()
-def main():
-    test_valid_config()
-    test_missing_field()
-    test_invalid_json()
-    test_file_not_found()
-    test_invalid_field_type()
-    test_zero_value()
-    test_bool_value()
-    print("\nAll tests passed.")
-
-
-if __name__ == "__main__":
-    main()