modelpack · rishi-jat · Mar 25, 2026 · Mar 25, 2026 · Copilot · Mar 26, 2026
diff --git a/schema/config-schema.json b/schema/config-schema.json
@@ -41,8 +41,34 @@
           },
           "capabilities": {
             "$ref": "#/$defs/ModelCapabilities"
+          },
+          "architecture_config": {
-          "architecture_config": {
+          "architectureConfig": {
-          "architecture_config": {
+          "architectureConfig": {
+            "$ref": "#/$defs/ArchitectureConfig"
+          }
+        },
+        "additionalProperties": false
+      },
+      "ArchitectureConfig": {
+        "type": "object",
+        "properties": {
+          "type": {
+            "type": "string",
+            "enum": ["transformer"]
+          },
+          "numLayers": {
+            "type": "integer",
+            "minimum": 1
+          },
+          "hiddenSize": {
+            "type": "integer",
+            "minimum": 1
+          },
+          "numAttentionHeads": {
+            "type": "integer",
+            "minimum": 1
           }
         },
+        "required": ["type", "numLayers", "hiddenSize", "numAttentionHeads"],
         "additionalProperties": false
       },
       "ModelDescriptor": {

diff --git a/schema/config_test.go b/schema/config_test.go
@@ -589,3 +589,51 @@ func TestConfig(t *testing.T) {
 		}
 	}
 }
+
+func TestArchitectureConfigValid(t *testing.T) {
+	validJSON := `{
+		"descriptor": {"name": "test-model"},
+		"config": {
+			"paramSize": "8b",
+			"architecture_config": {
+				"type": "transformer",
+				"numLayers": 32,
+				"hiddenSize": 4096,
+				"numAttentionHeads": 32
+			}
+		},
+		"modelfs": {
+			"type": "layers",
+			"diffIds": ["sha256:1234567890abcdef1234567890abcdef1234567890abcdef1234567890abcdef"]
+		}
+	}`
+
+	err := schema.ValidatorMediaTypeModelConfig.Validate(strings.NewReader(validJSON))
+	if err != nil {
+		t.Fatalf("expected valid architecture_config to pass, got error: %v", err)
+	}
+}
+
+func TestArchitectureConfigMissingRequiredField(t *testing.T) {
+	// Missing numLayers field
+	invalidJSON := `{
+		"descriptor": {"name": "test-model"},
+		"config": {
+			"paramSize": "8b",
+			"architecture_config": {
+				"type": "transformer",
+				"hiddenSize": 4096,
+				"numAttentionHeads": 32
+			}
+		},
+		"modelfs": {
+			"type": "layers",
+			"diffIds": ["sha256:1234567890abcdef1234567890abcdef1234567890abcdef1234567890abcdef"]
+		}
+	}`
+
+	err := schema.ValidatorMediaTypeModelConfig.Validate(strings.NewReader(invalidJSON))
+	if err == nil {
+		t.Fatalf("expected architecture_config with missing numLayers to fail validation")
+	}
+}
diff --git a/specs-go/v1/config.go b/specs-go/v1/config.go
@@ -42,6 +42,24 @@ type ModelConfig struct {
 
 	// Special capabilities that the model supports
 	Capabilities *ModelCapabilities `json:"capabilities,omitempty"`
+
+	// Architecture-specific configuration parameters
+	ArchitectureConfig *ArchitectureConfig `json:"architecture_config,omitempty"`
-	ArchitectureConfig *ArchitectureConfig `json:"architecture_config,omitempty"`
+	ArchitectureConfig *ArchitectureConfig `json:"architectureConfig,omitempty"`
-	ArchitectureConfig *ArchitectureConfig `json:"architecture_config,omitempty"`
+	ArchitectureConfig *ArchitectureConfig `json:"architectureConfig,omitempty"`
+}
+
+// ArchitectureConfig defines architecture-specific parameters for the model.
+type ArchitectureConfig struct {
+	// Type specifies the model architecture type (e.g., "transformer").
+	Type string `json:"type"`
+
+	// NumLayers is the number of layers in the model.
+	NumLayers int `json:"numLayers"`
+
+	// HiddenSize is the dimensionality of the hidden representations.
+	HiddenSize int `json:"hiddenSize"`
+
+	// NumAttentionHeads is the number of attention heads.
+	NumAttentionHeads int `json:"numAttentionHeads"`
 }
 
 // ModelFS describes a layer content addresses

diff --git a/tools/hf_to_arch.py b/tools/hf_to_arch.py
@@ -0,0 +1,59 @@
+#!/usr/bin/env python3
+"""Convert HuggingFace config.json to architecture_config format."""
+
+import json
+import sys
+
+
+REQUIRED_MAPPINGS = {
+    "numLayers": "num_hidden_layers",
+    "hiddenSize": "hidden_size",
+    "numAttentionHeads": "num_attention_heads",
+}
+
+
+def convert_hf_config(hf_config: dict) -> dict:
+    """Convert HuggingFace config to architecture_config format."""
+    arch_config = {"type": "transformer"}
+
+    for arch_key, hf_key in REQUIRED_MAPPINGS.items():
+        if hf_key not in hf_config:
+            raise ValueError(f"missing required field: {hf_key}")
+        value = hf_config[hf_key]
+        if not isinstance(value, int) or isinstance(value, bool):
+            raise ValueError(f"field {hf_key} must be an integer, got {type(value).__name__}")
+        if value < 1:
+            raise ValueError(f"field {hf_key} must be >= 1, got {value}")
+        arch_config[arch_key] = value
+
+    return arch_config
+
+
+def main():
+    if len(sys.argv) != 2:
+        print(f"usage: {sys.argv[0]} <config.json>", file=sys.stderr)
+        sys.exit(1)
+
+    config_path = sys.argv[1]
-    if len(sys.argv) != 2:
-        print(f"usage: {sys.argv[0]} <config.json>", file=sys.stderr)
-        sys.exit(1)
-
-    config_path = sys.argv[1]
+    parser = argparse.ArgumentParser(description=__doc__.strip())
+    parser.add_argument("config_path", metavar="config.json", help="Path to HuggingFace config.json")
+    args = parser.parse_args()
+    config_path = args.config_path
-    if len(sys.argv) != 2:
-        print(f"usage: {sys.argv[0]} <config.json>", file=sys.stderr)
-        sys.exit(1)
-
-    config_path = sys.argv[1]
+    parser = argparse.ArgumentParser(description=__doc__.strip())
+    parser.add_argument("config_path", metavar="config.json", help="Path to HuggingFace config.json")
+    args = parser.parse_args()
+    config_path = args.config_path
+
+    try:
+        with open(config_path, "r") as f:
+            hf_config = json.load(f)
+    except FileNotFoundError:
+        print(f"error: file not found: {config_path}", file=sys.stderr)
+        sys.exit(1)
+    except json.JSONDecodeError as e:
+        print(f"error: invalid JSON: {e}", file=sys.stderr)
+        sys.exit(1)
+
+    try:
+        arch_config = convert_hf_config(hf_config)
+    except ValueError as e:
+        print(f"error: {e}", file=sys.stderr)
+        sys.exit(1)
+
+    print(json.dumps(arch_config, indent=2, sort_keys=True))
+
+
+if __name__ == "__main__":
+    main()
diff --git a/tools/hf_to_arch_test.py b/tools/hf_to_arch_test.py
@@ -0,0 +1,146 @@
+#!/usr/bin/env python3
+"""Tests for hf_to_arch.py"""
+
+import json
+import subprocess
+import sys
+import tempfile
+import os
+
+SCRIPT_PATH = os.path.join(os.path.dirname(__file__), "hf_to_arch.py")
+
+
+def run_script(config_content: str) -> tuple:
+    """Run hf_to_arch.py with given config content, return (exitcode, stdout, stderr)."""
+    with tempfile.NamedTemporaryFile(mode="w", suffix=".json", delete=False) as f:
+        f.write(config_content)
+        f.flush()
+        temp_path = f.name
+
+    try:
+        result = subprocess.run(
+            [sys.executable, SCRIPT_PATH, temp_path],
+            capture_output=True,
+            text=True,
+        )
+        return result.returncode, result.stdout, result.stderr
+    finally:
+        os.unlink(temp_path)
+
+
+def test_valid_config():
+    """Valid HuggingFace config produces correct output."""
+    config = json.dumps({
+        "num_hidden_layers": 32,
+        "hidden_size": 4096,
+        "num_attention_heads": 32,
+        "vocab_size": 32000,
+    })
+
+    exitcode, stdout, stderr = run_script(config)
+
+    assert exitcode == 0, f"expected exit 0, got {exitcode}: {stderr}"
+    output = json.loads(stdout)
+    assert output == {
+        "type": "transformer",
+        "numLayers": 32,
+        "hiddenSize": 4096,
+        "numAttentionHeads": 32,
+    }, f"unexpected output: {output}"
+    print("PASS: test_valid_config")
+
+
+def test_missing_field():
+    """Missing required field produces error."""
+    config = json.dumps({
+        "num_hidden_layers": 32,
+        "hidden_size": 4096,
+    })
+
+    exitcode, stdout, stderr = run_script(config)
+
+    assert exitcode != 0, "expected non-zero exit for missing field"
+    assert "num_attention_heads" in stderr, f"error should mention missing field: {stderr}"
+    print("PASS: test_missing_field")
+
+
+def test_invalid_json():
+    """Invalid JSON produces error."""
+    exitcode, stdout, stderr = run_script("not valid json {")
+
+    assert exitcode != 0, "expected non-zero exit for invalid JSON"
+    assert "invalid JSON" in stderr.lower() or "json" in stderr.lower(), f"error should mention JSON: {stderr}"
-    assert "invalid JSON" in stderr.lower() or "json" in stderr.lower(), f"error should mention JSON: {stderr}"
+    assert "invalid json" in stderr.lower() or "json" in stderr.lower(), f"error should mention JSON: {stderr}"
-    assert "invalid JSON" in stderr.lower() or "json" in stderr.lower(), f"error should mention JSON: {stderr}"
+    assert "invalid json" in stderr.lower() or "json" in stderr.lower(), f"error should mention JSON: {stderr}"
+    print("PASS: test_invalid_json")
+
+
+def test_file_not_found():
+    """Non-existent file produces error."""
+    result = subprocess.run(
+        [sys.executable, SCRIPT_PATH, "/nonexistent/path/config.json"],
+        capture_output=True,
+        text=True,
+    )
+
+    assert result.returncode != 0, "expected non-zero exit for missing file"
+    assert "not found" in result.stderr.lower(), f"error should mention file not found: {result.stderr}"
+    print("PASS: test_file_not_found")
+
+
+def test_invalid_field_type():
+    """Non-integer field produces error."""
+    config = json.dumps({
+        "num_hidden_layers": "32",
+        "hidden_size": 4096,
+        "num_attention_heads": 32,
+    })
+
+    exitcode, stdout, stderr = run_script(config)
+
+    assert exitcode != 0, "expected non-zero exit for invalid type"
+    assert "integer" in stderr.lower(), f"error should mention type: {stderr}"
+    print("PASS: test_invalid_field_type")
+
+
+def test_zero_value():
+    """Zero value produces error."""
+    config = json.dumps({
+        "num_hidden_layers": 0,
+        "hidden_size": 4096,
+        "num_attention_heads": 32,
+    })
+
+    exitcode, stdout, stderr = run_script(config)
+
+    assert exitcode != 0, "expected non-zero exit for zero value"
+    assert ">= 1" in stderr, f"error should mention minimum: {stderr}"
+    print("PASS: test_zero_value")
+
+
+def test_bool_value():
+    """Boolean value produces error."""
+    config = json.dumps({
+        "num_hidden_layers": True,
+        "hidden_size": 4096,
+        "num_attention_heads": 32,
+    })
+
+    exitcode, stdout, stderr = run_script(config)
+
+    assert exitcode != 0, "expected non-zero exit for bool value"
+    assert "integer" in stderr.lower(), f"error should mention type: {stderr}"
+    print("PASS: test_bool_value")
+
+
+def main():
+    test_valid_config()
+    test_missing_field()
+    test_invalid_json()
+    test_file_not_found()
+    test_invalid_field_type()
+    test_zero_value()
+    test_bool_value()
+    print("\nAll tests passed.")
+
+
+if __name__ == "__main__":
+    main()