Commit 59b8792

Merge pull request #1976 from hsuan-lun-chiang:feat/sharding-test
PiperOrigin-RevId: 793823533
2 parents 252d1fc + a97bfca commit 59b8792

File tree: 33 files changed, +53256 -0 lines changed


MaxText/tests/run_sharding_dump.py

Lines changed: 53 additions & 0 deletions
@@ -0,0 +1,53 @@
"""
Copyright 2023 Google LLC

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

https://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

"""Run script to dump the sharding of various combinations of model and topology."""

import os
import subprocess
from typing import Sequence

from absl import app

from MaxText.tests.sharding_dump import TEST_CASES


def run_single_dump(model_name: str, topology: str, num_slice: str) -> None:
  """Generate the sharding JSON file for one specific model, topology and slice count."""
  subprocess.run(
      [
          "python",
          "-m",
          "MaxText.tests.sharding_dump",
          "MaxText/configs/base.yml",
          f"compile_topology={topology}",
          f"compile_topology_num_slices={num_slice}",
          f"model_name={model_name}",
      ],
      check=True,
  )


def main(argv: Sequence[str]) -> None:
  """Generate sharding JSON files for every combination of model, topology and slices."""
  for model_name, topology, num_slice in TEST_CASES:
    json_path = f"sharding_info/{model_name}/{topology}/slice_{num_slice}/named_shardings.json"
    if os.path.exists(json_path):
      continue
    run_single_dump(model_name, topology, num_slice)


if __name__ == "__main__":
  app.run(main)
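
For a one-off regeneration, the helper above can also be called directly from Python. A minimal usage sketch; the model name, topology and slice count below are hypothetical placeholders, not entries taken from TEST_CASES:

from MaxText.tests.run_sharding_dump import run_single_dump

# Hypothetical example values; the real combinations live in TEST_CASES
# (MaxText.tests.sharding_dump). The runner expects the resulting file at
# sharding_info/<model_name>/<topology>/slice_<num_slice>/named_shardings.json.
run_single_dump(model_name="llama2-7b", topology="v5e-256", num_slice="1")
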
Lines changed: 111 additions & 0 deletions
@@ -0,0 +1,111 @@
"""
Copyright 2023 Google LLC

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

https://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

"""Compare the expected sharding of models with the actual sharding of models."""

import hashlib
import json
import os

import pytest

from MaxText import pyconfig
from MaxText.tests.sharding_dump import named_shardings_to_json, load_named_sharding_json, TEST_CASES
from MaxText.train_compile import get_shaped_inputs, get_topology_mesh, validate_config


def compute_checksum(d: dict) -> str:
  """Compute a checksum (SHA-256) of a dictionary."""
  # Serialize the dictionary into a JSON string (ensuring consistent ordering of keys).
  json_str = json.dumps(d, sort_keys=True)

  # Compute the SHA-256 checksum of the serialized string.
  checksum = hashlib.sha256(json_str.encode("utf-8")).hexdigest()

  return checksum


def compare_named_sharding_jsons(json1: dict, model1_name: str, json2: dict, model2_name: str) -> bool:
  """Compare two named-sharding JSON dictionaries and print the differences, if any."""
  keys1 = set(json1.keys())
  keys2 = set(json2.keys())

  only_in_1 = keys1 - keys2
  only_in_2 = keys2 - keys1
  shared_keys = keys1 & keys2

  if only_in_1:
    print(f"Keys only in {model1_name}:")
    for k in sorted(only_in_1):
      print(f"  {k}")

  if only_in_2:
    print(f"Keys only in {model2_name}:")
    for k in sorted(only_in_2):
      print(f"  {k}")

  for key in sorted(shared_keys):
    entry1 = json1[key]
    entry2 = json2[key]

    mesh1 = entry1.get("mesh", {})
    mesh2 = entry2.get("mesh", {})
    spec1 = entry1.get("partition_spec", [])
    spec2 = entry2.get("partition_spec", [])

    if mesh1 != mesh2:
      print(f"\nMesh mismatch at '{key}':")
      print(f"  mesh1: {mesh1}")
      print(f"  mesh2: {mesh2}")

    if spec1 != spec2:
      print(f"\nPartitionSpec mismatch at '{key}':")
      print(f"  spec1: {spec1}")
      print(f"  spec2: {spec2}")

  return not only_in_1 and not only_in_2 and all(json1[k] == json2[k] for k in shared_keys)


@pytest.mark.parametrize("model_name, topology, num_slice", TEST_CASES)
def test_sharding_dump_for_model(model_name: str, topology: str, num_slice: str) -> None:
  """Test whether the sharding of a new model implementation is as expected."""
  params = [
      "/deps/MaxText/tests/sharding_compare_test",
      "MaxText/configs/base.yml",
      f"compile_topology={topology}",
      f"compile_topology_num_slices={num_slice}",
      f"model_name={model_name}",
  ]

  json_path = f"sharding_info/{model_name}/{topology}/slice_{num_slice}/named_shardings.json"
  if not os.path.exists(json_path):
    return

  config = pyconfig.initialize(params)
  validate_config(config)

  topology_mesh = get_topology_mesh(config)
  _, _, state_mesh_shardings, _ = get_shaped_inputs(topology_mesh, config)
  actual_json = named_shardings_to_json(state_mesh_shardings)
  expected_json = load_named_sharding_json(json_path)

  actual_checksum = compute_checksum(actual_json)
  expected_checksum = compute_checksum(expected_json)
  result = actual_checksum == expected_checksum

  if not result:
    compare_named_sharding_jsons(expected_json, f"expected_{model_name}", actual_json, f"actual_{model_name}")

  assert result is True
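
The equality check hinges on json.dumps(..., sort_keys=True) producing a canonical serialization, so two dictionaries with identical contents but different key insertion order hash to the same SHA-256 digest. A minimal, self-contained sketch of that property; the mesh and partition_spec values are hypothetical illustrations, not taken from an actual dump:

import hashlib
import json


def checksum(d: dict) -> str:
  """Sorted-key JSON followed by SHA-256, mirroring compute_checksum above."""
  return hashlib.sha256(json.dumps(d, sort_keys=True).encode("utf-8")).hexdigest()


# Same nested content, different insertion order of the inner keys.
a = {"params": {"mesh": {"data": 4, "tensor": 2}, "partition_spec": ["data", None]}}
b = {"params": {"partition_spec": ["data", None], "mesh": {"tensor": 2, "data": 4}}}
assert checksum(a) == checksum(b)

Assuming the test file is checked in as MaxText/tests/sharding_compare_test.py (the first element of params suggests that path), the parametrized cases can be collected with pytest; any case whose expected named_shardings.json has not yet been dumped is skipped by the early return.
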
