Commit c1f92d7

[JAX SC] Refactor _get_stack_table_names into helper functions.
This change breaks down the logic of `_get_stack_table_names` into three new private functions: `_group_tables_for_stacking`, `_calculate_activation_memory_metrics`, and `_split_groups_by_memory_limit`. Dedicated unit tests are added for `_split_groups_by_memory_limit`.

PiperOrigin-RevId: 832388245
1 parent 5752890 commit c1f92d7

2 files changed: 133 additions & 19 deletions


jax_tpu_embedding/sparsecore/lib/nn/table_stacking.py

Lines changed: 51 additions & 19 deletions
@@ -373,15 +373,11 @@ def round_up_dim_and_vocab_size(
   return table_to_padded_dim, table_to_padded_vocab_size
 
 
-def _get_stack_table_names(
+def _group_tables_for_stacking(
     num_sc: int,
     flatten_tables: Mapping[str, embedding_spec.TableSpec],
-    flatten_features: Sequence[embedding_spec.FeatureSpec],
-    activation_mem_bytes_limit: int,
-) -> Sequence[Sequence[str]]:
-  """Returns the stack groups for the tables based on their specs."""
-  original_table_names = set(flatten_tables.keys())
-
+) -> list[list[str]]:
+  """Groups table names by padded dimension, optimizer, and combiner."""
   table_to_padded_dim, _ = round_up_dim_and_vocab_size(flatten_tables, num_sc)
   table_name_map = collections.defaultdict(list)
   for table_name, dim in table_to_padded_dim.items():
@@ -391,9 +387,15 @@ def _get_stack_table_names(
         flatten_tables[table_name].combiner,
     )
     table_name_map[key].append(table_name)
+  return list(table_name_map.values())
 
-  groups = list(table_name_map.values())
 
+def _calculate_activation_memory_metrics(
+    num_sc: int,
+    flatten_tables: Mapping[str, embedding_spec.TableSpec],
+    flatten_features: Sequence[embedding_spec.FeatureSpec],
+) -> tuple[Mapping[str, int], Mapping[str, int]]:
+  """Calculates sample count and activation memory bytes per table."""
   # Calculate sample_count per sparsecore for each table.
   table_to_sample_count = collections.defaultdict(int)
   for feature in flatten_features:
@@ -402,11 +404,52 @@ def _get_stack_table_names(
     )
 
   # Calculate and register the activation memory usage of this table.
+  table_to_padded_dim, _ = round_up_dim_and_vocab_size(flatten_tables, num_sc)
   table_to_activation_mem_bytes = {
       tname: table_to_padded_dim[tname] * table_to_sample_count[tname] * 4
       for tname in flatten_tables.keys()
   }
+  return table_to_sample_count, table_to_activation_mem_bytes
+
+
+def _get_stack_table_names(
+    num_sc: int,
+    flatten_tables: Mapping[str, embedding_spec.TableSpec],
+    flatten_features: Sequence[embedding_spec.FeatureSpec],
+    activation_mem_bytes_limit: int,
+) -> Sequence[Sequence[str]]:
+  """Returns the stack groups for the tables based on their specs."""
+  original_table_names = set(flatten_tables.keys())
+
+  groups = _group_tables_for_stacking(num_sc, flatten_tables)
+
+  _, table_to_activation_mem_bytes = _calculate_activation_memory_metrics(
+      num_sc, flatten_tables, flatten_features
+  )
+
+  validated_groups = _split_groups_by_memory_limit(
+      groups, table_to_activation_mem_bytes, activation_mem_bytes_limit
+  )
+
+  grouped_table_names = set()
+  for group in validated_groups:
+    grouped_table_names.update(group)
+
+  if original_table_names != grouped_table_names:
+    raise ValueError(
+        "Table names are not grouped correctly. Original table names:"
+        f" {original_table_names}, grouped table names: {grouped_table_names}"
+    )
+
+  return validated_groups
 
+
+def _split_groups_by_memory_limit(
+    groups: list[list[str]],
+    table_to_activation_mem_bytes: Mapping[str, int],
+    activation_mem_bytes_limit: int,
+) -> list[list[str]]:
+  """Splits table groups to respect the activation memory limit."""
   validated_groups = []
   for group in groups:
     # A list of groups that are split from the current group.
@@ -446,17 +489,6 @@ def _get_stack_table_names(
     )
     # Add into the validated groups.
     validated_groups.extend(split_groups)
-
-  grouped_table_names = set()
-  for group in validated_groups:
-    grouped_table_names.update(group)
-
-  if original_table_names != grouped_table_names:
-    raise ValueError(
-        "Table names are not grouped correctly. Original table names:"
-        f" {original_table_names}, grouped table names: {grouped_table_names}"
-    )
-
   return validated_groups
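The greedy loop inside `_split_groups_by_memory_limit` falls between the last two hunks and is mostly elided above. As a rough sketch only — behavior inferred from the function's signature here and from the parameterized cases added in the test file below, not the library's actual implementation — the splitting amounts to a greedy scan over each group. The stand-in name `greedy_split_by_memory_limit` below is made up for illustration.

from collections.abc import Mapping


def greedy_split_by_memory_limit(
    groups: list[list[str]],
    table_to_activation_mem_bytes: Mapping[str, int],
    activation_mem_bytes_limit: int,
) -> list[list[str]]:
  """Sketch of a greedy split; NOT the actual _split_groups_by_memory_limit."""
  validated_groups = []
  for group in groups:
    current: list[str] = []
    current_bytes = 0
    for table_name in group:
      table_bytes = table_to_activation_mem_bytes[table_name]
      if current and current_bytes + table_bytes > activation_mem_bytes_limit:
        # Adding this table would exceed the limit: close the current sub-group.
        validated_groups.append(current)
        current, current_bytes = [], 0
      # A table that alone exceeds the limit still gets its own sub-group,
      # matching the all-60-bytes / limit=50 test case below.
      current.append(table_name)
      current_bytes += table_bytes
    if current:
      validated_groups.append(current)
  return validated_groups

The twelve parameterized cases added in the test file below all produce the same outputs under this sketch, though the real implementation may differ in details the tests do not cover (for example, any warning or logging around oversized tables).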

jax_tpu_embedding/sparsecore/lib/nn/tests/table_stacking_test.py

Lines changed: 82 additions & 0 deletions
@@ -813,6 +813,88 @@ def get_feature_specs() -> list[embedding_spec.FeatureSpec]:
         num_sc_per_device=self.num_sc_per_device,
     )
 
+  @parameterized.parameters(
+      dict(
+          groups=[['a', 'b', 'c']],
+          table_to_mem={'a': 10, 'b': 20, 'c': 30},
+          limit=100,
+          expected=[['a', 'b', 'c']],
+      ),
+      dict(
+          groups=[['a', 'b', 'c']],
+          table_to_mem={'a': 10, 'b': 20, 'c': 30},
+          limit=30,
+          expected=[['a', 'b'], ['c']],
+      ),
+      dict(
+          groups=[['a', 'b', 'c']],
+          table_to_mem={'a': 10, 'b': 20, 'c': 30},
+          limit=35,
+          expected=[['a', 'b'], ['c']],
+      ),
+      dict(
+          groups=[['a', 'b', 'c', 'd']],
+          table_to_mem={'a': 10, 'b': 10, 'c': 10, 'd': 10},
+          limit=25,
+          expected=[['a', 'b'], ['c', 'd']],
+      ),
+      dict(
+          groups=[['a'], ['b', 'c']],
+          table_to_mem={'a': 10, 'b': 20, 'c': 30},
+          limit=35,
+          expected=[['a'], ['b'], ['c']],
+      ),
+      dict(
+          groups=[['a', 'b'], ['c', 'd']],
+          table_to_mem={'a': 10, 'b': 20, 'c': 5, 'd': 5},
+          limit=30,
+          expected=[['a', 'b'], ['c', 'd']],
+      ),
+      dict(
+          groups=[['a', 'b', 'c']],
+          table_to_mem={'a': 60, 'b': 60, 'c': 60},
+          limit=50,
+          expected=[['a'], ['b'], ['c']],
+      ),
+      dict(
+          groups=[['a', 'b', 'c']],
+          table_to_mem={'a': 10, 'b': 20, 'c': 30},
+          limit=60,
+          expected=[['a', 'b', 'c']],
+      ),
+      dict(
+          groups=[['a', 'b', 'c']],
+          table_to_mem={'a': 10, 'b': 20, 'c': 30},
+          limit=40,
+          expected=[['a', 'b'], ['c']],
+      ),
+      dict(
+          groups=[['a', 'b'], ['c']],
+          table_to_mem={'a': 10, 'b': 20, 'c': 30},
+          limit=30,
+          expected=[['a', 'b'], ['c']],
+      ),
+      dict(
+          groups=[['a', 'b'], ['c', 'd']],
+          table_to_mem={'a': 10, 'b': 15, 'c': 20, 'd': 25},
+          limit=30,
+          expected=[['a', 'b'], ['c'], ['d']],
+      ),
+      dict(
+          groups=[],
+          table_to_mem={'a': 10},
+          limit=100,
+          expected=[],
+      ),
+  )
+  def test_split_groups_by_memory_limit(
+      self, groups, table_to_mem, limit, expected
+  ):
+    result = table_stacking._split_groups_by_memory_limit(
+        groups, table_to_mem, limit
+    )
+    self.assertEqual(result, expected)
+
   @parameterized.product(
       donate=[True, False],
       device_count=[1, 2, 4, -1],
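As a quick interactive check of one of these cases (hedged: this assumes `table_stacking` is importable from `jax_tpu_embedding.sparsecore.lib.nn`, as the test module does, and it calls the private helper directly):

from jax_tpu_embedding.sparsecore.lib.nn import table_stacking

# Mirrors one parameterized case above: four 10-byte tables with a
# 25-byte activation memory limit are expected to split into pairs.
result = table_stacking._split_groups_by_memory_limit(
    [['a', 'b', 'c', 'd']],
    {'a': 10, 'b': 10, 'c': 10, 'd': 10},
    25,
)
print(result)  # Expected, per the test case above: [['a', 'b'], ['c', 'd']]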
