Add heuristic for max ids of stacked tables.

hertschuh · hertschuh · commit b27a31d58799 · 2025-10-29T14:06:03.000-07:00
Propagate the `max_ids_per_partition` and `max_unique_ids_per_partition` from `TableSpec`s to `StackedTableSpec`s by taking the max from the stacked tables.
diff --git a/keras_rs/src/layers/embedding/jax/distributed_embedding.py b/keras_rs/src/layers/embedding/jax/distributed_embedding.py
@@ -1,5 +1,7 @@
 """JAX implementation of the TPU embedding layer."""
 
+import collections
+import dataclasses
 import math
 import typing
 from typing import Any, Mapping, Sequence, Union
@@ -445,6 +447,30 @@ def sparsecore_build(
         table_specs = embedding.get_table_specs(feature_specs)
         table_stacks = jte_table_stacking.get_table_stacks(table_specs)
 
+        # Create new instances of StackedTableSpec with updated values that are
+        # the maximum from stacked tables.
+        stacked_table_specs = embedding.get_stacked_table_specs(feature_specs)
+        stacked_table_specs = {
+            stack_name: dataclasses.replace(
+                stacked_table_spec,
+                max_ids_per_partition=max(
+                    table.max_ids_per_partition
+                    for table in table_stacks[stack_name]
+                ),
+                max_unique_ids_per_partition=max(
+                    table.max_unique_ids_per_partition
+                    for table in table_stacks[stack_name]
+                ),
+            )
+            for stack_name, stacked_table_spec in stacked_table_specs.items()
+        }
+
+        # Rewrite the stacked_table_spec in all TableSpecs.
+        for stack_name, table_specs in table_stacks.items():
+            stacked_table_spec = stacked_table_specs[stack_name]
+            for table_spec in table_specs:
+                table_spec.stacked_table_spec = stacked_table_spec
+
         # Create variables for all stacked tables and slot variables.
         with sparsecore_distribution.scope():
             self._table_and_slot_variables = {