Add OptimType.NONE in SplitTBE (defuse bwd and optim) (#1819)

Summary:
Pull Request resolved: #1819

This diff is the **backend** part.

This diff introduces `OptimType.NONE`. Unlike other `OptimType`s, `OptimType.NONE` does not perform the optimizer step during SplitTBE's backward pass. With `OptimType.NONE`, SplitTBE deduplicates output gradients in the backward pass and generates a sparse gradient tensor (PyTorch's `sparse_coo_tensor`) for the device's weight (FQN: `weights_dev`).

**Limitation**: Currently, `OptimType.NONE` only supports the case where the embedding dimensions of all embedding tables are identical.

Reviewed By: jianyuh
Differential Revision: D44392172
fbshipit-source-id: bf1e0d9d15632c3f34909cc736af6e9ca4593686
pytorch · Jun 12, 2023 · edc57b1 · edc57b1
1 parent 46c764b
commit edc57b1
Show file tree

Hide file tree

Showing 9 changed files with 381 additions and 182 deletions.
diff --git a/fbgemm_gpu/CMakeLists.txt b/fbgemm_gpu/CMakeLists.txt
@@ -183,7 +183,8 @@ set(GPU_ONLY_OPTIMIZERS
   partial_rowwise_lamb
   lars_sgd
   rowwise_adagrad_with_weight_decay
-  approx_rowwise_adagrad_with_weight_decay)
+  approx_rowwise_adagrad_with_weight_decay
+  none)
 
 set(DEPRECATED_OPTIMIZERS
   approx_sgd

diff --git a/fbgemm_gpu/codegen/embedding_backward_code_generator.py b/fbgemm_gpu/codegen/embedding_backward_code_generator.py
@@ -1641,6 +1641,23 @@ def backward_dense() -> None:
     )
 
 
+def none_optimizer() -> None:
+    generate(
+        optimizer="none",
+        dense=False,
+        args=make_args(
+            [
+                (INT, "total_hash_size"),
+                (INT, "total_unique_indices"),
+            ]
+        ),
+        # Generate only GPU code
+        has_cpu_support=False,
+        has_gpu_support=True,
+        has_vbe_support=False,
+    )
+
+
 def gen__init__py() -> None:
     template = env.get_template("__init__.template")
     src_py = template.render()
@@ -1670,6 +1687,8 @@ def emb_codegen(
     rowwise_adagrad_with_counter()
     rowwise_weighted_adagrad()
     sgd()
+    none_optimizer()
+
     gen__init__py()