fix: vendor stk decorators

Files changed (7) hide show

torch-ext/megablocks/ops/binned_gather.py CHANGED Viewed

@@ -3,7 +3,7 @@
 from typing import Any
 import torch
-from stk.backend.autocast import custom_bwd, custom_fwd
 from ..backend import kernels

 from typing import Any
 import torch
+from .stk_autocast import custom_bwd, custom_fwd
 from ..backend import kernels

torch-ext/megablocks/ops/binned_scatter.py CHANGED Viewed

@@ -3,7 +3,7 @@
 from typing import Any
 import torch
-from stk.backend.autocast import custom_bwd, custom_fwd
 from ..backend import kernels

 from typing import Any
 import torch
+from .stk_autocast import custom_bwd, custom_fwd
 from ..backend import kernels

torch-ext/megablocks/ops/gather.py CHANGED Viewed

@@ -3,7 +3,7 @@
 from typing import Any
 import torch
-from stk.backend.autocast import custom_bwd, custom_fwd
 from ..backend import kernels

 from typing import Any
 import torch
+from .stk_autocast import custom_bwd, custom_fwd
 from ..backend import kernels

torch-ext/megablocks/ops/padded_gather.py CHANGED Viewed

@@ -3,7 +3,7 @@
 from typing import Any
 import torch
-from stk.backend.autocast import custom_bwd, custom_fwd
 from ..backend import kernels

 from typing import Any
 import torch
+from .stk_autocast import custom_bwd, custom_fwd
 from ..backend import kernels

torch-ext/megablocks/ops/padded_scatter.py CHANGED Viewed

@@ -3,7 +3,7 @@
 from typing import Any
 import torch
-from stk.backend.autocast import custom_bwd, custom_fwd
 from ..backend import kernels

 from typing import Any
 import torch
+from .stk_autocast import custom_bwd, custom_fwd
 from ..backend import kernels

torch-ext/megablocks/ops/scatter.py CHANGED Viewed

@@ -4,7 +4,7 @@
 from typing import Any, Optional
 import torch
-from stk.backend.autocast import custom_bwd, custom_fwd
 from ..backend import kernels

 from typing import Any, Optional
 import torch
+from .stk_autocast import custom_bwd, custom_fwd
 from ..backend import kernels

torch-ext/megablocks/ops/stk_autocast.py ADDED Viewed

+# vendored from
+# https://github.com/stanford-futuredata/stk/blob/736313768ef697ce13a0594a41b2512a0fbc9884/stk/backend/autocast.py
+import functools
+import torch
+def _is_eligible(x):
+    """Return True when tensor ``x`` should be cast to the autocast dtype.
+
+    A tensor qualifies only if it is floating point, lives on a CUDA device,
+    and is not ``torch.float64``.
+    """
+    if not x.is_floating_point():
+        return False
+    if not x.is_cuda:
+        return False
+    # float64 tensors are deliberately left at full precision.
+    return x.dtype is not torch.float64
+def _cast(x, dtype):
+    """Recursively cast eligible tensors nested inside ``x`` to ``dtype``.
+
+    Args:
+        x: A tensor, a dict, a list/tuple, or any other object.
+        dtype: Target dtype passed to ``Tensor.to`` for eligible tensors.
+
+    Returns:
+        * a tensor for which ``_is_eligible`` is true -> ``x.to(dtype)``;
+        * a dict -> a new dict with both keys and values cast recursively;
+        * a list/tuple -> a new container of the same type with every
+          element cast recursively;
+        * anything else (including ineligible tensors) -> ``x`` unchanged.
+    """
+    if isinstance(x, torch.Tensor) and _is_eligible(x):
+        return x.to(dtype)
+    # Bug fix: the vendored code tested ``isinstance(x, map)``. ``map`` is the
+    # builtin iterator type, not a mapping, so dicts (notably the ``kwargs``
+    # handed over by ``custom_fwd``) were returned uncast, and a real ``map``
+    # object would have crashed on ``.items()``.
+    if isinstance(x, dict):
+        return {_cast(k, dtype): _cast(v, dtype) for k, v in x.items()}
+    if isinstance(x, (list, tuple)):
+        return type(x)(_cast(item, dtype) for item in x)
+    return x
+def custom_fwd(fwd):
+    """Decorate a custom autograd forward so it runs in the autocast dtype.
+
+    When ``torch.is_autocast_enabled()`` is true, the positional and keyword
+    arguments are passed through ``_cast`` with the dtype reported by
+    ``torch.get_autocast_gpu_dtype()``, and ``fwd`` is invoked with CUDA
+    autocast disabled. Otherwise ``fwd`` is called with its arguments
+    untouched.
+
+    Args:
+        fwd: The forward function to wrap.
+
+    Returns:
+        The wrapped function, carrying ``fwd``'s metadata via
+        ``functools.wraps``.
+    """
+    @functools.wraps(fwd)
+    def decorate_fwd(*args, **kwargs):
+        # Fast path: autocast is off, so nothing needs casting.
+        if not torch.is_autocast_enabled():
+            return fwd(*args, **kwargs)
+        # Disable autocast inside fwd; the inputs are cast explicitly instead.
+        with torch.autocast(device_type="cuda", enabled=False):
+            target_dtype = torch.get_autocast_gpu_dtype()
+            cast_args = _cast(args, target_dtype)
+            cast_kwargs = _cast(kwargs, target_dtype)
+            return fwd(*cast_args, **cast_kwargs)
+    return decorate_fwd
+def custom_bwd(bwd):
+    """Decorate a custom autograd backward so it runs with CUDA autocast off.
+
+    Args:
+        bwd: The backward function to wrap.
+
+    Returns:
+        The wrapped function, carrying ``bwd``'s metadata via
+        ``functools.wraps``. Arguments and the return value are forwarded
+        unchanged.
+    """
+    @functools.wraps(bwd)
+    def decorate_bwd(*args, **kwargs):
+        autocast_off = torch.autocast(device_type="cuda", enabled=False)
+        with autocast_off:
+            return bwd(*args, **kwargs)
+    return decorate_bwd