kernel
File size: 789 Bytes
2595c46
 
 
 
 
 
 
 
 
 
 
 
9c4ca75
 
 
 
 
 
 
 
 
 
 
6756875
 
9c4ca75
 
2595c46
 
 
 
 
 
 
 
 
 
 
3224250
 
 
 
2595c46
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
# Package-level settings for this kernel build.
[general]
# Package name; the same identifier is used for the [kernel.megablocks] table
# in this file.
name = "megablocks"
# NOTE(review): presumably marks whether the package is a "universal" kernel
# with no compiled code — confirm against the builder documentation. A value of
# false is consistent with the CUDA sources declared under [kernel.megablocks].
universal = false

# Torch extension binding sources: the C++ binding file and its header.
[torch]
src = [
    "torch-ext/torch_binding.cpp",
    "torch-ext/torch_binding.h",
]

# Build definition for the "megablocks" kernel component.
[kernel.megablocks]
backend = "cuda"
# CUDA capabilities listed for this kernel (the key name suggests these are
# GPU compute-capability targets).
# NOTE(review): "11.8" does not look like an NVIDIA compute capability — it
# matches a CUDA toolkit version number instead. Confirm whether it is
# intentional, should be removed, or was meant to be a different architecture.
cuda-capabilities = [
    "7.0",
    "7.2",
    "7.5",
    "8.0",
    "8.6",
    "8.7",
    "8.9",
    "9.0",
    "10.0",
    "10.1",
    "11.8",
    "12.0"
]
# NOTE(review): "cutlass_3_8" presumably selects CUTLASS 3.8, needed by the
# vendored grouped GEMM sources listed in `src` — confirm against the builder's
# list of supported dependencies.
depends = ["torch", "cutlass_3_8"]
# Headers and CUDA translation units compiled into this kernel.
src = [
    "csrc/new_cumsum.h",
    "csrc/new_cumsum.cu",
    "csrc/new_histogram.h",
    "csrc/new_histogram.cu",
    "csrc/new_indices.h",
    "csrc/new_indices.cu",
    "csrc/new_replicate.cu",
    "csrc/new_replicate.h",
    "csrc/new_sort.h",
    "csrc/new_sort.cu",
    # Vendored grouped GEMM implementation.
    "csrc/grouped_gemm/fill_arguments.cuh",
    "csrc/grouped_gemm/grouped_gemm.cu",
    "csrc/grouped_gemm/grouped_gemm.h",
]