# Build configuration for the "rwkv" kernel package.
# NOTE(review): the table/key names below look like the schema of a
# Torch/CUDA kernel build tool -- confirm against that tool's documentation.

[general]
# Package name.
name = "rwkv"
# NOTE(review): presumably marks this as a compiled (not pure-Python) kernel --
# confirm the exact meaning of `universal` with the build tool.
universal = false

[torch]
# Source file(s) listed for the Torch extension.
src = [
    "torch-ext/torch_binding.cpp",
]

[kernel.rwkv]
depends = ["torch"]
backend = "cuda"
# CUDA compute capabilities listed for this kernel.
cuda-capabilities = [
    "8.0",
    "8.9",
    "9.0",
    "10.0",
    "12.0",
]
include = ["."]
# CUDA sources for this kernel.
src = [
    "rwkv/wkv_cuda.cu",
    "rwkv/wkv_cuda_bf16.cu",
]
# Extra compiler flags; presumably handed to nvcc -- verify with the build tool.
# `-DTmax=1024` defines the preprocessor macro `Tmax` as 1024; what it bounds
# is decided by the kernel sources, which are not visible from this file.
cuda-flags = [
    "-res-usage",
    "--use_fast_math",
    "-O3",
    "--extra-device-vectorization",
    "-DTmax=1024",
]