Spaces: Running on A100
// Declaration of the FP8 AdamW optimizer step. Only the prototype is visible
// here; the definition lives elsewhere.
//
// The function returns void, so results are presumably written into the
// tensor arguments in place -- TODO confirm against the implementation.
//
// NOTE(review): the roles given below for the scale tensors, the scalar
// hyperparameters and qgroup_size are inferred from their names only; verify
// them against the definition before relying on them.
void FP8_AdamW(torch::Tensor params,            // parameter
               torch::Tensor grads,             // gradient
               torch::Tensor exp_avg,           // first order momentum
               torch::Tensor scale_exp_avg,     // presumably scale factors for exp_avg -- TODO confirm
               torch::Tensor exp_avg_sq,        // second order momentum
               torch::Tensor scale_exp_avg_sq,  // presumably scale factors for exp_avg_sq -- TODO confirm
               float beta1, float beta2,        // presumably the momentum decay rates
               float lr, float wd, float eps,   // presumably learning rate, weight decay, epsilon
               int step,                        // presumably the current optimizer step count
               int qgroup_size);                // presumably the quantization group size