File size: 1,212 Bytes
174ae06
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# Copyright (c) 2025 NVIDIA CORPORATION.
# Licensed under the MIT license.

# Adapted from https://github.com/NVlabs/VILA/tree/main under the Apache 2.0 license.
# LICENSE is in incl_licenses directory.

# Utils and add (the GELU/SiLU activation kernels are imported further below)
from ._dequantize import fp8_dequantize
from ._division import fp8_division
from ._division_transpose import fp8_division_transpose
from ._quantize import fp8_quantize
from ._quantize_pertensor import fp8_quantize_pertensor
from ._quantize_pertensor_transpose import fp8_quantize_pertensor_transpose
from ._transpose import fp8_transpose
from .add_bwd import fp8_add_Ifp_Ifp_Ofp_Opt
from .add_fwd import fp8_add_Ifp_Ifp_Ofp_Og16

# Normalization, quantize helpers, and GELU activation
from .func_layernorm_noparam import fp8_layernorm_noparam_backward, fp8_layernorm_noparam_forward
from .func_quantize import Coat_quantize_bgn, Coat_quantize_end
from .func_rmsnorm import fp8_rmsnorm_backward, fp8_rmsnorm_forward
from .gelu_bwd import fp8_gelu_backward
from .gelu_fwd import fp8_gelu_forward

# Linear, mul, and SiLU activation (the add kernels are imported in the first group above)
from .linear import fp8_linear_backward, fp8_linear_forward
from .mul_bwd import fp8_mul_backward
from .mul_fwd import fp8_mul_forward
from .silu_bwd import fp8_silu_backward
from .silu_fwd import fp8_silu_forward