File size: 312 Bytes
401522d |
1 2 3 4 5 6 |
# Bind the names below into this module's namespace from sibling modules.
# These are explicit relative imports, so this file must be loaded as part of
# a package (running it as a standalone script would fail to resolve them).
# NOTE(review): presumably this is the package's __init__ and these names are
# its intended public re-exports — confirm. No __all__ is declared in the
# visible lines, so a star-import of this module would also expose the
# submodule names themselves.
# NOTE(review): the import order is kept as-is; the sibling modules are not
# visible here, so any import-time side effects they have cannot be ruled out.
from .quantizer import Quantizer
from .fused_attn import QuantLlamaAttention, make_quant_attn
from .fused_mlp import QuantLlamaMLP, make_fused_mlp, autotune_warmup_fused
from .quant_linear import QuantLinear, make_quant_linear, autotune_warmup_linear
from .triton_norm import TritonLlamaRMSNorm, make_quant_norm
|