diff --git a/include/infinicore/nn/linear.hpp b/include/infinicore/nn/linear.hpp
index 667a980fa..89a832ceb 100644
--- a/include/infinicore/nn/linear.hpp
+++ b/include/infinicore/nn/linear.hpp
@@ -35,6 +35,9 @@ class BaseLinear : public Module {
     Tensor weight_scale() const { return weight_scale_; }
     Tensor weight_zeros() const { return weight_zeros_; }
 
+    // Returns quantization_ by value; the return type is deduced from that member's declaration.
+    auto get_quantization() const { return quantization_; }
+
 protected:
     // Parameters
     INFINICORE_NN_PARAMETER(weight);