|
|
@@ -17530,6 +17530,8 @@ static void llama_model_quantize_internal(const std::string & fname_inp, const s
|
|
|
quantize &= name.find("time_mix_first.weight") == std::string::npos;
|
|
|
quantize &= name.find("time_mix_w1.weight") == std::string::npos;
|
|
|
quantize &= name.find("time_mix_w2.weight") == std::string::npos;
|
|
|
+ quantize &= name.find("time_mix_decay_w1.weight") == std::string::npos;
|
|
|
+ quantize &= name.find("time_mix_decay_w2.weight") == std::string::npos;
|
|
|
|
|
|
// do not quantize relative position bias (T5)
|
|
|
quantize &= name.find("attn_rel_b.weight") == std::string::npos;
|