6 months ago · 86f5623d90
--- a/src/llama-model.cpp
+++ b/src/llama-model.cpp
@@ -646,6 +646,9 @@ void llama_model::load_hparams(llama_model_loader & ml) {
 
				                 ml.get_key(LLM_KV_RESIDUAL_SCALE,              hparams.f_residual_scale);
			
 
				                 ml.get_key(LLM_KV_LOGIT_SCALE,                 hparams.f_logit_scale);
			
 
				 
			
 
				+                // MiniCPM always applies RoPE, unlike Granite, which uses rope_finetuned as a switch for it
			
 
				+                hparams.rope_finetuned = true;
			
 
				+
			
 
				                 switch (hparams.n_layer) {
			
 
				                     case 52: type = LLM_TYPE_1B; break;
			
 
				                     case 40: type = LLM_TYPE_2B; break;