|
@@ -186,7 +186,7 @@ struct llama_hparams {
|
|
|
// LLaMAv2
|
|
// LLaMAv2
|
|
|
// TODO: load from model data hparams
|
|
// TODO: load from model data hparams
|
|
|
float f_ffn_mult = 1.0f;
|
|
float f_ffn_mult = 1.0f;
|
|
|
- float f_rms_norm_eps = 1e-6f;
|
|
|
|
|
|
|
+ float f_rms_norm_eps = LLAMA_DEFAULT_RMS_EPS;
|
|
|
|
|
|
|
|
float rope_freq_base = 10000.0f;
|
|
float rope_freq_base = 10000.0f;
|
|
|
float rope_freq_scale = 1.0f;
|
|
float rope_freq_scale = 1.0f;
|
|
@@ -870,7 +870,7 @@ struct llama_context_params llama_context_default_params() {
|
|
|
/*.n_ctx =*/ 512,
|
|
/*.n_ctx =*/ 512,
|
|
|
/*.n_batch =*/ 512,
|
|
/*.n_batch =*/ 512,
|
|
|
/*.n_gqa =*/ 1,
|
|
/*.n_gqa =*/ 1,
|
|
|
- /*.rms_norm_eps =*/ 1e-6f,
|
|
|
|
|
|
|
+ /*.rms_norm_eps =*/ LLAMA_DEFAULT_RMS_EPS,
|
|
|
/*.gpu_layers =*/ 0,
|
|
/*.gpu_layers =*/ 0,
|
|
|
/*.main_gpu =*/ 0,
|
|
/*.main_gpu =*/ 0,
|
|
|
/*.tensor_split =*/ nullptr,
|
|
/*.tensor_split =*/ nullptr,
|