Explorar o código

llama : have n_batch default to 512 (#1091)

* set default n_batch to 512 when using BLAS

* spacing

* alternate implementation of setting different n_batch for BLAS

* set n_batch to 512 for all cases
eiery hai 2 anos
pai
achega
10f19c1121
Modificouse 1 ficheiro con 1 adición e 1 borrado
  1. examples/common.h (+1 −1)

+ 1 - 1
examples/common.h

@@ -20,7 +20,7 @@ struct gpt_params {
     int32_t repeat_last_n = 64;   // last n tokens to penalize
     int32_t n_parts       = -1;   // amount of model parts (-1 = determine from model dimensions)
     int32_t n_ctx         = 512;  // context size
-    int32_t n_batch       = 8;    // batch size for prompt processing
+    int32_t n_batch       = 512;  // batch size for prompt processing (must be >=32 to use BLAS)
     int32_t n_keep        = 0;    // number of tokens to keep from initial prompt

     // sampling parameters