added ctx_size parameter (#148)

* added ctx_size parameter
* added it in more places
* Apply suggestions from code review

---------

Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
2025-07-02 05:15:47 +00:00 · 2023-03-15 15:42:40 -04:00
parent 16b2c61a22
commit 2d64715ad4
3 changed files with 8 additions and 3 deletions
--- a/utils.h
+++ b/utils.h
@@ -17,7 +17,8 @@ struct gpt_params {
    int32_t n_threads = std::min(4, (int32_t) std::thread::hardware_concurrency());
    int32_t n_predict = 128; // new tokens to predict
    int32_t repeat_last_n = 64;  // last n tokens to penalize
-
+    int32_t n_ctx = 512; //context size
+    
    // sampling parameters
    int32_t top_k = 40;
    float   top_p = 0.95f;