Infinite generation via context swapping (#71)

2025-08-18 05:56:00 -04:00 · 2023-03-25 21:36:22 +02:00
parent 03f7e33560
commit e2d490dafd
4 changed files with 100 additions and 40 deletions
--- a/examples/common.h
+++ b/examples/common.h
@@ -21,6 +21,7 @@ struct gpt_params {
    int32_t n_parts       = -1;   // amount of model parts (-1 = determine from model dimensions)
    int32_t n_ctx         = 512;  // context size
    int32_t n_batch       = 8;    // batch size for prompt processing
+    int32_t n_keep        = 0;    // number of tokens to keep from initial prompt

    // sampling parameters
    int32_t top_k = 40;