mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-07-25 04:02:50 +00:00
scripts: benchmark for HTTP server throughput (#14668)
* scripts: benchmark for HTTP server throughput * fix server connection reset
This commit is contained in:
@ -11,6 +11,8 @@
|
||||
|
||||
// increase max payload length to allow use of larger context size
|
||||
#define CPPHTTPLIB_FORM_URL_ENCODED_PAYLOAD_MAX_LENGTH 1048576
|
||||
// increase backlog size to avoid connection resets for >> 1 slots
|
||||
#define CPPHTTPLIB_LISTEN_BACKLOG 512
|
||||
// disable Nagle's algorithm
|
||||
#define CPPHTTPLIB_TCP_NODELAY true
|
||||
#include <cpp-httplib/httplib.h>
|
||||
|
Reference in New Issue
Block a user