2025-05-25 01:48:08 +01:00
# include "chat-parser.h"
# include "common.h"
# include "log.h"
# include "regex-partial.h"
# include <optional>
# include <stdexcept>
# include <string>
# include <vector>
using json = nlohmann : : ordered_json ;
common_chat_msg_parser : : common_chat_msg_parser ( const std : : string & input , bool is_partial , const common_chat_syntax & syntax )
: input_ ( input ) , is_partial_ ( is_partial ) , syntax_ ( syntax )
{
result_ . role = " assistant " ;
while ( true ) {
std : : string id = std : : to_string ( std : : rand ( ) ) ;
if ( input . find ( id ) = = std : : string : : npos ) {
healing_marker_ = id ;
break ;
}
}
}
std : : string common_chat_msg_parser : : str ( const common_string_range & rng ) const {
GGML_ASSERT ( rng . begin < = rng . end ) ;
return input_ . substr ( rng . begin , rng . end - rng . begin ) ;
}
void common_chat_msg_parser : : add_content ( const std : : string & content ) {
result_ . content + = content ;
}
void common_chat_msg_parser : : add_reasoning_content ( const std : : string & reasoning_content ) {
result_ . reasoning_content + = reasoning_content ;
}
bool common_chat_msg_parser : : add_tool_call ( const std : : string & name , const std : : string & id , const std : : string & arguments ) {
if ( name . empty ( ) ) {
return false ;
}
common_chat_tool_call tool_call ;
tool_call . name = name ;
tool_call . arguments = arguments ;
tool_call . id = id ;
// LOG_DBG("Tool call arguments:\n\traw: %s\n\tresult: %s\n", arguments.c_str(), tool_call.arguments.c_str());
result_ . tool_calls . emplace_back ( tool_call ) ;
return true ;
}
bool common_chat_msg_parser : : add_tool_call ( const json & tool_call ) {
std : : string name = tool_call . contains ( " name " ) ? tool_call . at ( " name " ) : " " ;
std : : string id = tool_call . contains ( " id " ) ? tool_call . at ( " id " ) : " " ;
std : : string arguments = tool_call . contains ( " arguments " ) ? tool_call . at ( " arguments " ) : " " ;
return add_tool_call ( name , id , arguments ) ;
}
bool common_chat_msg_parser : : add_tool_calls ( const json & arr ) {
for ( const auto & item : arr ) {
if ( ! add_tool_call ( item ) ) {
return false ;
}
}
return true ;
}
void common_chat_msg_parser : : finish ( ) {
if ( ! is_partial_ & & pos_ ! = input_ . size ( ) ) {
throw std : : runtime_error ( " Unexpected content at end of input " ) ; // + input_.substr(pos_));
}
}
bool common_chat_msg_parser : : consume_spaces ( ) {
const auto length = input_ . size ( ) ;
auto consumed = false ;
while ( pos_ < length & & std : : isspace ( input_ [ pos_ ] ) ) {
+ + pos_ ;
consumed = true ;
}
return consumed ;
}
bool common_chat_msg_parser : : try_consume_literal ( const std : : string & literal ) {
auto pos = pos_ ;
for ( auto i = 0u ; i < literal . size ( ) ; + + i ) {
if ( pos > = input_ . size ( ) ) {
return false ;
}
if ( input_ [ pos ] ! = literal [ i ] ) {
return false ;
}
+ + pos ;
}
pos_ = pos ;
return true ;
}
std : : optional < common_chat_msg_parser : : find_regex_result > common_chat_msg_parser : : try_find_literal ( const std : : string & literal ) {
auto idx = input_ . find ( literal , pos_ ) ;
if ( idx ! = std : : string : : npos ) {
find_regex_result res ;
res . prelude = input_ . substr ( pos_ , idx - pos_ ) ;
auto end = idx + literal . size ( ) ;
res . groups . emplace_back ( common_string_range { idx , end } ) ;
move_to ( end ) ;
return res ;
}
if ( is_partial_ ) {
idx = string_find_partial_stop ( input_ , literal ) ;
if ( idx ! = std : : string : : npos & & idx > = pos_ ) {
find_regex_result res ;
res . prelude = input_ . substr ( pos_ , idx - pos_ ) ;
auto end = input_ . size ( ) ;
res . groups . emplace_back ( common_string_range { idx , end } ) ;
move_to ( end ) ;
return res ;
}
}
return std : : nullopt ;
}
void common_chat_msg_parser : : consume_literal ( const std : : string & literal ) {
if ( ! try_consume_literal ( literal ) ) {
throw common_chat_msg_partial_exception ( literal ) ;
}
}
bool common_chat_msg_parser : : try_parse_reasoning ( const std : : string & start_think , const std : : string & end_think ) {
auto handle_reasoning = [ & ] ( const std : : string & reasoning , bool closed ) {
auto stripped_reasoning = string_strip ( reasoning ) ;
if ( stripped_reasoning . empty ( ) ) {
return ;
}
if ( syntax_ . reasoning_in_content ) {
add_content ( syntax_ . reasoning_format = = COMMON_REASONING_FORMAT_DEEPSEEK ? " <think> " : start_think ) ;
add_content ( stripped_reasoning ) ;
if ( closed ) {
add_content ( syntax_ . reasoning_format = = COMMON_REASONING_FORMAT_DEEPSEEK ? " </think> " : end_think ) ;
}
} else {
add_reasoning_content ( stripped_reasoning ) ;
}
} ;
if ( syntax_ . reasoning_format ! = COMMON_REASONING_FORMAT_NONE ) {
if ( syntax_ . thinking_forced_open | | try_consume_literal ( start_think ) ) {
if ( auto res = try_find_literal ( end_think ) ) {
handle_reasoning ( res - > prelude , /* closed */ true ) ;
consume_spaces ( ) ;
return true ;
}
auto rest = consume_rest ( ) ;
if ( ! rest . empty ( ) ) {
handle_reasoning ( rest , /* closed */ ! is_partial ( ) ) ;
}
2025-05-31 08:26:10 -07:00
// Allow unclosed thinking tags, for now (https://github.com/ggml-org/llama.cpp/issues/13812, https://github.com/ggml-org/llama.cpp/issues/13877)
// if (!syntax_.thinking_forced_open) {
// throw common_chat_msg_partial_exception(end_think);
// }
2025-05-25 01:48:08 +01:00
return true ;
}
}
return false ;
}
std : : string common_chat_msg_parser : : consume_rest ( ) {
auto rest = input_ . substr ( pos_ ) ;
pos_ = input_ . size ( ) ;
return rest ;
}
// Tries to find the regex, consumes it (pos right after it) and gives the prelude (right before it) and the groups to the callback.
2025-05-26 08:03:57 -07:00
std : : optional < common_chat_msg_parser : : find_regex_result > common_chat_msg_parser : : try_find_regex ( const common_regex & regex , size_t from , bool add_prelude_to_content ) {
2025-05-25 01:48:08 +01:00
auto m = regex . search ( input_ , from = = std : : string : : npos ? pos_ : from ) ;
if ( m . type = = COMMON_REGEX_MATCH_TYPE_NONE ) {
return std : : nullopt ;
}
2025-05-26 08:03:57 -07:00
auto prelude = input_ . substr ( pos_ , m . groups [ 0 ] . begin - pos_ ) ;
pos_ = m . groups [ 0 ] . end ;
if ( add_prelude_to_content ) {
add_content ( prelude ) ;
}
2025-05-25 01:48:08 +01:00
if ( m . type = = COMMON_REGEX_MATCH_TYPE_PARTIAL ) {
if ( is_partial ( ) ) {
throw common_chat_msg_partial_exception ( regex . str ( ) ) ;
}
return std : : nullopt ;
}
return find_regex_result { prelude , m . groups } ;
}
common_chat_msg_parser : : find_regex_result common_chat_msg_parser : : consume_regex ( const common_regex & regex ) {
if ( auto result = try_consume_regex ( regex ) ) {
return * result ;
}
throw common_chat_msg_partial_exception ( regex . str ( ) ) ;
}
std : : optional < common_chat_msg_parser : : find_regex_result > common_chat_msg_parser : : try_consume_regex ( const common_regex & regex ) {
auto m = regex . search ( input_ , pos_ ) ;
if ( m . type = = COMMON_REGEX_MATCH_TYPE_NONE ) {
return std : : nullopt ;
}
if ( m . type = = COMMON_REGEX_MATCH_TYPE_PARTIAL ) {
if ( is_partial ( ) ) {
throw common_chat_msg_partial_exception ( regex . str ( ) ) ;
}
return std : : nullopt ;
}
if ( m . groups [ 0 ] . begin ! = pos_ ) {
// Didn't match at the current position.
return std : : nullopt ;
}
pos_ = m . groups [ 0 ] . end ;
return find_regex_result {
/* .prelude = */ " " ,
m . groups ,
} ;
}
std : : optional < common_json > common_chat_msg_parser : : try_consume_json ( ) {
auto it = input_ . cbegin ( ) + pos_ ;
const auto end = input_ . cend ( ) ;
common_json result ;
if ( ! common_json_parse ( it , end , healing_marker_ , result ) ) {
return std : : nullopt ;
}
pos_ = std : : distance ( input_ . cbegin ( ) , it ) ;
if ( result . healing_marker . marker . empty ( ) ) {
// No healing marker, just return the parsed json
return result ;
}
if ( ! is_partial ( ) ) {
throw common_chat_msg_partial_exception ( " JSON " ) ;
}
return result ;
}
common_json common_chat_msg_parser : : consume_json ( ) {
if ( auto result = try_consume_json ( ) ) {
return * result ;
}
throw common_chat_msg_partial_exception ( " JSON " ) ;
}
common_chat_msg_parser : : consume_json_result common_chat_msg_parser : : consume_json_with_dumped_args (
const std : : vector < std : : vector < std : : string > > & args_paths ,
const std : : vector < std : : vector < std : : string > > & content_paths
) {
if ( auto result = try_consume_json_with_dumped_args ( args_paths , content_paths ) ) {
return * result ;
}
throw common_chat_msg_partial_exception ( " JSON " ) ;
}
std : : optional < common_chat_msg_parser : : consume_json_result > common_chat_msg_parser : : try_consume_json_with_dumped_args (
const std : : vector < std : : vector < std : : string > > & args_paths ,
const std : : vector < std : : vector < std : : string > > & content_paths
) {
auto partial = try_consume_json ( ) ;
if ( ! partial ) {
return std : : nullopt ;
}
auto is_arguments_path = [ & ] ( const std : : vector < std : : string > & path ) {
return std : : find ( args_paths . begin ( ) , args_paths . end ( ) , path ) ! = args_paths . end ( ) ;
} ;
auto is_content_path = [ & ] ( const std : : vector < std : : string > & path ) {
return std : : find ( content_paths . begin ( ) , content_paths . end ( ) , path ) ! = content_paths . end ( ) ;
} ;
if ( partial - > healing_marker . marker . empty ( ) ) {
if ( args_paths . empty ( ) ) {
// No arguments to dump, and JSON was parsed fully.
return consume_json_result {
partial - > json ,
/* .is_partial = */ false ,
} ;
}
if ( is_arguments_path ( { } ) ) {
// Entire JSON is the arguments and was parsed fully.
return consume_json_result {
partial - > json . dump ( ) ,
/* .is_partial = */ false ,
} ;
}
}
LOG_DBG ( " Parsed partial JSON: %s (json_healing_marker: %s) \n " , partial - > json . dump ( ) . c_str ( ) , partial - > healing_marker . json_dump_marker . c_str ( ) ) ;
auto found_healing_marker = false ;
std : : vector < std : : string > path ;
std : : function < json ( const json & ) > remove_unsupported_healings_and_dump_args = [ & ] ( const json & j ) - > json {
if ( is_arguments_path ( path ) ) {
auto arguments = j . dump ( ) ;
if ( is_partial ( ) & & ! partial - > healing_marker . marker . empty ( ) ) {
auto idx = arguments . find ( partial - > healing_marker . json_dump_marker ) ;
if ( idx ! = std : : string : : npos ) {
arguments . resize ( idx ) ;
found_healing_marker = true ;
}
if ( arguments = = " \" " ) {
// This happens because of completing `:"$magic` after `"arguments"`
arguments = " " ;
}
}
return arguments ;
}
if ( is_content_path ( path ) ) {
if ( ! j . is_string ( ) ) {
throw std : : runtime_error ( " Content path must be a string " ) ;
}
std : : string str = j ;
auto idx = str . find ( partial - > healing_marker . marker ) ; // not using json_dump_marker as we're inside a string
if ( idx ! = std : : string : : npos ) {
str . resize ( idx ) ;
found_healing_marker = true ;
}
return str ;
}
if ( j . is_object ( ) ) {
auto obj = json : : object ( ) ;
for ( const auto & p : j . items ( ) ) {
const auto & key = p . key ( ) ;
const auto & value = p . value ( ) ;
const std : : string key_str = key ; // NOLINT
auto idx = key_str . find ( healing_marker_ ) ;
if ( idx ! = std : : string : : npos ) {
found_healing_marker = true ;
break ;
}
path . push_back ( key_str ) ;
if ( value . is_string ( ) ) {
const std : : string value_str = value ;
if ( value_str . find ( healing_marker_ ) ! = std : : string : : npos ) {
found_healing_marker = true ;
if ( is_content_path ( path ) ) {
if ( partial - > healing_marker . marker = = partial - > healing_marker . json_dump_marker ) {
// The healing occurred inside the string: good. Otherwise we just ditch the entire key/value pair.
obj [ key ] = remove_unsupported_healings_and_dump_args ( value ) ;
}
}
break ;
}
obj [ key ] = value ;
} else {
obj [ key ] = remove_unsupported_healings_and_dump_args ( value ) ;
}
path . pop_back ( ) ;
}
return obj ;
}
if ( j . is_array ( ) ) {
auto arr = json : : array ( ) ;
for ( const auto & value : j ) {
if ( value . is_string ( ) ) {
std : : string str = value ;
auto idx = str . find ( healing_marker_ ) ;
if ( idx ! = std : : string : : npos ) {
// Don't heal array values that aren't in the arguments.
found_healing_marker = true ;
break ;
}
}
arr . push_back ( remove_unsupported_healings_and_dump_args ( value ) ) ;
}
return arr ;
}
return j ;
} ;
auto cleaned = remove_unsupported_healings_and_dump_args ( partial - > json ) ;
LOG_DBG ( " Cleaned up JSON %s to %s (json_healing_marker : '%s') \n " , partial - > json . dump ( ) . c_str ( ) , cleaned . dump ( ) . c_str ( ) , partial - > healing_marker . json_dump_marker . c_str ( ) ) ;
return consume_json_result {
cleaned ,
/* .is_partial = */ found_healing_marker ,
} ;
}