From 2acf8092cd90a4d5ebf484ac45ff47639ea2fe03 Mon Sep 17 00:00:00 2001 From: Sandro Cavallari Date: Thu, 15 May 2025 09:21:32 +0000 Subject: [PATCH 1/2] fix the introduction of an additional space and split words in subtokens --- nemoguardrails/rails/llm/llmrails.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nemoguardrails/rails/llm/llmrails.py b/nemoguardrails/rails/llm/llmrails.py index daf36ff51..b93be2a38 100644 --- a/nemoguardrails/rails/llm/llmrails.py +++ b/nemoguardrails/rails/llm/llmrails.py @@ -1297,7 +1297,7 @@ def _prepare_params( ) async for chunk_list, chunk_str_rep in buffer_strategy(streaming_handler): - chunk_str = " ".join(chunk_list) + chunk_str = "".join(chunk_list) # Check if chunk_str_rep is a JSON string # we yield a json error payload in generate_async when From 959742c58c2dec1e5a2cfb5d32925a19a537a78e Mon Sep 17 00:00:00 2001 From: Sandro Cavallari Date: Mon, 16 Jun 2025 17:00:05 +0000 Subject: [PATCH 2/2] yield words as they are --- nemoguardrails/rails/llm/llmrails.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/nemoguardrails/rails/llm/llmrails.py b/nemoguardrails/rails/llm/llmrails.py index b93be2a38..aa9995a01 100644 --- a/nemoguardrails/rails/llm/llmrails.py +++ b/nemoguardrails/rails/llm/llmrails.py @@ -1311,8 +1311,8 @@ def _prepare_params( if stream_first: words = chunk_str_rep.split() if words: - yield words[0] - for word in words[1:]: + # yield words[0] + for word in words: yield f" {word}" for flow_id in output_rails_flows_id: