NVIDIA · andompesta · May 15, 2025 · Jun 16, 2025 · trebedea · Jun 17, 2025
diff --git a/nemoguardrails/rails/llm/llmrails.py b/nemoguardrails/rails/llm/llmrails.py
@@ -1297,7 +1297,7 @@ def _prepare_params(
         )
 
         async for chunk_list, chunk_str_rep in buffer_strategy(streaming_handler):
-            chunk_str = " ".join(chunk_list)
+            chunk_str = "".join(chunk_list)
 
             # Check if chunk_str_rep is a JSON string
             # we yield a json error payload in generate_async when
@@ -1311,8 +1311,8 @@ def _prepare_params(
             if stream_first:
                 words = chunk_str_rep.split()
                 if words:
-                    yield words[0]
-                    for word in words[1:]:
+                    # Every word, including the first, is yielded with a leading space.
+                    for word in words:
                         yield f" {word}"
 
             for flow_id in output_rails_flows_id: