From e1c1783e7cbac1565765a83fc83fb2a985c1df9b Mon Sep 17 00:00:00 2001 From: Hatter Jiang Date: Sun, 19 Apr 2026 14:17:32 +0800 Subject: [PATCH] =?UTF-8?q?=F0=9F=94=84=20Refactor=20streaming=20logic=20a?= =?UTF-8?q?nd=20update=20chat=20message=20content=20in=20AI=20test=20scrip?= =?UTF-8?q?ts?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- projects/local-ai-test/main-stream.py | 65 ++++++++++++++++----------- projects/local-ai-test/main.py | 2 +- 2 files changed, 39 insertions(+), 28 deletions(-) diff --git a/projects/local-ai-test/main-stream.py b/projects/local-ai-test/main-stream.py index 3e86bdf..08b5d0d 100644 --- a/projects/local-ai-test/main-stream.py +++ b/projects/local-ai-test/main-stream.py @@ -1,44 +1,55 @@ import os +from datetime import datetime from pprint import pprint from openai import OpenAI from openai._types import Timeout -from openai.types.chat import ChatCompletionUserMessageParam, ChatCompletionSystemMessageParam +from openai.types.chat import ChatCompletionUserMessageParam, ChatCompletionSystemMessageParam, \ + ChatCompletionStreamOptionsParam def main(): client = OpenAI( api_key=os.environ.get("OPENAI_API_KEY", "sk-dummy"), base_url=os.environ.get("OPENAI_API_BASE", "http://localhost:11434/v1"), - timeout=Timeout(30, connect=5), + timeout=Timeout(10, connect=5), ) - response = client.chat.completions.create( - model=os.environ.get("OPENAI_MODEL", "qwen-math-turbo"), - messages=[ - ChatCompletionSystemMessageParam(role="system", content="You are a useful assistant."), - # ChatCompletionUserMessageParam(**{"role": "user", "content": "Hello!"}), - ChatCompletionUserMessageParam(role="user", content="Hello!"), - ], - stream=True, - # stream_options={"include_usage": True}, - ) - print() - pprint(vars(response)) - print() - # print(response.choices[0].message.content) + print("Start", datetime.now()) + try: + stream = client.chat.completions.create( + model=os.environ.get("OPENAI_MODEL", 
"qwen-math-turbo"), + messages=[ + ChatCompletionSystemMessageParam(role="system", content="You are a useful assistant."), + # ChatCompletionUserMessageParam(**{"role": "user", "content": "Hello!"}), + ChatCompletionUserMessageParam(role="user", content="Introduce yourself."), + ], + stream=True, + stream_options=ChatCompletionStreamOptionsParam(include_usage=True), + ) + print() + pprint(vars(stream)) + print() - for chunk in response: - print('xx') - if chunk.choices: - content = chunk.choices[0].delta.content or "" - print('CHUNK:', content, end="", flush=True) - # content_parts.append(content) - elif chunk.usage: - print("\n--- 请求用量 ---") - print(f"输入 Tokens: {chunk.usage.prompt_tokens}") - print(f"输出 Tokens: {chunk.usage.completion_tokens}") - print(f"总计 Tokens: {chunk.usage.total_tokens}") + content_parts = [] + print("Begin chunk", datetime.now()) + for chunk in stream: + print("Chunk", datetime.now()) + if chunk.choices: + content = chunk.choices[0].delta.content or "" + print('CHUNK:', content, flush=True) + content_parts.append(content) + elif chunk.usage: + print("\n----- Usage -----") + print(f"Input Tokens: {chunk.usage.prompt_tokens}") + print(f"Output Tokens: {chunk.usage.completion_tokens}") + print(f"Total Tokens: {chunk.usage.total_tokens}") + print("") + print("Finally:", "".join(content_parts)) + except Exception as e: + print("Exception", datetime.now(), e) + finally: + print("End", datetime.now()) if __name__ == "__main__": diff --git a/projects/local-ai-test/main.py b/projects/local-ai-test/main.py index 39eed48..8a3c39e 100644 --- a/projects/local-ai-test/main.py +++ b/projects/local-ai-test/main.py @@ -18,7 +18,7 @@ def main(): messages=[ ChatCompletionSystemMessageParam(role="system", content="You are a useful assistant."), # ChatCompletionUserMessageParam(**{"role": "user", "content": "Hello!"}), - ChatCompletionUserMessageParam(role="user", content="Hello!"), + ChatCompletionUserMessageParam(role="user", content="Introduce yourself in 
a short sentence."), ], ) print()