diff --git a/example_apps/openai_compatible.py b/example_apps/openai_compatible.py index 921bcc4..e3341e1 100644 --- a/example_apps/openai_compatible.py +++ b/example_apps/openai_compatible.py @@ -31,6 +31,7 @@ ) MODEL = os.getenv("OPENAI_MODEL", "") +REASONING_EFFORT = os.getenv("OPENAI_REASONING_EFFORT", "none") SYSTEM_PROMPT = "あなたは親切な音声アシスタントです。音声で返答するため、マークダウンは記述せず、簡潔に答えてください。だいたい3文程度で答えてください。" @@ -80,6 +81,7 @@ async def talk_session(proxy: WsProxy): resp = await client.chat.completions.create( model=MODEL, messages=messages, + reasoning_effort=REASONING_EFFORT, ) reply = resp.choices[0].message.content or "" diff --git a/misc/on_mac_demo/start-ollama.sh b/misc/on_mac_demo/start-ollama.sh new file mode 100755 index 0000000..53ba3ee --- /dev/null +++ b/misc/on_mac_demo/start-ollama.sh @@ -0,0 +1,14 @@ +#!/bin/bash + +MODEL_NAME="gemma4:26b" +CONTEXT_SIZE=$((1024 * 128)) + +curl http://localhost:11434/api/generate \ + -H 'Content-Type: application/json' \ + -d "{ + \"model\": \"$MODEL_NAME\", + \"keep_alive\": -1, + \"options\": { + \"num_ctx\": $CONTEXT_SIZE + } + }"