# Midscene.js AI Model Configuration
# Choose ONE vision-capable model below and uncomment the lines in its section.

# === OpenAI GPT-4o ===
# OPENAI_API_KEY=your_openai_api_key
# MIDSCENE_MODEL_NAME=gpt-4o

# === Anthropic Claude ===
# ANTHROPIC_API_KEY=your_anthropic_api_key
# MIDSCENE_MODEL_NAME=claude-sonnet-4-20250514

# === Google Gemini ===
# GOOGLE_GENERATIVE_AI_API_KEY=your_gemini_api_key
# MIDSCENE_MODEL_NAME=gemini-2.5-flash

# === Qwen3-VL (open source, via DashScope) ===
# NOTE(review): the header says Qwen3-VL but the model name below is qwen-vl-max - confirm which model is intended.
# MIDSCENE_MODEL_NAME=qwen-vl-max
# MIDSCENE_OPENAI_BASE_URL=https://dashscope.aliyuncs.com/compatible-mode/v1
# MIDSCENE_OPENAI_KEY=your_dashscope_api_key

# === UI-TARS (open source, requires self-hosted deployment) ===
# MIDSCENE_MODEL_NAME=ui-tars
# MIDSCENE_OPENAI_BASE_URL=http://localhost:8000/v1
# MIDSCENE_OPENAI_KEY=not-needed

# === iOS WDA Configuration ===
# WDA_HOST=localhost
# WDA_PORT=8100