chore: rename files in core module (#277)
---------

Co-authored-by: zhouxiao.shaw <[email protected]>
yuyutaotao and zhoushaw authored Jan 14, 2025
1 parent 74774c6 commit 68b4004
Showing 25 changed files with 35 additions and 635 deletions.
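This commit is mainly a rename pass over the core module, with a few unused helpers and exports removed along the way. The mapping below is a sketch assembled from the paths visible in this diff (relative to `packages/midscene/src`); it is illustrative rather than an exhaustive list of all 25 changed files.

```ts
// Rename map gathered from this diff (old path → new path), relative to packages/midscene/src:
//
//   ai-model/openai.ts                    → ai-model/service-caller.ts
//   ai-model/prompt/element-inspector.ts  → ai-model/prompt/llm-locator.ts
//   ai-model/automation.ts                → ai-model/llm-planning.ts
//   ai-model/prompt/planning.ts           → ai-model/prompt/llm-planning.ts
//   ai-model/vlm-planning.ts              → ai-model/ui-tars-planning.ts
//   ai-model/prompt/element-point.ts      → ai-model/prompt/ui-tars-locator.ts
//   action/executor.ts                    → ai-model/action-executor.ts
//
// Renamed prompt helpers (same behavior, new names):
//   systemPromptToFindElement         → systemPromptToLocateElement
//   systemPromptToFindElementPosition → systemPromptToLocateElementPosition

// Example: an internal module that previously did
//   import { callToGetJSONObject, checkAIConfig } from './openai';
// now imports the same functions from the renamed file:
import { callToGetJSONObject, checkAIConfig } from './service-caller';
```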
2 changes: 1 addition & 1 deletion apps/site/docs/zh/index.mdx
@@ -1,6 +1,6 @@
# Midscene.js - AI-Powered, Joyful UI Automation

UI automation is too hard to maintain. UI automation scripts are often littered with selectors like `#ids`, `data-test`, and `.selectors`. When it comes time to refactor, this can be a real headache, even though that is exactly when UI automation should prove its value.
Traditional UI automation is too hard to maintain. Automation scripts are often littered with selectors like `#ids`, `data-test`, and `.selectors`. When it comes time to refactor, this can be a real headache, even though that is exactly when UI automation should prove its value.

We're introducing Midscene.js to bring back the joy of coding.

File renamed without changes.
4 changes: 1 addition & 3 deletions packages/midscene/src/ai-model/common.ts
@@ -1,13 +1,11 @@
import assert from 'node:assert';
import { MIDSCENE_MODEL_TEXT_ONLY, getAIConfig } from '@/env';
import type { AIUsageInfo } from '@/types';

import type {
ChatCompletionContentPart,
ChatCompletionSystemMessageParam,
ChatCompletionUserMessageParam,
} from 'openai/resources';
import { callToGetJSONObject, checkAIConfig } from './openai';
import { callToGetJSONObject, checkAIConfig } from './service-caller';

export type AIArgs = [
ChatCompletionSystemMessageParam,
9 changes: 4 additions & 5 deletions packages/midscene/src/ai-model/index.ts
@@ -1,5 +1,5 @@
export { callToGetJSONObject } from './openai';
export { systemPromptToFindElement } from './prompt/element-inspector';
export { callToGetJSONObject } from './service-caller';
export { systemPromptToLocateElement } from './prompt/llm-locator';
export { describeUserPage } from './prompt/util';

export type { ChatCompletionMessageParam } from 'openai/resources';
@@ -11,7 +11,6 @@ export {
transformElementPositionToId,
} from './inspect';

export { plan } from './automation';
export { plan } from './llm-planning';
export { callAiFn } from './common';

export { vlmPlanning } from './vlm-planning';
export { vlmPlanning } from './ui-tars-planning';
18 changes: 5 additions & 13 deletions packages/midscene/src/ai-model/inspect.ts
@@ -1,5 +1,4 @@
import assert from 'node:assert';
import path from 'node:path';
import type {
AIAssertionResponse,
AIElementResponse,
@@ -9,29 +8,26 @@ import type {
AIUsageInfo,
BaseElement,
ElementById,
Point,
Size,
UIContext,
} from '@/types';
import { savePositionImg } from '@midscene/shared/img';
import type {
ChatCompletionSystemMessageParam,
ChatCompletionUserMessageParam,
} from 'openai/resources';
import { AIActionType, callAiFn } from './common';
import { call, callToGetJSONObject } from './openai';
import {
findElementPrompt,
multiDescription,
systemPromptToFindElement,
} from './prompt/element-inspector';
systemPromptToLocateElement,
} from './prompt/llm-locator';
import {
describeUserPage,
elementByPositionWithElementInfo,
extractDataPrompt,
systemPromptToAssert,
systemPromptToExtract,
} from './prompt/util';
import { callToGetJSONObject } from './service-caller';

export type AIArgs = [
ChatCompletionSystemMessageParam,
@@ -69,11 +65,7 @@ export async function transformElementPositionToId(
},
size,
);
// await savePositionImg({
// inputImgBase64: screenshotBase64,
// rect: absolutePosition,
// outputPath: path.join(__dirname, 'test-data', `output-${index++}.png`),
// });

const element = elementByPositionWithElementInfo(
elementsInfo,
absolutePosition,
@@ -182,7 +174,7 @@ export async function AiInspectElement<
targetElementDescription,
multi,
});
const systemPrompt = systemPromptToFindElement();
const systemPrompt = systemPromptToLocateElement();
const msgs: AIArgs = [
{ role: 'system', content: systemPrompt },
{
@@ -6,7 +6,7 @@ import {
automationUserPrompt,
generateTaskBackgroundContext,
systemPromptToTaskPlanning,
} from './prompt/planning';
} from './prompt/llm-planning';
import { describeUserPage } from './prompt/util';

export async function plan(
@@ -1,11 +1,11 @@
import { MATCH_BY_POSITION, getAIConfig } from '@/env';
import { PromptTemplate } from '@langchain/core/prompts';
import type { ResponseFormatJSONSchema } from 'openai/resources';
import { systemPromptToFindElementPosition } from './element-point';
import { systemPromptToLocateElementPosition } from './ui-tars-locator';

export function systemPromptToFindElement() {
export function systemPromptToLocateElement() {
if (getAIConfig(MATCH_BY_POSITION)) {
return systemPromptToFindElementPosition();
return systemPromptToLocateElementPosition();
}
return `
## Role:
@@ -144,12 +144,6 @@ Output Example:
`;
}

export function multiDescription(multi: boolean) {
return multi
? 'multiple elements matching the description (two or more)'
: 'The element closest to the description (only one)';
}

export const findElementSchema: ResponseFormatJSONSchema = {
type: 'json_schema',
json_schema: {
@@ -1,5 +1,5 @@
// Claude 3.5 Sonnet (computer use) is better at understanding image content, but does not provide the element snapshot effect
export function systemPromptToFindElementPosition() {
export function systemPromptToLocateElementPosition() {
return `
You are a GUI agent. You are given a task and your action history, with screenshots. You need to perform the next action to complete the task.
2 changes: 1 addition & 1 deletion packages/midscene/src/ai-model/prompt/ui-tars-planning.ts
@@ -1,4 +1,4 @@
import type { Action } from '../vlm-planning';
import type { Action } from '../ui-tars-planning';

export const uiTarsPlanningPrompt = `
You are a GUI agent. You are given a task and your action history, with screenshots. You need to perform the next action to complete the task.
64 changes: 4 additions & 60 deletions packages/midscene/src/ai-model/prompt/util.ts
@@ -13,11 +13,10 @@ const characteristic =
const contextFormatIntro = `
The user will give you a screenshot and some of the text on it. There may be some non-English characters (like Chinese) on it, indicating it's a non-English app. If some text is shown on the screenshot but not introduced by the JSON description, use the information you see on the screenshot.`;

const ONE_ELEMENT_LOCATOR_PREFIX = 'LOCATE_ONE_ELEMENT';
const ELEMENTS_LOCATOR_PREFIX = 'LOCATE_ONE_OR_MORE_ELEMENTS';
const SECTION_MATCHER_FLAG = 'SECTION_MATCHER_FLAG/';

export function systemPromptToFindElement(queryPrompt: string, multi: boolean) {
export function systemPromptToLocateElement(
queryPrompt: string,
multi: boolean,
) {
assert(queryPrompt, 'queryPrompt is required');
return `
${characteristic}
@@ -385,58 +384,3 @@ function cropFieldInformation(
}
return elementInfosDescription;
}

/**
* elements
*/
export function retrieveElement(
prompt: string,
opt?: { multi: boolean },
): string {
if (opt?.multi) {
return `follow ${ELEMENTS_LOCATOR_PREFIX}: ${prompt}`;
}
return `follow ${ONE_ELEMENT_LOCATOR_PREFIX}: ${prompt}`;
}

export function ifElementTypeResponse(response: string): boolean {
if (typeof response !== 'string') {
return false;
}
return (
response.startsWith(ONE_ELEMENT_LOCATOR_PREFIX) ||
response.startsWith(ELEMENTS_LOCATOR_PREFIX)
);
}

export function splitElementResponse(
response: string,
): string | null | string[] {
const oneElementSplitter = `${ONE_ELEMENT_LOCATOR_PREFIX}/`;
if (response.startsWith(oneElementSplitter)) {
const id = response.slice(oneElementSplitter.length);
if (id.indexOf(',') >= 0) {
console.warn(`unexpected comma in one element response: ${id}`);
}
return id ? id : null;
}

const elementsSplitter = `${ELEMENTS_LOCATOR_PREFIX}/`;
if (response.startsWith(elementsSplitter)) {
const idsString = response.slice(elementsSplitter.length);
if (!idsString) {
return [];
}
return idsString.split(',');
}

return null;
}

/**
* sections
*/

export function retrieveSection(prompt: string): string {
return `${SECTION_MATCHER_FLAG}${prompt}`;
}
@@ -16,7 +16,6 @@ import {
AZURE_OPENAI_DEPLOYMENT,
AZURE_OPENAI_ENDPOINT,
AZURE_OPENAI_KEY,
MATCH_BY_POSITION,
MIDSCENE_API_TYPE,
MIDSCENE_AZURE_OPENAI_INIT_CONFIG_JSON,
MIDSCENE_AZURE_OPENAI_SCOPE,
@@ -37,8 +36,8 @@ import {
getAIConfigInJson,
} from '../../env';
import { AIActionType } from '../common';
import { findElementSchema } from '../prompt/element-inspector';
import { planSchema } from '../prompt/planning';
import { findElementSchema } from '../prompt/llm-locator';
import { planSchema } from '../prompt/llm-planning';
import { assertSchema } from '../prompt/util';

export function checkAIConfig(preferVendor?: 'openAI') {
@@ -1,14 +1,12 @@
import type { UIContext } from '@/types';
import type { PlanningAction } from '@/types';
import type { ChatCompletionMessageParam } from 'openai/resources';
import { AIActionType } from './common';
import { call, callToGetJSONObject } from './openai';
import {
getSummary,
parseActionFromVlm,
uiTarsPlanningPrompt,
} from './prompt/ui-tars-planning';
import { describeUserPage } from './prompt/util';
import { call } from './service-caller';

type ActionType = 'click' | 'type' | 'hotkey' | 'finished' | 'scroll' | 'wait';

3 changes: 0 additions & 3 deletions packages/midscene/src/env.ts
@@ -11,7 +11,6 @@ export const MIDSCENE_OPENAI_SOCKS_PROXY = 'MIDSCENE_OPENAI_SOCKS_PROXY';
export const OPENAI_API_KEY = 'OPENAI_API_KEY';
export const OPENAI_BASE_URL = 'OPENAI_BASE_URL';
export const OPENAI_MAX_TOKENS = 'OPENAI_MAX_TOKENS';
export const MIDSCENE_MODEL_TEXT_ONLY = 'MIDSCENE_MODEL_TEXT_ONLY';

export const MIDSCENE_CACHE = 'MIDSCENE_CACHE';
export const MIDSCENE_USE_VLM_UI_TARS = 'MIDSCENE_USE_VLM_UI_TARS';
@@ -49,8 +48,6 @@ const allConfigFromEnv = () => {
process.env[MIDSCENE_DANGEROUSLY_PRINT_ALL_CONFIG] || undefined,
[OPENAI_API_KEY]: process.env[OPENAI_API_KEY] || undefined,
[OPENAI_BASE_URL]: process.env[OPENAI_BASE_URL] || undefined,
[MIDSCENE_MODEL_TEXT_ONLY]:
process.env[MIDSCENE_MODEL_TEXT_ONLY] || undefined,
[OPENAI_MAX_TOKENS]: process.env[OPENAI_MAX_TOKENS] || undefined,
[OPENAI_USE_AZURE]: process.env[OPENAI_USE_AZURE] || undefined,
[MIDSCENE_CACHE]: process.env[MIDSCENE_CACHE] || undefined,
13 changes: 2 additions & 11 deletions packages/midscene/src/index.ts
@@ -1,18 +1,9 @@
import { Executor } from './action/executor';
import { Executor } from './ai-model/action-executor';
import Insight from './insight';
import { getElement, getSection } from './query';
import { getLogDirByType, getVersion, setLogDir } from './utils';

export { plan, transformElementPositionToId } from './ai-model';

export * from './types';
export default Insight;
export {
getElement,
getSection,
Executor,
setLogDir,
getLogDirByType,
Insight,
getVersion,
};
export { Executor, setLogDir, getLogDirByType, Insight, getVersion };
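After this cleanup, the root entry keeps `Insight` (default export), `Executor`, `plan`, `transformElementPositionToId`, and the log/version utilities, while `getElement` and `getSection` are no longer re-exported. Below is a hypothetical consumer-side sketch; the package specifier `@midscene/core` and the zero-argument `getVersion()` call are assumptions for illustration, not confirmed by this diff.

```ts
// Hypothetical consumer-side view of the root exports after this commit.
// The package specifier and the getVersion() signature are assumptions.
import Insight, {
  Executor,
  plan,
  transformElementPositionToId,
  getVersion,
} from '@midscene/core';

console.log(getVersion()); // assumed to return the package version string
```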
30 changes: 3 additions & 27 deletions packages/midscene/src/insight/index.ts
@@ -15,11 +15,7 @@ import type {
PartialInsightDumpFromSDK,
UIContext,
} from '@/types';
import {
ifElementTypeResponse,
splitElementResponse,
} from '../ai-model/prompt/util';
import { idsIntoElements, shallowExpandIds, writeInsightDump } from './utils';
import { writeInsightDump } from './utils';

export interface LocateOpts {
multi?: boolean;
@@ -228,37 +224,17 @@ export default class Insight<
throw new Error(errorLog);
}

let mergedData = data;

// expand elements in object style data
if (data && typeof data === 'object' && !Array.isArray(data)) {
shallowExpandIds(data, ifElementTypeResponse, (id) => {
const idList = splitElementResponse(id);
if (typeof idList === 'string') {
return elementById(idList);
}
if (Array.isArray(idList)) {
return idsIntoElements(idList, elementById);
}
return idList; // i.e. null
});

mergedData = {
...data,
};
}

writeInsightDump(
{
...dumpData,
matchedSection: [],
data: mergedData,
data,
},
logId,
dumpSubscriber,
);

return mergedData;
return data;
}

async assert(assertion: string): Promise<InsightAssertionResponse> {