midscene/packages/core/tests/ai/insight/insight.test.ts

import { distance } from '@/ai-model/prompt/util';
import Insight from '@/insight';
import { sleep } from '@/utils';
import { vlLocateMode } from '@midscene/shared/env';
import { getContextFromFixture } from 'tests/evaluation';
import { describe, expect, test, vi } from 'vitest';

// Give every test in this file up to 60 seconds before vitest times it out.
vi.setConfig({ testTimeout: 60_000 });

// Evaluated once at module load; the deep-think suite below is skipped when
// this value is falsy.
const vlMode = vlLocateMode();

// Deep-think locate tests run against the 'taobao' fixture.
// The whole suite is skipped when `vlMode` is falsy.
describe.skipIf(!vlMode)('insight locate with deep think', () => {
  // Locating the cart icon with deepThink enabled must yield an element.
  test('insight locate with search area', async () => {
    const { context } = await getContextFromFixture('taobao');

    const insight = new Insight(context);
    const { element } = await insight.locate({
      prompt: '购物车 icon',
      deepThink: true,
    });
    // toBeTruthy rather than toBeDefined: toBeDefined only rejects
    // `undefined`, so a `null` element would let this test pass vacuously.
    expect(element).toBeTruthy();

    // NOTE(review): the reason for this 3s pause is not visible in this file
    // (presumably pacing between model calls) — confirm before removing.
    await sleep(3000);
  });

  // The located element's rect and the returned `rect` must start close to
  // each other: their top-left corners must be less than 100 apart as
  // measured by `distance`.
  test('insight locate with search area and think twice', async () => {
    const { context } = await getContextFromFixture('taobao');

    const insight = new Insight(context);
    const { element, rect } = await insight.locate({
      prompt: '顶部购物车 icon',
      deepThink: true,
    });
    // Reject both `null` and `undefined` here so a missing result fails on
    // the assertion itself instead of a TypeError in the property reads below.
    expect(element).toBeTruthy();
    expect(rect).toBeTruthy();
    expect(
      distance(
        {
          // Non-null assertions are safe: both values were asserted truthy above.
          x: element!.rect.left,
          y: element!.rect.top,
        },
        {
          x: rect!.left,
          y: rect!.top,
        },
      ),
    ).toBeLessThan(100);

    // NOTE(review): same unexplained 3s pause as in the previous test — confirm.
    await sleep(3000);
  });
});

// NOTE(review): sets the same 60-second testTimeout as the vi.setConfig call
// near the top of this file, so this call looks redundant — confirm and drop.
vi.setConfig({ testTimeout: 60_000 });

// Always-skipped case: runs a deep-think locate against the 'image-only'
// fixture and only logs the result; it makes no assertions.
test.skip('insight locate with search area', async () => {
  const fixture = await getContextFromFixture('image-only');
  const locator = new Insight(fixture.context);

  const located = await locator.locate({
    prompt: '-',
    deepThink: true,
  });
  const { element, rect } = located;

  // Print the raw locate output for inspection.
  console.log(element, rect);
  await sleep(3000);
});
feat: use aiTap(prompt, opt) style interface (#512) 2025-04-01 10:41:31 +08:00			`import { distance } from '@/ai-model/prompt/util';`
feat: enable search area for locate (#473) * feat: enable search area for locate * fix: update evaluation * fix: build error * fix: ci * fix: locator * feat: show searchArea in report * chore: add yaml support for aiTap * feat: update status tip * fix: #473 (#484) * chore: optimize unit test list --------- Co-authored-by: zhouxiao.shaw <zhouxiao.shaw@bytedance.com> 2025-03-24 09:50:27 +08:00			`import Insight from '@/insight';`
			`import { sleep } from '@/utils';`
feat(core): allow custom midscene_run dir (#631) * feat(core): support custom midscene_run dir * feat(report): add search functionality to PlaywrightCaseSelector component * refactor(shared): simplify base directory resolution and remove unused environment variable * feat(shared): integrate shared environment variables across multiple packages * refactor(shared): update base directory resolution to use dynamic midscene_run directory * fix(puppeteer): increase screenshot timeout from 3s to 10s for improved reliability 2025-04-24 22:54:52 +08:00			`import { vlLocateMode } from '@midscene/shared/env';`
feat: enable search area for locate (#473) * feat: enable search area for locate * fix: update evaluation * fix: build error * fix: ci * fix: locator * feat: show searchArea in report * chore: add yaml support for aiTap * feat: update status tip * fix: #473 (#484) * chore: optimize unit test list --------- Co-authored-by: zhouxiao.shaw <zhouxiao.shaw@bytedance.com> 2025-03-24 09:50:27 +08:00			`import { getContextFromFixture } from 'tests/evaluation';`
fix: ai test (#494) * fix: ai test * fix: planning ci 2025-03-25 10:04:03 +08:00			`import { describe, expect, test, vi } from 'vitest';`
feat: enable search area for locate (#473) * feat: enable search area for locate * fix: update evaluation * fix: build error * fix: ci * fix: locator * feat: show searchArea in report * chore: add yaml support for aiTap * feat: update status tip * fix: #473 (#484) * chore: optimize unit test list --------- Co-authored-by: zhouxiao.shaw <zhouxiao.shaw@bytedance.com> 2025-03-24 09:50:27 +08:00
			`vi.setConfig({`
			`testTimeout: 60 * 1000,`
			`});`

fix: ai test (#494) * fix: ai test * fix: planning ci 2025-03-25 10:04:03 +08:00			`const vlMode = vlLocateMode();`
feat: enable search area for locate (#473) * feat: enable search area for locate * fix: update evaluation * fix: build error * fix: ci * fix: locator * feat: show searchArea in report * chore: add yaml support for aiTap * feat: update status tip * fix: #473 (#484) * chore: optimize unit test list --------- Co-authored-by: zhouxiao.shaw <zhouxiao.shaw@bytedance.com> 2025-03-24 09:50:27 +08:00
chore: update evaluation fixture (#552) 2025-04-10 16:54:21 +08:00			`describe.skipIf(!vlMode)('insight locate with deep think', () => {`
fix: ai test (#494) * fix: ai test * fix: planning ci 2025-03-25 10:04:03 +08:00			`test('insight locate with search area', async () => {`
			`const { context } = await getContextFromFixture('taobao');`
feat: enable search area for locate (#473) * feat: enable search area for locate * fix: update evaluation * fix: build error * fix: ci * fix: locator * feat: show searchArea in report * chore: add yaml support for aiTap * feat: update status tip * fix: #473 (#484) * chore: optimize unit test list --------- Co-authored-by: zhouxiao.shaw <zhouxiao.shaw@bytedance.com> 2025-03-24 09:50:27 +08:00
fix: ai test (#494) * fix: ai test * fix: planning ci 2025-03-25 10:04:03 +08:00			`const insight = new Insight(context);`
			`const { element } = await insight.locate({`
			`prompt: '购物车 icon',`
chore: update evaluation fixture (#552) 2025-04-10 16:54:21 +08:00			`deepThink: true,`
fix: ai test (#494) * fix: ai test * fix: planning ci 2025-03-25 10:04:03 +08:00			`});`
			`expect(element).toBeDefined();`

			`await sleep(3000);`
			`});`
feat: enable search area for locate (#473) * feat: enable search area for locate * fix: update evaluation * fix: build error * fix: ci * fix: locator * feat: show searchArea in report * chore: add yaml support for aiTap * feat: update status tip * fix: #473 (#484) * chore: optimize unit test list --------- Co-authored-by: zhouxiao.shaw <zhouxiao.shaw@bytedance.com> 2025-03-24 09:50:27 +08:00
fix: ai test (#494) * fix: ai test * fix: planning ci 2025-03-25 10:04:03 +08:00			`test('insight locate with search area and think twice', async () => {`
			`const { context } = await getContextFromFixture('taobao');`
feat: enable search area for locate (#473) * feat: enable search area for locate * fix: update evaluation * fix: build error * fix: ci * fix: locator * feat: show searchArea in report * chore: add yaml support for aiTap * feat: update status tip * fix: #473 (#484) * chore: optimize unit test list --------- Co-authored-by: zhouxiao.shaw <zhouxiao.shaw@bytedance.com> 2025-03-24 09:50:27 +08:00
fix: ai test (#494) * fix: ai test * fix: planning ci 2025-03-25 10:04:03 +08:00			`const insight = new Insight(context);`
feat: use aiTap(prompt, opt) style interface (#512) 2025-04-01 10:41:31 +08:00			`const { element, rect } = await insight.locate({`
fix: ai test (#494) * fix: ai test * fix: planning ci 2025-03-25 10:04:03 +08:00			`prompt: '顶部购物车 icon',`
			`deepThink: true,`
			`});`
			`expect(element).toBeDefined();`
feat: use aiTap(prompt, opt) style interface (#512) 2025-04-01 10:41:31 +08:00			`expect(rect).toBeDefined();`
			`expect(`
			`distance(`
			`{`
			`x: element!.rect.left,`
			`y: element!.rect.top,`
			`},`
			`{`
			`x: rect!.left,`
			`y: rect!.top,`
			`},`
			`),`
			`).toBeLessThan(100);`
fix: ai test (#494) * fix: ai test * fix: planning ci 2025-03-25 10:04:03 +08:00			`await sleep(3000);`
feat: enable search area for locate (#473) * feat: enable search area for locate * fix: update evaluation * fix: build error * fix: ci * fix: locator * feat: show searchArea in report * chore: add yaml support for aiTap * feat: update status tip * fix: #473 (#484) * chore: optimize unit test list --------- Co-authored-by: zhouxiao.shaw <zhouxiao.shaw@bytedance.com> 2025-03-24 09:50:27 +08:00			`});`
			`});`
use adb instead of appium (#483) * feat: enable search area for locate * fix: update evaluation * fix: locator * feat: show searchArea in report * chore: add yaml support for aiTap * feat: use adb instead appium * feat: Adds debugging information and reconstructs input text capabilities * feat: refactoring Android related functions and adding android modules * feat: update the image scaling algorithm, adjust the Android page class to support device scaling, and remove test files that are no longer needed * feat: adjust the Android page class to support device scaling, and remove test files that are no longer needed * feat: use appium-adb instead of bare command * fix: update entry for @midscene/android * feat: optimize the screenshot processing logic, add a backup mechanism when screenshots fail, and update test cases to accommodate new features * fix: rethrow error * feat: add Android debug configuration options and update documentation * chore: fix code style in #483 (#492) * fix: remove try for error handle by outside --------- Co-authored-by: yutao <yutao.tao@bytedance.com> Co-authored-by: linyibing <linyibing@bytedance.com> Co-authored-by: yuyutaotao <167746126+yuyutaotao@users.noreply.github.com> 2025-03-25 22:45:05 +08:00
			`vi.setConfig({`
			`testTimeout: 60 * 1000,`
			`});`

chore: update evaluation fixture (#552) 2025-04-10 16:54:21 +08:00			`test.skip('insight locate with search area', async () => {`
			`const { context } = await getContextFromFixture('image-only');`
use adb instead of appium (#483) * feat: enable search area for locate * fix: update evaluation * fix: locator * feat: show searchArea in report * chore: add yaml support for aiTap * feat: use adb instead appium * feat: Adds debugging information and reconstructs input text capabilities * feat: refactoring Android related functions and adding android modules * feat: update the image scaling algorithm, adjust the Android page class to support device scaling, and remove test files that are no longer needed * feat: adjust the Android page class to support device scaling, and remove test files that are no longer needed * feat: use appium-adb instead of bare command * fix: update entry for @midscene/android * feat: optimize the screenshot processing logic, add a backup mechanism when screenshots fail, and update test cases to accommodate new features * fix: rethrow error * feat: add Android debug configuration options and update documentation * chore: fix code style in #483 (#492) * fix: remove try for error handle by outside --------- Co-authored-by: yutao <yutao.tao@bytedance.com> Co-authored-by: linyibing <linyibing@bytedance.com> Co-authored-by: yuyutaotao <167746126+yuyutaotao@users.noreply.github.com> 2025-03-25 22:45:05 +08:00
chore: update evaluation fixture (#552) 2025-04-10 16:54:21 +08:00			`const insight = new Insight(context);`
			`const { element, rect } = await insight.locate({`
			`prompt: '-',`
			`deepThink: true,`
			`});`
			`console.log(element, rect);`
			`await sleep(3000);`
			`});`