mirror of
https://github.com/QwenLM/qwen-code.git
synced 2025-12-20 08:47:44 +00:00
(model) - Use Flash Lite For Next Speaker Checks (#4991)
This commit is contained in:
@@ -6,4 +6,5 @@
|
|||||||
|
|
||||||
export const DEFAULT_GEMINI_MODEL = 'gemini-2.5-pro';
|
export const DEFAULT_GEMINI_MODEL = 'gemini-2.5-pro';
|
||||||
export const DEFAULT_GEMINI_FLASH_MODEL = 'gemini-2.5-flash';
|
export const DEFAULT_GEMINI_FLASH_MODEL = 'gemini-2.5-flash';
|
||||||
|
export const DEFAULT_GEMINI_FLASH_LITE_MODEL = 'gemini-2.5-flash-lite';
|
||||||
export const DEFAULT_GEMINI_EMBEDDING_MODEL = 'gemini-embedding-001';
|
export const DEFAULT_GEMINI_EMBEDDING_MODEL = 'gemini-embedding-001';
|
||||||
|
|||||||
@@ -21,6 +21,7 @@ export function tokenLimit(model: Model): TokenCount {
|
|||||||
case 'gemini-2.5-pro':
|
case 'gemini-2.5-pro':
|
||||||
case 'gemini-2.5-flash-preview-05-20':
|
case 'gemini-2.5-flash-preview-05-20':
|
||||||
case 'gemini-2.5-flash':
|
case 'gemini-2.5-flash':
|
||||||
|
case 'gemini-2.5-flash-lite':
|
||||||
case 'gemini-2.0-flash':
|
case 'gemini-2.0-flash':
|
||||||
return 1_048_576;
|
return 1_048_576;
|
||||||
case 'gemini-2.0-flash-preview-image-generation':
|
case 'gemini-2.0-flash-preview-image-generation':
|
||||||
|
|||||||
@@ -6,7 +6,7 @@
|
|||||||
|
|
||||||
import { describe, it, expect, vi, beforeEach, Mock, afterEach } from 'vitest';
|
import { describe, it, expect, vi, beforeEach, Mock, afterEach } from 'vitest';
|
||||||
import { Content, GoogleGenAI, Models } from '@google/genai';
|
import { Content, GoogleGenAI, Models } from '@google/genai';
|
||||||
import { DEFAULT_GEMINI_FLASH_MODEL } from '../config/models.js';
|
import { DEFAULT_GEMINI_FLASH_LITE_MODEL } from '../config/models.js';
|
||||||
import { GeminiClient } from '../core/client.js';
|
import { GeminiClient } from '../core/client.js';
|
||||||
import { Config } from '../config/config.js';
|
import { Config } from '../config/config.js';
|
||||||
import { checkNextSpeaker, NextSpeakerResponse } from './nextSpeakerChecker.js';
|
import { checkNextSpeaker, NextSpeakerResponse } from './nextSpeakerChecker.js';
|
||||||
@@ -248,6 +248,6 @@ describe('checkNextSpeaker', () => {
|
|||||||
expect(mockGeminiClient.generateJson).toHaveBeenCalled();
|
expect(mockGeminiClient.generateJson).toHaveBeenCalled();
|
||||||
const generateJsonCall = (mockGeminiClient.generateJson as Mock).mock
|
const generateJsonCall = (mockGeminiClient.generateJson as Mock).mock
|
||||||
.calls[0];
|
.calls[0];
|
||||||
expect(generateJsonCall[3]).toBe(DEFAULT_GEMINI_FLASH_MODEL);
|
expect(generateJsonCall[3]).toBe(DEFAULT_GEMINI_FLASH_LITE_MODEL);
|
||||||
});
|
});
|
||||||
});
|
});
|
||||||
|
|||||||
@@ -5,7 +5,7 @@
|
|||||||
*/
|
*/
|
||||||
|
|
||||||
import { Content, SchemaUnion, Type } from '@google/genai';
|
import { Content, SchemaUnion, Type } from '@google/genai';
|
||||||
import { DEFAULT_GEMINI_FLASH_MODEL } from '../config/models.js';
|
import { DEFAULT_GEMINI_FLASH_LITE_MODEL } from '../config/models.js';
|
||||||
import { GeminiClient } from '../core/client.js';
|
import { GeminiClient } from '../core/client.js';
|
||||||
import { GeminiChat } from '../core/geminiChat.js';
|
import { GeminiChat } from '../core/geminiChat.js';
|
||||||
import { isFunctionResponse } from './messageInspectors.js';
|
import { isFunctionResponse } from './messageInspectors.js';
|
||||||
@@ -132,7 +132,7 @@ export async function checkNextSpeaker(
|
|||||||
contents,
|
contents,
|
||||||
RESPONSE_SCHEMA,
|
RESPONSE_SCHEMA,
|
||||||
abortSignal,
|
abortSignal,
|
||||||
DEFAULT_GEMINI_FLASH_MODEL,
|
DEFAULT_GEMINI_FLASH_LITE_MODEL,
|
||||||
)) as unknown as NextSpeakerResponse;
|
)) as unknown as NextSpeakerResponse;
|
||||||
|
|
||||||
if (
|
if (
|
||||||
|
|||||||
Reference in New Issue
Block a user