429 fix (#1668)

2025-06-25 21:45:38 -04:00 · 2025-06-25 21:45:38 -04:00 · bb797ded7d
parent b6b9923dc3
commit bb797ded7d
6 changed files with 72 additions and 50 deletions
--- a/packages/core/src/core/client.ts
+++ b/packages/core/src/core/client.ts
@ -196,7 +196,6 @@ export class GeminiClient {
      return new GeminiChat(
        this.config,
        this.getContentGenerator(),
        this.model,
        {
          systemInstruction,
          ...generateContentConfigWithThinking,
--- a/packages/core/src/core/geminiChat.test.ts
+++ b/packages/core/src/core/geminiChat.test.ts
@ -25,34 +25,36 @@ const mockModelsModule = {
  batchEmbedContents: vi.fn(),
 } as unknown as Models;
 // Partial stand-in for Config used by the GeminiChat tests. Only the members
 // listed here exist on the object; the cast through `unknown` is what allows
 // this incomplete literal to be typed as a full Config.
 // NOTE(review): this stub does not define getModel(), while the GeminiChat
 // hunks in this change call this.config.getModel() and the describe block
 // declares its own `mockConfig` that does provide it — confirm this top-level
 // copy is meant to remain.
 const mockConfig = {
  getSessionId: () => 'test-session-id',
  getTelemetryLogPromptsEnabled: () => true,
  getUsageStatisticsEnabled: () => true,
  getDebugMode: () => false,
  // Content-generator settings returned to the code under test.
  getContentGeneratorConfig: () => ({
    authType: 'oauth-personal',
    model: 'test-model',
  }),
  // vi.fn() mock, so calls to setModel are recorded rather than acted on.
  setModel: vi.fn(),
  // No fallback handler is installed on this stub.
  flashFallbackHandler: undefined,
 } as unknown as Config;
 describe('GeminiChat', () => {
  let chat: GeminiChat;
-  const model = 'gemini-pro';
+  let mockConfig: Config;
  const config: GenerateContentConfig = {};
  beforeEach(() => {
    vi.clearAllMocks();
    mockConfig = {
      getSessionId: () => 'test-session-id',
      getTelemetryLogPromptsEnabled: () => true,
      getUsageStatisticsEnabled: () => true,
      getDebugMode: () => false,
      getContentGeneratorConfig: () => ({
        authType: 'oauth-personal',
        model: 'test-model',
      }),
      getModel: vi.fn().mockReturnValue('gemini-pro'),
      setModel: vi.fn(),
      flashFallbackHandler: undefined,
    } as unknown as Config;
    // Disable 429 simulation for tests
    setSimulate429(false);
    // Reset history for each test by creating a new instance
-    chat = new GeminiChat(mockConfig, mockModelsModule, model, config, []);
+    chat = new GeminiChat(mockConfig, mockModelsModule, config, []);
  });
  // Per-test teardown: invokes both vi.restoreAllMocks() and
  // vi.resetAllMocks() after every test, presumably so that spies and mock
  // state configured by one test do not carry over into the next (see the
  // Vitest docs for the exact difference between the two calls).
  afterEach(() => {
    vi.restoreAllMocks();
    vi.resetAllMocks();
  });
  describe('sendMessage', () => {
@ -203,7 +205,7 @@ describe('GeminiChat', () => {
      chat.recordHistory(userInput, newModelOutput); // userInput here is for the *next* turn, but history is already primed
      // Reset and set up a more realistic scenario for merging with existing history
-      chat = new GeminiChat(mockConfig, mockModelsModule, model, config, []);
+      chat = new GeminiChat(mockConfig, mockModelsModule, config, []);
      const firstUserInput: Content = {
        role: 'user',
        parts: [{ text: 'First user input' }],
@ -246,7 +248,7 @@ describe('GeminiChat', () => {
        role: 'model',
        parts: [{ text: 'Initial model answer.' }],
      };
-      chat = new GeminiChat(mockConfig, mockModelsModule, model, config, [
+      chat = new GeminiChat(mockConfig, mockModelsModule, config, [
        initialUser,
        initialModel,
      ]);
--- a/packages/core/src/core/geminiChat.ts
+++ b/packages/core/src/core/geminiChat.ts
@ -138,7 +138,6 @@ export class GeminiChat {
  constructor(
    private readonly config: Config,
    private readonly contentGenerator: ContentGenerator,
    private readonly model: string,
    private readonly generationConfig: GenerateContentConfig = {},
    private history: Content[] = [],
  ) {
@ -168,7 +167,12 @@ export class GeminiChat {
  ): Promise<void> {
    logApiResponse(
      this.config,
-      new ApiResponseEvent(this.model, durationMs, usageMetadata, responseText),
+      new ApiResponseEvent(
        this.config.getModel(),
        durationMs,
        usageMetadata,
        responseText,
      ),
    );
  }
@ -178,7 +182,12 @@ export class GeminiChat {
    logApiError(
      this.config,
-      new ApiErrorEvent(this.model, errorMessage, durationMs, errorType),
+      new ApiErrorEvent(
        this.config.getModel(),
        errorMessage,
        durationMs,
        errorType,
      ),
    );
  }
@ -192,7 +201,7 @@ export class GeminiChat {
      return null;
    }
-    const currentModel = this.model;
+    const currentModel = this.config.getModel();
    const fallbackModel = DEFAULT_GEMINI_FLASH_MODEL;
    // Don't fallback if already using Flash model
@ -244,7 +253,7 @@ export class GeminiChat {
    const userContent = createUserContent(params.message);
    const requestContents = this.getHistory(true).concat(userContent);
-    this._logApiRequest(requestContents, this.model);
+    this._logApiRequest(requestContents, this.config.getModel());
    const startTime = Date.now();
    let response: GenerateContentResponse;
@ -252,12 +261,23 @@ export class GeminiChat {
    try {
      const apiCall = () =>
        this.contentGenerator.generateContent({
-          model: this.model,
+          model: this.config.getModel() || DEFAULT_GEMINI_FLASH_MODEL,
          contents: requestContents,
          config: { ...this.generationConfig, ...params.config },
        });
-      response = await retryWithBackoff(apiCall);
+      response = await retryWithBackoff(apiCall, {
        shouldRetry: (error: Error) => {
          if (error && error.message) {
            if (error.message.includes('429')) return true;
            if (error.message.match(/5\d{2}/)) return true;
          }
          return false;
        },
        onPersistent429: async (authType?: string) =>
          await this.handleFlashFallback(authType),
        authType: this.config.getContentGeneratorConfig()?.authType,
      });
      const durationMs = Date.now() - startTime;
      await this._logApiResponse(
        durationMs,
@ -326,14 +346,14 @@ export class GeminiChat {
    await this.sendPromise;
    const userContent = createUserContent(params.message);
    const requestContents = this.getHistory(true).concat(userContent);
-    this._logApiRequest(requestContents, this.model);
+    this._logApiRequest(requestContents, this.config.getModel());
    const startTime = Date.now();
    try {
      const apiCall = () =>
        this.contentGenerator.generateContentStream({
-          model: this.model,
+          model: this.config.getModel(),
          contents: requestContents,
          config: { ...this.generationConfig, ...params.config },
        });
--- a/packages/core/src/utils/nextSpeakerChecker.test.ts
+++ b/packages/core/src/utils/nextSpeakerChecker.test.ts
@ -71,7 +71,6 @@ describe('checkNextSpeaker', () => {
    chatInstance = new GeminiChat(
      mockConfigInstance,
      mockModelsInstance, // This is the instance returned by mockGoogleGenAIInstance.getGenerativeModel
      'gemini-pro', // model name
      {},
      [], // initial history
    );
--- a/packages/core/src/utils/retry.test.ts
+++ b/packages/core/src/utils/retry.test.ts
@ -272,7 +272,7 @@ describe('retryWithBackoff', () => {
      expect(fallbackCallback).toHaveBeenCalledWith('oauth-personal');
      // Should retry again after fallback
-      expect(mockFn).toHaveBeenCalledTimes(4); // 3 initial attempts + 1 after fallback
+      expect(mockFn).toHaveBeenCalledTimes(3); // 2 initial attempts + 1 after fallback
    });
    it('should NOT trigger fallback for API key users', async () => {
--- a/packages/core/src/utils/retry.ts
+++ b/packages/core/src/utils/retry.ts
@ -67,9 +67,9 @@ export async function retryWithBackoff<T>(
    maxAttempts,
    initialDelayMs,
    maxDelayMs,
    shouldRetry,
    onPersistent429,
    authType,
    shouldRetry,
  } = {
    ...DEFAULT_RETRY_OPTIONS,
    ...options,
@ -93,28 +93,30 @@ export async function retryWithBackoff<T>(
        consecutive429Count = 0;
      }
      // If we have persistent 429s and a fallback callback for OAuth
      if (
        consecutive429Count >= 2 &&
        onPersistent429 &&
        authType === AuthType.LOGIN_WITH_GOOGLE_PERSONAL
      ) {
        try {
          const fallbackModel = await onPersistent429(authType);
          if (fallbackModel) {
            // Reset attempt counter and try with new model
            attempt = 0;
            consecutive429Count = 0;
            currentDelay = initialDelayMs;
            // With the model updated, we continue to the next attempt
            continue;
          }
        } catch (fallbackError) {
          // If fallback fails, continue with original error
          console.warn('Fallback to Flash model failed:', fallbackError);
        }
      }
      // Check if we've exhausted retries or shouldn't retry
      if (attempt >= maxAttempts || !shouldRetry(error as Error)) {
        // If we have persistent 429s and a fallback callback for OAuth
        if (
          consecutive429Count >= 2 &&
          onPersistent429 &&
          authType === AuthType.LOGIN_WITH_GOOGLE_PERSONAL
        ) {
          try {
            const fallbackModel = await onPersistent429(authType);
            if (fallbackModel) {
              // Reset attempt counter and try with new model
              attempt = 0;
              consecutive429Count = 0;
              currentDelay = initialDelayMs;
              continue;
            }
          } catch (fallbackError) {
            // If fallback fails, continue with original error
            console.warn('Fallback to Flash model failed:', fallbackError);
          }
        }
        throw error;
      }