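feat: Update default model to gemini-3.1-flash-live-preview, remove the proactive audio and affective dialog features, and move turnCoverage / turn_coverage into realtimeInputConfig / realtime_input_config (enabling the previously commented-out realtimeInputConfig block in geminilive.js).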

thorwebdev · thorwebdev · commit 251aa7886995 · 2026-03-25T17:52:48.000-04:00
diff --git a/command-line/node/main.mts b/command-line/node/main.mts
@@ -8,7 +8,7 @@ const ai = new GoogleGenAI({});
 // More information at: https://ai.google.dev/gemini-api/docs/ephemeral-tokens
 
 // --- Live API config ---
-const model = 'gemini-2.5-flash-native-audio-preview-12-2025';
+const model = 'gemini-3.1-flash-live-preview';
 const config = {
   responseModalities: [Modality.AUDIO],
   systemInstruction: "You are a helpful and friendly AI assistant.",
diff --git a/gemini-live-ephemeral-tokens-websocket/README.md b/gemini-live-ephemeral-tokens-websocket/README.md
@@ -92,7 +92,7 @@ class MyTool extends FunctionCallDefinition {
 
 ## Configuration Options
 
-- **Model**: `gemini-3.1-flash-audio-eap` (default)
+- **Model**: `gemini-3.1-flash-live-preview` (default)
 - **Voice**: Puck, Charon, Kore, Fenrir, Aoede
 - **Response**: Audio, text, or both
 - **Tools**: Custom functions or Google Search grounding
diff --git a/gemini-live-ephemeral-tokens-websocket/frontend/geminilive.js b/gemini-live-ephemeral-tokens-websocket/frontend/geminilive.js
@@ -144,10 +144,8 @@ class GeminiLiveAPI {
     this.responseModalities = ["AUDIO"];
     this.systemInstructions = "";
     this.googleGrounding = false;
-    this.enableAffectiveDialog = false; // Default affective dialog
     this.voiceName = "Puck"; // Default voice
     this.temperature = 1.0; // Default temperature
-    this.proactivity = { proactiveAudio: false }; // Proactivity config
     this.inputAudioTranscription = false;
     this.outputAudioTranscription = false;
     this.enableFunctionCalls = false;
@@ -218,10 +216,7 @@ class GeminiLiveAPI {
     this.voiceName = voiceName;
   }
 
-  setProactivity(proactivity) {
-    console.log("setting proactivity: ", proactivity);
-    this.proactivity = proactivity;
-  }
+
 
   setInputAudioTranscription(enabled) {
     console.log("setting input audio transcription: ", enabled);
@@ -346,19 +341,19 @@ class GeminiLiveAPI {
         },
         systemInstruction: { parts: [{ text: this.systemInstructions }] },
         tools: [{ functionDeclarations: tools }],
-        turnCoverage: "TURN_INCLUDES_ONLY_ACTIVITY",
-        // proactivity: this.proactivity,
-
-        // realtimeInputConfig: {
-        //   automaticActivityDetection: {
-        //     disabled: this.automaticActivityDetection.disabled,
-        //     silenceDurationMs: this.automaticActivityDetection.silence_duration_ms,
-        //     prefixPaddingMs: this.automaticActivityDetection.prefix_padding_ms,
-        //     endOfSpeechSensitivity: this.automaticActivityDetection.end_of_speech_sensitivity,
-        //     startOfSpeechSensitivity: this.automaticActivityDetection.start_of_speech_sensitivity,
-        //   },
-        //   activityHandling: this.activityHandling,
-        // },
+
+
+        realtimeInputConfig: {
+          automaticActivityDetection: {
+            disabled: this.automaticActivityDetection.disabled,
+            silenceDurationMs: this.automaticActivityDetection.silence_duration_ms,
+            prefixPaddingMs: this.automaticActivityDetection.prefix_padding_ms,
+            endOfSpeechSensitivity: this.automaticActivityDetection.end_of_speech_sensitivity,
+            startOfSpeechSensitivity: this.automaticActivityDetection.start_of_speech_sensitivity,
+          },
+          activityHandling: this.activityHandling,
+          turnCoverage: "TURN_INCLUDES_ONLY_ACTIVITY",
+        },
       },
     };
 
@@ -378,10 +373,7 @@ class GeminiLiveAPI {
       sessionSetupMessage.setup.tools = [{ googleSearch: {} }];
     }
 
-    // Add affective dialog if enabled
-    // if (this.enableAffectiveDialog) {
-    //   sessionSetupMessage.setup.generationConfig.enableAffectiveDialog = true;
-    // }
+
 
     // Store the setup message for later access
     this.lastSetupMessage = sessionSetupMessage;
diff --git a/gemini-live-ephemeral-tokens-websocket/frontend/index.html b/gemini-live-ephemeral-tokens-websocket/frontend/index.html
@@ -85,7 +85,7 @@ <h2>API Configuration</h2>
 
           <div>
             <label for="model">Model ID:</label><br />
-            <input type="text" id="model" value="gemini-3.1-flash-audio-eap" placeholder="Enter model ID" />
+            <input type="text" id="model" value="gemini-3.1-flash-live-preview" placeholder="Enter model ID" />
           </div>
         </details>
 
@@ -118,24 +118,12 @@ <h2>API Configuration</h2>
               Lower = more predictable/focused</small>
           </div>
 
-          <div>
-            <input type="checkbox" id="enableProactiveAudio" checked />
-            <label for="enableProactiveAudio">Enable proactive audio (Gemini will ignore speech based on
-              instructions)</label>
-          </div>
-
           <div>
             <input type="checkbox" id="enableGrounding" />
             <label for="enableGrounding">Enable Google grounding (Enabling Google grounding will disable
               custom tools)
             </label>
           </div>
-
-          <div>
-            <input type="checkbox" id="enableAffectiveDialog" checked />
-            <label for="enableAffectiveDialog">Enable affective dialog (emotion detection and empathetic
-              responses)</label>
-          </div>
         </details>
 
         <!-- Custom Tools -->
diff --git a/gemini-live-genai-python-sdk/gemini_live.py b/gemini-live-genai-python-sdk/gemini_live.py
@@ -42,8 +42,9 @@ async def start_session(self, audio_input_queue, video_input_queue, text_input_q
             system_instruction=types.Content(parts=[types.Part(text="You are a helpful AI assistant. Keep your responses concise. Speak in a friendly Irish accent. You can see the user's camera or screen which is shared as realtime input images with you.")]),
             input_audio_transcription=types.AudioTranscriptionConfig(),
             output_audio_transcription=types.AudioTranscriptionConfig(),
-            turn_coverage="TURN_INCLUDES_ONLY_ACTIVITY",
-
+            realtime_input_config=types.RealtimeInputConfig(
+                turn_coverage="TURN_INCLUDES_ONLY_ACTIVITY",
+            ),
             tools=self.tools,
         )