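"""min_p_sampling_approx.py

Approximate min-p sampling on top of the Gemini API, which does not expose
per-token log-probabilities. Each step requests many single-token candidates
for the same prompt, estimates the next-token distribution from their
frequencies, discards tokens whose estimated probability falls below
p_base * p_max (the min-p filter), renormalizes the survivors, and samples
the next token locally. One API request is issued per generated token, so
this is a demonstration of the technique rather than an efficient sampler.
"""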
import collections
import os
import random

import google.generativeai as genai
from google.generativeai.types import GenerationConfig, GenerateContentResponse

def _normalize_probs(prob_map):
    """Rescale a token -> probability map so the values sum to 1.

    If every value is zero, fall back to a uniform distribution over the
    tokens that are present; an empty map stays empty.
    """
    total_prob = sum(prob_map.values())
    if total_prob == 0:
        num_tokens = len(prob_map)
        if num_tokens == 0:
            return {}
        equal_prob = 1.0 / num_tokens
        return {token: equal_prob for token in prob_map}
    return {token: prob / total_prob for token, prob in prob_map.items()}

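# Worked example of the min-p filter (illustrative numbers, not API output):
# suppose estimated_probs = {"the": 0.5, "a": 0.3, "cat": 0.15, "zx": 0.05}.
# With p_base = 0.1, p_threshold = 0.1 * 0.5 = 0.05, so all four tokens
# survive. With p_base = 0.4, p_threshold = 0.2, leaving only "the" and "a",
# which _normalize_probs rescales to {"the": 0.625, "a": 0.375}.
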
def generate_content_min_p_approx(
    model: genai.GenerativeModel,
    prompt: str,
    max_new_tokens: int = 50,
    p_base: float = 0.1,
    temperature: float = 1.0,
    num_samples: int = 100,
    fallback_to_most_frequent: bool = True,
) -> str:
    """Generate up to max_new_tokens tokens using approximated min-p sampling.

    Each step samples num_samples single-token candidates, estimates the
    next-token distribution from their frequencies, filters with threshold
    p_base * p_max, and samples the next token from the renormalized rest.
    """
    if not (0.0 < p_base <= 1.0):
        raise ValueError("p_base must be between 0.0 (exclusive) and 1.0 (inclusive)")
    generated_sequence = prompt
    current_prompt = prompt
    print(f"Starting min_p approximation (p_base={p_base}, temp={temperature}, samples={num_samples})...")
    for i in range(max_new_tokens):
        print(f"  Step {i+1}/{max_new_tokens}: Generating candidates...")
        try:
            # Request num_samples independent single-token continuations in
            # one call; their frequencies approximate the model's next-token
            # distribution at this temperature.
            estimation_config = GenerationConfig(
                candidate_count=num_samples,
                max_output_tokens=1,
                temperature=temperature,
            )
            response: GenerateContentResponse = model.generate_content(
                current_prompt,
                generation_config=estimation_config,
            )
            if not response.candidates:
                print("  Warning: No candidates generated by the API. Stopping generation.")
                break
            # Count how often each distinct first token appears among the
            # sampled candidates.
            token_counts = collections.Counter()
            valid_candidates = 0
            for candidate in response.candidates:
                if candidate.content and candidate.content.parts:
                    try:
                        token_text = candidate.content.parts[0].text
                        if token_text:
                            token_counts[token_text] += 1
                            valid_candidates += 1
                    except (IndexError, AttributeError, KeyError):
                        print(f"    Warning: Skipping malformed candidate: {candidate}")
                        continue
                else:
                    print(f"    Warning: Skipping empty or blocked candidate: {candidate.finish_reason}, {candidate.safety_ratings}")
            if valid_candidates == 0:
                print("  Error: No valid tokens found among candidates. Stopping generation.")
                break
            # Empirical next-token probabilities from candidate frequencies.
            estimated_probs = {token: count / valid_candidates for token, count in token_counts.items()}
            if not estimated_probs:
                print("  Error: Estimated probabilities are empty. Stopping generation.")
                break
            # Min-p filter: keep only tokens whose estimated probability is
            # at least p_base times the probability of the most likely token.
            p_max = max(estimated_probs.values())
            p_threshold = p_base * p_max
            filtered_probs = {
                token: prob for token, prob in estimated_probs.items() if prob >= p_threshold
            }
            chosen_token = None
            if not filtered_probs:
                # Defensive: with 0 < p_base <= 1 the most likely token always
                # passes the filter, so this branch should not trigger.
                print("  Warning: Min_p filter resulted in empty set.")
                if fallback_to_most_frequent:
                    chosen_token = token_counts.most_common(1)[0][0]
                    print(f"  Falling back to most frequent token: '{chosen_token}'")
                else:
                    print("  Error: No tokens passed min_p filter and no fallback. Stopping.")
                    break
            else:
                # Renormalize the surviving tokens and sample from them.
                normalized_filtered_probs = _normalize_probs(filtered_probs)
                tokens = list(normalized_filtered_probs.keys())
                probabilities = list(normalized_filtered_probs.values())
                chosen_token = random.choices(tokens, weights=probabilities, k=1)[0]
            if chosen_token is None:
                print("  Error: Could not select a token. Stopping generation.")
                break
            generated_sequence += chosen_token
            current_prompt += chosen_token
        except Exception as e:
            print(f"  Error during generation step {i+1}: {e}")
            break
    print("Finished min_p approximation.")
    return generated_sequence

if __name__ == "__main__":
    try:
        # NOTE: assumes the API key is provided via the GOOGLE_API_KEY
        # environment variable; adapt this line to your own setup.
        genai.configure(api_key=os.environ["GOOGLE_API_KEY"])
        model = genai.GenerativeModel('gemini-1.5-flash-latest')
        initial_prompt = "Write a short story about a curious cat exploring a futuristic city."
        p_base_val = 0.1
        temp_val = 1.5
        samples_per_step = 100
        tokens_to_generate = 100
        generated_text = generate_content_min_p_approx(
            model,
            initial_prompt,
            max_new_tokens=tokens_to_generate,
            p_base=p_base_val,
            temperature=temp_val,
            num_samples=samples_per_step,
        )
        print("\n--- Generated Text ---")
        print(generated_text)
    except Exception as e:
        print(f"An error occurred during example usage: {e}")
        print("Please ensure you have configured your API key and have access to the specified model.")