File size: 1,695 Bytes
35765b5 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 |
"""Test which Gemini/Gemma models are available for your API key."""
import google.generativeai as genai
import os
from dotenv import load_dotenv
# Load variables from a local .env file (if any) before looking up the key.
load_dotenv()
GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
if not GEMINI_API_KEY:
    # A missing or empty key makes every later request pointless, so stop here.
    print("ERROR: GEMINI_API_KEY not found in .env")
    # Raise SystemExit directly instead of calling the bare `exit` helper:
    # `exit` is injected by the `site` module for interactive sessions and is
    # not defined under `python -S` or in frozen/embedded interpreters.
    raise SystemExit(1)
genai.configure(api_key=GEMINI_API_KEY)
# Model identifiers to probe, in the order they are tested: the two Gemini
# entries first, then the gemma-3-*-it family generated from its size tags.
MODELS = [
    "gemini-2.0-flash",
    "gemini-2.0-flash-lite",
    *(f"gemma-3-{size}-it" for size in ("1b", "4b", "12b", "27b")),
]

# Minimal prompt sent to every model; only a short reply is needed to show
# that the model answers at all.
TEST_PROMPT = "Say 'Hello' in one word."
# Report header.
print("=" * 60, "Testing Gemini/Gemma Models Availability", "=" * 60, sep="\n")

# Every model name ends up in exactly one of these two lists.
available, unavailable = [], []

for model_name in MODELS:
    try:
        reply = genai.GenerativeModel(model_name).generate_content(TEST_PROMPT)
        # Show at most the first 50 characters of the stripped reply.
        preview = reply.text.strip()[:50]
        print(f"[OK] {model_name:25} -> {preview}")
        available.append(model_name)
    except Exception as exc:
        # Any failure while querying or reporting counts as "unavailable";
        # only the first 60 characters of the error text are shown.
        print(f"[ERR] {model_name:25} -> {str(exc)[:60]}")
        unavailable.append(model_name)
# Summary header, preceded by a blank line.
print("\n" + "=" * 60, "SUMMARY", "=" * 60, sep="\n")

# Both result lists are rendered the same way: a heading with the count,
# followed by one line per model name.
for heading, names in (("Available", available), ("Unavailable", unavailable)):
    print(f"\n{heading} ({len(names)}):")
    for m in names:
        print(f" - {m}")
# Per-model requests-per-minute figures used for the capacity estimate.
# NOTE(review): the numbers are hard-coded here; confirm them against the
# current rate limits for your API tier.
rpm_map = {
    "gemini-2.0-flash": 15,
    "gemini-2.0-flash-lite": 30,
    **dict.fromkeys(
        ("gemma-3-1b-it", "gemma-3-4b-it", "gemma-3-12b-it", "gemma-3-27b-it"),
        30,
    ),
}

# Sum the limits of the models that responded; a name missing from the table
# contributes 0.
total_rpm = sum(rpm_map.get(name, 0) for name in available)

# With half of all requests served from a cache, only every second request
# reaches the API, so the effective throughput is twice the raw limit.
effective_rpm = total_rpm * 2

print(f"\nCombined RPM capacity: {total_rpm} RPM")
print(f"With 50% cache hit rate: ~{effective_rpm} effective RPM")
|