File size: 1,505 Bytes
b56d4a6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
import os
from pathlib import Path

# API Keys
SERP_API_KEY = "2d78ac7b2491065a206825e614a2f20e6f70f90a7958463883f58ae2c2f55bae"
GEMINI_API_KEY = "AIzaSyAPf9oyyb0l9vQcP46Yh1SkG1dE8GvJJv0"

# API Limits
SERP_MONTHLY_LIMIT = 80
GEMINI_RATE_LIMIT = 10  # requests per minute
PAIRS_PER_PROMPT = 5
TARGET_QA_PAIRS = 1000

# Project Paths
PROJECT_ROOT = Path(__file__).parent
DATA_DIR = PROJECT_ROOT / "data"
RAW_DIR = DATA_DIR / "raw"
PROCESSED_DIR = DATA_DIR / "processed"
FINAL_DIR = DATA_DIR / "final"
LOG_DIR = PROJECT_ROOT / "logs"

# Create directories if they don't exist
for dir_path in [DATA_DIR, RAW_DIR, PROCESSED_DIR, FINAL_DIR, LOG_DIR]:
    dir_path.mkdir(parents=True, exist_ok=True)

# Search Queries
SEARCH_QUERIES = {
    "attractions": [
        "Bloomington Indiana tourist attractions",
        "Indiana University landmarks",
        "Bloomington cultural venues"
    ],
    "dining": [
        "Best restaurants Bloomington Indiana",
        "Bloomington cafes and bars",
        "Food trucks Bloomington IN"
    ],
    "events": [
        "Events in Bloomington Indiana",
        "Festivals Bloomington IN",
        "Concerts Bloomington Indiana"
    ],
    "outdoor": [
        "Bloomington parks and recreation",
        "Hiking trails Bloomington IN",
        "Lake Monroe activities"
    ],
    "accommodation": [
        "Hotels Bloomington Indiana",
        "B&B Bloomington IN",
        "Student housing IU Bloomington"
    ]
}