jonngan commited on
Commit
24c3333
·
verified ·
1 Parent(s): b0fa50c

Upload 4 files

Browse files
Files changed (4) hide show
  1. ddqn.py +239 -0
  2. rl_wallet_model.h5 +3 -0
  3. test.py +122 -0
  4. train.py +280 -0
ddqn.py ADDED
@@ -0,0 +1,239 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import numpy as np
2
+ import tensorflow as tf
3
+ from tensorflow.keras import layers
4
+ from pymongo import MongoClient
5
+ import requests
6
+ import random
7
+ from sklearn.preprocessing import StandardScaler
8
+ import os
9
+ from dotenv import load_dotenv
10
+ from langchain_openai import OpenAI
11
+ from langchain.prompts import PromptTemplate
12
+ from operator import itemgetter
13
+
14
# Load environment variables from .env file (provides MONGODB_URI and OPENAI_API_KEY)
load_dotenv()
API_URL = "https://soltrendio.com/api/stats/getTrends"  # Replace with your actual API URL
MODEL_PATH = "rl_wallet_model.h5"  # Path to the trained model
18
+ # MongoDB Connection Setup
19
def get_mongo_connection():
    """Return the 'wallets' collection from the walletAnalyzer database.

    Raises:
        RuntimeError: if the MONGODB_URI environment variable is unset —
            the original crashed here with TypeError on `MONGO_URI[:20]`.
    """
    MONGO_URI = os.getenv("MONGODB_URI")
    if not MONGO_URI:
        raise RuntimeError("MONGODB_URI environment variable is not set")
    print(f"Attempting to connect to MongoDB with URI: {MONGO_URI[:20]}...")  # Only show start of URI for security

    DB_NAME = "walletAnalyzer"
    COLLECTION_NAME = "wallets"

    # NOTE(review): tlsAllowInvalidCertificates=True disables certificate
    # verification — acceptable for development only; confirm before production.
    client = MongoClient(
        MONGO_URI,
        tls=True,
        tlsAllowInvalidCertificates=True
    )
    db = client[DB_NAME]
    # MongoClient connects lazily, so this confirms construction, not a live server.
    print("Successfully connected to MongoDB")
    return db[COLLECTION_NAME]
34
+
35
# Module-level handle to the 'wallets' collection, shared by the functions below.
collection = get_mongo_connection()
36
+
37
+ # Fetch Aggregated Data from API
38
def fetch_aggregated_data(api_url, timeout=30):
    """GET aggregated trend stats from *api_url* and return the parsed JSON.

    Args:
        api_url: Endpoint returning portfolioMetrics JSON.
        timeout: Seconds before the request aborts; the original call had no
            timeout, so a stalled server could hang the caller forever.
    """
    print(f"Fetching data from API: {api_url}")
    response = requests.get(api_url, timeout=timeout)
    print(f"API Response status code: {response.status_code}")
    return response.json()
43
+
44
+ # Extract States from Wallet Data
45
def extract_state(wallet, api_data):
    """Build the fixed-length 25-feature state vector for one wallet.

    Layout: [totalValue, holdingCount, avgMarketCap, apiAvgPortfolioValue,
    apiTotalPortfolioValue] + 8 token balances + 8 token prices + 4 zero pads.

    Returns:
        numpy array of length 25, or None when the wallet has no topHoldings.
    """
    def _to_float(value):
        # Tolerate None, numeric strings, and Mongo extended-JSON wrappers
        # like {'$numberDouble': '1.5'}; the original float(...) raised
        # TypeError when a holding carried a None marketCap/price/balance.
        if isinstance(value, dict):
            value = value.get('$numberDouble', 0)
        try:
            return float(value)
        except (TypeError, ValueError):
            return 0.0

    print(f"\nExtracting state for wallet: {wallet.get('address', 'Unknown address')}")

    if not wallet.get("topHoldings"):
        print("Warning: Wallet has no topHoldings")
        return None

    print(f"Number of top holdings: {len(wallet['topHoldings'])}")

    # Pad or truncate topHoldings to exactly 8 tokens. Slicing copies the
    # list, so padding never mutates the wallet document itself.
    MAX_TOKENS = 8
    padded_holdings = wallet['topHoldings'][:MAX_TOKENS]
    while len(padded_holdings) < MAX_TOKENS:
        padded_holdings.append({
            'marketCap': '0',
            'price': '0',
            'balance': '0',
            'symbol': 'EMPTY'
        })

    market_caps = [_to_float(h.get('marketCap')) for h in padded_holdings]
    token_prices = [_to_float(h.get('price')) for h in padded_holdings]
    token_balances = [_to_float(h.get('balance')) for h in padded_holdings]

    print(f"Market caps: {market_caps}")
    print(f"Token prices: {token_prices}")
    print(f"Token balances: {token_balances}")

    avg_market_cap = sum(market_caps) / len(market_caps) if market_caps else 0
    print(f"Average market cap: {avg_market_cap}")

    # totalValue may arrive as a Mongo extended-JSON dict; normalize to float.
    total_value = _to_float(wallet['totalValue'])
    print(f"Total wallet value: {total_value}")

    # 5 portfolio metrics + 8 balances + 8 prices = 21 features.
    state = [
        total_value,                 # Total portfolio value
        len(wallet['topHoldings']),  # Original (unpadded) number of holdings
        avg_market_cap,              # Average market cap of top holdings
        api_data['portfolioMetrics']['averagePortfolioValue'],  # Average portfolio value
        api_data['portfolioMetrics']['totalPortfolioValue']     # Total portfolio value
    ] + token_balances + token_prices

    # Zero-pad to the 25 features the trained model expects.
    state.extend([0.0] * 4)

    print(f"Final state vector shape: {len(state)}")
    print(f"State vector: {state}\n")
    return np.array(state)
99
+
100
+ # Normalize Features
101
def normalize_states(states, scaler=None):
    """Standardize state vectors, fitting a new StandardScaler when none is given.

    Returns the transformed matrix together with the scaler that produced it,
    so callers can reuse the same scaling for later samples.
    """
    print("\nNormalizing states...")
    matrix = np.array(states)
    print(f"Input states shape: {matrix.shape}")

    if scaler is None:
        scaler = StandardScaler()
        matrix = scaler.fit_transform(matrix)
        print("Created new scaler and fit_transformed states")
    else:
        matrix = scaler.transform(matrix)
        print("Used existing scaler to transform states")

    print(f"Normalized states shape: {matrix.shape}")
    print(f"Normalized states sample: {matrix[0][:5]}...\n")
    return matrix, scaler
118
+
119
+ # Add this new function to create the summary
120
def generate_trading_summary(wallet_address, holdings_analysis):
    """
    Generate a natural language summary of trading recommendations using Langchain.

    Args:
        wallet_address: Address string interpolated into the prompt.
        holdings_analysis: Per-token analysis (list of dicts with symbol,
            balance, action, confidence, q_values) rendered into the prompt.

    Returns:
        The LLM completion string, or None on any failure (errors are
        printed, never raised).
    """
    try:
        # Requires OPENAI_API_KEY in the environment (loaded via load_dotenv).
        llm = OpenAI(temperature=0.7, openai_api_key=os.getenv("OPENAI_API_KEY"))

        # Create a prompt template
        template = """
        As a crypto trading advisor, analyze the following wallet and its DDQN holdings analysis:

        Wallet Address: {wallet_address}

        Holdings Analysis:
        {holdings_details}

        Please provide a concise summary of the recommended trading actions, including:
        1. Overall portfolio assessment
        2. Specific recommendations for each token
        3. Key opportunities and risks

        Summary:
        """

        # Create prompt with template
        prompt = PromptTemplate(
            input_variables=["wallet_address", "holdings_details"],
            template=template
        )

        # Create and run the chain using the new pattern
        # (LangChain Expression Language: input dict -> prompt -> llm)
        chain = (
            {"wallet_address": itemgetter("wallet_address"),
             "holdings_details": itemgetter("holdings_details")}
            | prompt
            | llm
        )

        # Invoke the chain with the new pattern
        summary = chain.invoke({
            "wallet_address": wallet_address,
            "holdings_details": holdings_analysis
        })

        print("\n=== AI Generated Trading Summary ===")
        print(summary)
        return summary

    except Exception as e:
        # Broad catch keeps the CLI flow alive if the LLM call fails; the
        # caller treats None as "no summary available".
        print(f"Error generating summary: {str(e)}")
        return None
171
+
172
+ # Load and Test the Trained Model
173
def test_model_on_wallet(wallet_identifier, api_url, model_path):
    """Load the trained model, score one wallet, and print per-token actions.

    Args:
        wallet_identifier: Wallet address or .sol domain looked up in Mongo.
        api_url: Endpoint for aggregated portfolio metrics.
        model_path: Path to the saved Keras model (.h5).

    Side effects only (prints + LLM summary); returns None.
    """
    # Load the trained model without compilation
    model = tf.keras.models.load_model(model_path, compile=False)
    print("Model loaded successfully.")

    # Recompile the model with the correct loss function
    model.compile(optimizer=tf.keras.optimizers.Adam(learning_rate=0.001), loss='mse')
    print("Model recompiled with MSE loss.")

    # Fetch API data
    api_data = fetch_aggregated_data(api_url)

    # Fetch wallet from database (matches either the address or the domain)
    wallet = collection.find_one({"$or": [{"address": wallet_identifier}, {"domain": wallet_identifier}]})
    if wallet is None:
        print(f"Wallet with identifier {wallet_identifier} not found in the database.")
        return

    # Extract state
    state = extract_state(wallet, api_data)
    if state is None:
        print(f"Wallet {wallet_identifier} has no topHoldings or insufficient data.")
        return

    # Normalize the state (use a pre-fitted scaler if available)
    # NOTE(review): a fresh StandardScaler is fit on this single sample, which
    # standardizes every feature to zero — consider persisting the
    # training-time scaler and reusing it here; confirm intent.
    states, scaler = normalize_states([state])
    normalized_state = states[0]  # Extract the first (and only) normalized state

    # Predict actions using the model
    q_values = model.predict(normalized_state.reshape(1, -1))[0]

    # Iterate over all tokens in the wallet and output the best action
    print(f"\nAnalyzing wallet: {wallet['address']}")
    print(f"Q-values: {q_values}")

    # Create a list to store analysis results
    holdings_analysis = []

    for token_index, holding in enumerate(wallet["topHoldings"]):
        # Determine the best action for this token (3 Q-values per token)
        actions = ["Buy", "Sell", "Hold"]
        # NOTE(review): assumes the model emits 3 Q-values per holding; with
        # more holdings than the model covers this slice is empty and
        # np.argmax raises — verify against the model's output size.
        token_q_values = q_values[token_index * 3: (token_index + 1) * 3]
        best_action_index = np.argmax(token_q_values)
        best_action = actions[best_action_index]

        # Calculate confidence as the difference between the best Q-value and the average of others
        confidence = token_q_values[best_action_index] - np.mean(token_q_values)

        # Store the analysis
        holdings_analysis.append({
            "symbol": holding["symbol"],
            "balance": holding.get("balance", 0),
            "action": best_action,
            "confidence": confidence,
            "q_values": token_q_values.tolist()
        })

        # Output the action for the token
        print(f"Token: {holding['symbol']}, Best action: {best_action}, Q-values: {token_q_values}")

    # Generate and display the trading summary
    generate_trading_summary(wallet['address'], holdings_analysis)
235
+
236
+
237
if __name__ == "__main__":
    # Interactive entry point: prompt for a wallet and run the full analysis.
    wallet_identifier = input("Enter the wallet address or .sol domain to analyze: ").strip()
    test_model_on_wallet(wallet_identifier, API_URL, MODEL_PATH)
rl_wallet_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a3055e68bb0f8eeb44e06cba1cb8fd3219cb8f1d74f5a65fb1a26684d1a8f24
3
+ size 145360
test.py ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import numpy as np
2
+ import tensorflow as tf
3
+ from tensorflow.keras import layers
4
+ from pymongo import MongoClient
5
+ import requests
6
+ import random
7
+ from sklearn.preprocessing import StandardScaler
8
+ import os
9
+ from dotenv import load_dotenv
10
+
11
# Load environment variables from .env file (provides MONGODB_URI)
load_dotenv()
13
+
14
+ # MongoDB Connection Setup
15
def get_mongo_connection():
    """Return the 'wallets' collection from the walletAnalyzer database.

    Raises:
        RuntimeError: if MONGODB_URI is unset — MongoClient(None) would
            otherwise silently fall back to localhost:27017.
    """
    MONGO_URI = os.getenv("MONGODB_URI")
    if not MONGO_URI:
        raise RuntimeError("MONGODB_URI environment variable is not set")
    DB_NAME = "walletAnalyzer"
    COLLECTION_NAME = "wallets"

    # NOTE(review): tlsAllowInvalidCertificates=True disables certificate
    # verification; acceptable for development only.
    client = MongoClient(
        MONGO_URI,
        tls=True,
        tlsAllowInvalidCertificates=True
    )
    db = client[DB_NAME]
    return db[COLLECTION_NAME]
27
+
28
# Module-level handle to the 'wallets' collection, shared by the functions below.
collection = get_mongo_connection()
29
+
30
+ # Fetch Aggregated Data from API
31
def fetch_aggregated_data(api_url, timeout=30):
    """GET aggregated trend stats from *api_url* and return the parsed JSON.

    Args:
        api_url: Endpoint returning portfolioMetrics JSON.
        timeout: Seconds before the request aborts; the original call had no
            timeout, so a stalled server could hang the caller forever.
    """
    response = requests.get(api_url, timeout=timeout)
    return response.json()
34
+
35
+ # Extract States from Wallet Data
36
def extract_state(wallet, api_data):
    """Build a numeric state vector for one wallet.

    Layout: [totalValue, holdingCount, avgMarketCap, apiAvgPortfolioValue,
    apiTotalPortfolioValue] + one balance and one price per holding.

    Returns:
        numpy array, or None when the wallet has no topHoldings.

    NOTE(review): the vector length varies with the number of holdings here,
    while ddqn.py pads to a fixed 25 features for the same saved model —
    confirm which shape rl_wallet_model.h5 actually expects.
    """
    if wallet.get("topHoldings") is None or not wallet["topHoldings"]:
        return None  # Skip wallets without topHoldings

    def _to_float(value):
        # Holdings enriched from DexScreener can carry None for marketCap or
        # price; float(None) raised TypeError in the original, so coerce bad
        # values to 0.0 instead.
        try:
            return float(value)
        except (TypeError, ValueError):
            return 0.0

    market_caps = [_to_float(h.get('marketCap', 0)) for h in wallet['topHoldings']]
    token_prices = [_to_float(h.get('price', 0)) for h in wallet['topHoldings']]
    token_balances = [_to_float(h.get('balance', 0)) for h in wallet['topHoldings']]

    avg_market_cap = sum(market_caps) / len(market_caps) if market_caps else 0

    # Ensure totalValue is a float (Mongo extended JSON wraps doubles)
    total_value = wallet['totalValue']
    if isinstance(total_value, dict) and '$numberDouble' in total_value:
        total_value = float(total_value['$numberDouble'])

    state = [
        total_value,                 # Total portfolio value
        len(wallet['topHoldings']),  # Number of holdings
        avg_market_cap,              # Average market cap of top holdings
        api_data['portfolioMetrics']['averagePortfolioValue'],  # Average portfolio value
        api_data['portfolioMetrics']['totalPortfolioValue']     # Total portfolio value
    ] + token_balances + token_prices

    return np.array(state)
60
+
61
+ # Normalize Features
62
def normalize_states(states, scaler=None):
    """Standardize state vectors.

    Fits a fresh StandardScaler when *scaler* is None, otherwise reuses the
    one supplied. Returns (normalized_states, scaler).
    """
    if scaler is not None:
        return scaler.transform(states), scaler
    fresh = StandardScaler()
    return fresh.fit_transform(states), fresh
69
+
70
+ # Load and Test the Trained Model
71
def test_model_on_random_wallet(api_url, model_path):
    """Load the trained model and print Buy/Sell/Hold picks for one random wallet.

    Args:
        api_url: Endpoint for aggregated portfolio metrics.
        model_path: Path to the saved Keras model (.h5).

    Side effects only (prints); returns None.
    """
    # Load the trained model without compilation
    model = tf.keras.models.load_model(model_path, compile=False)
    print("Model loaded successfully.")

    # Recompile the model with the correct loss function
    model.compile(optimizer=tf.keras.optimizers.Adam(learning_rate=0.001), loss='mse')
    print("Model recompiled with MSE loss.")

    # Fetch API data
    api_data = fetch_aggregated_data(api_url)

    # Retry fetching a wallet with topHoldings
    max_retries = 10
    for attempt in range(max_retries):
        # $sample draws one random document from the collection
        random_wallet = collection.aggregate([{"$sample": {"size": 1}}]).next()
        state = extract_state(random_wallet, api_data)
        if state is not None:
            break
        print(f"Attempt {attempt + 1}: Wallet has no topHoldings. Retrying...")
    else:
        # for/else: runs only when the loop exhausted without a break
        print("Failed to fetch a valid wallet with topHoldings after multiple attempts.")
        return

    # Normalize the state (use a pre-fitted scaler if available)
    # NOTE(review): fitting StandardScaler on a single sample standardizes
    # every feature to zero — consider reusing the training-time scaler.
    states, scaler = normalize_states([state])
    normalized_state = states[0]  # Extract the first (and only) normalized state

    # Predict actions using the model
    q_values = model.predict(normalized_state.reshape(1, -1))[0]

    # Iterate over all tokens in the wallet and output the best action
    print(f"Testing on wallet: {random_wallet['address']}")
    print(f"Q-values: {q_values}")

    for token_index, holding in enumerate(random_wallet["topHoldings"]):
        # Determine the best action for this token (3 Q-values per token)
        actions = ["Buy", "Sell", "Hold"]
        # NOTE(review): assumes 3 Q-values exist per holding; with more
        # holdings than the model covers this slice is empty and argmax raises.
        token_q_values = q_values[token_index * 3: (token_index + 1) * 3]
        best_action_index = np.argmax(token_q_values)
        best_action = actions[best_action_index]

        # Output the action for the token
        token_symbol = holding["symbol"]
        print(f"Token: {token_symbol}, Best action: {best_action}, Q-values: {token_q_values}")
116
+
117
if __name__ == "__main__":
    # Script entry point: configure endpoints, then evaluate a random wallet.
    API_URL = "https://soltrendio.com/api/stats/getTrends"  # Replace with your actual API URL
    MODEL_PATH = "rl_wallet_model.h5"  # Path to the trained model

    # Test the model on a random wallet
    test_model_on_random_wallet(API_URL, MODEL_PATH)
train.py ADDED
@@ -0,0 +1,280 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import numpy as np
2
+ import tensorflow as tf
3
+ from tensorflow.keras import layers
4
+ from pymongo import MongoClient
5
+ import requests
6
+ import random
7
+ from collections import deque
8
+ from sklearn.preprocessing import StandardScaler
9
+ import os
10
+ from dotenv import load_dotenv
11
+
12
# Load environment variables from .env file (provides MONGODB_URI)
load_dotenv()
14
+
15
+ # MongoDB Connection Setup
16
+ # Define connection parameters and establish connection to MongoDB
17
def get_mongo_connection():
    """Return the 'wallets' collection from the walletAnalyzer database.

    Raises:
        RuntimeError: if MONGODB_URI is unset — MongoClient(None) would
            otherwise silently fall back to localhost:27017.
    """
    MONGO_URI = os.getenv("MONGODB_URI")
    if not MONGO_URI:
        raise RuntimeError("MONGODB_URI environment variable is not set")
    DB_NAME = "walletAnalyzer"
    COLLECTION_NAME = "wallets"

    # NOTE(review): tlsAllowInvalidCertificates=True disables certificate
    # verification; acceptable for development only.
    client = MongoClient(
        MONGO_URI,
        tls=True,
        tlsAllowInvalidCertificates=True
    )
    db = client[DB_NAME]
    return db[COLLECTION_NAME]
29
+
30
# Module-level handle to the 'wallets' collection, shared by the functions below.
collection = get_mongo_connection()
31
+
32
# DexScreener API URL; a token contract address is appended per request
DEX_API_URL = "https://api.dexscreener.com/latest/dex/tokens"
34
+
35
+ # Fetch Aggregated Data from API
36
+ # Retrieve portfolio and token trends from external API
37
def fetch_aggregated_data(api_url, timeout=30):
    """GET aggregated trend stats from *api_url* and return the parsed JSON.

    Args:
        api_url: Endpoint returning portfolioMetrics JSON.
        timeout: Seconds before the request aborts; the original call had no
            timeout, so a stalled server could hang training forever.
    """
    response = requests.get(api_url, timeout=timeout)
    return response.json()
40
+
41
+ # Retrieve Contract Address for Token
42
+ # Find the contract address of a Solana token by its ticker symbol
43
def get_solana_token_ca(ticker):
    """Resolve a Solana token's contract address from its ticker via DexScreener.

    Prefers an exact (case-insensitive) symbol match on either side of a
    Solana pair; otherwise falls back to the first Solana pair's base/quote
    address. Returns None when nothing is found or the request fails.
    """
    try:
        url = f"https://api.dexscreener.com/latest/dex/search?q={ticker}"
        # timeout prevents a stalled DexScreener request from hanging callers.
        response = requests.get(url, timeout=30)
        response.raise_for_status()
        data = response.json()

        wanted = ticker.upper()
        first_found_address = None
        for pair in data.get('pairs', []):
            if pair.get('chainId') != 'solana':
                continue
            base_token = pair.get('baseToken', {})
            quote_token = pair.get('quoteToken', {})

            if first_found_address is None:
                first_found_address = base_token.get('address') or quote_token.get('address')

            # Guard missing symbols: .get('symbol') can return None, and the
            # original's None.upper() raised AttributeError (not caught below,
            # since only RequestException is handled).
            if (base_token.get('symbol') or '').upper() == wanted:
                return base_token.get('address')
            if (quote_token.get('symbol') or '').upper() == wanted:
                return quote_token.get('address')

        return first_found_address
    except requests.RequestException as e:
        print(f"Error fetching token data: {e}")
        return None
68
+
69
+ # Fetch Market Data for Token
70
+ # Retrieve market cap and price data for a token contract address
71
def fetch_market_data(contract_address):
    """Fetch marketCap and priceUsd for *contract_address* from DexScreener.

    Returns:
        {'marketCap': ..., 'price': ...} — either value may be None when the
        pair omits it — or None on any failure (non-200, no pairs, exception).
    """
    try:
        # timeout added so a stalled request cannot hang the wallet-update loop.
        response = requests.get(f"{DEX_API_URL}/{contract_address}", timeout=30)
        if response.status_code == 200:
            data = response.json()
            if "pairs" in data and len(data["pairs"]) > 0:
                # Use the first pair reported by DexScreener.
                pair = data["pairs"][0]
                return {
                    "marketCap": pair.get("marketCap"),
                    "price": pair.get("priceUsd"),
                }
        else:
            print(f"Failed to fetch data for contract address {contract_address}: {response.status_code}")
    except Exception as e:
        print(f"Error fetching market data for contract address {contract_address}: {e}")
    # Empty pairs, non-200, or exception all fall through to None.
    return None
87
+
88
+ # Update Wallets in Database
89
+ # Enhance wallet data with token market information and contract addresses
90
def update_wallets():
    """Backfill contractAddress, marketCap and price on each wallet's topHoldings.

    Iterates every wallet document in Mongo; a wallet is written back only
    when at least one of its holdings was actually enriched.
    """
    wallets = collection.find()
    for wallet in wallets:
        updated = False
        if wallet.get("topHoldings") is None or not wallet["topHoldings"]:
            continue  # nothing to enrich
        for holding in wallet.get("topHoldings", []):
            symbol = holding.get("symbol")
            contract_address = holding.get("contractAddress")

            if not contract_address:
                contract_address = get_solana_token_ca(symbol)
                if contract_address:
                    holding["contractAddress"] = contract_address
                    print(f"Updated {symbol} with contract address {contract_address}.")
                    updated = True

            # Skip the market-data call when no contract address could be
            # resolved: the original issued a useless request to ".../None".
            if contract_address and ("marketCap" not in holding or "price" not in holding):
                market_data = fetch_market_data(contract_address)
                if market_data:
                    holding["marketCap"] = market_data["marketCap"]
                    holding["price"] = market_data["price"]
                    updated = True
                    print(f"Updated {symbol} in wallet {wallet['address']} with marketCap and price.")

        if updated:
            collection.update_one({"_id": wallet["_id"]}, {"$set": {"topHoldings": wallet["topHoldings"]}})
117
+
118
+ # Extract States from Wallet Data
119
+ # Convert wallet data into numerical state vectors for RL training
120
def extract_state(wallet, api_data, max_tokens=10):
    """Convert one wallet document into a fixed-length numeric state vector.

    Layout: [totalValue, holdingCount, avgMarketCap, apiAvgPortfolioValue,
    apiTotalPortfolioValue] + max_tokens balances + max_tokens prices.

    Returns:
        numpy array of length 5 + 2 * max_tokens, or None when the wallet
        has no topHoldings.
    """
    if wallet.get("topHoldings") is None or not wallet["topHoldings"]:
        return None  # Skip wallets without topHoldings

    def _to_float(value):
        # update_wallets() can store marketCap/price as None when DexScreener
        # omits them; float(None) raised TypeError in the original, so coerce
        # bad values to 0.0 instead.
        try:
            return float(value)
        except (TypeError, ValueError):
            return 0.0

    # Extract market caps, token prices, and balances (truncated to max_tokens)
    holdings = wallet['topHoldings'][:max_tokens]
    market_caps = [_to_float(h.get('marketCap', 0)) for h in holdings]
    token_prices = [_to_float(h.get('price', 0)) for h in holdings]
    token_balances = [_to_float(h.get('balance', 0)) for h in holdings]

    # Pad with zeros to ensure fixed length
    market_caps += [0] * (max_tokens - len(market_caps))
    token_prices += [0] * (max_tokens - len(token_prices))
    token_balances += [0] * (max_tokens - len(token_balances))

    avg_market_cap = sum(market_caps) / len(market_caps) if market_caps else 0

    # Ensure totalValue is a float (Mongo extended JSON wraps doubles)
    total_value = wallet['totalValue']
    if isinstance(total_value, dict) and '$numberDouble' in total_value:
        total_value = float(total_value['$numberDouble'])

    state = [
        total_value,                 # Total portfolio value
        len(wallet['topHoldings']),  # Full (untruncated) holding count
        avg_market_cap,              # Average market cap of top holdings
        api_data['portfolioMetrics']['averagePortfolioValue'],  # Average portfolio value
        api_data['portfolioMetrics']['totalPortfolioValue'],    # Total portfolio value
    ] + token_balances + token_prices  # Include token balances and prices

    return np.array(state)
150
+
151
+
152
+
153
+ # Normalize Features
154
+ # Standardize state features for improved model training
155
def normalize_states(states):
    """Fit a StandardScaler on *states* and return the standardized array.

    The fitted scaler is discarded; callers only receive the transformed data.
    """
    return StandardScaler().fit_transform(states)
158
+
159
+ # Create DQN Model
160
+ # Define the neural network for the RL agent
161
def create_dqn(state_size, action_size):
    """Build and compile the Q-network: two 64-unit ReLU layers feeding a
    linear head with one output (Q-value) per discrete action.

    Args:
        state_size: Length of the input state vector.
        action_size: Number of discrete actions (3 per token: Buy/Sell/Hold).

    Returns:
        A compiled tf.keras.Sequential model (Adam lr=0.001, MSE loss).
    """
    model = tf.keras.Sequential([
        layers.Dense(64, activation='relu', input_shape=(state_size,)),
        layers.Dense(64, activation='relu'),
        layers.Dense(action_size, activation='linear')
    ])
    model.compile(optimizer=tf.keras.optimizers.Adam(learning_rate=0.001), loss='mse')
    return model
169
+
170
+ # Simulate Next State
171
+ # Generate the next state based on the action taken and simulated market changes
172
def simulate_next_state(state, action, token_prices, token_balances):
    """Apply *action* to a copy of *state* and simulate one market tick.

    Action encoding: action // 3 selects the token, action % 3 the move
    (0=Buy, 1=Sell, 2=Hold). Token balances live at state[5:].

    Returns:
        (next_state, new_token_prices). The input *state* is left untouched:
        the original mutated it in place, so replay-buffer entries aliased
        state == next_state and the reward's value change was always zero.
    """
    next_state = np.array(state, dtype=float)  # defensive copy — the fix
    token_idx = action // 3   # Determine token index
    action_type = action % 3  # Determine action type (Buy, Sell, Hold)

    if action_type == 0:    # Buy
        next_state[token_idx + 5] += 1  # Increase token balance
    elif action_type == 1:  # Sell
        next_state[token_idx + 5] -= 1  # Decrease token balance

    # Simulate market changes in token prices (uniform ±5% random walk)
    token_prices = [price * np.random.uniform(0.95, 1.05) for price in token_prices]

    # Update total portfolio value based on new token balances and prices.
    # NOTE(review): this intentionally preserves the original's use of the
    # *passed-in* token_balances, which does not reflect the balance changed
    # above — confirm whether the traded balance should be included.
    total_value = sum(balance * price for balance, price in zip(token_balances, token_prices))
    next_state[0] = total_value  # Update total portfolio value

    return next_state, token_prices
189
+
190
+ # Termination Logic
191
+ # Define conditions for ending an RL episode
192
def check_termination(state, steps, max_steps):
    """An episode ends once the portfolio is wiped out or the step budget is spent."""
    portfolio_value = state[0]
    if portfolio_value <= 0 or steps >= max_steps:
        return True
    return False
196
+
197
+ # Reward Function
198
+ # Calculate rewards based on portfolio performance and risk
199
def calculate_reward(old_value, new_value, diversification_score):
    """Relative portfolio change, penalized by (1 - diversification_score).

    When old_value is not positive the change term is treated as zero, so the
    reward reduces to the pure diversification penalty.
    """
    if old_value > 0:
        value_change = (new_value - old_value) / old_value
    else:
        value_change = 0
    # Penalize lack of diversification
    return value_change - (1 - diversification_score)
203
+
204
+ # Main Training Loop
205
+ # Train the RL agent by simulating interactions with the environment
206
+ # Main Training Loop
207
def train_rl_model(api_url):
    """Train a DQN trading agent on wallet states sampled from MongoDB.

    Pipeline: enrich wallets, build and normalize state vectors, then run
    `episodes` simulated episodes with epsilon-greedy control and experience
    replay, finally saving the model to rl_wallet_model.h5.
    """
    update_wallets()  # Ensure wallets are updated before training

    data = collection.find()  # Fetch data directly from updated collection
    api_data = fetch_aggregated_data(api_url)

    # Extract valid states, skipping None
    states = [
        state for wallet in data
        if (state := extract_state(wallet, api_data)) is not None
    ]

    # Ensure states list is not empty before proceeding
    if not states:
        print("No valid states available for training.")
        return

    states = normalize_states(states)

    state_size = len(states[0])
    # NOTE(review): states[0][5:] holds balances AND prices (2 * max_tokens
    # entries), so this allocates 3 actions for twice the number of real
    # tokens — confirm whether 3 * max_tokens was intended.
    action_size = 3 * len(states[0][5:])  # Buy, Sell, Hold for each token

    model = create_dqn(state_size, action_size)
    replay_buffer = deque(maxlen=2000)
    gamma = 0.99  # discount factor

    episodes = 100
    for episode in range(episodes):
        state = states[np.random.randint(0, len(states))]  # Random start
        # NOTE: with k = len(state[5:]), state[-k:] and state[5:5+k] are BOTH
        # the entire tail state[5:], so "prices" and "balances" here are the
        # same 2*max_tokens values — verify the intended slice boundaries.
        token_prices = state[-len(state[5:]):]  # Extract token prices from state
        token_balances = state[5:5 + len(state[5:])]  # Extract token balances from state
        steps = 0
        done = False

        while not done:
            # Fixed epsilon = 0.1 (no decay schedule).
            if np.random.rand() < 0.1:  # Exploration
                action = np.random.choice(action_size)
            else:  # Exploitation
                action = np.argmax(model.predict(state.reshape(1, -1))[0])

            next_state, token_prices = simulate_next_state(state, action, token_prices, token_balances)
            diversification_score = len(set(token_balances)) / len(token_balances)  # Diversity metric
            reward = calculate_reward(state[0], next_state[0], diversification_score)
            done = check_termination(next_state, steps, max_steps=50)

            replay_buffer.append((state, action, reward, next_state, done))

            # Train on a random minibatch once the buffer has enough samples.
            if len(replay_buffer) > 32:
                minibatch = random.sample(replay_buffer, 32)
                states_mb, actions_mb, rewards_mb, next_states_mb, dones_mb = zip(*minibatch)

                targets = model.predict(np.array(states_mb))
                # NOTE(review): next-state Q-values come from the same online
                # network — this is plain DQN, not double DQN, despite the
                # file name; confirm whether a target network was intended.
                next_q_values = model.predict(np.array(next_states_mb))

                for i in range(32):
                    if dones_mb[i]:
                        targets[i][actions_mb[i]] = rewards_mb[i]
                    else:
                        targets[i][actions_mb[i]] = rewards_mb[i] + gamma * np.max(next_q_values[i])

                model.fit(np.array(states_mb), targets, epochs=1, verbose=0)

            state = next_state
            steps += 1

        print(f"Episode {episode + 1}/{episodes} completed.")

    model.save("rl_wallet_model.h5")
    print("Model training complete and saved.")
276
+
277
+
278
if __name__ == "__main__":
    # Script entry point: train the agent against the live trends endpoint.
    API_URL = "https://soltrendio.com/api/stats/getTrends"  # Replace with your actual API URL
    train_rl_model(API_URL)