Javier Marin committed on
Upload Hamiltonian_final_version.ipynb
Browse files
Notebook/Hamiltonian_final_version.ipynb
ADDED
|
@@ -0,0 +1,1817 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"nbformat": 4,
|
| 3 |
+
"nbformat_minor": 0,
|
| 4 |
+
"metadata": {
|
| 5 |
+
"colab": {
|
| 6 |
+
"provenance": []
|
| 7 |
+
},
|
| 8 |
+
"kernelspec": {
|
| 9 |
+
"name": "python3",
|
| 10 |
+
"display_name": "Python 3"
|
| 11 |
+
},
|
| 12 |
+
"language_info": {
|
| 13 |
+
"name": "python"
|
| 14 |
+
}
|
| 15 |
+
},
|
| 16 |
+
"cells": [
|
| 17 |
+
{
|
| 18 |
+
"cell_type": "code",
|
| 19 |
+
"source": [
|
| 20 |
+
"\"\"\"\n",
|
| 21 |
+
"This script corresponds to the experiments conducted for\n",
|
| 22 |
+
"writing the paper \"Optimizing AI Reasoning: A Hamiltonian Dynamics Approach to\n",
|
| 23 |
+
"Multi-Hop Question Answering\".\n",
|
| 24 |
+
"\n",
|
| 25 |
+
"Author: Javier Marín\n",
|
| 26 |
+
"Email: javier@jmarin.info\n",
|
| 27 |
+
"Version: 1.0.0\n",
|
| 28 |
+
"Date: October 5, 2024\n",
|
| 29 |
+
"\n",
|
| 30 |
+
"License: MIT License\n",
|
| 31 |
+
"\n",
|
| 32 |
+
"Copyright (c) 2024 Javier Marín\n",
|
| 33 |
+
"\n",
|
| 34 |
+
"Permission is hereby granted, free of charge, to any person obtaining a copy\n",
|
| 35 |
+
"of this software and associated documentation files (the \"Software\"), to deal\n",
|
| 36 |
+
"in the Software without restriction, including without limitation the rights\n",
|
| 37 |
+
"to use, copy, modify, merge, publish, distribute, sublicense, and/or sell\n",
|
| 38 |
+
"copies of the Software, and to permit persons to whom the Software is\n",
|
| 39 |
+
"furnished to do so, subject to the following conditions:\n",
|
| 40 |
+
"\n",
|
| 41 |
+
"The above copyright notice and this permission notice shall be included in all\n",
|
| 42 |
+
"copies or substantial portions of the Software.\n",
|
| 43 |
+
"\n",
|
| 44 |
+
"THE SOFTWARE IS PROVIDED \"AS IS\", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR\n",
|
| 45 |
+
"IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,\n",
|
| 46 |
+
"FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE\n",
|
| 47 |
+
"AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER\n",
|
| 48 |
+
"LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,\n",
|
| 49 |
+
"OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE\n",
|
| 50 |
+
"SOFTWARE.\n",
|
| 51 |
+
"\n",
|
| 52 |
+
"Dependencies:\n",
|
| 53 |
+
"- Python 3.8+\n",
|
| 54 |
+
"- NumPy\n",
|
| 55 |
+
"- Pandas\n",
|
| 56 |
+
"- PyTorch\n",
|
| 57 |
+
"- Transformers\n",
|
| 58 |
+
"- Scikit-learn\n",
|
| 59 |
+
"- SciPy\n",
|
| 60 |
+
"- Statsmodels\n",
|
| 61 |
+
"- Matplotlib\n",
|
| 62 |
+
"- Seaborn\n",
|
| 63 |
+
"\n",
|
| 64 |
+
"For a full list of dependencies and their versions, see requirements.txt\n",
|
| 65 |
+
"\"\"\""
|
| 66 |
+
],
|
| 67 |
+
"metadata": {
|
| 68 |
+
"id": "T-57ivc-aTrA"
|
| 69 |
+
},
|
| 70 |
+
"execution_count": null,
|
| 71 |
+
"outputs": []
|
| 72 |
+
},
|
| 73 |
+
{
|
| 74 |
+
"cell_type": "markdown",
|
| 75 |
+
"source": [
|
| 76 |
+
"## Imports"
|
| 77 |
+
],
|
| 78 |
+
"metadata": {
|
| 79 |
+
"id": "QUcpzyBmWpLv"
|
| 80 |
+
}
|
| 81 |
+
},
|
| 82 |
+
{
|
| 83 |
+
"cell_type": "code",
|
| 84 |
+
"execution_count": null,
|
| 85 |
+
"metadata": {
|
| 86 |
+
"id": "l2rfFoVtIL6_"
|
| 87 |
+
},
|
| 88 |
+
"outputs": [],
|
| 89 |
+
"source": [
|
| 90 |
+
"# Standard library imports\n",
|
| 91 |
+
"import os\n",
|
| 92 |
+
"import re\n",
|
| 93 |
+
"import time\n",
|
| 94 |
+
"\n",
|
| 95 |
+
"# Third-party imports\n",
|
| 96 |
+
"import numpy as np\n",
|
| 97 |
+
"import pandas as pd\n",
|
| 98 |
+
"import torch\n",
|
| 99 |
+
"import seaborn as sns\n",
|
| 100 |
+
"import matplotlib.pyplot as plt\n",
|
| 101 |
+
"from mpl_toolkits.mplot3d import Axes3D\n",
|
| 102 |
+
"\n",
|
| 103 |
+
"from transformers import AutoTokenizer, AutoModel\n",
|
| 104 |
+
"from statsmodels.multivariate.manova import MANOVA\n",
|
| 105 |
+
"from scipy import stats\n",
|
| 106 |
+
"from scipy.optimize import curve_fit\n",
|
| 107 |
+
"from scipy.integrate import odeint\n",
|
| 108 |
+
"from sklearn import (\n",
|
| 109 |
+
" metrics,\n",
|
| 110 |
+
" model_selection,\n",
|
| 111 |
+
" cluster,\n",
|
| 112 |
+
" decomposition,\n",
|
| 113 |
+
" feature_extraction,\n",
|
| 114 |
+
" linear_model\n",
|
| 115 |
+
")\n",
|
| 116 |
+
"\n",
|
| 117 |
+
"# Visualization settings\n",
|
| 118 |
+
"sns.set_theme(style=\"whitegrid\", context=\"paper\")\n",
|
| 119 |
+
"plt.rcParams['font.family'] = 'serif'\n",
|
| 120 |
+
"plt.rcParams['font.serif'] = ['Times New Roman'] + plt.rcParams['font.serif']"
|
| 121 |
+
]
|
| 122 |
+
},
|
| 123 |
+
{
|
| 124 |
+
"cell_type": "markdown",
|
| 125 |
+
"source": [
|
| 126 |
+
"## Load BERT pretrained model"
|
| 127 |
+
],
|
| 128 |
+
"metadata": {
|
| 129 |
+
"id": "4nApCVrOWkR3"
|
| 130 |
+
}
|
| 131 |
+
},
|
| 132 |
+
{
|
| 133 |
+
"cell_type": "code",
|
| 134 |
+
"source": [
|
| 135 |
+
"# Load pre-trained model and tokenizer\n",
|
| 136 |
+
"tokenizer = AutoTokenizer.from_pretrained(\"bert-base-uncased\")\n",
|
| 137 |
+
"model = AutoModel.from_pretrained(\"bert-base-uncased\")"
|
| 138 |
+
],
|
| 139 |
+
"metadata": {
|
| 140 |
+
"id": "hT2I1H8BIOp_"
|
| 141 |
+
},
|
| 142 |
+
"execution_count": null,
|
| 143 |
+
"outputs": []
|
| 144 |
+
},
|
| 145 |
+
{
|
| 146 |
+
"cell_type": "markdown",
|
| 147 |
+
"source": [
|
| 148 |
+
"## Load data"
|
| 149 |
+
],
|
| 150 |
+
"metadata": {
|
| 151 |
+
"id": "9KKw24bCWgWj"
|
| 152 |
+
}
|
| 153 |
+
},
|
| 154 |
+
{
|
| 155 |
+
"cell_type": "code",
|
| 156 |
+
"source": [
|
| 157 |
+
"# Load the OBQA dataset\n",
|
| 158 |
+
"df = pd.read_csv(\"obqa_chains.csv\", sep=\";\")\n",
|
| 159 |
+
"\n",
|
| 160 |
+
"# Ensure necessary columns exist\n",
|
| 161 |
+
"required_columns = ['QID', 'Chain#', 'Question', 'Answer', 'Fact1', 'Fact2', 'Turk']\n",
|
| 162 |
+
"missing_columns = [col for col in required_columns if col not in df.columns]\n",
|
| 163 |
+
"if missing_columns:\n",
|
| 164 |
+
" raise ValueError(f\"Missing required columns: {missing_columns}\")\n",
|
| 165 |
+
"\n",
|
| 166 |
+
"# Preprocess the data\n",
|
| 167 |
+
"df['Question'] = df['Question'] + \" \" + df['Answer'] # Combine question and answer\n",
|
| 168 |
+
"df['is_valid'] = df['Turk'].str.contains('yes', case=False, na=False)"
|
| 169 |
+
],
|
| 170 |
+
"metadata": {
|
| 171 |
+
"id": "g2f-T9koIOjH"
|
| 172 |
+
},
|
| 173 |
+
"execution_count": null,
|
| 174 |
+
"outputs": []
|
| 175 |
+
},
|
| 176 |
+
{
|
| 177 |
+
"cell_type": "markdown",
|
| 178 |
+
"source": [
|
| 179 |
+
"## Model embeddings"
|
| 180 |
+
],
|
| 181 |
+
"metadata": {
|
| 182 |
+
"id": "XdN9XTGOWdsh"
|
| 183 |
+
}
|
| 184 |
+
},
|
| 185 |
+
{
|
| 186 |
+
"cell_type": "code",
|
| 187 |
+
"source": [
|
| 188 |
+
"def get_bert_embedding(text):\n",
|
| 189 |
+
" \"\"\"Get BERT embedding for a given text.\"\"\"\n",
|
| 190 |
+
" inputs = tokenizer(text, return_tensors=\"pt\", padding=True, truncation=True, max_length=512)\n",
|
| 191 |
+
" with torch.no_grad():\n",
|
| 192 |
+
" outputs = model(**inputs)\n",
|
| 193 |
+
" return outputs.last_hidden_state.mean(dim=1).squeeze().numpy()\n",
|
| 194 |
+
"\n",
|
| 195 |
+
"def refined_hamiltonian_energy(chain):\n",
|
| 196 |
+
" emb1 = get_bert_embedding(chain['Fact1'])\n",
|
| 197 |
+
" emb2 = get_bert_embedding(chain['Fact2'])\n",
|
| 198 |
+
" emb_q = get_bert_embedding(chain['Question'])\n",
|
| 199 |
+
"\n",
|
| 200 |
+
" # Refined kinetic term: measure of change between facts\n",
|
| 201 |
+
" T = np.linalg.norm(emb2 - emb1)\n",
|
| 202 |
+
"\n",
|
| 203 |
+
" # Refined potential term: measure of relevance to question\n",
|
| 204 |
+
" V = (np.dot(emb1, emb_q) + np.dot(emb2, emb_q)) / 2\n",
|
| 205 |
+
"\n",
|
| 206 |
+
" # Total \"Hamiltonian\" energy: balance between change and relevance\n",
|
| 207 |
+
" H = T - V\n",
|
| 208 |
+
"\n",
|
| 209 |
+
" return H, T, V\n",
|
| 210 |
+
"\n",
|
| 211 |
+
"\n",
|
| 212 |
+
"# Analyze energy conservation\n",
|
| 213 |
+
"def energy_conservation_score(chain):\n",
|
| 214 |
+
" _, T, V = refined_hamiltonian_energy(chain)\n",
|
| 215 |
+
" # Measure how balanced T and V are\n",
|
| 216 |
+
" return 1 / (1 + abs(T - V)) # Now always between 0 and 1, 1 being perfect balance\n",
|
| 217 |
+
"\n",
|
| 218 |
+
"\n",
|
| 219 |
+
"\n",
|
| 220 |
+
"# Calculate refined energies and scores\n",
|
| 221 |
+
"df['H_energy'], df['T_energy'], df['V_energy'] = zip(*df.apply(refined_hamiltonian_energy, axis=1))\n",
|
| 222 |
+
"df['energy_conservation'] = df.apply(energy_conservation_score, axis=1)"
|
| 223 |
+
],
|
| 224 |
+
"metadata": {
|
| 225 |
+
"id": "3q4EMfekIOZ_"
|
| 226 |
+
},
|
| 227 |
+
"execution_count": null,
|
| 228 |
+
"outputs": []
|
| 229 |
+
},
|
| 230 |
+
{
|
| 231 |
+
"cell_type": "markdown",
|
| 232 |
+
"source": [
|
| 233 |
+
"## Hamiltonian systems"
|
| 234 |
+
],
|
| 235 |
+
"metadata": {
|
| 236 |
+
"id": "pvQgqhW2Wage"
|
| 237 |
+
}
|
| 238 |
+
},
|
| 239 |
+
{
|
| 240 |
+
"cell_type": "code",
|
| 241 |
+
"source": [
|
| 242 |
+
"def get_trajectory(row):\n",
|
| 243 |
+
" # Ensure we're working with strings\n",
|
| 244 |
+
" chain = [str(row['Fact1']), str(row['Fact2'])]\n",
|
| 245 |
+
" embeddings = [get_bert_embedding(sentence) for sentence in chain]\n",
|
| 246 |
+
" return np.array(embeddings)\n",
|
| 247 |
+
"\n",
|
| 248 |
+
"def refined_hamiltonian_energy(chain):\n",
|
| 249 |
+
" emb1 = get_bert_embedding(chain['Fact1'])\n",
|
| 250 |
+
" emb2 = get_bert_embedding(chain['Fact2'])\n",
|
| 251 |
+
"\n",
|
| 252 |
+
" # Refined kinetic term: measure of change between facts\n",
|
| 253 |
+
" T = np.linalg.norm(emb2 - emb1)\n",
|
| 254 |
+
"\n",
|
| 255 |
+
" # Refined potential term: measure of relevance to facts\n",
|
| 256 |
+
" V = (np.linalg.norm(emb1) + np.linalg.norm(emb2)) / 2\n",
|
| 257 |
+
"\n",
|
| 258 |
+
" # Total \"Hamiltonian\" energy: balance between change and relevance\n",
|
| 259 |
+
" H = T - V\n",
|
| 260 |
+
"\n",
|
| 261 |
+
" return H, T, V\n",
|
| 262 |
+
"\n",
|
| 263 |
+
"\n",
|
| 264 |
+
"def compute_trajectory_energy(trajectory):\n",
|
| 265 |
+
" return refined_hamiltonian_energy({'Fact1': str(trajectory[0]), 'Fact2': str(trajectory[1])})[0]\n",
|
| 266 |
+
"\n",
|
| 267 |
+
"\n",
|
| 268 |
+
"# Compute trajectories for all chains\n",
|
| 269 |
+
"trajectories = df.apply(get_trajectory, axis=1)\n",
|
| 270 |
+
"\n",
|
| 271 |
+
"# Compute energies for trajectories\n",
|
| 272 |
+
"trajectory_energies = trajectories.apply(compute_trajectory_energy)\n"
|
| 273 |
+
],
|
| 274 |
+
"metadata": {
|
| 275 |
+
"id": "yveIXutUX3ub"
|
| 276 |
+
},
|
| 277 |
+
"execution_count": null,
|
| 278 |
+
"outputs": []
|
| 279 |
+
},
|
| 280 |
+
{
|
| 281 |
+
"cell_type": "code",
|
| 282 |
+
"source": [
|
| 283 |
+
"# Use PCA to reduce dimensionality for visualization\n",
|
| 284 |
+
"pca = PCA(n_components=3)\n",
|
| 285 |
+
"all_points = np.vstack(trajectories.values)\n",
|
| 286 |
+
"pca_result = pca.fit_transform(all_points)\n",
|
| 287 |
+
"\n",
|
| 288 |
+
"trajectories_3d = trajectories.apply(lambda t: pca.transform(t))\n",
|
| 289 |
+
"\n",
|
| 290 |
+
"\n",
|
| 291 |
+
"# Analyze trajectory properties\n",
|
| 292 |
+
"def trajectory_length(traj):\n",
|
| 293 |
+
" return np.sum(np.sqrt(np.sum(np.diff(traj, axis=0)**2, axis=1)))\n",
|
| 294 |
+
"\n",
|
| 295 |
+
"def trajectory_smoothness(traj):\n",
|
| 296 |
+
" first = abs(np.diff(traj[0], axis=0))[0]\n",
|
| 297 |
+
" second = abs(np.diff(traj[1], axis=0))[0]\n",
|
| 298 |
+
" return (first + second)/2\n",
|
| 299 |
+
"\n",
|
| 300 |
+
"traj_properties = pd.DataFrame({\n",
|
| 301 |
+
" 'length': trajectories_3d.apply(trajectory_length),\n",
|
| 302 |
+
" 'smoothness': trajectories_3d.apply(trajectory_smoothness),\n",
|
| 303 |
+
" 'is_valid': df['is_valid']\n",
|
| 304 |
+
"})\n"
|
| 305 |
+
],
|
| 306 |
+
"metadata": {
|
| 307 |
+
"id": "qFF7_0TD6JRO"
|
| 308 |
+
},
|
| 309 |
+
"execution_count": null,
|
| 310 |
+
"outputs": []
|
| 311 |
+
},
|
| 312 |
+
{
|
| 313 |
+
"cell_type": "code",
|
| 314 |
+
"source": [
|
| 315 |
+
"# Create the main figure and grid for subplots\n",
|
| 316 |
+
"fig, axs = plt.subplots(2, 2, figsize=(15, 12))\n",
|
| 317 |
+
"fig.suptitle(\"Refined Hamiltonian-Inspired Energy Analysis of Reasoning Chains\", fontsize=16)\n",
|
| 318 |
+
"\n",
|
| 319 |
+
"# Distribution of Hamiltonian Energy\n",
|
| 320 |
+
"sns.histplot(data=df, x='H_energy', ax=axs[0, 0], kde=True, color='blue', bins=50)\n",
|
| 321 |
+
"axs[0, 0].set_title(\"Distribution of Refined Hamiltonian Energy\")\n",
|
| 322 |
+
"axs[0, 0].set_xlabel(\"Hamiltonian Energy\")\n",
|
| 323 |
+
"axs[0, 0].set_ylabel(\"Count\")\n",
|
| 324 |
+
"\n",
|
| 325 |
+
"# Kinetic vs Potential Energy\n",
|
| 326 |
+
"scatter = axs[0, 1].scatter(df['T_energy'], df['V_energy'], c=df['H_energy'], cmap='viridis', s=5, alpha=0.6)\n",
|
| 327 |
+
"axs[0, 1].set_title(\"Refined Kinetic vs Potential Energy\")\n",
|
| 328 |
+
"axs[0, 1].set_xlabel(\"Kinetic Energy (T)\")\n",
|
| 329 |
+
"axs[0, 1].set_ylabel(\"Potential Energy (V)\")\n",
|
| 330 |
+
"plt.colorbar(scatter, ax=axs[0, 1], label=\"Hamiltonian Energy\")\n",
|
| 331 |
+
"\n",
|
| 332 |
+
"# Hamiltonian Energy: Valid vs Invalid Chains\n",
|
| 333 |
+
"valid_chains = df[df['is_valid']]\n",
|
| 334 |
+
"invalid_chains = df[~df['is_valid']]\n",
|
| 335 |
+
"sns.histplot(data=valid_chains, x='H_energy', ax=axs[1, 0], kde=True, color='green', label='Valid Chains', bins=50, alpha=0.6)\n",
|
| 336 |
+
"sns.histplot(data=invalid_chains, x='H_energy', ax=axs[1, 0], kde=True, color='red', label='Invalid Chains', bins=50, alpha=0.6)\n",
|
| 337 |
+
"axs[1, 0].set_title(\"Refined Hamiltonian Energy: Valid vs Invalid Chains\")\n",
|
| 338 |
+
"axs[1, 0].set_xlabel(\"Hamiltonian Energy\")\n",
|
| 339 |
+
"axs[1, 0].set_ylabel(\"Count\")\n",
|
| 340 |
+
"axs[1, 0].legend()\n",
|
| 341 |
+
"\n",
|
| 342 |
+
"# Distribution of Energy Conservation Scores\n",
|
| 343 |
+
"sns.histplot(data=df, x='energy_conservation', ax=axs[1, 1], kde=True, color='orange', bins=50)\n",
|
| 344 |
+
"axs[1, 1].set_title(\"Distribution of Refined Energy Conservation Scores\")\n",
|
| 345 |
+
"axs[1, 1].set_xlabel(\"Energy Conservation Score\")\n",
|
| 346 |
+
"axs[1, 1].set_ylabel(\"Count\")\n",
|
| 347 |
+
"\n",
|
| 348 |
+
"# Adjust layout and display\n",
|
| 349 |
+
"plt.tight_layout()\n",
|
| 350 |
+
"plt.subplots_adjust(top=0.93) # Adjust for main title\n",
|
| 351 |
+
"plt.savefig('refined_hamiltonian_analysis.png', dpi=300, bbox_inches='tight')\n",
|
| 352 |
+
"plt.show()"
|
| 353 |
+
],
|
| 354 |
+
"metadata": {
|
| 355 |
+
"id": "kqfbA7w3NuPM"
|
| 356 |
+
},
|
| 357 |
+
"execution_count": null,
|
| 358 |
+
"outputs": []
|
| 359 |
+
},
|
| 360 |
+
{
|
| 361 |
+
"cell_type": "code",
|
| 362 |
+
"source": [
|
| 363 |
+
"# Calculate direction vectors\n",
|
| 364 |
+
"def calculate_direction(trajectory):\n",
|
| 365 |
+
" return trajectory[1] - trajectory[0]\n",
|
| 366 |
+
"\n",
|
| 367 |
+
"direction_vectors = np.array([calculate_direction(traj) for traj in trajectories_3d])\n",
|
| 368 |
+
"\n",
|
| 369 |
+
"# Calculate magnitude and angle of direction vectors\n",
|
| 370 |
+
"magnitudes = np.linalg.norm(direction_vectors, axis=1)\n",
|
| 371 |
+
"angles = np.arctan2(direction_vectors[:, 1], direction_vectors[:, 0])\n",
|
| 372 |
+
"\n",
|
| 373 |
+
"# Add these to the dataframe\n",
|
| 374 |
+
"df['trajectory_magnitude'] = magnitudes\n",
|
| 375 |
+
"df['trajectory_angle'] = angles\n",
|
| 376 |
+
"\n",
|
| 377 |
+
"# Visualize magnitude distribution\n",
|
| 378 |
+
"plt.figure(figsize=(12, 6))\n",
|
| 379 |
+
"sns.histplot(data=df, x='trajectory_magnitude', hue='is_valid', element='step', stat='density', common_norm=False)\n",
|
| 380 |
+
"plt.title('Distribution of Trajectory Magnitudes')\n",
|
| 381 |
+
"plt.xlabel('Magnitude')\n",
|
| 382 |
+
"plt.ylabel('Density')\n",
|
| 383 |
+
"plt.legend(title='Is Valid')\n",
|
| 384 |
+
"plt.tight_layout()\n",
|
| 385 |
+
"plt.tight_layout()\n",
|
| 386 |
+
"plt.savefig('trajectories_magntude_plot.png', dpi=300, bbox_inches='tight')\n",
|
| 387 |
+
"plt.show()"
|
| 388 |
+
],
|
| 389 |
+
"metadata": {
|
| 390 |
+
"id": "tYVhJJbPwNxo"
|
| 391 |
+
},
|
| 392 |
+
"execution_count": null,
|
| 393 |
+
"outputs": []
|
| 394 |
+
},
|
| 395 |
+
{
|
| 396 |
+
"cell_type": "code",
|
| 397 |
+
"source": [
|
| 398 |
+
"plt.figure(figsize=(12, 6))\n",
|
| 399 |
+
"\n",
|
| 400 |
+
"# Define colors explicitly\n",
|
| 401 |
+
"colors = {'Valid': 'blue', 'Invalid': 'red'}\n",
|
| 402 |
+
"\n",
|
| 403 |
+
"# Create a new DataFrame with the data for plotting\n",
|
| 404 |
+
"plot_data = pd.DataFrame({\n",
|
| 405 |
+
" 'Hamiltonian Energy': df['H_energy'],\n",
|
| 406 |
+
" 'Validity': df['is_valid'].map({True: 'Valid', False: 'Invalid'})\n",
|
| 407 |
+
"})\n",
|
| 408 |
+
"\n",
|
| 409 |
+
"# Create the histogram plot with explicit colors\n",
|
| 410 |
+
"sns.histplot(data=plot_data, x='Hamiltonian Energy', hue='Validity',\n",
|
| 411 |
+
" element='step', stat='density', common_norm=False,\n",
|
| 412 |
+
" palette=colors)\n",
|
| 413 |
+
"\n",
|
| 414 |
+
"plt.title('Distribution of Refined Hamiltonian Energy', fontsize=16)\n",
|
| 415 |
+
"plt.xlabel('Hamiltonian Energy', fontsize=14)\n",
|
| 416 |
+
"plt.ylabel('Density', fontsize=14)\n",
|
| 417 |
+
"\n",
|
| 418 |
+
"# Adjust legend\n",
|
| 419 |
+
"plt.legend(title='Chain Validity', title_fontsize='13', fontsize='12')\n",
|
| 420 |
+
"\n",
|
| 421 |
+
"# Add vertical lines for mean energies\n",
|
| 422 |
+
"plt.axvline(x=-60.889, color='blue', linestyle='--', label='Mean Valid')\n",
|
| 423 |
+
"plt.axvline(x=-53.816, color='red', linestyle='--', label='Mean Invalid')\n",
|
| 424 |
+
"\n",
|
| 425 |
+
"# Add text annotations for mean energies\n",
|
| 426 |
+
"plt.text(-60.889, plt.gca().get_ylim()[1], 'Mean Valid',\n",
|
| 427 |
+
" rotation=90, va='top', ha='right', color='blue')\n",
|
| 428 |
+
"plt.text(-53.816, plt.gca().get_ylim()[1], 'Mean Invalid',\n",
|
| 429 |
+
" rotation=90, va='top', ha='left', color='red')\n",
|
| 430 |
+
"\n",
|
| 431 |
+
"plt.tight_layout()\n",
|
| 432 |
+
"plt.savefig('refined_hamiltonian_energy_distribution.png', dpi=300, bbox_inches='tight')\n",
|
| 433 |
+
"plt.show()"
|
| 434 |
+
],
|
| 435 |
+
"metadata": {
|
| 436 |
+
"id": "m1fHZ-NpMnHD"
|
| 437 |
+
},
|
| 438 |
+
"execution_count": null,
|
| 439 |
+
"outputs": []
|
| 440 |
+
},
|
| 441 |
+
{
|
| 442 |
+
"cell_type": "code",
|
| 443 |
+
"source": [
|
| 444 |
+
"# Perform PCA to reduce to 2 dimensions\n",
|
| 445 |
+
"pca = PCA(n_components=2)\n",
|
| 446 |
+
"trajectories_2d = pca.fit_transform(np.vstack(trajectories))\n",
|
| 447 |
+
"\n",
|
| 448 |
+
"# Reshape the data back into trajectories\n",
|
| 449 |
+
"trajectories_2d = trajectories_2d.reshape(len(trajectories), -1, 2)\n",
|
| 450 |
+
"\n",
|
| 451 |
+
"# Create the plot\n",
|
| 452 |
+
"plt.figure(figsize=(12, 10))\n",
|
| 453 |
+
"plt.style.use('seaborn-whitegrid')\n",
|
| 454 |
+
"sns.set_context(\"paper\")\n",
|
| 455 |
+
"plt.rcParams['font.family'] = 'serif'\n",
|
| 456 |
+
"plt.rcParams['font.serif'] = ['Times New Roman'] + plt.rcParams['font.serif']\n",
|
| 457 |
+
"\n",
|
| 458 |
+
"# Plot trajectories\n",
|
| 459 |
+
"valid_trajectories = []\n",
|
| 460 |
+
"invalid_trajectories = []\n",
|
| 461 |
+
"for i, traj in enumerate(trajectories_2d[:100]): # Limit to 100 for clarity\n",
|
| 462 |
+
" if df.iloc[i]['is_valid']:\n",
|
| 463 |
+
" valid_trajectories.append(traj)\n",
|
| 464 |
+
" color = 'green'\n",
|
| 465 |
+
" else:\n",
|
| 466 |
+
" invalid_trajectories.append(traj)\n",
|
| 467 |
+
" color = 'red'\n",
|
| 468 |
+
" plt.plot(traj[:, 0], traj[:, 1], color=color, alpha=0.5)\n",
|
| 469 |
+
" plt.scatter(traj[0, 0], traj[0, 1], color=color, s=20, marker='o')\n",
|
| 470 |
+
" plt.scatter(traj[-1, 0], traj[-1, 1], color=color, s=20, marker='s')\n",
|
| 471 |
+
"\n",
|
| 472 |
+
"# Calculate the vector field based on the average direction of trajectories\n",
|
| 473 |
+
"grid_size = 20\n",
|
| 474 |
+
"x = np.linspace(trajectories_2d[:, :, 0].min(), trajectories_2d[:, :, 0].max(), grid_size)\n",
|
| 475 |
+
"y = np.linspace(trajectories_2d[:, :, 1].min(), trajectories_2d[:, :, 1].max(), grid_size)\n",
|
| 476 |
+
"X, Y = np.meshgrid(x, y)\n",
|
| 477 |
+
"\n",
|
| 478 |
+
"U = np.zeros_like(X)\n",
|
| 479 |
+
"V = np.zeros_like(Y)\n",
|
| 480 |
+
"\n",
|
| 481 |
+
"for i in range(grid_size):\n",
|
| 482 |
+
" for j in range(grid_size):\n",
|
| 483 |
+
" nearby_trajectories = [traj for traj in trajectories_2d if\n",
|
| 484 |
+
" (x[i]-0.5 < traj[:, 0]).any() and (traj[:, 0] < x[i]+0.5).any() and\n",
|
| 485 |
+
" (y[j]-0.5 < traj[:, 1]).any() and (traj[:, 1] < y[j]+0.5).any()]\n",
|
| 486 |
+
" if nearby_trajectories:\n",
|
| 487 |
+
" directions = np.diff(nearby_trajectories, axis=1)\n",
|
| 488 |
+
" avg_direction = np.mean(directions, axis=(0, 1))\n",
|
| 489 |
+
" U[j, i], V[j, i] = avg_direction\n",
|
| 490 |
+
"\n",
|
| 491 |
+
"# Normalize the vector field\n",
|
| 492 |
+
"magnitude = np.sqrt(U**2 + V**2)\n",
|
| 493 |
+
"U = U / np.where(magnitude > 0, magnitude, 1)\n",
|
| 494 |
+
"V = V / np.where(magnitude > 0, magnitude, 1)\n",
|
| 495 |
+
"\n",
|
| 496 |
+
"plt.streamplot(X, Y, U, V, density=1, color='gray', linewidth=0.5, arrowsize=0.5)\n",
|
| 497 |
+
"\n",
|
| 498 |
+
"# Find key points using KMeans clustering\n",
|
| 499 |
+
"n_clusters = 5 # Adjust this number based on how many key points you want\n",
|
| 500 |
+
"kmeans = KMeans(n_clusters=n_clusters)\n",
|
| 501 |
+
"flattened_trajectories = trajectories_2d.reshape(-1, 2)\n",
|
| 502 |
+
"kmeans.fit(flattened_trajectories)\n",
|
| 503 |
+
"key_points = kmeans.cluster_centers_\n",
|
| 504 |
+
"\n",
|
| 505 |
+
"# Plot key points\n",
|
| 506 |
+
"plt.scatter(key_points[:, 0], key_points[:, 1], color='blue', s=100, marker='*', zorder=5)\n",
|
| 507 |
+
"\n",
|
| 508 |
+
"# Add labels to key points\n",
|
| 509 |
+
"for i, point in enumerate(key_points):\n",
|
| 510 |
+
" plt.annotate(f'Key Point {i+1}', (point[0], point[1]), xytext=(5, 5),\n",
|
| 511 |
+
" textcoords='offset points', fontsize=8, color='blue')\n",
|
| 512 |
+
"\n",
|
| 513 |
+
"# Add labels and title\n",
|
| 514 |
+
"plt.xlabel('PCA 1')\n",
|
| 515 |
+
"plt.ylabel('PCA 2')\n",
|
| 516 |
+
"plt.title('2D Reasoning Trajectories with Phase Space Features and Key Points')\n",
|
| 517 |
+
"\n",
|
| 518 |
+
"# Add a legend\n",
|
| 519 |
+
"valid_line = plt.Line2D([], [], color='green', label='Valid Chains')\n",
|
| 520 |
+
"invalid_line = plt.Line2D([], [], color='red', label='Invalid Chains')\n",
|
| 521 |
+
"vector_field_line = plt.Line2D([], [], color='gray', label='Vector Field')\n",
|
| 522 |
+
"key_point_marker = plt.Line2D([], [], color='blue', marker='*', linestyle='None',\n",
|
| 523 |
+
" markersize=10, label='Key Points')\n",
|
| 524 |
+
"plt.legend(handles=[valid_line, invalid_line, vector_field_line, key_point_marker])\n",
|
| 525 |
+
"\n",
|
| 526 |
+
"# Show the plot\n",
|
| 527 |
+
"plt.tight_layout()\n",
|
| 528 |
+
"plt.savefig('2d_reasoning_trajectories_with_key_points.png', dpi=300, bbox_inches='tight')\n",
|
| 529 |
+
"plt.show()"
|
| 530 |
+
],
|
| 531 |
+
"metadata": {
|
| 532 |
+
"id": "m38JkWLcQKCc"
|
| 533 |
+
},
|
| 534 |
+
"execution_count": null,
|
| 535 |
+
"outputs": []
|
| 536 |
+
},
|
| 537 |
+
{
|
| 538 |
+
"cell_type": "code",
|
| 539 |
+
"source": [
|
| 540 |
+
"fig = plt.figure(figsize=(10, 8))\n",
|
| 541 |
+
"ax = fig.add_subplot(111, projection='3d')\n",
|
| 542 |
+
"\n",
|
| 543 |
+
"for i, trajectory in enumerate(trajectories_3d[:100]): # Limit to first 100 for clarity\n",
|
| 544 |
+
" color = 'green' if df.iloc[i]['is_valid'] else 'red'\n",
|
| 545 |
+
" ax.plot(trajectory[:, 0], trajectory[:, 1], trajectory[:, 2], color=color, alpha=0.5)\n",
|
| 546 |
+
" ax.scatter(trajectory[0, 0], trajectory[0, 1], trajectory[0, 2], color=color, s=20)\n",
|
| 547 |
+
" ax.scatter(trajectory[-1, 0], trajectory[-1, 1], trajectory[-1, 2], color=color, s=20, marker='s')\n",
|
| 548 |
+
"\n",
|
| 549 |
+
"ax.set_xlabel('PCA 1')\n",
|
| 550 |
+
"ax.set_ylabel('PCA 2')\n",
|
| 551 |
+
"ax.set_zlabel('PCA 3')\n",
|
| 552 |
+
"ax.set_title('Reasoning Trajectories in 3D Embedding Space')\n",
|
| 553 |
+
"plt.tight_layout()\n",
|
| 554 |
+
"plt.show()"
|
| 555 |
+
],
|
| 556 |
+
"metadata": {
|
| 557 |
+
"id": "nVVADjWNNVy_"
|
| 558 |
+
},
|
| 559 |
+
"execution_count": null,
|
| 560 |
+
"outputs": []
|
| 561 |
+
},
|
| 562 |
+
{
|
| 563 |
+
"cell_type": "code",
|
| 564 |
+
"source": [
|
| 565 |
+
"def compute_vector_field(trajectories, grid_size=10):\n",
|
| 566 |
+
" # Determine the bounds of the space\n",
|
| 567 |
+
" all_points = np.vstack(trajectories)\n",
|
| 568 |
+
" mins = np.min(all_points, axis=0)\n",
|
| 569 |
+
" maxs = np.max(all_points, axis=0)\n",
|
| 570 |
+
"\n",
|
| 571 |
+
" # Create a grid\n",
|
| 572 |
+
" x = np.linspace(mins[0], maxs[0], grid_size)\n",
|
| 573 |
+
" y = np.linspace(mins[1], maxs[1], grid_size)\n",
|
| 574 |
+
" z = np.linspace(mins[2], maxs[2], grid_size)\n",
|
| 575 |
+
" X, Y, Z = np.meshgrid(x, y, z)\n",
|
| 576 |
+
"\n",
|
| 577 |
+
" U = np.zeros((grid_size, grid_size, grid_size))\n",
|
| 578 |
+
" V = np.zeros((grid_size, grid_size, grid_size))\n",
|
| 579 |
+
" W = np.zeros((grid_size, grid_size, grid_size))\n",
|
| 580 |
+
"\n",
|
| 581 |
+
" # Compute average direction for each grid cell\n",
|
| 582 |
+
" for trajectory in trajectories:\n",
|
| 583 |
+
" directions = np.diff(trajectory, axis=0)\n",
|
| 584 |
+
" for direction, point in zip(directions, trajectory[:-1]):\n",
|
| 585 |
+
" i, j, k = np.floor((point - mins) / (maxs - mins) * (grid_size - 1)).astype(int)\n",
|
| 586 |
+
" U[i, j, k] += direction[0]\n",
|
| 587 |
+
" V[i, j, k] += direction[1]\n",
|
| 588 |
+
" W[i, j, k] += direction[2]\n",
|
| 589 |
+
"\n",
|
| 590 |
+
" # Normalize\n",
|
| 591 |
+
" magnitude = np.sqrt(U**2 + V**2 + W**2)\n",
|
| 592 |
+
" U /= np.where(magnitude > 0, magnitude, 1)\n",
|
| 593 |
+
" V /= np.where(magnitude > 0, magnitude, 1)\n",
|
| 594 |
+
" W /= np.where(magnitude > 0, magnitude, 1)\n",
|
| 595 |
+
"\n",
|
| 596 |
+
" return X, Y, Z, U, V, W\n",
|
| 597 |
+
"\n",
|
| 598 |
+
"# Set up the figure and 3D axis\n",
|
| 599 |
+
"fig = plt.figure(figsize=(12, 10))\n",
|
| 600 |
+
"ax = fig.add_subplot(111, projection='3d')\n",
|
| 601 |
+
"\n",
|
| 602 |
+
"# Plot trajectories\n",
|
| 603 |
+
"for i, trajectory in enumerate(trajectories_3d[:100]): # Limit to first 100 for clarity\n",
|
| 604 |
+
" color = 'green' if df.iloc[i]['is_valid'] else 'red'\n",
|
| 605 |
+
" ax.plot(trajectory[:, 0], trajectory[:, 1], trajectory[:, 2], color=color, alpha=0.5)\n",
|
| 606 |
+
" ax.scatter(trajectory[0, 0], trajectory[0, 1], trajectory[0, 2], color=color, s=20)\n",
|
| 607 |
+
" ax.scatter(trajectory[-1, 0], trajectory[-1, 1], trajectory[-1, 2], color=color, s=20, marker='s')\n",
|
| 608 |
+
"\n",
|
| 609 |
+
"# Compute and plot vector field\n",
|
| 610 |
+
"X, Y, Z, U, V, W = compute_vector_field(trajectories_3d[:100])\n",
|
| 611 |
+
"ax.quiver(X, Y, Z, U, V, W, length=0.5, normalize=True, color='blue', alpha=0.3)\n",
|
| 612 |
+
"\n",
|
| 613 |
+
"ax.set_xlabel('PCA 1')\n",
|
| 614 |
+
"ax.set_ylabel('PCA 2')\n",
|
| 615 |
+
"ax.set_zlabel('PCA 3')\n",
|
| 616 |
+
"ax.set_title('Reasoning Trajectories and Phase Space in 3D Embedding Space')\n",
|
| 617 |
+
"\n",
|
| 618 |
+
"plt.tight_layout()\n",
|
| 619 |
+
"plt.savefig('3d_phase_space_plot.png', dpi=300, bbox_inches='tight')\n",
|
| 620 |
+
"plt.show()"
|
| 621 |
+
],
|
| 622 |
+
"metadata": {
|
| 623 |
+
"id": "l0UmPM8xftuv"
|
| 624 |
+
},
|
| 625 |
+
"execution_count": null,
|
| 626 |
+
"outputs": []
|
| 627 |
+
},
|
| 628 |
+
{
|
| 629 |
+
"cell_type": "code",
|
| 630 |
+
"source": [
|
| 631 |
+
"plt.figure(figsize=(10, 6))\n",
|
| 632 |
+
"\n",
|
| 633 |
+
"# Create the histogram plot\n",
|
| 634 |
+
"sns.histplot(data=df, x='energy_conservation', kde=True, bins=50, color='green')\n",
|
| 635 |
+
"\n",
|
| 636 |
+
"# Set the title and labels\n",
|
| 637 |
+
"plt.title(\"Distribution of Energy Conservation Scores\", fontsize=16)\n",
|
| 638 |
+
"plt.xlabel(\"Energy Conservation Score\", fontsize=12)\n",
|
| 639 |
+
"plt.ylabel(\"Frequency\", fontsize=12)\n",
|
| 640 |
+
"\n",
|
| 641 |
+
"# Adjust layout and display\n",
|
| 642 |
+
"plt.tight_layout()\n",
|
| 643 |
+
"plt.savefig('energy_conservation_distribution.png', dpi=300, bbox_inches='tight')\n",
|
| 644 |
+
"plt.show()"
|
| 645 |
+
],
|
| 646 |
+
"metadata": {
|
| 647 |
+
"id": "qca1p7PhOaU6"
|
| 648 |
+
},
|
| 649 |
+
"execution_count": null,
|
| 650 |
+
"outputs": []
|
| 651 |
+
},
|
| 652 |
+
{
|
| 653 |
+
"cell_type": "code",
|
| 654 |
+
"source": [
|
| 655 |
+
"fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(15, 6))\n",
|
| 656 |
+
"\n",
|
| 657 |
+
"sns.histplot(data=df, x='trajectory_magnitude', hue='is_valid', element='step', stat='density', common_norm=False, ax=ax1)\n",
|
| 658 |
+
"ax1.set_title('Distribution of Trajectory Magnitudes')\n",
|
| 659 |
+
"ax1.set_xlabel('Magnitude')\n",
|
| 660 |
+
"ax1.set_ylabel('Density')\n",
|
| 661 |
+
"\n",
|
| 662 |
+
"sns.histplot(data=df, x='trajectory_angle', hue='is_valid', element='step', stat='density', common_norm=False, ax=ax2)\n",
|
| 663 |
+
"ax2.set_title('Distribution of Trajectory Angles')\n",
|
| 664 |
+
"ax2.set_xlabel('Angle (radians)')\n",
|
| 665 |
+
"ax2.set_ylabel('Density')\n",
|
| 666 |
+
"\n",
|
| 667 |
+
"plt.tight_layout()\n",
|
| 668 |
+
"plt.savefig('magnitude_angle_distribution.png', dpi=300, bbox_inches='tight')\n",
|
| 669 |
+
"plt.close()"
|
| 670 |
+
],
|
| 671 |
+
"metadata": {
|
| 672 |
+
"id": "I8VrMb6MMsOc"
|
| 673 |
+
},
|
| 674 |
+
"execution_count": null,
|
| 675 |
+
"outputs": []
|
| 676 |
+
},
|
| 677 |
+
{
|
| 678 |
+
"cell_type": "code",
|
| 679 |
+
"source": [
|
| 680 |
+
"# Additional analysis\n",
|
| 681 |
+
"print(f\"Average Energy Conservation Score: {df['energy_conservation'].mean():.4f}\")\n",
|
| 682 |
+
"print(f\"Correlation between Energy Conservation and Validity: {df['energy_conservation'].corr(df['is_valid']):.4f}\")\n",
|
| 683 |
+
"print(f\"Average Hamiltonian Energy for Valid Chains: {valid_chains['H_energy'].mean():.4f}\")\n",
|
| 684 |
+
"print(f\"Average Hamiltonian Energy for Invalid Chains: {invalid_chains['H_energy'].mean():.4f}\")\n",
|
| 685 |
+
"\n",
|
| 686 |
+
"# T-test for difference in Hamiltonian Energy\n",
|
| 687 |
+
"t_stat, p_value = stats.ttest_ind(valid_chains['H_energy'], invalid_chains['H_energy'])\n",
|
| 688 |
+
"print(f\"\\nT-test for difference in Hamiltonian Energy:\")\n",
|
| 689 |
+
"print(f\"t-statistic: {t_stat:.4f}\")\n",
|
| 690 |
+
"print(f\"p-value: {p_value:.4f}\")"
|
| 691 |
+
],
|
| 692 |
+
"metadata": {
|
| 693 |
+
"id": "FHmMSmNAI-qc"
|
| 694 |
+
},
|
| 695 |
+
"execution_count": null,
|
| 696 |
+
"outputs": []
|
| 697 |
+
},
|
| 698 |
+
{
|
| 699 |
+
"cell_type": "markdown",
|
| 700 |
+
"source": [
|
| 701 |
+
"## Geometric analysis"
|
| 702 |
+
],
|
| 703 |
+
"metadata": {
|
| 704 |
+
"id": "1s_DosZEWVhy"
|
| 705 |
+
}
|
| 706 |
+
},
|
| 707 |
+
{
|
| 708 |
+
"cell_type": "code",
|
| 709 |
+
"source": [
|
| 710 |
+
"fig = plt.figure(figsize=(10, 8))\n",
|
| 711 |
+
"ax = fig.add_subplot(111, projection='3d')\n",
|
| 712 |
+
"\n",
|
| 713 |
+
"for i, trajectory in enumerate(trajectories_3d[:100]): # Limit to first 100 for clarity\n",
|
| 714 |
+
" color = 'green' if df.iloc[i]['is_valid'] else 'red'\n",
|
| 715 |
+
" ax.plot(trajectory[:, 0], trajectory[:, 1], trajectory[:, 2], color=color, alpha=0.5)\n",
|
| 716 |
+
" ax.scatter(trajectory[0, 0], trajectory[0, 1], trajectory[0, 2], color=color, s=20)\n",
|
| 717 |
+
" ax.scatter(trajectory[-1, 0], trajectory[-1, 1], trajectory[-1, 2], color=color, s=20, marker='s')\n",
|
| 718 |
+
"\n",
|
| 719 |
+
"ax.set_xlabel('PCA 1')\n",
|
| 720 |
+
"ax.set_ylabel('PCA 2')\n",
|
| 721 |
+
"ax.set_zlabel('PCA 3')\n",
|
| 722 |
+
"ax.set_title('Reasoning Trajectories in 3D Embedding Space')\n",
|
| 723 |
+
"plt.tight_layout()\n",
|
| 724 |
+
"plt.savefig('3d_trajectories.png', dpi=300, bbox_inches='tight')\n",
|
| 725 |
+
"plt.close()\n",
|
| 726 |
+
"\n",
|
| 727 |
+
"# 2. Trajectory Energy by Chain Index\n",
|
| 728 |
+
"plt.figure(figsize=(10, 6))\n",
|
| 729 |
+
"sns.scatterplot(x=df.index, y=trajectory_energies, hue=df['is_valid'], palette={True: 'green', False: 'red'})\n",
|
| 730 |
+
"plt.title('Trajectory Energy by Chain Index')\n",
|
| 731 |
+
"plt.xlabel('Chain Index')\n",
|
| 732 |
+
"plt.ylabel('Energy')\n",
|
| 733 |
+
"plt.legend(title='Is Valid')\n",
|
| 734 |
+
"plt.tight_layout()\n",
|
| 735 |
+
"plt.savefig('trajectory_energy.png', dpi=300, bbox_inches='tight')\n",
|
| 736 |
+
"plt.close()"
|
| 737 |
+
],
|
| 738 |
+
"metadata": {
|
| 739 |
+
"id": "2Sz-nqGA9p8B"
|
| 740 |
+
},
|
| 741 |
+
"execution_count": null,
|
| 742 |
+
"outputs": []
|
| 743 |
+
},
|
| 744 |
+
{
|
| 745 |
+
"cell_type": "code",
|
| 746 |
+
"source": [
|
| 747 |
+
"# Energy Plot\n",
|
| 748 |
+
"plt.figure(figsize=(12, 6))\n",
|
| 749 |
+
"sns.scatterplot(x=df.index, y=trajectory_energies, hue=df['is_valid'], palette={True: 'green', False: 'red'})\n",
|
| 750 |
+
"plt.title('Trajectory Energy by Chain Index')\n",
|
| 751 |
+
"plt.xlabel('Chain Index')\n",
|
| 752 |
+
"plt.ylabel('Energy')\n",
|
| 753 |
+
"plt.legend(title='Is Valid')\n",
|
| 754 |
+
"plt.tight_layout()\n",
|
| 755 |
+
"plt.show()"
|
| 756 |
+
],
|
| 757 |
+
"metadata": {
|
| 758 |
+
"id": "5rN0K7tM_68P"
|
| 759 |
+
},
|
| 760 |
+
"execution_count": null,
|
| 761 |
+
"outputs": []
|
| 762 |
+
},
|
| 763 |
+
{
|
| 764 |
+
"cell_type": "code",
|
| 765 |
+
"source": [
|
| 766 |
+
"plt.figure(figsize=(12, 6))\n",
|
| 767 |
+
"\n",
|
| 768 |
+
"# Define colors explicitly\n",
|
| 769 |
+
"colors = {'Valid': 'green', 'Invalid': 'red'}\n",
|
| 770 |
+
"\n",
|
| 771 |
+
"# Create the histogram plot with explicit colors\n",
|
| 772 |
+
"sns.histplot(data=pd.DataFrame({'Energy': trajectory_energies, 'Is Valid': df['is_valid'].map({True: 'Valid', False: 'Invalid'})}),\n",
|
| 773 |
+
" x='Energy', hue='Is Valid', element='step', stat='density', common_norm=False,\n",
|
| 774 |
+
" palette=colors)\n",
|
| 775 |
+
"\n",
|
| 776 |
+
"plt.title('Distribution of Trajectory Energies', fontsize=16)\n",
|
| 777 |
+
"plt.xlabel('Energy', fontsize=14)\n",
|
| 778 |
+
"plt.ylabel('Density', fontsize=14)\n",
|
| 779 |
+
"\n",
|
| 780 |
+
"# Create a custom legend\n",
|
| 781 |
+
"handles = [plt.Rectangle((0,0),1,1, color=color) for color in colors.values()]\n",
|
| 782 |
+
"labels = list(colors.keys())\n",
|
| 783 |
+
"plt.legend(handles, labels, title='Trajectory Validity', title_fontsize='13', fontsize='12')\n",
|
| 784 |
+
"\n",
|
| 785 |
+
"plt.tight_layout()\n",
|
| 786 |
+
"plt.savefig('energy_distribution_plot.png', dpi=300, bbox_inches='tight')\n",
|
| 787 |
+
"plt.show()"
|
| 788 |
+
],
|
| 789 |
+
"metadata": {
|
| 790 |
+
"id": "iRG8GKRF__3a"
|
| 791 |
+
},
|
| 792 |
+
"execution_count": null,
|
| 793 |
+
"outputs": []
|
| 794 |
+
},
|
| 795 |
+
{
|
| 796 |
+
"cell_type": "code",
|
| 797 |
+
"source": [
|
| 798 |
+
"# Distribution of Trajectory Magnitudes and Angles\n",
|
| 799 |
+
"fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(15, 6))\n",
|
| 800 |
+
"\n",
|
| 801 |
+
"sns.histplot(data=df, x='trajectory_magnitude', hue='is_valid', element='step', stat='density', common_norm=False, ax=ax1)\n",
|
| 802 |
+
"ax1.set_title('Distribution of Trajectory Magnitudes')\n",
|
| 803 |
+
"ax1.set_xlabel('Magnitude')\n",
|
| 804 |
+
"ax1.set_ylabel('Density')\n",
|
| 805 |
+
"\n",
|
| 806 |
+
"sns.histplot(data=df, x='trajectory_angle', hue='is_valid', element='step', stat='density', common_norm=False, ax=ax2)\n",
|
| 807 |
+
"ax2.set_title('Distribution of Trajectory Angles')\n",
|
| 808 |
+
"ax2.set_xlabel('Angle (radians)')\n",
|
| 809 |
+
"ax2.set_ylabel('Density')\n",
|
| 810 |
+
"\n",
|
| 811 |
+
"plt.tight_layout()\n",
|
| 812 |
+
"plt.savefig('magnitude_angle_distribution.png', dpi=300, bbox_inches='tight')\n",
|
| 813 |
+
"plt.close()"
|
| 814 |
+
],
|
| 815 |
+
"metadata": {
|
| 816 |
+
"id": "yLJie7VYoas6"
|
| 817 |
+
},
|
| 818 |
+
"execution_count": null,
|
| 819 |
+
"outputs": []
|
| 820 |
+
},
|
| 821 |
+
{
|
| 822 |
+
"cell_type": "code",
|
| 823 |
+
"source": [
|
| 824 |
+
"# Trajectory Magnitude vs Angle\n",
|
| 825 |
+
"plt.figure(figsize=(10, 8))\n",
|
| 826 |
+
"sns.scatterplot(data=df, x='trajectory_angle', y='trajectory_magnitude', hue='is_valid', alpha=0.6)\n",
|
| 827 |
+
"plt.title('Trajectory Magnitude vs Angle')\n",
|
| 828 |
+
"plt.xlabel('Angle (radians)')\n",
|
| 829 |
+
"plt.ylabel('Magnitude')\n",
|
| 830 |
+
"plt.legend(title='Is Valid')\n",
|
| 831 |
+
"plt.tight_layout()\n",
|
| 832 |
+
"plt.savefig('magnitude_vs_angle.png', dpi=300, bbox_inches='tight')\n",
|
| 833 |
+
"plt.close()\n",
|
| 834 |
+
"\n",
|
| 835 |
+
"# 6. Trajectory Properties Comparison\n",
|
| 836 |
+
"fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(15, 6))\n",
|
| 837 |
+
"\n",
|
| 838 |
+
"sns.boxplot(x='is_valid', y='length', data=traj_properties, ax=ax1)\n",
|
| 839 |
+
"ax1.set_title('Trajectory Length')\n",
|
| 840 |
+
"ax1.set_xlabel('Is Valid')\n",
|
| 841 |
+
"ax1.set_ylabel('Length')\n",
|
| 842 |
+
"\n",
|
| 843 |
+
"sns.boxplot(x='is_valid', y='smoothness', data=traj_properties, ax=ax2)\n",
|
| 844 |
+
"ax2.set_title('Trajectory Smoothness')\n",
|
| 845 |
+
"ax2.set_xlabel('Is Valid')\n",
|
| 846 |
+
"ax2.set_ylabel('Smoothness')\n",
|
| 847 |
+
"\n",
|
| 848 |
+
"plt.tight_layout()\n",
|
| 849 |
+
"plt.savefig('trajectory_properties.png', dpi=300, bbox_inches='tight')\n",
|
| 850 |
+
"plt.close()"
|
| 851 |
+
],
|
| 852 |
+
"metadata": {
|
| 853 |
+
"id": "OOasgefio41H"
|
| 854 |
+
},
|
| 855 |
+
"execution_count": null,
|
| 856 |
+
"outputs": []
|
| 857 |
+
},
|
| 858 |
+
{
|
| 859 |
+
"cell_type": "code",
|
| 860 |
+
"source": [
|
| 861 |
+
"plt.figure(figsize=(12, 8))\n",
|
| 862 |
+
"\n",
|
| 863 |
+
"# Define colors explicitly\n",
|
| 864 |
+
"colors = {'Valid': 'blue', 'Invalid': 'red'}\n",
|
| 865 |
+
"\n",
|
| 866 |
+
"# Prepare the data\n",
|
| 867 |
+
"plot_data = df.copy()\n",
|
| 868 |
+
"plot_data['Validity'] = df['is_valid'].map({True: 'Valid', False: 'Invalid'})\n",
|
| 869 |
+
"\n",
|
| 870 |
+
"# Create the scatter plot with explicit colors\n",
|
| 871 |
+
"sns.scatterplot(data=plot_data, x='trajectory_angle', y='trajectory_magnitude', hue='Validity',\n",
|
| 872 |
+
" palette=colors, alpha=0.6)\n",
|
| 873 |
+
"\n",
|
| 874 |
+
"plt.title('Trajectory Magnitude vs Angle', fontsize=16)\n",
|
| 875 |
+
"plt.xlabel('Angle (radians)', fontsize=14)\n",
|
| 876 |
+
"plt.ylabel('Magnitude', fontsize=14)\n",
|
| 877 |
+
"\n",
|
| 878 |
+
"# Create custom legend handles\n",
|
| 879 |
+
"handles = [plt.Line2D([0], [0], marker='o', color='w', markerfacecolor=color, markersize=10, alpha=0.6)\n",
|
| 880 |
+
" for color in colors.values()]\n",
|
| 881 |
+
"labels = list(colors.keys())\n",
|
| 882 |
+
"\n",
|
| 883 |
+
"# Add the legend with custom handles\n",
|
| 884 |
+
"plt.legend(handles, labels, title='Chain Validity', title_fontsize='13', fontsize='12')\n",
|
| 885 |
+
"\n",
|
| 886 |
+
"plt.tight_layout()\n",
|
| 887 |
+
"plt.savefig('refined_magnitude_vs_angle_plot.png', dpi=300, bbox_inches='tight')\n",
|
| 888 |
+
"plt.show()\n",
|
| 889 |
+
"\n",
|
| 890 |
+
"# Calculate and print statistical information\n",
|
| 891 |
+
"valid_data = df[df['is_valid']]\n",
|
| 892 |
+
"invalid_data = df[~df['is_valid']]\n",
|
| 893 |
+
"\n",
|
| 894 |
+
"print(\"Statistical Information:\")\n",
|
| 895 |
+
"print(f\"Correlation between Angle and Magnitude (overall): {df['trajectory_angle'].corr(df['trajectory_magnitude']):.3f}\")\n",
|
| 896 |
+
"print(f\"Correlation for Valid Chains: {valid_data['trajectory_angle'].corr(valid_data['trajectory_magnitude']):.3f}\")\n",
|
| 897 |
+
"print(f\"Correlation for Invalid Chains: {invalid_data['trajectory_angle'].corr(invalid_data['trajectory_magnitude']):.3f}\")\n",
|
| 898 |
+
"\n",
|
| 899 |
+
"# Perform t-tests\n",
|
| 900 |
+
"t_stat_angle, p_value_angle = stats.ttest_ind(valid_data['trajectory_angle'], invalid_data['trajectory_angle'])\n",
|
| 901 |
+
"t_stat_mag, p_value_mag = stats.ttest_ind(valid_data['trajectory_magnitude'], invalid_data['trajectory_magnitude'])\n",
|
| 902 |
+
"\n",
|
| 903 |
+
"print(\"\\nT-test for difference in Trajectory Angle:\")\n",
|
| 904 |
+
"print(f\"t-statistic: {t_stat_angle:.4f}\")\n",
|
| 905 |
+
"print(f\"p-value: {p_value_angle:.4f}\")\n",
|
| 906 |
+
"\n",
|
| 907 |
+
"print(\"\\nT-test for difference in Trajectory Magnitude:\")\n",
|
| 908 |
+
"print(f\"t-statistic: {t_stat_mag:.4f}\")\n",
|
| 909 |
+
"print(f\"p-value: {p_value_mag:.4f}\")\n",
|
| 910 |
+
"\n",
|
| 911 |
+
"# Calculate and print mean values\n",
|
| 912 |
+
"print(\"\\nMean Values:\")\n",
|
| 913 |
+
"print(f\"Mean Angle for Valid Chains: {valid_data['trajectory_angle'].mean():.3f}\")\n",
|
| 914 |
+
"print(f\"Mean Angle for Invalid Chains: {invalid_data['trajectory_angle'].mean():.3f}\")\n",
|
| 915 |
+
"print(f\"Mean Magnitude for Valid Chains: {valid_data['trajectory_magnitude'].mean():.3f}\")\n",
|
| 916 |
+
"print(f\"Mean Magnitude for Invalid Chains: {invalid_data['trajectory_magnitude'].mean():.3f}\")"
|
| 917 |
+
],
|
| 918 |
+
"metadata": {
|
| 919 |
+
"id": "6pBMYGiKBR7f"
|
| 920 |
+
},
|
| 921 |
+
"execution_count": null,
|
| 922 |
+
"outputs": []
|
| 923 |
+
},
|
| 924 |
+
{
|
| 925 |
+
"cell_type": "code",
|
| 926 |
+
"source": [
|
| 927 |
+
"# Statistical tests\n",
|
| 928 |
+
"valid_mag = df[df['is_valid']]['trajectory_magnitude']\n",
|
| 929 |
+
"invalid_mag = df[~df['is_valid']]['trajectory_magnitude']\n",
|
| 930 |
+
"mag_ttest = ttest_ind(valid_mag, invalid_mag)\n",
|
| 931 |
+
"\n",
|
| 932 |
+
"valid_ang = df[df['is_valid']]['trajectory_angle']\n",
|
| 933 |
+
"invalid_ang = df[~df['is_valid']]['trajectory_angle']\n",
|
| 934 |
+
"ang_ttest = ttest_ind(valid_ang, invalid_ang)\n",
|
| 935 |
+
"\n",
|
| 936 |
+
"print(\"T-test for trajectory magnitude:\", mag_ttest)\n",
|
| 937 |
+
"print(\"T-test for trajectory angle:\", ang_ttest)\n",
|
| 938 |
+
"\n",
|
| 939 |
+
"# Correlation with energy\n",
|
| 940 |
+
"mag_energy_corr = df['trajectory_magnitude'].corr(df['H_energy'])\n",
|
| 941 |
+
"ang_energy_corr = df['trajectory_angle'].corr(df['H_energy'])\n",
|
| 942 |
+
"\n",
|
| 943 |
+
"print(\"Correlation between magnitude and H energy:\", mag_energy_corr)\n",
|
| 944 |
+
"print(\"Correlation between angle and H energy:\", ang_energy_corr)"
|
| 945 |
+
],
|
| 946 |
+
"metadata": {
|
| 947 |
+
"id": "i2ccr--MBXYa"
|
| 948 |
+
},
|
| 949 |
+
"execution_count": null,
|
| 950 |
+
"outputs": []
|
| 951 |
+
},
|
| 952 |
+
{
|
| 953 |
+
"cell_type": "code",
|
| 954 |
+
"source": [
|
| 955 |
+
"def calculate_curvature(trajectory):\n",
|
| 956 |
+
" # Assuming trajectory has 3 points: start, middle, end\n",
|
| 957 |
+
"\n",
|
| 958 |
+
" a = np.linalg.norm(trajectory[0][1] - trajectory[0][0])\n",
|
| 959 |
+
" b = np.linalg.norm(trajectory[0][2] - trajectory[0][1])\n",
|
| 960 |
+
" c = np.linalg.norm(trajectory[0][2] - trajectory[0][0])\n",
|
| 961 |
+
"\n",
|
| 962 |
+
" s = (a + b + c) / 2\n",
|
| 963 |
+
" area = np.sqrt(s * (s-a) * (s-b) * (s-c))\n",
|
| 964 |
+
"\n",
|
| 965 |
+
" return 4 * area / (a * b * c)\n",
|
| 966 |
+
"\n",
|
| 967 |
+
"def calculate_rate_of_change(trajectory):\n",
|
| 968 |
+
" # Calculate the rate of change between each pair of consecutive points\n",
|
| 969 |
+
" changes = np.diff(trajectory, axis=0)\n",
|
| 970 |
+
" rates = np.linalg.norm(changes, axis=1)\n",
|
| 971 |
+
" return np.mean(rates)\n",
|
| 972 |
+
"\n",
|
| 973 |
+
"# Calculate curvature and rate of change\n",
|
| 974 |
+
"curvatures = []\n",
|
| 975 |
+
"rates_of_change = []\n",
|
| 976 |
+
"\n",
|
| 977 |
+
"for traj in trajectories_3d:\n",
|
| 978 |
+
" curvatures.append(calculate_curvature(traj))\n",
|
| 979 |
+
" rates_of_change.append(calculate_rate_of_change(traj))\n",
|
| 980 |
+
"\n",
|
| 981 |
+
"# Add these to the dataframe\n",
|
| 982 |
+
"df['curvature'] = curvatures\n",
|
| 983 |
+
"df['rate_of_change'] = rates_of_change\n",
|
| 984 |
+
"\n",
|
| 985 |
+
"\n",
|
| 986 |
+
"plt.figure(figsize=(12, 6))\n",
|
| 987 |
+
"\n",
|
| 988 |
+
"# Define colors explicitly\n",
|
| 989 |
+
"colors = {'Valid': 'blue', 'Invalid': 'red'}\n",
|
| 990 |
+
"\n",
|
| 991 |
+
"# Prepare the data\n",
|
| 992 |
+
"plot_data = pd.DataFrame({\n",
|
| 993 |
+
" 'Curvature': df['curvature'],\n",
|
| 994 |
+
" 'Validity': df['is_valid'].map({True: 'Valid', False: 'Invalid'})\n",
|
| 995 |
+
"})\n",
|
| 996 |
+
"\n",
|
| 997 |
+
"# Create the histogram plot with explicit colors\n",
|
| 998 |
+
"sns.histplot(data=plot_data, x='Curvature', hue='Validity',\n",
|
| 999 |
+
" element='step', stat='density', common_norm=False,\n",
|
| 1000 |
+
" palette=colors)\n",
|
| 1001 |
+
"\n",
|
| 1002 |
+
"plt.title('Distribution of Trajectory Curvatures', fontsize=16)\n",
|
| 1003 |
+
"plt.xlabel('Curvature', fontsize=14)\n",
|
| 1004 |
+
"plt.ylabel('Density', fontsize=14)\n",
|
| 1005 |
+
"\n",
|
| 1006 |
+
"# Adjust legend\n",
|
| 1007 |
+
"plt.legend(title='Chain Validity', title_fontsize='13', fontsize='12')\n",
|
| 1008 |
+
"\n",
|
| 1009 |
+
"# Calculate mean curvatures for valid and invalid chains\n",
|
| 1010 |
+
"mean_valid = df[df['is_valid']]['curvature'].mean()\n",
|
| 1011 |
+
"mean_invalid = df[~df['is_valid']]['curvature'].mean()\n",
|
| 1012 |
+
"\n",
|
| 1013 |
+
"# Add vertical lines for mean curvatures\n",
|
| 1014 |
+
"plt.axvline(x=mean_valid, color='blue', linestyle='--', label='Mean Valid')\n",
|
| 1015 |
+
"plt.axvline(x=mean_invalid, color='red', linestyle='--', label='Mean Invalid')\n",
|
| 1016 |
+
"\n",
|
| 1017 |
+
"# Add text annotations for mean curvatures\n",
|
| 1018 |
+
"plt.text(mean_valid, plt.gca().get_ylim()[1], f'Mean Valid: {mean_valid:.3f}',\n",
|
| 1019 |
+
" rotation=90, va='top', ha='right', color='blue')\n",
|
| 1020 |
+
"plt.text(mean_invalid, plt.gca().get_ylim()[1], f'Mean Invalid: {mean_invalid:.3f}',\n",
|
| 1021 |
+
" rotation=90, va='top', ha='left', color='red')\n",
|
| 1022 |
+
"\n",
|
| 1023 |
+
"plt.tight_layout()\n",
|
| 1024 |
+
"plt.savefig('refined_curvature_distribution.png', dpi=300, bbox_inches='tight')\n",
|
| 1025 |
+
"plt.show()\n",
|
| 1026 |
+
"\n",
|
| 1027 |
+
"# Calculate and print statistical information\n",
|
| 1028 |
+
"valid_curv = df[df['is_valid']]['curvature']\n",
|
| 1029 |
+
"invalid_curv = df[~df['is_valid']]['curvature']\n",
|
| 1030 |
+
"t_stat, p_value = stats.ttest_ind(valid_curv, invalid_curv)"
|
| 1031 |
+
],
|
| 1032 |
+
"metadata": {
|
| 1033 |
+
"id": "BlXQkEKjCrSK"
|
| 1034 |
+
},
|
| 1035 |
+
"execution_count": null,
|
| 1036 |
+
"outputs": []
|
| 1037 |
+
},
|
| 1038 |
+
{
|
| 1039 |
+
"cell_type": "code",
|
| 1040 |
+
"source": [
|
| 1041 |
+
"plt.figure(figsize=(12, 6))\n",
|
| 1042 |
+
"\n",
|
| 1043 |
+
"# Define colors explicitly\n",
|
| 1044 |
+
"colors = {'Valid': 'blue', 'Invalid': 'red'}\n",
|
| 1045 |
+
"\n",
|
| 1046 |
+
"# Prepare the data\n",
|
| 1047 |
+
"plot_data = pd.DataFrame({\n",
|
| 1048 |
+
" 'Rate of Change': df['rate_of_change'],\n",
|
| 1049 |
+
" 'Validity': df['is_valid'].map({True: 'Valid', False: 'Invalid'})\n",
|
| 1050 |
+
"})\n",
|
| 1051 |
+
"\n",
|
| 1052 |
+
"# Create the histogram plot with explicit colors\n",
|
| 1053 |
+
"sns.histplot(data=plot_data, x='Rate of Change', hue='Validity',\n",
|
| 1054 |
+
" element='step', stat='density', common_norm=False,\n",
|
| 1055 |
+
" palette=colors)\n",
|
| 1056 |
+
"\n",
|
| 1057 |
+
"plt.title('Distribution of Trajectory Rates of Change', fontsize=16)\n",
|
| 1058 |
+
"plt.xlabel('Rate of Change', fontsize=14)\n",
|
| 1059 |
+
"plt.ylabel('Density', fontsize=14)\n",
|
| 1060 |
+
"\n",
|
| 1061 |
+
"# Create custom legend handles\n",
|
| 1062 |
+
"handles = [plt.Rectangle((0,0),1,1, color=colors[label]) for label in colors]\n",
|
| 1063 |
+
"labels = list(colors.keys())\n",
|
| 1064 |
+
"\n",
|
| 1065 |
+
"# Add the legend with custom handles\n",
|
| 1066 |
+
"plt.legend(handles, labels, title='Chain Validity', title_fontsize='13', fontsize='12')\n",
|
| 1067 |
+
"\n",
|
| 1068 |
+
"plt.tight_layout()\n",
|
| 1069 |
+
"plt.savefig('simplified_rate_of_change_distribution.png', dpi=300, bbox_inches='tight')\n",
|
| 1070 |
+
"plt.show()\n",
|
| 1071 |
+
"\n",
|
| 1072 |
+
"# Calculate and print statistical information\n",
|
| 1073 |
+
"valid_roc = df[df['is_valid']]['rate_of_change']\n",
|
| 1074 |
+
"invalid_roc = df[~df['is_valid']]['rate_of_change']\n",
|
| 1075 |
+
"t_stat, p_value = stats.ttest_ind(valid_roc, invalid_roc)\n",
|
| 1076 |
+
"\n",
|
| 1077 |
+
"mean_valid = valid_roc.mean()\n",
|
| 1078 |
+
"mean_invalid = invalid_roc.mean()\n",
|
| 1079 |
+
"\n",
|
| 1080 |
+
"print(\"Distribution of Trajectory Rates of Change\")\n",
|
| 1081 |
+
"print(f\"Average Rate of Change for Valid Chains: {mean_valid:.3f}\")\n",
|
| 1082 |
+
"print(f\"Average Rate of Change for Invalid Chains: {mean_invalid:.3f}\")\n",
|
| 1083 |
+
"print(f\"Correlation between Rate of Change and Validity: {df['rate_of_change'].corr(df['is_valid']):.3f}\")\n",
|
| 1084 |
+
"print(\"\\nT-test for difference in Rate of Change:\")\n",
|
| 1085 |
+
"print(f\"t-statistic: {t_stat:.4f}\")\n",
|
| 1086 |
+
"print(f\"p-value: {p_value:.4f}\")"
|
| 1087 |
+
],
|
| 1088 |
+
"metadata": {
|
| 1089 |
+
"id": "T7GzkWJzCwJe"
|
| 1090 |
+
},
|
| 1091 |
+
"execution_count": null,
|
| 1092 |
+
"outputs": []
|
| 1093 |
+
},
|
| 1094 |
+
{
|
| 1095 |
+
"cell_type": "code",
|
| 1096 |
+
"source": [
|
| 1097 |
+
"# Statistical tests\n",
|
| 1098 |
+
"df['curvature'] = df['curvature'].fillna(0)\n",
|
| 1099 |
+
"df['rate_of_change'] = df['rate_of_change'].astype(float)\n",
|
| 1100 |
+
"valid_curv = df[df['is_valid']]['curvature']\n",
|
| 1101 |
+
"invalid_curv = df[~df['is_valid']]['curvature']\n",
|
| 1102 |
+
"curv_ttest = ttest_ind(valid_curv, invalid_curv)\n",
|
| 1103 |
+
"\n",
|
| 1104 |
+
"valid_roc = df[df['is_valid']]['rate_of_change']\n",
|
| 1105 |
+
"invalid_roc = df[~df['is_valid']]['rate_of_change']\n",
|
| 1106 |
+
"roc_ttest = ttest_ind(valid_roc, invalid_roc)\n",
|
| 1107 |
+
"\n",
|
| 1108 |
+
"print(\"T-test for trajectory curvature:\", curv_ttest)\n",
|
| 1109 |
+
"print(\"T-test for trajectory rate of change:\", roc_ttest)\n",
|
| 1110 |
+
"\n",
|
| 1111 |
+
"# Correlation with energy\n",
|
| 1112 |
+
"curv_energy_corr = df['curvature'].corr(df['H_energy'])\n",
|
| 1113 |
+
"roc_energy_corr = df['rate_of_change'].corr(df['H_energy'])\n",
|
| 1114 |
+
"\n",
|
| 1115 |
+
"print(\"Correlation between curvature and energy:\", curv_energy_corr)\n",
|
| 1116 |
+
"print(\"Correlation between rate of change and energy:\", roc_energy_corr)"
|
| 1117 |
+
],
|
| 1118 |
+
"metadata": {
|
| 1119 |
+
"id": "0PabrOYpC7dK"
|
| 1120 |
+
},
|
| 1121 |
+
"execution_count": null,
|
| 1122 |
+
"outputs": []
|
| 1123 |
+
},
|
| 1124 |
+
{
|
| 1125 |
+
"cell_type": "code",
|
| 1126 |
+
"source": [
|
| 1127 |
+
"# Frenet's framework\n",
|
| 1128 |
+
"def reduce_dimensionality(trajectories, n_components=3):\n",
|
| 1129 |
+
" \"\"\"Reduce dimensionality of trajectories using PCA\"\"\"\n",
|
| 1130 |
+
" flattened = np.vstack(trajectories)\n",
|
| 1131 |
+
" pca = PCA(n_components=n_components)\n",
|
| 1132 |
+
" reduced = pca.fit_transform(flattened)\n",
|
| 1133 |
+
" return reduced.reshape(len(trajectories), -1, n_components), pca\n",
|
| 1134 |
+
"\n",
|
| 1135 |
+
"def frenet_serret_frame(trajectory):\n",
|
| 1136 |
+
" \"\"\"Compute Frenet-Serret frame for a trajectory\"\"\"\n",
|
| 1137 |
+
" # Compute tangent vectors\n",
|
| 1138 |
+
" T = np.diff(trajectory, axis=0)\n",
|
| 1139 |
+
" T_norm = np.linalg.norm(T, axis=1, keepdims=True)\n",
|
| 1140 |
+
" T = np.divide(T, T_norm, where=T_norm!=0)\n",
|
| 1141 |
+
"\n",
|
| 1142 |
+
" # Compute normal vectors\n",
|
| 1143 |
+
" N = np.diff(T, axis=0)\n",
|
| 1144 |
+
" N_norm = np.linalg.norm(N, axis=1, keepdims=True)\n",
|
| 1145 |
+
" N = np.divide(N, N_norm, where=N_norm!=0)\n",
|
| 1146 |
+
"\n",
|
| 1147 |
+
" # Compute binormal vectors\n",
|
| 1148 |
+
" B = np.cross(T[:-1], N)\n",
|
| 1149 |
+
"\n",
|
| 1150 |
+
" return T[:-1], N, B\n",
|
| 1151 |
+
"\n",
|
| 1152 |
+
"def compute_curvature_torsion(T, N, B):\n",
|
| 1153 |
+
" \"\"\"Compute curvature and torsion from Frenet-Serret frame\"\"\"\n",
|
| 1154 |
+
" dT = np.diff(T, axis=0)\n",
|
| 1155 |
+
" curvature = np.linalg.norm(dT, axis=1)\n",
|
| 1156 |
+
"\n",
|
| 1157 |
+
" # Compute torsion\n",
|
| 1158 |
+
" dB = np.diff(B, axis=0)\n",
|
| 1159 |
+
" torsion = np.sum(dB * N[1:], axis=1)\n",
|
| 1160 |
+
"\n",
|
| 1161 |
+
" return np.mean(curvature), np.mean(torsion)\n",
|
| 1162 |
+
"\n",
|
| 1163 |
+
"# Reduce dimensionality of trajectories\n",
|
| 1164 |
+
"reduced_trajectories, pca = reduce_dimensionality(trajectories)\n",
|
| 1165 |
+
"\n",
|
| 1166 |
+
"# Compute Frenet-Serret frames and curvature/torsion\n",
|
| 1167 |
+
"curvatures = []\n",
|
| 1168 |
+
"torsions = []\n",
|
| 1169 |
+
"for i, traj in enumerate(reduced_trajectories):\n",
|
| 1170 |
+
" try:\n",
|
| 1171 |
+
" T, N, B = frenet_serret_frame(traj)\n",
|
| 1172 |
+
" curvature, torsion = compute_curvature_torsion(T, N, B)\n",
|
| 1173 |
+
" curvatures.append(curvature)\n",
|
| 1174 |
+
" torsions.append(torsion)\n",
|
| 1175 |
+
" except Exception as e:\n",
|
| 1176 |
+
" print(f\"Error processing trajectory {i}: {str(e)}\")\n",
|
| 1177 |
+
" print(f\"Trajectory shape: {traj.shape}\")\n",
|
| 1178 |
+
" curvatures.append(np.nan)\n",
|
| 1179 |
+
" torsions.append(np.nan)\n",
|
| 1180 |
+
"\n",
|
| 1181 |
+
"df['curvature'] = curvatures\n",
|
| 1182 |
+
"df['torsion'] = torsions\n",
|
| 1183 |
+
"\n",
|
| 1184 |
+
"# Remove any NaN values\n",
|
| 1185 |
+
"df = df.dropna(subset=['curvature', 'torsion'])\n"
|
| 1186 |
+
],
|
| 1187 |
+
"metadata": {
|
| 1188 |
+
"id": "hgpHHxRz438n"
|
| 1189 |
+
},
|
| 1190 |
+
"execution_count": null,
|
| 1191 |
+
"outputs": []
|
| 1192 |
+
},
|
| 1193 |
+
{
|
| 1194 |
+
"cell_type": "code",
|
| 1195 |
+
"source": [
|
| 1196 |
+
"# Analyze the principal components\n",
|
| 1197 |
+
"explained_variance_ratio = pca.explained_variance_ratio_\n",
|
| 1198 |
+
"cumulative_variance_ratio = np.cumsum(explained_variance_ratio)\n",
|
| 1199 |
+
"\n",
|
| 1200 |
+
"plt.figure(figsize=(10, 6))\n",
|
| 1201 |
+
"plt.plot(range(1, len(explained_variance_ratio) + 1), cumulative_variance_ratio, 'bo-')\n",
|
| 1202 |
+
"plt.xlabel('Number of Components', fontsize=14)\n",
|
| 1203 |
+
"plt.ylabel('Cumulative Explained Variance Ratio', fontsize=14)\n",
|
| 1204 |
+
"plt.title('Explained Variance Ratio by Principal Components', fontsize=16)\n",
|
| 1205 |
+
"plt.savefig('pca_explained_variance.png', dpi=300, bbox_inches='tight')\n",
|
| 1206 |
+
"plt.show()\n",
|
| 1207 |
+
"\n",
|
| 1208 |
+
"print(f\"Explained variance ratio of first 3 components: {explained_variance_ratio[:3]}\")\n",
|
| 1209 |
+
"print(f\"Cumulative explained variance ratio of first 3 components: {cumulative_variance_ratio[2]:.4f}\")"
|
| 1210 |
+
],
|
| 1211 |
+
"metadata": {
|
| 1212 |
+
"id": "UHASmPhm5dsa"
|
| 1213 |
+
},
|
| 1214 |
+
"execution_count": null,
|
| 1215 |
+
"outputs": []
|
| 1216 |
+
},
|
| 1217 |
+
{
|
| 1218 |
+
"cell_type": "code",
|
| 1219 |
+
"source": [
|
| 1220 |
+
"# Compute and visualize Hamiltonian along trajectories\n",
|
| 1221 |
+
"\n",
|
| 1222 |
+
"def hamiltonian(q, p, q_goal):\n",
|
| 1223 |
+
" \"\"\"Hamiltonian function\"\"\"\n",
|
| 1224 |
+
" T = 0.5 * np.dot(p, p) # Kinetic energy\n",
|
| 1225 |
+
" V = sophisticated_potential(q, q_goal) # Potential energy\n",
|
| 1226 |
+
" return T + V\n",
|
| 1227 |
+
"\n",
|
| 1228 |
+
"def sophisticated_potential(q, q_goal):\n",
|
| 1229 |
+
" \"\"\"A more sophisticated potential energy function\"\"\"\n",
|
| 1230 |
+
" similarity = np.dot(q, q_goal) / (np.linalg.norm(q) * np.linalg.norm(q_goal))\n",
|
| 1231 |
+
" complexity = np.linalg.norm(q) # Assume more complex states have higher norm\n",
|
| 1232 |
+
" return -similarity + 0.1 * complexity # Balance between relevance and complexity\n",
|
| 1233 |
+
"\n",
|
| 1234 |
+
"# Compute and visualize Hamiltonian along trajectories\n",
|
| 1235 |
+
"hamiltonians = []\n",
|
| 1236 |
+
"q_goal = np.mean([traj[-1] for traj in trajectories], axis=0) # Assuming the goal is the average final state\n",
|
| 1237 |
+
"\n",
|
| 1238 |
+
"for traj in trajectories:\n",
|
| 1239 |
+
" H = []\n",
|
| 1240 |
+
" for i in range(len(traj)):\n",
|
| 1241 |
+
" q = traj[i]\n",
|
| 1242 |
+
" p = traj[i] - traj[i-1] if i > 0 else np.zeros_like(q) # Estimate momentum as the difference between states\n",
|
| 1243 |
+
" H.append(hamiltonian(q, p, q_goal))\n",
|
| 1244 |
+
" hamiltonians.append(H)\n",
|
| 1245 |
+
"\n",
|
| 1246 |
+
"plt.figure(figsize=(12, 6))\n",
|
| 1247 |
+
"for i, H in enumerate(hamiltonians[:20]): # Plot first 20 for clarity\n",
|
| 1248 |
+
" plt.plot(H, label=f'Trajectory {i+1}')\n",
|
| 1249 |
+
"plt.title('Hamiltonian Evolution Along Reasoning Trajectories', fontsize=16)\n",
|
| 1250 |
+
"plt.xlabel('Time Step', fontsize=16)\n",
|
| 1251 |
+
"plt.ylabel('Hamiltonian',fontsize=16)\n",
|
| 1252 |
+
"plt.legend()\n",
|
| 1253 |
+
"plt.savefig('hamiltonian_evolution_plot.png', dpi=300, bbox_inches='tight')\n",
|
| 1254 |
+
"plt.show()\n",
|
| 1255 |
+
"\n",
|
| 1256 |
+
"# Statistical analysis\n",
|
| 1257 |
+
"valid_curvature = df[df['is_valid']]['curvature']\n",
|
| 1258 |
+
"invalid_curvature = df[~df['is_valid']]['curvature']\n",
|
| 1259 |
+
"t_stat, p_value = stats.ttest_ind(valid_curvature, invalid_curvature)\n",
|
| 1260 |
+
"\n",
|
| 1261 |
+
"print(f\"T-test for curvature: t-statistic = {t_stat}, p-value = {p_value}\")\n",
|
| 1262 |
+
"\n",
|
| 1263 |
+
"# Correlation analysis\n",
|
| 1264 |
+
"correlation = df['curvature'].corr(df['torsion'])\n",
|
| 1265 |
+
"print(f\"Correlation between curvature and torsion: {correlation}\")\n",
|
| 1266 |
+
"\n"
|
| 1267 |
+
],
|
| 1268 |
+
"metadata": {
|
| 1269 |
+
"id": "v0V1WiVN6F6g"
|
| 1270 |
+
},
|
| 1271 |
+
"execution_count": null,
|
| 1272 |
+
"outputs": []
|
| 1273 |
+
},
|
| 1274 |
+
{
|
| 1275 |
+
"cell_type": "code",
|
| 1276 |
+
"source": [
|
| 1277 |
+
"# 3D plot of trajectories\n",
|
| 1278 |
+
"fig = plt.figure(figsize=(12,12))\n",
|
| 1279 |
+
"ax = fig.add_subplot(111, projection='3d')\n",
|
| 1280 |
+
"\n",
|
| 1281 |
+
"for i, traj in enumerate(trajectories_3d[:20]): # Plot first 20 for clarity\n",
|
| 1282 |
+
" color = 'green' if df.iloc[i]['is_valid'] else 'red'\n",
|
| 1283 |
+
" ax.plot(traj[:, 0], traj[:, 1], traj[:, 2], color=color, alpha=0.6)\n",
|
| 1284 |
+
"\n",
|
| 1285 |
+
"ax.set_xlabel('PCA 1', fontsize=14)\n",
|
| 1286 |
+
"ax.set_ylabel('PCA 2', fontsize=14)\n",
|
| 1287 |
+
"ax.set_zlabel('PCA 3', fontsize=14)\n",
|
| 1288 |
+
"ax.set_title('Reasoning Trajectories in PCA Space', fontsize=16)\n",
|
| 1289 |
+
"# Add legend\n",
|
| 1290 |
+
"ax.legend([valid_handle, invalid_handle], ['Valid', 'Invalid'], loc='upper right')\n",
|
| 1291 |
+
"plt.savefig('pca_trajectories_plot.png', dpi=300, bbox_inches='tight')\n",
|
| 1292 |
+
"plt.show()"
|
| 1293 |
+
],
|
| 1294 |
+
"metadata": {
|
| 1295 |
+
"id": "7BuXJCesA-2u"
|
| 1296 |
+
},
|
| 1297 |
+
"execution_count": null,
|
| 1298 |
+
"outputs": []
|
| 1299 |
+
},
|
| 1300 |
+
{
|
| 1301 |
+
"cell_type": "code",
|
| 1302 |
+
"source": [
|
| 1303 |
+
"# Statistical Analysis\n",
|
| 1304 |
+
"\n",
|
| 1305 |
+
"pca_means = np.array([traj.mean(axis=0) for traj in trajectories_3d])\n",
|
| 1306 |
+
"X = pd.DataFrame(pca_means, columns=['PCA1', 'PCA2', 'PCA3'])\n",
|
| 1307 |
+
"y = pd.Series(df['is_valid'].values, name='is_valid')\n",
|
| 1308 |
+
"\n",
|
| 1309 |
+
"# Ensure 'is_valid' is boolean\n",
|
| 1310 |
+
"y = y.astype(bool)\n",
|
| 1311 |
+
"\n",
|
| 1312 |
+
"# Combine X and y into a single DataFrame\n",
|
| 1313 |
+
"data = pd.concat([X, y], axis=1)\n",
|
| 1314 |
+
"\n",
|
| 1315 |
+
"# 1. MANOVA test\n",
|
| 1316 |
+
"manova = MANOVA.from_formula('PCA1 + PCA2 + PCA3 ~ is_valid', data=data)\n",
|
| 1317 |
+
"print(\"MANOVA test results:\")\n",
|
| 1318 |
+
"print(manova.mv_test())\n",
|
| 1319 |
+
"\n",
|
| 1320 |
+
"# 2. T-tests for each PCA dimension\n",
|
| 1321 |
+
"for i in range(3):\n",
|
| 1322 |
+
" t_stat, p_value = stats.ttest_ind(X[f'PCA{i+1}'][y], X[f'PCA{i+1}'][~y])\n",
|
| 1323 |
+
" print(f\"T-test for PCA{i+1}: t-statistic = {t_stat:.4f}, p-value = {p_value:.4f}\")\n",
|
| 1324 |
+
"\n",
|
| 1325 |
+
"# 3. Logistic Regression\n",
|
| 1326 |
+
"log_reg = LogisticRegression()\n",
|
| 1327 |
+
"log_reg.fit(X, y)\n",
|
| 1328 |
+
"y_pred = log_reg.predict(X)\n",
|
| 1329 |
+
"accuracy = accuracy_score(y, y_pred)\n",
|
| 1330 |
+
"print(f\"Logistic Regression Accuracy: {accuracy:.4f}\")\n",
|
| 1331 |
+
"\n",
|
| 1332 |
+
"# 4. Effect sizes (Cohen's d) for each PCA dimension\n",
|
| 1333 |
+
"for i in range(3):\n",
|
| 1334 |
+
" cohens_d = (X[f'PCA{i+1}'][y].mean() - X[f'PCA{i+1}'][~y].mean()) / np.sqrt((X[f'PCA{i+1}'][y].var() + X[f'PCA{i+1}'][~y].var()) / 2)\n",
|
| 1335 |
+
" print(f\"Cohen's d for PCA{i+1}: {cohens_d:.4f}\")\n",
|
| 1336 |
+
"\n",
|
| 1337 |
+
"# 5. Trajectory length comparison\n",
|
| 1338 |
+
"trajectory_lengths = np.array([np.sum(np.sqrt(np.sum(np.diff(traj, axis=0)**2, axis=1))) for traj in trajectories_pca])\n",
|
| 1339 |
+
"t_stat, p_value = stats.ttest_ind(trajectory_lengths[y], trajectory_lengths[~y])\n",
|
| 1340 |
+
"print(f\"T-test for trajectory lengths: t-statistic = {t_stat:.4f}, p-value = {p_value:.4f}\")"
|
| 1341 |
+
],
|
| 1342 |
+
"metadata": {
|
| 1343 |
+
"id": "rqPocLPzDFiM"
|
| 1344 |
+
},
|
| 1345 |
+
"execution_count": null,
|
| 1346 |
+
"outputs": []
|
| 1347 |
+
},
|
| 1348 |
+
{
|
| 1349 |
+
"cell_type": "code",
|
| 1350 |
+
"source": [
|
| 1351 |
+
"# Correlation between trajectory complexity and validity\n",
|
| 1352 |
+
"# Analyze trajectory complexity\n",
|
| 1353 |
+
"def trajectory_complexity(traj):\n",
|
| 1354 |
+
" return np.sum(np.linalg.norm(np.diff(traj, axis=0), axis=1))\n",
|
| 1355 |
+
"\n",
|
| 1356 |
+
"complexities = [trajectory_complexity(traj) for traj in reduced_trajectories]\n",
|
| 1357 |
+
"df['complexity'] = complexities\n",
|
| 1358 |
+
"complexity_correlation = stats.pointbiserialr(df['is_valid'], df['complexity'])\n",
|
| 1359 |
+
"print(f\"Correlation between trajectory complexity and validity: r = {complexity_correlation.correlation:.4f}, p = {complexity_correlation.pvalue:.4f}\")"
|
| 1360 |
+
],
|
| 1361 |
+
"metadata": {
|
| 1362 |
+
"id": "csICTST5BcS5"
|
| 1363 |
+
},
|
| 1364 |
+
"execution_count": null,
|
| 1365 |
+
"outputs": []
|
| 1366 |
+
},
|
| 1367 |
+
{
|
| 1368 |
+
"cell_type": "markdown",
|
| 1369 |
+
"source": [
|
| 1370 |
+
"## Canonical transformations"
|
| 1371 |
+
],
|
| 1372 |
+
"metadata": {
|
| 1373 |
+
"id": "c0kKU3xdVpMf"
|
| 1374 |
+
}
|
| 1375 |
+
},
|
| 1376 |
+
{
|
| 1377 |
+
"cell_type": "code",
|
| 1378 |
+
"source": [
|
| 1379 |
+
"def hamiltonian(state, t, k):\n",
|
| 1380 |
+
" \"\"\"Simple harmonic oscillator Hamiltonian\"\"\"\n",
|
| 1381 |
+
" q, p = state\n",
|
| 1382 |
+
" return p**2 / 2 + k * q**2 / 2\n",
|
| 1383 |
+
"\n",
|
| 1384 |
+
"def hamilton_equations(state, t, k):\n",
|
| 1385 |
+
" \"\"\"Hamilton's equations for simple harmonic oscillator\"\"\"\n",
|
| 1386 |
+
" q, p = state\n",
|
| 1387 |
+
" dqdt = p\n",
|
| 1388 |
+
" dpdt = -k * q\n",
|
| 1389 |
+
" return [dqdt, dpdt]\n",
|
| 1390 |
+
"\n",
|
| 1391 |
+
"def canonical_transform_to_action_angle(q, p, k):\n",
|
| 1392 |
+
" \"\"\"Transform from (q,p) to action-angle variables (I, theta)\"\"\"\n",
|
| 1393 |
+
" I = (p**2 + k * q**2) / (2 * k)\n",
|
| 1394 |
+
" theta = np.arctan2(np.sqrt(k) * q, p)\n",
|
| 1395 |
+
" return I, theta\n",
|
| 1396 |
+
"\n",
|
| 1397 |
+
"def inverse_canonical_transform(I, theta, k):\n",
|
| 1398 |
+
" \"\"\"Transform from action-angle variables (I, theta) back to (q,p)\"\"\"\n",
|
| 1399 |
+
" q = np.sqrt(2 * I / k) * np.sin(theta)\n",
|
| 1400 |
+
" p = np.sqrt(2 * I * k) * np.cos(theta)\n",
|
| 1401 |
+
" return q, p\n",
|
| 1402 |
+
"\n",
|
| 1403 |
+
"# Parameters\n",
|
| 1404 |
+
"k = 1.0 # Spring constant\n",
|
| 1405 |
+
"t = np.linspace(0, 10, 100)\n",
|
| 1406 |
+
"\n",
|
| 1407 |
+
"# Apply canonical transformation to our trajectories\n",
|
| 1408 |
+
"action_angle_trajectories = []\n",
|
| 1409 |
+
"for traj in trajectories_pca:\n",
|
| 1410 |
+
" q, p = traj[:, 0], traj[:, 1] # Assuming first two PCs represent position and momentum\n",
|
| 1411 |
+
" I, theta = canonical_transform_to_action_angle(q, p, k)\n",
|
| 1412 |
+
" action_angle_trajectories.append(np.column_stack((I, theta)))\n",
|
| 1413 |
+
"\n",
|
| 1414 |
+
"\n",
|
| 1415 |
+
"# Analysis\n",
|
| 1416 |
+
"action_means_valid = [np.mean(traj[:, 0]) for traj, valid in zip(action_angle_trajectories, df['is_valid'].tolist()) if valid]\n",
|
| 1417 |
+
"action_means_nonvalid = [np.mean(traj[:, 0]) for traj, valid in zip(action_angle_trajectories, df['is_valid'].tolist()) if not valid]\n",
|
| 1418 |
+
"angle_ranges_valid = [np.ptp(traj[:, 1]) for traj, valid in zip(action_angle_trajectories, df['is_valid'].tolist()) if valid]\n",
|
| 1419 |
+
"angle_ranges_nonvalid = [np.ptp(traj[:, 1]) for traj, valid in zip(action_angle_trajectories, df['is_valid'].tolist()) if not valid]\n",
|
| 1420 |
+
"\n",
|
| 1421 |
+
"print(f\"Mean action for valid chains: {np.mean(action_means_valid):.4f}\")\n",
|
| 1422 |
+
"print(f\"Mean action for non-valid chains: {np.mean(action_means_nonvalid):.4f}\")\n",
|
| 1423 |
+
"print(f\"Mean angle range for valid chains: {np.mean(angle_ranges_valid):.4f}\")\n",
|
| 1424 |
+
"print(f\"Mean angle range for non-valid chains: {np.mean(angle_ranges_nonvalid):.4f}\")\n",
|
| 1425 |
+
"\n",
|
| 1426 |
+
"# Statistical tests\n",
|
| 1427 |
+
"from scipy import stats\n",
|
| 1428 |
+
"\n",
|
| 1429 |
+
"t_stat, p_value = stats.ttest_ind(action_means_valid, action_means_nonvalid)\n",
|
| 1430 |
+
"print(f\"T-test for action means: t-statistic = {t_stat:.4f}, p-value = {p_value:.4f}\")\n",
|
| 1431 |
+
"\n",
|
| 1432 |
+
"t_stat, p_value = stats.ttest_ind(angle_ranges_valid, angle_ranges_nonvalid)\n",
|
| 1433 |
+
"print(f\"T-test for angle ranges: t-statistic = {t_stat:.4f}, p-value = {p_value:.4f}\")\n",
|
| 1434 |
+
"\n",
|
| 1435 |
+
"# Classify trajectories based on action and angle properties\n",
|
| 1436 |
+
"def classify_trajectory(action, angle_range, valid):\n",
|
| 1437 |
+
" high_action = np.mean(action_means_valid if valid else action_means_nonvalid) + np.std(action_means_valid if valid else action_means_nonvalid)\n",
|
| 1438 |
+
" low_action = np.mean(action_means_valid if valid else action_means_nonvalid) - np.std(action_means_valid if valid else action_means_nonvalid)\n",
|
| 1439 |
+
" high_angle_range = np.mean(angle_ranges_valid if valid else angle_ranges_nonvalid) + np.std(angle_ranges_valid if valid else angle_ranges_nonvalid)\n",
|
| 1440 |
+
"\n",
|
| 1441 |
+
" if action > high_action and angle_range > high_angle_range:\n",
|
| 1442 |
+
" return \"High energy, complex reasoning\"\n",
|
| 1443 |
+
" elif action < low_action and angle_range > high_angle_range:\n",
|
| 1444 |
+
" return \"Low energy, exploratory reasoning\"\n",
|
| 1445 |
+
" elif action > high_action and angle_range <= high_angle_range:\n",
|
| 1446 |
+
" return \"High energy, focused reasoning\"\n",
|
| 1447 |
+
" elif action < low_action and angle_range <= high_angle_range:\n",
|
| 1448 |
+
" return \"Low energy, simple reasoning\"\n",
|
| 1449 |
+
" else:\n",
|
| 1450 |
+
" return \"Moderate reasoning\""
|
| 1451 |
+
],
|
| 1452 |
+
"metadata": {
|
| 1453 |
+
"id": "Pm52IjYTXMMH"
|
| 1454 |
+
},
|
| 1455 |
+
"execution_count": null,
|
| 1456 |
+
"outputs": []
|
| 1457 |
+
},
|
| 1458 |
+
{
|
| 1459 |
+
"cell_type": "code",
|
| 1460 |
+
"source": [
|
| 1461 |
+
"# Plotting\n",
|
| 1462 |
+
"fig = plt.figure(figsize=(15, 5))\n",
|
| 1463 |
+
"\n",
|
| 1464 |
+
"# Original space\n",
|
| 1465 |
+
"ax1 = fig.add_subplot(131)\n",
|
| 1466 |
+
"for traj, valid in zip(trajectories_pca[:10], df['is_valid'].tolist()[:10]): # Plot first 10 for clarity\n",
|
| 1467 |
+
" color = 'green' if valid else 'red'\n",
|
| 1468 |
+
" ax1.plot(traj[:, 0], traj[:, 1], color=color, alpha=0.7)\n",
|
| 1469 |
+
"ax1.set_xlabel('PC1 (q)', fontsize=12)\n",
|
| 1470 |
+
"ax1.set_ylabel('PC2 (p)', fontsize=12)\n",
|
| 1471 |
+
"ax1.set_title('Original Phase Space', fontsize=14)\n",
|
| 1472 |
+
"ax1.legend([valid_handle, invalid_handle], ['Valid', 'Invalid'], loc='upper right', fontsize=12)\n",
|
| 1473 |
+
"\n",
|
| 1474 |
+
"# Action-Angle space\n",
|
| 1475 |
+
"ax2 = fig.add_subplot(132)\n",
|
| 1476 |
+
"for traj, valid in zip(action_angle_trajectories[:10], df['is_valid'].tolist()[:10]):\n",
|
| 1477 |
+
" color = 'green' if valid else 'red'\n",
|
| 1478 |
+
" ax2.plot(traj[:, 0], traj[:, 1], color=color, alpha=0.7)\n",
|
| 1479 |
+
"ax2.set_xlabel('Action (I)', fontsize=12)\n",
|
| 1480 |
+
"ax2.set_ylabel('Angle (theta)', fontsize=12)\n",
|
| 1481 |
+
"ax2.set_title('Action-Angle Space', fontsize=14)\n",
|
| 1482 |
+
"ax2.legend([valid_handle, invalid_handle], ['Valid', 'Invalid'], loc='upper right', fontsize=12)\n",
|
| 1483 |
+
"\n",
|
| 1484 |
+
"# 3D visualization\n",
|
| 1485 |
+
"ax3 = fig.add_subplot(133, projection='3d')\n",
|
| 1486 |
+
"for traj, valid in zip(action_angle_trajectories[:10], df['is_valid'].tolist()[:10]):\n",
|
| 1487 |
+
" color = 'green' if valid else 'red'\n",
|
| 1488 |
+
" ax3.plot(traj[:, 0], np.cos(traj[:, 1]), np.sin(traj[:, 1]), color=color, alpha=0.7)\n",
|
| 1489 |
+
"ax3.set_xlabel('Action (I)', fontsize=12)\n",
|
| 1490 |
+
"ax3.set_ylabel('cos(theta)', fontsize=12)\n",
|
| 1491 |
+
"ax3.set_zlabel('sin(theta)', fontsize=12)\n",
|
| 1492 |
+
"ax3.set_title('3D Action-Angle Space', fontsize=14)\n",
|
| 1493 |
+
"ax3.legend([valid_handle, invalid_handle], ['Valid', 'Invalid'], loc='upper right', fontsize=12)\n",
|
| 1494 |
+
"\n",
|
| 1495 |
+
"plt.tight_layout()\n",
|
| 1496 |
+
"plt.savefig('canonical_transformation_analysis_with_validity.png', dpi=300, bbox_inches='tight')\n",
|
| 1497 |
+
"plt.show()"
|
| 1498 |
+
],
|
| 1499 |
+
"metadata": {
|
| 1500 |
+
"id": "YlzvprO0ZBo1"
|
| 1501 |
+
},
|
| 1502 |
+
"execution_count": null,
|
| 1503 |
+
"outputs": []
|
| 1504 |
+
},
|
| 1505 |
+
{
|
| 1506 |
+
"cell_type": "markdown",
|
| 1507 |
+
"source": [
|
| 1508 |
+
"## Conservation laws"
|
| 1509 |
+
],
|
| 1510 |
+
"metadata": {
|
| 1511 |
+
"id": "b-FE7nQWW1Oe"
|
| 1512 |
+
}
|
| 1513 |
+
},
|
| 1514 |
+
{
|
| 1515 |
+
"cell_type": "code",
|
| 1516 |
+
"source": [
|
| 1517 |
+
"def calculate_hamiltonian(q, p):\n",
|
| 1518 |
+
" \"\"\"Simple Hamiltonian function\"\"\"\n",
|
| 1519 |
+
" return 0.5 * (q**2 + p**2)\n",
|
| 1520 |
+
"\n",
|
| 1521 |
+
"def calculate_angular_momentum(q, p):\n",
|
| 1522 |
+
" \"\"\"Angular momentum-like quantity\"\"\"\n",
|
| 1523 |
+
" return q * p\n",
|
| 1524 |
+
"\n",
|
| 1525 |
+
"def calculate_energy_like_quantity(q, p):\n",
|
| 1526 |
+
" \"\"\"Energy-like conserved quantity\"\"\"\n",
|
| 1527 |
+
" return q**2 - p**2\n",
|
| 1528 |
+
"\n",
|
| 1529 |
+
"def analyze_conservation(trajectories, quantity_func, quantity_name):\n",
|
| 1530 |
+
" conserved_scores = []\n",
|
| 1531 |
+
" for traj in trajectories:\n",
|
| 1532 |
+
" q_start, q_end = traj[:, 0]\n",
|
| 1533 |
+
" p_start, p_end = traj[:, 1]\n",
|
| 1534 |
+
" quantity_start = quantity_func(q_start, p_start)\n",
|
| 1535 |
+
" quantity_end = quantity_func(q_end, p_end)\n",
|
| 1536 |
+
" change = abs(quantity_end - quantity_start)\n",
|
| 1537 |
+
" conserved_scores.append(change)\n",
|
| 1538 |
+
" return conserved_scores\n",
|
| 1539 |
+
"\n",
|
| 1540 |
+
"# Analyze conservation for different quantities\n",
|
| 1541 |
+
"hamiltonian_scores = analyze_conservation(trajectories_2d, calculate_hamiltonian, \"Hamiltonian\")\n",
|
| 1542 |
+
"angular_momentum_scores = analyze_conservation(trajectories_2d, calculate_angular_momentum, \"Angular Momentum\")\n",
|
| 1543 |
+
"energy_scores = analyze_conservation(trajectories_2d, calculate_energy_like_quantity, \"Energy-like Quantity\")\n",
|
| 1544 |
+
"\n",
|
| 1545 |
+
"# Print some statistics\n",
|
| 1546 |
+
"print(\"Hamiltonian changes - Mean: {:.4f}, Std: {:.4f}\".format(np.mean(hamiltonian_scores), np.std(hamiltonian_scores)))\n",
|
| 1547 |
+
"print(\"Angular Momentum changes - Mean: {:.4f}, Std: {:.4f}\".format(np.mean(angular_momentum_scores), np.std(angular_momentum_scores)))\n",
|
| 1548 |
+
"print(\"Energy-like Quantity changes - Mean: {:.4f}, Std: {:.4f}\".format(np.mean(energy_scores), np.std(energy_scores)))"
|
| 1549 |
+
],
|
| 1550 |
+
"metadata": {
|
| 1551 |
+
"id": "t_aym0wlWBpg"
|
| 1552 |
+
},
|
| 1553 |
+
"execution_count": null,
|
| 1554 |
+
"outputs": []
|
| 1555 |
+
},
|
| 1556 |
+
{
|
| 1557 |
+
"cell_type": "code",
|
| 1558 |
+
"source": [
|
| 1559 |
+
"# Visualize conservation of quantities\n",
|
| 1560 |
+
"plt.figure(figsize=(15, 5))\n",
|
| 1561 |
+
"\n",
|
| 1562 |
+
"plt.subplot(131)\n",
|
| 1563 |
+
"plt.hist(hamiltonian_scores, bins=20, color='blue', alpha=0.7)\n",
|
| 1564 |
+
"plt.title(\"Conservation of Hamiltonian\", fontsize=16)\n",
|
| 1565 |
+
"plt.xlabel(\"Standard Error\", fontsize=14)\n",
|
| 1566 |
+
"plt.ylabel(\"Frequency\", fontsize=14)\n",
|
| 1567 |
+
"\n",
|
| 1568 |
+
"plt.subplot(132)\n",
|
| 1569 |
+
"plt.hist(angular_momentum_scores, bins=20, color='green', alpha=0.7)\n",
|
| 1570 |
+
"plt.title(\"Conservation of Angular Momentum\", fontsize=16)\n",
|
| 1571 |
+
"plt.xlabel(\"Standard Error\", fontsize=14)\n",
|
| 1572 |
+
"plt.ylabel(\"Frequency\", fontsize=14)\n",
|
| 1573 |
+
"\n",
|
| 1574 |
+
"plt.subplot(133)\n",
|
| 1575 |
+
"plt.hist(energy_scores, bins=20, color='red', alpha=0.7)\n",
|
| 1576 |
+
"plt.title(\"Conservation of Energy-like Quantity\", fontsize=16)\n",
|
| 1577 |
+
"plt.xlabel(\"Standard Error\", fontsize=14)\n",
|
| 1578 |
+
"plt.ylabel(\"Frequency\", fontsize=14)\n",
|
| 1579 |
+
"\n",
|
| 1580 |
+
"plt.tight_layout()\n",
|
| 1581 |
+
"plt.savefig('conservation_laws_analysis.png', dpi=300, bbox_inches='tight')\n",
|
| 1582 |
+
"plt.show()"
|
| 1583 |
+
],
|
| 1584 |
+
"metadata": {
|
| 1585 |
+
"id": "zOFQfeap55P7"
|
| 1586 |
+
},
|
| 1587 |
+
"execution_count": null,
|
| 1588 |
+
"outputs": []
|
| 1589 |
+
},
|
| 1590 |
+
{
|
| 1591 |
+
"cell_type": "code",
|
| 1592 |
+
"source": [
|
| 1593 |
+
"# Calculate the overall range for x-axis\n",
|
| 1594 |
+
"all_scores = np.concatenate([hamiltonian_scores, angular_momentum_scores, energy_scores])\n",
|
| 1595 |
+
"min_score = np.min(all_scores)\n",
|
| 1596 |
+
"max_score = np.max(all_scores)\n",
|
| 1597 |
+
"\n",
|
| 1598 |
+
"# Create bins that cover the entire range\n",
|
| 1599 |
+
"bins = np.linspace(min_score, max_score, 21) # 20 bins\n",
|
| 1600 |
+
"\n",
|
| 1601 |
+
"# Compute histograms\n",
|
| 1602 |
+
"h_hist, _ = np.histogram(hamiltonian_scores, bins=bins)\n",
|
| 1603 |
+
"a_hist, _ = np.histogram(angular_momentum_scores, bins=bins)\n",
|
| 1604 |
+
"e_hist, _ = np.histogram(energy_scores, bins=bins)\n",
|
| 1605 |
+
"\n",
|
| 1606 |
+
"# Find the maximum frequency across all histograms\n",
|
| 1607 |
+
"max_freq = max(np.max(h_hist), np.max(a_hist), np.max(e_hist))\n",
|
| 1608 |
+
"\n",
|
| 1609 |
+
"plt.figure(figsize=(15, 5))\n",
|
| 1610 |
+
"\n",
|
| 1611 |
+
"plt.subplot(131)\n",
|
| 1612 |
+
"plt.hist(hamiltonian_scores, bins=bins, color='blue', alpha=0.7)\n",
|
| 1613 |
+
"plt.title(\"Conservation of Hamiltonian\", fontsize=16)\n",
|
| 1614 |
+
"plt.xlabel(\"Standard Error\", fontsize=14)\n",
|
| 1615 |
+
"plt.ylabel(\"Frequency\", fontsize=14)\n",
|
| 1616 |
+
"plt.xlim(min_score, max_score)\n",
|
| 1617 |
+
"plt.ylim(0, max_freq)\n",
|
| 1618 |
+
"\n",
|
| 1619 |
+
"plt.subplot(132)\n",
|
| 1620 |
+
"plt.hist(angular_momentum_scores, bins=bins, color='green', alpha=0.7)\n",
|
| 1621 |
+
"plt.title(\"Conservation of Angular Momentum\", fontsize=16)\n",
|
| 1622 |
+
"plt.xlabel(\"Standard Error\", fontsize=14)\n",
|
| 1623 |
+
"plt.ylabel(\"Frequency\", fontsize=14)\n",
|
| 1624 |
+
"plt.xlim(min_score, max_score)\n",
|
| 1625 |
+
"plt.ylim(0, max_freq)\n",
|
| 1626 |
+
"\n",
|
| 1627 |
+
"plt.subplot(133)\n",
|
| 1628 |
+
"plt.hist(energy_scores, bins=bins, color='red', alpha=0.7)\n",
|
| 1629 |
+
"plt.title(\"Conservation of Energy-like Quantity\", fontsize=16)\n",
|
| 1630 |
+
"plt.xlabel(\"Standard Error\", fontsize=14)\n",
|
| 1631 |
+
"plt.ylabel(\"Frequency\", fontsize=14)\n",
|
| 1632 |
+
"plt.xlim(min_score, max_score)\n",
|
| 1633 |
+
"plt.ylim(0, max_freq)\n",
|
| 1634 |
+
"\n",
|
| 1635 |
+
"plt.tight_layout()\n",
|
| 1636 |
+
"plt.savefig('conservation_laws_analysis_same_scales.png', dpi=300, bbox_inches='tight')\n",
|
| 1637 |
+
"plt.show()"
|
| 1638 |
+
],
|
| 1639 |
+
"metadata": {
|
| 1640 |
+
"id": "9FYy8-nIZwsy"
|
| 1641 |
+
},
|
| 1642 |
+
"execution_count": null,
|
| 1643 |
+
"outputs": []
|
| 1644 |
+
},
|
| 1645 |
+
{
|
| 1646 |
+
"cell_type": "code",
|
| 1647 |
+
"source": [
|
| 1648 |
+
"def calculate_trajectory_entropy(trajectory):\n",
|
| 1649 |
+
" \"\"\"Calculate the entropy of a trajectory.\"\"\"\n",
|
| 1650 |
+
" # Discretize the trajectory into bins\n",
|
| 1651 |
+
" hist, _ = np.histogram(trajectory, bins=20, density=True)\n",
|
| 1652 |
+
" return entropy(hist)\n",
|
| 1653 |
+
"\n",
|
| 1654 |
+
"def calculate_free_energy(trajectory, temperature=1.0):\n",
|
| 1655 |
+
" \"\"\"Calculate a free energy analog for a trajectory.\"\"\"\n",
|
| 1656 |
+
" # Assume energy is proportional to the squared distance from the origin\n",
|
| 1657 |
+
" energy = np.sum(trajectory**2, axis=1)\n",
|
| 1658 |
+
" entropy = calculate_trajectory_entropy(energy)\n",
|
| 1659 |
+
" return np.mean(energy) - temperature * entropy\n",
|
| 1660 |
+
"\n",
|
| 1661 |
+
"# Apply to all trajectories\n",
|
| 1662 |
+
"trajectory_entropies = [calculate_trajectory_entropy(traj) for traj in trajectories_2d]\n",
|
| 1663 |
+
"free_energies = [calculate_free_energy(traj) for traj in trajectories_2d]\n",
|
| 1664 |
+
"\n",
|
| 1665 |
+
"# Analyze the results\n",
|
| 1666 |
+
"print(\"Mean trajectory entropy:\", np.mean(trajectory_entropies))\n",
|
| 1667 |
+
"print(\"Mean free energy:\", np.mean(free_energies))\n",
|
| 1668 |
+
"\n",
|
| 1669 |
+
"# Visualize the results\n",
|
| 1670 |
+
"plt.figure(figsize=(12, 5))\n",
|
| 1671 |
+
"plt.subplot(121)\n",
|
| 1672 |
+
"plt.hist(trajectory_entropies, bins=20)\n",
|
| 1673 |
+
"plt.title(\"Distribution of Trajectory Entropies\", fontsize=16)\n",
|
| 1674 |
+
"plt.xlabel(\"Entropy\", fontsize=14)\n",
|
| 1675 |
+
"plt.ylabel(\"Frequency\", fontsize=14)\n",
|
| 1676 |
+
"\n",
|
| 1677 |
+
"plt.subplot(122)\n",
|
| 1678 |
+
"plt.hist(free_energies, bins=20)\n",
|
| 1679 |
+
"plt.title(\"Distribution of Free Energies\", fontsize=16)\n",
|
| 1680 |
+
"plt.xlabel(\"Free Energy\", fontsize=14)\n",
|
| 1681 |
+
"plt.ylabel(\"Frequency\", fontsize=14)\n",
|
| 1682 |
+
"plt.tight_layout()\n",
|
| 1683 |
+
"plt.show()"
|
| 1684 |
+
],
|
| 1685 |
+
"metadata": {
|
| 1686 |
+
"id": "Ws8Ugh7kbj9T"
|
| 1687 |
+
},
|
| 1688 |
+
"execution_count": null,
|
| 1689 |
+
"outputs": []
|
| 1690 |
+
},
|
| 1691 |
+
{
|
| 1692 |
+
"cell_type": "code",
|
| 1693 |
+
"source": [
|
| 1694 |
+
"def measure_computation_time(trajectories, num_samples):\n",
|
| 1695 |
+
" \"\"\"Measure computation time for different numbers of trajectories.\"\"\"\n",
|
| 1696 |
+
" times = []\n",
|
| 1697 |
+
" sample_sizes = range(100, num_samples, 100)\n",
|
| 1698 |
+
"\n",
|
| 1699 |
+
" for size in sample_sizes:\n",
|
| 1700 |
+
" start_time = time.time()\n",
|
| 1701 |
+
" _ = [analyze_trajectory(traj) for traj in trajectories[:size]]\n",
|
| 1702 |
+
" end_time = time.time()\n",
|
| 1703 |
+
" times.append(end_time - start_time)\n",
|
| 1704 |
+
"\n",
|
| 1705 |
+
" return sample_sizes, times\n",
|
| 1706 |
+
"\n",
|
| 1707 |
+
"def analyze_trajectory(trajectory):\n",
|
| 1708 |
+
" \"\"\"Placeholder for your trajectory analysis function.\"\"\"\n",
|
| 1709 |
+
" # Replace this with your actual analysis\n",
|
| 1710 |
+
" return calculate_hamiltonian(trajectory[:, 0], trajectory[:, 1])\n",
|
| 1711 |
+
"\n",
|
| 1712 |
+
"# Measure computation time\n",
|
| 1713 |
+
"sample_sizes, computation_times = measure_computation_time(trajectories_2d, len(trajectories_2d))\n"
|
| 1714 |
+
],
|
| 1715 |
+
"metadata": {
|
| 1716 |
+
"id": "c4hO5bUXb_VP"
|
| 1717 |
+
},
|
| 1718 |
+
"execution_count": null,
|
| 1719 |
+
"outputs": []
|
| 1720 |
+
},
|
| 1721 |
+
{
|
| 1722 |
+
"cell_type": "code",
|
| 1723 |
+
"source": [
|
| 1724 |
+
"# Plot the results\n",
|
| 1725 |
+
"plt.figure(figsize=(10, 6))\n",
|
| 1726 |
+
"plt.plot(sample_sizes, computation_times, 'b-')\n",
|
| 1727 |
+
"plt.title(\"Computational Complexity\", fontsize=16)\n",
|
| 1728 |
+
"plt.xlabel(\"Number of Trajectories\", fontsize=14)\n",
|
| 1729 |
+
"plt.ylabel(\"Computation Time (seconds)\", fontsize=14)\n",
|
| 1730 |
+
"plt.grid(True)\n",
|
| 1731 |
+
"plt.show()"
|
| 1732 |
+
],
|
| 1733 |
+
"metadata": {
|
| 1734 |
+
"id": "OWw-V4apZX48"
|
| 1735 |
+
},
|
| 1736 |
+
"execution_count": null,
|
| 1737 |
+
"outputs": []
|
| 1738 |
+
},
|
| 1739 |
+
{
|
| 1740 |
+
"cell_type": "code",
|
| 1741 |
+
"source": [
|
| 1742 |
+
"# Estimate complexity\n",
|
| 1743 |
+
"def complexity_function(x, a, b):\n",
|
| 1744 |
+
" return a * x**b\n",
|
| 1745 |
+
"\n",
|
| 1746 |
+
"popt, _ = curve_fit(complexity_function, sample_sizes, computation_times)\n",
|
| 1747 |
+
"\n",
|
| 1748 |
+
"print(f\"Estimated complexity: O(n^{popt[1]:.2f})\")"
|
| 1749 |
+
],
|
| 1750 |
+
"metadata": {
|
| 1751 |
+
"id": "Pady9Cj8ZIdz"
|
| 1752 |
+
},
|
| 1753 |
+
"execution_count": null,
|
| 1754 |
+
"outputs": []
|
| 1755 |
+
},
|
| 1756 |
+
{
|
| 1757 |
+
"cell_type": "code",
|
| 1758 |
+
"source": [
|
| 1759 |
+
"def classify_trajectory(trajectory):\n",
|
| 1760 |
+
" \"\"\"Classify a trajectory as valid or invalid based on Hamiltonian conservation.\"\"\"\n",
|
| 1761 |
+
" hamiltonian_change = np.abs(calculate_hamiltonian(trajectory[0, 0], trajectory[0, 1]) -\n",
|
| 1762 |
+
" calculate_hamiltonian(trajectory[-1, 0], trajectory[-1, 1]))\n",
|
| 1763 |
+
" return hamiltonian_change < 0.5 # Threshold for classification\n",
|
| 1764 |
+
"\n",
|
| 1765 |
+
"# Split the data\n",
|
| 1766 |
+
"X_train, X_test, y_train, y_test = train_test_split(trajectories_2d, df['is_valid'], test_size=0.2, random_state=42)\n",
|
| 1767 |
+
"\n",
|
| 1768 |
+
"# Classify test set\n",
|
| 1769 |
+
"y_pred = [classify_trajectory(traj) for traj in X_test]\n",
|
| 1770 |
+
"\n",
|
| 1771 |
+
"# Analyze errors\n",
|
| 1772 |
+
"conf_matrix = confusion_matrix(y_test, y_pred)\n",
|
| 1773 |
+
"class_report = classification_report(y_test, y_pred)\n",
|
| 1774 |
+
"\n",
|
| 1775 |
+
"print(\"Confusion Matrix:\")\n",
|
| 1776 |
+
"print(conf_matrix)\n",
|
| 1777 |
+
"print(\"\\nClassification Report:\")\n",
|
| 1778 |
+
"print(class_report)\n",
|
| 1779 |
+
"\n",
|
| 1780 |
+
"# Analyze misclassified trajectories\n",
|
| 1781 |
+
"misclassified = X_test[y_test != y_pred]\n",
|
| 1782 |
+
"misclassified_labels = y_test[y_test != y_pred]\n",
|
| 1783 |
+
"\n",
|
| 1784 |
+
"print(\"\\nAnalysis of Misclassified Trajectories:\")\n",
|
| 1785 |
+
"for i, (traj, true_label) in enumerate(zip(misclassified, misclassified_labels)):\n",
|
| 1786 |
+
" hamiltonian_change = np.abs(calculate_hamiltonian(traj[0, 0], traj[0, 1]) -\n",
|
| 1787 |
+
" calculate_hamiltonian(traj[-1, 0], traj[-1, 1]))\n",
|
| 1788 |
+
" print(f\"Trajectory {i}:\")\n",
|
| 1789 |
+
" print(f\" True label: {'Valid' if true_label else 'Invalid'}\")\n",
|
| 1790 |
+
" print(f\" Predicted: {'Valid' if classify_trajectory(traj) else 'Invalid'}\")\n",
|
| 1791 |
+
" print(f\" Hamiltonian change: {hamiltonian_change:.4f}\")\n",
|
| 1792 |
+
" print(f\" Start point: {traj[0]}\")\n",
|
| 1793 |
+
" print(f\" End point: {traj[-1]}\")\n",
|
| 1794 |
+
" print()\n",
|
| 1795 |
+
"\n",
|
| 1796 |
+
"# Visualize some misclassified trajectories\n",
|
| 1797 |
+
"plt.figure(figsize=(15, 5))\n",
|
| 1798 |
+
"for i in range(3):\n",
|
| 1799 |
+
" plt.subplot(1, 3, i+1)\n",
|
| 1800 |
+
" plt.plot(misclassified[i][:, 0], misclassified[i][:, 1], 'r-')\n",
|
| 1801 |
+
" plt.scatter(misclassified[i][0, 0], misclassified[i][0, 1], c='g', label='Start')\n",
|
| 1802 |
+
" plt.scatter(misclassified[i][-1, 0], misclassified[i][-1, 1], c='b', label='End')\n",
|
| 1803 |
+
" plt.title(f\"Misclassified Trajectory {i+1}\", fontsize=16)\n",
|
| 1804 |
+
" plt.xlabel(\"PC1\", fontsize=14)\n",
|
| 1805 |
+
" plt.ylabel(\"PC2\", fontsize=14)\n",
|
| 1806 |
+
" plt.legend()\n",
|
| 1807 |
+
"plt.tight_layout()\n",
|
| 1808 |
+
"plt.show()"
|
| 1809 |
+
],
|
| 1810 |
+
"metadata": {
|
| 1811 |
+
"id": "p9PhYaNpcJJd"
|
| 1812 |
+
},
|
| 1813 |
+
"execution_count": null,
|
| 1814 |
+
"outputs": []
|
| 1815 |
+
}
|
| 1816 |
+
]
|
| 1817 |
+
}
|