Spaces:

vkapoor
/

Entra

Sleeping

App Files Community

vkapoor committed on Dec 27, 2025

Commit

64a8ef6

1 Parent(s): df9a12c

push app

Browse files

Files changed (1) hide show

app.py +27 -12

app.py CHANGED Viewed

@@ -126,11 +126,12 @@ def run_transformation(
     # Get entropy comparison
     entropy = transformer.get_entropy_comparison(df, df_transformed)
     # Create plots
     fig_scatter = create_scatter_plot(df, df_transformed, columns)
     fig_hist = create_histogram_plot(df, df_transformed, columns)
-    fig_history = create_history_plot(transformer.history_)
     # Create results text
     results_text = format_results(entropy, transformer.history_)
@@ -196,7 +197,7 @@ def create_histogram_plot(df_orig, df_trans, columns):
     return fig
-def create_history_plot(history):
     """Create optimization history plot."""
     fig, axes = plt.subplots(1, 2, figsize=(12, 4))
@@ -209,11 +210,18 @@ def create_history_plot(history):
     # Gaussian entropy
     axes[1].plot(history["iteration"], history["gaussian_entropy"], "r-o", markersize=4)
     axes[1].set_xlabel("Iteration")
     axes[1].set_ylabel("H(Gaussian)")
-    axes[1].set_title(
-        "Gaussian Entropy Bound\n(decreases because we start from uniform)"
-    )
     axes[1].grid(True, alpha=0.3)
     plt.tight_layout()
@@ -225,22 +233,29 @@ def format_results(entropy, history):
     det_reduction = (
         entropy["original"]["determinant"] / entropy["transformed"]["determinant"]
     )
     text = f"""
 TRANSFORMATION RESULTS
 {'=' * 50}
-Entropy Comparison (k-NN estimator):
-  Original:    {entropy['original']['knn_entropy']:.6f} nats
-  Transformed: {entropy['transformed']['knn_entropy']:.6f} nats
-  Difference:  {abs(entropy['original']['knn_entropy'] - entropy['transformed']['knn_entropy']):.6f} nats
-  (k-NN entropy should remain ~constant for volume-preserving transformation)
 Gaussian Entropy of Transformed Data:
-  H(Gaussian): {entropy['transformed']['gaussian_entropy']:.6f} nats
-  (This is the entropy IF the transformed data were perfectly Gaussian)
 Covariance Determinant:
   Original:    {entropy['original']['determinant']:.6e}

     # Get entropy comparison
     entropy = transformer.get_entropy_comparison(df, df_transformed)
+    target_entropy = entropy["original"]["uniform_entropy"]
     # Create plots
     fig_scatter = create_scatter_plot(df, df_transformed, columns)
     fig_hist = create_histogram_plot(df, df_transformed, columns)
+    fig_history = create_history_plot(transformer.history_, target_entropy=target_entropy)
     # Create results text
     results_text = format_results(entropy, transformer.history_)
     return fig
+def create_history_plot(history, target_entropy=None):
     """Create optimization history plot."""
     fig, axes = plt.subplots(1, 2, figsize=(12, 4))
     # Gaussian entropy
     axes[1].plot(history["iteration"], history["gaussian_entropy"], "r-o", markersize=4)
+    if target_entropy is not None:
+        axes[1].axhline(
+            target_entropy,
+            color="green",
+            linestyle="--",
+            linewidth=2,
+            label=f"Target H(uniform) = {target_entropy:.4f}",
+        )
+        axes[1].legend()
     axes[1].set_xlabel("Iteration")
     axes[1].set_ylabel("H(Gaussian)")
+    axes[1].set_title("Gaussian Entropy → Target Uniform Entropy")
     axes[1].grid(True, alpha=0.3)
     plt.tight_layout()
     det_reduction = (
         entropy["original"]["determinant"] / entropy["transformed"]["determinant"]
     )
+    target_entropy = entropy["original"]["uniform_entropy"]
+    final_entropy = entropy["transformed"]["gaussian_entropy"]
+    entropy_gap = final_entropy - target_entropy
     text = f"""
 TRANSFORMATION RESULTS
 {'=' * 50}
+Target Entropy (Uniform Distribution):
+  H(uniform) = {target_entropy:.6f} nats
+  This is the true entropy we want to reach.
 Gaussian Entropy of Transformed Data:
+  H(Gaussian) = {final_entropy:.6f} nats
+  This assumes the transformed data is Gaussian with the
+  current covariance. When H(Gaussian) = H(uniform), the
+  distribution is perfectly Gaussian.
+Gap to Target:
+  H(Gaussian) - H(uniform) = {entropy_gap:.6f} nats
+  (Should approach 0 for perfect Gaussianization)
 Covariance Determinant:
   Original:    {entropy['original']['determinant']:.6e}