| { |
| "trained_at": "2026-04-27T12:00:40.349432+00:00", |
| "data_run_date": "2026-04-25", |
| "llm_run_date": "2026-04-26", |
| "version": "v0.8-fixed-wash-ensemble", |
| "description": "v0.7 features + tightened wash detection + dual-tree ensemble + bias correction", |
| "parent_version": "v0.7", |
| "changes_from_parent": [ |
| "wash detection: row-level, \u226424h + \u22651.5x price gain", |
| "wash detection: dropped wallet concentration heuristic", |
| "dual-tree ensemble: tuned XGBoost + tuned LightGBM, log-space mean", |
| "val-derived bias correction (val_bias = -0.0781)", |
| "4x Optuna budget (120 trials per model)" |
| ], |
| "splits": { |
| "train": { |
| "rows": 265240, |
| "start": "2022-01-28", |
| "end": "2023-09-30" |
| }, |
| "val": { |
| "rows": 3545, |
| "start": "2023-10-01", |
| "end": "2023-12-31" |
| }, |
| "test": { |
| "rows": 2744, |
| "start": "2024-01-01", |
| "end": "2024-05-04" |
| } |
| }, |
| "feature_count": 212, |
| "feature_cols": [ |
| "pca_000", |
| "pca_001", |
| "pca_002", |
| "pca_003", |
| "pca_004", |
| "pca_005", |
| "pca_006", |
| "pca_007", |
| "pca_008", |
| "pca_009", |
| "pca_010", |
| "pca_011", |
| "pca_012", |
| "pca_013", |
| "pca_014", |
| "pca_015", |
| "pca_016", |
| "pca_017", |
| "pca_018", |
| "pca_019", |
| "pca_020", |
| "pca_021", |
| "pca_022", |
| "pca_023", |
| "pca_024", |
| "pca_025", |
| "pca_026", |
| "pca_027", |
| "pca_028", |
| "pca_029", |
| "pca_030", |
| "pca_031", |
| "pca_032", |
| "pca_033", |
| "pca_034", |
| "pca_035", |
| "pca_036", |
| "pca_037", |
| "pca_038", |
| "pca_039", |
| "pca_040", |
| "pca_041", |
| "pca_042", |
| "pca_043", |
| "pca_044", |
| "pca_045", |
| "pca_046", |
| "pca_047", |
| "pca_048", |
| "pca_049", |
| "pca_050", |
| "pca_051", |
| "pca_052", |
| "pca_053", |
| "pca_054", |
| "pca_055", |
| "pca_056", |
| "pca_057", |
| "pca_058", |
| "pca_059", |
| "pca_060", |
| "pca_061", |
| "pca_062", |
| "pca_063", |
| "len", |
| "n_digits", |
| "n_letters", |
| "n_special", |
| "n_lower", |
| "n_upper", |
| "is_palindrome", |
| "is_all_digits", |
| "is_all_letters", |
| "is_ascii", |
| "has_unicode", |
| "starts_digit", |
| "ends_digit", |
| "max_char_run", |
| "n_unique_chars", |
| "in_wikipedia", |
| "in_geonames", |
| "in_us_firstname", |
| "in_iso3166", |
| "in_ticker", |
| "in_sec_edgar", |
| "in_wiktionary_en", |
| "wordlist_hits", |
| "club__prepunk_full_rankings", |
| "club__firstnames_usa", |
| "club__finance_terms", |
| "club__social_handles", |
| "club__gamertags", |
| "club__top_crypto_tickers", |
| "club__common_english", |
| "club__sports", |
| "club__crypto_terms", |
| "club__gamertags_double", |
| "club__pokemon_gen4", |
| "club__fine_art", |
| "club__logistics", |
| "club__top500_cities_usa", |
| "club__natural_wonders", |
| "club__familynames_usa", |
| "club__top_nouns", |
| "club__wikidata_top_fantasy_char", |
| "club__holidays", |
| "club__us_government", |
| "club__top500_cities_global", |
| "club__pokemon_gen3", |
| "club__common_animals", |
| "club__country_codes", |
| "club__personas", |
| "club__currency_symbols", |
| "club__mythical_creatures", |
| "club__pokemon_gen1", |
| "club__catholicism", |
| "club__historic_figures", |
| "club__luxury", |
| "club__paranormal", |
| "club__crayola_classic", |
| "club__top_crypto_names", |
| "club__performing_arts", |
| "club__pokemon_gen2", |
| "club__home", |
| "club__conspiracy_theories", |
| "club__memes", |
| "club__us_states", |
| "club__currency_names", |
| "club__gen_alpha", |
| "n_clubs", |
| "trademark_conflict", |
| "name_age_days", |
| "prior_transfer_count", |
| "fg_value", |
| "eth_tvl_usd", |
| "eth_stable_mcap", |
| "eth_dex_volume", |
| "nft_total_fee_usd", |
| "fame_score", |
| "crypto_relevance_ord", |
| "brand_collision_risk_ord", |
| "kind__concept", |
| "kind__random", |
| "kind__brand", |
| "kind__surname", |
| "kind__first_name", |
| "kind__abbreviation", |
| "kind__place", |
| "kind__other", |
| "kind__unknown", |
| "origin__english", |
| "origin__none", |
| "origin__mixed", |
| "origin__spanish", |
| "origin__german", |
| "origin__french", |
| "origin__japanese", |
| "origin__chinese", |
| "origin__italian", |
| "origin__slavic", |
| "origin__korean", |
| "origin__arabic", |
| "origin__other", |
| "origin__unknown", |
| "desc_pca_000", |
| "desc_pca_001", |
| "desc_pca_002", |
| "desc_pca_003", |
| "desc_pca_004", |
| "desc_pca_005", |
| "desc_pca_006", |
| "desc_pca_007", |
| "desc_pca_008", |
| "desc_pca_009", |
| "desc_pca_010", |
| "desc_pca_011", |
| "desc_pca_012", |
| "desc_pca_013", |
| "desc_pca_014", |
| "desc_pca_015", |
| "desc_pca_016", |
| "desc_pca_017", |
| "desc_pca_018", |
| "desc_pca_019", |
| "desc_pca_020", |
| "desc_pca_021", |
| "desc_pca_022", |
| "desc_pca_023", |
| "desc_pca_024", |
| "desc_pca_025", |
| "desc_pca_026", |
| "desc_pca_027", |
| "desc_pca_028", |
| "desc_pca_029", |
| "desc_pca_030", |
| "desc_pca_031", |
| "knnmp_count", |
| "knnmp_mean_log", |
| "knnmp_median_log", |
| "knnmp_p90_log", |
| "knnmp_max_sim", |
| "knnmp_min_sim", |
| "knnmp_log_max", |
| "knnmp_log_min", |
| "knnbg_count", |
| "knnbg_mean_log", |
| "knnbg_median_log", |
| "knnbg_p90_log", |
| "knnbg_max_sim", |
| "knnbg_min_sim", |
| "knnbg_log_max", |
| "knnbg_log_min" |
| ], |
| "pca_dim_concat": 64, |
| "pca_dim_description": 32, |
| "name_kind_values": [ |
| "concept", |
| "random", |
| "brand", |
| "surname", |
| "first_name", |
| "abbreviation", |
| "place", |
| "other", |
| "unknown" |
| ], |
| "cultural_origin_values": [ |
| "english", |
| "none", |
| "mixed", |
| "spanish", |
| "german", |
| "french", |
| "japanese", |
| "chinese", |
| "italian", |
| "slavic", |
| "korean", |
| "arabic", |
| "other", |
| "unknown" |
| ], |
| "wash_filtering": { |
| "method": "row_level", |
| "round_trip_max_hours": 24, |
| "round_trip_min_price_gain": 1.5, |
| "wash_train_weight": 0.1, |
| "n_round_trip_rows": 8236, |
| "n_sub_minute_rows": 2612, |
| "n_total_flagged_rows": 10733, |
| "flag_rate_pct": 3.9528006216647213 |
| }, |
| "optuna": { |
| "n_trials_per_model": 120, |
| "xgb_best_val_rmse": 1.0110926628112793, |
| "xgb_best_params": { |
| "max_depth": 12, |
| "learning_rate": 0.00707952961758631, |
| "subsample": 0.82649559352978, |
| "colsample_bytree": 0.5076045191428247, |
| "colsample_bylevel": 0.4490941323703761, |
| "min_child_weight": 25, |
| "reg_alpha": 2.1100924086636215, |
| "reg_lambda": 6.7085987791616875, |
| "gamma": 3.012785755618491 |
| }, |
| "xgb_best_trial": 78, |
| "lgb_best_val_rmse": 1.0083379004456063, |
| "lgb_best_params": { |
| "boosting_type": "gbdt", |
| "num_leaves": 294, |
| "max_depth": 13, |
| "learning_rate": 0.007555121763111837, |
| "feature_fraction": 0.714483668555124, |
| "feature_fraction_bynode": 0.5304393257914843, |
| "min_data_in_leaf": 6, |
| "lambda_l1": 0.002471118357836334, |
| "lambda_l2": 1.776020947969551, |
| "min_gain_to_split": 2.2135701585440897, |
| "bagging_fraction": 0.9999413018023948, |
| "bagging_freq": 7 |
| }, |
| "lgb_best_trial": 16 |
| }, |
| "xgb_quantile_models": { |
| "q05": { |
| "best_iteration": 984, |
| "best_val_rmse": 1.9671143709945549 |
| }, |
| "q50": { |
| "best_iteration": 1756, |
| "best_val_rmse": 1.0471049311283205 |
| }, |
| "q95": { |
| "best_iteration": 3964, |
| "best_val_rmse": 2.1785484376377413 |
| } |
| }, |
| "lgb_quantile_models": { |
| "q05": { |
| "best_iteration": 500 |
| }, |
| "q50": { |
| "best_iteration": 1465 |
| }, |
| "q95": { |
| "best_iteration": 1123 |
| } |
| }, |
| "ensemble": { |
| "method": "log_space_mean", |
| "members": [ |
| "xgb_q50", |
| "lgb_q50" |
| ] |
| }, |
| "bias_correction": { |
| "method": "val_derived_constant", |
| "val_bias": -0.0781494239191985 |
| }, |
| "calibration": { |
| "method": "additive", |
| "target_coverage": 0.9, |
| "delta_lower": 0.14621443811853208, |
| "delta_upper": 0.0, |
| "val_bias_correction": -0.0781494239191985, |
| "ensemble_method": "log_space_mean_xgb_lgb" |
| }, |
| "metrics": { |
| "final": { |
| "train": { |
| "r2_log": 0.7860012517591471, |
| "rmse_log": 0.7469926912886737, |
| "mae_log": 0.45205338808523504, |
| "median_ape": 0.24072927576014078, |
| "bias_log": -0.0053798850758574246 |
| }, |
| "val": { |
| "r2_log": 0.6758550101826879, |
| "rmse_log": 1.0429795602982888, |
| "mae_log": 0.706429696381903, |
| "median_ape": 0.43773059069184295, |
| "bias_log": -1.8039166775291682e-16 |
| }, |
| "test": { |
| "r2_log": 0.47530460716475276, |
| "rmse_log": 1.3470754265844747, |
| "mae_log": 1.0706065416171697, |
| "median_ape": 0.9519209571310361, |
| "bias_log": 0.444023565817704 |
| } |
| }, |
| "coverage": { |
| "train": { |
| "coverage_90pct": 0.937335997587091, |
| "median_interval_log": 2.823927108304763, |
| "median_interval_ratio": 16.84286471905812 |
| }, |
| "val": { |
| "coverage_90pct": 0.8493653032440056, |
| "median_interval_log": 3.6384351371935924, |
| "median_interval_ratio": 38.03227484212217 |
| }, |
| "test": { |
| "coverage_90pct": 0.8126822157434402, |
| "median_interval_log": 4.143242668045713, |
| "median_interval_ratio": 63.00680069124568 |
| } |
| } |
| }, |
| "top_features_xgb": [ |
| { |
| "name": "knnmp_mean_log", |
| "gain": 108.798828125 |
| }, |
| { |
| "name": "knnmp_median_log", |
| "gain": 78.58806610107422 |
| }, |
| { |
| "name": "knnmp_log_min", |
| "gain": 72.71774291992188 |
| }, |
| { |
| "name": "len", |
| "gain": 61.729530334472656 |
| }, |
| { |
| "name": "knnmp_p90_log", |
| "gain": 58.61769104003906 |
| }, |
| { |
| "name": "pca_004", |
| "gain": 42.28458786010742 |
| }, |
| { |
| "name": "knnmp_log_max", |
| "gain": 39.73566818237305 |
| }, |
| { |
| "name": "is_all_digits", |
| "gain": 38.88374710083008 |
| }, |
| { |
| "name": "knnmp_count", |
| "gain": 36.54442596435547 |
| }, |
| { |
| "name": "pca_002", |
| "gain": 36.348838806152344 |
| }, |
| { |
| "name": "kind__random", |
| "gain": 34.42299270629883 |
| }, |
| { |
| "name": "in_wikipedia", |
| "gain": 28.338823318481445 |
| }, |
| { |
| "name": "eth_stable_mcap", |
| "gain": 28.019874572753906 |
| }, |
| { |
| "name": "origin__none", |
| "gain": 27.93862533569336 |
| }, |
| { |
| "name": "n_digits", |
| "gain": 26.823389053344727 |
| }, |
| { |
| "name": "ends_digit", |
| "gain": 25.347196578979492 |
| }, |
| { |
| "name": "n_unique_chars", |
| "gain": 25.27269172668457 |
| }, |
| { |
| "name": "name_age_days", |
| "gain": 25.112060546875 |
| }, |
| { |
| "name": "eth_tvl_usd", |
| "gain": 24.409042358398438 |
| }, |
| { |
| "name": "starts_digit", |
| "gain": 23.97994613647461 |
| }, |
| { |
| "name": "knnbg_count", |
| "gain": 23.276514053344727 |
| }, |
| { |
| "name": "is_palindrome", |
| "gain": 22.497846603393555 |
| }, |
| { |
| "name": "brand_collision_risk_ord", |
| "gain": 21.805770874023438 |
| }, |
| { |
| "name": "origin__chinese", |
| "gain": 21.738651275634766 |
| }, |
| { |
| "name": "n_letters", |
| "gain": 20.87726402282715 |
| }, |
| { |
| "name": "kind__abbreviation", |
| "gain": 20.590986251831055 |
| }, |
| { |
| "name": "pca_001", |
| "gain": 20.483781814575195 |
| }, |
| { |
| "name": "has_unicode", |
| "gain": 19.911903381347656 |
| }, |
| { |
| "name": "nft_total_fee_usd", |
| "gain": 19.79189682006836 |
| }, |
| { |
| "name": "desc_pca_000", |
| "gain": 19.757749557495117 |
| } |
| ], |
| "top_features_lgb": [ |
| { |
| "name": "knnmp_mean_log", |
| "gain": 781449.8409805298 |
| }, |
| { |
| "name": "eth_stable_mcap", |
| "gain": 780319.1262354851 |
| }, |
| { |
| "name": "name_age_days", |
| "gain": 621649.1777780056 |
| }, |
| { |
| "name": "eth_tvl_usd", |
| "gain": 549847.3152387142 |
| }, |
| { |
| "name": "len", |
| "gain": 535403.315526247 |
| }, |
| { |
| "name": "knnmp_median_log", |
| "gain": 476187.2463479042 |
| }, |
| { |
| "name": "nft_total_fee_usd", |
| "gain": 376482.9395339489 |
| }, |
| { |
| "name": "knnmp_p90_log", |
| "gain": 299560.9693763256 |
| }, |
| { |
| "name": "fg_value", |
| "gain": 291222.41970157623 |
| }, |
| { |
| "name": "n_digits", |
| "gain": 200339.19226312637 |
| }, |
| { |
| "name": "knnmp_count", |
| "gain": 198496.79864764214 |
| }, |
| { |
| "name": "knnmp_log_min", |
| "gain": 196220.42209792137 |
| }, |
| { |
| "name": "eth_dex_volume", |
| "gain": 183750.19882249832 |
| }, |
| { |
| "name": "n_unique_chars", |
| "gain": 178599.7514090538 |
| }, |
| { |
| "name": "knnmp_log_max", |
| "gain": 165553.80459403992 |
| }, |
| { |
| "name": "pca_004", |
| "gain": 119861.93015813828 |
| }, |
| { |
| "name": "desc_pca_000", |
| "gain": 114556.08047294617 |
| }, |
| { |
| "name": "pca_002", |
| "gain": 104693.19005703926 |
| }, |
| { |
| "name": "n_letters", |
| "gain": 83801.49758315086 |
| }, |
| { |
| "name": "pca_001", |
| "gain": 82503.51477956772 |
| }, |
| { |
| "name": "n_special", |
| "gain": 70174.17102837563 |
| }, |
| { |
| "name": "is_palindrome", |
| "gain": 64647.565772771835 |
| }, |
| { |
| "name": "is_all_digits", |
| "gain": 56822.11631703377 |
| }, |
| { |
| "name": "desc_pca_002", |
| "gain": 47493.986828804016 |
| }, |
| { |
| "name": "n_lower", |
| "gain": 44417.38100814819 |
| }, |
| { |
| "name": "max_char_run", |
| "gain": 40815.91745662689 |
| }, |
| { |
| "name": "knnbg_count", |
| "gain": 39852.69767045975 |
| }, |
| { |
| "name": "fame_score", |
| "gain": 36314.24634027481 |
| }, |
| { |
| "name": "pca_005", |
| "gain": 34642.322847127914 |
| }, |
| { |
| "name": "knnmp_min_sim", |
| "gain": 34452.339801073074 |
| } |
| ], |
| "family_gain_split_xgb": { |
| "mpnet_ft_knn": 416.6655960083008, |
| "bge_knn": 94.33125257492065, |
| "llm_kind": 89.02087259292603, |
| "llm_origin": 129.38252782821655, |
| "llm_scores": 46.957244873046875, |
| "llm_desc": 279.1159596443176, |
| "llm_total": 544.4766049385071 |
| }, |
| "inference_recipe": { |
| "description": "Inference uses 6 models (XGB\u00d73 + LGB\u00d73) + bias + calibration constants", |
| "point_estimate": "(xgb_q50.predict() + lgb_q50.predict()) / 2 - val_bias", |
| "uncalibrated_low": "(xgb_q05.predict() + lgb_q05.predict()) / 2 - val_bias", |
| "uncalibrated_high": "(xgb_q95.predict() + lgb_q95.predict()) / 2 - val_bias", |
| "calibrated_low": "uncalibrated_low - delta_lower", |
| "calibrated_high": "uncalibrated_high + delta_upper", |
| "output_usd": "np.exp(final)" |
| }, |
| "wandb_run": "https://wandb.ai/quantumly-aletheia-research/ens-appraiser/runs/d3y6y5c6" |
| } |