{ "trained_at": "2026-04-27T07:37:26.101815+00:00", "data_run_date": "2026-04-25", "llm_run_date": "2026-04-26", "version": "v0.6-tuning-quantile-stacking", "description": "v0.5 features + Optuna-tuned hyperparams + quantile regression at 0.05/0.5/0.95 + tail-correction stacking", "parent_version": "v0.5", "changes_from_parent": [ "Optuna search (60 trials)", "Quantile regression trio (q=0.05, 0.5, 0.95)", "Tail-correction stacking layer on q=0.5 residuals" ], "embedders": [ "mpnet-finetuned (from v0.3)", "BAAI/bge-base-en-v1.5" ], "splits": { "train": { "rows": 265240, "start": "2022-01-28", "end": "2023-09-30" }, "val": { "rows": 3545, "start": "2023-10-01", "end": "2023-12-31" }, "test": { "rows": 2744, "start": "2024-01-01", "end": "2024-05-04" } }, "feature_count": 212, "feature_cols": [ "pca_000", "pca_001", "pca_002", "pca_003", "pca_004", "pca_005", "pca_006", "pca_007", "pca_008", "pca_009", "pca_010", "pca_011", "pca_012", "pca_013", "pca_014", "pca_015", "pca_016", "pca_017", "pca_018", "pca_019", "pca_020", "pca_021", "pca_022", "pca_023", "pca_024", "pca_025", "pca_026", "pca_027", "pca_028", "pca_029", "pca_030", "pca_031", "pca_032", "pca_033", "pca_034", "pca_035", "pca_036", "pca_037", "pca_038", "pca_039", "pca_040", "pca_041", "pca_042", "pca_043", "pca_044", "pca_045", "pca_046", "pca_047", "pca_048", "pca_049", "pca_050", "pca_051", "pca_052", "pca_053", "pca_054", "pca_055", "pca_056", "pca_057", "pca_058", "pca_059", "pca_060", "pca_061", "pca_062", "pca_063", "len", "n_digits", "n_letters", "n_special", "n_lower", "n_upper", "is_palindrome", "is_all_digits", "is_all_letters", "is_ascii", "has_unicode", "starts_digit", "ends_digit", "max_char_run", "n_unique_chars", "in_wikipedia", "in_geonames", "in_us_firstname", "in_iso3166", "in_ticker", "in_sec_edgar", "in_wiktionary_en", "wordlist_hits", "club__logistics", "club__prepunk_full_rankings", "club__gamertags", "club__natural_wonders", "club__social_handles", "club__mythical_creatures", "club__top_nouns", "club__common_english", "club__firstnames_usa", "club__luxury", "club__us_government", "club__paranormal", "club__pokemon_gen3", "club__top500_cities_usa", "club__gamertags_double", "club__historic_figures", "club__catholicism", "club__performing_arts", "club__sports", "club__crayola_classic", "club__personas", "club__gen_alpha", "club__familynames_usa", "club__crypto_terms", "club__wikidata_top_fantasy_char", "club__country_codes", "club__finance_terms", "club__fine_art", "club__home", "club__common_animals", "club__conspiracy_theories", "club__holidays", "club__top_crypto_tickers", "club__pokemon_gen1", "club__pokemon_gen2", "club__top_crypto_names", "club__top500_cities_global", "club__memes", "club__currency_symbols", "club__pokemon_gen4", "club__us_states", "club__currency_names", "n_clubs", "trademark_conflict", "name_age_days", "prior_transfer_count", "fg_value", "eth_tvl_usd", "eth_stable_mcap", "eth_dex_volume", "nft_total_fee_usd", "fame_score", "crypto_relevance_ord", "brand_collision_risk_ord", "kind__concept", "kind__random", "kind__brand", "kind__surname", "kind__first_name", "kind__abbreviation", "kind__place", "kind__other", "kind__unknown", "origin__english", "origin__none", "origin__mixed", "origin__spanish", "origin__german", "origin__french", "origin__japanese", "origin__chinese", "origin__italian", "origin__slavic", "origin__korean", "origin__arabic", "origin__other", "origin__unknown", "desc_pca_000", "desc_pca_001", "desc_pca_002", "desc_pca_003", "desc_pca_004", "desc_pca_005", "desc_pca_006", "desc_pca_007", "desc_pca_008", "desc_pca_009", "desc_pca_010", "desc_pca_011", "desc_pca_012", "desc_pca_013", "desc_pca_014", "desc_pca_015", "desc_pca_016", "desc_pca_017", "desc_pca_018", "desc_pca_019", "desc_pca_020", "desc_pca_021", "desc_pca_022", "desc_pca_023", "desc_pca_024", "desc_pca_025", "desc_pca_026", "desc_pca_027", "desc_pca_028", "desc_pca_029", "desc_pca_030", "desc_pca_031", "knnmp_count", "knnmp_mean_log", "knnmp_median_log", "knnmp_p90_log", "knnmp_max_sim", "knnmp_min_sim", "knnmp_log_max", "knnmp_log_min", "knnbg_count", "knnbg_mean_log", "knnbg_median_log", "knnbg_p90_log", "knnbg_max_sim", "knnbg_min_sim", "knnbg_log_max", "knnbg_log_min" ], "pca_dim_concat": 64, "pca_dim_description": 32, "name_kind_values": [ "concept", "random", "brand", "surname", "first_name", "abbreviation", "place", "other", "unknown" ], "cultural_origin_values": [ "english", "none", "mixed", "spanish", "german", "french", "japanese", "chinese", "italian", "slavic", "korean", "arabic", "other", "unknown" ], "best_xgb_params": { "tree_method": "hist", "device": "cuda", "seed": 42, "max_depth": 12, "learning_rate": 0.007564423378912868, "subsample": 0.7048816055233034, "colsample_bytree": 0.8377589264565862, "colsample_bylevel": 0.4011055562046537, "min_child_weight": 7, "reg_alpha": 2.609660530404674, "reg_lambda": 1.946648297232411, "gamma": 2.3669086866916134 }, "optuna": { "n_trials": 60, "best_val_rmse": 1.0080678462982178, "best_params": { "max_depth": 12, "learning_rate": 0.007564423378912868, "subsample": 0.7048816055233034, "colsample_bytree": 0.8377589264565862, "colsample_bylevel": 0.4011055562046537, "min_child_weight": 7, "reg_alpha": 2.609660530404674, "reg_lambda": 1.946648297232411, "gamma": 2.3669086866916134 } }, "quantile_models": { "q05": { "best_iteration": 798, "best_val_rmse": 1.9434242115149494 }, "q50": { "best_iteration": 2262, "best_val_rmse": 1.0197268625497296 }, "q95": { "best_iteration": 1773, "best_val_rmse": 2.2088471640402845 } }, "tail_correction": { "best_iteration": 795, "best_val_rmse": 1.0014360745042261, "cv_folds": 3, "fold_metrics": [ { "fold": 0, "best_iter": 2256 }, { "fold": 1, "best_iter": 2261 }, { "fold": 2, "best_iter": 2261 } ] }, "metrics": { "final": { "train": { "r2_log": 0.8784301280975342, "rmse_log": 0.5630198121070862, "mae_log": 0.34918516874313354, "median_ape": 0.1952281892299652, "bias_log": 0.0008572799852117896 }, "val": { "r2_log": 0.7011631727218628, "rmse_log": 1.0014359951019287, "mae_log": 0.687095046043396, "median_ape": 0.4087112247943878, "bias_log": 0.02248295769095421 }, "test": { "r2_log": 0.45456844568252563, "rmse_log": 1.3734359741210938, "mae_log": 1.1084247827529907, "median_ape": 0.9863521456718445, "bias_log": 0.5754767060279846 } }, "base": { "train": { "r2_log": 0.8039833307266235, "rmse_log": 0.7149196863174438, "mae_log": 0.4110703468322754, "median_ape": 0.19649738073349, "bias_log": -0.07636234164237976 }, "val": { "r2_log": 0.6901469230651855, "rmse_log": 1.019727349281311, "mae_log": 0.6950583457946777, "median_ape": 0.40584105253219604, "bias_log": -0.040105946362018585 }, "test": { "r2_log": 0.48208510875701904, "rmse_log": 1.3383431434631348, "mae_log": 1.0609599351882935, "median_ape": 0.9018900394439697, "bias_log": 0.4112372100353241 } }, "coverage": { "train": { "coverage_90pct": 0.9052216860202081, "median_interval_log": 2.52069091796875, "median_interval_ratio": 12.437186771527003 }, "val": { "coverage_90pct": 0.7870239774330042, "median_interval_log": 3.475064992904663, "median_interval_ratio": 32.299927734517325 }, "test": { "coverage_90pct": 0.642128279883382, "median_interval_log": 3.9815444946289062, "median_interval_ratio": 53.5997548637558 } } }, "top_features_base": [ { "name": "knnmp_mean_log", "gain": 79.17141723632812 }, { "name": "knnmp_median_log", "gain": 69.66679382324219 }, { "name": "len", "gain": 59.86244201660156 }, { "name": "knnmp_p90_log", "gain": 42.315155029296875 }, { "name": "is_all_digits", "gain": 37.01343536376953 }, { "name": "knnmp_log_min", "gain": 35.15000534057617 }, { "name": "knnmp_count", "gain": 33.0050048828125 }, { "name": "pca_004", "gain": 29.43238639831543 }, { "name": "ends_digit", "gain": 23.06843376159668 }, { "name": "knnmp_log_max", "gain": 22.34497833251953 }, { "name": "pca_002", "gain": 21.7791690826416 }, { "name": "origin__chinese", "gain": 21.658403396606445 }, { "name": "in_wikipedia", "gain": 20.88755989074707 }, { "name": "n_digits", "gain": 20.82081413269043 }, { "name": "eth_stable_mcap", "gain": 20.470684051513672 }, { "name": "brand_collision_risk_ord", "gain": 19.85502052307129 }, { "name": "kind__random", "gain": 19.53866958618164 }, { "name": "n_unique_chars", "gain": 18.933242797851562 }, { "name": "eth_tvl_usd", "gain": 18.808229446411133 }, { "name": "knnbg_count", "gain": 18.738136291503906 }, { "name": "name_age_days", "gain": 18.64664077758789 }, { "name": "starts_digit", "gain": 17.717424392700195 }, { "name": "origin__none", "gain": 17.592206954956055 }, { "name": "n_letters", "gain": 17.253936767578125 }, { "name": "is_palindrome", "gain": 16.289718627929688 }, { "name": "origin__arabic", "gain": 15.088671684265137 }, { "name": "kind__abbreviation", "gain": 15.046517372131348 }, { "name": "n_special", "gain": 14.652754783630371 }, { "name": "n_lower", "gain": 14.477858543395996 }, { "name": "desc_pca_000", "gain": 13.754626274108887 } ], "top_features_tail": [ { "name": "in_iso3166", "gain": 20.713716506958008 }, { "name": "prior_transfer_count", "gain": 19.949108123779297 }, { "name": "n_lower", "gain": 19.065231323242188 }, { "name": "brand_collision_risk_ord", "gain": 19.003070831298828 }, { "name": "n_letters", "gain": 16.631563186645508 }, { "name": "in_wiktionary_en", "gain": 15.533679962158203 }, { "name": "club__crypto_terms", "gain": 15.453104972839355 }, { "name": "fame_score", "gain": 15.42578125 }, { "name": "has_unicode", "gain": 14.748347282409668 }, { "name": "n_clubs", "gain": 14.500151634216309 }, { "name": "club__gamertags_double", "gain": 14.302302360534668 }, { "name": "is_all_letters", "gain": 14.27059555053711 }, { "name": "origin__english", "gain": 14.242754936218262 }, { "name": "crypto_relevance_ord", "gain": 14.161867141723633 }, { "name": "trademark_conflict", "gain": 13.951108932495117 }, { "name": "club__currency_symbols", "gain": 13.67905330657959 }, { "name": "n_upper", "gain": 13.592854499816895 }, { "name": "name_age_days", "gain": 13.328607559204102 }, { "name": "ends_digit", "gain": 13.104514122009277 }, { "name": "wordlist_hits", "gain": 12.854232788085938 }, { "name": "starts_digit", "gain": 12.26870059967041 }, { "name": "is_ascii", "gain": 12.160033226013184 }, { "name": "kind__random", "gain": 11.966256141662598 }, { "name": "club__prepunk_full_rankings", "gain": 11.913127899169922 }, { "name": "max_char_run", "gain": 11.784753799438477 }, { "name": "n_unique_chars", "gain": 11.777941703796387 }, { "name": "eth_stable_mcap", "gain": 11.768474578857422 }, { "name": "origin__italian", "gain": 11.581886291503906 }, { "name": "in_geonames", "gain": 11.519492149353027 }, { "name": "n_special", "gain": 11.42654800415039 } ], "inference_recipe": { "description": "Inference combines 4 models", "point_estimate": "final_log = q50_model(features) + tail_model(features)", "lower_bound_90pct": "low_log = q05_model(features)", "upper_bound_90pct": "high_log = q95_model(features)", "output_usd": "np.exp(final_log)" }, "wandb_run": "https://wandb.ai/quantumly-aletheia-research/ens-appraiser/runs/i35wokpu" }