ens-appraiser / v0_metadata.json
quantumly's picture
v0.2 appraiser: trained 2026-04-26
c480fbb verified
{
"trained_at": "2026-04-26T06:46:09.798149+00:00",
"data_run_date": "2026-04-25",
"version": "v0.2-leakage-fixed",
"fixes_vs_v0_1": [
"prior_transfer_count replaces lifetime_transfer_count (no future leakage)",
"$10 price floor (was $1) drops wash-trade noise",
"fixed-window temporal split (train < 2023-10-01, val Q4 2023, test 2024+)",
"recency-weighted sample weights (1y half-life)"
],
"splits": {
"train": {
"rows": 265240,
"start": "2022-01-28",
"end": "2023-09-30"
},
"val": {
"rows": 3545,
"start": "2023-10-01",
"end": "2023-12-31"
},
"test": {
"rows": 2744,
"start": "2024-01-01",
"end": "2024-05-04"
}
},
"feature_count": 146,
"feature_cols": [
"len",
"n_digits",
"n_letters",
"n_special",
"n_lower",
"n_upper",
"is_palindrome",
"is_all_digits",
"is_all_letters",
"is_ascii",
"has_unicode",
"starts_digit",
"ends_digit",
"max_char_run",
"n_unique_chars",
"in_wikipedia",
"in_geonames",
"in_us_firstname",
"in_iso3166",
"in_ticker",
"in_sec_edgar",
"in_wiktionary_en",
"wordlist_hits",
"club__prepunk_full_rankings",
"club__personas",
"club__gamertags",
"club__luxury",
"club__top_nouns",
"club__familynames_usa",
"club__wikidata_top_fantasy_char",
"club__firstnames_usa",
"club__natural_wonders",
"club__logistics",
"club__social_handles",
"club__top500_cities_usa",
"club__common_english",
"club__finance_terms",
"club__performing_arts",
"club__paranormal",
"club__gamertags_double",
"club__memes",
"club__sports",
"club__home",
"club__top_crypto_names",
"club__top500_cities_global",
"club__catholicism",
"club__country_codes",
"club__fine_art",
"club__us_government",
"club__pokemon_gen3",
"club__pokemon_gen4",
"club__crypto_terms",
"club__top_crypto_tickers",
"club__crayola_classic",
"club__us_states",
"club__mythical_creatures",
"club__historic_figures",
"club__pokemon_gen2",
"club__holidays",
"club__common_animals",
"club__pokemon_gen1",
"club__conspiracy_theories",
"club__gen_alpha",
"club__currency_symbols",
"club__currency_names",
"n_clubs",
"trademark_conflict",
"name_age_days",
"prior_transfer_count",
"fg_value",
"eth_tvl_usd",
"eth_stable_mcap",
"eth_dex_volume",
"nft_total_fee_usd",
"pca_000",
"pca_001",
"pca_002",
"pca_003",
"pca_004",
"pca_005",
"pca_006",
"pca_007",
"pca_008",
"pca_009",
"pca_010",
"pca_011",
"pca_012",
"pca_013",
"pca_014",
"pca_015",
"pca_016",
"pca_017",
"pca_018",
"pca_019",
"pca_020",
"pca_021",
"pca_022",
"pca_023",
"pca_024",
"pca_025",
"pca_026",
"pca_027",
"pca_028",
"pca_029",
"pca_030",
"pca_031",
"pca_032",
"pca_033",
"pca_034",
"pca_035",
"pca_036",
"pca_037",
"pca_038",
"pca_039",
"pca_040",
"pca_041",
"pca_042",
"pca_043",
"pca_044",
"pca_045",
"pca_046",
"pca_047",
"pca_048",
"pca_049",
"pca_050",
"pca_051",
"pca_052",
"pca_053",
"pca_054",
"pca_055",
"pca_056",
"pca_057",
"pca_058",
"pca_059",
"pca_060",
"pca_061",
"pca_062",
"pca_063",
"knn_count",
"knn_mean_log",
"knn_median_log",
"knn_p90_log",
"knn_max_sim",
"knn_min_sim",
"knn_log_max",
"knn_log_min"
],
"pca_dim": 64,
"embedding_model": "sentence-transformers/all-mpnet-base-v2",
"best_iteration": 170,
"xgb_params": {
"objective": "reg:squarederror",
"eval_metric": "rmse",
"tree_method": "hist",
"device": "cuda",
"max_depth": 7,
"learning_rate": 0.04,
"subsample": 0.85,
"colsample_bytree": 0.65,
"min_child_weight": 8,
"reg_alpha": 0.5,
"reg_lambda": 2.0,
"seed": 42
},
"metrics": {
"train": {
"r2_log": 0.7700075507164001,
"rmse_log": 0.7744038701057434,
"mae_log": 0.5210891962051392,
"median_ape": 0.32541945576667786,
"bias_log": -0.0004094731993973255
},
"val": {
"r2_log": 0.6602156162261963,
"rmse_log": 1.0678441524505615,
"mae_log": 0.7699634432792664,
"median_ape": 0.5703179836273193,
"bias_log": 0.2033758908510208
},
"test": {
"r2_log": 0.3080594539642334,
"rmse_log": 1.5469372272491455,
"mae_log": 1.2711551189422607,
"median_ape": 1.3828195333480835,
"bias_log": 0.7319739460945129
}
},
"top_features": [
{
"name": "knn_mean_log",
"gain": 1713.8084716796875
},
{
"name": "knn_p90_log",
"gain": 1612.9539794921875
},
{
"name": "len",
"gain": 1364.2567138671875
},
{
"name": "in_wikipedia",
"gain": 1052.1461181640625
},
{
"name": "is_all_digits",
"gain": 943.7355346679688
},
{
"name": "knn_median_log",
"gain": 604.246337890625
},
{
"name": "n_digits",
"gain": 337.8750305175781
},
{
"name": "pca_000",
"gain": 289.33624267578125
},
{
"name": "n_clubs",
"gain": 281.8310546875
},
{
"name": "ends_digit",
"gain": 276.56658935546875
},
{
"name": "name_age_days",
"gain": 274.4316101074219
},
{
"name": "n_unique_chars",
"gain": 267.8934020996094
},
{
"name": "club__gamertags",
"gain": 267.10980224609375
},
{
"name": "starts_digit",
"gain": 259.8104248046875
},
{
"name": "n_special",
"gain": 258.7098693847656
},
{
"name": "pca_001",
"gain": 238.66867065429688
},
{
"name": "n_letters",
"gain": 217.4210662841797
},
{
"name": "knn_log_max",
"gain": 214.86541748046875
},
{
"name": "trademark_conflict",
"gain": 213.1521453857422
},
{
"name": "pca_034",
"gain": 211.79525756835938
},
{
"name": "is_ascii",
"gain": 211.76641845703125
},
{
"name": "eth_stable_mcap",
"gain": 204.28631591796875
},
{
"name": "has_unicode",
"gain": 198.2250518798828
},
{
"name": "wordlist_hits",
"gain": 196.23956298828125
},
{
"name": "n_lower",
"gain": 189.0078887939453
}
]
}