malicious-coding-intent-v6 / benign_code_mathtrain_reasoner_eval.json
NecroMOnk's picture
Publish v6 classifier heads
b6ac206
Raw
History Blame Contribute Delete
11.8 kB
{
"model_dir": "models\\v6_code_aware_50k_oss_clean_benign_code",
"holdout": "data\\clf\\benign_code_holdout_mathtrain_reasoner_clean.jsonl",
"overall": {
"n": 12000,
"threshold": 0.5,
"false_positive_rate": 0.01,
"flagged": 120,
"score_mean": 0.021423,
"score_p50": 0.000676,
"score_p90": 0.032512,
"score_p95": 0.097846,
"score_p99": 0.497524,
"score_max": 0.994358
},
"by_source": {
"local_project_code": {
"n": 165,
"threshold": 0.5,
"false_positive_rate": 0.0061,
"flagged": 1,
"score_mean": 0.026509,
"score_p50": 0.002527,
"score_p90": 0.034257,
"score_p95": 0.099218,
"score_p99": 0.43596,
"score_max": 0.955582
},
"local_repo_hs": {
"n": 14,
"threshold": 0.5,
"false_positive_rate": 0.1429,
"flagged": 2,
"score_mean": 0.234466,
"score_p50": 0.173636,
"score_p90": 0.50088,
"score_p95": 0.601973,
"score_p99": 0.732286,
"score_max": 0.764864
},
"local_repo_isre": {
"n": 173,
"threshold": 0.5,
"false_positive_rate": 0.0,
"flagged": 0,
"score_mean": 0.015629,
"score_p50": 0.000923,
"score_p90": 0.065123,
"score_p95": 0.111808,
"score_p99": 0.148813,
"score_max": 0.175909
},
"local_repo_job_application_pipeline": {
"n": 444,
"threshold": 0.5,
"false_positive_rate": 0.0023,
"flagged": 1,
"score_mean": 0.016508,
"score_p50": 0.001555,
"score_p90": 0.038672,
"score_p95": 0.117372,
"score_p99": 0.200662,
"score_max": 0.691934
},
"local_repo_math_train": {
"n": 562,
"threshold": 0.5,
"false_positive_rate": 0.0569,
"flagged": 32,
"score_mean": 0.070331,
"score_p50": 0.002097,
"score_p90": 0.163531,
"score_p95": 0.558199,
"score_p99": 0.93781,
"score_max": 0.990801
},
"local_repo_math_train2": {
"n": 68,
"threshold": 0.5,
"false_positive_rate": 0.0,
"flagged": 0,
"score_mean": 0.015792,
"score_p50": 0.00076,
"score_p90": 0.047232,
"score_p95": 0.135641,
"score_p99": 0.156291,
"score_max": 0.166963
},
"local_repo_olympiad_math": {
"n": 55,
"threshold": 0.5,
"false_positive_rate": 0.0182,
"flagged": 1,
"score_mean": 0.031321,
"score_p50": 0.001742,
"score_p90": 0.071487,
"score_p95": 0.192837,
"score_p99": 0.439802,
"score_max": 0.561933
},
"local_repo_vesuvius": {
"n": 730,
"threshold": 0.5,
"false_positive_rate": 0.0548,
"flagged": 40,
"score_mean": 0.103365,
"score_p50": 0.018504,
"score_p90": 0.349818,
"score_p95": 0.531822,
"score_p99": 0.915992,
"score_max": 0.994358
},
"python_stdlib": {
"n": 9789,
"threshold": 0.5,
"false_positive_rate": 0.0044,
"flagged": 43,
"score_mean": 0.012423,
"score_p50": 0.000479,
"score_p90": 0.017982,
"score_p95": 0.048102,
"score_p99": 0.254804,
"score_max": 0.97892
}
},
"flagged_examples": [
{
"score": 0.955582,
"source": "local_project_code",
"path": "C:\\GitHub\\Safety DS\\scripts\\build_malware_code_pool.py",
"preview": "def download_vxunderground( spec: dict, builder: PoolBuilder, chunk_cfg: dict, insecure: bool ) -> None: repo = spec[\"repo\"] cache = ROOT / spec.get(\"cache_dir\", \"data/external/vxunderground\") cache.mkdir(parents=True, exist_ok=True) for su"
},
{
"score": 0.77251,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\auto_pipeline.ps1",
"preview": "$stateFile = 'C:\\lora_training\\eval_results\\pipeline_state2.txt' $qwenLog = 'C:\\lora_training\\eval_results\\eval_qwen_merged_full.log' $glmLog = 'C:\\lora_training\\eval_results\\eval_glm_both_6k.log' $glmErr = 'C:\\lora_training\\eval_results\\ev"
},
{
"score": 0.705632,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\check_adapter_structure.py",
"preview": "import sys if hasattr(sys.stdout, \"reconfigure\"): sys.stdout.reconfigure(encoding=\"utf-8\") from safetensors import safe_open from pathlib import Path import json adapter = Path(r\"C:\\lora_training\\lora_MATH_output\\qwen_run_20260408_123730\\fi"
},
{
"score": 0.590817,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\check_lora_results.py",
"preview": "import json, os path = r\"C:\\lora_training\\eval_results\\all_adapters\" for fn in [\"eval_qwen3_instruct_lora.json\", \"eval_qwen3_instruct_lora_diverse.json\", \"eval_gemma3_instruct_lora.json\", \"eval_gemma3_instruct_lora_diverse.json\", \"eval_llam"
},
{
"score": 0.599163,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\check_qwen_log.ps1",
"preview": "$logfile = \"C:\\Users\\SOL08_~1\\AppData\\Local\\Temp\\claude\\C--Users-sol08-p04dk8b-MATH-TRAIN\\4a837286-97f6-4070-a5f2-37ba2c811443\\tasks\\b1yeq9q3i.output\" if (Test-Path $logfile) { $lines = Get-Content $logfile $total = $lines.Count Write-Outpu"
},
{
"score": 0.935582,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\check_sizes.ps1",
"preview": "$files = @( 'C:\\lora_training\\OLympiad\\_output\\good_solutions_deduped.jsonl', 'C:\\lora_training\\OLympiad\\_output\\broken_only_deduped.jsonl', 'C:\\lora_training\\OLympiad\\_output\\dpo_pairs.jsonl', 'C:\\lora_training\\OLympiad\\converted_for_sft.j"
},
{
"score": 0.990801,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\clean_github.ps1",
"preview": "Set-Location 'C:\\GitHub\\Olympiad_Math' $remove = @( 'scraping\\olympiad.py', 'scraping\\geometry_scraper.py', 'scraping\\filter_geometry_links.py', 'scraping\\download_geometry_drive.py', 'scraping\\scraper_aops.py', 'scraping\\olympiad_dataset1."
},
{
"score": 0.736009,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\download_llama3b_instruct.py",
"preview": "from huggingface_hub import snapshot_download import time print(\"Downloading Llama-3.2-3B-Instruct...\", flush=True) t0 = time.time() snapshot_download( repo_id=\"meta-llama/Llama-3.2-3B-Instruct\", local_dir=r\"C:\\models\\Llama-3.2-3B-Instruct\""
},
{
"score": 0.880296,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\eval_benchmark.py",
"preview": "def print_report(results, label): total = len(results) correct = sum(r[\"correct\"] for r in results) print(f\"\\n{'='*60}\") print(f\" {label}: {correct}/{total} = {correct/total*100:.1f}%\") print(f\"{'='*60}\") # По предметам by_subj = defaultdic"
},
{
"score": 0.509782,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\eval_general_reasoning.py",
"preview": "def load_mmlu(n, seed): \"\"\"MMLU: cais/mmlu all — 200 вопросов из разных предметов.\"\"\" print(\"Loading MMLU...\") rng = random.Random(seed) # Пробуем 'all', иначе сэмплируем из нескольких предметов try: ds = load_dataset(\"cais/mmlu\", \"all\", sp"
},
{
"score": 0.74435,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\eval_general_reasoning.py",
"preview": "def load_arc(n, seed): \"\"\"ARC-Challenge — 200 вопросов.\"\"\" print(\"Loading ARC-Challenge...\") rng = random.Random(seed) ds = load_dataset(\"allenai/ai2_arc\", \"ARC-Challenge\", split=\"test\", trust_remote_code=True) pool = [] for x in ds: labels"
},
{
"score": 0.946294,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\eval_general_reasoning.py",
"preview": "def load_hellaswag(n, seed): \"\"\"HellaSwag — 200 примеров.\"\"\" print(\"Loading HellaSwag...\") rng = random.Random(seed) ds = load_dataset(\"Rowan/hellaswag\", split=\"validation\", trust_remote_code=True) pool = [] for x in ds: endings = x[\"ending"
},
{
"score": 0.569382,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\inspect_lora.py",
"preview": "import sys if hasattr(sys.stdout, \"reconfigure\"): sys.stdout.reconfigure(encoding=\"utf-8\") from safetensors import safe_open import json from pathlib import Path adapter_path = r\"C:\\lora_training\\lora_MATH_output\\qwen_run_20260408_123730\\fi"
},
{
"score": 0.956672,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\list_files.ps1",
"preview": "Get-ChildItem 'C:\\lora_training\\OLympiad' -Filter '*.jsonl' | Sort-Object Length -Descending | ForEach-Object { $mb = [math]::Round($_.Length / 1MB, 1) Write-Output \"$mb MB $($_.Name)\" }"
},
{
"score": 0.826007,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\peek_local_bench.ps1",
"preview": "$files = @( 'C:\\lora_training\\OLympiad\\olympiad\\olympiad_final_MATH.jsonl', 'C:\\lora_training\\OLympiad\\_raw\\aops_dataset.jsonl', 'C:\\lora_training\\OLympiad\\_raw\\math_dataset.jsonl' ) foreach ($f in $files) { if (Test-Path $f) { Write-Output"
},
{
"score": 0.84162,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\peek_scripts.ps1",
"preview": "$scripts = @( 'generate_cot_dataset.py', 'Complete_cot.py', 'janitor44.py', 'triage_flagged.py', 'merge_dataset.py' ) foreach ($s in $scripts) { $path = \"C:\\lora_training\\OLympiad\\$s\" if (Test-Path $path) { Write-Output \"=== $s ===\" Get-Con"
},
{
"score": 0.813426,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\run_lora_3k_v2.ps1",
"preview": "$ErrorActionPreference = \"Stop\" $ScriptDir = \"C:\\Users\\sol08_p04dk8b\\MATH TRAIN\" cd $ScriptDir Write-Host \"=== run 1/3: Qwen3-4B lora_3k_v2 ===\" -ForegroundColor Cyan python train_qwen3_4b_instruct_lora_3k_v2.py 2>&1 | Tee-Object qwen3_3k_v"
},
{
"score": 0.7723,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\setup_github_project.py",
"preview": "| SFT (good solutions) | ~22,990 | ChatML `{\"text\": ...}` | | Broken / incomplete | ~6,518 | same | | DPO pairs | ~4,393 | `{\"problem\", \"chosen\", \"rejected\"}` | Data files are **not included** in this repo (too large). Sources: AoPS, IMO Sh"
},
{
"score": 0.976724,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\show_github.ps1",
"preview": "Write-Output \"=== C:\\GitHub\\Olympiad_Math ===\" Write-Output \"\" Write-Output \"--- Root files ---\" Get-ChildItem 'C:\\GitHub\\Olympiad_Math' -File | ForEach-Object { $mb = [math]::Round($_.Length / 1MB, 2) Write-Output \" $($_.Name) ($mb MB)\" } "
},
{
"score": 0.982568,
"source": "local_repo_math_train",
"path": "C:\\Users\\sol08_p04dk8b\\MATH TRAIN\\show_structure.ps1",
"preview": "Write-Output \"=== Files in root ===\" Get-ChildItem 'C:\\lora_training\\OLympiad' -File | ForEach-Object { Write-Output $_.Name } Write-Output \"\" Write-Output \"=== Subfolders ===\" Get-ChildItem 'C:\\lora_training\\OLympiad' -Directory | ForEach-"
}
]
}