Instructions to use melihcatal/codedp-cpt-models-v2 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- PEFT
How to use melihcatal/codedp-cpt-models-v2 with PEFT:
Task type is invalid.
- Notebooks
- Google Colab
- Kaggle
| {"timestamp": 1774702012.3676147, "event": "train_step", "step": 5, "epoch": 1, "metrics": {"train/step_loss": 1.8126288519965277, "train/step_real_loss": 1.2628402709960938, "train/lr": 2.0320937499999996e-05, "train/step_canary_loss": 6.2109375, "perf/step_duration_sec": 6.5845307318959385, "perf/samples_per_sec": 5.31548889740274, "perf/tokens_per_sec": 3971.7333041393276, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 26152.0, "perf/physical_batches": 10.0, "privacy/epsilon": 0.9179937536296733, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702042.723834, "event": "train_step", "step": 10, "epoch": 1, "metrics": {"train/step_loss": 1.774319635118757, "train/step_real_loss": 1.3449589759111404, "train/lr": 4.063187499999999e-05, "train/step_canary_loss": 6.354166666666667, "perf/step_duration_sec": 6.136476519983262, "perf/samples_per_sec": 5.54063881598503, "perf/tokens_per_sec": 4106.917042366315, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 25202.0, "perf/physical_batches": 10.0, "privacy/epsilon": 1.1350700492972308, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702056.6960177, "event": "eval_step", "step": 10, "epoch": 1, "metrics": {"eval/loss": 0.8437929769808595, "eval/duration_sec": 13.959845661884174}} | |
| {"timestamp": 1774702086.7039802, "event": "train_step", "step": 15, "epoch": 1, "metrics": {"train/step_loss": 2.1081008778678045, "train/step_real_loss": 1.3091134279966354, "train/lr": 6.094281249999999e-05, "train/step_canary_loss": 8.500000476837158, "perf/step_duration_sec": 6.3650285778567195, "perf/samples_per_sec": 5.498796992327954, "perf/tokens_per_sec": 4197.7816239431595, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 26719.0, "perf/physical_batches": 10.0, "privacy/epsilon": 1.3113678771368842, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702116.2851121, "event": "train_step", "step": 20, "epoch": 1, "metrics": {"train/step_loss": 2.227328584000871, "train/step_real_loss": 1.436676800251007, "train/lr": 8.125375000000001e-05, "train/step_canary_loss": 7.2875, "perf/step_duration_sec": 6.368447465822101, "perf/samples_per_sec": 5.652869116563054, "perf/tokens_per_sec": 3672.637660202591, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 23389.0, "perf/physical_batches": 10.0, "privacy/epsilon": 1.4660205587973067, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702130.4124558, "event": "eval_step", "step": 20, "epoch": 1, "metrics": {"eval/loss": 0.8437746289101513, "eval/duration_sec": 14.115059867035598}} | |
| {"timestamp": 1774702159.9568546, "event": "train_step", "step": 25, "epoch": 1, "metrics": {"train/step_loss": 2.2077248805278056, "train/step_real_loss": 1.3339318931102753, "train/lr": 0.00010156468750000002, "train/step_canary_loss": 7.8, "perf/step_duration_sec": 6.46703625516966, "perf/samples_per_sec": 5.5666921568936765, "perf/tokens_per_sec": 4074.045507157714, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 26347.0, "perf/physical_batches": 10.0, "privacy/epsilon": 1.6056043546443448, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702189.6155016, "event": "train_step", "step": 30, "epoch": 1, "metrics": {"train/step_loss": 1.1335942949567521, "train/step_real_loss": 1.2398687601089478, "train/lr": 0.00012187562500000007, "train/step_canary_loss": 0.0, "perf/step_duration_sec": 6.8294450980611145, "perf/samples_per_sec": 4.685592978715771, "perf/tokens_per_sec": 4090.522670418868, "perf/logical_batch_size": 32.0, "perf/logical_token_count": 27936.0, "perf/physical_batches": 11.0, "privacy/epsilon": 1.7340359481069896, "system/cuda_memory_allocated_gb": 16.53101396560669, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702203.7618637, "event": "eval_step", "step": 30, "epoch": 1, "metrics": {"eval/loss": 0.8437598190185698, "eval/duration_sec": 14.131101737031713}} | |
| {"timestamp": 1774702234.1633456, "event": "train_step", "step": 35, "epoch": 1, "metrics": {"train/step_loss": 1.8024776322501046, "train/step_real_loss": 1.270288035273552, "train/lr": 0.00012999217477858396, "train/step_canary_loss": 7.479166666666667, "perf/step_duration_sec": 6.198646542849019, "perf/samples_per_sec": 5.485068355643478, "perf/tokens_per_sec": 3847.2914748642843, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 23848.0, "perf/physical_batches": 10.0, "privacy/epsilon": 1.853859763702748, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702263.8184445, "event": "train_step", "step": 40, "epoch": 1, "metrics": {"train/step_loss": 1.9537601470947266, "train/step_real_loss": 1.394229531288147, "train/lr": 0.00012994436116313906, "train/step_canary_loss": 10.90625, "perf/step_duration_sec": 5.87393393390812, "perf/samples_per_sec": 5.788284373395853, "perf/tokens_per_sec": 3992.2137810627282, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 23450.0, "perf/physical_batches": 9.0, "privacy/epsilon": 1.9666277443610969, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702277.9697719, "event": "eval_step", "step": 40, "epoch": 1, "metrics": {"eval/loss": 0.843898346986283, "eval/duration_sec": 14.135763100115582}} | |
| {"timestamp": 1774702308.313483, "event": "train_step", "step": 45, "epoch": 1, "metrics": {"train/step_loss": 2.1885748174455433, "train/step_real_loss": 1.4172247350215912, "train/lr": 0.0001298531148973165, "train/step_canary_loss": 8.359375476837158, "perf/step_duration_sec": 6.177955470047891, "perf/samples_per_sec": 5.665304673963388, "perf/tokens_per_sec": 4449.8540226265, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 27491.0, "perf/physical_batches": 10.0, "privacy/epsilon": 2.0736842474600423, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702337.8474174, "event": "train_step", "step": 50, "epoch": 1, "metrics": {"train/step_loss": 1.4548694245955522, "train/step_real_loss": 1.2665018886327744, "train/lr": 0.0001297185002182214, "train/step_canary_loss": 4.46875, "perf/step_duration_sec": 5.920573886949569, "perf/samples_per_sec": 5.573783999679539, "perf/tokens_per_sec": 4671.3376993677875, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 27657.0, "perf/physical_batches": 10.0, "privacy/epsilon": 2.1757062054803633, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702351.973672, "event": "eval_step", "step": 50, "epoch": 1, "metrics": {"eval/loss": 0.8441124627874657, "eval/duration_sec": 14.114086741115898}} | |
| {"timestamp": 1774702381.9348137, "event": "train_step", "step": 55, "epoch": 1, "metrics": {"train/step_loss": 2.0556979996817453, "train/step_real_loss": 1.291388377547264, "train/lr": 0.00012954061189419548, "train/step_canary_loss": 10.208333969116211, "perf/step_duration_sec": 5.173420250881463, "perf/samples_per_sec": 6.765350252386048, "perf/tokens_per_sec": 5483.4130274196405, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 28368.0, "perf/physical_batches": 9.0, "privacy/epsilon": 2.273595815344409, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702412.6737547, "event": "train_step", "step": 60, "epoch": 1, "metrics": {"train/step_loss": 2.7593861630088403, "train/step_real_loss": 1.409583568572998, "train/lr": 0.00012931957515810007, "train/step_canary_loss": 9.958333333333334, "perf/step_duration_sec": 5.686617384199053, "perf/samples_per_sec": 6.682355683993713, "perf/tokens_per_sec": 4550.684220799718, "perf/logical_batch_size": 38.0, "perf/logical_token_count": 25878.0, "perf/physical_batches": 10.0, "privacy/epsilon": 2.367780278389218, "system/cuda_memory_allocated_gb": 16.34234619140625, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702426.836693, "event": "eval_step", "step": 60, "epoch": 1, "metrics": {"eval/loss": 0.8442740922963077, "eval/duration_sec": 14.15345686301589}} | |
| {"timestamp": 1774702457.4066966, "event": "train_step", "step": 65, "epoch": 1, "metrics": {"train/step_loss": 2.3754299879074097, "train/step_real_loss": 1.3813431113958359, "train/lr": 0.00012905554561915293, "train/step_canary_loss": 10.328125, "perf/step_duration_sec": 5.36740831611678, "perf/samples_per_sec": 6.707147636206916, "perf/tokens_per_sec": 5187.606077292926, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 27844.0, "perf/physical_batches": 9.0, "privacy/epsilon": 2.4586937364590273, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702487.3792696, "event": "train_step", "step": 70, "epoch": 1, "metrics": {"train/step_loss": 2.225886448009594, "train/step_real_loss": 1.3803218305110931, "train/lr": 0.0001287487091533796, "train/step_canary_loss": 7.6375, "perf/step_duration_sec": 5.756763354875147, "perf/samples_per_sec": 6.253513959282901, "perf/tokens_per_sec": 4960.078822037888, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 28554.0, "perf/physical_batches": 10.0, "privacy/epsilon": 2.546782782079984, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702501.597284, "event": "eval_step", "step": 70, "epoch": 1, "metrics": {"eval/loss": 0.8444422065195711, "eval/duration_sec": 14.201780427014455}} | |
| {"timestamp": 1774702532.704276, "event": "train_step", "step": 75, "epoch": 1, "metrics": {"train/step_loss": 2.4386765119191764, "train/step_real_loss": 1.2708915919065475, "train/lr": 0.0001283992817727574, "train/step_canary_loss": 9.9125, "perf/step_duration_sec": 5.556148232892156, "perf/samples_per_sec": 6.659289574198473, "perf/tokens_per_sec": 4632.165831652597, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 25737.0, "perf/physical_batches": 10.0, "privacy/epsilon": 2.632165147167667, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702563.5464735, "event": "train_step", "step": 80, "epoch": 1, "metrics": {"train/step_loss": 2.163449403401968, "train/step_real_loss": 1.235863372683525, "train/lr": 0.0001280075094731435, "train/step_canary_loss": 8.1, "perf/step_duration_sec": 5.656158562051132, "perf/samples_per_sec": 6.364743775313305, "perf/tokens_per_sec": 4851.879539608974, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 27443.0, "perf/physical_batches": 10.0, "privacy/epsilon": 2.71530304852675, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702577.757564, "event": "eval_step", "step": 80, "epoch": 1, "metrics": {"eval/loss": 0.844685033979741, "eval/duration_sec": 14.197136115049943}} | |
| {"timestamp": 1774702609.2193258, "event": "train_step", "step": 85, "epoch": 1, "metrics": {"train/step_loss": 1.865637070792062, "train/step_real_loss": 1.3862436711788177, "train/lr": 0.0001275736680610945, "train/step_canary_loss": 6.979166666666667, "perf/step_duration_sec": 6.7332652430050075, "perf/samples_per_sec": 5.049556013751516, "perf/tokens_per_sec": 4102.764261173107, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 27625.0, "perf/physical_batches": 10.0, "privacy/epsilon": 2.796124372205281, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774702639.2993205, "event": "train_step", "step": 90, "epoch": 1, "metrics": {"train/step_loss": 2.1458786063724093, "train/step_real_loss": 1.3906759023666382, "train/lr": 0.00012709806295969954, "train/step_canary_loss": 8.187500238418579, "perf/step_duration_sec": 6.3353814508300275, "perf/samples_per_sec": 5.524529228688272, "perf/tokens_per_sec": 4007.177815105976, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 25387.0, "perf/physical_batches": 10.0, "privacy/epsilon": 2.8750704373612983, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774702653.4032378, "event": "eval_step", "step": 90, "epoch": 1, "metrics": {"eval/loss": 0.8449325874786486, "eval/duration_sec": 14.09157138201408}} | |
| {"timestamp": 1774702683.1280668, "event": "train_step", "step": 95, "epoch": 1, "metrics": {"train/step_loss": 2.287695381376478, "train/step_real_loss": 1.3588135540485382, "train/lr": 0.0001265810289935633, "train/step_canary_loss": 9.71875, "perf/step_duration_sec": 6.350726207019761, "perf/samples_per_sec": 5.668643053798711, "perf/tokens_per_sec": 3957.0277761656, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 25130.0, "perf/physical_batches": 9.0, "privacy/epsilon": 2.952236944837169, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774702713.2526903, "event": "train_step", "step": 100, "epoch": 1, "metrics": {"train/step_loss": 2.660276669722337, "train/step_real_loss": 1.2715090364217758, "train/lr": 0.00012602293015309042, "train/step_canary_loss": 9.00892870766776, "perf/step_duration_sec": 6.10068169189617, "perf/samples_per_sec": 6.392728217865486, "perf/tokens_per_sec": 4928.137791541688, "perf/logical_batch_size": 39.0, "perf/logical_token_count": 30065.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.02772165965114, "system/cuda_memory_allocated_gb": 16.437074184417725, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774702727.4021199, "event": "eval_step", "step": 100, "epoch": 1, "metrics": {"eval/loss": 0.8450869599526579, "eval/duration_sec": 14.134249210124835}} | |
| {"timestamp": 1774702758.3756955, "event": "train_step", "step": 105, "epoch": 1, "metrics": {"train/step_loss": 2.0147700707117715, "train/step_real_loss": 1.3632959872484207, "train/lr": 0.00012542415933823736, "train/step_canary_loss": 7.226562738418579, "perf/step_duration_sec": 6.499490906950086, "perf/samples_per_sec": 5.385037151536519, "perf/tokens_per_sec": 4702.214440721688, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 30562.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.101624796248717, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774702788.885598, "event": "train_step", "step": 110, "epoch": 1, "metrics": {"train/step_loss": 1.6412376131330217, "train/step_real_loss": 1.2013536393642426, "train/lr": 0.00012478513808191193, "train/step_canary_loss": 6.333333333333333, "perf/step_duration_sec": 6.814230911899358, "perf/samples_per_sec": 4.989557947123198, "perf/tokens_per_sec": 3921.4990430301796, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 26722.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.1740494347621158, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774702803.0982556, "event": "eval_step", "step": 110, "epoch": 1, "metrics": {"eval/loss": 0.8452429744330319, "eval/duration_sec": 14.19815262989141}} | |
| {"timestamp": 1774702833.3803155, "event": "train_step", "step": 115, "epoch": 1, "metrics": {"train/step_loss": 1.9615092145072088, "train/step_real_loss": 1.3590415865182877, "train/lr": 0.00012410631625321545, "train/step_canary_loss": 6.781250238418579, "perf/step_duration_sec": 5.57559902803041, "perf/samples_per_sec": 6.277352410753219, "perf/tokens_per_sec": 4023.065483588727, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 22431.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.2451019732065296, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774702864.2162437, "event": "train_step", "step": 120, "epoch": 1, "metrics": {"train/step_loss": 2.0712238682640924, "train/step_real_loss": 1.3281737267971039, "train/lr": 0.00012338817174073607, "train/step_canary_loss": 8.015625, "perf/step_duration_sec": 6.144209424965084, "perf/samples_per_sec": 5.696420414608328, "perf/tokens_per_sec": 4443.3706782634845, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 27301.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.3148926211215466, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774702878.3740766, "event": "eval_step", "step": 120, "epoch": 1, "metrics": {"eval/loss": 0.8454045434905724, "eval/duration_sec": 14.142055293079466}} | |
| {"timestamp": 1774702908.7943094, "event": "train_step", "step": 125, "epoch": 1, "metrics": {"train/step_loss": 2.9365096336755996, "train/step_real_loss": 1.3737929612398148, "train/lr": 0.00012263121011611664, "train/step_canary_loss": 10.080357279096331, "perf/step_duration_sec": 6.29400959587656, "perf/samples_per_sec": 6.19636805535701, "perf/tokens_per_sec": 3991.7320775074236, "perf/logical_batch_size": 39.0, "perf/logical_token_count": 25124.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.383535941032408, "system/cuda_memory_allocated_gb": 16.437074184417725, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774702939.2800477, "event": "train_step", "step": 130, "epoch": 1, "metrics": {"train/step_loss": 2.5562166394414128, "train/step_real_loss": 1.2915629893541336, "train/lr": 0.00012183596427813386, "train/step_canary_loss": 10.65, "perf/step_duration_sec": 6.233254758873954, "perf/samples_per_sec": 5.935903702207111, "perf/tokens_per_sec": 4196.683917460427, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 26159.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.451151445016777, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774702953.4885442, "event": "eval_step", "step": 130, "epoch": 1, "metrics": {"eval/loss": 0.8455977827649224, "eval/duration_sec": 14.196450588060543}} | |
| {"timestamp": 1774702984.6127725, "event": "train_step", "step": 135, "epoch": 1, "metrics": {"train/step_loss": 2.4919274046614364, "train/step_real_loss": 1.3656660616397858, "train/lr": 0.00012100299407753897, "train/step_canary_loss": 9.7, "perf/step_duration_sec": 6.633939765859395, "perf/samples_per_sec": 5.5773795521049365, "perf/tokens_per_sec": 4056.8652942108147, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 26913.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.5175872041131906, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703014.206551, "event": "train_step", "step": 140, "epoch": 1, "metrics": {"train/step_loss": 1.9397865401373968, "train/step_real_loss": 1.3228848278522491, "train/lr": 0.00012013288592292455, "train/step_canary_loss": 6.875000238418579, "perf/step_duration_sec": 6.54200257291086, "perf/samples_per_sec": 5.350043753410933, "perf/tokens_per_sec": 4006.724196125925, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 26212.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.582899536731326, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703029.2357173, "event": "eval_step", "step": 140, "epoch": 1, "metrics": {"eval/loss": 0.8457667776806789, "eval/duration_sec": 15.019259387161583}} | |
| {"timestamp": 1774703059.0296578, "event": "train_step", "step": 145, "epoch": 1, "metrics": {"train/step_loss": 1.5961745580037434, "train/step_real_loss": 1.3257425129413605, "train/lr": 0.00011922625236789447, "train/step_canary_loss": 10.25, "perf/step_duration_sec": 6.143337778979912, "perf/samples_per_sec": 5.371672726984512, "perf/tokens_per_sec": 4572.432936393786, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 28090.0, "perf/physical_batches": 9.0, "privacy/epsilon": 3.6474551753735103, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703090.0304368, "event": "train_step", "step": 150, "epoch": 1, "metrics": {"train/step_loss": 2.434952027088887, "train/step_real_loss": 1.3564289063215256, "train/lr": 0.00011828373167982802, "train/step_canary_loss": 9.3375, "perf/step_duration_sec": 6.4520685048773885, "perf/samples_per_sec": 5.7345950328999376, "perf/tokens_per_sec": 3939.511798547314, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 25418.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.7111045156948865, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703104.2008579, "event": "eval_step", "step": 150, "epoch": 1, "metrics": {"eval/loss": 0.845938040959564, "eval/duration_sec": 14.160498020006344}} | |
| {"timestamp": 1774703134.3571382, "event": "train_step", "step": 155, "epoch": 1, "metrics": {"train/step_loss": 1.6117286121144014, "train/step_real_loss": 1.4233991503715515, "train/lr": 0.00011730598739054154, "train/step_canary_loss": 4.625, "perf/step_duration_sec": 6.366527742007747, "perf/samples_per_sec": 5.183359177445935, "perf/tokens_per_sec": 4364.231355919252, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 27785.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.7736700577602584, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703164.0835865, "event": "train_step", "step": 160, "epoch": 1, "metrics": {"train/step_loss": 1.8811148054459517, "train/step_real_loss": 1.3463407307863235, "train/lr": 0.00011629370782916385, "train/step_canary_loss": 10.4375, "perf/step_duration_sec": 6.194121054839343, "perf/samples_per_sec": 5.489075802520276, "perf/tokens_per_sec": 4575.1446814006495, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 28339.0, "perf/physical_batches": 9.0, "privacy/epsilon": 3.8357775458019696, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703178.2333288, "event": "eval_step", "step": 160, "epoch": 1, "metrics": {"eval/loss": 0.8461048757149415, "eval/duration_sec": 14.134988086065277}} | |
| {"timestamp": 1774703208.7465525, "event": "train_step", "step": 165, "epoch": 1, "metrics": {"train/step_loss": 1.7110472066061837, "train/step_real_loss": 1.2445047572255135, "train/lr": 0.00011524760563755468, "train/step_canary_loss": 6.6875, "perf/step_duration_sec": 6.503170550102368, "perf/samples_per_sec": 5.22821902609717, "perf/tokens_per_sec": 4185.650643834264, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 27220.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.8966973756285967, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703239.680502, "event": "train_step", "step": 170, "epoch": 1, "metrics": {"train/step_loss": 1.9373356103897095, "train/step_real_loss": 1.3064556866884232, "train/lr": 0.00011416841726860683, "train/step_canary_loss": 6.984375, "perf/step_duration_sec": 6.620743467938155, "perf/samples_per_sec": 5.286415365508757, "perf/tokens_per_sec": 3832.8021804328637, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 25376.0, "perf/physical_batches": 10.0, "privacy/epsilon": 3.9571578758611676, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703253.7965026, "event": "eval_step", "step": 170, "epoch": 1, "metrics": {"eval/loss": 0.8462176741185513, "eval/duration_sec": 14.102701575960964}} | |
| {"timestamp": 1774703284.0360217, "event": "train_step", "step": 175, "epoch": 1, "metrics": {"train/step_loss": 1.8234757559640067, "train/step_real_loss": 1.4299734830856323, "train/lr": 0.00011305690246778548, "train/step_canary_loss": 6.020833333333333, "perf/step_duration_sec": 6.180147857870907, "perf/samples_per_sec": 5.501486498692473, "perf/tokens_per_sec": 3964.9536812929514, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 24504.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.016733545396104, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703314.1595054, "event": "train_step", "step": 180, "epoch": 1, "metrics": {"train/step_loss": 2.2947217322684623, "train/step_real_loss": 1.3603032529354095, "train/lr": 0.00011191384373826953, "train/step_canary_loss": 8.275, "perf/step_duration_sec": 5.662002453114837, "perf/samples_per_sec": 6.358174567761856, "perf/tokens_per_sec": 4715.4695217964945, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 26699.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.075739273126006, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703328.3585377, "event": "eval_step", "step": 180, "epoch": 1, "metrics": {"eval/loss": 0.846344795416702, "eval/duration_sec": 14.18977656099014}} | |
| {"timestamp": 1774703359.2694352, "event": "train_step", "step": 185, "epoch": 1, "metrics": {"train/step_loss": 2.2819890711042614, "train/step_real_loss": 1.2605970799922943, "train/lr": 0.0001107400457900718, "train/step_canary_loss": 10.453125, "perf/step_duration_sec": 5.289147150004283, "perf/samples_per_sec": 6.806390327024812, "perf/tokens_per_sec": 5045.614962703087, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 26687.0, "perf/physical_batches": 9.0, "privacy/epsilon": 4.133984134150172, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703390.5530107, "event": "train_step", "step": 190, "epoch": 1, "metrics": {"train/step_loss": 2.4612504469381795, "train/step_real_loss": 1.2344927042722702, "train/lr": 0.00010953633497352539, "train/step_canary_loss": 10.3125, "perf/step_duration_sec": 5.574537970125675, "perf/samples_per_sec": 6.6373213705396745, "perf/tokens_per_sec": 5376.230310137136, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 29970.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.191738086172843, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703404.6883912, "event": "eval_step", "step": 190, "epoch": 1, "metrics": {"eval/loss": 0.8465318629010157, "eval/duration_sec": 14.126018382841721}} | |
| {"timestamp": 1774703435.3802865, "event": "train_step", "step": 195, "epoch": 1, "metrics": {"train/step_loss": 1.8749484221140544, "train/step_real_loss": 1.1913481950759888, "train/lr": 0.00010830355869753557, "train/step_canary_loss": 7.343750238418579, "perf/step_duration_sec": 5.737189571838826, "perf/samples_per_sec": 6.100547935839281, "perf/tokens_per_sec": 5213.52826596825, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 29911.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.248665218250611, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703465.919752, "event": "train_step", "step": 200, "epoch": 1, "metrics": {"train/step_loss": 1.4629425090901993, "train/step_real_loss": 1.2516420409083366, "train/lr": 0.00010704258483300614, "train/step_canary_loss": 4.84375, "perf/step_duration_sec": 5.708063401049003, "perf/samples_per_sec": 5.781295280275865, "perf/tokens_per_sec": 5027.624604647174, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 28698.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.305382698901073, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703480.1049397, "event": "eval_step", "step": 200, "epoch": 1, "metrics": {"eval/loss": 0.8466584802689878, "eval/duration_sec": 14.174285852117464}} | |
| {"timestamp": 1774703510.118628, "event": "train_step", "step": 205, "epoch": 1, "metrics": {"train/step_loss": 2.2805836136276656, "train/step_real_loss": 1.3380966782569885, "train/lr": 0.0001057543011018612, "train/step_canary_loss": 8.3125, "perf/step_duration_sec": 5.581516437930986, "perf/samples_per_sec": 6.449860069451815, "perf/tokens_per_sec": 4645.153389463256, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 25927.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.361004918038597, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774703540.106463, "event": "train_epoch", "step": 208, "epoch": 1, "metrics": {"train/epoch_loss": 2.082121519783371, "train/epoch_real_loss": 1.3378177472981265, "train/epoch_canary_loss": 7.986276215388099, "perf/epoch_duration_sec": 1556.7968838158995, "perf/epoch_samples_per_sec": 37.41657027037601, "perf/epoch_tokens_per_sec": 28350.44343859268, "perf/epoch_samples": 58250.0, "perf/epoch_tokens": 44135882.0, "system/cuda_epoch_peak_memory_gb": 46.082552909851074, "eval/loss": 0.8467348944395781, "eval/duration_sec": 14.12641789088957, "privacy/epsilon": 4.394378249521112}} | |
| {"timestamp": 1774703548.4726937, "event": "audit_epoch", "step": 208, "epoch": 1, "metrics": {"audit/delta": 1e-05, "audit/num_canaries": 500.0, "audit/num_members": 250.0, "audit/paper_guess_fraction": 0.2, "audit/paper_guess_steps": 20.0, "audit/loss/auc": 0.529592, "audit/loss/empirical_epsilon/0.05": 0.007771402597427368, "audit/loss/empirical_epsilon/0.01": 0.0, "audit/loss/empirical_epsilon_details/0.05/epsilon": 0.007771402597427368, "audit/loss/empirical_epsilon_details/0.05/num_guesses": 60.0, "audit/loss/empirical_epsilon_details/0.05/correct_guesses": 37.0, "audit/loss/empirical_epsilon_details/0.01/epsilon": 0.0, "audit/loss/empirical_epsilon_details/0.01/num_guesses": 0.0, "audit/loss/empirical_epsilon_details/0.01/correct_guesses": 0.0, "audit/embedding/auc": 0.503408, "audit/embedding/empirical_epsilon/0.05": 0.0, "audit/embedding/empirical_epsilon/0.01": 0.0, "audit/embedding/empirical_epsilon_details/0.05/epsilon": 0.0, "audit/embedding/empirical_epsilon_details/0.05/num_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.05/correct_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.01/epsilon": 0.0, "audit/embedding/empirical_epsilon_details/0.01/num_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.01/correct_guesses": 0.0, "perf/audit_duration_sec": 5.581604512175545}} | |
| {"timestamp": 1774703560.314456, "event": "train_step", "step": 210, "epoch": 2, "metrics": {"train/step_loss": 1.4897712118485396, "train/step_real_loss": 1.3074912875890732, "train/lr": 0.00010443961445209121, "train/step_canary_loss": 4.40625, "perf/step_duration_sec": 5.704903840087354, "perf/samples_per_sec": 5.784497149297209, "perf/tokens_per_sec": 4832.509148756811, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 27569.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.416627137176122, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.082457065582275}} | |
| {"timestamp": 1774703574.4718843, "event": "eval_step", "step": 210, "epoch": 2, "metrics": {"eval/loss": 0.8467347511852329, "eval/duration_sec": 14.150488690007478}} | |
| {"timestamp": 1774703606.9792926, "event": "train_step", "step": 215, "epoch": 2, "metrics": {"train/step_loss": 1.9476184116469488, "train/step_real_loss": 1.3316956833004951, "train/lr": 0.0001030994504192644, "train/step_canary_loss": 6.875000238418579, "perf/step_duration_sec": 5.857716584112495, "perf/samples_per_sec": 5.97502448222371, "perf/tokens_per_sec": 4454.636823975586, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 26094.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.471245139455458, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774703637.250742, "event": "train_step", "step": 220, "epoch": 2, "metrics": {"train/step_loss": 2.704066740839105, "train/step_real_loss": 1.369282379746437, "train/lr": 0.00010173475247495244, "train/step_canary_loss": 9.822916666666666, "perf/step_duration_sec": 5.642964720958844, "perf/samples_per_sec": 6.734048834092852, "perf/tokens_per_sec": 4792.693439948453, "perf/logical_batch_size": 38.0, "perf/logical_token_count": 27045.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.5255750063855915, "system/cuda_memory_allocated_gb": 16.34234619140625, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774703651.3903606, "event": "eval_step", "step": 220, "epoch": 2, "metrics": {"eval/loss": 0.8468459952961316, "eval/duration_sec": 14.12851015292108}} | |
| {"timestamp": 1774703682.678996, "event": "train_step", "step": 225, "epoch": 2, "metrics": {"train/step_loss": 1.9755483269691467, "train/step_real_loss": 1.3416324332356453, "train/lr": 0.00010034648136252908, "train/step_canary_loss": 7.046875476837158, "perf/step_duration_sec": 5.6909152660518885, "perf/samples_per_sec": 6.150153070945562, "perf/tokens_per_sec": 4856.336583477785, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 27637.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.579643558868303, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774703712.451131, "event": "train_step", "step": 230, "epoch": 2, "metrics": {"train/step_loss": 1.9284468819113338, "train/step_real_loss": 1.4181154370307922, "train/lr": 9.893561442080963e-05, "train/step_canary_loss": 10.09375, "perf/step_duration_sec": 5.200704605085775, "perf/samples_per_sec": 6.537575690561498, "perf/tokens_per_sec": 4408.441113455984, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 22927.0, "perf/physical_batches": 9.0, "privacy/epsilon": 4.6326933869810505, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774703726.6136572, "event": "eval_step", "step": 230, "epoch": 2, "metrics": {"eval/loss": 0.8469641174782406, "eval/duration_sec": 14.14281897409819}} | |
| {"timestamp": 1774703757.02543, "event": "train_step", "step": 235, "epoch": 2, "metrics": {"train/step_loss": 2.3527077303992376, "train/step_real_loss": 1.3616399466991425, "train/lr": 9.750314489600751e-05, "train/step_canary_loss": 10.28125, "perf/step_duration_sec": 5.373189318925142, "perf/samples_per_sec": 6.69993143051983, "perf/tokens_per_sec": 4738.712613441553, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 25462.0, "perf/physical_batches": 9.0, "privacy/epsilon": 4.6857432150938, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774703788.9494057, "event": "train_step", "step": 240, "epoch": 2, "metrics": {"train/step_loss": 1.5969067952212166, "train/step_real_loss": 1.3666353449225426, "train/lr": 9.605008124249151e-05, "train/step_canary_loss": 5.28125, "perf/step_duration_sec": 6.371853213990107, "perf/samples_per_sec": 5.17902702584938, "perf/tokens_per_sec": 4300.318773796936, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 27401.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.73825775779551, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774703803.0989826, "event": "eval_step", "step": 240, "epoch": 2, "metrics": {"eval/loss": 0.8470385110175068, "eval/duration_sec": 14.137771266978234}} | |
| {"timestamp": 1774703833.8403947, "event": "train_step", "step": 245, "epoch": 2, "metrics": {"train/step_loss": 1.811898694719587, "train/step_real_loss": 1.4378188848495483, "train/lr": 9.457744641283705e-05, "train/step_canary_loss": 5.802083333333333, "perf/step_duration_sec": 6.504191594896838, "perf/samples_per_sec": 5.227398286771912, "perf/tokens_per_sec": 3663.6374639849378, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 23829.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.790039620732503, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774703864.8664234, "event": "train_step", "step": 250, "epoch": 2, "metrics": {"train/step_loss": 2.421613061750257, "train/step_real_loss": 1.299990102648735, "train/lr": 9.308627713767046e-05, "train/step_canary_loss": 9.6, "perf/step_duration_sec": 6.694291755091399, "perf/samples_per_sec": 5.52709701842011, "perf/tokens_per_sec": 4366.406644551887, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 29230.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.841821483669497, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774703878.997738, "event": "eval_step", "step": 250, "epoch": 2, "metrics": {"eval/loss": 0.8471578513695435, "eval/duration_sec": 14.116636754013598}} | |
| {"timestamp": 1774703910.224147, "event": "train_step", "step": 255, "epoch": 2, "metrics": {"train/step_loss": 1.9385174070085798, "train/step_real_loss": 1.3429096639156342, "train/lr": 9.157762319581367e-05, "train/step_canary_loss": 8.291666666666666, "perf/step_duration_sec": 6.239629854913801, "perf/samples_per_sec": 5.449041175611482, "perf/tokens_per_sec": 4517.255134581918, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 28186.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.893089997598312, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774703940.0578907, "event": "train_step", "step": 260, "epoch": 2, "metrics": {"train/step_loss": 2.029318959372384, "train/step_real_loss": 1.3348019868135452, "train/lr": 9.005254667524301e-05, "train/step_canary_loss": 9.4375, "perf/step_duration_sec": 5.202967477962375, "perf/samples_per_sec": 6.726930381219097, "perf/tokens_per_sec": 5426.326441513107, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 28233.0, "perf/physical_batches": 9.0, "privacy/epsilon": 4.943615736529964, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774703954.0946558, "event": "eval_step", "step": 260, "epoch": 2, "metrics": {"eval/loss": 0.847234814173796, "eval/duration_sec": 14.017816953128204}} | |
| {"timestamp": 1774703984.0064335, "event": "train_step", "step": 265, "epoch": 2, "metrics": {"train/step_loss": 1.9851477940877278, "train/step_real_loss": 1.469619333744049, "train/lr": 8.851212122538228e-05, "train/step_canary_loss": 6.109375476837158, "perf/step_duration_sec": 5.494907427113503, "perf/samples_per_sec": 6.369534057534731, "perf/tokens_per_sec": 4886.524542253287, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 26851.0, "perf/physical_batches": 10.0, "privacy/epsilon": 4.994141475461617, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704013.7437365, "event": "train_step", "step": 270, "epoch": 2, "metrics": {"train/step_loss": 2.3492087920506797, "train/step_real_loss": 1.4143442660570145, "train/lr": 8.695743130125684e-05, "train/step_canary_loss": 9.828125, "perf/step_duration_sec": 5.297504771966487, "perf/samples_per_sec": 6.795652207904748, "perf/tokens_per_sec": 5165.450750475154, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 27364.0, "perf/physical_batches": 9.0, "privacy/epsilon": 5.044495166368542, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704027.8510404, "event": "eval_step", "step": 270, "epoch": 2, "metrics": {"eval/loss": 0.8473275701769374, "eval/duration_sec": 14.100647212006152}} | |
| {"timestamp": 1774704058.2686903, "event": "train_step", "step": 275, "epoch": 2, "metrics": {"train/step_loss": 1.5198324568131392, "train/step_real_loss": 1.2984157353639603, "train/lr": 8.538957140004026e-05, "train/step_canary_loss": 5.0625, "perf/step_duration_sec": 5.822425212012604, "perf/samples_per_sec": 5.667741327430994, "perf/tokens_per_sec": 5002.211095800839, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 29125.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.093776396971046, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704089.4696596, "event": "train_step", "step": 280, "epoch": 2, "metrics": {"train/step_loss": 2.2229077236072436, "train/step_real_loss": 1.3221901804208755, "train/lr": 8.380964529053162e-05, "train/step_canary_loss": 7.9875, "perf/step_duration_sec": 6.428765488089994, "perf/samples_per_sec": 5.599830957700047, "perf/tokens_per_sec": 3581.09189744918, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 23022.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.143057627573549, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704103.5255067, "event": "eval_step", "step": 280, "epoch": 2, "metrics": {"eval/loss": 0.8474000880325381, "eval/duration_sec": 14.038474477827549}} | |
| {"timestamp": 1774704134.5670602, "event": "train_step", "step": 285, "epoch": 2, "metrics": {"train/step_loss": 1.22309676806132, "train/step_real_loss": 1.2613185420632362, "train/lr": 8.221876523610544e-05, "train/step_canary_loss": 0.0, "perf/step_duration_sec": 6.109340019989759, "perf/samples_per_sec": 5.237881652567382, "perf/tokens_per_sec": 4262.326194776707, "perf/logical_batch_size": 32.0, "perf/logical_token_count": 26040.0, "perf/physical_batches": 9.0, "privacy/epsilon": 5.192338858176054, "system/cuda_memory_allocated_gb": 16.530968189239502, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704164.6149778, "event": "train_step", "step": 290, "epoch": 2, "metrics": {"train/step_loss": 2.0282374245779855, "train/step_real_loss": 1.2847908735275269, "train/lr": 8.061805121168158e-05, "train/step_canary_loss": 9.958333969116211, "perf/step_duration_sec": 6.064710897859186, "perf/samples_per_sec": 5.771091250591159, "perf/tokens_per_sec": 4710.85934369684, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 28570.0, "perf/physical_batches": 9.0, "privacy/epsilon": 5.24090256094613, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704178.7716405, "event": "eval_step", "step": 290, "epoch": 2, "metrics": {"eval/loss": 0.8474216041239826, "eval/duration_sec": 14.147691816091537}} | |
| {"timestamp": 1774704209.2158594, "event": "train_step", "step": 295, "epoch": 2, "metrics": {"train/step_loss": 1.7850433622087751, "train/step_real_loss": 1.3254380524158478, "train/lr": 7.900863011526601e-05, "train/step_canary_loss": 6.6875, "perf/step_duration_sec": 6.388392842141911, "perf/samples_per_sec": 5.322152353517512, "perf/tokens_per_sec": 4555.76241461099, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 29104.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.288950680092402, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704239.59642, "event": "train_step", "step": 300, "epoch": 2, "metrics": {"train/step_loss": 2.415292791418127, "train/step_real_loss": 1.2653385400772095, "train/lr": 7.739163497461804e-05, "train/step_canary_loss": 9.775, "perf/step_duration_sec": 6.4330549070145935, "perf/samples_per_sec": 5.751544256159738, "perf/tokens_per_sec": 4256.764538126439, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 27384.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.336998799238674, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704253.809411, "event": "eval_step", "step": 300, "epoch": 2, "metrics": {"eval/loss": 0.8475047380409457, "eval/duration_sec": 14.19755891081877}} | |
| {"timestamp": 1774704284.8440778, "event": "train_step", "step": 305, "epoch": 2, "metrics": {"train/step_loss": 2.310550560822358, "train/step_real_loss": 1.3493084609508514, "train/lr": 7.576820414960206e-05, "train/step_canary_loss": 8.4625, "perf/step_duration_sec": 6.562574971932918, "perf/samples_per_sec": 5.485651616014481, "perf/tokens_per_sec": 4102.505512721053, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 26923.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.385046918384947, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704315.8771942, "event": "train_step", "step": 310, "epoch": 2, "metrics": {"train/step_loss": 1.6641213348933628, "train/step_real_loss": 1.3045077100396156, "train/lr": 7.413948053078548e-05, "train/step_canary_loss": 5.5, "perf/step_duration_sec": 6.63936623185873, "perf/samples_per_sec": 5.120970709049363, "perf/tokens_per_sec": 4047.5248783612806, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 26873.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.43223177980228, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704329.974938, "event": "eval_step", "step": 310, "epoch": 2, "metrics": {"eval/loss": 0.8475217587229881, "eval/duration_sec": 14.083483699010685}} | |
| {"timestamp": 1774704360.627232, "event": "train_step", "step": 315, "epoch": 2, "metrics": {"train/step_loss": 2.186908805692518, "train/step_real_loss": 1.294238306581974, "train/lr": 7.250661073484708e-05, "train/step_canary_loss": 7.9, "perf/step_duration_sec": 6.213432225864381, "perf/samples_per_sec": 5.7938991995670905, "perf/tokens_per_sec": 4441.3456197570395, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 27596.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.479057971982978, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704392.1324208, "event": "train_step", "step": 320, "epoch": 2, "metrics": {"train/step_loss": 2.7599759101867676, "train/step_real_loss": 1.3868463933467865, "train/lr": 7.087074429736229e-05, "train/step_canary_loss": 10.083333333333334, "perf/step_duration_sec": 6.289313570829108, "perf/samples_per_sec": 6.041994817407479, "perf/tokens_per_sec": 4380.7642423476545, "perf/logical_batch_size": 38.0, "perf/logical_token_count": 27552.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.525884164163676, "system/cuda_memory_allocated_gb": 16.34234619140625, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704406.2982066, "event": "eval_step", "step": 320, "epoch": 2, "metrics": {"eval/loss": 0.8475614400072532, "eval/duration_sec": 14.155549821909517}} | |
| {"timestamp": 1774704436.6432343, "event": "train_step", "step": 325, "epoch": 2, "metrics": {"train/step_loss": 2.252491551476556, "train/step_real_loss": 1.3446777313947678, "train/lr": 6.923303286353341e-05, "train/step_canary_loss": 8.0625, "perf/step_duration_sec": 5.68951973086223, "perf/samples_per_sec": 6.327423350818454, "perf/tokens_per_sec": 4733.967236970673, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 26934.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.572710356344374, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704466.6627338, "event": "train_step", "step": 330, "epoch": 2, "metrics": {"train/step_loss": 2.1172632353646414, "train/step_real_loss": 1.4720066636800766, "train/lr": 6.759462937743482e-05, "train/step_canary_loss": 9.0, "perf/step_duration_sec": 5.375310620991513, "perf/samples_per_sec": 6.511251622058635, "perf/tokens_per_sec": 5451.033822226859, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 29301.0, "perf/physical_batches": 9.0, "privacy/epsilon": 5.618962518543033, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704480.8615696, "event": "eval_step", "step": 330, "epoch": 2, "metrics": {"eval/loss": 0.8475655418905346, "eval/duration_sec": 14.183914782945067}} | |
| {"timestamp": 1774704510.6406467, "event": "train_step", "step": 335, "epoch": 2, "metrics": {"train/step_loss": 1.7520098966710709, "train/step_real_loss": 1.3185417652130127, "train/lr": 6.595668727034364e-05, "train/step_canary_loss": 8.6875, "perf/step_duration_sec": 5.2571783401072025, "perf/samples_per_sec": 6.46734765313415, "perf/tokens_per_sec": 5295.996863487088, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 27842.0, "perf/physical_batches": 9.0, "privacy/epsilon": 5.664577762030868, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704540.6550682, "event": "train_step", "step": 340, "epoch": 2, "metrics": {"train/step_loss": 1.877108369554792, "train/step_real_loss": 1.351915404200554, "train/lr": 6.432035964872754e-05, "train/step_canary_loss": 7.479166666666667, "perf/step_duration_sec": 5.681397710926831, "perf/samples_per_sec": 5.984442865988594, "perf/tokens_per_sec": 4380.9642039545915, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 24890.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.710193005518703, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704554.7934449, "event": "eval_step", "step": 340, "epoch": 2, "metrics": {"eval/loss": 0.8475861950692805, "eval/duration_sec": 14.120642909780145}} | |
| {"timestamp": 1774704584.6681478, "event": "train_step", "step": 345, "epoch": 2, "metrics": {"train/step_loss": 1.4991934860453886, "train/step_real_loss": 1.2217993289232254, "train/lr": 6.268679848246117e-05, "train/step_canary_loss": 5.9375, "perf/step_duration_sec": 5.688624897040427, "perf/samples_per_sec": 5.801050446685038, "perf/tokens_per_sec": 4507.943565296701, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 25644.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.755808249006538, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704616.121566, "event": "train_step", "step": 350, "epoch": 2, "metrics": {"train/step_loss": 2.3897122048042916, "train/step_real_loss": 1.2767766118049622, "train/lr": 6.105715379384262e-05, "train/step_canary_loss": 9.5125, "perf/step_duration_sec": 6.4702799001242965, "perf/samples_per_sec": 5.718454312817165, "perf/tokens_per_sec": 4243.7113113873975, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 27458.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.801423492494373, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704630.2695174, "event": "eval_step", "step": 350, "epoch": 2, "metrics": {"eval/loss": 0.8475948062471368, "eval/duration_sec": 14.137833208078519}} | |
| {"timestamp": 1774704660.7510605, "event": "train_step", "step": 355, "epoch": 2, "metrics": {"train/step_loss": 2.318686291978166, "train/step_real_loss": 1.3938716500997543, "train/lr": 5.9432572847981164e-05, "train/step_canary_loss": 8.2375, "perf/step_duration_sec": 6.543381548952311, "perf/samples_per_sec": 5.501742444740077, "perf/tokens_per_sec": 4184.227955403849, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 27379.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.846029564385675, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704691.1978962, "event": "train_step", "step": 360, "epoch": 2, "metrics": {"train/step_loss": 2.2224914318806417, "train/step_real_loss": 1.3510057181119919, "train/lr": 5.781419934512588e-05, "train/step_canary_loss": 7.8, "perf/step_duration_sec": 6.466999434866011, "perf/samples_per_sec": 5.5667238512362545, "perf/tokens_per_sec": 3972.4759927294267, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 25690.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.890444637154906, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704705.3308313, "event": "eval_step", "step": 360, "epoch": 2, "metrics": {"eval/loss": 0.8475845208899541, "eval/duration_sec": 14.11823072982952}} | |
| {"timestamp": 1774704735.2234209, "event": "train_step", "step": 365, "epoch": 2, "metrics": {"train/step_loss": 1.4651239479289335, "train/step_real_loss": 1.2539598196744919, "train/lr": 5.6203172615504136e-05, "train/step_canary_loss": 4.84375, "perf/step_duration_sec": 6.401590051827952, "perf/samples_per_sec": 5.154969270576294, "perf/tokens_per_sec": 4260.347785346281, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 27273.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.934859709924137, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704766.3523452, "event": "train_step", "step": 370, "epoch": 2, "metrics": {"train/step_loss": 1.9310800234476726, "train/step_real_loss": 1.2662149965763092, "train/lr": 5.460062681723634e-05, "train/step_canary_loss": 7.250000238418579, "perf/step_duration_sec": 5.75469884602353, "perf/samples_per_sec": 6.0819863795626485, "perf/tokens_per_sec": 4689.906582800467, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 26989.0, "perf/physical_batches": 10.0, "privacy/epsilon": 5.979274782693368, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704780.5248334, "event": "eval_step", "step": 370, "epoch": 2, "metrics": {"eval/loss": 0.8475809508765286, "eval/duration_sec": 14.164534721989185}} | |
| {"timestamp": 1774704811.4827154, "event": "train_step", "step": 375, "epoch": 2, "metrics": {"train/step_loss": 1.7879679134913853, "train/step_real_loss": 1.3794180303812027, "train/lr": 5.300769013789195e-05, "train/step_canary_loss": 6.145833333333333, "perf/step_duration_sec": 5.800660178996623, "perf/samples_per_sec": 5.861401797524571, "perf/tokens_per_sec": 4652.056691358839, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 26985.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.0236898554625995, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774704841.973108, "event": "train_step", "step": 380, "epoch": 2, "metrics": {"train/step_loss": 2.1334857395717077, "train/step_real_loss": 1.4409218430519104, "train/lr": 5.142548400024875e-05, "train/step_canary_loss": 9.520833969116211, "perf/step_duration_sec": 5.35505328909494, "perf/samples_per_sec": 6.53588267203133, "perf/tokens_per_sec": 5094.81391260088, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 27283.0, "perf/physical_batches": 9.0, "privacy/epsilon": 6.067205077496726, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774704855.959503, "event": "eval_step", "step": 380, "epoch": 2, "metrics": {"eval/loss": 0.8475886901671236, "eval/duration_sec": 13.974233868997544}} | |
| {"timestamp": 1774704886.863412, "event": "train_step", "step": 385, "epoch": 2, "metrics": {"train/step_loss": 1.536392760999275, "train/step_real_loss": 1.2855769097805023, "train/lr": 4.985512227281438e-05, "train/step_canary_loss": 9.5625, "perf/step_duration_sec": 5.2073657820001245, "perf/samples_per_sec": 6.337177256506236, "perf/tokens_per_sec": 4733.1032679124, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 24647.0, "perf/physical_batches": 9.0, "privacy/epsilon": 6.110430562913065, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774704917.4979346, "event": "train_step", "step": 390, "epoch": 2, "metrics": {"train/step_loss": 1.6382224764142717, "train/step_real_loss": 1.2586027085781097, "train/lr": 4.829771048566633e-05, "train/step_canary_loss": 5.6875, "perf/step_duration_sec": 6.297174851875752, "perf/samples_per_sec": 5.3992466145151345, "perf/tokens_per_sec": 4460.730511815592, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 28090.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.153656048329404, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774704931.5086095, "event": "eval_step", "step": 390, "epoch": 2, "metrics": {"eval/loss": 0.8475873510945926, "eval/duration_sec": 13.992301932070404}} | |
| {"timestamp": 1774704961.7628422, "event": "train_step", "step": 395, "epoch": 2, "metrics": {"train/step_loss": 1.865945900187773, "train/step_real_loss": 1.3380362689495087, "train/lr": 4.6754345052161783e-05, "train/step_canary_loss": 10.3125, "perf/step_duration_sec": 6.02248123800382, "perf/samples_per_sec": 5.645513644019165, "perf/tokens_per_sec": 4261.200489601878, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 25663.0, "perf/physical_batches": 9.0, "privacy/epsilon": 6.196881533745744, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774704992.7807424, "event": "train_step", "step": 400, "epoch": 2, "metrics": {"train/step_loss": 2.4349257752702043, "train/step_real_loss": 1.2606954276561737, "train/lr": 4.5226112497066e-05, "train/step_canary_loss": 9.95, "perf/step_duration_sec": 6.627584964968264, "perf/samples_per_sec": 5.582727372877546, "perf/tokens_per_sec": 4086.707321469955, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 27085.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.240107019162083, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774705006.780364, "event": "eval_step", "step": 400, "epoch": 2, "metrics": {"eval/loss": 0.8475714739073406, "eval/duration_sec": 13.988260480808094}} | |
| {"timestamp": 1774705037.3651092, "event": "train_step", "step": 405, "epoch": 2, "metrics": {"train/step_loss": 1.5602650922887467, "train/step_real_loss": 1.3101254105567932, "train/lr": 4.3714088691641896e-05, "train/step_canary_loss": 5.5625, "perf/step_duration_sec": 6.796408602036536, "perf/samples_per_sec": 4.855505596016047, "perf/tokens_per_sec": 4201.925115485645, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 28558.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.28314125352962, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774705067.9668245, "event": "train_step", "step": 410, "epoch": 2, "metrics": {"train/step_loss": 2.699703835152291, "train/step_real_loss": 1.5414544343948364, "train/lr": 4.221933809623992e-05, "train/step_canary_loss": 10.1125, "perf/step_duration_sec": 6.560143044916913, "perf/samples_per_sec": 5.640120916062833, "perf/tokens_per_sec": 3741.2293957548677, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 24543.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.325187545818052, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774705081.9852448, "event": "eval_step", "step": 410, "epoch": 2, "metrics": {"eval/loss": 0.847597274421291, "eval/duration_sec": 14.00767610501498}} | |
| {"timestamp": 1774705112.1065075, "event": "train_step", "step": 415, "epoch": 2, "metrics": {"train/step_loss": 1.8917703760994806, "train/step_real_loss": 1.3216010183095932, "train/lr": 4.074291301092102e-05, "train/step_canary_loss": 6.453125238418579, "perf/step_duration_sec": 6.371549545088783, "perf/samples_per_sec": 5.493169244360368, "perf/tokens_per_sec": 3952.8845882417213, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 25186.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.3672338381064835, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774705128.5169804, "event": "train_epoch", "step": 416, "epoch": 2, "metrics": {"train/epoch_loss": 2.0575782208447424, "train/epoch_real_loss": 1.3342586813761936, "train/epoch_canary_loss": 7.713699376083211, "perf/epoch_duration_sec": 1565.7435056250542, "perf/epoch_samples_per_sec": 37.14465350873838, "perf/epoch_tokens_per_sec": 28185.43831825288, "perf/epoch_samples": 58159.0, "perf/epoch_tokens": 44131167.0, "system/cuda_epoch_peak_memory_gb": 46.082552909851074, "eval/loss": 0.8475801269100472, "eval/duration_sec": 14.195432304870337, "privacy/epsilon": 6.375643096564169}} | |
| {"timestamp": 1774705137.7497761, "event": "audit_epoch", "step": 416, "epoch": 2, "metrics": {"audit/delta": 1e-05, "audit/num_canaries": 500.0, "audit/num_members": 250.0, "audit/paper_guess_fraction": 0.2, "audit/paper_guess_steps": 20.0, "audit/loss/auc": 0.529288, "audit/loss/empirical_epsilon/0.05": 0.010390725918114185, "audit/loss/empirical_epsilon/0.01": 0.0, "audit/loss/empirical_epsilon_details/0.05/epsilon": 0.010390725918114185, "audit/loss/empirical_epsilon_details/0.05/num_guesses": 100.0, "audit/loss/empirical_epsilon_details/0.05/correct_guesses": 59.0, "audit/loss/empirical_epsilon_details/0.01/epsilon": 0.0, "audit/loss/empirical_epsilon_details/0.01/num_guesses": 0.0, "audit/loss/empirical_epsilon_details/0.01/correct_guesses": 0.0, "audit/embedding/auc": 0.549968, "audit/embedding/empirical_epsilon/0.05": 0.0, "audit/embedding/empirical_epsilon/0.01": 0.0, "audit/embedding/empirical_epsilon_details/0.05/epsilon": 0.0, "audit/embedding/empirical_epsilon_details/0.05/num_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.05/correct_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.01/epsilon": 0.0, "audit/embedding/empirical_epsilon_details/0.01/num_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.01/correct_guesses": 0.0, "perf/audit_duration_sec": 5.8933791478630155}} | |
| {"timestamp": 1774705164.712225, "event": "train_step", "step": 420, "epoch": 3, "metrics": {"train/step_loss": 1.126232988694135, "train/step_real_loss": 1.1966225504875183, "train/lr": 3.928585283464046e-05, "train/step_canary_loss": 0.0, "perf/step_duration_sec": 7.607163795968518, "perf/samples_per_sec": 4.206561191302161, "perf/tokens_per_sec": 3720.046098520621, "perf/logical_batch_size": 32.0, "perf/logical_token_count": 28299.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.409280130394915, "system/cuda_memory_allocated_gb": 16.530991077423096, "system/cuda_max_memory_allocated_gb": 46.08250570297241}} | |
| {"timestamp": 1774705178.8354776, "event": "eval_step", "step": 420, "epoch": 3, "metrics": {"eval/loss": 0.847562875090675, "eval/duration_sec": 14.108301368774846}} | |
| {"timestamp": 1774705210.6332085, "event": "train_step", "step": 425, "epoch": 3, "metrics": {"train/step_loss": 1.7482675552368163, "train/step_real_loss": 1.250058263540268, "train/lr": 3.7849183333514016e-05, "train/step_canary_loss": 7.0625, "perf/step_duration_sec": 6.502579513937235, "perf/samples_per_sec": 5.228694232362167, "perf/tokens_per_sec": 4428.550229686274, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 28797.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.451326422683347, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705240.6498296, "event": "train_step", "step": 430, "epoch": 3, "metrics": {"train/step_loss": 1.7249415201299332, "train/step_real_loss": 1.295640990138054, "train/lr": 3.6433915918681605e-05, "train/step_canary_loss": 8.59375, "perf/step_duration_sec": 5.9653377460781485, "perf/samples_per_sec": 5.699593459289536, "perf/tokens_per_sec": 4079.5678360373577, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 24336.0, "perf/physical_batches": 9.0, "privacy/epsilon": 6.4933727149717795, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705254.7985632, "event": "eval_step", "step": 430, "epoch": 3, "metrics": {"eval/loss": 0.847573630681092, "eval/duration_sec": 14.139139660866931}} | |
| {"timestamp": 1774705285.847547, "event": "train_step", "step": 435, "epoch": 3, "metrics": {"train/step_loss": 2.0515839788648815, "train/step_real_loss": 1.452563226222992, "train/lr": 3.5041046934276864e-05, "train/step_canary_loss": 6.84375, "perf/step_duration_sec": 6.4525174361187965, "perf/samples_per_sec": 5.424239507526628, "perf/tokens_per_sec": 3812.4654824330014, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 24600.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.53541900726021, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705315.8339086, "event": "train_step", "step": 440, "epoch": 3, "metrics": {"train/step_loss": 1.7793634639066809, "train/step_real_loss": 1.3007299304008484, "train/lr": 3.367155695600353e-05, "train/step_canary_loss": 9.4375, "perf/step_duration_sec": 5.832705789944157, "perf/samples_per_sec": 5.829198527142841, "perf/tokens_per_sec": 4499.798368923265, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 26246.0, "perf/physical_batches": 9.0, "privacy/epsilon": 6.576308209970124, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705330.0375705, "event": "eval_step", "step": 440, "epoch": 3, "metrics": {"eval/loss": 0.8475959929214282, "eval/duration_sec": 14.188788234023377}} | |
| {"timestamp": 1774705361.536987, "event": "train_step", "step": 445, "epoch": 3, "metrics": {"train/step_loss": 2.456523573076403, "train/step_real_loss": 1.3296131938695908, "train/lr": 3.232641010081339e-05, "train/step_canary_loss": 9.66875, "perf/step_duration_sec": 6.347707838052884, "perf/samples_per_sec": 5.828875705052849, "perf/tokens_per_sec": 4262.010900662156, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 27054.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.617185519473521, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705391.9041471, "event": "train_step", "step": 450, "epoch": 3, "metrics": {"train/step_loss": 1.8409677253049963, "train/step_real_loss": 1.3271219581365585, "train/lr": 3.100655334817044e-05, "train/step_canary_loss": 10.0625, "perf/step_duration_sec": 5.835719424998388, "perf/samples_per_sec": 5.826188259557971, "perf/tokens_per_sec": 4527.46235311121, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 26421.0, "perf/physical_batches": 9.0, "privacy/epsilon": 6.658062828976919, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705406.0578125, "event": "eval_step", "step": 450, "epoch": 3, "metrics": {"eval/loss": 0.8476238946684381, "eval/duration_sec": 14.142260301858187}} | |
| {"timestamp": 1774705436.1777883, "event": "train_step", "step": 455, "epoch": 3, "metrics": {"train/step_loss": 2.8853205411862106, "train/step_real_loss": 1.2996875047683716, "train/lr": 2.9712915873380282e-05, "train/step_canary_loss": 10.13392870766776, "perf/step_duration_sec": 5.685665256110951, "perf/samples_per_sec": 6.859355632673382, "perf/tokens_per_sec": 4687.226348993478, "perf/logical_batch_size": 39.0, "perf/logical_token_count": 26650.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.698940138480316, "system/cuda_memory_allocated_gb": 16.437074184417725, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705466.3251495, "event": "train_step", "step": 460, "epoch": 3, "metrics": {"train/step_loss": 2.517282975686563, "train/step_real_loss": 1.3813115656375885, "train/lr": 2.8446408393453304e-05, "train/step_canary_loss": 9.7875, "perf/step_duration_sec": 5.574718042043969, "perf/samples_per_sec": 6.637106974908808, "perf/tokens_per_sec": 4627.139849128992, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 25795.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.7398174479837145, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705480.4577382, "event": "eval_step", "step": 460, "epoch": 3, "metrics": {"eval/loss": 0.847630437463522, "eval/duration_sec": 14.117394712986425}} | |
| {"timestamp": 1774705510.5615659, "event": "train_step", "step": 465, "epoch": 3, "metrics": {"train/step_loss": 1.6934949466160365, "train/step_real_loss": 1.20186947286129, "train/lr": 2.7207922525962636e-05, "train/step_canary_loss": 6.9375, "perf/step_duration_sec": 5.901840454898775, "perf/samples_per_sec": 5.760914795956332, "perf/tokens_per_sec": 4966.2474314552965, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 29310.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.780694757487112, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705540.6914062, "event": "train_step", "step": 470, "epoch": 3, "metrics": {"train/step_loss": 1.9607619285583495, "train/step_real_loss": 1.3438020795583725, "train/lr": 2.5998330161347976e-05, "train/step_canary_loss": 8.541666984558105, "perf/step_duration_sec": 5.316162185044959, "perf/samples_per_sec": 6.583696806402832, "perf/tokens_per_sec": 5288.777697394915, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 28116.0, "perf/physical_batches": 9.0, "privacy/epsilon": 6.82138730332437, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705554.8670964, "event": "eval_step", "step": 470, "epoch": 3, "metrics": {"eval/loss": 0.8476283294572071, "eval/duration_sec": 14.162155629135668}} | |
| {"timestamp": 1774705585.4377017, "event": "train_step", "step": 475, "epoch": 3, "metrics": {"train/step_loss": 2.5368395624934017, "train/step_real_loss": 1.3199394941329956, "train/lr": 2.4818482849107253e-05, "train/step_canary_loss": 10.325, "perf/step_duration_sec": 5.688960139174014, "perf/samples_per_sec": 6.503824793079332, "perf/tokens_per_sec": 5011.109113543394, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 28508.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.861105661563654, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705615.8926258, "event": "train_step", "step": 480, "epoch": 3, "metrics": {"train/step_loss": 2.0716699361801147, "train/step_real_loss": 1.227113053202629, "train/lr": 2.366921119830816e-05, "train/step_canary_loss": 8.828125, "perf/step_duration_sec": 5.384118451969698, "perf/samples_per_sec": 6.686331350460899, "perf/tokens_per_sec": 5237.626224527705, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 28200.0, "perf/physical_batches": 9.0, "privacy/epsilon": 6.900824019802937, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705630.0294645, "event": "eval_step", "step": 480, "epoch": 3, "metrics": {"eval/loss": 0.8476116240701892, "eval/duration_sec": 14.121506309136748}} | |
| {"timestamp": 1774705661.1397104, "event": "train_step", "step": 485, "epoch": 3, "metrics": {"train/step_loss": 1.78621927429648, "train/step_real_loss": 1.27481110394001, "train/lr": 2.2551324292841998e-05, "train/step_canary_loss": 9.96875, "perf/step_duration_sec": 6.077525713015348, "perf/samples_per_sec": 5.594381925392298, "perf/tokens_per_sec": 4364.111523740586, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 26523.0, "perf/physical_batches": 9.0, "privacy/epsilon": 6.940542378042221, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705691.6936827, "event": "train_step", "step": 490, "epoch": 3, "metrics": {"train/step_loss": 1.97020599577162, "train/step_real_loss": 1.2926535904407501, "train/lr": 2.1465609121830783e-05, "train/step_canary_loss": 7.390625238418579, "perf/step_duration_sec": 6.489749439992011, "perf/samples_per_sec": 5.393120385252206, "perf/tokens_per_sec": 4309.873633585834, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 27970.0, "perf/physical_batches": 10.0, "privacy/epsilon": 6.9802607362815055, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705705.8608572, "event": "eval_step", "step": 490, "epoch": 3, "metrics": {"eval/loss": 0.847628999162804, "eval/duration_sec": 14.158244116930291}} | |
| {"timestamp": 1774705736.265408, "event": "train_step", "step": 495, "epoch": 3, "metrics": {"train/step_loss": 2.179916948885531, "train/step_real_loss": 1.3037320971488953, "train/lr": 2.04128300255893e-05, "train/step_canary_loss": 7.7875, "perf/step_duration_sec": 6.454165891977027, "perf/samples_per_sec": 5.5777927934499605, "perf/tokens_per_sec": 4217.895922669119, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 27223.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.01997909452079, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705767.8750584, "event": "train_step", "step": 500, "epoch": 3, "metrics": {"train/step_loss": 2.5136500049281763, "train/step_real_loss": 1.363439068198204, "train/lr": 1.939372815753177e-05, "train/step_canary_loss": 9.875, "perf/step_duration_sec": 6.307756095891818, "perf/samples_per_sec": 5.86579433914665, "perf/tokens_per_sec": 4048.507838886162, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 25537.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.059697452760074, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705782.031898, "event": "eval_step", "step": 500, "epoch": 3, "metrics": {"eval/loss": 0.8476266869428483, "eval/duration_sec": 14.142719849944115}} | |
| {"timestamp": 1774705813.3792741, "event": "train_step", "step": 505, "epoch": 3, "metrics": {"train/step_loss": 1.8545954295567104, "train/step_real_loss": 1.321432501077652, "train/lr": 1.840902096240187e-05, "train/step_canary_loss": 7.541666666666667, "perf/step_duration_sec": 6.250405587023124, "perf/samples_per_sec": 5.439646999962631, "perf/tokens_per_sec": 4015.259434060651, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 25097.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.099415810999358, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705844.1240628, "event": "train_step", "step": 510, "epoch": 3, "metrics": {"train/step_loss": 1.8707237664391012, "train/step_real_loss": 1.370456501841545, "train/lr": 1.745940167119394e-05, "train/step_canary_loss": 9.875, "perf/step_duration_sec": 5.311531386105344, "perf/samples_per_sec": 6.401167107652233, "perf/tokens_per_sec": 4915.154990572849, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 26107.0, "perf/physical_batches": 9.0, "privacy/epsilon": 7.138471205899984, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705858.2967215, "event": "eval_step", "step": 510, "epoch": 3, "metrics": {"eval/loss": 0.8476048985665494, "eval/duration_sec": 14.159020371036604}} | |
| {"timestamp": 1774705890.0619946, "event": "train_step", "step": 515, "epoch": 3, "metrics": {"train/step_loss": 1.8091832978384836, "train/step_real_loss": 1.3850442320108414, "train/lr": 1.654553881312016e-05, "train/step_canary_loss": 6.333333333333333, "perf/step_duration_sec": 6.432242113165557, "perf/samples_per_sec": 5.285870681143759, "perf/tokens_per_sec": 3491.6285184649323, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 22459.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.177040470443901, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705921.5888262, "event": "train_step", "step": 520, "epoch": 3, "metrics": {"train/step_loss": 2.5437453115308606, "train/step_real_loss": 1.3689398914575577, "train/lr": 1.5668075744968074e-05, "train/step_canary_loss": 10.0625, "perf/step_duration_sec": 6.260556240100414, "perf/samples_per_sec": 5.910017988977694, "perf/tokens_per_sec": 4239.559390903944, "perf/logical_batch_size": 37.0, "perf/logical_token_count": 26542.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.215609734987817, "system/cuda_memory_allocated_gb": 16.247618198394775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705935.705343, "event": "eval_step", "step": 520, "epoch": 3, "metrics": {"eval/loss": 0.8476215902377261, "eval/duration_sec": 14.101543412078172}} | |
| {"timestamp": 1774705965.8948119, "event": "train_step", "step": 525, "epoch": 3, "metrics": {"train/step_loss": 1.9608346598488944, "train/step_real_loss": 1.2247410342097282, "train/lr": 1.4827630198179268e-05, "train/step_canary_loss": 9.8125, "perf/step_duration_sec": 5.8048105030320585, "perf/samples_per_sec": 6.029481923952257, "perf/tokens_per_sec": 4658.550005357626, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 27042.0, "perf/physical_batches": 9.0, "privacy/epsilon": 7.254178999531733, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774705996.6647747, "event": "train_step", "step": 530, "epoch": 3, "metrics": {"train/step_loss": 1.5299837869756363, "train/step_real_loss": 1.3384983986616135, "train/lr": 1.4024793843968244e-05, "train/step_canary_loss": 4.59375, "perf/step_duration_sec": 6.19956241408363, "perf/samples_per_sec": 5.322956330761903, "perf/tokens_per_sec": 3913.1794116449623, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 24260.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.29274826407565, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774706010.9274755, "event": "eval_step", "step": 530, "epoch": 3, "metrics": {"eval/loss": 0.8476035064932974, "eval/duration_sec": 14.251294237095863}} | |
| {"timestamp": 1774706041.939134, "event": "train_step", "step": 535, "epoch": 3, "metrics": {"train/step_loss": 2.7158979114733244, "train/step_real_loss": 1.3110662698745728, "train/lr": 1.326013187678748e-05, "train/step_canary_loss": 10.208333333333334, "perf/step_duration_sec": 6.425864369142801, "perf/samples_per_sec": 5.913601317587276, "perf/tokens_per_sec": 3945.617047529153, "perf/logical_batch_size": 38.0, "perf/logical_token_count": 25354.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.331317528619566, "system/cuda_memory_allocated_gb": 16.34234619140625, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774706074.6363385, "event": "train_step", "step": 540, "epoch": 3, "metrics": {"train/step_loss": 2.1915427446365356, "train/step_real_loss": 1.4264230281114578, "train/lr": 1.2534182616432408e-05, "train/step_canary_loss": 8.312500476837158, "perf/step_duration_sec": 6.56042078207247, "perf/samples_per_sec": 5.335023645989873, "perf/tokens_per_sec": 3790.762944346347, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 24869.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.3698867931634835, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774706088.805339, "event": "eval_step", "step": 540, "epoch": 3, "metrics": {"eval/loss": 0.8476456510411068, "eval/duration_sec": 14.157518177991733}} | |
| {"timestamp": 1774706119.4987738, "event": "train_step", "step": 545, "epoch": 3, "metrics": {"train/step_loss": 2.1096764512964197, "train/step_real_loss": 1.3357977718114853, "train/lr": 1.184745712906565e-05, "train/step_canary_loss": 7.0625, "perf/step_duration_sec": 6.2488325061276555, "perf/samples_per_sec": 5.761076163379017, "perf/tokens_per_sec": 4396.341232231898, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 27472.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.4084560577074, "system/cuda_memory_allocated_gb": 16.531797885894775, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774706150.406647, "event": "train_step", "step": 550, "epoch": 3, "metrics": {"train/step_loss": 2.0274913840823703, "train/step_real_loss": 1.3707714974880219, "train/lr": 1.1200438867428068e-05, "train/step_canary_loss": 7.281250476837158, "perf/step_duration_sec": 6.412045827135444, "perf/samples_per_sec": 5.458476271626417, "perf/tokens_per_sec": 3533.505625321135, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 22657.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.446875856779603, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774706164.6008914, "event": "eval_step", "step": 550, "epoch": 3, "metrics": {"eval/loss": 0.8476151647892864, "eval/duration_sec": 14.181081710150465}} | |
| {"timestamp": 1774706195.2370367, "event": "train_step", "step": 555, "epoch": 3, "metrics": {"train/step_loss": 1.8568150520324707, "train/step_real_loss": 1.3297195881605148, "train/lr": 1.0593583330489345e-05, "train/step_canary_loss": 7.479166666666667, "perf/step_duration_sec": 6.602375558111817, "perf/samples_per_sec": 5.149661618116663, "perf/tokens_per_sec": 3895.113171561947, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 25717.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.484305715933786, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774706226.8723788, "event": "train_step", "step": 560, "epoch": 3, "metrics": {"train/step_loss": 1.6160828786737778, "train/step_real_loss": 1.455369308590889, "train/lr": 1.002731774277807e-05, "train/step_canary_loss": 4.1875, "perf/step_duration_sec": 6.593549631070346, "perf/samples_per_sec": 5.004891423656886, "perf/tokens_per_sec": 3737.288923083424, "perf/logical_batch_size": 33.0, "perf/logical_token_count": 24642.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.521735575087969, "system/cuda_memory_allocated_gb": 16.247522354125977, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774706241.0597212, "event": "eval_step", "step": 560, "epoch": 3, "metrics": {"eval/loss": 0.8476623755625704, "eval/duration_sec": 14.172422597184777}} | |
| {"timestamp": 1774706271.472136, "event": "train_step", "step": 565, "epoch": 3, "metrics": {"train/step_loss": 2.0681455612182615, "train/step_real_loss": 1.3772685825824738, "train/lr": 9.502040753616962e-06, "train/step_canary_loss": 9.4375, "perf/step_duration_sec": 6.111006421037018, "perf/samples_per_sec": 5.727370843452757, "perf/tokens_per_sec": 4291.600792582629, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 26226.0, "perf/physical_batches": 9.0, "privacy/epsilon": 7.559165434242152, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774706302.6626637, "event": "train_step", "step": 570, "epoch": 3, "metrics": {"train/step_loss": 2.806567355206138, "train/step_real_loss": 1.3445174843072891, "train/lr": 9.018122156474845e-06, "train/step_canary_loss": 10.604166666666666, "perf/step_duration_sec": 6.431410561082885, "perf/samples_per_sec": 5.908501663685077, "perf/tokens_per_sec": 4632.887251872647, "perf/logical_batch_size": 38.0, "perf/logical_token_count": 29796.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.5965952933963345, "system/cuda_memory_allocated_gb": 16.34234619140625, "system/cuda_max_memory_allocated_gb": 46.08253002166748}} | |
| {"timestamp": 1774706316.8048155, "event": "eval_step", "step": 570, "epoch": 3, "metrics": {"eval/loss": 0.8476327530701052, "eval/duration_sec": 14.132337664952502}} | |
| {"timestamp": 1774706347.943645, "event": "train_step", "step": 575, "epoch": 3, "metrics": {"train/step_loss": 2.195257032239759, "train/step_real_loss": 1.2921721935272217, "train/lr": 8.575902628633133e-06, "train/step_canary_loss": 7.975, "perf/step_duration_sec": 6.366320572094992, "perf/samples_per_sec": 5.654757656690437, "perf/tokens_per_sec": 4095.9294626627734, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 26076.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.634025152550517, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774706379.3289592, "event": "train_step", "step": 580, "epoch": 3, "metrics": {"train/step_loss": 1.8297266562779744, "train/step_real_loss": 1.2342237085103989, "train/lr": 8.175693491350082e-06, "train/step_canary_loss": 6.593750238418579, "perf/step_duration_sec": 6.209561487892643, "perf/samples_per_sec": 5.636468866318941, "perf/tokens_per_sec": 4345.878537899513, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 26986.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.6714550117047, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.082552909851074}} | |
| {"timestamp": 1774706393.4969764, "event": "eval_step", "step": 580, "epoch": 3, "metrics": {"eval/loss": 0.8475754701278427, "eval/duration_sec": 14.152010071091354}} | |
| {"timestamp": 1774706424.8101745, "event": "train_step", "step": 585, "epoch": 3, "metrics": {"train/step_loss": 1.7521814618791853, "train/step_real_loss": 1.3207453489303589, "train/lr": 7.817776490691442e-06, "train/step_canary_loss": 6.354166666666667, "perf/step_duration_sec": 6.214652560884133, "perf/samples_per_sec": 5.470941402903296, "perf/tokens_per_sec": 3868.438301976416, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 24041.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.708884870858882, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08257722854614}} | |
| {"timestamp": 1774706455.767074, "event": "train_step", "step": 590, "epoch": 3, "metrics": {"train/step_loss": 2.1815602586076066, "train/step_real_loss": 1.3720384240150452, "train/lr": 7.502403599182098e-06, "train/step_canary_loss": 7.3625, "perf/step_duration_sec": 6.445409220876172, "perf/samples_per_sec": 5.58537072920038, "perf/tokens_per_sec": 3695.808781674507, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 23821.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.746314730013066, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.08257722854614}} | |
| {"timestamp": 1774706469.9166799, "event": "eval_step", "step": 590, "epoch": 3, "metrics": {"eval/loss": 0.8476284754208544, "eval/duration_sec": 14.137012894963846}} | |
| {"timestamp": 1774706500.6368022, "event": "train_step", "step": 595, "epoch": 3, "metrics": {"train/step_loss": 2.22404556525381, "train/step_real_loss": 1.3285541087388992, "train/lr": 7.22979683841816e-06, "train/step_canary_loss": 7.0, "perf/step_duration_sec": 6.537071665050462, "perf/samples_per_sec": 5.507052980995903, "perf/tokens_per_sec": 4166.5445012051505, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 27237.0, "perf/physical_batches": 11.0, "privacy/epsilon": 7.78374458916725, "system/cuda_memory_allocated_gb": 16.531729221343994, "system/cuda_max_memory_allocated_gb": 46.08257722854614}} | |
| {"timestamp": 1774706532.4743109, "event": "train_step", "step": 600, "epoch": 3, "metrics": {"train/step_loss": 1.255253602476681, "train/step_real_loss": 1.3337069526314735, "train/lr": 7.0001481227643515e-06, "train/step_canary_loss": 0.0, "perf/step_duration_sec": 6.43329463317059, "perf/samples_per_sec": 4.974123186431631, "perf/tokens_per_sec": 4180.905979545361, "perf/logical_batch_size": 32.0, "perf/logical_token_count": 26897.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.8203949896877125, "system/cuda_memory_allocated_gb": 16.530991077423096, "system/cuda_max_memory_allocated_gb": 46.08257722854614}} | |
| {"timestamp": 1774706546.6503627, "event": "eval_step", "step": 600, "epoch": 3, "metrics": {"eval/loss": 0.8476245523515072, "eval/duration_sec": 14.160503386054188}} | |
| {"timestamp": 1774706577.223923, "event": "train_step", "step": 605, "epoch": 3, "metrics": {"train/step_loss": 2.249326480759515, "train/step_real_loss": 1.225804790854454, "train/lr": 6.813619124246933e-06, "train/step_canary_loss": 10.4375, "perf/step_duration_sec": 6.03316982393153, "perf/samples_per_sec": 5.9670125407709, "perf/tokens_per_sec": 4879.524505215403, "perf/logical_batch_size": 36.0, "perf/logical_token_count": 29439.0, "perf/physical_batches": 9.0, "privacy/epsilon": 7.85669496701106, "system/cuda_memory_allocated_gb": 16.5317063331604, "system/cuda_max_memory_allocated_gb": 46.08257722854614}} | |
| {"timestamp": 1774706608.5116968, "event": "train_step", "step": 610, "epoch": 3, "metrics": {"train/step_loss": 1.9708250496122572, "train/step_real_loss": 1.3245999962091446, "train/lr": 6.670341158736986e-06, "train/step_canary_loss": 7.140625476837158, "perf/step_duration_sec": 6.528257534839213, "perf/samples_per_sec": 5.36130809993574, "perf/tokens_per_sec": 4240.794707049171, "perf/logical_batch_size": 35.0, "perf/logical_token_count": 27685.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.892994944334407, "system/cuda_memory_allocated_gb": 16.436978340148926, "system/cuda_max_memory_allocated_gb": 46.08257722854614}} | |
| {"timestamp": 1774706622.7000098, "event": "eval_step", "step": 610, "epoch": 3, "metrics": {"eval/loss": 0.8476337621157819, "eval/duration_sec": 14.175194735173136}} | |
| {"timestamp": 1774706654.1846402, "event": "train_step", "step": 615, "epoch": 3, "metrics": {"train/step_loss": 1.8169789041791644, "train/step_real_loss": 1.346695676445961, "train/lr": 6.57041509350448e-06, "train/step_canary_loss": 6.833333333333333, "perf/step_duration_sec": 6.532371184090152, "perf/samples_per_sec": 5.2048481388823005, "perf/tokens_per_sec": 4107.5436841908795, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 26832.0, "perf/physical_batches": 10.0, "privacy/epsilon": 7.929294921657754, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08257722854614}} | |
| {"timestamp": 1774706683.850218, "event": "train_step", "step": 620, "epoch": 3, "metrics": {"train/step_loss": 1.804337599698235, "train/step_real_loss": 1.2823430746793747, "train/lr": 6.5139112762079875e-06, "train/step_canary_loss": 10.15625, "perf/step_duration_sec": 5.330887127900496, "perf/samples_per_sec": 6.377925321669768, "perf/tokens_per_sec": 4628.685509182398, "perf/logical_batch_size": 34.0, "perf/logical_token_count": 24675.0, "perf/physical_batches": 9.0, "privacy/epsilon": 7.965594898981101, "system/cuda_memory_allocated_gb": 16.34225034713745, "system/cuda_max_memory_allocated_gb": 46.08257722854614}} | |
| {"timestamp": 1774706697.9801428, "event": "eval_step", "step": 620, "epoch": 3, "metrics": {"eval/loss": 0.8476180772889744, "eval/duration_sec": 14.115275254938751}} | |
| {"timestamp": 1774706733.041422, "event": "train_epoch", "step": 624, "epoch": 3, "metrics": {"train/epoch_loss": 2.0618881598471557, "train/epoch_real_loss": 1.3318002155782387, "train/epoch_canary_loss": 7.866599485030913, "perf/epoch_duration_sec": 1581.0388780001085, "perf/epoch_samples_per_sec": 36.840966285204786, "perf/epoch_tokens_per_sec": 27916.25279691381, "perf/epoch_samples": 58247.0, "perf/epoch_tokens": 44136681.0, "system/cuda_epoch_peak_memory_gb": 46.08257722854614, "eval/loss": 0.8476120976900514, "eval/duration_sec": 14.139388957060874, "privacy/epsilon": 7.99463488083978}} | |
| {"timestamp": 1774706742.371868, "event": "audit_epoch", "step": 624, "epoch": 3, "metrics": {"audit/delta": 1e-05, "audit/num_canaries": 500.0, "audit/num_members": 250.0, "audit/paper_guess_fraction": 0.2, "audit/paper_guess_steps": 20.0, "audit/loss/auc": 0.52628, "audit/loss/empirical_epsilon/0.05": 0.0, "audit/loss/empirical_epsilon/0.01": 0.0, "audit/loss/empirical_epsilon_details/0.05/epsilon": 0.0, "audit/loss/empirical_epsilon_details/0.05/num_guesses": 0.0, "audit/loss/empirical_epsilon_details/0.05/correct_guesses": 0.0, "audit/loss/empirical_epsilon_details/0.01/epsilon": 0.0, "audit/loss/empirical_epsilon_details/0.01/num_guesses": 0.0, "audit/loss/empirical_epsilon_details/0.01/correct_guesses": 0.0, "audit/embedding/auc": 0.53716, "audit/embedding/empirical_epsilon/0.05": 0.0, "audit/embedding/empirical_epsilon/0.01": 0.0, "audit/embedding/empirical_epsilon_details/0.05/epsilon": 0.0, "audit/embedding/empirical_epsilon_details/0.05/num_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.05/correct_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.01/epsilon": 0.0, "audit/embedding/empirical_epsilon_details/0.01/num_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.01/correct_guesses": 0.0, "perf/audit_duration_sec": 5.879508854821324}} | |
| {"timestamp": 1774706751.4590647, "event": "audit_final", "step": 624, "epoch": 3, "metrics": {"audit/delta": 1e-05, "audit/num_canaries": 500.0, "audit/num_members": 250.0, "audit/paper_guess_fraction": 0.2, "audit/paper_guess_steps": 20.0, "audit/loss/auc": 0.52628, "audit/loss/empirical_epsilon/0.05": 0.0, "audit/loss/empirical_epsilon/0.01": 0.0, "audit/loss/empirical_epsilon_details/0.05/epsilon": 0.0, "audit/loss/empirical_epsilon_details/0.05/num_guesses": 0.0, "audit/loss/empirical_epsilon_details/0.05/correct_guesses": 0.0, "audit/loss/empirical_epsilon_details/0.01/epsilon": 0.0, "audit/loss/empirical_epsilon_details/0.01/num_guesses": 0.0, "audit/loss/empirical_epsilon_details/0.01/correct_guesses": 0.0, "audit/embedding/auc": 0.53716, "audit/embedding/empirical_epsilon/0.05": 0.0, "audit/embedding/empirical_epsilon/0.01": 0.0, "audit/embedding/empirical_epsilon_details/0.05/epsilon": 0.0, "audit/embedding/empirical_epsilon_details/0.05/num_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.05/correct_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.01/epsilon": 0.0, "audit/embedding/empirical_epsilon_details/0.01/num_guesses": 0.0, "audit/embedding/empirical_epsilon_details/0.01/correct_guesses": 0.0}} | |
| {"timestamp": 1774706752.0167563, "event": "energy_final", "step": 624, "epoch": null, "metrics": {"energy/codecarbon/duration": 4876.212828015909, "energy/codecarbon/emissions": 0.19531666760349806, "energy/codecarbon/emissions_rate": 4.005499236647774e-05, "energy/codecarbon/cpu_power": 81.12029064705573, "energy/codecarbon/gpu_power": 4036.488899527526, "energy/codecarbon/ram_power": 38.0, "energy/codecarbon/cpu_energy": 0.10578202327142265, "energy/codecarbon/gpu_energy": 5.4502873277263575, "energy/codecarbon/ram_energy": 0.049552082389069795, "energy/codecarbon/energy_consumed": 5.605621433386851, "energy/codecarbon/water_consumed": 0.0, "energy/codecarbon/cpu_count": 16.0, "energy/codecarbon/gpu_count": 8.0, "energy/codecarbon/longitude": 8.212, "energy/codecarbon/latitude": 47.4843, "energy/codecarbon/ram_total_size": 128.0, "energy/codecarbon/cpu_utilization_percent": 10.068375181572941, "energy/codecarbon/gpu_utilization_percent": 93.63337829425193, "energy/codecarbon/ram_utilization_percent": 26.690475202324134, "energy/codecarbon/ram_used_gb": 529.1190595498197, "energy/codecarbon/pue": 1.0, "energy/codecarbon/wue": 0.0}} | |