Alex-GSL commited on
Commit
73d5b95
·
verified ·
1 Parent(s): 6ec3759

Upload human_games/game_20260324_192413_22.json with huggingface_hub

Browse files
human_games/game_20260324_192413_22.json ADDED
@@ -0,0 +1,633 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "game_number": 22,
3
+ "timestamp": "2026-03-24T19:24:13.619000+00:00",
4
+ "checkpoint": "checkpoints/r39_900M.pkl",
5
+ "architecture": "shared",
6
+ "result": "human_win",
7
+ "final_scores": [
8
+ 23,
9
+ 0
10
+ ],
11
+ "total_turns": 4,
12
+ "actions": [
13
+ {
14
+ "turn": 0,
15
+ "player": -1,
16
+ "phase": "draw",
17
+ "action": -1,
18
+ "action_desc": "Initial deal",
19
+ "card_drawn": null,
20
+ "hands": [
21
+ [
22
+ 12,
23
+ 18,
24
+ 5,
25
+ 38,
26
+ 29,
27
+ 6,
28
+ 25,
29
+ 46,
30
+ 14,
31
+ 13
32
+ ],
33
+ [
34
+ 51,
35
+ 30,
36
+ 48,
37
+ 4,
38
+ 49,
39
+ 44,
40
+ 17,
41
+ 33,
42
+ 36,
43
+ 20
44
+ ]
45
+ ],
46
+ "hand_sizes": [
47
+ 10,
48
+ 10
49
+ ],
50
+ "discard_pile": [
51
+ 3
52
+ ],
53
+ "discard_size": 1,
54
+ "stock_remaining": 31,
55
+ "deadwood": [
56
+ 34,
57
+ 62
58
+ ],
59
+ "model_logits": null,
60
+ "model_value": null
61
+ },
62
+ {
63
+ "turn": 1,
64
+ "player": 1,
65
+ "phase": "draw",
66
+ "action": 0,
67
+ "action_desc": "Model drew from stock",
68
+ "card_drawn": 22,
69
+ "hands": [
70
+ [
71
+ 12,
72
+ 18,
73
+ 5,
74
+ 38,
75
+ 29,
76
+ 6,
77
+ 25,
78
+ 46,
79
+ 14,
80
+ 13
81
+ ],
82
+ [
83
+ 51,
84
+ 30,
85
+ 48,
86
+ 4,
87
+ 49,
88
+ 44,
89
+ 17,
90
+ 33,
91
+ 36,
92
+ 20
93
+ ]
94
+ ],
95
+ "hand_sizes": [
96
+ 10,
97
+ 10
98
+ ],
99
+ "discard_pile": [
100
+ 3
101
+ ],
102
+ "discard_size": 1,
103
+ "stock_remaining": 31,
104
+ "deadwood": [
105
+ 34,
106
+ 62
107
+ ],
108
+ "model_logits": [
109
+ 3.109464406967163,
110
+ -3.112916946411133,
111
+ 4.70317268371582,
112
+ -22.055505752563477,
113
+ 2.655984878540039,
114
+ -20.03134536743164,
115
+ 1.9063637256622314,
116
+ -0.5329421162605286,
117
+ -21.788272857666016,
118
+ 1.8471542596817017,
119
+ 2.655738592147827,
120
+ 1.2116081714630127,
121
+ 6.592553615570068,
122
+ -8.15271282196045,
123
+ 7.924522399902344,
124
+ 1.591727614402771
125
+ ],
126
+ "model_value": 0.044368676841259
127
+ },
128
+ {
129
+ "turn": 2,
130
+ "player": 1,
131
+ "phase": "discard",
132
+ "action": 2,
133
+ "action_desc": "Model discarded K\u2663",
134
+ "card_drawn": null,
135
+ "hands": [
136
+ [
137
+ 12,
138
+ 18,
139
+ 5,
140
+ 38,
141
+ 29,
142
+ 6,
143
+ 25,
144
+ 46,
145
+ 14,
146
+ 13
147
+ ],
148
+ [
149
+ 51,
150
+ 30,
151
+ 48,
152
+ 4,
153
+ 49,
154
+ 44,
155
+ 17,
156
+ 33,
157
+ 36,
158
+ 20,
159
+ 22
160
+ ]
161
+ ],
162
+ "hand_sizes": [
163
+ 10,
164
+ 11
165
+ ],
166
+ "discard_pile": [
167
+ 3
168
+ ],
169
+ "discard_size": 1,
170
+ "stock_remaining": 30,
171
+ "deadwood": [
172
+ 34,
173
+ 72
174
+ ],
175
+ "model_logits": [
176
+ -10.006057739257812,
177
+ 9.999044418334961,
178
+ 9.938360214233398,
179
+ -19.24264144897461,
180
+ 6.890890121459961,
181
+ -17.140472412109375,
182
+ 7.011821746826172,
183
+ -12.747942924499512,
184
+ -19.436288833618164,
185
+ -9.630936622619629,
186
+ 8.278351783752441,
187
+ -11.058783531188965,
188
+ 7.150765895843506,
189
+ -9.46861743927002,
190
+ 9.176074028015137,
191
+ 1.8340317010879517
192
+ ],
193
+ "model_value": 0.03979571908712387
194
+ },
195
+ {
196
+ "turn": 3,
197
+ "player": 0,
198
+ "phase": "draw",
199
+ "action": 1,
200
+ "action_desc": "Human drew K\u2663 from discard",
201
+ "card_drawn": 51,
202
+ "hands": [
203
+ [
204
+ 12,
205
+ 18,
206
+ 5,
207
+ 38,
208
+ 29,
209
+ 6,
210
+ 25,
211
+ 46,
212
+ 14,
213
+ 13
214
+ ],
215
+ [
216
+ 22,
217
+ 30,
218
+ 48,
219
+ 4,
220
+ 49,
221
+ 44,
222
+ 17,
223
+ 33,
224
+ 36,
225
+ 20
226
+ ]
227
+ ],
228
+ "hand_sizes": [
229
+ 10,
230
+ 10
231
+ ],
232
+ "discard_pile": [
233
+ 3,
234
+ 51
235
+ ],
236
+ "discard_size": 2,
237
+ "stock_remaining": 30,
238
+ "deadwood": [
239
+ 34,
240
+ 62
241
+ ],
242
+ "model_logits": null,
243
+ "model_value": null
244
+ },
245
+ {
246
+ "turn": 4,
247
+ "player": 0,
248
+ "phase": "discard",
249
+ "action": 9,
250
+ "action_desc": "Human discarded 8\u2663",
251
+ "card_drawn": null,
252
+ "hands": [
253
+ [
254
+ 12,
255
+ 18,
256
+ 5,
257
+ 38,
258
+ 29,
259
+ 6,
260
+ 25,
261
+ 46,
262
+ 14,
263
+ 13,
264
+ 51
265
+ ],
266
+ [
267
+ 22,
268
+ 30,
269
+ 48,
270
+ 4,
271
+ 49,
272
+ 44,
273
+ 17,
274
+ 33,
275
+ 36,
276
+ 20
277
+ ]
278
+ ],
279
+ "hand_sizes": [
280
+ 11,
281
+ 10
282
+ ],
283
+ "discard_pile": [
284
+ 3
285
+ ],
286
+ "discard_size": 1,
287
+ "stock_remaining": 30,
288
+ "deadwood": [
289
+ 34,
290
+ 62
291
+ ],
292
+ "model_logits": null,
293
+ "model_value": null
294
+ },
295
+ {
296
+ "turn": 5,
297
+ "player": 1,
298
+ "phase": "draw",
299
+ "action": 1,
300
+ "action_desc": "Model drew 8\u2663 from discard",
301
+ "card_drawn": 46,
302
+ "hands": [
303
+ [
304
+ 12,
305
+ 18,
306
+ 5,
307
+ 38,
308
+ 29,
309
+ 6,
310
+ 25,
311
+ 51,
312
+ 14,
313
+ 13
314
+ ],
315
+ [
316
+ 22,
317
+ 30,
318
+ 48,
319
+ 4,
320
+ 49,
321
+ 44,
322
+ 17,
323
+ 33,
324
+ 36,
325
+ 20
326
+ ]
327
+ ],
328
+ "hand_sizes": [
329
+ 10,
330
+ 10
331
+ ],
332
+ "discard_pile": [
333
+ 3,
334
+ 46
335
+ ],
336
+ "discard_size": 2,
337
+ "stock_remaining": 30,
338
+ "deadwood": [
339
+ 26,
340
+ 62
341
+ ],
342
+ "model_logits": [
343
+ -12.413908004760742,
344
+ 12.405494689941406,
345
+ 4.790521621704102,
346
+ -21.396961212158203,
347
+ 3.492217540740967,
348
+ -19.653650283813477,
349
+ 3.1724815368652344,
350
+ 0.03338705003261566,
351
+ -21.141630172729492,
352
+ 4.521771430969238,
353
+ 2.902677297592163,
354
+ 4.073572158813477,
355
+ -1.0634233951568604,
356
+ -8.263012886047363,
357
+ 8.02218246459961,
358
+ 1.5639886856079102
359
+ ],
360
+ "model_value": -0.12015456706285477
361
+ },
362
+ {
363
+ "turn": 6,
364
+ "player": 1,
365
+ "phase": "discard",
366
+ "action": 2,
367
+ "action_desc": "Model discarded 10\u2665",
368
+ "card_drawn": null,
369
+ "hands": [
370
+ [
371
+ 12,
372
+ 18,
373
+ 5,
374
+ 38,
375
+ 29,
376
+ 6,
377
+ 25,
378
+ 51,
379
+ 14,
380
+ 13
381
+ ],
382
+ [
383
+ 22,
384
+ 30,
385
+ 48,
386
+ 4,
387
+ 49,
388
+ 44,
389
+ 17,
390
+ 33,
391
+ 36,
392
+ 20,
393
+ 46
394
+ ]
395
+ ],
396
+ "hand_sizes": [
397
+ 10,
398
+ 11
399
+ ],
400
+ "discard_pile": [
401
+ 3
402
+ ],
403
+ "discard_size": 1,
404
+ "stock_remaining": 30,
405
+ "deadwood": [
406
+ 26,
407
+ 46
408
+ ],
409
+ "model_logits": [
410
+ -1.6212071180343628,
411
+ 1.6183295249938965,
412
+ 2.4860188961029053,
413
+ -9.728973388671875,
414
+ 0.7912133932113647,
415
+ -7.736215114593506,
416
+ 0.49954953789711,
417
+ -1.744486689567566,
418
+ -9.424201011657715,
419
+ -10.191868782043457,
420
+ 1.532856822013855,
421
+ -10.971802711486816,
422
+ -10.603041648864746,
423
+ -9.129015922546387,
424
+ 8.874019622802734,
425
+ 1.7276297807693481
426
+ ],
427
+ "model_value": -0.10639283806085587
428
+ },
429
+ {
430
+ "turn": 7,
431
+ "player": 0,
432
+ "phase": "draw",
433
+ "action": 0,
434
+ "action_desc": "Human drew from stock",
435
+ "card_drawn": 31,
436
+ "hands": [
437
+ [
438
+ 12,
439
+ 18,
440
+ 5,
441
+ 38,
442
+ 29,
443
+ 6,
444
+ 25,
445
+ 51,
446
+ 14,
447
+ 13
448
+ ],
449
+ [
450
+ 46,
451
+ 30,
452
+ 48,
453
+ 4,
454
+ 49,
455
+ 44,
456
+ 17,
457
+ 33,
458
+ 36,
459
+ 20
460
+ ]
461
+ ],
462
+ "hand_sizes": [
463
+ 10,
464
+ 10
465
+ ],
466
+ "discard_pile": [
467
+ 3,
468
+ 22
469
+ ],
470
+ "discard_size": 2,
471
+ "stock_remaining": 30,
472
+ "deadwood": [
473
+ 26,
474
+ 36
475
+ ],
476
+ "model_logits": null,
477
+ "model_value": null
478
+ },
479
+ {
480
+ "turn": 8,
481
+ "player": 0,
482
+ "phase": "discard",
483
+ "action": 7,
484
+ "action_desc": "Human discarded 7\u2660",
485
+ "card_drawn": null,
486
+ "hands": [
487
+ [
488
+ 12,
489
+ 18,
490
+ 5,
491
+ 38,
492
+ 29,
493
+ 6,
494
+ 25,
495
+ 51,
496
+ 14,
497
+ 13,
498
+ 31
499
+ ],
500
+ [
501
+ 46,
502
+ 30,
503
+ 48,
504
+ 4,
505
+ 49,
506
+ 44,
507
+ 17,
508
+ 33,
509
+ 36,
510
+ 20
511
+ ]
512
+ ],
513
+ "hand_sizes": [
514
+ 11,
515
+ 10
516
+ ],
517
+ "discard_pile": [
518
+ 3,
519
+ 22
520
+ ],
521
+ "discard_size": 2,
522
+ "stock_remaining": 29,
523
+ "deadwood": [
524
+ 14,
525
+ 36
526
+ ],
527
+ "model_logits": null,
528
+ "model_value": null
529
+ },
530
+ {
531
+ "turn": 9,
532
+ "player": 0,
533
+ "phase": "knock_decision",
534
+ "action": 14,
535
+ "action_desc": "Human knocked",
536
+ "card_drawn": null,
537
+ "hands": [
538
+ [
539
+ 12,
540
+ 18,
541
+ 5,
542
+ 38,
543
+ 29,
544
+ 31,
545
+ 25,
546
+ 51,
547
+ 14,
548
+ 13
549
+ ],
550
+ [
551
+ 46,
552
+ 30,
553
+ 48,
554
+ 4,
555
+ 49,
556
+ 44,
557
+ 17,
558
+ 33,
559
+ 36,
560
+ 20
561
+ ]
562
+ ],
563
+ "hand_sizes": [
564
+ 10,
565
+ 10
566
+ ],
567
+ "discard_pile": [
568
+ 3,
569
+ 22,
570
+ 6
571
+ ],
572
+ "discard_size": 3,
573
+ "stock_remaining": 29,
574
+ "deadwood": [
575
+ 7,
576
+ 36
577
+ ],
578
+ "model_logits": null,
579
+ "model_value": null
580
+ },
581
+ {
582
+ "turn": 10,
583
+ "player": -1,
584
+ "phase": "game_over",
585
+ "action": -1,
586
+ "action_desc": "Game over.",
587
+ "card_drawn": null,
588
+ "hands": [
589
+ [
590
+ 12,
591
+ 18,
592
+ 5,
593
+ 38,
594
+ 29,
595
+ 31,
596
+ 25,
597
+ 51,
598
+ 14,
599
+ 13
600
+ ],
601
+ [
602
+ 46,
603
+ 30,
604
+ 48,
605
+ 4,
606
+ 49,
607
+ 44,
608
+ 17,
609
+ 33,
610
+ 36,
611
+ 20
612
+ ]
613
+ ],
614
+ "hand_sizes": [
615
+ 10,
616
+ 10
617
+ ],
618
+ "discard_pile": [
619
+ 3,
620
+ 22,
621
+ 6
622
+ ],
623
+ "discard_size": 3,
624
+ "stock_remaining": 29,
625
+ "deadwood": [
626
+ 7,
627
+ 36
628
+ ],
629
+ "model_logits": null,
630
+ "model_value": null
631
+ }
632
+ ]
633
+ }