Alex-GSL commited on
Commit
fa2c55a
·
verified ·
1 Parent(s): d77bd58

Upload human_games/game_20260324_063935_7.json with huggingface_hub

Browse files
human_games/game_20260324_063935_7.json ADDED
@@ -0,0 +1,1421 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "game_number": 7,
3
+ "timestamp": "2026-03-24T06:39:35.260079+00:00",
4
+ "checkpoint": "checkpoints/r39_900M.pkl",
5
+ "architecture": "shared",
6
+ "result": "model_win",
7
+ "final_scores": [
8
+ 0,
9
+ 11
10
+ ],
11
+ "total_turns": 10,
12
+ "actions": [
13
+ {
14
+ "turn": 0,
15
+ "player": -1,
16
+ "phase": "draw",
17
+ "action": -1,
18
+ "action_desc": "Initial deal",
19
+ "card_drawn": null,
20
+ "hands": [
21
+ [
22
+ 39,
23
+ 16,
24
+ 21,
25
+ 50,
26
+ 5,
27
+ 29,
28
+ 22,
29
+ 48,
30
+ 38,
31
+ 32
32
+ ],
33
+ [
34
+ 14,
35
+ 15,
36
+ 2,
37
+ 6,
38
+ 18,
39
+ 10,
40
+ 0,
41
+ 42,
42
+ 20,
43
+ 31
44
+ ]
45
+ ],
46
+ "hand_sizes": [
47
+ 10,
48
+ 10
49
+ ],
50
+ "discard_pile": [
51
+ 33
52
+ ],
53
+ "discard_size": 1,
54
+ "stock_remaining": 31,
55
+ "deadwood": [
56
+ 71,
57
+ 50
58
+ ],
59
+ "model_logits": null,
60
+ "model_value": null
61
+ },
62
+ {
63
+ "turn": 1,
64
+ "player": 0,
65
+ "phase": "draw",
66
+ "action": 1,
67
+ "action_desc": "Human drew 8\u2666 from discard",
68
+ "card_drawn": 33,
69
+ "hands": [
70
+ [
71
+ 39,
72
+ 16,
73
+ 21,
74
+ 50,
75
+ 5,
76
+ 29,
77
+ 22,
78
+ 48,
79
+ 38,
80
+ 32
81
+ ],
82
+ [
83
+ 14,
84
+ 15,
85
+ 2,
86
+ 6,
87
+ 18,
88
+ 10,
89
+ 0,
90
+ 42,
91
+ 20,
92
+ 31
93
+ ]
94
+ ],
95
+ "hand_sizes": [
96
+ 10,
97
+ 10
98
+ ],
99
+ "discard_pile": [
100
+ 33
101
+ ],
102
+ "discard_size": 1,
103
+ "stock_remaining": 31,
104
+ "deadwood": [
105
+ 71,
106
+ 50
107
+ ],
108
+ "model_logits": null,
109
+ "model_value": null
110
+ },
111
+ {
112
+ "turn": 2,
113
+ "player": 0,
114
+ "phase": "discard",
115
+ "action": 10,
116
+ "action_desc": "Human discarded K\u2666",
117
+ "card_drawn": null,
118
+ "hands": [
119
+ [
120
+ 39,
121
+ 16,
122
+ 21,
123
+ 50,
124
+ 5,
125
+ 29,
126
+ 22,
127
+ 48,
128
+ 38,
129
+ 32,
130
+ 33
131
+ ],
132
+ [
133
+ 14,
134
+ 15,
135
+ 2,
136
+ 6,
137
+ 18,
138
+ 10,
139
+ 0,
140
+ 42,
141
+ 20,
142
+ 31
143
+ ]
144
+ ],
145
+ "hand_sizes": [
146
+ 11,
147
+ 10
148
+ ],
149
+ "discard_pile": [],
150
+ "discard_size": 0,
151
+ "stock_remaining": 31,
152
+ "deadwood": [
153
+ 79,
154
+ 50
155
+ ],
156
+ "model_logits": null,
157
+ "model_value": null
158
+ },
159
+ {
160
+ "turn": 3,
161
+ "player": 1,
162
+ "phase": "draw",
163
+ "action": 0,
164
+ "action_desc": "Model drew from stock",
165
+ "card_drawn": 37,
166
+ "hands": [
167
+ [
168
+ 39,
169
+ 16,
170
+ 21,
171
+ 50,
172
+ 5,
173
+ 29,
174
+ 22,
175
+ 48,
176
+ 33,
177
+ 32
178
+ ],
179
+ [
180
+ 14,
181
+ 15,
182
+ 2,
183
+ 6,
184
+ 18,
185
+ 10,
186
+ 0,
187
+ 42,
188
+ 20,
189
+ 31
190
+ ]
191
+ ],
192
+ "hand_sizes": [
193
+ 10,
194
+ 10
195
+ ],
196
+ "discard_pile": [
197
+ 38
198
+ ],
199
+ "discard_size": 1,
200
+ "stock_remaining": 31,
201
+ "deadwood": [
202
+ 69,
203
+ 50
204
+ ],
205
+ "model_logits": [
206
+ 5.126653671264648,
207
+ -5.1295084953308105,
208
+ -6.861243724822998,
209
+ -6.543865203857422,
210
+ -5.290234565734863,
211
+ -2.0543019771575928,
212
+ -3.1220903396606445,
213
+ -0.45276135206222534,
214
+ -7.185001373291016,
215
+ -4.5501389503479,
216
+ -2.469714403152466,
217
+ -3.647491455078125,
218
+ -1.4985601902008057,
219
+ -8.0098876953125,
220
+ 7.796536445617676,
221
+ 1.5130730867385864
222
+ ],
223
+ "model_value": -0.21141019463539124
224
+ },
225
+ {
226
+ "turn": 4,
227
+ "player": 1,
228
+ "phase": "discard",
229
+ "action": 7,
230
+ "action_desc": "Model discarded J\u2660",
231
+ "card_drawn": null,
232
+ "hands": [
233
+ [
234
+ 39,
235
+ 16,
236
+ 21,
237
+ 50,
238
+ 5,
239
+ 29,
240
+ 22,
241
+ 48,
242
+ 33,
243
+ 32
244
+ ],
245
+ [
246
+ 14,
247
+ 15,
248
+ 2,
249
+ 6,
250
+ 18,
251
+ 10,
252
+ 0,
253
+ 42,
254
+ 20,
255
+ 31,
256
+ 37
257
+ ]
258
+ ],
259
+ "hand_sizes": [
260
+ 10,
261
+ 11
262
+ ],
263
+ "discard_pile": [
264
+ 38
265
+ ],
266
+ "discard_size": 1,
267
+ "stock_remaining": 30,
268
+ "deadwood": [
269
+ 69,
270
+ 60
271
+ ],
272
+ "model_logits": [
273
+ 8.324285507202148,
274
+ -8.325616836547852,
275
+ -13.471858024597168,
276
+ -12.16165828704834,
277
+ -12.394731521606445,
278
+ -7.47069787979126,
279
+ -9.250984191894531,
280
+ 14.0492582321167,
281
+ -13.336589813232422,
282
+ -9.89210033416748,
283
+ -8.505082130432129,
284
+ -9.964954376220703,
285
+ 14.825322151184082,
286
+ -11.19517993927002,
287
+ 10.921822547912598,
288
+ 2.189155101776123
289
+ ],
290
+ "model_value": -0.2725549638271332
291
+ },
292
+ {
293
+ "turn": 5,
294
+ "player": 0,
295
+ "phase": "draw",
296
+ "action": 0,
297
+ "action_desc": "Human drew from stock",
298
+ "card_drawn": 45,
299
+ "hands": [
300
+ [
301
+ 39,
302
+ 16,
303
+ 21,
304
+ 50,
305
+ 5,
306
+ 29,
307
+ 22,
308
+ 48,
309
+ 33,
310
+ 32
311
+ ],
312
+ [
313
+ 14,
314
+ 15,
315
+ 2,
316
+ 6,
317
+ 18,
318
+ 37,
319
+ 0,
320
+ 42,
321
+ 20,
322
+ 31
323
+ ]
324
+ ],
325
+ "hand_sizes": [
326
+ 10,
327
+ 10
328
+ ],
329
+ "discard_pile": [
330
+ 38,
331
+ 10
332
+ ],
333
+ "discard_size": 2,
334
+ "stock_remaining": 30,
335
+ "deadwood": [
336
+ 69,
337
+ 50
338
+ ],
339
+ "model_logits": null,
340
+ "model_value": null
341
+ },
342
+ {
343
+ "turn": 6,
344
+ "player": 0,
345
+ "phase": "discard",
346
+ "action": 5,
347
+ "action_desc": "Human discarded Q\u2663",
348
+ "card_drawn": null,
349
+ "hands": [
350
+ [
351
+ 39,
352
+ 16,
353
+ 21,
354
+ 50,
355
+ 5,
356
+ 29,
357
+ 22,
358
+ 48,
359
+ 33,
360
+ 32,
361
+ 45
362
+ ],
363
+ [
364
+ 14,
365
+ 15,
366
+ 2,
367
+ 6,
368
+ 18,
369
+ 37,
370
+ 0,
371
+ 42,
372
+ 20,
373
+ 31
374
+ ]
375
+ ],
376
+ "hand_sizes": [
377
+ 11,
378
+ 10
379
+ ],
380
+ "discard_pile": [
381
+ 38,
382
+ 10
383
+ ],
384
+ "discard_size": 2,
385
+ "stock_remaining": 29,
386
+ "deadwood": [
387
+ 76,
388
+ 50
389
+ ],
390
+ "model_logits": null,
391
+ "model_value": null
392
+ },
393
+ {
394
+ "turn": 7,
395
+ "player": 1,
396
+ "phase": "draw",
397
+ "action": 0,
398
+ "action_desc": "Model drew from stock",
399
+ "card_drawn": 19,
400
+ "hands": [
401
+ [
402
+ 39,
403
+ 16,
404
+ 21,
405
+ 45,
406
+ 5,
407
+ 29,
408
+ 22,
409
+ 48,
410
+ 33,
411
+ 32
412
+ ],
413
+ [
414
+ 14,
415
+ 15,
416
+ 2,
417
+ 6,
418
+ 18,
419
+ 37,
420
+ 0,
421
+ 42,
422
+ 20,
423
+ 31
424
+ ]
425
+ ],
426
+ "hand_sizes": [
427
+ 10,
428
+ 10
429
+ ],
430
+ "discard_pile": [
431
+ 38,
432
+ 10,
433
+ 50
434
+ ],
435
+ "discard_size": 3,
436
+ "stock_remaining": 29,
437
+ "deadwood": [
438
+ 66,
439
+ 50
440
+ ],
441
+ "model_logits": [
442
+ 4.401744365692139,
443
+ -4.4058990478515625,
444
+ -7.724531650543213,
445
+ -6.9231791496276855,
446
+ -5.224926471710205,
447
+ -2.9028067588806152,
448
+ -3.0285537242889404,
449
+ 0.11879847943782806,
450
+ -7.425036907196045,
451
+ -4.322253704071045,
452
+ -2.4713757038116455,
453
+ -3.9531264305114746,
454
+ -3.5391485691070557,
455
+ -8.811593055725098,
456
+ 8.573871612548828,
457
+ 1.6507983207702637
458
+ ],
459
+ "model_value": -0.255930632352829
460
+ },
461
+ {
462
+ "turn": 8,
463
+ "player": 1,
464
+ "phase": "discard",
465
+ "action": 7,
466
+ "action_desc": "Model discarded Q\u2666",
467
+ "card_drawn": null,
468
+ "hands": [
469
+ [
470
+ 39,
471
+ 16,
472
+ 21,
473
+ 45,
474
+ 5,
475
+ 29,
476
+ 22,
477
+ 48,
478
+ 33,
479
+ 32
480
+ ],
481
+ [
482
+ 14,
483
+ 15,
484
+ 2,
485
+ 6,
486
+ 18,
487
+ 37,
488
+ 0,
489
+ 42,
490
+ 20,
491
+ 31,
492
+ 19
493
+ ]
494
+ ],
495
+ "hand_sizes": [
496
+ 10,
497
+ 11
498
+ ],
499
+ "discard_pile": [
500
+ 38,
501
+ 10,
502
+ 50
503
+ ],
504
+ "discard_size": 3,
505
+ "stock_remaining": 28,
506
+ "deadwood": [
507
+ 66,
508
+ 36
509
+ ],
510
+ "model_logits": [
511
+ -5.679299831390381,
512
+ 5.667057037353516,
513
+ -3.651925563812256,
514
+ -3.393664598464966,
515
+ -2.980839729309082,
516
+ 0.4642338156700134,
517
+ -32.51799011230469,
518
+ 4.752808570861816,
519
+ -4.431901931762695,
520
+ -0.4568707346916199,
521
+ -12.822242736816406,
522
+ -0.25161805748939514,
523
+ -7.1858296394348145,
524
+ -10.867212295532227,
525
+ 10.578520774841309,
526
+ 2.002751350402832
527
+ ],
528
+ "model_value": -0.041785724461078644
529
+ },
530
+ {
531
+ "turn": 9,
532
+ "player": 0,
533
+ "phase": "draw",
534
+ "action": 0,
535
+ "action_desc": "Human drew from stock",
536
+ "card_drawn": 43,
537
+ "hands": [
538
+ [
539
+ 39,
540
+ 16,
541
+ 21,
542
+ 45,
543
+ 5,
544
+ 29,
545
+ 22,
546
+ 48,
547
+ 33,
548
+ 32
549
+ ],
550
+ [
551
+ 14,
552
+ 15,
553
+ 2,
554
+ 6,
555
+ 18,
556
+ 19,
557
+ 0,
558
+ 42,
559
+ 20,
560
+ 31
561
+ ]
562
+ ],
563
+ "hand_sizes": [
564
+ 10,
565
+ 10
566
+ ],
567
+ "discard_pile": [
568
+ 38,
569
+ 10,
570
+ 50,
571
+ 37
572
+ ],
573
+ "discard_size": 4,
574
+ "stock_remaining": 28,
575
+ "deadwood": [
576
+ 66,
577
+ 26
578
+ ],
579
+ "model_logits": null,
580
+ "model_value": null
581
+ },
582
+ {
583
+ "turn": 10,
584
+ "player": 0,
585
+ "phase": "discard",
586
+ "action": 9,
587
+ "action_desc": "Human discarded 10\u2663",
588
+ "card_drawn": null,
589
+ "hands": [
590
+ [
591
+ 39,
592
+ 16,
593
+ 21,
594
+ 45,
595
+ 5,
596
+ 29,
597
+ 22,
598
+ 48,
599
+ 33,
600
+ 32,
601
+ 43
602
+ ],
603
+ [
604
+ 14,
605
+ 15,
606
+ 2,
607
+ 6,
608
+ 18,
609
+ 19,
610
+ 0,
611
+ 42,
612
+ 20,
613
+ 31
614
+ ]
615
+ ],
616
+ "hand_sizes": [
617
+ 11,
618
+ 10
619
+ ],
620
+ "discard_pile": [
621
+ 38,
622
+ 10,
623
+ 50,
624
+ 37
625
+ ],
626
+ "discard_size": 4,
627
+ "stock_remaining": 27,
628
+ "deadwood": [
629
+ 71,
630
+ 26
631
+ ],
632
+ "model_logits": null,
633
+ "model_value": null
634
+ },
635
+ {
636
+ "turn": 11,
637
+ "player": 1,
638
+ "phase": "draw",
639
+ "action": 0,
640
+ "action_desc": "Model drew from stock",
641
+ "card_drawn": 30,
642
+ "hands": [
643
+ [
644
+ 39,
645
+ 16,
646
+ 21,
647
+ 45,
648
+ 5,
649
+ 29,
650
+ 22,
651
+ 43,
652
+ 33,
653
+ 32
654
+ ],
655
+ [
656
+ 14,
657
+ 15,
658
+ 2,
659
+ 6,
660
+ 18,
661
+ 19,
662
+ 0,
663
+ 42,
664
+ 20,
665
+ 31
666
+ ]
667
+ ],
668
+ "hand_sizes": [
669
+ 10,
670
+ 10
671
+ ],
672
+ "discard_pile": [
673
+ 38,
674
+ 10,
675
+ 50,
676
+ 37,
677
+ 48
678
+ ],
679
+ "discard_size": 5,
680
+ "stock_remaining": 27,
681
+ "deadwood": [
682
+ 61,
683
+ 26
684
+ ],
685
+ "model_logits": [
686
+ 3.51971435546875,
687
+ -3.5317254066467285,
688
+ 0.2833046615123749,
689
+ 1.0819870233535767,
690
+ 1.7867908477783203,
691
+ 4.607614517211914,
692
+ -27.000417709350586,
693
+ -25.44249153137207,
694
+ -0.2194102704524994,
695
+ 2.900752544403076,
696
+ -25.785076141357422,
697
+ 3.275852680206299,
698
+ 1.052756905555725,
699
+ -10.98749828338623,
700
+ 10.677159309387207,
701
+ 2.084076404571533
702
+ ],
703
+ "model_value": 0.055591605603694916
704
+ },
705
+ {
706
+ "turn": 12,
707
+ "player": 1,
708
+ "phase": "discard",
709
+ "action": 12,
710
+ "action_desc": "Model discarded 5\u2666",
711
+ "card_drawn": null,
712
+ "hands": [
713
+ [
714
+ 39,
715
+ 16,
716
+ 21,
717
+ 45,
718
+ 5,
719
+ 29,
720
+ 22,
721
+ 43,
722
+ 33,
723
+ 32
724
+ ],
725
+ [
726
+ 14,
727
+ 15,
728
+ 2,
729
+ 6,
730
+ 18,
731
+ 19,
732
+ 0,
733
+ 42,
734
+ 20,
735
+ 31,
736
+ 30
737
+ ]
738
+ ],
739
+ "hand_sizes": [
740
+ 10,
741
+ 11
742
+ ],
743
+ "discard_pile": [
744
+ 38,
745
+ 10,
746
+ 50,
747
+ 37,
748
+ 48
749
+ ],
750
+ "discard_size": 5,
751
+ "stock_remaining": 26,
752
+ "deadwood": [
753
+ 61,
754
+ 31
755
+ ],
756
+ "model_logits": [
757
+ 3.3101553916931152,
758
+ -3.3224661350250244,
759
+ -10.904746055603027,
760
+ -11.095510482788086,
761
+ -10.693611145019531,
762
+ 12.521478652954102,
763
+ -21.422319412231445,
764
+ -18.493745803833008,
765
+ -11.821793556213379,
766
+ -8.317180633544922,
767
+ -20.57308578491211,
768
+ 10.463668823242188,
769
+ 14.69269847869873,
770
+ -13.32497501373291,
771
+ 12.951459884643555,
772
+ 2.5454325675964355
773
+ ],
774
+ "model_value": -0.10870037227869034
775
+ },
776
+ {
777
+ "turn": 13,
778
+ "player": 0,
779
+ "phase": "draw",
780
+ "action": 0,
781
+ "action_desc": "Human drew from stock",
782
+ "card_drawn": 51,
783
+ "hands": [
784
+ [
785
+ 39,
786
+ 16,
787
+ 21,
788
+ 45,
789
+ 5,
790
+ 29,
791
+ 22,
792
+ 43,
793
+ 33,
794
+ 32
795
+ ],
796
+ [
797
+ 14,
798
+ 15,
799
+ 2,
800
+ 6,
801
+ 18,
802
+ 19,
803
+ 0,
804
+ 42,
805
+ 20,
806
+ 31
807
+ ]
808
+ ],
809
+ "hand_sizes": [
810
+ 10,
811
+ 10
812
+ ],
813
+ "discard_pile": [
814
+ 38,
815
+ 10,
816
+ 50,
817
+ 37,
818
+ 48,
819
+ 30
820
+ ],
821
+ "discard_size": 6,
822
+ "stock_remaining": 26,
823
+ "deadwood": [
824
+ 61,
825
+ 26
826
+ ],
827
+ "model_logits": null,
828
+ "model_value": null
829
+ },
830
+ {
831
+ "turn": 14,
832
+ "player": 0,
833
+ "phase": "discard",
834
+ "action": 12,
835
+ "action_desc": "Human discarded K\u2663",
836
+ "card_drawn": null,
837
+ "hands": [
838
+ [
839
+ 39,
840
+ 16,
841
+ 21,
842
+ 45,
843
+ 5,
844
+ 29,
845
+ 22,
846
+ 43,
847
+ 33,
848
+ 32,
849
+ 51
850
+ ],
851
+ [
852
+ 14,
853
+ 15,
854
+ 2,
855
+ 6,
856
+ 18,
857
+ 19,
858
+ 0,
859
+ 42,
860
+ 20,
861
+ 31
862
+ ]
863
+ ],
864
+ "hand_sizes": [
865
+ 11,
866
+ 10
867
+ ],
868
+ "discard_pile": [
869
+ 38,
870
+ 10,
871
+ 50,
872
+ 37,
873
+ 48,
874
+ 30
875
+ ],
876
+ "discard_size": 6,
877
+ "stock_remaining": 25,
878
+ "deadwood": [
879
+ 71,
880
+ 26
881
+ ],
882
+ "model_logits": null,
883
+ "model_value": null
884
+ },
885
+ {
886
+ "turn": 15,
887
+ "player": 1,
888
+ "phase": "draw",
889
+ "action": 0,
890
+ "action_desc": "Model drew from stock",
891
+ "card_drawn": 28,
892
+ "hands": [
893
+ [
894
+ 39,
895
+ 16,
896
+ 21,
897
+ 45,
898
+ 5,
899
+ 29,
900
+ 22,
901
+ 43,
902
+ 33,
903
+ 32
904
+ ],
905
+ [
906
+ 14,
907
+ 15,
908
+ 2,
909
+ 6,
910
+ 18,
911
+ 19,
912
+ 0,
913
+ 42,
914
+ 20,
915
+ 31
916
+ ]
917
+ ],
918
+ "hand_sizes": [
919
+ 10,
920
+ 10
921
+ ],
922
+ "discard_pile": [
923
+ 38,
924
+ 10,
925
+ 50,
926
+ 37,
927
+ 48,
928
+ 30,
929
+ 51
930
+ ],
931
+ "discard_size": 7,
932
+ "stock_remaining": 25,
933
+ "deadwood": [
934
+ 61,
935
+ 26
936
+ ],
937
+ "model_logits": [
938
+ 3.7137739658355713,
939
+ -3.7257795333862305,
940
+ 0.25913307070732117,
941
+ 0.9811568856239319,
942
+ 1.2438340187072754,
943
+ 5.041465759277344,
944
+ -27.491424560546875,
945
+ -26.291391372680664,
946
+ -0.5412510633468628,
947
+ 2.8459887504577637,
948
+ -26.207008361816406,
949
+ 3.29575777053833,
950
+ 1.2365401983261108,
951
+ -11.469968795776367,
952
+ 11.145064353942871,
953
+ 2.177492618560791
954
+ ],
955
+ "model_value": -0.03628332167863846
956
+ },
957
+ {
958
+ "turn": 16,
959
+ "player": 1,
960
+ "phase": "discard",
961
+ "action": 5,
962
+ "action_desc": "Model discarded 7\u2660",
963
+ "card_drawn": null,
964
+ "hands": [
965
+ [
966
+ 39,
967
+ 16,
968
+ 21,
969
+ 45,
970
+ 5,
971
+ 29,
972
+ 22,
973
+ 43,
974
+ 33,
975
+ 32
976
+ ],
977
+ [
978
+ 14,
979
+ 15,
980
+ 2,
981
+ 6,
982
+ 18,
983
+ 19,
984
+ 0,
985
+ 42,
986
+ 20,
987
+ 31,
988
+ 28
989
+ ]
990
+ ],
991
+ "hand_sizes": [
992
+ 10,
993
+ 11
994
+ ],
995
+ "discard_pile": [
996
+ 38,
997
+ 10,
998
+ 50,
999
+ 37,
1000
+ 48,
1001
+ 30,
1002
+ 51
1003
+ ],
1004
+ "discard_size": 7,
1005
+ "stock_remaining": 24,
1006
+ "deadwood": [
1007
+ 61,
1008
+ 20
1009
+ ],
1010
+ "model_logits": [
1011
+ -0.580439031124115,
1012
+ 0.5654222369194031,
1013
+ 1.00437593460083,
1014
+ -2.1447203159332275,
1015
+ -2.519040584564209,
1016
+ 5.23391580581665,
1017
+ -29.072206497192383,
1018
+ -26.79841423034668,
1019
+ -0.23038282990455627,
1020
+ 3.612154722213745,
1021
+ -27.754079818725586,
1022
+ 3.82499623298645,
1023
+ -3.793586492538452,
1024
+ -13.010588645935059,
1025
+ 12.637957572937012,
1026
+ 2.462074041366577
1027
+ ],
1028
+ "model_value": 0.17074382305145264
1029
+ },
1030
+ {
1031
+ "turn": 17,
1032
+ "player": 0,
1033
+ "phase": "draw",
1034
+ "action": 1,
1035
+ "action_desc": "Human drew 7\u2660 from discard",
1036
+ "card_drawn": 6,
1037
+ "hands": [
1038
+ [
1039
+ 39,
1040
+ 16,
1041
+ 21,
1042
+ 45,
1043
+ 5,
1044
+ 29,
1045
+ 22,
1046
+ 43,
1047
+ 33,
1048
+ 32
1049
+ ],
1050
+ [
1051
+ 14,
1052
+ 15,
1053
+ 2,
1054
+ 28,
1055
+ 18,
1056
+ 19,
1057
+ 0,
1058
+ 42,
1059
+ 20,
1060
+ 31
1061
+ ]
1062
+ ],
1063
+ "hand_sizes": [
1064
+ 10,
1065
+ 10
1066
+ ],
1067
+ "discard_pile": [
1068
+ 38,
1069
+ 10,
1070
+ 50,
1071
+ 37,
1072
+ 48,
1073
+ 30,
1074
+ 51,
1075
+ 6
1076
+ ],
1077
+ "discard_size": 8,
1078
+ "stock_remaining": 24,
1079
+ "deadwood": [
1080
+ 61,
1081
+ 13
1082
+ ],
1083
+ "model_logits": null,
1084
+ "model_value": null
1085
+ },
1086
+ {
1087
+ "turn": 18,
1088
+ "player": 0,
1089
+ "phase": "discard",
1090
+ "action": 10,
1091
+ "action_desc": "Human discarded 8\u2666",
1092
+ "card_drawn": null,
1093
+ "hands": [
1094
+ [
1095
+ 39,
1096
+ 16,
1097
+ 21,
1098
+ 45,
1099
+ 5,
1100
+ 29,
1101
+ 22,
1102
+ 43,
1103
+ 33,
1104
+ 32,
1105
+ 6
1106
+ ],
1107
+ [
1108
+ 14,
1109
+ 15,
1110
+ 2,
1111
+ 28,
1112
+ 18,
1113
+ 19,
1114
+ 0,
1115
+ 42,
1116
+ 20,
1117
+ 31
1118
+ ]
1119
+ ],
1120
+ "hand_sizes": [
1121
+ 11,
1122
+ 10
1123
+ ],
1124
+ "discard_pile": [
1125
+ 38,
1126
+ 10,
1127
+ 50,
1128
+ 37,
1129
+ 48,
1130
+ 30,
1131
+ 51
1132
+ ],
1133
+ "discard_size": 7,
1134
+ "stock_remaining": 24,
1135
+ "deadwood": [
1136
+ 47,
1137
+ 13
1138
+ ],
1139
+ "model_logits": null,
1140
+ "model_value": null
1141
+ },
1142
+ {
1143
+ "turn": 19,
1144
+ "player": 1,
1145
+ "phase": "draw",
1146
+ "action": 0,
1147
+ "action_desc": "Model drew from stock",
1148
+ "card_drawn": 40,
1149
+ "hands": [
1150
+ [
1151
+ 39,
1152
+ 16,
1153
+ 21,
1154
+ 45,
1155
+ 5,
1156
+ 29,
1157
+ 22,
1158
+ 43,
1159
+ 6,
1160
+ 32
1161
+ ],
1162
+ [
1163
+ 14,
1164
+ 15,
1165
+ 2,
1166
+ 28,
1167
+ 18,
1168
+ 19,
1169
+ 0,
1170
+ 42,
1171
+ 20,
1172
+ 31
1173
+ ]
1174
+ ],
1175
+ "hand_sizes": [
1176
+ 10,
1177
+ 10
1178
+ ],
1179
+ "discard_pile": [
1180
+ 38,
1181
+ 10,
1182
+ 50,
1183
+ 37,
1184
+ 48,
1185
+ 30,
1186
+ 51,
1187
+ 33
1188
+ ],
1189
+ "discard_size": 8,
1190
+ "stock_remaining": 24,
1191
+ "deadwood": [
1192
+ 39,
1193
+ 13
1194
+ ],
1195
+ "model_logits": [
1196
+ 2.573659658432007,
1197
+ -2.58231782913208,
1198
+ 6.347954273223877,
1199
+ -14.177045822143555,
1200
+ -13.017663955688477,
1201
+ -14.66211223602295,
1202
+ -21.7970027923584,
1203
+ -22.045923233032227,
1204
+ 6.178452968597412,
1205
+ 9.758776664733887,
1206
+ -19.829437255859375,
1207
+ 10.041627883911133,
1208
+ 3.9640257358551025,
1209
+ -12.038032531738281,
1210
+ 11.681946754455566,
1211
+ 2.3303403854370117
1212
+ ],
1213
+ "model_value": 0.09014331549406052
1214
+ },
1215
+ {
1216
+ "turn": 20,
1217
+ "player": 1,
1218
+ "phase": "discard",
1219
+ "action": 11,
1220
+ "action_desc": "Model discarded 6\u2666",
1221
+ "card_drawn": null,
1222
+ "hands": [
1223
+ [
1224
+ 39,
1225
+ 16,
1226
+ 21,
1227
+ 45,
1228
+ 5,
1229
+ 29,
1230
+ 22,
1231
+ 43,
1232
+ 6,
1233
+ 32
1234
+ ],
1235
+ [
1236
+ 14,
1237
+ 15,
1238
+ 2,
1239
+ 28,
1240
+ 18,
1241
+ 19,
1242
+ 0,
1243
+ 42,
1244
+ 20,
1245
+ 31,
1246
+ 40
1247
+ ]
1248
+ ],
1249
+ "hand_sizes": [
1250
+ 10,
1251
+ 11
1252
+ ],
1253
+ "discard_pile": [
1254
+ 38,
1255
+ 10,
1256
+ 50,
1257
+ 37,
1258
+ 48,
1259
+ 30,
1260
+ 51,
1261
+ 33
1262
+ ],
1263
+ "discard_size": 8,
1264
+ "stock_remaining": 23,
1265
+ "deadwood": [
1266
+ 39,
1267
+ 15
1268
+ ],
1269
+ "model_logits": [
1270
+ -4.153538703918457,
1271
+ 4.141969680786133,
1272
+ 8.283892631530762,
1273
+ -13.9446382522583,
1274
+ -13.641948699951172,
1275
+ -13.380784034729004,
1276
+ -21.186758041381836,
1277
+ -19.702402114868164,
1278
+ -11.739419937133789,
1279
+ 11.330644607543945,
1280
+ -19.836627960205078,
1281
+ 12.001965522766113,
1282
+ 3.390955686569214,
1283
+ -13.666848182678223,
1284
+ 13.266141891479492,
1285
+ 2.6160666942596436
1286
+ ],
1287
+ "model_value": 0.1503770351409912
1288
+ },
1289
+ {
1290
+ "turn": 21,
1291
+ "player": 1,
1292
+ "phase": "knock_decision",
1293
+ "action": 14,
1294
+ "action_desc": "Model knocked",
1295
+ "card_drawn": null,
1296
+ "hands": [
1297
+ [
1298
+ 39,
1299
+ 16,
1300
+ 21,
1301
+ 45,
1302
+ 5,
1303
+ 29,
1304
+ 22,
1305
+ 43,
1306
+ 6,
1307
+ 32
1308
+ ],
1309
+ [
1310
+ 14,
1311
+ 15,
1312
+ 2,
1313
+ 28,
1314
+ 18,
1315
+ 19,
1316
+ 0,
1317
+ 42,
1318
+ 20,
1319
+ 40
1320
+ ]
1321
+ ],
1322
+ "hand_sizes": [
1323
+ 10,
1324
+ 10
1325
+ ],
1326
+ "discard_pile": [
1327
+ 38,
1328
+ 10,
1329
+ 50,
1330
+ 37,
1331
+ 48,
1332
+ 30,
1333
+ 51,
1334
+ 33,
1335
+ 31
1336
+ ],
1337
+ "discard_size": 9,
1338
+ "stock_remaining": 23,
1339
+ "deadwood": [
1340
+ 39,
1341
+ 9
1342
+ ],
1343
+ "model_logits": [
1344
+ 3.756993293762207,
1345
+ -3.7701854705810547,
1346
+ 6.154211044311523,
1347
+ -11.575858116149902,
1348
+ -12.498071670532227,
1349
+ -14.86362075805664,
1350
+ -21.703907012939453,
1351
+ -19.479597091674805,
1352
+ 4.714268207550049,
1353
+ 6.769254684448242,
1354
+ -19.45001220703125,
1355
+ 5.898441314697266,
1356
+ 3.1961967945098877,
1357
+ -11.973695755004883,
1358
+ 11.630904197692871,
1359
+ 2.339296817779541
1360
+ ],
1361
+ "model_value": 0.21073266863822937
1362
+ },
1363
+ {
1364
+ "turn": 22,
1365
+ "player": -1,
1366
+ "phase": "game_over",
1367
+ "action": -1,
1368
+ "action_desc": "Game over.",
1369
+ "card_drawn": null,
1370
+ "hands": [
1371
+ [
1372
+ 39,
1373
+ 16,
1374
+ 21,
1375
+ 45,
1376
+ 5,
1377
+ 29,
1378
+ 22,
1379
+ 43,
1380
+ 6,
1381
+ 32
1382
+ ],
1383
+ [
1384
+ 14,
1385
+ 15,
1386
+ 2,
1387
+ 28,
1388
+ 18,
1389
+ 19,
1390
+ 0,
1391
+ 42,
1392
+ 20,
1393
+ 40
1394
+ ]
1395
+ ],
1396
+ "hand_sizes": [
1397
+ 10,
1398
+ 10
1399
+ ],
1400
+ "discard_pile": [
1401
+ 38,
1402
+ 10,
1403
+ 50,
1404
+ 37,
1405
+ 48,
1406
+ 30,
1407
+ 51,
1408
+ 33,
1409
+ 31
1410
+ ],
1411
+ "discard_size": 9,
1412
+ "stock_remaining": 23,
1413
+ "deadwood": [
1414
+ 39,
1415
+ 9
1416
+ ],
1417
+ "model_logits": null,
1418
+ "model_value": null
1419
+ }
1420
+ ]
1421
+ }