{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [], "gpuType": "T4" }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" }, "accelerator": "GPU" }, "cells": [ { "cell_type": "code", "source": [ "!pip -q install chess pygame numpy torch matplotlib pandas" ], "metadata": { "id": "DAV6zrHmztwq" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "43KPUdCMgdyR", "outputId": "b6095333-3653-4823-bd03-383cf8a80ecf" }, "outputs": [ { "metadata": { "tags": null }, "name": "stdout", "output_type": "stream", "text": [ "Compiling JIT model for Tensor Core reduction...\n", "\n", "šŸš€ Optimized Pipeline | Envs: 256 | BZ: 8192 | Device: CUDA\n" ] }, { "metadata": { "tags": null }, "name": "stderr", "output_type": "stream", "text": [ "W0421 02:50:31.332000 39915 torch/_inductor/utils.py:1679] [0/0] Not enough SMs to use max_autotune_gemm mode\n", "/usr/local/lib/python3.12/dist-packages/torch/_inductor/select_algorithm.py:3464: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. 
To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage()\n", " current_size = base.storage().size()\n", "Autotune Choices Stats:\n", "{\"num_choices\": 2, \"num_triton_choices\": 0, \"best_kernel\": \"bias_addmm\", \"best_time\": 0.4034560024738312}\n", "AUTOTUNE addmm(256x5376, 256x2048, 2048x5376)\n", "strides: [0, 1], [2048, 1], [1, 2048]\n", "dtypes: torch.float16, torch.float16, torch.float16\n", " bias_addmm 0.4035 ms 100.0% \n", " addmm 0.4853 ms 83.1% \n", "SingleProcess AUTOTUNE benchmarking takes 0.2749 seconds and 0.0003 seconds precompiling for 2 choices\n", "Autotune Choices Stats:\n", "{\"num_choices\": 2, \"num_triton_choices\": 0, \"best_kernel\": \"bias_addmm\", \"best_time\": 8.788448333740234}\n", "AUTOTUNE addmm(8192x5376, 8192x2048, 2048x5376)\n", "strides: [0, 1], [2048, 1], [1, 2048]\n", "dtypes: torch.float16, torch.float16, torch.float16\n", " bias_addmm 8.7884 ms 100.0% \n", " addmm 9.4638 ms 92.9% \n", "SingleProcess AUTOTUNE benchmarking takes 0.1625 seconds and 0.0004 seconds precompiling for 2 choices\n" ] }, { "metadata": { "tags": null }, "name": "stdout", "output_type": "stream", "text": [ "[Iter 0001] P: 0.1286 | V: 0.0680 | V_Mean: 0.022 | Win%: 0.04 | FPS: 260\n", "[Iter 0002] P: 0.2187 | V: 0.0789 | V_Mean: 0.052 | Win%: 0.09 | FPS: 2161\n", "[Iter 0003] P: 0.2295 | V: 0.0712 | V_Mean: 0.077 | Win%: 0.15 | FPS: 2109\n", "[Iter 0004] P: 0.2508 | V: 0.0857 | V_Mean: 0.104 | Win%: 0.21 | FPS: 2105\n", "[Iter 0005] P: 0.2623 | V: 0.0932 | V_Mean: 0.124 | Win%: 0.27 | FPS: 2146\n", "[Iter 0006] P: 0.2850 | V: 0.1089 | V_Mean: 0.158 | Win%: 0.33 | FPS: 2153\n", "[Iter 0007] P: 0.2834 | V: 0.1107 | V_Mean: 0.167 | Win%: 0.37 | FPS: 2184\n" ] }, { "metadata": { "tags": null }, "name": "stderr", "output_type": "stream", "text": [ "CUDAGraph supports dynamic shapes by recording a new graph for each distinct input size. Recording too many CUDAGraphs may lead to extra overhead. 
We have observed 9 distinct sizes. Please consider the following options for better performance: a) padding inputs to a few fixed number of shapes; or b) set torch._inductor.config.triton.cudagraph_skip_dynamic_graphs=True. Set torch._inductor.config.triton.cudagraph_dynamic_shape_warn_limit=None to silence this warning.\n", "CUDAGraph supports dynamic shapes by recording a new graph for each distinct input size. Recording too many CUDAGraphs may lead to extra overhead. We have observed 9 distinct sizes. Please consider the following options for better performance: a) padding inputs to a few fixed number of shapes; or b) set torch._inductor.config.triton.cudagraph_skip_dynamic_graphs=True. Set torch._inductor.config.triton.cudagraph_dynamic_shape_warn_limit=None to silence this warning.\n" ] }, { "output_type": "stream", "name": "stdout", "text": [ "[Iter 0008] P: 0.3000 | V: 0.1349 | V_Mean: 0.208 | Win%: 0.45 | FPS: 2042\n", "[Iter 0009] P: 0.3013 | V: 0.1323 | V_Mean: 0.221 | Win%: 0.50 | FPS: 2040\n", "[Iter 0010] P: 0.3028 | V: 0.1476 | V_Mean: 0.244 | Win%: 0.54 | FPS: 2153\n", "[Iter 0011] P: 0.2981 | V: 0.1452 | V_Mean: 0.251 | Win%: 0.58 | FPS: 2124\n", "[Iter 0012] P: 0.3019 | V: 0.1464 | V_Mean: 0.269 | Win%: 0.62 | FPS: 2126\n", "[Iter 0013] P: 0.3031 | V: 0.1572 | V_Mean: 0.304 | Win%: 0.70 | FPS: 2075\n", "[Iter 0014] P: 0.2985 | V: 0.1593 | V_Mean: 0.323 | Win%: 0.76 | FPS: 1984\n", "[Iter 0015] P: 0.3137 | V: 0.1541 | V_Mean: 0.346 | Win%: 0.82 | FPS: 2111\n", "[Iter 0016] P: 0.3117 | V: 0.1767 | V_Mean: 0.352 | Win%: 0.88 | FPS: 2117\n", "[Iter 0017] P: 0.3176 | V: 0.1587 | V_Mean: 0.376 | Win%: 0.99 | FPS: 2062\n", "[Iter 0018] P: 0.2984 | V: 0.1580 | V_Mean: 0.392 | Win%: 1.05 | FPS: 2038\n", "[Iter 0019] P: 0.2929 | V: 0.1633 | V_Mean: 0.407 | Win%: 1.11 | FPS: 2102\n", "[Iter 0020] P: 0.2834 | V: 0.1586 | V_Mean: 0.422 | Win%: 1.17 | FPS: 2098\n", "[Iter 0021] P: 0.2636 | V: 0.1636 | V_Mean: 0.437 | Win%: 1.24 | FPS: 2080\n", "[Iter 0022] P: 
0.2738 | V: 0.1558 | V_Mean: 0.455 | Win%: 1.30 | FPS: 2009\n", "[Iter 0023] P: 0.2464 | V: 0.1615 | V_Mean: 0.465 | Win%: 1.34 | FPS: 2066\n", "[Iter 0024] P: 0.2225 | V: 0.1590 | V_Mean: 0.472 | Win%: 1.37 | FPS: 2124\n", "[Iter 0025] P: 0.1825 | V: 0.1552 | V_Mean: 0.465 | Win%: 1.38 | FPS: 2089\n", "[Iter 0026] P: 0.1481 | V: 0.1455 | V_Mean: 0.470 | Win%: 1.38 | FPS: 2041\n", "[Iter 0027] P: 0.1393 | V: 0.1555 | V_Mean: 0.467 | Win%: 1.38 | FPS: 2054\n", "[Iter 0028] P: 0.1221 | V: 0.1437 | V_Mean: 0.463 | Win%: 1.39 | FPS: 2085\n", "[Iter 0029] P: 0.1266 | V: 0.1563 | V_Mean: 0.470 | Win%: 1.41 | FPS: 2020\n", "[Iter 0030] P: 0.1303 | V: 0.1570 | V_Mean: 0.469 | Win%: 1.41 | FPS: 2051\n", "[Iter 0031] P: 0.1044 | V: 0.1498 | V_Mean: 0.469 | Win%: 1.42 | FPS: 2091\n", "[Iter 0032] P: 0.1057 | V: 0.1553 | V_Mean: 0.470 | Win%: 1.42 | FPS: 2140\n", "[Iter 0033] P: 0.0951 | V: 0.1499 | V_Mean: 0.466 | Win%: 1.43 | FPS: 2140\n", "[Iter 0034] P: 0.0978 | V: 0.1557 | V_Mean: 0.465 | Win%: 1.43 | FPS: 2017\n", "[Iter 0035] P: 0.0871 | V: 0.1510 | V_Mean: 0.464 | Win%: 1.43 | FPS: 2059\n", "[Iter 0036] P: 0.0862 | V: 0.1585 | V_Mean: 0.464 | Win%: 1.43 | FPS: 2195\n", "[Iter 0037] P: 0.0885 | V: 0.1616 | V_Mean: 0.462 | Win%: 1.44 | FPS: 2146\n", "[Iter 0038] P: 0.0935 | V: 0.1661 | V_Mean: 0.462 | Win%: 1.44 | FPS: 2263\n", "[Iter 0039] P: 0.0738 | V: 0.1652 | V_Mean: 0.462 | Win%: 1.44 | FPS: 2044\n", "[Iter 0040] P: 0.0709 | V: 0.1533 | V_Mean: 0.463 | Win%: 1.45 | FPS: 2123\n", "[Iter 0041] P: 0.0790 | V: 0.1694 | V_Mean: 0.461 | Win%: 1.45 | FPS: 2068\n", "[Iter 0042] P: 0.0785 | V: 0.1665 | V_Mean: 0.462 | Win%: 1.45 | FPS: 2194\n", "[Iter 0043] P: 0.0702 | V: 0.1611 | V_Mean: 0.462 | Win%: 1.45 | FPS: 2064\n", "[Iter 0044] P: 0.0843 | V: 0.1657 | V_Mean: 0.462 | Win%: 1.46 | FPS: 2053\n", "[Iter 0045] P: 0.0843 | V: 0.1642 | V_Mean: 0.462 | Win%: 1.47 | FPS: 2094\n", "[Iter 0046] P: 0.1080 | V: 0.1737 | V_Mean: 0.464 | Win%: 1.47 | FPS: 2142\n", "[Iter 0047] P: 
0.0711 | V: 0.1611 | V_Mean: 0.461 | Win%: 1.47 | FPS: 2063\n", "[Iter 0048] P: 0.0578 | V: 0.1708 | V_Mean: 0.462 | Win%: 1.47 | FPS: 2096\n", "[Iter 0049] P: 0.0475 | V: 0.1717 | V_Mean: 0.461 | Win%: 1.48 | FPS: 2218\n", "[Iter 0050] P: 0.0519 | V: 0.1686 | V_Mean: 0.461 | Win%: 1.48 | FPS: 2159\n", "[Iter 0051] P: 0.0469 | V: 0.1664 | V_Mean: 0.465 | Win%: 1.48 | FPS: 2237\n", "[Iter 0052] P: 0.0601 | V: 0.1657 | V_Mean: 0.465 | Win%: 1.49 | FPS: 2017\n", "[Iter 0053] P: 0.0508 | V: 0.1662 | V_Mean: 0.464 | Win%: 1.49 | FPS: 2101\n", "[Iter 0054] P: 0.0509 | V: 0.1744 | V_Mean: 0.466 | Win%: 1.49 | FPS: 2147\n", "[Iter 0055] P: 0.0572 | V: 0.1731 | V_Mean: 0.465 | Win%: 1.49 | FPS: 2216\n", "[Iter 0056] P: 0.0658 | V: 0.1690 | V_Mean: 0.465 | Win%: 1.50 | FPS: 2040\n", "[Iter 0057] P: 0.0747 | V: 0.1656 | V_Mean: 0.467 | Win%: 1.50 | FPS: 2028\n", "[Iter 0058] P: 0.0716 | V: 0.1629 | V_Mean: 0.468 | Win%: 1.50 | FPS: 2443\n", "[Iter 0059] P: 0.0899 | V: 0.1675 | V_Mean: 0.467 | Win%: 1.51 | FPS: 2088\n", "[Iter 0060] P: 0.0715 | V: 0.1681 | V_Mean: 0.470 | Win%: 1.52 | FPS: 2086\n", "[Iter 0061] P: 0.0632 | V: 0.1708 | V_Mean: 0.470 | Win%: 1.52 | FPS: 1988\n", "[Iter 0062] P: 0.0448 | V: 0.1645 | V_Mean: 0.470 | Win%: 1.53 | FPS: 2322\n", "[Iter 0063] P: 0.0616 | V: 0.1659 | V_Mean: 0.470 | Win%: 1.54 | FPS: 2115\n", "[Iter 0064] P: 0.0617 | V: 0.1574 | V_Mean: 0.472 | Win%: 1.55 | FPS: 2031\n", "[Iter 0065] P: 0.0685 | V: 0.1673 | V_Mean: 0.472 | Win%: 1.56 | FPS: 2006\n", "[Iter 0066] P: 0.0879 | V: 0.1718 | V_Mean: 0.478 | Win%: 1.57 | FPS: 2105\n", "[Iter 0067] P: 0.0512 | V: 0.1713 | V_Mean: 0.477 | Win%: 1.58 | FPS: 2080\n", "[Iter 0068] P: 0.0420 | V: 0.1658 | V_Mean: 0.480 | Win%: 1.59 | FPS: 2047\n", "[Iter 0069] P: 0.0491 | V: 0.1746 | V_Mean: 0.477 | Win%: 1.60 | FPS: 2051\n", "[Iter 0070] P: 0.0446 | V: 0.1726 | V_Mean: 0.480 | Win%: 1.61 | FPS: 2110\n", "[Iter 0071] P: 0.0578 | V: 0.1723 | V_Mean: 0.479 | Win%: 1.61 | FPS: 2336\n", "[Iter 0072] P: 
0.0640 | V: 0.1782 | V_Mean: 0.478 | Win%: 1.61 | FPS: 2390\n", "[Iter 0073] P: 0.0538 | V: 0.1642 | V_Mean: 0.478 | Win%: 1.61 | FPS: 2090\n", "[Iter 0074] P: 0.0606 | V: 0.1565 | V_Mean: 0.478 | Win%: 1.61 | FPS: 1965\n", "[Iter 0075] P: 0.0765 | V: 0.1714 | V_Mean: 0.481 | Win%: 1.62 | FPS: 2292\n", "[Iter 0076] P: 0.0741 | V: 0.1734 | V_Mean: 0.480 | Win%: 1.62 | FPS: 2147\n", "[Iter 0077] P: 0.0552 | V: 0.1661 | V_Mean: 0.477 | Win%: 1.63 | FPS: 2432\n", "[Iter 0078] P: 0.0394 | V: 0.1631 | V_Mean: 0.475 | Win%: 1.64 | FPS: 2068\n", "[Iter 0079] P: 0.0580 | V: 0.1743 | V_Mean: 0.477 | Win%: 1.65 | FPS: 1951\n", "[Iter 0080] P: 0.0578 | V: 0.1717 | V_Mean: 0.477 | Win%: 1.65 | FPS: 2240\n", "[Iter 0081] P: 0.0589 | V: 0.1668 | V_Mean: 0.477 | Win%: 1.66 | FPS: 2130\n", "[Iter 0082] P: 0.0610 | V: 0.1791 | V_Mean: 0.479 | Win%: 1.67 | FPS: 2139\n", "[Iter 0083] P: 0.0680 | V: 0.1686 | V_Mean: 0.478 | Win%: 1.67 | FPS: 2225\n", "[Iter 0084] P: 0.0686 | V: 0.1749 | V_Mean: 0.478 | Win%: 1.68 | FPS: 2085\n", "[Iter 0085] P: 0.0647 | V: 0.1701 | V_Mean: 0.479 | Win%: 1.68 | FPS: 2275\n", "[Iter 0086] P: 0.0759 | V: 0.1697 | V_Mean: 0.478 | Win%: 1.68 | FPS: 2202\n", "[Iter 0087] P: 0.0674 | V: 0.1715 | V_Mean: 0.479 | Win%: 1.68 | FPS: 2114\n", "[Iter 0088] P: 0.0643 | V: 0.1571 | V_Mean: 0.478 | Win%: 1.69 | FPS: 2039\n", "[Iter 0089] P: 0.0943 | V: 0.1723 | V_Mean: 0.482 | Win%: 1.70 | FPS: 2065\n", "[Iter 0090] P: 0.0731 | V: 0.1765 | V_Mean: 0.481 | Win%: 1.70 | FPS: 2255\n", "[Iter 0091] P: 0.0513 | V: 0.1742 | V_Mean: 0.481 | Win%: 1.70 | FPS: 2539\n", "[Iter 0092] P: 0.0365 | V: 0.1763 | V_Mean: 0.478 | Win%: 1.71 | FPS: 2235\n", "[Iter 0093] P: 0.0482 | V: 0.1748 | V_Mean: 0.481 | Win%: 1.72 | FPS: 2224\n", "[Iter 0094] P: 0.0473 | V: 0.1725 | V_Mean: 0.483 | Win%: 1.72 | FPS: 2367\n", "[Iter 0095] P: 0.0444 | V: 0.1706 | V_Mean: 0.484 | Win%: 1.73 | FPS: 2155\n", "[Iter 0096] P: 0.0426 | V: 0.1665 | V_Mean: 0.483 | Win%: 1.73 | FPS: 2360\n", "[Iter 0097] P: 
0.0509 | V: 0.1737 | V_Mean: 0.483 | Win%: 1.73 | FPS: 2372\n", "[Iter 0098] P: 0.0545 | V: 0.1708 | V_Mean: 0.482 | Win%: 1.74 | FPS: 2247\n", "[Iter 0099] P: 0.0633 | V: 0.1774 | V_Mean: 0.486 | Win%: 1.75 | FPS: 2227\n", "[Iter 0100] P: 0.0608 | V: 0.1698 | V_Mean: 0.490 | Win%: 1.76 | FPS: 2245\n", "[Iter 0101] P: 0.0511 | V: 0.1672 | V_Mean: 0.488 | Win%: 1.77 | FPS: 2175\n", "[Iter 0102] P: 0.0476 | V: 0.1688 | V_Mean: 0.488 | Win%: 1.77 | FPS: 2186\n", "[Iter 0103] P: 0.0571 | V: 0.1702 | V_Mean: 0.489 | Win%: 1.77 | FPS: 2469\n", "[Iter 0104] P: 0.0621 | V: 0.1689 | V_Mean: 0.488 | Win%: 1.78 | FPS: 2281\n", "[Iter 0105] P: 0.0579 | V: 0.1773 | V_Mean: 0.494 | Win%: 1.79 | FPS: 2339\n", "[Iter 0106] P: 0.0578 | V: 0.1714 | V_Mean: 0.497 | Win%: 1.80 | FPS: 2331\n", "[Iter 0107] P: 0.0861 | V: 0.1658 | V_Mean: 0.496 | Win%: 1.80 | FPS: 2256\n", "[Iter 0108] P: 0.1142 | V: 0.1635 | V_Mean: 0.499 | Win%: 1.83 | FPS: 2172\n", "[Iter 0109] P: 0.1137 | V: 0.1630 | V_Mean: 0.497 | Win%: 1.83 | FPS: 2357\n", "[Iter 0110] P: 0.0807 | V: 0.1648 | V_Mean: 0.500 | Win%: 1.83 | FPS: 2210\n", "[Iter 0111] P: 0.0900 | V: 0.1713 | V_Mean: 0.499 | Win%: 1.83 | FPS: 2445\n", "[Iter 0112] P: 0.0876 | V: 0.1681 | V_Mean: 0.499 | Win%: 1.83 | FPS: 2241\n", "[Iter 0113] P: 0.0534 | V: 0.1629 | V_Mean: 0.499 | Win%: 1.84 | FPS: 2557\n", "[Iter 0114] P: 0.0661 | V: 0.1611 | V_Mean: 0.499 | Win%: 1.85 | FPS: 2234\n", "[Iter 0115] P: 0.0810 | V: 0.1667 | V_Mean: 0.499 | Win%: 1.85 | FPS: 2727\n", "[Iter 0116] P: 0.0606 | V: 0.1712 | V_Mean: 0.499 | Win%: 1.85 | FPS: 2221\n", "[Iter 0117] P: 0.0452 | V: 0.1648 | V_Mean: 0.501 | Win%: 1.86 | FPS: 2225\n", "[Iter 0118] P: 0.0816 | V: 0.1657 | V_Mean: 0.500 | Win%: 1.86 | FPS: 2419\n", "[Iter 0119] P: 0.0517 | V: 0.1674 | V_Mean: 0.499 | Win%: 1.86 | FPS: 2218\n", "[Iter 0120] P: 0.0465 | V: 0.1637 | V_Mean: 0.499 | Win%: 1.86 | FPS: 2466\n", "[Iter 0121] P: 0.0361 | V: 0.1685 | V_Mean: 0.497 | Win%: 1.86 | FPS: 2259\n", "[Iter 0122] P: 
0.0338 | V: 0.1649 | V_Mean: 0.498 | Win%: 1.87 | FPS: 2340\n", "[Iter 0123] P: 0.0402 | V: 0.1639 | V_Mean: 0.497 | Win%: 1.87 | FPS: 2303\n", "[Iter 0124] P: 0.0593 | V: 0.1689 | V_Mean: 0.496 | Win%: 1.87 | FPS: 2293\n", "[Iter 0125] P: 0.0503 | V: 0.1612 | V_Mean: 0.497 | Win%: 1.88 | FPS: 2224\n", "[Iter 0126] P: 0.0727 | V: 0.1661 | V_Mean: 0.498 | Win%: 1.88 | FPS: 2188\n", "[Iter 0127] P: 0.0609 | V: 0.1667 | V_Mean: 0.498 | Win%: 1.88 | FPS: 2232\n", "[Iter 0128] P: 0.0514 | V: 0.1636 | V_Mean: 0.499 | Win%: 1.88 | FPS: 2258\n", "[Iter 0129] P: 0.0461 | V: 0.1640 | V_Mean: 0.500 | Win%: 1.88 | FPS: 2224\n", "[Iter 0130] P: 0.0521 | V: 0.1665 | V_Mean: 0.499 | Win%: 1.89 | FPS: 2604\n", "[Iter 0131] P: 0.0607 | V: 0.1681 | V_Mean: 0.498 | Win%: 1.89 | FPS: 2512\n", "[Iter 0132] P: 0.0426 | V: 0.1688 | V_Mean: 0.498 | Win%: 1.89 | FPS: 2698\n", "[Iter 0133] P: 0.0474 | V: 0.1670 | V_Mean: 0.498 | Win%: 1.89 | FPS: 2245\n", "[Iter 0134] P: 0.0414 | V: 0.1625 | V_Mean: 0.498 | Win%: 1.89 | FPS: 2437\n", "[Iter 0135] P: 0.0504 | V: 0.1660 | V_Mean: 0.498 | Win%: 1.89 | FPS: 2201\n", "[Iter 0136] P: 0.0556 | V: 0.1636 | V_Mean: 0.498 | Win%: 1.89 | FPS: 2375\n", "[Iter 0137] P: 0.0651 | V: 0.1691 | V_Mean: 0.498 | Win%: 1.89 | FPS: 2168\n", "[Iter 0138] P: 0.0537 | V: 0.1710 | V_Mean: 0.498 | Win%: 1.90 | FPS: 2224\n", "[Iter 0139] P: 0.0502 | V: 0.1650 | V_Mean: 0.497 | Win%: 1.90 | FPS: 2606\n", "[Iter 0140] P: 0.0604 | V: 0.1639 | V_Mean: 0.498 | Win%: 1.90 | FPS: 2239\n", "[Iter 0141] P: 0.0615 | V: 0.1655 | V_Mean: 0.498 | Win%: 1.90 | FPS: 2313\n", "[Iter 0142] P: 0.0566 | V: 0.1706 | V_Mean: 0.498 | Win%: 1.90 | FPS: 2516\n", "[Iter 0143] P: 0.0679 | V: 0.1637 | V_Mean: 0.498 | Win%: 1.91 | FPS: 2159\n", "[Iter 0144] P: 0.0552 | V: 0.1654 | V_Mean: 0.497 | Win%: 1.91 | FPS: 2397\n", "[Iter 0145] P: 0.0487 | V: 0.1686 | V_Mean: 0.497 | Win%: 1.91 | FPS: 2432\n", "[Iter 0146] P: 0.0487 | V: 0.1687 | V_Mean: 0.497 | Win%: 1.91 | FPS: 2335\n", "[Iter 0147] P: 
0.0548 | V: 0.1682 | V_Mean: 0.497 | Win%: 1.91 | FPS: 2419\n", "[Iter 0148] P: 0.0605 | V: 0.1667 | V_Mean: 0.497 | Win%: 1.91 | FPS: 2271\n", "[Iter 0149] P: 0.0593 | V: 0.1691 | V_Mean: 0.498 | Win%: 1.91 | FPS: 2431\n", "[Iter 0150] P: 0.0580 | V: 0.1713 | V_Mean: 0.498 | Win%: 1.91 | FPS: 2552\n", "[Iter 0151] P: 0.0485 | V: 0.1698 | V_Mean: 0.497 | Win%: 1.91 | FPS: 2538\n", "[Iter 0152] P: 0.0362 | V: 0.1693 | V_Mean: 0.495 | Win%: 1.91 | FPS: 2334\n", "[Iter 0153] P: 0.0428 | V: 0.1662 | V_Mean: 0.496 | Win%: 1.91 | FPS: 2151\n", "[Iter 0154] P: 0.0438 | V: 0.1682 | V_Mean: 0.497 | Win%: 1.91 | FPS: 2305\n", "[Iter 0155] P: 0.0457 | V: 0.1677 | V_Mean: 0.497 | Win%: 1.91 | FPS: 2439\n", "[Iter 0156] P: 0.0457 | V: 0.1668 | V_Mean: 0.497 | Win%: 1.91 | FPS: 2127\n", "[Iter 0157] P: 0.0358 | V: 0.1689 | V_Mean: 0.496 | Win%: 1.92 | FPS: 2353\n", "[Iter 0158] P: 0.0339 | V: 0.1664 | V_Mean: 0.497 | Win%: 1.92 | FPS: 2720\n", "[Iter 0159] P: 0.0350 | V: 0.1682 | V_Mean: 0.497 | Win%: 1.92 | FPS: 2331\n", "[Iter 0160] P: 0.0379 | V: 0.1616 | V_Mean: 0.496 | Win%: 1.93 | FPS: 2605\n", "[Iter 0161] P: 0.0537 | V: 0.1641 | V_Mean: 0.500 | Win%: 1.93 | FPS: 2300\n", "[Iter 0162] P: 0.0511 | V: 0.1668 | V_Mean: 0.497 | Win%: 1.94 | FPS: 2282\n", "[Iter 0163] P: 0.0415 | V: 0.1675 | V_Mean: 0.500 | Win%: 1.94 | FPS: 2427\n", "[Iter 0164] P: 0.0469 | V: 0.1664 | V_Mean: 0.498 | Win%: 1.94 | FPS: 2095\n", "[Iter 0165] P: 0.0496 | V: 0.1624 | V_Mean: 0.500 | Win%: 1.95 | FPS: 2101\n", "[Iter 0166] P: 0.0485 | V: 0.1632 | V_Mean: 0.500 | Win%: 1.95 | FPS: 2380\n", "[Iter 0167] P: 0.0492 | V: 0.1597 | V_Mean: 0.501 | Win%: 1.95 | FPS: 2481\n", "[Iter 0168] P: 0.0512 | V: 0.1655 | V_Mean: 0.501 | Win%: 1.95 | FPS: 2142\n", "[Iter 0169] P: 0.0517 | V: 0.1696 | V_Mean: 0.500 | Win%: 1.96 | FPS: 2139\n", "[Iter 0170] P: 0.0646 | V: 0.1651 | V_Mean: 0.502 | Win%: 1.96 | FPS: 2272\n", "[Iter 0171] P: 0.0593 | V: 0.1642 | V_Mean: 0.500 | Win%: 1.96 | FPS: 2252\n", "[Iter 0172] P: 
0.0491 | V: 0.1655 | V_Mean: 0.501 | Win%: 1.96 | FPS: 2328\n", "[Iter 0173] P: 0.0564 | V: 0.1694 | V_Mean: 0.502 | Win%: 1.97 | FPS: 2415\n", "[Iter 0174] P: 0.0431 | V: 0.1697 | V_Mean: 0.503 | Win%: 1.97 | FPS: 2516\n", "[Iter 0175] P: 0.0459 | V: 0.1662 | V_Mean: 0.503 | Win%: 1.98 | FPS: 2152\n", "[Iter 0176] P: 0.0465 | V: 0.1701 | V_Mean: 0.503 | Win%: 1.98 | FPS: 2366\n", "[Iter 0177] P: 0.0388 | V: 0.1690 | V_Mean: 0.504 | Win%: 1.98 | FPS: 2094\n", "[Iter 0178] P: 0.0399 | V: 0.1688 | V_Mean: 0.504 | Win%: 1.98 | FPS: 2033\n", "[Iter 0179] P: 0.0398 | V: 0.1637 | V_Mean: 0.504 | Win%: 1.98 | FPS: 2476\n", "[Iter 0180] P: 0.0482 | V: 0.1659 | V_Mean: 0.504 | Win%: 1.98 | FPS: 2205\n", "[Iter 0181] P: 0.0512 | V: 0.1648 | V_Mean: 0.504 | Win%: 1.98 | FPS: 2168\n", "[Iter 0182] P: 0.0489 | V: 0.1654 | V_Mean: 0.503 | Win%: 1.98 | FPS: 2260\n", "[Iter 0183] P: 0.0531 | V: 0.1659 | V_Mean: 0.503 | Win%: 1.98 | FPS: 2310\n", "[Iter 0184] P: 0.0559 | V: 0.1648 | V_Mean: 0.503 | Win%: 1.98 | FPS: 2237\n", "[Iter 0185] P: 0.0560 | V: 0.1664 | V_Mean: 0.503 | Win%: 1.98 | FPS: 2352\n", "[Iter 0186] P: 0.0522 | V: 0.1632 | V_Mean: 0.500 | Win%: 1.98 | FPS: 2493\n", "[Iter 0187] P: 0.0604 | V: 0.1573 | V_Mean: 0.499 | Win%: 1.98 | FPS: 2361\n", "[Iter 0188] P: 0.0620 | V: 0.1679 | V_Mean: 0.500 | Win%: 1.98 | FPS: 2485\n", "[Iter 0189] P: 0.0647 | V: 0.1701 | V_Mean: 0.500 | Win%: 1.98 | FPS: 2592\n", "[Iter 0190] P: 0.0750 | V: 0.1661 | V_Mean: 0.500 | Win%: 1.98 | FPS: 2509\n", "[Iter 0191] P: 0.0400 | V: 0.1690 | V_Mean: 0.497 | Win%: 1.98 | FPS: 2622\n", "[Iter 0192] P: 0.0485 | V: 0.1666 | V_Mean: 0.496 | Win%: 1.98 | FPS: 2535\n", "[Iter 0193] P: 0.0493 | V: 0.1630 | V_Mean: 0.493 | Win%: 1.98 | FPS: 2315\n", "[Iter 0194] P: 0.0504 | V: 0.1735 | V_Mean: 0.494 | Win%: 1.99 | FPS: 2160\n", "[Iter 0195] P: 0.0430 | V: 0.1697 | V_Mean: 0.494 | Win%: 1.99 | FPS: 2452\n", "[Iter 0196] P: 0.0475 | V: 0.1669 | V_Mean: 0.494 | Win%: 1.99 | FPS: 2444\n", "[Iter 0197] P: 
0.0419 | V: 0.1676 | V_Mean: 0.493 | Win%: 1.99 | FPS: 2381\n", "[Iter 0198] P: 0.0531 | V: 0.1704 | V_Mean: 0.491 | Win%: 1.99 | FPS: 2508\n", "[Iter 0199] P: 0.0528 | V: 0.1656 | V_Mean: 0.492 | Win%: 1.99 | FPS: 2491\n", "[Iter 0200] P: 0.0544 | V: 0.1692 | V_Mean: 0.487 | Win%: 1.98 | FPS: 2339\n", "[Iter 0201] P: 0.0408 | V: 0.1654 | V_Mean: 0.486 | Win%: 1.98 | FPS: 2248\n", "[Iter 0202] P: 0.0523 | V: 0.1702 | V_Mean: 0.483 | Win%: 1.98 | FPS: 2630\n", "[Iter 0203] P: 0.0488 | V: 0.1670 | V_Mean: 0.483 | Win%: 1.99 | FPS: 2508\n", "[Iter 0204] P: 0.0622 | V: 0.1659 | V_Mean: 0.484 | Win%: 1.99 | FPS: 2279\n", "[Iter 0205] P: 0.0500 | V: 0.1731 | V_Mean: 0.482 | Win%: 2.00 | FPS: 2101\n", "[Iter 0206] P: 0.0509 | V: 0.1725 | V_Mean: 0.479 | Win%: 2.00 | FPS: 2388\n", "[Iter 0207] P: 0.0625 | V: 0.1716 | V_Mean: 0.478 | Win%: 2.00 | FPS: 2379\n", "[Iter 0208] P: 0.0378 | V: 0.1693 | V_Mean: 0.478 | Win%: 2.00 | FPS: 2288\n", "[Iter 0209] P: 0.0458 | V: 0.1698 | V_Mean: 0.476 | Win%: 2.00 | FPS: 2188\n", "[Iter 0210] P: 0.0488 | V: 0.1703 | V_Mean: 0.477 | Win%: 2.00 | FPS: 2386\n", "[Iter 0211] P: 0.0444 | V: 0.1687 | V_Mean: 0.478 | Win%: 2.01 | FPS: 2181\n", "[Iter 0212] P: 0.0515 | V: 0.1736 | V_Mean: 0.475 | Win%: 2.01 | FPS: 2263\n", "[Iter 0213] P: 0.0325 | V: 0.1738 | V_Mean: 0.475 | Win%: 2.01 | FPS: 2073\n", "[Iter 0214] P: 0.0371 | V: 0.1741 | V_Mean: 0.474 | Win%: 2.01 | FPS: 2260\n", "[Iter 0215] P: 0.0412 | V: 0.1751 | V_Mean: 0.474 | Win%: 2.02 | FPS: 2143\n", "[Iter 0216] P: 0.0332 | V: 0.1681 | V_Mean: 0.473 | Win%: 2.02 | FPS: 2475\n", "[Iter 0217] P: 0.0377 | V: 0.1737 | V_Mean: 0.473 | Win%: 2.02 | FPS: 2132\n", "[Iter 0218] P: 0.0345 | V: 0.1678 | V_Mean: 0.474 | Win%: 2.02 | FPS: 2104\n", "[Iter 0219] P: 0.0359 | V: 0.1744 | V_Mean: 0.473 | Win%: 2.02 | FPS: 2268\n", "[Iter 0220] P: 0.0391 | V: 0.1734 | V_Mean: 0.473 | Win%: 2.02 | FPS: 2253\n", "[Iter 0221] P: 0.0335 | V: 0.1713 | V_Mean: 0.473 | Win%: 2.02 | FPS: 2471\n", "[Iter 0222] P: 
0.0329 | V: 0.1756 | V_Mean: 0.474 | Win%: 2.02 | FPS: 2492\n", "[Iter 0223] P: 0.0274 | V: 0.1726 | V_Mean: 0.473 | Win%: 2.02 | FPS: 2137\n", "[Iter 0224] P: 0.0386 | V: 0.1726 | V_Mean: 0.475 | Win%: 2.03 | FPS: 2184\n", "[Iter 0225] P: 0.0346 | V: 0.1725 | V_Mean: 0.475 | Win%: 2.03 | FPS: 2334\n", "[Iter 0226] P: 0.0371 | V: 0.1691 | V_Mean: 0.473 | Win%: 2.03 | FPS: 2276\n", "[Iter 0227] P: 0.0410 | V: 0.1691 | V_Mean: 0.475 | Win%: 2.03 | FPS: 2081\n", "[Iter 0228] P: 0.0475 | V: 0.1725 | V_Mean: 0.475 | Win%: 2.04 | FPS: 2343\n", "[Iter 0229] P: 0.0375 | V: 0.1707 | V_Mean: 0.475 | Win%: 2.04 | FPS: 2152\n", "[Iter 0230] P: 0.0363 | V: 0.1705 | V_Mean: 0.476 | Win%: 2.04 | FPS: 2193\n", "[Iter 0231] P: 0.0507 | V: 0.1720 | V_Mean: 0.476 | Win%: 2.05 | FPS: 2221\n", "[Iter 0232] P: 0.0492 | V: 0.1735 | V_Mean: 0.474 | Win%: 2.05 | FPS: 2318\n", "[Iter 0233] P: 0.0535 | V: 0.1700 | V_Mean: 0.475 | Win%: 2.05 | FPS: 2106\n", "[Iter 0234] P: 0.0442 | V: 0.1718 | V_Mean: 0.475 | Win%: 2.05 | FPS: 2198\n", "[Iter 0235] P: 0.0493 | V: 0.1693 | V_Mean: 0.473 | Win%: 2.06 | FPS: 2151\n", "[Iter 0236] P: 0.0400 | V: 0.1656 | V_Mean: 0.470 | Win%: 2.06 | FPS: 2383\n", "[Iter 0237] P: 0.0457 | V: 0.1741 | V_Mean: 0.466 | Win%: 2.06 | FPS: 2054\n", "[Iter 0238] P: 0.0500 | V: 0.1722 | V_Mean: 0.466 | Win%: 2.06 | FPS: 2295\n", "[Iter 0239] P: 0.0466 | V: 0.1729 | V_Mean: 0.468 | Win%: 2.06 | FPS: 2150\n", "[Iter 0240] P: 0.0828 | V: 0.1663 | V_Mean: 0.468 | Win%: 2.06 | FPS: 2116\n", "[Iter 0241] P: 0.0701 | V: 0.1744 | V_Mean: 0.466 | Win%: 2.06 | FPS: 2566\n", "[Iter 0242] P: 0.0508 | V: 0.1716 | V_Mean: 0.466 | Win%: 2.07 | FPS: 2625\n", "[Iter 0243] P: 0.0377 | V: 0.1723 | V_Mean: 0.465 | Win%: 2.07 | FPS: 2311\n", "[Iter 0244] P: 0.0443 | V: 0.1759 | V_Mean: 0.465 | Win%: 2.08 | FPS: 2439\n", "[Iter 0245] P: 0.0397 | V: 0.1718 | V_Mean: 0.465 | Win%: 2.08 | FPS: 2351\n", "[Iter 0246] P: 0.0455 | V: 0.1712 | V_Mean: 0.464 | Win%: 2.08 | FPS: 2172\n", "[Iter 0247] P: 
0.0375 | V: 0.1721 | V_Mean: 0.464 | Win%: 2.08 | FPS: 2415\n", "[Iter 0248] P: 0.0430 | V: 0.1745 | V_Mean: 0.464 | Win%: 2.08 | FPS: 2515\n", "[Iter 0249] P: 0.0337 | V: 0.1700 | V_Mean: 0.463 | Win%: 2.08 | FPS: 2481\n", "[Iter 0250] P: 0.0450 | V: 0.1704 | V_Mean: 0.464 | Win%: 2.08 | FPS: 2560\n", "[Iter 0251] P: 0.0355 | V: 0.1723 | V_Mean: 0.463 | Win%: 2.08 | FPS: 2640\n", "[Iter 0252] P: 0.0452 | V: 0.1758 | V_Mean: 0.464 | Win%: 2.09 | FPS: 2392\n", "[Iter 0253] P: 0.0482 | V: 0.1732 | V_Mean: 0.464 | Win%: 2.09 | FPS: 2594\n", "[Iter 0254] P: 0.0489 | V: 0.1698 | V_Mean: 0.463 | Win%: 2.09 | FPS: 2344\n", "[Iter 0255] P: 0.0577 | V: 0.1708 | V_Mean: 0.463 | Win%: 2.09 | FPS: 2613\n", "[Iter 0256] P: 0.0716 | V: 0.1731 | V_Mean: 0.465 | Win%: 2.10 | FPS: 2600\n", "[Iter 0257] P: 0.0859 | V: 0.1739 | V_Mean: 0.463 | Win%: 2.10 | FPS: 2197\n", "[Iter 0258] P: 0.0775 | V: 0.1734 | V_Mean: 0.458 | Win%: 2.10 | FPS: 2355\n", "[Iter 0259] P: 0.0393 | V: 0.1703 | V_Mean: 0.455 | Win%: 2.10 | FPS: 2242\n", "[Iter 0260] P: 0.0517 | V: 0.1732 | V_Mean: 0.455 | Win%: 2.10 | FPS: 2303\n", "[Iter 0261] P: 0.0450 | V: 0.1757 | V_Mean: 0.456 | Win%: 2.10 | FPS: 2321\n", "[Iter 0262] P: 0.0403 | V: 0.1773 | V_Mean: 0.458 | Win%: 2.11 | FPS: 2396\n", "[Iter 0263] P: 0.0342 | V: 0.1722 | V_Mean: 0.456 | Win%: 2.11 | FPS: 2206\n", "[Iter 0264] P: 0.0344 | V: 0.1709 | V_Mean: 0.458 | Win%: 2.11 | FPS: 2141\n", "[Iter 0265] P: 0.0364 | V: 0.1715 | V_Mean: 0.458 | Win%: 2.11 | FPS: 2118\n", "[Iter 0266] P: 0.0360 | V: 0.1766 | V_Mean: 0.455 | Win%: 2.12 | FPS: 2025\n", "[Iter 0267] P: 0.0403 | V: 0.1753 | V_Mean: 0.453 | Win%: 2.11 | FPS: 2341\n", "[Iter 0268] P: 0.0374 | V: 0.1743 | V_Mean: 0.454 | Win%: 2.11 | FPS: 2190\n", "[Iter 0269] P: 0.0391 | V: 0.1721 | V_Mean: 0.453 | Win%: 2.12 | FPS: 2464\n", "[Iter 0270] P: 0.0413 | V: 0.1736 | V_Mean: 0.454 | Win%: 2.12 | FPS: 2513\n", "[Iter 0271] P: 0.0429 | V: 0.1729 | V_Mean: 0.453 | Win%: 2.12 | FPS: 2523\n", "[Iter 0272] P: 
0.0306 | V: 0.1710 | V_Mean: 0.453 | Win%: 2.12 | FPS: 2507\n", "[Iter 0273] P: 0.0322 | V: 0.1725 | V_Mean: 0.452 | Win%: 2.11 | FPS: 2139\n", "[Iter 0274] P: 0.0350 | V: 0.1718 | V_Mean: 0.451 | Win%: 2.12 | FPS: 2295\n", "[Iter 0275] P: 0.0336 | V: 0.1778 | V_Mean: 0.452 | Win%: 2.12 | FPS: 2285\n", "[Iter 0276] P: 0.0261 | V: 0.1742 | V_Mean: 0.452 | Win%: 2.12 | FPS: 2293\n", "[Iter 0277] P: 0.0317 | V: 0.1702 | V_Mean: 0.451 | Win%: 2.12 | FPS: 2189\n", "[Iter 0278] P: 0.0355 | V: 0.1707 | V_Mean: 0.451 | Win%: 2.12 | FPS: 2395\n", "[Iter 0279] P: 0.0430 | V: 0.1722 | V_Mean: 0.451 | Win%: 2.12 | FPS: 2457\n", "[Iter 0280] P: 0.0379 | V: 0.1753 | V_Mean: 0.452 | Win%: 2.12 | FPS: 2507\n", "[Iter 0281] P: 0.0345 | V: 0.1744 | V_Mean: 0.450 | Win%: 2.12 | FPS: 2514\n", "[Iter 0282] P: 0.0319 | V: 0.1716 | V_Mean: 0.450 | Win%: 2.13 | FPS: 2459\n", "[Iter 0283] P: 0.0380 | V: 0.1723 | V_Mean: 0.450 | Win%: 2.12 | FPS: 2290\n", "[Iter 0284] P: 0.0280 | V: 0.1736 | V_Mean: 0.451 | Win%: 2.13 | FPS: 2228\n", "[Iter 0285] P: 0.0347 | V: 0.1722 | V_Mean: 0.450 | Win%: 2.13 | FPS: 2294\n", "[Iter 0286] P: 0.0396 | V: 0.1751 | V_Mean: 0.448 | Win%: 2.13 | FPS: 2055\n", "[Iter 0287] P: 0.0375 | V: 0.1724 | V_Mean: 0.449 | Win%: 2.14 | FPS: 2197\n", "[Iter 0288] P: 0.0387 | V: 0.1751 | V_Mean: 0.448 | Win%: 2.14 | FPS: 2402\n", "[Iter 0289] P: 0.0370 | V: 0.1718 | V_Mean: 0.446 | Win%: 2.14 | FPS: 2176\n", "[Iter 0290] P: 0.0339 | V: 0.1711 | V_Mean: 0.445 | Win%: 2.14 | FPS: 2219\n", "[Iter 0291] P: 0.0424 | V: 0.1735 | V_Mean: 0.446 | Win%: 2.14 | FPS: 2274\n", "[Iter 0292] P: 0.0480 | V: 0.1786 | V_Mean: 0.444 | Win%: 2.14 | FPS: 2330\n", "[Iter 0293] P: 0.0350 | V: 0.1732 | V_Mean: 0.444 | Win%: 2.14 | FPS: 2424\n", "[Iter 0294] P: 0.0462 | V: 0.1757 | V_Mean: 0.444 | Win%: 2.14 | FPS: 2499\n", "[Iter 0295] P: 0.0344 | V: 0.1740 | V_Mean: 0.442 | Win%: 2.14 | FPS: 2464\n", "[Iter 0296] P: 0.0283 | V: 0.1744 | V_Mean: 0.441 | Win%: 2.14 | FPS: 2472\n", "[Iter 0297] P: 
0.0349 | V: 0.1795 | V_Mean: 0.441 | Win%: 2.14 | FPS: 2381\n", "[Iter 0298] P: 0.0284 | V: 0.1749 | V_Mean: 0.441 | Win%: 2.14 | FPS: 2177\n", "[Iter 0299] P: 0.0449 | V: 0.1807 | V_Mean: 0.441 | Win%: 2.14 | FPS: 2082\n", "[Iter 0300] P: 0.0378 | V: 0.1747 | V_Mean: 0.442 | Win%: 2.14 | FPS: 2293\n", "[Iter 0301] P: 0.0364 | V: 0.1747 | V_Mean: 0.442 | Win%: 2.14 | FPS: 2414\n", "[Iter 0302] P: 0.0371 | V: 0.1780 | V_Mean: 0.440 | Win%: 2.14 | FPS: 2398\n", "[Iter 0303] P: 0.0292 | V: 0.1772 | V_Mean: 0.439 | Win%: 2.14 | FPS: 2453\n", "[Iter 0304] P: 0.0383 | V: 0.1757 | V_Mean: 0.438 | Win%: 2.14 | FPS: 2481\n", "[Iter 0305] P: 0.0383 | V: 0.1746 | V_Mean: 0.439 | Win%: 2.14 | FPS: 2475\n", "[Iter 0306] P: 0.0400 | V: 0.1749 | V_Mean: 0.440 | Win%: 2.15 | FPS: 2495\n", "[Iter 0307] P: 0.0335 | V: 0.1744 | V_Mean: 0.442 | Win%: 2.15 | FPS: 2205\n", "[Iter 0308] P: 0.0336 | V: 0.1759 | V_Mean: 0.442 | Win%: 2.15 | FPS: 2274\n", "[Iter 0309] P: 0.0341 | V: 0.1747 | V_Mean: 0.441 | Win%: 2.15 | FPS: 2270\n", "[Iter 0310] P: 0.0299 | V: 0.1742 | V_Mean: 0.441 | Win%: 2.16 | FPS: 2282\n", "[Iter 0311] P: 0.0338 | V: 0.1747 | V_Mean: 0.439 | Win%: 2.16 | FPS: 2297\n", "[Iter 0312] P: 0.0371 | V: 0.1748 | V_Mean: 0.439 | Win%: 2.16 | FPS: 2495\n", "[Iter 0313] P: 0.0420 | V: 0.1806 | V_Mean: 0.438 | Win%: 2.17 | FPS: 2493\n", "[Iter 0314] P: 0.0310 | V: 0.1796 | V_Mean: 0.440 | Win%: 2.17 | FPS: 2238\n", "[Iter 0315] P: 0.0297 | V: 0.1764 | V_Mean: 0.435 | Win%: 2.16 | FPS: 2515\n", "[Iter 0316] P: 0.0363 | V: 0.1738 | V_Mean: 0.434 | Win%: 2.16 | FPS: 2497\n", "[Iter 0317] P: 0.0382 | V: 0.1757 | V_Mean: 0.432 | Win%: 2.16 | FPS: 2239\n", "[Iter 0318] P: 0.0354 | V: 0.1749 | V_Mean: 0.433 | Win%: 2.16 | FPS: 2109\n", "[Iter 0319] P: 0.0410 | V: 0.1776 | V_Mean: 0.433 | Win%: 2.17 | FPS: 2330\n", "[Iter 0320] P: 0.0379 | V: 0.1778 | V_Mean: 0.432 | Win%: 2.17 | FPS: 2341\n", "[Iter 0321] P: 0.0381 | V: 0.1751 | V_Mean: 0.433 | Win%: 2.17 | FPS: 2496\n", "[Iter 0322] P: 
0.0396 | V: 0.1751 | V_Mean: 0.432 | Win%: 2.17 | FPS: 2449\n", "[Iter 0323] P: 0.0347 | V: 0.1687 | V_Mean: 0.432 | Win%: 2.17 | FPS: 2540\n", "[Iter 0324] P: 0.0437 | V: 0.1780 | V_Mean: 0.432 | Win%: 2.17 | FPS: 2433\n", "[Iter 0325] P: 0.0379 | V: 0.1763 | V_Mean: 0.431 | Win%: 2.18 | FPS: 2164\n", "[Iter 0326] P: 0.0337 | V: 0.1768 | V_Mean: 0.428 | Win%: 2.18 | FPS: 2481\n", "[Iter 0327] P: 0.0304 | V: 0.1775 | V_Mean: 0.428 | Win%: 2.18 | FPS: 2522\n", "[Iter 0328] P: 0.0280 | V: 0.1750 | V_Mean: 0.427 | Win%: 2.18 | FPS: 2077\n", "[Iter 0329] P: 0.0395 | V: 0.1775 | V_Mean: 0.427 | Win%: 2.18 | FPS: 2301\n", "[Iter 0330] P: 0.0323 | V: 0.1779 | V_Mean: 0.428 | Win%: 2.18 | FPS: 2283\n", "[Iter 0331] P: 0.0279 | V: 0.1798 | V_Mean: 0.427 | Win%: 2.18 | FPS: 2380\n", "[Iter 0332] P: 0.0277 | V: 0.1748 | V_Mean: 0.427 | Win%: 2.18 | FPS: 2445\n", "[Iter 0333] P: 0.0438 | V: 0.1756 | V_Mean: 0.429 | Win%: 2.19 | FPS: 2543\n", "[Iter 0334] P: 0.0382 | V: 0.1749 | V_Mean: 0.429 | Win%: 2.19 | FPS: 2490\n", "[Iter 0335] P: 0.0357 | V: 0.1755 | V_Mean: 0.427 | Win%: 2.19 | FPS: 2293\n", "[Iter 0336] P: 0.0392 | V: 0.1779 | V_Mean: 0.427 | Win%: 2.19 | FPS: 2563\n", "[Iter 0337] P: 0.0316 | V: 0.1753 | V_Mean: 0.427 | Win%: 2.19 | FPS: 2317\n", "[Iter 0338] P: 0.0354 | V: 0.1797 | V_Mean: 0.428 | Win%: 2.19 | FPS: 2351\n", "[Iter 0339] P: 0.0276 | V: 0.1794 | V_Mean: 0.427 | Win%: 2.19 | FPS: 2294\n", "[Iter 0340] P: 0.0247 | V: 0.1769 | V_Mean: 0.428 | Win%: 2.19 | FPS: 2097\n", "[Iter 0341] P: 0.0297 | V: 0.1797 | V_Mean: 0.427 | Win%: 2.19 | FPS: 2342\n", "[Iter 0342] P: 0.0339 | V: 0.1764 | V_Mean: 0.428 | Win%: 2.19 | FPS: 2207\n", "[Iter 0343] P: 0.0316 | V: 0.1765 | V_Mean: 0.427 | Win%: 2.20 | FPS: 2140\n", "[Iter 0344] P: 0.0368 | V: 0.1769 | V_Mean: 0.427 | Win%: 2.20 | FPS: 2431\n", "[Iter 0345] P: 0.0296 | V: 0.1757 | V_Mean: 0.427 | Win%: 2.20 | FPS: 2298\n", "[Iter 0346] P: 0.0337 | V: 0.1746 | V_Mean: 0.428 | Win%: 2.20 | FPS: 2074\n", "[Iter 0347] P: 
0.0329 | V: 0.1777 | V_Mean: 0.428 | Win%: 2.20 | FPS: 2251\n", "[Iter 0348] P: 0.0362 | V: 0.1747 | V_Mean: 0.427 | Win%: 2.20 | FPS: 2364\n", "[Iter 0349] P: 0.0305 | V: 0.1740 | V_Mean: 0.427 | Win%: 2.20 | FPS: 2420\n", "[Iter 0350] P: 0.0322 | V: 0.1749 | V_Mean: 0.427 | Win%: 2.20 | FPS: 2473\n", "[Iter 0351] P: 0.0302 | V: 0.1737 | V_Mean: 0.423 | Win%: 2.20 | FPS: 2384\n", "[Iter 0352] P: 0.0372 | V: 0.1750 | V_Mean: 0.422 | Win%: 2.20 | FPS: 2128\n", "[Iter 0353] P: 0.0383 | V: 0.1791 | V_Mean: 0.427 | Win%: 2.20 | FPS: 2049\n", "[Iter 0354] P: 0.0295 | V: 0.1757 | V_Mean: 0.425 | Win%: 2.20 | FPS: 2288\n", "[Iter 0355] P: 0.0360 | V: 0.1760 | V_Mean: 0.428 | Win%: 2.20 | FPS: 2342\n", "[Iter 0356] P: 0.0340 | V: 0.1748 | V_Mean: 0.426 | Win%: 2.20 | FPS: 2420\n", "[Iter 0357] P: 0.0309 | V: 0.1753 | V_Mean: 0.425 | Win%: 2.20 | FPS: 2173\n", "[Iter 0358] P: 0.0360 | V: 0.1740 | V_Mean: 0.424 | Win%: 2.20 | FPS: 2468\n", "[Iter 0359] P: 0.0402 | V: 0.1717 | V_Mean: 0.424 | Win%: 2.21 | FPS: 2400\n", "[Iter 0360] P: 0.0391 | V: 0.1729 | V_Mean: 0.422 | Win%: 2.21 | FPS: 2234\n", "[Iter 0361] P: 0.0432 | V: 0.1775 | V_Mean: 0.422 | Win%: 2.21 | FPS: 2303\n", "[Iter 0362] P: 0.0374 | V: 0.1773 | V_Mean: 0.422 | Win%: 2.21 | FPS: 2297\n", "[Iter 0363] P: 0.0359 | V: 0.1731 | V_Mean: 0.426 | Win%: 2.22 | FPS: 2122\n", "[Iter 0364] P: 0.0344 | V: 0.1762 | V_Mean: 0.425 | Win%: 2.22 | FPS: 2473\n", "[Iter 0365] P: 0.0350 | V: 0.1752 | V_Mean: 0.425 | Win%: 2.22 | FPS: 2501\n", "[Iter 0366] P: 0.0266 | V: 0.1742 | V_Mean: 0.425 | Win%: 2.22 | FPS: 2182\n", "[Iter 0367] P: 0.0420 | V: 0.1772 | V_Mean: 0.425 | Win%: 2.22 | FPS: 2217\n", "[Iter 0368] P: 0.0341 | V: 0.1784 | V_Mean: 0.425 | Win%: 2.22 | FPS: 2093\n", "[Iter 0369] P: 0.0394 | V: 0.1749 | V_Mean: 0.423 | Win%: 2.22 | FPS: 2322\n", "[Iter 0370] P: 0.0351 | V: 0.1777 | V_Mean: 0.423 | Win%: 2.22 | FPS: 2153\n", "[Iter 0371] P: 0.0318 | V: 0.1781 | V_Mean: 0.422 | Win%: 2.22 | FPS: 2453\n", "[Iter 0372] P: 
0.0343 | V: 0.1742 | V_Mean: 0.421 | Win%: 2.22 | FPS: 2468\n", "[Iter 0373] P: 0.0380 | V: 0.1740 | V_Mean: 0.421 | Win%: 2.22 | FPS: 2493\n", "[Iter 0374] P: 0.0346 | V: 0.1773 | V_Mean: 0.420 | Win%: 2.22 | FPS: 2504\n", "[Iter 0375] P: 0.0328 | V: 0.1743 | V_Mean: 0.421 | Win%: 2.22 | FPS: 2500\n", "[Iter 0376] P: 0.0380 | V: 0.1748 | V_Mean: 0.421 | Win%: 2.23 | FPS: 2253\n", "[Iter 0377] P: 0.0346 | V: 0.1737 | V_Mean: 0.420 | Win%: 2.23 | FPS: 2289\n", "[Iter 0378] P: 0.0408 | V: 0.1767 | V_Mean: 0.420 | Win%: 2.23 | FPS: 2098\n", "[Iter 0379] P: 0.0329 | V: 0.1796 | V_Mean: 0.420 | Win%: 2.23 | FPS: 2357\n", "[Iter 0380] P: 0.0329 | V: 0.1786 | V_Mean: 0.423 | Win%: 2.24 | FPS: 2409\n", "[Iter 0381] P: 0.0227 | V: 0.1782 | V_Mean: 0.422 | Win%: 2.24 | FPS: 2220\n", "[Iter 0382] P: 0.0274 | V: 0.1759 | V_Mean: 0.422 | Win%: 2.24 | FPS: 2577\n", "[Iter 0383] P: 0.0235 | V: 0.1728 | V_Mean: 0.422 | Win%: 2.24 | FPS: 2501\n", "[Iter 0384] P: 0.0301 | V: 0.1736 | V_Mean: 0.418 | Win%: 2.24 | FPS: 2200\n", "[Iter 0385] P: 0.0326 | V: 0.1743 | V_Mean: 0.417 | Win%: 2.24 | FPS: 2101\n", "[Iter 0386] P: 0.0364 | V: 0.1791 | V_Mean: 0.415 | Win%: 2.24 | FPS: 2252\n", "[Iter 0387] P: 0.0354 | V: 0.1741 | V_Mean: 0.415 | Win%: 2.24 | FPS: 2149\n", "[Iter 0388] P: 0.0434 | V: 0.1810 | V_Mean: 0.412 | Win%: 2.24 | FPS: 2468\n", "[Iter 0389] P: 0.0339 | V: 0.1780 | V_Mean: 0.410 | Win%: 2.25 | FPS: 2449\n", "[Iter 0390] P: 0.0341 | V: 0.1794 | V_Mean: 0.410 | Win%: 2.25 | FPS: 2513\n", "[Iter 0391] P: 0.0359 | V: 0.1774 | V_Mean: 0.410 | Win%: 2.25 | FPS: 2471\n", "[Iter 0392] P: 0.0312 | V: 0.1765 | V_Mean: 0.411 | Win%: 2.25 | FPS: 2200\n", "[Iter 0393] P: 0.0420 | V: 0.1796 | V_Mean: 0.410 | Win%: 2.25 | FPS: 2306\n", "[Iter 0394] P: 0.0350 | V: 0.1772 | V_Mean: 0.409 | Win%: 2.25 | FPS: 2279\n", "[Iter 0395] P: 0.0394 | V: 0.1758 | V_Mean: 0.408 | Win%: 2.25 | FPS: 2288\n", "[Iter 0396] P: 0.0358 | V: 0.1761 | V_Mean: 0.409 | Win%: 2.25 | FPS: 2148\n", "[Iter 0397] P: 
0.0387 | V: 0.1767 | V_Mean: 0.408 | Win%: 2.25 | FPS: 2518\n", "[Iter 0398] P: 0.0366 | V: 0.1789 | V_Mean: 0.406 | Win%: 2.25 | FPS: 2506\n", "[Iter 0399] P: 0.0298 | V: 0.1768 | V_Mean: 0.406 | Win%: 2.25 | FPS: 2492\n", "[Iter 0400] P: 0.0334 | V: 0.1802 | V_Mean: 0.405 | Win%: 2.25 | FPS: 2453\n", "[Iter 0401] P: 0.0360 | V: 0.1819 | V_Mean: 0.407 | Win%: 2.25 | FPS: 2445\n", "[Iter 0402] P: 0.0268 | V: 0.1782 | V_Mean: 0.404 | Win%: 2.26 | FPS: 2376\n", "[Iter 0403] P: 0.0346 | V: 0.1767 | V_Mean: 0.405 | Win%: 2.26 | FPS: 2288\n", "[Iter 0404] P: 0.0288 | V: 0.1764 | V_Mean: 0.405 | Win%: 2.26 | FPS: 2293\n", "[Iter 0405] P: 0.0315 | V: 0.1762 | V_Mean: 0.403 | Win%: 2.27 | FPS: 2089\n", "[Iter 0406] P: 0.0333 | V: 0.1793 | V_Mean: 0.404 | Win%: 2.27 | FPS: 2438\n", "[Iter 0407] P: 0.0412 | V: 0.1766 | V_Mean: 0.405 | Win%: 2.27 | FPS: 2565\n", "[Iter 0408] P: 0.0402 | V: 0.1771 | V_Mean: 0.405 | Win%: 2.27 | FPS: 2479\n", "[Iter 0409] P: 0.0382 | V: 0.1806 | V_Mean: 0.403 | Win%: 2.27 | FPS: 2485\n", "[Iter 0410] P: 0.0313 | V: 0.1738 | V_Mean: 0.403 | Win%: 2.27 | FPS: 2490\n", "[Iter 0411] P: 0.0420 | V: 0.1772 | V_Mean: 0.403 | Win%: 2.27 | FPS: 2505\n", "[Iter 0412] P: 0.0344 | V: 0.1778 | V_Mean: 0.403 | Win%: 2.27 | FPS: 2481\n", "[Iter 0413] P: 0.0332 | V: 0.1799 | V_Mean: 0.400 | Win%: 2.27 | FPS: 2451\n", "[Iter 0414] P: 0.0301 | V: 0.1745 | V_Mean: 0.401 | Win%: 2.27 | FPS: 2275\n", "[Iter 0415] P: 0.0391 | V: 0.1759 | V_Mean: 0.400 | Win%: 2.27 | FPS: 2283\n", "[Iter 0416] P: 0.0315 | V: 0.1749 | V_Mean: 0.401 | Win%: 2.28 | FPS: 2272\n", "[Iter 0417] P: 0.0313 | V: 0.1737 | V_Mean: 0.401 | Win%: 2.28 | FPS: 2267\n", "[Iter 0418] P: 0.0383 | V: 0.1757 | V_Mean: 0.400 | Win%: 2.29 | FPS: 2212\n", "[Iter 0419] P: 0.0486 | V: 0.1764 | V_Mean: 0.400 | Win%: 2.29 | FPS: 2568\n", "[Iter 0420] P: 0.0372 | V: 0.1777 | V_Mean: 0.399 | Win%: 2.29 | FPS: 2154\n", "[Iter 0421] P: 0.0376 | V: 0.1809 | V_Mean: 0.400 | Win%: 2.29 | FPS: 2177\n", "[Iter 0422] P: 
0.0291 | V: 0.1784 | V_Mean: 0.403 | Win%: 2.30 | FPS: 2097\n", "[Iter 0423] P: 0.0286 | V: 0.1763 | V_Mean: 0.401 | Win%: 2.30 | FPS: 2103\n", "[Iter 0424] P: 0.0386 | V: 0.1781 | V_Mean: 0.401 | Win%: 2.30 | FPS: 2510\n", "[Iter 0425] P: 0.0355 | V: 0.1751 | V_Mean: 0.400 | Win%: 2.30 | FPS: 2465\n", "[Iter 0426] P: 0.0301 | V: 0.1757 | V_Mean: 0.399 | Win%: 2.30 | FPS: 2448\n", "[Iter 0427] P: 0.0397 | V: 0.1770 | V_Mean: 0.399 | Win%: 2.30 | FPS: 2602\n", "[Iter 0428] P: 0.0360 | V: 0.1756 | V_Mean: 0.399 | Win%: 2.30 | FPS: 2151\n", "[Iter 0429] P: 0.0330 | V: 0.1746 | V_Mean: 0.401 | Win%: 2.31 | FPS: 2130\n", "[Iter 0430] P: 0.0343 | V: 0.1798 | V_Mean: 0.400 | Win%: 2.31 | FPS: 2293\n", "[Iter 0431] P: 0.0297 | V: 0.1795 | V_Mean: 0.399 | Win%: 2.31 | FPS: 2088\n", "[Iter 0432] P: 0.0326 | V: 0.1750 | V_Mean: 0.400 | Win%: 2.31 | FPS: 2565\n", "[Iter 0433] P: 0.0262 | V: 0.1747 | V_Mean: 0.398 | Win%: 2.31 | FPS: 2469\n", "[Iter 0434] P: 0.0389 | V: 0.1780 | V_Mean: 0.398 | Win%: 2.31 | FPS: 2503\n", "[Iter 0435] P: 0.0271 | V: 0.1799 | V_Mean: 0.399 | Win%: 2.31 | FPS: 2522\n", "[Iter 0436] P: 0.0299 | V: 0.1780 | V_Mean: 0.399 | Win%: 2.31 | FPS: 2495\n", "[Iter 0437] P: 0.0259 | V: 0.1749 | V_Mean: 0.399 | Win%: 2.31 | FPS: 2443\n", "[Iter 0438] P: 0.0312 | V: 0.1777 | V_Mean: 0.397 | Win%: 2.31 | FPS: 2491\n", "[Iter 0439] P: 0.0326 | V: 0.1765 | V_Mean: 0.397 | Win%: 2.31 | FPS: 2352\n", "[Iter 0440] P: 0.0354 | V: 0.1740 | V_Mean: 0.398 | Win%: 2.31 | FPS: 2322\n", "[Iter 0441] P: 0.0356 | V: 0.1760 | V_Mean: 0.396 | Win%: 2.31 | FPS: 2083\n", "[Iter 0442] P: 0.0279 | V: 0.1697 | V_Mean: 0.395 | Win%: 2.31 | FPS: 2131\n", "[Iter 0443] P: 0.0428 | V: 0.1752 | V_Mean: 0.393 | Win%: 2.31 | FPS: 2500\n", "[Iter 0444] P: 0.0416 | V: 0.1735 | V_Mean: 0.390 | Win%: 2.31 | FPS: 2491\n", "[Iter 0445] P: 0.0433 | V: 0.1753 | V_Mean: 0.387 | Win%: 2.30 | FPS: 2601\n", "[Iter 0446] P: 0.0347 | V: 0.1756 | V_Mean: 0.385 | Win%: 2.30 | FPS: 2177\n", "[Iter 0447] P: 
0.0361 | V: 0.1734 | V_Mean: 0.384 | Win%: 2.30 | FPS: 2385\n", "[Iter 0448] P: 0.0374 | V: 0.1770 | V_Mean: 0.384 | Win%: 2.30 | FPS: 2282\n", "[Iter 0449] P: 0.0298 | V: 0.1793 | V_Mean: 0.385 | Win%: 2.31 | FPS: 2315\n", "[Iter 0450] P: 0.0381 | V: 0.1798 | V_Mean: 0.382 | Win%: 2.31 | FPS: 2300\n", "[Iter 0451] P: 0.0304 | V: 0.1729 | V_Mean: 0.380 | Win%: 2.32 | FPS: 2429\n", "[Iter 0452] P: 0.0354 | V: 0.1759 | V_Mean: 0.381 | Win%: 2.31 | FPS: 2602\n", "[Iter 0453] P: 0.0427 | V: 0.1745 | V_Mean: 0.380 | Win%: 2.32 | FPS: 2453\n", "[Iter 0454] P: 0.0345 | V: 0.1770 | V_Mean: 0.380 | Win%: 2.32 | FPS: 2421\n", "[Iter 0455] P: 0.0371 | V: 0.1730 | V_Mean: 0.380 | Win%: 2.32 | FPS: 2407\n", "[Iter 0456] P: 0.0370 | V: 0.1755 | V_Mean: 0.379 | Win%: 2.32 | FPS: 2147\n", "[Iter 0457] P: 0.0420 | V: 0.1731 | V_Mean: 0.377 | Win%: 2.32 | FPS: 2428\n", "[Iter 0458] P: 0.0403 | V: 0.1737 | V_Mean: 0.378 | Win%: 2.33 | FPS: 2268\n", "[Iter 0459] P: 0.0423 | V: 0.1722 | V_Mean: 0.378 | Win%: 2.32 | FPS: 2277\n", "[Iter 0460] P: 0.0419 | V: 0.1783 | V_Mean: 0.378 | Win%: 2.32 | FPS: 2286\n", "[Iter 0461] P: 0.0306 | V: 0.1769 | V_Mean: 0.378 | Win%: 2.32 | FPS: 2375\n", "[Iter 0462] P: 0.0386 | V: 0.1751 | V_Mean: 0.377 | Win%: 2.32 | FPS: 2473\n", "[Iter 0463] P: 0.0368 | V: 0.1769 | V_Mean: 0.374 | Win%: 2.32 | FPS: 2550\n", "[Iter 0464] P: 0.0321 | V: 0.1765 | V_Mean: 0.372 | Win%: 2.32 | FPS: 2458\n", "[Iter 0465] P: 0.0310 | V: 0.1757 | V_Mean: 0.373 | Win%: 2.32 | FPS: 2431\n", "[Iter 0466] P: 0.0356 | V: 0.1766 | V_Mean: 0.373 | Win%: 2.32 | FPS: 2433\n", "[Iter 0467] P: 0.0371 | V: 0.1751 | V_Mean: 0.373 | Win%: 2.32 | FPS: 2448\n", "[Iter 0468] P: 0.0327 | V: 0.1761 | V_Mean: 0.372 | Win%: 2.33 | FPS: 2505\n", "[Iter 0469] P: 0.0347 | V: 0.1768 | V_Mean: 0.371 | Win%: 2.33 | FPS: 2389\n", "[Iter 0470] P: 0.0409 | V: 0.1786 | V_Mean: 0.370 | Win%: 2.33 | FPS: 2253\n", "[Iter 0471] P: 0.0348 | V: 0.1791 | V_Mean: 0.370 | Win%: 2.33 | FPS: 2293\n", "[Iter 0472] P: 
0.0345 | V: 0.1779 | V_Mean: 0.368 | Win%: 2.33 | FPS: 2088\n", "[Iter 0473] P: 0.0326 | V: 0.1770 | V_Mean: 0.369 | Win%: 2.34 | FPS: 2204\n", "[Iter 0474] P: 0.0353 | V: 0.1725 | V_Mean: 0.368 | Win%: 2.34 | FPS: 2487\n", "[Iter 0475] P: 0.0441 | V: 0.1791 | V_Mean: 0.367 | Win%: 2.34 | FPS: 2463\n", "[Iter 0476] P: 0.0376 | V: 0.1761 | V_Mean: 0.369 | Win%: 2.34 | FPS: 2117\n", "[Iter 0477] P: 0.0358 | V: 0.1736 | V_Mean: 0.368 | Win%: 2.33 | FPS: 2237\n", "[Iter 0478] P: 0.0326 | V: 0.1764 | V_Mean: 0.368 | Win%: 2.33 | FPS: 2339\n", "[Iter 0479] P: 0.0450 | V: 0.1798 | V_Mean: 0.368 | Win%: 2.33 | FPS: 2266\n", "[Iter 0480] P: 0.0372 | V: 0.1773 | V_Mean: 0.370 | Win%: 2.33 | FPS: 2047\n", "[Iter 0481] P: 0.0347 | V: 0.1742 | V_Mean: 0.366 | Win%: 2.33 | FPS: 2425\n", "[Iter 0482] P: 0.0462 | V: 0.1771 | V_Mean: 0.366 | Win%: 2.33 | FPS: 2560\n", "[Iter 0483] P: 0.0353 | V: 0.1725 | V_Mean: 0.366 | Win%: 2.33 | FPS: 2493\n", "[Iter 0484] P: 0.0450 | V: 0.1750 | V_Mean: 0.366 | Win%: 2.33 | FPS: 2498\n", "[Iter 0485] P: 0.0303 | V: 0.1724 | V_Mean: 0.365 | Win%: 2.33 | FPS: 2481\n", "[Iter 0486] P: 0.0379 | V: 0.1761 | V_Mean: 0.364 | Win%: 2.33 | FPS: 2453\n", "[Iter 0487] P: 0.0362 | V: 0.1718 | V_Mean: 0.364 | Win%: 2.33 | FPS: 2448\n", "[Iter 0488] P: 0.0444 | V: 0.1752 | V_Mean: 0.363 | Win%: 2.33 | FPS: 2285\n", "[Iter 0489] P: 0.0376 | V: 0.1741 | V_Mean: 0.363 | Win%: 2.33 | FPS: 2299\n", "[Iter 0490] P: 0.0354 | V: 0.1750 | V_Mean: 0.363 | Win%: 2.33 | FPS: 2292\n", "[Iter 0491] P: 0.0439 | V: 0.1764 | V_Mean: 0.363 | Win%: 2.33 | FPS: 2335\n", "[Iter 0492] P: 0.0415 | V: 0.1748 | V_Mean: 0.363 | Win%: 2.33 | FPS: 2392\n", "[Iter 0493] P: 0.0411 | V: 0.1752 | V_Mean: 0.362 | Win%: 2.33 | FPS: 2499\n", "[Iter 0494] P: 0.0289 | V: 0.1737 | V_Mean: 0.362 | Win%: 2.33 | FPS: 2607\n", "[Iter 0495] P: 0.0472 | V: 0.1750 | V_Mean: 0.360 | Win%: 2.33 | FPS: 2506\n", "[Iter 0496] P: 0.0366 | V: 0.1747 | V_Mean: 0.359 | Win%: 2.33 | FPS: 2256\n", "[Iter 0497] P: 
0.0463 | V: 0.1762 | V_Mean: 0.355 | Win%: 2.33 | FPS: 2446\n", "[Iter 0498] P: 0.0407 | V: 0.1764 | V_Mean: 0.353 | Win%: 2.33 | FPS: 2552\n", "[Iter 0499] P: 0.0424 | V: 0.1720 | V_Mean: 0.352 | Win%: 2.32 | FPS: 2388\n", "[Iter 0500] P: 0.0481 | V: 0.1737 | V_Mean: 0.352 | Win%: 2.33 | FPS: 2092\n", "[Iter 0501] P: 0.0456 | V: 0.1716 | V_Mean: 0.349 | Win%: 2.33 | FPS: 2135\n", "[Iter 0502] P: 0.0521 | V: 0.1765 | V_Mean: 0.348 | Win%: 2.33 | FPS: 2420\n", "[Iter 0503] P: 0.0447 | V: 0.1764 | V_Mean: 0.348 | Win%: 2.33 | FPS: 2469\n", "[Iter 0504] P: 0.0354 | V: 0.1753 | V_Mean: 0.348 | Win%: 2.33 | FPS: 2522\n", "[Iter 0505] P: 0.0421 | V: 0.1765 | V_Mean: 0.346 | Win%: 2.34 | FPS: 2405\n", "[Iter 0506] P: 0.0335 | V: 0.1770 | V_Mean: 0.346 | Win%: 2.34 | FPS: 2478\n", "[Iter 0507] P: 0.0343 | V: 0.1725 | V_Mean: 0.346 | Win%: 2.34 | FPS: 2350\n", "[Iter 0508] P: 0.0443 | V: 0.1743 | V_Mean: 0.348 | Win%: 2.34 | FPS: 2190\n", "[Iter 0509] P: 0.0325 | V: 0.1760 | V_Mean: 0.349 | Win%: 2.34 | FPS: 2258\n", "[Iter 0510] P: 0.0385 | V: 0.1758 | V_Mean: 0.346 | Win%: 2.34 | FPS: 2223\n", "[Iter 0511] P: 0.0356 | V: 0.1748 | V_Mean: 0.346 | Win%: 2.34 | FPS: 2069\n", "[Iter 0512] P: 0.0414 | V: 0.1753 | V_Mean: 0.345 | Win%: 2.34 | FPS: 2475\n", "[Iter 0513] P: 0.0511 | V: 0.1769 | V_Mean: 0.345 | Win%: 2.34 | FPS: 2305\n", "[Iter 0514] P: 0.0314 | V: 0.1756 | V_Mean: 0.345 | Win%: 2.34 | FPS: 2452\n", "[Iter 0515] P: 0.0422 | V: 0.1758 | V_Mean: 0.345 | Win%: 2.34 | FPS: 2474\n", "[Iter 0516] P: 0.0399 | V: 0.1754 | V_Mean: 0.345 | Win%: 2.34 | FPS: 2257\n", "[Iter 0517] P: 0.0385 | V: 0.1773 | V_Mean: 0.345 | Win%: 2.35 | FPS: 2258\n", "[Iter 0518] P: 0.0334 | V: 0.1784 | V_Mean: 0.345 | Win%: 2.35 | FPS: 2268\n", "[Iter 0519] P: 0.0341 | V: 0.1737 | V_Mean: 0.345 | Win%: 2.35 | FPS: 2356\n", "[Iter 0520] P: 0.0294 | V: 0.1732 | V_Mean: 0.345 | Win%: 2.35 | FPS: 2321\n", "[Iter 0521] P: 0.0378 | V: 0.1751 | V_Mean: 0.348 | Win%: 2.35 | FPS: 2401\n", "[Iter 0522] P: 
0.0364 | V: 0.1783 | V_Mean: 0.345 | Win%: 2.35 | FPS: 2526\n", "[Iter 0523] P: 0.0372 | V: 0.1750 | V_Mean: 0.346 | Win%: 2.35 | FPS: 2485\n", "[Iter 0524] P: 0.0388 | V: 0.1753 | V_Mean: 0.346 | Win%: 2.35 | FPS: 2475\n", "[Iter 0525] P: 0.0356 | V: 0.1751 | V_Mean: 0.346 | Win%: 2.35 | FPS: 2587\n", "[Iter 0526] P: 0.0370 | V: 0.1758 | V_Mean: 0.346 | Win%: 2.34 | FPS: 2496\n", "[Iter 0527] P: 0.0530 | V: 0.1772 | V_Mean: 0.346 | Win%: 2.35 | FPS: 2446\n", "[Iter 0528] P: 0.0368 | V: 0.1723 | V_Mean: 0.347 | Win%: 2.35 | FPS: 2491\n", "[Iter 0529] P: 0.0538 | V: 0.1763 | V_Mean: 0.346 | Win%: 2.35 | FPS: 2314\n", "[Iter 0530] P: 0.0436 | V: 0.1747 | V_Mean: 0.346 | Win%: 2.35 | FPS: 2145\n", "[Iter 0531] P: 0.0549 | V: 0.1761 | V_Mean: 0.344 | Win%: 2.35 | FPS: 2022\n", "[Iter 0532] P: 0.0370 | V: 0.1738 | V_Mean: 0.343 | Win%: 2.35 | FPS: 2367\n", "[Iter 0533] P: 0.0436 | V: 0.1711 | V_Mean: 0.343 | Win%: 2.35 | FPS: 2543\n", "[Iter 0534] P: 0.0450 | V: 0.1765 | V_Mean: 0.341 | Win%: 2.35 | FPS: 2226\n", "[Iter 0535] P: 0.0393 | V: 0.1756 | V_Mean: 0.340 | Win%: 2.35 | FPS: 2157\n", "[Iter 0536] P: 0.0369 | V: 0.1744 | V_Mean: 0.340 | Win%: 2.35 | FPS: 2222\n", "[Iter 0537] P: 0.0466 | V: 0.1755 | V_Mean: 0.339 | Win%: 2.35 | FPS: 2180\n", "[Iter 0538] P: 0.0380 | V: 0.1723 | V_Mean: 0.339 | Win%: 2.35 | FPS: 2243\n", "[Iter 0539] P: 0.0482 | V: 0.1753 | V_Mean: 0.339 | Win%: 2.35 | FPS: 2322\n", "[Iter 0540] P: 0.0364 | V: 0.1733 | V_Mean: 0.338 | Win%: 2.35 | FPS: 2410\n", "[Iter 0541] P: 0.0341 | V: 0.1747 | V_Mean: 0.339 | Win%: 2.36 | FPS: 2176\n", "[Iter 0542] P: 0.0512 | V: 0.1778 | V_Mean: 0.338 | Win%: 2.36 | FPS: 2302\n", "[Iter 0543] P: 0.0287 | V: 0.1714 | V_Mean: 0.337 | Win%: 2.36 | FPS: 2218\n", "[Iter 0544] P: 0.0468 | V: 0.1723 | V_Mean: 0.338 | Win%: 2.36 | FPS: 2293\n", "[Iter 0545] P: 0.0481 | V: 0.1760 | V_Mean: 0.339 | Win%: 2.37 | FPS: 2182\n", "[Iter 0546] P: 0.0396 | V: 0.1733 | V_Mean: 0.339 | Win%: 2.37 | FPS: 2210\n", "[Iter 0547] P: 
0.0413 | V: 0.1692 | V_Mean: 0.337 | Win%: 2.37 | FPS: 2409\n", "[Iter 0548] P: 0.0528 | V: 0.1733 | V_Mean: 0.339 | Win%: 2.37 | FPS: 2358\n", "[Iter 0549] P: 0.0445 | V: 0.1749 | V_Mean: 0.339 | Win%: 2.37 | FPS: 2413\n", "[Iter 0550] P: 0.0497 | V: 0.1731 | V_Mean: 0.338 | Win%: 2.37 | FPS: 2515\n", "[Iter 0551] P: 0.0382 | V: 0.1776 | V_Mean: 0.339 | Win%: 2.37 | FPS: 2288\n", "[Iter 0552] P: 0.0352 | V: 0.1735 | V_Mean: 0.338 | Win%: 2.37 | FPS: 2049\n", "[Iter 0553] P: 0.0424 | V: 0.1745 | V_Mean: 0.338 | Win%: 2.37 | FPS: 2286\n", "[Iter 0554] P: 0.0416 | V: 0.1747 | V_Mean: 0.335 | Win%: 2.37 | FPS: 2179\n", "[Iter 0555] P: 0.0416 | V: 0.1743 | V_Mean: 0.335 | Win%: 2.37 | FPS: 2412\n", "[Iter 0556] P: 0.0361 | V: 0.1735 | V_Mean: 0.334 | Win%: 2.37 | FPS: 2206\n", "[Iter 0557] P: 0.0426 | V: 0.1762 | V_Mean: 0.333 | Win%: 2.37 | FPS: 2382\n", "[Iter 0558] P: 0.0397 | V: 0.1722 | V_Mean: 0.333 | Win%: 2.36 | FPS: 2371\n", "[Iter 0559] P: 0.0413 | V: 0.1718 | V_Mean: 0.330 | Win%: 2.37 | FPS: 2078\n", "[Iter 0560] P: 0.0473 | V: 0.1713 | V_Mean: 0.330 | Win%: 2.37 | FPS: 2298\n", "[Iter 0561] P: 0.0466 | V: 0.1739 | V_Mean: 0.330 | Win%: 2.38 | FPS: 2334\n", "[Iter 0562] P: 0.0424 | V: 0.1747 | V_Mean: 0.329 | Win%: 2.38 | FPS: 2455\n", "[Iter 0563] P: 0.0410 | V: 0.1715 | V_Mean: 0.329 | Win%: 2.38 | FPS: 2337\n", "[Iter 0564] P: 0.0476 | V: 0.1745 | V_Mean: 0.330 | Win%: 2.38 | FPS: 2421\n", "[Iter 0565] P: 0.0419 | V: 0.1750 | V_Mean: 0.329 | Win%: 2.38 | FPS: 2533\n", "[Iter 0566] P: 0.0404 | V: 0.1746 | V_Mean: 0.330 | Win%: 2.38 | FPS: 2361\n", "[Iter 0567] P: 0.0376 | V: 0.1727 | V_Mean: 0.329 | Win%: 2.38 | FPS: 2259\n", "[Iter 0568] P: 0.0454 | V: 0.1734 | V_Mean: 0.329 | Win%: 2.38 | FPS: 2243\n", "[Iter 0569] P: 0.0452 | V: 0.1738 | V_Mean: 0.329 | Win%: 2.38 | FPS: 1969\n", "[Iter 0570] P: 0.0389 | V: 0.1726 | V_Mean: 0.329 | Win%: 2.39 | FPS: 2279\n", "[Iter 0571] P: 0.0431 | V: 0.1729 | V_Mean: 0.328 | Win%: 2.39 | FPS: 2376\n", "[Iter 0572] P: 
0.0493 | V: 0.1738 | V_Mean: 0.329 | Win%: 2.39 | FPS: 2492\n", "[Iter 0573] P: 0.0434 | V: 0.1737 | V_Mean: 0.330 | Win%: 2.39 | FPS: 2096\n", "[Iter 0574] P: 0.0558 | V: 0.1710 | V_Mean: 0.329 | Win%: 2.39 | FPS: 2221\n", "[Iter 0575] P: 0.0420 | V: 0.1764 | V_Mean: 0.329 | Win%: 2.39 | FPS: 2290\n", "[Iter 0576] P: 0.0385 | V: 0.1718 | V_Mean: 0.329 | Win%: 2.39 | FPS: 2198\n", "[Iter 0577] P: 0.0449 | V: 0.1730 | V_Mean: 0.331 | Win%: 2.40 | FPS: 2277\n", "[Iter 0578] P: 0.0396 | V: 0.1706 | V_Mean: 0.332 | Win%: 2.40 | FPS: 2388\n", "[Iter 0579] P: 0.0480 | V: 0.1731 | V_Mean: 0.333 | Win%: 2.41 | FPS: 2211\n", "[Iter 0580] P: 0.0507 | V: 0.1763 | V_Mean: 0.332 | Win%: 2.41 | FPS: 2165\n", "[Iter 0581] P: 0.0330 | V: 0.1761 | V_Mean: 0.332 | Win%: 2.41 | FPS: 2066\n", "[Iter 0582] P: 0.0455 | V: 0.1724 | V_Mean: 0.331 | Win%: 2.41 | FPS: 2291\n", "[Iter 0583] P: 0.0466 | V: 0.1732 | V_Mean: 0.329 | Win%: 2.41 | FPS: 2086\n", "[Iter 0584] P: 0.0413 | V: 0.1719 | V_Mean: 0.329 | Win%: 2.41 | FPS: 2406\n", "[Iter 0585] P: 0.0406 | V: 0.1731 | V_Mean: 0.329 | Win%: 2.41 | FPS: 2521\n", "[Iter 0586] P: 0.0418 | V: 0.1732 | V_Mean: 0.329 | Win%: 2.41 | FPS: 2407\n", "[Iter 0587] P: 0.0486 | V: 0.1738 | V_Mean: 0.329 | Win%: 2.41 | FPS: 2511\n", "[Iter 0588] P: 0.0509 | V: 0.1732 | V_Mean: 0.330 | Win%: 2.41 | FPS: 2154\n", "[Iter 0589] P: 0.0440 | V: 0.1762 | V_Mean: 0.329 | Win%: 2.42 | FPS: 2355\n", "[Iter 0590] P: 0.0384 | V: 0.1729 | V_Mean: 0.329 | Win%: 2.41 | FPS: 2252\n", "[Iter 0591] P: 0.0482 | V: 0.1715 | V_Mean: 0.329 | Win%: 2.41 | FPS: 2236\n", "[Iter 0592] P: 0.0503 | V: 0.1729 | V_Mean: 0.329 | Win%: 2.41 | FPS: 2373\n", "[Iter 0593] P: 0.0527 | V: 0.1732 | V_Mean: 0.330 | Win%: 2.42 | FPS: 2430\n", "[Iter 0594] P: 0.0500 | V: 0.1765 | V_Mean: 0.330 | Win%: 2.42 | FPS: 2533\n", "[Iter 0595] P: 0.0392 | V: 0.1738 | V_Mean: 0.330 | Win%: 2.42 | FPS: 2415\n", "[Iter 0596] P: 0.0499 | V: 0.1767 | V_Mean: 0.330 | Win%: 2.42 | FPS: 2436\n", "[Iter 0597] P: 
0.0469 | V: 0.1737 | V_Mean: 0.329 | Win%: 2.42 | FPS: 2508\n", "[Iter 0598] P: 0.0451 | V: 0.1736 | V_Mean: 0.329 | Win%: 2.42 | FPS: 2396\n", "[Iter 0599] P: 0.0458 | V: 0.1726 | V_Mean: 0.329 | Win%: 2.42 | FPS: 2421\n", "[Iter 0600] P: 0.0376 | V: 0.1723 | V_Mean: 0.328 | Win%: 2.42 | FPS: 2251\n", "[Iter 0601] P: 0.0611 | V: 0.1740 | V_Mean: 0.329 | Win%: 2.42 | FPS: 2251\n", "[Iter 0602] P: 0.0408 | V: 0.1729 | V_Mean: 0.327 | Win%: 2.42 | FPS: 2131\n", "[Iter 0603] P: 0.0500 | V: 0.1754 | V_Mean: 0.327 | Win%: 2.42 | FPS: 2402\n", "[Iter 0604] P: 0.0422 | V: 0.1741 | V_Mean: 0.327 | Win%: 2.42 | FPS: 2525\n", "[Iter 0605] P: 0.0509 | V: 0.1726 | V_Mean: 0.326 | Win%: 2.42 | FPS: 2456\n", "[Iter 0606] P: 0.0456 | V: 0.1714 | V_Mean: 0.327 | Win%: 2.42 | FPS: 2505\n", "[Iter 0607] P: 0.0511 | V: 0.1731 | V_Mean: 0.327 | Win%: 2.42 | FPS: 2421\n", "[Iter 0608] P: 0.0510 | V: 0.1758 | V_Mean: 0.327 | Win%: 2.43 | FPS: 2346\n", "[Iter 0609] P: 0.0417 | V: 0.1734 | V_Mean: 0.327 | Win%: 2.43 | FPS: 2303\n", "[Iter 0610] P: 0.0510 | V: 0.1727 | V_Mean: 0.327 | Win%: 2.43 | FPS: 2247\n", "[Iter 0611] P: 0.0358 | V: 0.1721 | V_Mean: 0.329 | Win%: 2.43 | FPS: 2082\n", "[Iter 0612] P: 0.0461 | V: 0.1723 | V_Mean: 0.328 | Win%: 2.43 | FPS: 2522\n", "[Iter 0613] P: 0.0369 | V: 0.1722 | V_Mean: 0.328 | Win%: 2.43 | FPS: 2428\n", "[Iter 0614] P: 0.0402 | V: 0.1740 | V_Mean: 0.329 | Win%: 2.43 | FPS: 2199\n", "[Iter 0615] P: 0.0395 | V: 0.1728 | V_Mean: 0.328 | Win%: 2.43 | FPS: 2404\n", "[Iter 0616] P: 0.0569 | V: 0.1723 | V_Mean: 0.328 | Win%: 2.43 | FPS: 2439\n", "[Iter 0617] P: 0.0440 | V: 0.1728 | V_Mean: 0.326 | Win%: 2.44 | FPS: 2215\n", "[Iter 0618] P: 0.0480 | V: 0.1736 | V_Mean: 0.326 | Win%: 2.44 | FPS: 2315\n", "[Iter 0619] P: 0.0438 | V: 0.1754 | V_Mean: 0.326 | Win%: 2.44 | FPS: 2276\n", "[Iter 0620] P: 0.0473 | V: 0.1715 | V_Mean: 0.324 | Win%: 2.44 | FPS: 2386\n", "[Iter 0621] P: 0.0518 | V: 0.1751 | V_Mean: 0.324 | Win%: 2.44 | FPS: 2388\n", "[Iter 0622] P: 
0.0500 | V: 0.1747 | V_Mean: 0.325 | Win%: 2.44 | FPS: 2439\n", "[Iter 0623] P: 0.0582 | V: 0.1748 | V_Mean: 0.324 | Win%: 2.43 | FPS: 2482\n", "[Iter 0624] P: 0.0513 | V: 0.1747 | V_Mean: 0.324 | Win%: 2.43 | FPS: 2440\n", "[Iter 0625] P: 0.0410 | V: 0.1739 | V_Mean: 0.322 | Win%: 2.43 | FPS: 2533\n", "[Iter 0626] P: 0.0404 | V: 0.1717 | V_Mean: 0.322 | Win%: 2.43 | FPS: 2437\n", "[Iter 0627] P: 0.0484 | V: 0.1738 | V_Mean: 0.320 | Win%: 2.43 | FPS: 2380\n", "[Iter 0628] P: 0.0414 | V: 0.1736 | V_Mean: 0.320 | Win%: 2.43 | FPS: 2290\n", "[Iter 0629] P: 0.0500 | V: 0.1704 | V_Mean: 0.321 | Win%: 2.43 | FPS: 2135\n", "[Iter 0630] P: 0.0481 | V: 0.1710 | V_Mean: 0.320 | Win%: 2.43 | FPS: 2303\n", "[Iter 0631] P: 0.0489 | V: 0.1745 | V_Mean: 0.320 | Win%: 2.43 | FPS: 2271\n", "[Iter 0632] P: 0.0459 | V: 0.1717 | V_Mean: 0.320 | Win%: 2.43 | FPS: 2434\n", "[Iter 0633] P: 0.0440 | V: 0.1721 | V_Mean: 0.319 | Win%: 2.43 | FPS: 2521\n", "[Iter 0634] P: 0.0544 | V: 0.1694 | V_Mean: 0.320 | Win%: 2.43 | FPS: 2457\n", "[Iter 0635] P: 0.0510 | V: 0.1725 | V_Mean: 0.320 | Win%: 2.43 | FPS: 2518\n", "[Iter 0636] P: 0.0497 | V: 0.1708 | V_Mean: 0.319 | Win%: 2.43 | FPS: 2420\n", "[Iter 0637] P: 0.0476 | V: 0.1727 | V_Mean: 0.319 | Win%: 2.43 | FPS: 2528\n", "[Iter 0638] P: 0.0524 | V: 0.1737 | V_Mean: 0.317 | Win%: 2.43 | FPS: 2343\n", "[Iter 0639] P: 0.0424 | V: 0.1701 | V_Mean: 0.317 | Win%: 2.43 | FPS: 2271\n", "[Iter 0640] P: 0.0468 | V: 0.1709 | V_Mean: 0.316 | Win%: 2.43 | FPS: 2327\n", "[Iter 0641] P: 0.0543 | V: 0.1711 | V_Mean: 0.316 | Win%: 2.43 | FPS: 2254\n", "[Iter 0642] P: 0.0495 | V: 0.1728 | V_Mean: 0.317 | Win%: 2.44 | FPS: 2281\n", "[Iter 0643] P: 0.0478 | V: 0.1719 | V_Mean: 0.317 | Win%: 2.44 | FPS: 2362\n", "[Iter 0644] P: 0.0526 | V: 0.1755 | V_Mean: 0.317 | Win%: 2.44 | FPS: 2454\n", "[Iter 0645] P: 0.0408 | V: 0.1735 | V_Mean: 0.316 | Win%: 2.44 | FPS: 2359\n", "[Iter 0646] P: 0.0445 | V: 0.1696 | V_Mean: 0.316 | Win%: 2.44 | FPS: 2481\n", "[Iter 0647] P: 
0.0511 | V: 0.1727 | V_Mean: 0.316 | Win%: 2.44 | FPS: 2371\n", "[Iter 0648] P: 0.0530 | V: 0.1721 | V_Mean: 0.314 | Win%: 2.44 | FPS: 2341\n", "[Iter 0649] P: 0.0506 | V: 0.1728 | V_Mean: 0.315 | Win%: 2.45 | FPS: 2014\n", "[Iter 0650] P: 0.0511 | V: 0.1706 | V_Mean: 0.314 | Win%: 2.44 | FPS: 2243\n", "[Iter 0651] P: 0.0530 | V: 0.1706 | V_Mean: 0.314 | Win%: 2.45 | FPS: 2491\n", "[Iter 0652] P: 0.0580 | V: 0.1737 | V_Mean: 0.314 | Win%: 2.45 | FPS: 2467\n", "[Iter 0653] P: 0.0415 | V: 0.1700 | V_Mean: 0.314 | Win%: 2.45 | FPS: 2453\n", "[Iter 0654] P: 0.0552 | V: 0.1717 | V_Mean: 0.314 | Win%: 2.44 | FPS: 2394\n", "[Iter 0655] P: 0.0512 | V: 0.1725 | V_Mean: 0.312 | Win%: 2.44 | FPS: 2157\n", "[Iter 0656] P: 0.0478 | V: 0.1713 | V_Mean: 0.312 | Win%: 2.44 | FPS: 2322\n", "[Iter 0657] P: 0.0540 | V: 0.1709 | V_Mean: 0.312 | Win%: 2.44 | FPS: 2267\n", "[Iter 0658] P: 0.0582 | V: 0.1717 | V_Mean: 0.313 | Win%: 2.45 | FPS: 2119\n", "[Iter 0659] P: 0.0484 | V: 0.1711 | V_Mean: 0.311 | Win%: 2.45 | FPS: 2303\n", "[Iter 0660] P: 0.0563 | V: 0.1710 | V_Mean: 0.312 | Win%: 2.45 | FPS: 2248\n", "[Iter 0661] P: 0.0452 | V: 0.1701 | V_Mean: 0.310 | Win%: 2.45 | FPS: 2418\n", "[Iter 0662] P: 0.0571 | V: 0.1699 | V_Mean: 0.310 | Win%: 2.45 | FPS: 2152\n", "[Iter 0663] P: 0.0522 | V: 0.1698 | V_Mean: 0.309 | Win%: 2.45 | FPS: 2382\n", "[Iter 0664] P: 0.0551 | V: 0.1723 | V_Mean: 0.309 | Win%: 2.46 | FPS: 2060\n", "[Iter 0665] P: 0.0480 | V: 0.1703 | V_Mean: 0.307 | Win%: 2.46 | FPS: 2348\n", "[Iter 0666] P: 0.0510 | V: 0.1686 | V_Mean: 0.306 | Win%: 2.46 | FPS: 2292\n", "[Iter 0667] P: 0.0540 | V: 0.1693 | V_Mean: 0.305 | Win%: 2.46 | FPS: 2538\n", "[Iter 0668] P: 0.0562 | V: 0.1722 | V_Mean: 0.305 | Win%: 2.46 | FPS: 2474\n", "[Iter 0669] P: 0.0458 | V: 0.1696 | V_Mean: 0.303 | Win%: 2.46 | FPS: 2300\n", "[Iter 0670] P: 0.0629 | V: 0.1723 | V_Mean: 0.299 | Win%: 2.46 | FPS: 2224\n", "[Iter 0671] P: 0.0554 | V: 0.1708 | V_Mean: 0.300 | Win%: 2.46 | FPS: 2196\n", "[Iter 0672] P: 
0.0566 | V: 0.1719 | V_Mean: 0.300 | Win%: 2.46 | FPS: 2367\n", "[Iter 0673] P: 0.0533 | V: 0.1708 | V_Mean: 0.297 | Win%: 2.46 | FPS: 2369\n", "[Iter 0674] P: 0.0567 | V: 0.1710 | V_Mean: 0.298 | Win%: 2.46 | FPS: 2091\n", "[Iter 0675] P: 0.0435 | V: 0.1670 | V_Mean: 0.298 | Win%: 2.46 | FPS: 2227\n", "[Iter 0676] P: 0.0540 | V: 0.1705 | V_Mean: 0.297 | Win%: 2.47 | FPS: 2451\n", "[Iter 0677] P: 0.0560 | V: 0.1721 | V_Mean: 0.298 | Win%: 2.47 | FPS: 2232\n", "[Iter 0678] P: 0.0543 | V: 0.1708 | V_Mean: 0.300 | Win%: 2.47 | FPS: 2227\n", "[Iter 0679] P: 0.0578 | V: 0.1690 | V_Mean: 0.295 | Win%: 2.47 | FPS: 2064\n", "[Iter 0680] P: 0.0501 | V: 0.1680 | V_Mean: 0.294 | Win%: 2.47 | FPS: 2325\n", "[Iter 0681] P: 0.0532 | V: 0.1710 | V_Mean: 0.295 | Win%: 2.47 | FPS: 2133\n", "[Iter 0682] P: 0.0490 | V: 0.1706 | V_Mean: 0.292 | Win%: 2.47 | FPS: 2210\n", "[Iter 0683] P: 0.0501 | V: 0.1678 | V_Mean: 0.291 | Win%: 2.47 | FPS: 2459\n", "[Iter 0684] P: 0.0570 | V: 0.1693 | V_Mean: 0.292 | Win%: 2.46 | FPS: 2439\n", "[Iter 0685] P: 0.0493 | V: 0.1690 | V_Mean: 0.290 | Win%: 2.46 | FPS: 2093\n", "[Iter 0686] P: 0.0526 | V: 0.1676 | V_Mean: 0.291 | Win%: 2.46 | FPS: 2037\n", "[Iter 0687] P: 0.0565 | V: 0.1705 | V_Mean: 0.289 | Win%: 2.46 | FPS: 2257\n", "[Iter 0688] P: 0.0495 | V: 0.1698 | V_Mean: 0.289 | Win%: 2.46 | FPS: 2177\n", "[Iter 0689] P: 0.0550 | V: 0.1702 | V_Mean: 0.289 | Win%: 2.46 | FPS: 2130\n", "[Iter 0690] P: 0.0456 | V: 0.1686 | V_Mean: 0.289 | Win%: 2.46 | FPS: 2515\n", "[Iter 0691] P: 0.0629 | V: 0.1692 | V_Mean: 0.289 | Win%: 2.46 | FPS: 2349\n", "[Iter 0692] P: 0.0525 | V: 0.1673 | V_Mean: 0.288 | Win%: 2.47 | FPS: 2360\n", "[Iter 0693] P: 0.0576 | V: 0.1676 | V_Mean: 0.288 | Win%: 2.47 | FPS: 2357\n", "[Iter 0694] P: 0.0537 | V: 0.1665 | V_Mean: 0.286 | Win%: 2.47 | FPS: 2144\n", "[Iter 0695] P: 0.0530 | V: 0.1675 | V_Mean: 0.283 | Win%: 2.46 | FPS: 2174\n", "[Iter 0696] P: 0.0549 | V: 0.1679 | V_Mean: 0.282 | Win%: 2.46 | FPS: 2306\n", "[Iter 0697] P: 
0.0554 | V: 0.1668 | V_Mean: 0.281 | Win%: 2.47 | FPS: 2167\n", "[Iter 0698] P: 0.0573 | V: 0.1665 | V_Mean: 0.279 | Win%: 2.47 | FPS: 2568\n", "[Iter 0699] P: 0.0540 | V: 0.1678 | V_Mean: 0.280 | Win%: 2.47 | FPS: 2127\n", "[Iter 0700] P: 0.0567 | V: 0.1680 | V_Mean: 0.280 | Win%: 2.47 | FPS: 2109\n", "[Iter 0701] P: 0.0575 | V: 0.1674 | V_Mean: 0.279 | Win%: 2.46 | FPS: 2209\n", "[Iter 0702] P: 0.0676 | V: 0.1657 | V_Mean: 0.277 | Win%: 2.46 | FPS: 2203\n", "[Iter 0703] P: 0.0573 | V: 0.1653 | V_Mean: 0.274 | Win%: 2.46 | FPS: 2220\n", "[Iter 0704] P: 0.0534 | V: 0.1656 | V_Mean: 0.274 | Win%: 2.46 | FPS: 2507\n", "[Iter 0705] P: 0.0644 | V: 0.1642 | V_Mean: 0.274 | Win%: 2.46 | FPS: 2366\n", "[Iter 0706] P: 0.0672 | V: 0.1682 | V_Mean: 0.274 | Win%: 2.47 | FPS: 2064\n", "[Iter 0707] P: 0.0574 | V: 0.1647 | V_Mean: 0.271 | Win%: 2.48 | FPS: 2171\n", "[Iter 0708] P: 0.0680 | V: 0.1669 | V_Mean: 0.274 | Win%: 2.48 | FPS: 2218\n", "[Iter 0709] P: 0.0572 | V: 0.1663 | V_Mean: 0.272 | Win%: 2.48 | FPS: 2519\n", "[Iter 0710] P: 0.0573 | V: 0.1672 | V_Mean: 0.274 | Win%: 2.48 | FPS: 2106\n", "[Iter 0711] P: 0.0663 | V: 0.1644 | V_Mean: 0.270 | Win%: 2.48 | FPS: 2193\n", "[Iter 0712] P: 0.0520 | V: 0.1648 | V_Mean: 0.269 | Win%: 2.48 | FPS: 2372\n", "[Iter 0713] P: 0.0589 | V: 0.1662 | V_Mean: 0.268 | Win%: 2.48 | FPS: 2167\n", "[Iter 0714] P: 0.0584 | V: 0.1659 | V_Mean: 0.268 | Win%: 2.48 | FPS: 2406\n", "[Iter 0715] P: 0.0557 | V: 0.1647 | V_Mean: 0.268 | Win%: 2.48 | FPS: 2578\n", "[Iter 0716] P: 0.0597 | V: 0.1658 | V_Mean: 0.269 | Win%: 2.48 | FPS: 2556\n", "[Iter 0717] P: 0.0525 | V: 0.1646 | V_Mean: 0.267 | Win%: 2.48 | FPS: 2439\n", "[Iter 0718] P: 0.0578 | V: 0.1640 | V_Mean: 0.268 | Win%: 2.47 | FPS: 2576\n", "[Iter 0719] P: 0.0562 | V: 0.1669 | V_Mean: 0.268 | Win%: 2.47 | FPS: 2572\n", "[Iter 0720] P: 0.0591 | V: 0.1646 | V_Mean: 0.268 | Win%: 2.47 | FPS: 2572\n", "[Iter 0721] P: 0.0556 | V: 0.1644 | V_Mean: 0.268 | Win%: 2.47 | FPS: 2430\n", "[Iter 0722] P: 
0.0623 | V: 0.1648 | V_Mean: 0.268 | Win%: 2.47 | FPS: 2570\n", "[Iter 0723] P: 0.0558 | V: 0.1654 | V_Mean: 0.267 | Win%: 2.47 | FPS: 2553\n", "[Iter 0724] P: 0.0500 | V: 0.1644 | V_Mean: 0.267 | Win%: 2.47 | FPS: 2581\n", "[Iter 0725] P: 0.0560 | V: 0.1633 | V_Mean: 0.266 | Win%: 2.48 | FPS: 2452\n", "[Iter 0726] P: 0.0602 | V: 0.1642 | V_Mean: 0.267 | Win%: 2.48 | FPS: 2521\n", "[Iter 0727] P: 0.0657 | V: 0.1645 | V_Mean: 0.265 | Win%: 2.47 | FPS: 2285\n", "[Iter 0728] P: 0.0570 | V: 0.1650 | V_Mean: 0.266 | Win%: 2.47 | FPS: 2361\n", "[Iter 0729] P: 0.0574 | V: 0.1643 | V_Mean: 0.266 | Win%: 2.48 | FPS: 2301\n", "[Iter 0730] P: 0.0639 | V: 0.1639 | V_Mean: 0.264 | Win%: 2.48 | FPS: 2327\n", "[Iter 0731] P: 0.0570 | V: 0.1627 | V_Mean: 0.265 | Win%: 2.48 | FPS: 2400\n", "[Iter 0732] P: 0.0592 | V: 0.1626 | V_Mean: 0.265 | Win%: 2.49 | FPS: 2458\n", "[Iter 0733] P: 0.0687 | V: 0.1643 | V_Mean: 0.264 | Win%: 2.49 | FPS: 2425\n", "[Iter 0734] P: 0.0720 | V: 0.1656 | V_Mean: 0.265 | Win%: 2.49 | FPS: 2550\n", "[Iter 0735] P: 0.0522 | V: 0.1639 | V_Mean: 0.265 | Win%: 2.49 | FPS: 2301\n", "[Iter 0736] P: 0.0663 | V: 0.1647 | V_Mean: 0.264 | Win%: 2.49 | FPS: 2527\n", "[Iter 0737] P: 0.0556 | V: 0.1643 | V_Mean: 0.265 | Win%: 2.50 | FPS: 2443\n", "[Iter 0738] P: 0.0643 | V: 0.1655 | V_Mean: 0.265 | Win%: 2.50 | FPS: 2553\n", "[Iter 0739] P: 0.0537 | V: 0.1639 | V_Mean: 0.266 | Win%: 2.51 | FPS: 2570\n", "[Iter 0740] P: 0.0587 | V: 0.1654 | V_Mean: 0.265 | Win%: 2.51 | FPS: 2470\n", "[Iter 0741] P: 0.0593 | V: 0.1644 | V_Mean: 0.264 | Win%: 2.51 | FPS: 2292\n", "[Iter 0742] P: 0.0669 | V: 0.1636 | V_Mean: 0.264 | Win%: 2.51 | FPS: 2331\n", "[Iter 0743] P: 0.0548 | V: 0.1626 | V_Mean: 0.263 | Win%: 2.51 | FPS: 2264\n", "[Iter 0744] P: 0.0624 | V: 0.1637 | V_Mean: 0.264 | Win%: 2.51 | FPS: 2261\n", "[Iter 0745] P: 0.0615 | V: 0.1641 | V_Mean: 0.265 | Win%: 2.51 | FPS: 2374\n", "[Iter 0746] P: 0.0630 | V: 0.1640 | V_Mean: 0.264 | Win%: 2.51 | FPS: 2449\n", "[Iter 0747] P: 
0.0538 | V: 0.1635 | V_Mean: 0.264 | Win%: 2.51 | FPS: 2518\n", "[Iter 0748] P: 0.0521 | V: 0.1647 | V_Mean: 0.264 | Win%: 2.52 | FPS: 2319\n", "[Iter 0749] P: 0.0524 | V: 0.1658 | V_Mean: 0.267 | Win%: 2.52 | FPS: 2183\n", "[Iter 0750] P: 0.0600 | V: 0.1653 | V_Mean: 0.265 | Win%: 2.52 | FPS: 2432\n", "[Iter 0751] P: 0.0576 | V: 0.1657 | V_Mean: 0.266 | Win%: 2.52 | FPS: 2035\n", "[Iter 0752] P: 0.0521 | V: 0.1651 | V_Mean: 0.266 | Win%: 2.53 | FPS: 2270\n", "[Iter 0753] P: 0.0645 | V: 0.1641 | V_Mean: 0.267 | Win%: 2.54 | FPS: 2446\n", "[Iter 0754] P: 0.0579 | V: 0.1646 | V_Mean: 0.266 | Win%: 2.54 | FPS: 2447\n", "[Iter 0755] P: 0.0517 | V: 0.1643 | V_Mean: 0.266 | Win%: 2.54 | FPS: 2362\n", "[Iter 0756] P: 0.0512 | V: 0.1637 | V_Mean: 0.264 | Win%: 2.54 | FPS: 2405\n", "[Iter 0757] P: 0.0495 | V: 0.1646 | V_Mean: 0.264 | Win%: 2.54 | FPS: 2386\n", "[Iter 0758] P: 0.0627 | V: 0.1644 | V_Mean: 0.261 | Win%: 2.54 | FPS: 2142\n", "[Iter 0759] P: 0.0573 | V: 0.1637 | V_Mean: 0.262 | Win%: 2.54 | FPS: 2279\n", "[Iter 0760] P: 0.0637 | V: 0.1660 | V_Mean: 0.263 | Win%: 2.54 | FPS: 2241\n", "[Iter 0761] P: 0.0560 | V: 0.1652 | V_Mean: 0.263 | Win%: 2.54 | FPS: 2325\n", "[Iter 0762] P: 0.0634 | V: 0.1640 | V_Mean: 0.264 | Win%: 2.55 | FPS: 2291\n", "[Iter 0763] P: 0.0710 | V: 0.1654 | V_Mean: 0.264 | Win%: 2.55 | FPS: 2147\n", "[Iter 0764] P: 0.0621 | V: 0.1639 | V_Mean: 0.263 | Win%: 2.55 | FPS: 2207\n", "[Iter 0765] P: 0.0578 | V: 0.1648 | V_Mean: 0.262 | Win%: 2.55 | FPS: 2594\n", "[Iter 0766] P: 0.0755 | V: 0.1664 | V_Mean: 0.263 | Win%: 2.55 | FPS: 2250\n", "[Iter 0767] P: 0.0612 | V: 0.1648 | V_Mean: 0.262 | Win%: 2.56 | FPS: 2139\n", "[Iter 0768] P: 0.0712 | V: 0.1647 | V_Mean: 0.262 | Win%: 2.56 | FPS: 2270\n", "[Iter 0769] P: 0.0664 | V: 0.1661 | V_Mean: 0.264 | Win%: 2.57 | FPS: 2098\n", "[Iter 0770] P: 0.0599 | V: 0.1642 | V_Mean: 0.264 | Win%: 2.58 | FPS: 2257\n", "[Iter 0771] P: 0.0728 | V: 0.1653 | V_Mean: 0.265 | Win%: 2.59 | FPS: 2556\n", "[Iter 0772] P: 
0.0757 | V: 0.1663 | V_Mean: 0.261 | Win%: 2.59 | FPS: 2549\n", "[Iter 0773] P: 0.0611 | V: 0.1640 | V_Mean: 0.262 | Win%: 2.59 | FPS: 2233\n", "[Iter 0774] P: 0.0704 | V: 0.1651 | V_Mean: 0.261 | Win%: 2.59 | FPS: 2549\n", "[Iter 0775] P: 0.0694 | V: 0.1647 | V_Mean: 0.262 | Win%: 2.59 | FPS: 2530\n", "[Iter 0776] P: 0.0765 | V: 0.1648 | V_Mean: 0.260 | Win%: 2.59 | FPS: 2289\n", "[Iter 0777] P: 0.0680 | V: 0.1654 | V_Mean: 0.260 | Win%: 2.60 | FPS: 2156\n", "[Iter 0778] P: 0.0698 | V: 0.1650 | V_Mean: 0.261 | Win%: 2.61 | FPS: 2134\n", "[Iter 0779] P: 0.0660 | V: 0.1651 | V_Mean: 0.261 | Win%: 2.61 | FPS: 2234\n", "[Iter 0780] P: 0.0785 | V: 0.1655 | V_Mean: 0.260 | Win%: 2.61 | FPS: 2543\n", "[Iter 0781] P: 0.0538 | V: 0.1641 | V_Mean: 0.260 | Win%: 2.61 | FPS: 2447\n", "[Iter 0782] P: 0.0687 | V: 0.1649 | V_Mean: 0.261 | Win%: 2.61 | FPS: 2569\n", "[Iter 0783] P: 0.0651 | V: 0.1641 | V_Mean: 0.260 | Win%: 2.61 | FPS: 2200\n", "[Iter 0784] P: 0.0640 | V: 0.1642 | V_Mean: 0.260 | Win%: 2.62 | FPS: 2501\n", "[Iter 0785] P: 0.0700 | V: 0.1644 | V_Mean: 0.259 | Win%: 2.62 | FPS: 2448\n", "[Iter 0786] P: 0.0654 | V: 0.1638 | V_Mean: 0.259 | Win%: 2.62 | FPS: 2204\n", "[Iter 0787] P: 0.0661 | V: 0.1647 | V_Mean: 0.259 | Win%: 2.62 | FPS: 2139\n", "[Iter 0788] P: 0.0614 | V: 0.1634 | V_Mean: 0.258 | Win%: 2.62 | FPS: 2306\n", "[Iter 0789] P: 0.0585 | V: 0.1649 | V_Mean: 0.259 | Win%: 2.62 | FPS: 2380\n", "[Iter 0790] P: 0.0600 | V: 0.1652 | V_Mean: 0.259 | Win%: 2.62 | FPS: 2546\n", "[Iter 0791] P: 0.0816 | V: 0.1650 | V_Mean: 0.258 | Win%: 2.62 | FPS: 2529\n", "[Iter 0792] P: 0.0692 | V: 0.1635 | V_Mean: 0.258 | Win%: 2.63 | FPS: 2526\n", "[Iter 0793] P: 0.0711 | V: 0.1640 | V_Mean: 0.258 | Win%: 2.63 | FPS: 2517\n", "[Iter 0794] P: 0.0586 | V: 0.1638 | V_Mean: 0.260 | Win%: 2.63 | FPS: 2509\n", "[Iter 0795] P: 0.0551 | V: 0.1639 | V_Mean: 0.259 | Win%: 2.64 | FPS: 2140\n", "[Iter 0796] P: 0.0599 | V: 0.1624 | V_Mean: 0.258 | Win%: 2.64 | FPS: 2412\n", "[Iter 0797] P: 
0.0599 | V: 0.1640 | V_Mean: 0.259 | Win%: 2.64 | FPS: 2356\n", "[Iter 0798] P: 0.0606 | V: 0.1645 | V_Mean: 0.259 | Win%: 2.64 | FPS: 2134\n", "[Iter 0799] P: 0.0546 | V: 0.1633 | V_Mean: 0.258 | Win%: 2.64 | FPS: 2173\n", "[Iter 0800] P: 0.0551 | V: 0.1640 | V_Mean: 0.258 | Win%: 2.64 | FPS: 2269\n", "[Iter 0801] P: 0.0704 | V: 0.1646 | V_Mean: 0.258 | Win%: 2.64 | FPS: 2143\n", "[Iter 0802] P: 0.0568 | V: 0.1644 | V_Mean: 0.258 | Win%: 2.64 | FPS: 2071\n", "[Iter 0803] P: 0.0551 | V: 0.1644 | V_Mean: 0.258 | Win%: 2.64 | FPS: 2268\n", "[Iter 0804] P: 0.0567 | V: 0.1633 | V_Mean: 0.257 | Win%: 2.64 | FPS: 2245\n", "[Iter 0805] P: 0.0644 | V: 0.1652 | V_Mean: 0.255 | Win%: 2.64 | FPS: 2201\n", "[Iter 0806] P: 0.0589 | V: 0.1638 | V_Mean: 0.255 | Win%: 2.65 | FPS: 2247\n", "[Iter 0807] P: 0.0615 | V: 0.1645 | V_Mean: 0.254 | Win%: 2.65 | FPS: 2157\n", "[Iter 0808] P: 0.0555 | V: 0.1630 | V_Mean: 0.251 | Win%: 2.65 | FPS: 2118\n", "[Iter 0809] P: 0.0602 | V: 0.1624 | V_Mean: 0.250 | Win%: 2.65 | FPS: 2041\n" ] } ], "source": [ "# NOTE FOR COLAB USERS: Run the following line in a separate cell before running this script:\n", "# !pip -q install chess numpy torch matplotlib pandas\n", "\n", "\"\"\"\n", "Hyper-Optimized GRPO Chess Agent – T4/Colab Targeted\n", "Engineered for strict 14GB VRAM limit, maximized Tensor Core utilization, and minimal CPU-GPU latency.\n", "\n", "Architectural Enhancements:\n", "- FP16 Stable Masking (-60000.0 instead of -1e9)\n", "- Fused AdamW Kernels & Channels Last Memory Format\n", "- TF32 Matmul Precision Enabled\n", "- Int8 GPU Buffer Allocation (Reduces VRAM bandwidth by 75% during rollouts)\n", "- GPU-Accelerated Advantage Normalization & Return Calculation\n", "\"\"\"\n", "\n", "import os\n", "import sys\n", "import csv\n", "import time\n", "import argparse\n", "import random\n", "import numpy as np\n", "import pandas as pd\n", "import matplotlib\n", "matplotlib.use('Agg')\n", "import matplotlib.pyplot as plt\n", "\n", "try:\n", " 
try:
    import chess
except ImportError:
    # Colab convenience: install python-chess on the fly when it is missing.
    os.system("pip install -q chess")
    import chess

import torch
import torch.nn as nn
import torch.nn.functional as F

# ----------------------------------------------------------------------
# Core High-Performance Flags
# ----------------------------------------------------------------------
torch.backends.cudnn.benchmark = True
torch.backends.cuda.matmul.allow_tf32 = True
torch.backends.cudnn.allow_tf32 = True
if hasattr(torch, 'set_float32_matmul_precision'):
    torch.set_float32_matmul_precision('high')

CONFIG = {
    "num_envs": 256,            # Many parallel boards so the GPU is not starved of work
    "grpo_group_size": 8,       # NOTE(review): not read by any code visible in this cell
    "ppo_epochs": 4,
    "mini_batch_size": 8192,    # Pushed to limits for T4 VRAM throughput
    "learning_rate": 3e-4,
    "weight_decay": 1e-4,
    "gamma": 0.995,
    "clip_epsilon": 0.2,
    "entropy_coef": 0.05,
    "value_coef": 0.5,
    "max_steps": 128,           # Power of 2 for better memory alignment
    "checkpoint_dir": "./checkpoints",
    "save_interval": 50,
    "log_interval": 1,
    "device": "cuda" if torch.cuda.is_available() else "cpu",
    "seed": 42,
}

# ----------------------------------------------------------------------
# Action Space Mapper (Optimized Lookup)
# ----------------------------------------------------------------------
class ActionMapper:
    """Bidirectional lookup between UCI move strings and flat action indices.

    Every ordered (from, to) pair of distinct squares gets one index. When the
    origin square is on rank index 1 or 6 and the file changes by at most one,
    four extra indices are appended right after it for the promotion suffixes
    "n", "b", "r", "q". The enumeration order defines the policy-head layout,
    so it must not change while checkpoints trained with it are in use.

    Attributes:
        move_to_idx: dict mapping a UCI string to its action index.
        idx_to_move: list mapping an action index back to its UCI string.
        num_actions: total number of indices handed out.
    """
    __slots__ = ['move_to_idx', 'idx_to_move', 'num_actions']

    def __init__(self):
        self.move_to_idx = {}
        self.idx_to_move = []
        idx = 0
        for f in range(64):
            for t in range(64):
                if f == t:
                    continue
                uci = chess.SQUARE_NAMES[f] + chess.SQUARE_NAMES[t]
                self.move_to_idx[uci] = idx
                self.idx_to_move.append(uci)
                idx += 1
                # Deliberately a superset of real promotions (the target rank is
                # not checked); the extra slots are simply never legal.
                if chess.square_rank(f) in (1, 6) and abs(chess.square_file(f) - chess.square_file(t)) <= 1:
                    for promo in "nbrq":
                        promo_uci = uci + promo
                        self.move_to_idx[promo_uci] = idx
                        self.idx_to_move.append(promo_uci)
                        idx += 1
        self.num_actions = idx


ACTION_MAPPER = ActionMapper()

# ----------------------------------------------------------------------
# Ultra-Fast CPU Vectorization
# ----------------------------------------------------------------------
def populate_states_fast(envs, active_mask, bbs_np, meta_np):
    """Write piece bitboards and scalar board features for every active board.

    Board attributes are read directly instead of going through accessor
    methods to keep the per-board Python overhead low. Rows belonging to
    inactive boards are left untouched.

    Args:
        envs: sequence of ``chess.Board`` objects.
        active_mask: per-board truthy flags; falsy entries are skipped.
        bbs_np: array indexed ``[board, plane]`` receiving 12 bitboards
            (white P, N, B, R, Q, K followed by black P, N, B, R, Q, K).
        meta_np: array indexed ``[board, feature]`` receiving
            0: side to move (+1.0 white, -1.0 black),
            1: castling rights mapped linearly from a 4-bit code to [-1, 1],
            2: en-passant square present (+1.0) or absent (-1.0).

    Returns:
        None. ``bbs_np`` and ``meta_np`` are modified in place.
    """
    for b in range(len(envs)):
        if not active_mask[b]:
            continue
        env = envs[b]
        w = env.occupied_co[chess.WHITE]
        bc = env.occupied_co[chess.BLACK]

        bbs_np[b, 0] = env.pawns & w
        bbs_np[b, 1] = env.knights & w
        bbs_np[b, 2] = env.bishops & w
        bbs_np[b, 3] = env.rooks & w
        bbs_np[b, 4] = env.queens & w
        bbs_np[b, 5] = env.kings & w
        bbs_np[b, 6] = env.pawns & bc
        bbs_np[b, 7] = env.knights & bc
        bbs_np[b, 8] = env.bishops & bc
        bbs_np[b, 9] = env.rooks & bc
        bbs_np[b, 10] = env.queens & bc
        bbs_np[b, 11] = env.kings & bc

        # `castling_rights` is a 64-bit bitboard of the rooks that may still
        # castle, NOT a 0..15 code, so it has to be packed into four bits
        # before scaling. The corner squares below are the standard-chess rook
        # squares, which is what `chess.Board()` starts from.
        rights = env.castling_rights
        castling_code = (
            (1 if rights & chess.BB_H1 else 0)
            | (2 if rights & chess.BB_A1 else 0)
            | (4 if rights & chess.BB_H8 else 0)
            | (8 if rights & chess.BB_A8 else 0)
        )

        meta_np[b, 0] = 1.0 if env.turn else -1.0
        # (x / 15) * 2 - 1, written as x / 7.5 so that x == 15 lands on exactly
        # 1.0 and survives a later truncating cast to an integer dtype.
        meta_np[b, 1] = castling_code / 7.5 - 1.0
        meta_np[b, 2] = 1.0 if env.ep_square is not None else -1.0


def get_legal_masks(envs, active_mask) -> tuple[np.ndarray, list[list[chess.Move]]]:
    """Build a boolean legal-action mask and the legal move list per board.

    Args:
        envs: sequence of ``chess.Board`` objects.
        active_mask: per-board truthy flags; falsy entries are skipped.

    Returns:
        ``(masks, moves_list)`` where ``masks`` has shape
        ``(len(envs), ACTION_MAPPER.num_actions)`` with True at every legal
        action index, and ``moves_list[b]`` is the list of legal moves for
        board ``b``. For skipped boards the mask row stays all False and the
        list entry is None.
    """
    masks = np.zeros((len(envs), ACTION_MAPPER.num_actions), dtype=np.bool_)
    moves_list = [None] * len(envs)
    move_to_idx = ACTION_MAPPER.move_to_idx  # hoisted out of the inner loop
    for b in range(len(envs)):
        if not active_mask[b]:
            continue
        legal = list(envs[b].legal_moves)
        moves_list[b] = legal
        for m in legal:
            masks[b, move_to_idx[m.uci()]] = True
    return masks, moves_list

# ----------------------------------------------------------------------
# Neural Network – ResNet (Channels Last Optimized)
# ----------------------------------------------------------------------
class ChessNet(nn.Module):
    """Residual CNN with a policy head and a tanh-bounded value head.

    Input is a ``(N, 14, 8, 8)`` float tensor. ``forward`` returns
    ``(policy_logits, value)`` with shapes ``(N, ACTION_MAPPER.num_actions)``
    and ``(N, 1)``.
    """

    def __init__(self):
        super().__init__()
        self.conv_in = nn.Conv2d(14, 128, kernel_size=3, padding=1, bias=False)
        self.bn_in = nn.BatchNorm2d(128)

        self.res_blocks = nn.ModuleList([
            nn.Sequential(
                nn.Conv2d(128, 128, 3, padding=1, bias=False),
                nn.BatchNorm2d(128),
                nn.ReLU(inplace=True),
                nn.Conv2d(128, 128, 3, padding=1, bias=False),
                nn.BatchNorm2d(128)
            ) for _ in range(6)
        ])

        self.policy_head = nn.Sequential(
            nn.Conv2d(128, 32, 1, bias=False),
            nn.BatchNorm2d(32),
            nn.ReLU(inplace=True),
            nn.Flatten(),
            nn.Linear(32 * 8 * 8, ACTION_MAPPER.num_actions)
        )

        self.value_head = nn.Sequential(
            nn.Conv2d(128, 32, 1, bias=False),
            nn.BatchNorm2d(32),
            nn.ReLU(inplace=True),
            nn.Flatten(),
            nn.Linear(32 * 8 * 8, 256),
            nn.ReLU(inplace=True),
            nn.Linear(256, 1),
            nn.Tanh()
        )

    def forward(self, x):
        """Run the stem and residual tower, then both heads on the shared features."""
        x = F.relu(self.bn_in(self.conv_in(x)), inplace=True)
        for block in self.res_blocks:
            # Skip connection around each two-conv block.
            x = F.relu(x + block(x), inplace=True)
        return self.policy_head(x), self.value_head(x)

# ----------------------------------------------------------------------
# Optimized GRPO Trainer
# ----------------------------------------------------------------------
class GRPOTrainer:
    """Self-play trainer using a clipped-surrogate (PPO-style) policy update.

    One iteration plays ``CONFIG["num_envs"]`` games in lockstep for at most
    ``CONFIG["max_steps"]`` plies, computes discounted returns, and runs
    ``CONFIG["ppo_epochs"]`` passes of mini-batch updates over the visited
    positions. Metrics are appended to ``training_log.csv`` inside
    ``CONFIG["checkpoint_dir"]``.
    """

    def __init__(self):
        self.device = CONFIG["device"]

        _model = ChessNet().to(self.device).to(memory_format=torch.channels_last)
        try:
            print("Compiling JIT model for Tensor Core reduction...")
            self.model = torch.compile(_model, mode="max-autotune")
        except Exception:
            # Best-effort: fall back to the eager module if compilation is unavailable.
            self.model = _model

        # Fused AdamW is only requested when CUDA is available.
        self.optimizer = torch.optim.AdamW(
            self.model.parameters(),
            lr=CONFIG["learning_rate"],
            weight_decay=CONFIG["weight_decay"],
            fused=True if torch.cuda.is_available() else False
        )
        self.scaler = torch.amp.GradScaler('cuda')
        self.start_iter = 0

        # Bit positions 0..63, broadcast against (B, 12) bitboards when unpacking.
        self.shifts = torch.arange(64, dtype=torch.int64, device=self.device).view(1, 1, 64)

        os.makedirs(CONFIG["checkpoint_dir"], exist_ok=True)
        self.log_file = os.path.join(CONFIG["checkpoint_dir"], "training_log.csv")

        if not os.path.exists(self.log_file):
            with open(self.log_file, "w", newline="") as f:
                csv.writer(f).writerow(["iteration", "p_loss", "v_loss", "v_mean", "fps", "win_rate", "draw_rate"])

        self._init_checkpointing()

    def _init_checkpointing(self):
        """Resume model, optimizer, scaler and iteration counter from ``latest.pt`` if present."""
        latest = os.path.join(CONFIG["checkpoint_dir"], "latest.pt")
        if os.path.exists(latest):
            checkpoint = torch.load(latest, map_location=self.device)
            self.model.load_state_dict(checkpoint['model_state_dict'])
            self.optimizer.load_state_dict(checkpoint['optimizer_state_dict'])
            self.scaler.load_state_dict(checkpoint['scaler_state_dict'])
            self.start_iter = checkpoint['iteration'] + 1

    def save_checkpoint(self, iteration: int):
        """Write ``iter_XXXX.pt`` and repoint the ``latest.pt`` symlink at it.

        Args:
            iteration: value stored under the ``'iteration'`` key and used in
                the file name.
        """
        path = os.path.join(CONFIG["checkpoint_dir"], f"iter_{iteration:04d}.pt")
        torch.save({
            'iteration': iteration,
            'model_state_dict': self.model.state_dict(),
            'optimizer_state_dict': self.optimizer.state_dict(),
            'scaler_state_dict': self.scaler.state_dict(),
        }, path)
        latest = os.path.join(CONFIG["checkpoint_dir"], "latest.pt")
        # lexists (not exists): a dangling symlink reports exists() == False,
        # and os.symlink would then fail with FileExistsError.
        if os.path.lexists(latest):
            os.remove(latest)
        os.symlink(os.path.basename(path), latest)

    def train(self, num_iterations: int):
        """Run rollout + optimisation iterations from ``self.start_iter`` up to ``num_iterations``.

        Args:
            num_iterations: exclusive upper bound on the iteration index.
        """
        B = CONFIG["num_envs"]
        max_steps = CONFIG["max_steps"]
        gamma = CONFIG["gamma"]
        num_actions = ACTION_MAPPER.num_actions

        # Buffer Allocation (int8/bool used heavily to minimize VRAM footprint)
        states_buf = torch.zeros((max_steps, B, 14, 8, 8), dtype=torch.int8, device=self.device)
        actions_buf = torch.zeros((max_steps, B), dtype=torch.int16, device=self.device)
        logprobs_buf = torch.zeros((max_steps, B), dtype=torch.float32, device=self.device)
        values_buf = torch.zeros((max_steps, B), dtype=torch.float32, device=self.device)
        rewards_buf = torch.zeros((max_steps, B), dtype=torch.float32, device=self.device)
        dones_buf = torch.zeros((max_steps, B), dtype=torch.bool, device=self.device)
        active_buf = torch.zeros((max_steps, B), dtype=torch.bool, device=self.device)
        # Legal-move masks are kept so the update phase can rebuild exactly the
        # distribution that the actions were sampled from.
        masks_buf = torch.zeros((max_steps, B, num_actions), dtype=torch.bool, device=self.device)

        bbs_np = np.zeros((B, 12), dtype=np.uint64)
        meta_np = np.zeros((B, 3), dtype=np.float32)

        # Large negative logit that is still representable in float16.
        illegal_logit = torch.tensor(-60000.0, device=self.device)

        print(f"\nšŸš€ Optimized Pipeline | Envs: {B} | BZ: {CONFIG['mini_batch_size']} | Device: {self.device.upper()}")

        for iteration in range(self.start_iter, num_iterations):
            iter_start = time.time()
            envs = [chess.Board() for _ in range(B)]
            active = np.ones(B, dtype=bool)

            # The buffers outlive the iteration, so anything left from the
            # previous rollout (terminal rewards, done flags, activity flags of
            # steps that are not reached this time) must be cleared; otherwise
            # old outcomes leak into this iteration's returns and metrics.
            rewards_buf.zero_()
            dones_buf.zero_()
            active_buf.zero_()

            # --- PHASE 1: VECTORIZED ROLLOUT ---
            for t in range(max_steps):
                if not active.any():
                    break

                populate_states_fast(envs, active, bbs_np, meta_np)

                # uint64 -> int64 reinterpretation keeps the bit pattern; the
                # shift-and-mask below extracts one bit per square.
                bbs_t = torch.as_tensor(bbs_np.astype(np.int64), dtype=torch.int64, device=self.device)
                unpacked_bits = ((bbs_t.unsqueeze(-1) >> self.shifts) & 1).to(torch.int8)
                # NOTE(review): this cast truncates the float features toward
                # zero, so only integral values survive unchanged.
                meta_t = torch.as_tensor(meta_np, dtype=torch.int8, device=self.device)

                states_buf[t, :, :12, :, :] = unpacked_bits.view(B, 12, 8, 8)
                states_buf[t, :, 12, :, :] = meta_t[:, 0].view(B, 1, 1).expand(B, 8, 8)
                states_buf[t, :, 13, :, :] = meta_t[:, 1].view(B, 1, 1).expand(B, 8, 8)
                # The en-passant flag overwrites a single cell of plane 13.
                states_buf[t, :, 13, 0, 1] = meta_t[:, 2]

                active_buf[t] = torch.as_tensor(active, dtype=torch.bool, device=self.device)

                # Expand states to float32 only for forward pass
                model_input = states_buf[t].to(dtype=torch.float32, memory_format=torch.channels_last)

                self.model.eval()
                with torch.no_grad(), torch.amp.autocast('cuda'):
                    logits, values = self.model(model_input)

                masks_np, legal_moves_list = get_legal_masks(envs, active)
                masks_t = torch.as_tensor(masks_np, dtype=torch.bool, device=self.device)
                masks_buf[t] = masks_t

                # Float16 safe clamping
                logits = logits.to(torch.float32)
                logits = torch.where(masks_t, logits, illegal_logit)

                # Rows with no legal action at all (inactive boards) get uniform
                # logits so that sampling stays well defined; they are filtered
                # out later through active_buf.
                is_all_zero = ~masks_t.any(dim=-1, keepdim=True)
                logits.masked_fill_(is_all_zero, 0.0)

                probs = F.softmax(logits, dim=-1)
                dist = torch.distributions.Categorical(probs)
                actions = dist.sample()

                actions_buf[t] = actions.to(torch.int16)
                logprobs_buf[t] = dist.log_prob(actions)
                values_buf[t] = values.squeeze(-1)

                actions_cpu = actions.cpu().numpy()

                # Outcomes are gathered on the host and copied once per step
                # instead of issuing one tiny device write per finished game.
                step_rewards = np.zeros(B, dtype=np.float32)
                step_dones = np.zeros(B, dtype=bool)

                for b in range(B):
                    if not active[b]:
                        continue

                    move_uci = ACTION_MAPPER.idx_to_move[actions_cpu[b]]
                    move = chess.Move.from_uci(move_uci)

                    # Safety net: fall back to a random legal move if the
                    # sampled action is somehow not legal.
                    if move not in legal_moves_list[b]:
                        move = random.choice(legal_moves_list[b])

                    envs[b].push(move)

                    if envs[b].is_game_over():
                        res = envs[b].result()
                        term_reward = 1.0 if res == "1-0" else (-1.0 if res == "0-1" else 0.0)
                        # After push() the turn belongs to the opponent, so this
                        # expresses the result from the mover's point of view.
                        step_rewards[b] = term_reward if envs[b].turn == chess.BLACK else -term_reward
                        step_dones[b] = True
                        active[b] = False

                rewards_buf[t] = torch.as_tensor(step_rewards, device=self.device)
                dones_buf[t] = torch.as_tensor(step_dones, device=self.device)

            # --- PHASE 2: PARALLELIZED RETURNS ---
            returns = torch.zeros(B, dtype=torch.float32, device=self.device)
            returns_buf = torch.zeros_like(rewards_buf)

            for step in reversed(range(max_steps)):
                # Consecutive plies are played by opposing sides and rewards are
                # stored from the mover's perspective, so the value carried back
                # from the next ply changes sign (zero-sum backup).
                not_done = (~dones_buf[step]).float()
                returns = rewards_buf[step] - gamma * returns * not_done
                returns_buf[step] = returns * active_buf[step].float()

            valid_mask = active_buf.view(-1)
            flat_states = states_buf.view(-1, 14, 8, 8)[valid_mask].to(torch.float32, memory_format=torch.channels_last)
            flat_actions = actions_buf.view(-1)[valid_mask].to(torch.int64)
            flat_old_logprobs = logprobs_buf.view(-1)[valid_mask]
            flat_returns = returns_buf.view(-1)[valid_mask]
            flat_values = values_buf.view(-1)[valid_mask]
            flat_masks = masks_buf.view(-1, num_actions)[valid_mask]

            dataset_size = flat_states.size(0)
            if dataset_size < 100:
                continue  # Skip degenerate rollouts

            flat_advantages = flat_returns - flat_values
            flat_advantages = (flat_advantages - flat_advantages.mean()) / (flat_advantages.std() + 1e-8)

            # --- PHASE 3: PPO OPTIMIZATION ---
            self.model.train()
            total_policy_loss, total_value_loss = 0.0, 0.0
            mb_size = CONFIG["mini_batch_size"]
            num_updates = 0

            for _ in range(CONFIG["ppo_epochs"]):
                indices = torch.randperm(dataset_size, device=self.device)

                for start in range(0, dataset_size, mb_size):
                    end = min(start + mb_size, dataset_size)
                    mb_idx = indices[start:end]

                    with torch.amp.autocast('cuda'):
                        new_logits, new_values = self.model(flat_states[mb_idx])

                    # Apply the same legality mask as during sampling so that
                    # the importance ratio compares like with like; the loss is
                    # evaluated in float32.
                    new_logits = torch.where(flat_masks[mb_idx], new_logits.float(), illegal_logit)
                    new_dist = torch.distributions.Categorical(logits=new_logits)
                    new_log_probs = new_dist.log_prob(flat_actions[mb_idx])

                    ratio = torch.exp(new_log_probs - flat_old_logprobs[mb_idx])
                    mb_adv = flat_advantages[mb_idx]

                    surr1 = ratio * mb_adv
                    surr2 = torch.clamp(ratio, 1.0 - CONFIG["clip_epsilon"], 1.0 + CONFIG["clip_epsilon"]) * mb_adv
                    policy_loss = -torch.min(surr1, surr2).mean()

                    value_loss = F.mse_loss(new_values.squeeze(-1).float(), flat_returns[mb_idx])
                    entropy = new_dist.entropy().mean()

                    loss = policy_loss + CONFIG["value_coef"] * value_loss - CONFIG["entropy_coef"] * entropy

                    self.optimizer.zero_grad(set_to_none=True)
                    self.scaler.scale(loss).backward()
                    # Unscale first so the clipping threshold applies to true gradients.
                    self.scaler.unscale_(self.optimizer)
                    nn.utils.clip_grad_norm_(self.model.parameters(), 1.0)
                    self.scaler.step(self.optimizer)
                    self.scaler.update()

                    total_policy_loss += policy_loss.item()
                    total_value_loss += value_loss.item()
                    num_updates += 1

            # --- PHASE 4: METRICS ---
            # A positive reward is recorded whenever the side that just moved
            # won, so this counts decisive games; zero-reward terminals are draws.
            win_count = (rewards_buf > 0).sum().item()
            draw_count = ((dones_buf) & (rewards_buf == 0)).sum().item()

            if (iteration + 1) % CONFIG["log_interval"] == 0:
                fps = dataset_size / max(time.time() - iter_start, 0.001)
                log_data = [
                    iteration + 1,
                    total_policy_loss / max(1, num_updates),
                    total_value_loss / max(1, num_updates),
                    flat_returns.mean().item(),
                    fps,
                    win_count / B,
                    draw_count / B
                ]

                print(f"[Iter {log_data[0]:04d}] P: {log_data[1]:.4f} | V: {log_data[2]:.4f} | "
                      f"V_Mean: {log_data[3]:.3f} | Win%: {log_data[5]:.2f} | FPS: {log_data[4]:.0f}")

                with open(self.log_file, "a", newline="") as f:
                    csv.writer(f).writerow(log_data)

            if (iteration + 1) % CONFIG["save_interval"] == 0:
                self.save_checkpoint(iteration + 1)
                self.plot_metrics()

            # Free unused memory back to cache aggressively
            torch.cuda.empty_cache()

    def plot_metrics(self):
        """Render the CSV log as a 2x2 figure saved to ``training_performance.png``."""
        if not os.path.exists(self.log_file):
            return
        df = pd.read_csv(self.log_file)
        if len(df) == 0:
            return

        fig, axs = plt.subplots(2, 2, figsize=(12, 8))
        axs[0, 0].plot(df['iteration'], df['p_loss'], color='blue')
        axs[0, 0].set_title('Policy Loss')
        axs[0, 1].plot(df['iteration'], df['v_loss'], color='red')
        axs[0, 1].set_title('Value Loss')
        axs[1, 0].plot(df['iteration'], df['v_mean'], color='green')
        axs[1, 0].set_title('Value Mean')
        if 'win_rate' in df.columns:
            axs[1, 1].plot(df['iteration'], df['win_rate'], label='Win', color='purple')
            axs[1, 1].plot(df['iteration'], df['draw_rate'], label='Draw', color='orange')
            axs[1, 1].set_title('Outcomes')
            axs[1, 1].legend()

        plt.tight_layout()
        plt.savefig(os.path.join(CONFIG["checkpoint_dir"], "training_performance.png"))
        # Close explicitly: this is called repeatedly during training.
        plt.close(fig)


if __name__ == "__main__":
    parser = argparse.ArgumentParser()
    parser.add_argument("--iterations", type=int, default=10000)
    parser.add_argument("--test-batch", action="store_true")
    # parse_known_args tolerates the extra argv entries a notebook kernel passes.
    args, _ = parser.parse_known_args()

    torch.manual_seed(CONFIG["seed"])
    np.random.seed(CONFIG["seed"])
    random.seed(CONFIG["seed"])

    trainer = GRPOTrainer()
    trainer.train(2 if args.test_batch else args.iterations)