IshiKura-a
committed on
Commit
·
d91fa39
1
Parent(s):
8051f90
chessdata
Browse files
- .gitattributes +10 -0
- chess/checker&LLM.pdf +0 -0
- chess/chess&LLM.pdf +0 -0
- chess/chessgpt_data_chess_puzzle_dataset_info.json +24 -0
- chess/process_jsonlines.py +24 -0
- chess/puzzle00.jsonl +3 -0
- chess/puzzle01.jsonl +3 -0
- chess/puzzle02.jsonl +3 -0
- chess/puzzle03.jsonl +3 -0
- chess/puzzle04.jsonl +3 -0
- chess/puzzle05.jsonl +3 -0
- chess/puzzle06.jsonl +3 -0
- chess/puzzle07.jsonl +3 -0
- chess/puzzle08.jsonl +3 -0
- chess/puzzle09.jsonl +3 -0
- chess/puzzle10.jsonl +3 -0
- chess/puzzle11.jsonl +3 -0
- chess/puzzle12.jsonl +3 -0
- chess/puzzle13.jsonl +3 -0
- chess/puzzle14.jsonl +3 -0
- chess/puzzle15.jsonl +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,13 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
*.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
*.wandb filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
*.log filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
*.jsonl
|
| 40 |
+
*.wandb
|
| 41 |
+
*.log
|
| 42 |
+
*.jsonl*
|
| 43 |
+
*.wandb*
|
| 44 |
+
*.log*
|
| 45 |
+
*.pdf
|
chess/checker&LLM.pdf
ADDED
|
Binary file (927 kB). View file
|
|
|
chess/chess&LLM.pdf
ADDED
|
Binary file (517 kB). View file
|
|
|
chess/chessgpt_data_chess_puzzle_dataset_info.json
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"shard_lengths": [
|
| 3 |
+
199851,
|
| 4 |
+
199924,
|
| 5 |
+
199453,
|
| 6 |
+
199726,
|
| 7 |
+
199272,
|
| 8 |
+
199512,
|
| 9 |
+
199747,
|
| 10 |
+
199343,
|
| 11 |
+
199682,
|
| 12 |
+
198787,
|
| 13 |
+
199206,
|
| 14 |
+
199248,
|
| 15 |
+
199706,
|
| 16 |
+
199924,
|
| 17 |
+
199539,
|
| 18 |
+
198900
|
| 19 |
+
],
|
| 20 |
+
"total_size": 1525978293,
|
| 21 |
+
"filename_pattern": "chess_puzzle-data.jsonl-{shard_id:05d}-of-{num_shards:05d}",
|
| 22 |
+
"num_examples": 3191820,
|
| 23 |
+
"dataset_name": "chess_puzzle"
|
| 24 |
+
}
|
chess/process_jsonlines.py
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import jsonlines
|
| 2 |
+
import re
|
| 3 |
+
|
| 4 |
+
def extract_fen(puzzle_data):
|
| 5 |
+
text = puzzle_data["text"]
|
| 6 |
+
fen = re.search('(?<=is )[0-9A-Za-z]+/[0-9A-Za-z]+/[0-9A-Za-z]+/[0-9A-Za-z]+/[0-9A-Za-z]+/[0-9A-Za-z]+/[0-9A-Za-z]+/.+?[,.]', text).group(0)[:-1]
|
| 7 |
+
|
| 8 |
+
return fen
|
| 9 |
+
|
| 10 |
+
|
| 11 |
+
for i in range(16):
|
| 12 |
+
read_file = 'chess_puzzle-data.jsonl-000' + str(i).zfill(2) + '-of-00016'
|
| 13 |
+
with jsonlines.open(read_file) as reader:
|
| 14 |
+
write_file = 'puzzle' + str(i).zfill(2) + '.jsonl'
|
| 15 |
+
with jsonlines.open(write_file, mode='w') as writer:
|
| 16 |
+
# count = 0
|
| 17 |
+
for puzzle in reader:
|
| 18 |
+
# count += 1
|
| 19 |
+
writer.write(extract_fen(puzzle))
|
| 20 |
+
# for key, value in puzzle.items():
|
| 21 |
+
# writer.write("key: " + key + " value: " + str(value))
|
| 22 |
+
# writer.write("-----")
|
| 23 |
+
# if count == 10:
|
| 24 |
+
# break
|
chess/puzzle00.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e65c604357197a5ddfdadc131f21ccd11d8fc3d0961a0b2bb4f3e3f5ab7eafc0
|
| 3 |
+
size 11582431
|
chess/puzzle01.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:83b7730299910a88c0b61b217b8623ff10ade2165c3a599b5e498410a7fb6b7e
|
| 3 |
+
size 11591576
|
chess/puzzle02.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bc50ac1a84612dbff90d3079fe2e126420fcb5d475edf16be621449b99df225d
|
| 3 |
+
size 11561724
|
chess/puzzle03.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e137c284018cbd7da06d4f6af76b0f4e2fd8c9b2ea6b78f668a3071d6e56f67
|
| 3 |
+
size 11581850
|
chess/puzzle04.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0c9e27136067121f97d670af6837da130b8040c588b6c89c9ca9315f7c54752
|
| 3 |
+
size 11551762
|
chess/puzzle05.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22d7e3e0308506625eae9234b40d2224014d71d4f7e8be48f244a393d6449398
|
| 3 |
+
size 11568178
|
chess/puzzle06.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35123330882cc045444050a044cdee04ec2067a2351491318e1c604e9053c7da
|
| 3 |
+
size 11577697
|
chess/puzzle07.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f60c2689fc013ac9d7e0434e66a203d167cb3e21355eabfb55b49a8136dab935
|
| 3 |
+
size 11555884
|
chess/puzzle08.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e759021b88813aec161ee676bb723105ff5ef1a1673f4fbf17485d86a7bb9e69
|
| 3 |
+
size 11580910
|
chess/puzzle09.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e58cc12c5e42a98ca2ea1c3b5de4f0e248020a96c8b74e729e22530aea3c710
|
| 3 |
+
size 11520781
|
chess/puzzle10.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:561492edd423940a845204030489fa0890c40fb248c94c91de2ab0352d8e9a68
|
| 3 |
+
size 11542376
|
chess/puzzle11.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99d81aec2219794d7c0ace6d9067bd68a51b4bb6f332bfe5c80890a44dab7e39
|
| 3 |
+
size 11548297
|
chess/puzzle12.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4bcfe91fc66133dc83ebac6460fd9ad62cd414be1eaad9599b0e1037cbdbb5b
|
| 3 |
+
size 11576974
|
chess/puzzle13.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51d17eab86eb8d2c1d3b6e6a22ea95b91c0f1bc77120f3fb78e7117f62cc2488
|
| 3 |
+
size 11588079
|
chess/puzzle14.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ebc6aa1241c858b1c7145ca863e6bdba6f41db6db4520a833972af483069046
|
| 3 |
+
size 11568015
|
chess/puzzle15.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c47c8013506927eae1c019afaeb479035cee935a5ba7c63b1a44d33b0222df3
|
| 3 |
+
size 11529247
|