Spaces:
Running on CPU Upgrade
Running on CPU Upgrade
Started working on dumping the database
Browse files
- bin/dumpDB.sh +17 -0
- src/dump_handler.py +34 -0
bin/dumpDB.sh
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#!/usr/bin/env bash
#
# Dump a MongoDB database with mongodump and hand the resulting directory to
# src/dump_handler.py.
#
# Usage: dumpDB.sh DB_NAME SAVE_NAME
#   DB_NAME    database passed to `mongodump --db`
#   SAVE_NAME  forwarded unchanged as the second argument of dump_handler.py

DB_NAME="${1:-}"
SAVE_NAME="${2:-}"

# Both arguments are required; print usage on stderr and fail otherwise.
if [[ -z "$DB_NAME" || -z "$SAVE_NAME" ]]; then
    echo "usage: $(basename "$0") DB_NAME SAVE_NAME" >&2
    exit 1
fi

# Resolve the handler relative to this script instead of the caller's working
# directory, so the script also works when it is not started from bin/.
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"

# Timestamped output directory, created relative to the current directory.
OUTPUT_DIR="dump_${DB_NAME}_$(date +%Y%m%d_%H%M%S)"

# Stop here if the dump fails so a missing or partial dump is never handed on.
if ! mongodump --db "$DB_NAME" --out "$OUTPUT_DIR"; then
    echo "mongodump failed for database '$DB_NAME'" >&2
    exit 1
fi

# Replace this shell with the Python handler; its exit status becomes ours.
exec python3 "$SCRIPT_DIR/../src/dump_handler.py" "$OUTPUT_DIR" "$SAVE_NAME"
|
src/dump_handler.py
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from huggingface_hub import upload_folder
|
| 2 |
+
from huggingface_hub import HfApi
|
| 3 |
+
from huggingface_hub import login
|
| 4 |
+
import os
|
| 5 |
+
from pathlib import Path
|
| 6 |
+
import sys
|
| 7 |
+
|
| 8 |
+
class DatasetHandler():
    """Upload local dump folders to the ProjectFrozone/MongoDBDumps dataset repo."""

    def __init__(self, hf_token):
        """Log in to the Hugging Face Hub and create an API client.

        Args:
            hf_token: Access token passed to both ``login`` and ``HfApi``.
        """
        login(hf_token)
        self.api = HfApi(token=hf_token)

    def upload_dump(self, path, name):
        """Upload the folder at ``path`` into the dataset repo under ``name``.

        Args:
            path: Local folder to upload.
            name: Destination path inside the repository.

        Returns:
            0 when the upload call completes, 1 when it raises an exception.
        """
        try:
            # Go through the client built in __init__ so the upload uses the
            # token this handler was constructed with.
            self.api.upload_folder(
                folder_path=path,
                path_in_repo=name,
                repo_id="ProjectFrozone/MongoDBDumps",
                repo_type="dataset",
            )
        except Exception as err:
            # Keep the 0/1 return contract, but say why the upload failed and
            # let KeyboardInterrupt/SystemExit propagate.
            print(f"Upload of {path!r} failed: {err}", file=sys.stderr)
            return 1
        return 0
|
| 20 |
+
|
| 21 |
+
if __name__ == "__main__":
    # Command-line entry point: dump_handler.py file_path name
    # Uploads the folder at file_path under the given name and exits non-zero
    # on any failure so the calling shell script can detect it.

    if len(sys.argv) != 3:
        print("Usage: python3 dump_handler.py file_path name", file=sys.stderr)
        sys.exit(1)

    file_path = sys.argv[1]
    name = sys.argv[2]

    # The access token is read from the environment; fail early with a clear
    # message instead of passing None on to the handler.
    token = os.getenv("HF_TOKEN")
    if not token:
        print("HF_TOKEN environment variable is not set", file=sys.stderr)
        sys.exit(1)

    handler = DatasetHandler(token)

    # upload_dump signals failure through its return value (0 ok, 1 failed)
    # rather than by raising, so check the status instead of using try/except.
    if handler.upload_dump(file_path, name) != 0:
        print("Problem In Upload", file=sys.stderr)
        sys.exit(1)
|