Update app.py
Browse files
app.py
CHANGED
|
@@ -36,6 +36,10 @@ def setup_training():
|
|
| 36 |
# Load your dataset with the specified configuration
|
| 37 |
logging.info("Loading the MarbleX dataset")
|
| 38 |
dataset = load_dataset("Oranblock/marblex_dataset", "config1") # Replace "config1" with the appropriate config name
|
|
|
|
|
|
|
|
|
|
|
|
|
| 39 |
logging.info(f"Dataset loaded. Train size: {len(dataset['train'])}, Test size: {len(dataset['test'])}")
|
| 40 |
|
| 41 |
# Load tokenizer and model
|
|
|
|
| 36 |
# Load your dataset with the specified configuration
|
| 37 |
logging.info("Loading the MarbleX dataset")
|
| 38 |
dataset = load_dataset("Oranblock/marblex_dataset", "config1") # Replace "config1" with the appropriate config name
|
| 39 |
+
|
| 40 |
+
# Log the train split's column names to show the dataset structure
|
| 41 |
+
logging.info(f"Dataset columns: {dataset['train'].column_names}")
|
| 42 |
+
|
| 43 |
logging.info(f"Dataset loaded. Train size: {len(dataset['train'])}, Test size: {len(dataset['test'])}")
|
| 44 |
|
| 45 |
# Load tokenizer and model
|