Buckets:
# Dagster entry point: gathers the pipeline's assets and resources into a
# single ``Definitions`` object bound to the module-level name ``defs``.
import os

from dagster import Definitions
from dagster_hf_datasets import HuggingFaceResource
from dagster_hf_datasets.io_manager import HFParquetIOManager

from code_instruction_pipeline.assets import (
    code_quality_metrics,
    instruction_examples,
    language_filtered_code,
    raw_code_stack,
)

# The four assets registered with Dagster.
_pipeline_assets = [
    raw_code_stack,
    language_filtered_code,
    instruction_examples,
    code_quality_metrics,
]

# Hugging Face resource. The token comes from the HF_TOKEN environment
# variable; ``os.environ.get`` yields None when that variable is unset.
_huggingface = HuggingFaceResource(
    cache_dir=".hf_cache",
    offline=False,
    token=os.environ.get("HF_TOKEN"),
)

# Parquet IO manager configured with a relative ``base_dir``.
_parquet_io = HFParquetIOManager(base_dir=".dagster_hf_storage")

# Resource keys are the names other definitions use to request each resource.
defs = Definitions(
    assets=_pipeline_assets,
    resources={
        "huggingface": _huggingface,
        "hf_parquet_io_manager": _parquet_io,
    },
)
Xet Storage Details
- Size: 769 Bytes
- Xet hash: 386c4fabbbd396b3c957f9a6bb8343c7356205e4964ded084b651ea04d755f55
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.