| from swift.llm import load_dataset | |
def test_local_dataset():
    """Load the ``firefly`` selection from a git-cloned copy of the dataset repo.

    The repository is cloned with ``git_clone_github``; the value it returns is
    combined with the ``:firefly`` suffix and handed to ``load_dataset`` with
    ``streaming=True``. The first item produced by iterating the first element
    of the result is printed.
    """
    # The dataset repository has to be obtained via git clone for this scenario.
    from swift.llm import git_clone_github

    repo_url = 'https://www.modelscope.cn/datasets/swift/swift-sft-mixture.git'
    repo_dir = git_clone_github(repo_url)
    loaded = load_dataset(datasets=[f'{repo_dir}:firefly'], streaming=True)
    stream = loaded[0]
    first_item = next(iter(stream))
    print(first_item)
def test_hub_dataset():
    """Load ``swift/swift-sft-mixture:firefly`` by identifier and print one item.

    The identifier is passed to ``load_dataset`` with ``streaming=True``; the
    first item produced by iterating the first element of the result is printed.
    """
    dataset_id = 'swift/swift-sft-mixture:firefly'
    loaded = load_dataset(datasets=[dataset_id], streaming=True)
    stream = loaded[0]
    first_item = next(iter(stream))
    print(first_item)
if __name__ == '__main__':
    # Only the git-clone scenario runs when this file is executed as a script;
    # uncomment the call below to exercise the hub-identifier scenario instead.
    test_local_dataset()
    # test_hub_dataset()