File size: 1,643 Bytes
aef1f5a
3c4c67b
 
 
aef1f5a
3c4c67b
 
363ba14
3c4c67b
363ba14
aef1f5a
3c4c67b
aef1f5a
 
3c4c67b
 
aef1f5a
 
 
 
 
3c4c67b
 
aef1f5a
 
 
 
 
3c4c67b
 
363ba14
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
"""Tests for the data loader."""

from __future__ import annotations

from typing import TYPE_CHECKING

import pytest
from datasets.exceptions import DatasetNotFoundError

from stroke_deepisles_demo.data.adapter import HuggingFaceDataset, LocalDataset
from stroke_deepisles_demo.data.loader import load_isles_dataset

if TYPE_CHECKING:
    from pathlib import Path


def test_load_from_local_returns_local_dataset(synthetic_isles_dir: Path) -> None:
    """Test that loading from local path returns a LocalDataset."""
    dataset = load_isles_dataset(source=synthetic_isles_dir, local_mode=True)
    assert isinstance(dataset, LocalDataset)
    assert len(dataset) > 0


def test_load_from_local_finds_all_cases(synthetic_isles_dir: Path) -> None:
    """Test that the loader correctly delegates finding cases to adapter."""
    dataset = load_isles_dataset(source=synthetic_isles_dir)
    assert len(dataset) == 2
    assert dataset.list_case_ids() == ["sub-stroke0001", "sub-stroke0002"]


def test_load_hf_raises_on_invalid_dataset() -> None:
    """Test that loading a non-existent HF dataset raises DatasetNotFoundError."""
    with pytest.raises(DatasetNotFoundError):
        load_isles_dataset(source="fake/nonexistent-dataset", local_mode=False)


@pytest.mark.integration
def test_load_from_huggingface_returns_hf_dataset() -> None:
    """Test that loading from HuggingFace returns a HuggingFaceDataset."""
    with load_isles_dataset() as dataset:  # Default is HuggingFace mode
        assert isinstance(dataset, HuggingFaceDataset)
        assert len(dataset) == 149
        assert dataset.list_case_ids()[0] == "sub-stroke0001"