Update README.md
#2
by bfshi - opened
README.md
CHANGED
|
@@ -38,15 +38,15 @@ num_video_frames_thumbnail = 64 # Total sampled frames for thumbnails
|
|
| 38 |
max_tiles_video = 48 # Max spatial tiles per video (one tile is 392x392)
|
| 39 |
|
| 40 |
# ----- AutoGaze args (tiles) -----
|
| 41 |
-
gazing_ratio_tile = [0.2] + [0.06] * 15 # Per-frame max gazing ratios (single float or list)
|
| 42 |
-
task_loss_requirement_tile = 0.6
|
| 43 |
|
| 44 |
# ----- AutoGaze args (thumbnails) -----
|
| 45 |
-
gazing_ratio_thumbnail = 1 # Set to None to skip gazing on thumbnails
|
| 46 |
task_loss_requirement_thumbnail = None
|
| 47 |
|
| 48 |
# ----- Batching -----
|
| 49 |
-
max_batch_size_autogaze = 16
|
| 50 |
max_batch_size_siglip = 32
|
| 51 |
|
| 52 |
# Load processor and model
|
|
|
|
| 38 |
max_tiles_video = 48 # Max spatial tiles per video (one tile is 392x392)
|
| 39 |
|
| 40 |
# ----- AutoGaze args (tiles) -----
|
| 41 |
+
gazing_ratio_tile = [0.2] + [0.06] * 15 # Per-frame max gazing ratios (single float or list). Videos with higher resolution/FPS usually need a lower gazing ratio.
|
| 42 |
+
task_loss_requirement_tile = 0.6 # For each frame, AutoGaze stops gazing once that frame's estimated reconstruction loss falls below this threshold.
|
| 43 |
|
| 44 |
# ----- AutoGaze args (thumbnails) -----
|
| 45 |
+
gazing_ratio_thumbnail = 1 # Set gazing ratio to 1 and task loss requirement to None to skip gazing on thumbnails
|
| 46 |
task_loss_requirement_thumbnail = None
|
| 47 |
|
| 48 |
# ----- Batching -----
|
| 49 |
+
max_batch_size_autogaze = 16 # Use smaller mini-batch sizes for AutoGaze and SigLIP if GPU memory is limited
|
| 50 |
max_batch_size_siglip = 32
|
| 51 |
|
| 52 |
# Load processor and model
|