hieu3636
/

cxr-vlm-code

Model card Files Files and versions

xet

Community

convitom committed 9 days ago

Commit

d313d81

1 Parent(s): 1c5d410

f

Browse files

Files changed (2) hide show

scripts/cxrvlm_colab_train.ipynb +16 -8
utils/_httpx_compat.py +6 -0

scripts/cxrvlm_colab_train.ipynb CHANGED Viewed

@@ -65,6 +65,12 @@
     "# Supported: 'kaggle' | 'colab' | 'lightning' | 'gcp' | 'local'\n",
     "PLATFORM     = 'colab'\n",
     "DATASET_NAME = 'MIMIC-CXR_resized'   # 'MIMIC-CXR' | 'MIMIC-CXR_resized' | 'IU-Xray'\n",
     "\n",
     "assert PLATFORM     in ('kaggle', 'colab', 'lightning', 'gcp', 'local')\n",
     "assert DATASET_NAME in ('MIMIC-CXR', 'MIMIC-CXR_resized', 'IU-Xray')\n",
@@ -337,6 +343,9 @@
     "        def patched(self, *args, **kwargs):\n",
     "            if 'allow_redirects' in kwargs:\n",
     "                kwargs['follow_redirects'] = kwargs.pop('allow_redirects')\n",
     "            return orig(self, *args, **kwargs)\n",
     "        return patched\n",
     "    for cls in (httpx.Client, httpx.AsyncClient):\n",
@@ -741,8 +750,8 @@
     "#                'merged'        → 1 task (full report \"Findings: ...\\n\\nImpression: ...\")\n",
     "#                'split_cascade' → split, but impression's context = GT findings\n",
     "#   image_mode : 'all_views_split' | 'frontal_only_split' | 'multi_image_merged'\n",
-    "train_cfg.data.report_mode             = 'split'\n",
-    "train_cfg.data.image_mode              = 'all_views_split'\n",
     "train_cfg.data.max_images_per_sample   = 2          # only used in multi_image_merged\n",
     "\n",
     "# ── dataset-specific paths ──\n",
@@ -912,7 +921,8 @@
     "train_cfg.training.dataloader_persistent_workers = True\n",
     "train_cfg.training.optim                       = _profile['optim']\n",
     "# Ensure stage2 still uses the same per-run epoch count we want.\n",
-    "train_cfg.stage2.num_epochs                    = 5\n",
     "\n",
     "model_cfg.llm.attn_implementation       = _profile['attn_implementation']\n",
     "model_cfg.llm.gradient_checkpointing    = _profile['gradient_checkpointing']\n",
@@ -976,8 +986,10 @@
   },
   {
    "cell_type": "code",
    "id": "cell-itc",
    "metadata": {},
    "source": [
     "# ── (Optional) Stage-1 ITC alignment toggle ─────────────────────────\n",
     "USE_ITC         = False   # True → contrastive Stage-1 (no Vicuna); False → original\n",
@@ -1029,9 +1041,7 @@
     "    print(OmegaConf.to_yaml(train_cfg.stage1))\n",
     "else:\n",
     "    print('ITC disabled - Stage 1 uses the original LM-loss alignment.')"
-   ],
-   "execution_count": null,
-   "outputs": []
   },
   {
    "cell_type": "markdown",
@@ -1201,8 +1211,6 @@
    "outputs": [],
    "source": [
     "# Resume controller — set MODE once, run the train cell below.\n",
-    "MODE            = 'fresh'        # 'fresh' | 'resume'\n",
-    "EXPLICIT_RUN_ID = None           # None  | 'IU-Xray_run_5'   (only matters when MODE='resume')\n",
     "\n",
     "assert MODE in ('fresh', 'resume'), \"MODE must be 'fresh' or 'resume'\"\n",
     "if MODE == 'resume' and EXPLICIT_RUN_ID:\n",

     "# Supported: 'kaggle' | 'colab' | 'lightning' | 'gcp' | 'local'\n",
     "PLATFORM     = 'colab'\n",
     "DATASET_NAME = 'MIMIC-CXR_resized'   # 'MIMIC-CXR' | 'MIMIC-CXR_resized' | 'IU-Xray'\n",
+    "REPORT_MODE = 'split_cascade'        # 'split' | 'merged' | 'split_cascade'\n",
+    "IMAGE_MODE  = 'all_views_split'  # 'all_views_split' | 'frontal_only_split' | 'multi_image_merged'\n",
+    "S1_EPOCHS   = 2\n",
+    "S2_EPOCHS   = 5\n",
+    "MODE            = 'fresh'        # 'fresh' | 'resume'\n",
+    "EXPLICIT_RUN_ID = None           # None  | 'IU-Xray_run_5'   (only matters when MODE='resume')\n",
     "\n",
     "assert PLATFORM     in ('kaggle', 'colab', 'lightning', 'gcp', 'local')\n",
     "assert DATASET_NAME in ('MIMIC-CXR', 'MIMIC-CXR_resized', 'IU-Xray')\n",
     "        def patched(self, *args, **kwargs):\n",
     "            if 'allow_redirects' in kwargs:\n",
     "                kwargs['follow_redirects'] = kwargs.pop('allow_redirects')\n",
+    "            # httpx 0.28+ removed per-request `proxies=` too — transformers ≤4.49\n",
+    "            # still passes it via huggingface_hub.has_file → drop it silently.\n",
+    "            kwargs.pop('proxies', None)\n",
     "            return orig(self, *args, **kwargs)\n",
     "        return patched\n",
     "    for cls in (httpx.Client, httpx.AsyncClient):\n",
     "#                'merged'        → 1 task (full report \"Findings: ...\\n\\nImpression: ...\")\n",
     "#                'split_cascade' → split, but impression's context = GT findings\n",
     "#   image_mode : 'all_views_split' | 'frontal_only_split' | 'multi_image_merged'\n",
+    "train_cfg.data.report_mode             = REPORT_MODE\n",
+    "train_cfg.data.image_mode              = IMAGE_MODE\n",
     "train_cfg.data.max_images_per_sample   = 2          # only used in multi_image_merged\n",
     "\n",
     "# ── dataset-specific paths ──\n",
     "train_cfg.training.dataloader_persistent_workers = True\n",
     "train_cfg.training.optim                       = _profile['optim']\n",
     "# Ensure stage2 still uses the same per-run epoch count we want.\n",
+    "train_cfg.stage1.num_epochs                    = S1_EPOCHS\n",
+    "train_cfg.stage2.num_epochs                    = S2_EPOCHS\n",
     "\n",
     "model_cfg.llm.attn_implementation       = _profile['attn_implementation']\n",
     "model_cfg.llm.gradient_checkpointing    = _profile['gradient_checkpointing']\n",
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "cell-itc",
    "metadata": {},
+   "outputs": [],
    "source": [
     "# ── (Optional) Stage-1 ITC alignment toggle ─────────────────────────\n",
     "USE_ITC         = False   # True → contrastive Stage-1 (no Vicuna); False → original\n",
     "    print(OmegaConf.to_yaml(train_cfg.stage1))\n",
     "else:\n",
     "    print('ITC disabled - Stage 1 uses the original LM-loss alignment.')"
+   ]
   },
   {
    "cell_type": "markdown",
    "outputs": [],
    "source": [
     "# Resume controller — set MODE once, run the train cell below.\n",
     "\n",
     "assert MODE in ('fresh', 'resume'), \"MODE must be 'fresh' or 'resume'\"\n",
     "if MODE == 'resume' and EXPLICIT_RUN_ID:\n",

utils/_httpx_compat.py CHANGED Viewed

@@ -45,6 +45,12 @@ def apply() -> bool:
                 # follow_redirects is the modern equivalent. If both are
                 # somehow set, allow_redirects wins (matches old behaviour).
                 kwargs["follow_redirects"] = kwargs.pop("allow_redirects")
             return orig(self, *args, **kwargs)
         return patched

                 # follow_redirects is the modern equivalent. If both are
                 # somehow set, allow_redirects wins (matches old behaviour).
                 kwargs["follow_redirects"] = kwargs.pop("allow_redirects")
+            # httpx 0.28 also removed per-request `proxies=`. Some
+            # transformers / huggingface_hub paths still pass it (e.g.
+            # transformers.utils.hub.has_file → Client.head(proxies=...)),
+            # raising TypeError. Drop it silently — httpx 0.28 picks up
+            # proxies from the Client/transport instead.
+            kwargs.pop("proxies", None)
             return orig(self, *args, **kwargs)
         return patched