THP2903 committed on
Commit
b0c81df
·
verified ·
1 Parent(s): c3edd3f

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. Dockerfile +43 -0
  2. GUI.py +217 -0
  3. README.md +259 -12
  4. main.py +3 -14
  5. requirements.txt +1 -0
Dockerfile ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
FROM nvidia/cuda:11.1-base-ubuntu20.04

# System packages: build tooling (cmake for dlib) plus the GL/GTK libraries
# that OpenCV needs at import time.
RUN apt update && DEBIAN_FRONTEND=noninteractive apt install git bzip2 wget unzip python3-pip python3-dev cmake libgl1-mesa-dev python-is-python3 libgtk2.0-dev -yq

ADD . /app
WORKDIR /app

# Vendor Synchronized-BatchNorm-PyTorch into both sub-projects that import it.
RUN cd Face_Enhancement/models/networks/ &&\
    git clone https://github.com/vacancy/Synchronized-BatchNorm-PyTorch &&\
    cp -rf Synchronized-BatchNorm-PyTorch/sync_batchnorm . &&\
    cd ../../../

RUN cd Global/detection_models &&\
    git clone https://github.com/vacancy/Synchronized-BatchNorm-PyTorch &&\
    cp -rf Synchronized-BatchNorm-PyTorch/sync_batchnorm . &&\
    cd ../../

# dlib 68-point facial-landmark model used by the face-detection stage.
RUN cd Face_Detection/ &&\
    wget http://dlib.net/files/shape_predictor_68_face_landmarks.dat.bz2 &&\
    bzip2 -d shape_predictor_68_face_landmarks.dat.bz2 &&\
    cd ../

# Pretrained checkpoints for both stages. Remove BOTH zip archives after
# unzipping to keep the image small — the original removed only the Global
# one and left Face_Enhancement/checkpoints.zip baked into the layer.
RUN cd Face_Enhancement/ &&\
    wget https://facevc.blob.core.windows.net/zhanbo/old_photo/pretrain/Face_Enhancement/checkpoints.zip &&\
    unzip checkpoints.zip &&\
    rm -f checkpoints.zip &&\
    cd ../ &&\
    cd Global/ &&\
    wget https://facevc.blob.core.windows.net/zhanbo/old_photo/pretrain/Global/checkpoints.zip &&\
    unzip checkpoints.zip &&\
    rm -f checkpoints.zip &&\
    cd ../

RUN pip3 install numpy

# dlib compiles from source and needs the cmake installed above.
RUN pip3 install dlib

RUN pip3 install -r requirements.txt

RUN git clone https://github.com/NVlabs/SPADE.git

RUN cd SPADE/ && pip3 install -r requirements.txt

# NOTE: the original had a standalone "RUN cd .." here; each RUN starts a
# fresh shell in WORKDIR, so that layer was a no-op and has been removed.

CMD ["python3", "run.py"]
GUI.py ADDED
@@ -0,0 +1,217 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import numpy as np
2
+ import cv2
3
+ import PySimpleGUI as sg
4
+ import os.path
5
+ import argparse
6
+ import os
7
+ import sys
8
+ import shutil
9
+ from subprocess import call
10
+
11
def modify(image_filename=None, cv2_frame=None):
    """Run the full four-stage old-photo restoration pipeline.

    Stages (each invoked as a subprocess, mirroring the project's run.py):
      1. Global restoration (with optional scratch detection/inpainting)
      2. Face detection (dlib)
      3. Face enhancement (SPADE-based generator)
      4. Warp the enhanced faces back and blend into the restored photo

    Args:
        image_filename: path to the folder of input images (used as the
            default for --input_folder).
        cv2_frame: unused; kept for interface compatibility with callers.

    Side effects: changes the process working directory between stages and
    writes all intermediate and final results under the output folder.
    """

    def run_cmd(command):
        # Best-effort stage invocation; Ctrl-C aborts the whole pipeline.
        try:
            call(command, shell=True)
        except KeyboardInterrupt:
            print("Process interrupted")
            sys.exit(1)

    parser = argparse.ArgumentParser()
    parser.add_argument("--input_folder", type=str,
                        default=image_filename, help="Test images")
    parser.add_argument(
        "--output_folder",
        type=str,
        default="./output",
        help="Restored images, please use the absolute path",
    )
    parser.add_argument("--GPU", type=str, default="-1", help="0,1,2")
    parser.add_argument(
        "--checkpoint_name", type=str, default="Setting_9_epoch_100", help="choose which checkpoint"
    )
    # BUG FIX: the original used default="--with_scratch" — a truthy *string*
    # default on a store_true flag — which silently forced the scratch branch
    # on and made the no-scratch branch below dead code. default=True keeps
    # the observed behavior while making the intent explicit.
    parser.add_argument("--with_scratch", default=True, action="store_true")
    opts = parser.parse_args()

    gpu1 = opts.GPU

    # Resolve relative paths before any os.chdir() below invalidates them.
    opts.input_folder = os.path.abspath(opts.input_folder)
    opts.output_folder = os.path.abspath(opts.output_folder)
    if not os.path.exists(opts.output_folder):
        os.makedirs(opts.output_folder)

    main_environment = os.getcwd()

    # Stage 1: Overall Quality Improve
    print("Running Stage 1: Overall restoration")
    os.chdir("./Global")
    stage_1_input_dir = opts.input_folder
    stage_1_output_dir = os.path.join(
        opts.output_folder, "stage_1_restore_output")
    if not os.path.exists(stage_1_output_dir):
        os.makedirs(stage_1_output_dir)

    if not opts.with_scratch:
        stage_1_command = (
            "python test.py --test_mode Full --Quality_restore --test_input "
            + stage_1_input_dir
            + " --outputs_dir "
            + stage_1_output_dir
            + " --gpu_ids "
            + gpu1
        )
        run_cmd(stage_1_command)
    else:
        # Scratch path: first detect scratch masks, then restore using them.
        mask_dir = os.path.join(stage_1_output_dir, "masks")
        new_input = os.path.join(mask_dir, "input")
        new_mask = os.path.join(mask_dir, "mask")
        stage_1_command_1 = (
            "python detection.py --test_path "
            + stage_1_input_dir
            + " --output_dir "
            + mask_dir
            + " --input_size full_size"
            + " --GPU "
            + gpu1
        )
        stage_1_command_2 = (
            "python test.py --Scratch_and_Quality_restore --test_input "
            + new_input
            + " --test_mask "
            + new_mask
            + " --outputs_dir "
            + stage_1_output_dir
            + " --gpu_ids "
            + gpu1
        )
        run_cmd(stage_1_command_1)
        run_cmd(stage_1_command_2)

    # Copy stage-1 results straight into the final output so photos with no
    # detectable face still yield a result after the pipeline finishes.
    stage_1_results = os.path.join(stage_1_output_dir, "restored_image")
    stage_4_output_dir = os.path.join(opts.output_folder, "final_output")
    if not os.path.exists(stage_4_output_dir):
        os.makedirs(stage_4_output_dir)
    for x in os.listdir(stage_1_results):
        img_dir = os.path.join(stage_1_results, x)
        shutil.copy(img_dir, stage_4_output_dir)

    print("Finish Stage 1 ...")
    print("\n")

    # Stage 2: Face Detection
    print("Running Stage 2: Face Detection")
    os.chdir(".././Face_Detection")  # ".././" == "../": back to repo root, then in
    stage_2_input_dir = os.path.join(stage_1_output_dir, "restored_image")
    stage_2_output_dir = os.path.join(
        opts.output_folder, "stage_2_detection_output")
    if not os.path.exists(stage_2_output_dir):
        os.makedirs(stage_2_output_dir)
    stage_2_command = (
        "python detect_all_dlib.py --url " + stage_2_input_dir +
        " --save_url " + stage_2_output_dir
    )
    run_cmd(stage_2_command)
    print("Finish Stage 2 ...")
    print("\n")

    # Stage 3: Face Restore
    print("Running Stage 3: Face Enhancement")
    os.chdir(".././Face_Enhancement")
    stage_3_input_mask = "./"
    stage_3_input_face = stage_2_output_dir
    stage_3_output_dir = os.path.join(
        opts.output_folder, "stage_3_face_output")
    if not os.path.exists(stage_3_output_dir):
        os.makedirs(stage_3_output_dir)
    stage_3_command = (
        "python test_face.py --old_face_folder "
        + stage_3_input_face
        + " --old_face_label_folder "
        + stage_3_input_mask
        + " --tensorboard_log --name "
        + opts.checkpoint_name
        + " --gpu_ids "
        + gpu1
        + " --load_size 256 --label_nc 18 --no_instance --preprocess_mode resize --batchSize 4 --results_dir "
        + stage_3_output_dir
        + " --no_parsing_map"
    )
    run_cmd(stage_3_command)
    print("Finish Stage 3 ...")
    print("\n")

    # Stage 4: Warp back
    print("Running Stage 4: Blending")
    os.chdir(".././Face_Detection")
    stage_4_input_image_dir = os.path.join(
        stage_1_output_dir, "restored_image")
    stage_4_input_face_dir = os.path.join(stage_3_output_dir, "each_img")
    stage_4_output_dir = os.path.join(opts.output_folder, "final_output")
    if not os.path.exists(stage_4_output_dir):
        os.makedirs(stage_4_output_dir)
    stage_4_command = (
        "python align_warp_back_multiple_dlib.py --origin_url "
        + stage_4_input_image_dir
        + " --replace_url "
        + stage_4_input_face_dir
        + " --save_url "
        + stage_4_output_dir
    )
    run_cmd(stage_4_command)
    print("Finish Stage 4 ...")
    print("\n")

    print("All the processing is done. Please check the results.")
# --------------------------------- The GUI ---------------------------------

# Window layout: file chooser row, action buttons, then side-by-side
# before/after image panes.
images_col = [[sg.Text('Input file:'), sg.In(enable_events=True, key='-IN FILE-'), sg.FileBrowse()],
              [sg.Button('Modify Photo', key='-MPHOTO-'), sg.Button('Exit')],
              [sg.Image(filename='', key='-IN-'), sg.Image(filename='', key='-OUT-')],]
# ----- Full layout -----
layout = [[sg.VSeperator(), sg.Column(images_col)]]

# ----- Make the window -----
window = sg.Window('Bringing-old-photos-back-to-life', layout, grab_anywhere=True)

# ----- Run the Event Loop -----
prev_filename = colorized = cap = None
# BUG FIX: initialize filename so clicking "Modify Photo" before choosing a
# file cannot raise NameError (previously only masked by a bare except).
filename = None
while True:
    event, values = window.read()
    if event in (None, 'Exit'):
        break

    elif event == '-MPHOTO-':
        if not filename:
            continue  # no input selected yet
        try:
            n1 = filename.split("/")[-2]
            n2 = filename.split("/")[-3]
            n3 = filename.split("/")[-1]
            filename = str(f"./{n2}/{n1}")
            modify(filename)

            # NOTE: the original declared "global f_image" here, which is a
            # no-op at module scope and has been removed.
            f_image = f'./output/final_output/{n3}'
            image = cv2.imread(f_image)
            window['-OUT-'].update(data=cv2.imencode('.png', image)[1].tobytes())

        # Narrowed from a bare except: keep the GUI alive if the pipeline or
        # image decode fails, but let SystemExit/KeyboardInterrupt propagate.
        except Exception:
            continue

    elif event == '-IN FILE-':  # A single filename was chosen
        filename = values['-IN FILE-']
        if filename != prev_filename:
            prev_filename = filename
            try:
                image = cv2.imread(filename)
                window['-IN-'].update(data=cv2.imencode('.png', image)[1].tobytes())
            except Exception:
                continue

# ----- Exit program -----
window.close()
README.md CHANGED
@@ -1,12 +1,259 @@
1
- ---
2
- title: Phục hồi ảnh & mô tả triết học
3
- emoji: 🖼️
4
- colorFrom: blue
5
- colorTo: green
6
- sdk: gradio
7
- sdk_version: 5.31.0
8
- app_file: app.py
9
- pinned: false
10
- ---
11
-
12
- Upload ảnh cũ bị hư để phục hồi và nhận mô tả triết học từ AI.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Old Photo Restoration (Official PyTorch Implementation)
2
+
3
+ <img src='imgs/0001.jpg'/>
4
+
5
+ ### [Project Page](http://raywzy.com/Old_Photo/) | [Paper (CVPR version)](https://arxiv.org/abs/2004.09484) | [Paper (Journal version)](https://arxiv.org/pdf/2009.07047v1.pdf) | [Pretrained Model](https://hkustconnect-my.sharepoint.com/:f:/g/personal/bzhangai_connect_ust_hk/Em0KnYOeSSxFtp4g_dhWdf0BdeT3tY12jIYJ6qvSf300cA?e=nXkJH2) | [Colab Demo](https://colab.research.google.com/drive/1NEm6AsybIiC5TwTU_4DqDkQO0nFRB-uA?usp=sharing) | [Replicate Demo & Docker Image](https://replicate.ai/zhangmozhe/bringing-old-photos-back-to-life) :fire:
6
+
7
+ **Bringing Old Photos Back to Life, CVPR2020 (Oral)**
8
+
9
+ **Old Photo Restoration via Deep Latent Space Translation, TPAMI 2022**
10
+
11
+ [Ziyu Wan](http://raywzy.com/)<sup>1</sup>,
12
+ [Bo Zhang](https://www.microsoft.com/en-us/research/people/zhanbo/)<sup>2</sup>,
13
+ [Dongdong Chen](http://www.dongdongchen.bid/)<sup>3</sup>,
14
+ [Pan Zhang](https://panzhang0212.github.io/)<sup>4</sup>,
15
+ [Dong Chen](https://www.microsoft.com/en-us/research/people/doch/)<sup>2</sup>,
16
+ [Jing Liao](https://liaojing.github.io/html/)<sup>1</sup>,
17
+ [Fang Wen](https://www.microsoft.com/en-us/research/people/fangwen/)<sup>2</sup> <br>
18
+ <sup>1</sup>City University of Hong Kong, <sup>2</sup>Microsoft Research Asia, <sup>3</sup>Microsoft Cloud AI, <sup>4</sup>USTC
19
+
20
+ <!-- ## Notes of this project
21
+ The code originates from our research project and the aim is to demonstrate the research idea, so we have not optimized it from a product perspective. And we will spend time to address some common issues, such as out of memory issue, limited resolution, but will not involve too much in engineering problems, such as speedup of the inference, fastapi deployment and so on. **We welcome volunteers to contribute to this project to make it more usable for practical application.** -->
22
+
23
+ ## :sparkles: News
24
+ **2022.3.31**: Our new work regarding old film restoration will be published in CVPR 2022. For more details, please refer to the [project website](http://raywzy.com/Old_Film/) and [github repo](https://github.com/raywzy/Bringing-Old-Films-Back-to-Life).
25
+
26
+ The framework now supports the restoration of high-resolution input.
27
+
28
+ <img src='imgs/HR_result.png'>
29
+
30
+ Training code is available and welcome to have a try and learn the training details.
31
+
32
+ You can now play with our [Colab](https://colab.research.google.com/drive/1NEm6AsybIiC5TwTU_4DqDkQO0nFRB-uA?usp=sharing) and try it on your photos.
33
+
34
+ ## Requirement
35
+ The code is tested on Ubuntu with Nvidia GPUs and CUDA installed. Python>=3.6 is required to run the code.
36
+
37
+ ## Installation
38
+
39
+ Clone the Synchronized-BatchNorm-PyTorch repository for
40
+
41
+ ```
42
+ cd Face_Enhancement/models/networks/
43
+ git clone https://github.com/vacancy/Synchronized-BatchNorm-PyTorch
44
+ cp -rf Synchronized-BatchNorm-PyTorch/sync_batchnorm .
45
+ cd ../../../
46
+ ```
47
+
48
+ ```
49
+ cd Global/detection_models
50
+ git clone https://github.com/vacancy/Synchronized-BatchNorm-PyTorch
51
+ cp -rf Synchronized-BatchNorm-PyTorch/sync_batchnorm .
52
+ cd ../../
53
+ ```
54
+
55
+ Download the landmark detection pretrained model
56
+
57
+ ```
58
+ cd Face_Detection/
59
+ wget http://dlib.net/files/shape_predictor_68_face_landmarks.dat.bz2
60
+ bzip2 -d shape_predictor_68_face_landmarks.dat.bz2
61
+ cd ../
62
+ ```
63
+
64
+ Download the pretrained model, put the file `Face_Enhancement/checkpoints.zip` under `./Face_Enhancement`, and put the file `Global/checkpoints.zip` under `./Global`. Then unzip them respectively.
65
+
66
+ ```
67
+ cd Face_Enhancement/
68
+ wget https://github.com/microsoft/Bringing-Old-Photos-Back-to-Life/releases/download/v1.0/face_checkpoints.zip
69
+ unzip face_checkpoints.zip
70
+ cd ../
71
+ cd Global/
72
+ wget https://github.com/microsoft/Bringing-Old-Photos-Back-to-Life/releases/download/v1.0/global_checkpoints.zip
73
+ unzip global_checkpoints.zip
74
+ cd ../
75
+ ```
76
+
77
+ Install dependencies:
78
+
79
+ ```bash
80
+ pip install -r requirements.txt
81
+ ```
82
+
83
+ ## :rocket: How to use?
84
+
85
+ **Note**: GPU can be set 0 or 0,1,2 or 0,2; use -1 for CPU
86
+
87
+ ### 1) Full Pipeline
88
+
89
+ You could easily restore the old photos with one simple command after installation and downloading the pretrained model.
90
+
91
+ For images without scratches:
92
+
93
+ ```
94
+ python run.py --input_folder [test_image_folder_path] \
95
+ --output_folder [output_path] \
96
+ --GPU 0
97
+ ```
98
+
99
+ For scratched images:
100
+
101
+ ```
102
+ python run.py --input_folder [test_image_folder_path] \
103
+ --output_folder [output_path] \
104
+ --GPU 0 \
105
+ --with_scratch
106
+ ```
107
+
108
+ **For high-resolution images with scratches**:
109
+
110
+ ```
111
+ python run.py --input_folder [test_image_folder_path] \
112
+ --output_folder [output_path] \
113
+ --GPU 0 \
114
+ --with_scratch \
115
+ --HR
116
+ ```
117
+
118
+ Note: Please try to use the absolute path. The final results will be saved in `./output_path/final_output/`. You could also check the produced results of different steps in `output_path`.
119
+
120
+ ### 2) Scratch Detection
121
+
122
+ Currently we don't plan to release the scratched old photos dataset with labels directly. If you want to get the paired data, you could use our pretrained model to test the collected images to obtain the labels.
123
+
124
+ ```
125
+ cd Global/
126
+ python detection.py --test_path [test_image_folder_path] \
127
+ --output_dir [output_path] \
128
+ --input_size [resize_256|full_size|scale_256]
129
+ ```
130
+
131
+ <img src='imgs/scratch_detection.png'>
132
+
133
+ ### 3) Global Restoration
134
+
135
+ A triplet domain translation network is proposed to solve both structured degradation and unstructured degradation of old photos.
136
+
137
+ <p align="center">
138
+ <img src='imgs/pipeline.PNG' width="50%" height="50%"/>
139
+ </p>
140
+
141
+ ```
142
+ cd Global/
143
+ python test.py --Scratch_and_Quality_restore \
144
+ --test_input [test_image_folder_path] \
145
+ --test_mask [corresponding mask] \
146
+ --outputs_dir [output_path]
147
+
148
+ python test.py --Quality_restore \
149
+ --test_input [test_image_folder_path] \
150
+ --outputs_dir [output_path]
151
+ ```
152
+
153
+ <img src='imgs/global.png'>
154
+
155
+
156
+ ### 4) Face Enhancement
157
+
158
+ We use a progressive generator to refine the face regions of old photos. More details could be found in our journal submission and `./Face_Enhancement` folder.
159
+
160
+ <p align="center">
161
+ <img src='imgs/face_pipeline.jpg' width="60%" height="60%"/>
162
+ </p>
163
+
164
+
165
+ <img src='imgs/face.png'>
166
+
167
+ > *NOTE*:
168
+ > This repo is mainly for research purpose and we have not yet optimized the running performance.
169
+ >
170
+ > Since the model is pretrained with 256*256 images, the model may not work ideally for arbitrary resolution.
171
+
172
+ ### 5) GUI
173
+
174
+ A user-friendly GUI which takes input of image by user and shows result in respective window.
175
+
176
+ #### How it works:
177
+
178
+ 1. Run GUI.py file.
179
+ 2. Click browse and select your image from test_images/old_w_scratch folder to remove scratches.
180
+ 3. Click Modify Photo button.
181
+ 4. Wait for a while and see results on GUI window.
182
+ 5. Exit window by clicking Exit Window and get your result image in output folder.
183
+
184
+ <img src='imgs/gui.PNG'>
185
+
186
+ ## How to train?
187
+
188
+ ### 1) Create Training File
189
+
190
+ Put the folders of VOC dataset, collected old photos (e.g., Real_L_old and Real_RGB_old) into one shared folder. Then
191
+ ```
192
+ cd Global/data/
193
+ python Create_Bigfile.py
194
+ ```
195
+ Note: Remember to modify the code based on your own environment.
196
+
197
+ ### 2) Train the VAEs of domain A and domain B respectively
198
+
199
+ ```
200
+ cd ..
201
+ python train_domain_A.py --use_v2_degradation --continue_train --training_dataset domain_A --name domainA_SR_old_photos --label_nc 0 --loadSize 256 --fineSize 256 --dataroot [your_data_folder] --no_instance --resize_or_crop crop_only --batchSize 100 --no_html --gpu_ids 0,1,2,3 --self_gen --nThreads 4 --n_downsample_global 3 --k_size 4 --use_v2 --mc 64 --start_r 1 --kl 1 --no_cgan --outputs_dir [your_output_folder] --checkpoints_dir [your_ckpt_folder]
202
+
203
+ python train_domain_B.py --continue_train --training_dataset domain_B --name domainB_old_photos --label_nc 0 --loadSize 256 --fineSize 256 --dataroot [your_data_folder] --no_instance --resize_or_crop crop_only --batchSize 120 --no_html --gpu_ids 0,1,2,3 --self_gen --nThreads 4 --n_downsample_global 3 --k_size 4 --use_v2 --mc 64 --start_r 1 --kl 1 --no_cgan --outputs_dir [your_output_folder] --checkpoints_dir [your_ckpt_folder]
204
+ ```
205
+ Note: For the --name option, please ensure your experiment name contains "domainA" or "domainB", which will be used to select different dataset.
206
+
207
+ ### 3) Train the mapping network between domains
208
+
209
+ Train the mapping without scratches:
210
+ ```
211
+ python train_mapping.py --use_v2_degradation --training_dataset mapping --use_vae_which_epoch 200 --continue_train --name mapping_quality --label_nc 0 --loadSize 256 --fineSize 256 --dataroot [your_data_folder] --no_instance --resize_or_crop crop_only --batchSize 80 --no_html --gpu_ids 0,1,2,3 --nThreads 8 --load_pretrainA [ckpt_of_domainA_SR_old_photos] --load_pretrainB [ckpt_of_domainB_old_photos] --l2_feat 60 --n_downsample_global 3 --mc 64 --k_size 4 --start_r 1 --mapping_n_block 6 --map_mc 512 --use_l1_feat --niter 150 --niter_decay 100 --outputs_dir [your_output_folder] --checkpoints_dir [your_ckpt_folder]
212
+ ```
213
+
214
+
215
+ Training the mapping with scratches:
216
+ ```
217
+ python train_mapping.py --no_TTUR --NL_res --random_hole --use_SN --correlation_renormalize --training_dataset mapping --NL_use_mask --NL_fusion_method combine --non_local Setting_42 --use_v2_degradation --use_vae_which_epoch 200 --continue_train --name mapping_scratch --label_nc 0 --loadSize 256 --fineSize 256 --dataroot [your_data_folder] --no_instance --resize_or_crop crop_only --batchSize 36 --no_html --gpu_ids 0,1,2,3 --nThreads 8 --load_pretrainA [ckpt_of_domainA_SR_old_photos] --load_pretrainB [ckpt_of_domainB_old_photos] --l2_feat 60 --n_downsample_global 3 --mc 64 --k_size 4 --start_r 1 --mapping_n_block 6 --map_mc 512 --use_l1_feat --niter 150 --niter_decay 100 --outputs_dir [your_output_folder] --checkpoints_dir [your_ckpt_folder] --irregular_mask [absolute_path_of_mask_file]
218
+ ```
219
+
220
+ Training the mapping with scratches (Multi-Scale Patch Attention for HR input):
221
+ ```
222
+ python train_mapping.py --no_TTUR --NL_res --random_hole --use_SN --correlation_renormalize --training_dataset mapping --NL_use_mask --NL_fusion_method combine --non_local Setting_42 --use_v2_degradation --use_vae_which_epoch 200 --continue_train --name mapping_Patch_Attention --label_nc 0 --loadSize 256 --fineSize 256 --dataroot [your_data_folder] --no_instance --resize_or_crop crop_only --batchSize 36 --no_html --gpu_ids 0,1,2,3 --nThreads 8 --load_pretrainA [ckpt_of_domainA_SR_old_photos] --load_pretrainB [ckpt_of_domainB_old_photos] --l2_feat 60 --n_downsample_global 3 --mc 64 --k_size 4 --start_r 1 --mapping_n_block 6 --map_mc 512 --use_l1_feat --niter 150 --niter_decay 100 --outputs_dir [your_output_folder] --checkpoints_dir [your_ckpt_folder] --irregular_mask [absolute_path_of_mask_file] --mapping_exp 1
223
+ ```
224
+
225
+
226
+ ## Citation
227
+
228
+ If you find our work useful for your research, please consider citing the following papers :)
229
+
230
+ ```bibtex
231
+ @inproceedings{wan2020bringing,
232
+ title={Bringing Old Photos Back to Life},
233
+ author={Wan, Ziyu and Zhang, Bo and Chen, Dongdong and Zhang, Pan and Chen, Dong and Liao, Jing and Wen, Fang},
234
+ booktitle={Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
235
+ pages={2747--2757},
236
+ year={2020}
237
+ }
238
+ ```
239
+
240
+ ```bibtex
241
+ @article{wan2020old,
242
+ title={Old Photo Restoration via Deep Latent Space Translation},
243
+ author={Wan, Ziyu and Zhang, Bo and Chen, Dongdong and Zhang, Pan and Chen, Dong and Liao, Jing and Wen, Fang},
244
+ journal={arXiv preprint arXiv:2009.07047},
245
+ year={2020}
246
+ }
247
+ ```
248
+
249
+ If you are also interested in the legacy photo/video colorization, please refer to [this work](https://github.com/zhangmozhe/video-colorization).
250
+
251
+ ## Maintenance
252
+
253
+ This project is currently maintained by Ziyu Wan and is for academic research use only. If you have any questions, feel free to contact raywzy@gmail.com.
254
+
255
+ ## License
256
+
257
+ The codes and the pretrained model in this repository are under the MIT license as specified by the LICENSE file. We use our labeled dataset to train the scratch detection model.
258
+
259
+ This project has adopted the [Microsoft Open Source Code of Conduct](https://opensource.microsoft.com/codeofconduct/). For more information see the [Code of Conduct FAQ](https://opensource.microsoft.com/codeofconduct/faq/) or contact [opencode@microsoft.com](mailto:opencode@microsoft.com) with any additional questions or comments.
main.py CHANGED
@@ -11,7 +11,7 @@
11
  # ]
12
 
13
  # API_URL = "https://generativelanguage.googleapis.com/v1beta"
14
-
15
  # WORKING_MODELS = [
16
  # "models/gemini-1.5-flash-latest",
17
  # "models/gemini-1.5-flash-001",
@@ -200,18 +200,7 @@ def try_models_on_image(image_path):
200
  print("\n🚫 All models failed or all API keys quota exceeded.")
201
  return "" # Return empty string if all attempts fail
202
 
203
- # if __name__ == "__main__":
204
- # image_path = "/home/nhattan05022003/coding/SEM_8/MLN_111/photo_restoration/output_img_folder/final_output/monalisa.png"
205
- # description = try_models_on_image(image_path)
206
- # print(f"Final description: {description}")
207
-
208
  if __name__ == "__main__":
209
- import sys
210
-
211
- if len(sys.argv) < 2:
212
- print("❌ Không truyền đường dẫn ảnh.")
213
- sys.exit(1)
214
-
215
- image_path = sys.argv[1]
216
  description = try_models_on_image(image_path)
217
- print(description)
 
11
  # ]
12
 
13
  # API_URL = "https://generativelanguage.googleapis.com/v1beta"
14
+
15
  # WORKING_MODELS = [
16
  # "models/gemini-1.5-flash-latest",
17
  # "models/gemini-1.5-flash-001",
 
200
  print("\n🚫 All models failed or all API keys quota exceeded.")
201
  return "" # Return empty string if all attempts fail
202
 
 
 
 
 
 
203
if __name__ == "__main__":
    import sys

    # Prefer the image path given on the command line (callers such as the
    # restoration pipeline invoke `python main.py <image_path>`), falling
    # back to the previous hard-coded example path so a bare `python main.py`
    # still runs. The hard-coded-only version broke every argv-passing caller.
    if len(sys.argv) >= 2:
        image_path = sys.argv[1]
    else:
        image_path = "/home/nhattan05022003/coding/SEM_8/MLN_111/photo_restoration/output_img_folder/final_output/monalisa.png"
    description = try_models_on_image(image_path)
    print(f"Final description: {description}")
requirements.txt CHANGED
@@ -1,5 +1,6 @@
1
  torch
2
  torchvision
 
3
  scikit-image
4
  easydict
5
  PyYAML
 
1
  torch
2
  torchvision
3
+ dlib
4
  scikit-image
5
  easydict
6
  PyYAML