Tuned initial values and also the range
- app.py +38 -49
- examples/{content_1.jpg → painting.jpg} +2 -2
- examples/{content_2.jpg → scene.jpg} +2 -2
- examples/style_2.jpg +0 -3
- examples/style_3.jpg +0 -3
- examples/{content_3.jpg → swan.jpg} +2 -2
- examples/{style_1.jpg → van_gogh.jpg} +2 -2
- model.py +17 -22
app.py
CHANGED
@@ -159,8 +159,8 @@ def fit_style_transfer(
 
 
 def main():
-    content_image = gr.Image(type="filepath", label="Content Image"
-    style_image = gr.Image(type="filepath", label="Style Image"
+    content_image = gr.Image(type="filepath", label="Content Image")
+    style_image = gr.Image(type="filepath", label="Style Image")
 
     extractor = gr.Dropdown(
         ["inception_v3", "vgg19", "resnet50", "mobilenet_v2"],
@@ -180,7 +180,7 @@ def main():
     n_style_layers = gr.Slider(
         1,
         5,
-        value=
+        value=3,
         step=1,
         label="Style Layers",
     )
@@ -191,34 +191,31 @@ def main():
 
     steps_per_epoch = gr.Slider(
         1,
-
+        20,
         value=5,
         step=1,
         label="Steps Per Epoch",
     )
 
     style_weight = gr.Slider(
-
-
-        value=
-        step=1e-4,
+        0,
+        1,
+        value=0.1,
         label="Style Weight",
     )
 
     content_weight = gr.Slider(
-
-
-        value=
-        step=1e-4,
+        0,
+        1,
+        value=1,
         label="Content Weight",
     )
 
     var_weight = gr.Slider(
         0,
-
-        value=
-
-        label="Total Variation Weight",
+        0.8,
+        value=0,
+        label="Variation Weight",
     )
 
     inputs = [
@@ -237,49 +234,34 @@ def main():
 
     examples = [
         [
-            "examples/
-            "examples/
+            "examples/van_gogh.jpg",
+            "examples/scene.jpg",
             "inception_v3",
-            3,
-            1,
             5,
-
+            5,
             10,
-
-            1e-2,
-            1.5,
-        ],
-        [
-            "examples/style_2.jpg",
-            "examples/content_2.jpg",
-            "inception_v3",
-            3,
-            2,
-            4,
-            60,
+            40,
             10,
-
-
-
+            0.1,
+            1,
+            0.01,
         ],
-
         [
-            "examples/
-            "examples/
-            "
-
-
-            4,
-            60,
+            "examples/painting.jpg",
+            "examples/swan.jpg",
+            "vgg19",
+            5,
+            5,
             10,
-
-
-            1
+            40,
+            10,
+            0.1,
+            1,
+            0.01,
         ]
-
         ]
 
-    output_image = gr.Image(type="numpy", label="Output Image"
+    output_image = gr.Image(type="numpy", label="Output Image")
 
     style_loss = gr.Number(label="Current Style Loss")
 
@@ -291,6 +273,10 @@ def main():
 
     curr_step = gr.Number(label="Current Step")
 
+    title = "Neural Style Transfer"
+
+    description = """### This app uses a neural network to transfer the style of one image to another. \n### The `style image` is the image whose style you want to transfer, and the `content image` is the image you want to transfer the style to. \n### The `feature extractor` is the neural network used to extract the features from the images. \n### The number of `style layers` and `content layers` are the number of layers in the feature extractor used to extract the style and content features respectively. \n### The `epochs`, `learning_rate`, `steps_per_epoch`, `style_weight`, `content_weight`, and `total_variation_weight` are all **hyperparameters** that affect the style transfer process. \n### The style weight controls how much the style image affects the output image, the content weight controls how much the content image affects the output image, and the variation weight controls how much the total variation of the output image affects the output image. The total variation of an image is the sum of the absolute differences for neighboring pixel-values in the image. The total variation loss is used to smooth the output image. The higher the variation weight, the smoother the output image will be."""
+
 
 
     outputs = [output_image, style_loss, content_loss, var_loss, curr_epoch, curr_step]
@@ -299,7 +285,10 @@ def main():
         fn=fit_style_transfer,
         inputs=inputs,
         outputs=outputs,
+        title=title,
+        description=description,
         examples=examples,
+        theme='gradio/monochrome'
 
     )
 
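The new description explains total variation in prose. As a concrete illustration (not part of this commit; the random image tensor and the var_weight value below are assumptions), TensorFlow's built-in tf.image.total_variation computes exactly the sum of absolute differences between neighboring pixel values that the description refers to:

import tensorflow as tf

# Minimal sketch: a total-variation term scaled by a variation weight
# penalizes noisy images. The random image and weight are illustrative.
image = tf.random.uniform((1, 224, 224, 3))  # one RGB image, values in [0, 1]

# Sum of absolute differences between horizontally and vertically
# adjacent pixels; larger values mean a less smooth image.
tv = tf.image.total_variation(image)

var_weight = 0.1  # e.g. a value picked on the variation-weight slider
var_loss = var_weight * tf.reduce_sum(tv)
print(float(var_loss))

A higher var_weight makes this penalty dominate the combined loss, which is why the description says the output image gets smoother as the slider increases.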
examples/{content_1.jpg → painting.jpg}
RENAMED
File without changes

examples/{content_2.jpg → scene.jpg}
RENAMED
File without changes

examples/style_2.jpg
DELETED

examples/style_3.jpg
DELETED

examples/{content_3.jpg → swan.jpg}
RENAMED
File without changes

examples/{style_1.jpg → van_gogh.jpg}
RENAMED
File without changes
model.py
CHANGED
@@ -6,6 +6,8 @@ from keras import backend as K
 
 class NeuralStyleTransfer:
     def __init__(self, style_image, content_image, extractor, n_style_layers=5, n_content_layers=5):
+
+        self.extractor = extractor
         # load the model
         if extractor == "inception_v3":
             self.feature_extractor = tf.keras.applications.InceptionV3(
@@ -69,31 +71,19 @@ class NeuralStyleTransfer:
 
         return image
 
-    def imshow(self, image, title=None):
-        """displays an image with a corresponding title"""
-        if len(image.shape) > 3:
-            image = tf.squeeze(image, axis=0)
-
-        plt.imshow(image)
-        if title:
-            plt.title(title)
-
-    def show_images_with_objects(self, images, titles=[]):
-        """displays a row of images with corresponding titles"""
-        if len(images) != len(titles):
-            return
-
-        plt.figure(figsize=(20, 12))
-        for idx, (image, title) in enumerate(zip(images, titles)):
-            plt.subplot(1, len(images), idx + 1)
-            plt.xticks([])
-            plt.yticks([])
-            self.imshow(image, title)
 
     def _preprocess_image(self, image):
         image = tf.cast(image, dtype=tf.float32)
-
-
+
+        if self.extractor == "inception_v3":
+            image = image / 127.5 - 1
+        elif self.extractor == "vgg19":
+            image = tf.keras.applications.vgg19.preprocess_input(image)
+        elif self.extractor == "resnet50":
+            image = tf.keras.applications.resnet50.preprocess_input(image)
+        elif self.extractor == "mobilenet_v2":
+            # scale pixel between -1 and 1
+            image = image / 127.5 - 1
         return image
 
     def get_output_layers(self):
@@ -219,6 +209,11 @@ class NeuralStyleTransfer:
             )
         ]
         )
+
+        style_loss /= self.n_style_layers
+        content_loss /= self.n_content_layers
+
+
        total_loss = style_loss + content_loss
        return total_loss, style_loss, content_loss
 
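Two substantive changes land in model.py: _preprocess_image now matches each backbone's expected input range, and the accumulated style and content losses are divided by their layer counts, so the weight sliders behave comparably no matter how many layers are selected. A standalone sketch of the preprocessing branch (the random test image below is an assumption for illustration, not repo code):

import numpy as np
import tensorflow as tf

# Illustrative check of the per-extractor preprocessing added above.
image = np.random.randint(0, 256, size=(1, 224, 224, 3)).astype("float32")

# inception_v3 and mobilenet_v2 expect pixels scaled to [-1, 1]:
scaled = image / 127.5 - 1
assert scaled.min() >= -1.0 and scaled.max() <= 1.0

# vgg19 and resnet50 expect BGR channel order with ImageNet means
# subtracted, which their preprocess_input helpers perform:
vgg_ready = tf.keras.applications.vgg19.preprocess_input(image.copy())
resnet_ready = tf.keras.applications.resnet50.preprocess_input(image.copy())

Without the matching preprocessing, a backbone sees inputs far outside its training distribution, and the extracted style and content features degrade accordingly.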