Spaces:
Sleeping
Sleeping
update prompt
Browse files
app.py
CHANGED
|
@@ -18,6 +18,11 @@ class AudioPalette:
|
|
| 18 |
self.pace_model = PaceModel(height, width, channels, resnet50_tf_model_weights_path, pace_model_weights_path)
|
| 19 |
self.image_captioning = ImageCaptioning()
|
| 20 |
self.audio_generation = AudioGeneration()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 21 |
|
| 22 |
def generate(self, input_image: PIL.Image.Image, ngrok_endpoint: str):
|
| 23 |
pace = self.pace_model.predict(input_image)
|
|
@@ -27,7 +32,8 @@ class AudioPalette:
|
|
| 27 |
print("Captioning Done")
|
| 28 |
|
| 29 |
generated_text = generated_text if generated_text is not None else ""
|
| 30 |
-
prompt = f"Generate a soundtrack for {generated_text} with {pace} beats and the instrument of choice is the guitar, High quality"
|
|
|
|
| 31 |
|
| 32 |
audio_file = self.audio_generation.generate(prompt, ngrok_endpoint)
|
| 33 |
print("Audio Generation Done")
|
|
|
|
| 18 |
self.pace_model = PaceModel(height, width, channels, resnet50_tf_model_weights_path, pace_model_weights_path)
|
| 19 |
self.image_captioning = ImageCaptioning()
|
| 20 |
self.audio_generation = AudioGeneration()
|
| 21 |
+
self.pace_map = {
|
| 22 |
+
"Fast": "high",
|
| 23 |
+
"Medium": "medium",
|
| 24 |
+
"Slow": "low"
|
| 25 |
+
}
|
| 26 |
|
| 27 |
def generate(self, input_image: PIL.Image.Image, ngrok_endpoint: str):
|
| 28 |
pace = self.pace_model.predict(input_image)
|
|
|
|
| 32 |
print("Captioning Done")
|
| 33 |
|
| 34 |
generated_text = generated_text if generated_text is not None else ""
|
| 35 |
+
# prompt = f"Generate a soundtrack for {generated_text} with {pace} beats and the instrument of choice is the guitar, High quality"
|
| 36 |
+
prompt = f"A soundtrack for {generated_text} with {self.pace_map[pace]} beats per minute. High quality."
|
| 37 |
|
| 38 |
audio_file = self.audio_generation.generate(prompt, ngrok_endpoint)
|
| 39 |
print("Audio Generation Done")
|