Spaces:
Sleeping
Sleeping
Update alternative-2.py
Browse files- alternative-2.py +11 -12
alternative-2.py
CHANGED
|
@@ -97,7 +97,7 @@ def extractDataFromUrls(urls: str, loader_type: str):
|
|
| 97 |
for item in data:
|
| 98 |
jsonData.append(item.to_json())
|
| 99 |
|
| 100 |
-
return jsonData, data
|
| 101 |
|
| 102 |
except Exception as err:
|
| 103 |
return "An Error Occurred. Contact Developer" + str(err), "Error Occured. Boom"
|
|
@@ -140,27 +140,26 @@ choices = [
|
|
| 140 |
|
| 141 |
# Create the Gradio interface
|
| 142 |
with gr.Blocks(theme="sudeepshouche/minimalist") as demo:
|
|
|
|
|
|
|
| 143 |
gr.Markdown("# The Big Scraper")
|
| 144 |
with gr.Tab("Scraped"):
|
| 145 |
with gr.Row():
|
| 146 |
-
|
| 147 |
-
|
| 148 |
-
|
| 149 |
-
|
| 150 |
-
|
|
|
|
| 151 |
|
| 152 |
btn = gr.Button("Extract Data")
|
| 153 |
-
btn.click(extractDataFromUrls, inputs=[url_input, loader_dropdown], outputs=[json_output, text_output])
|
|
|
|
| 154 |
|
| 155 |
with gr.Tab("Images"):
|
| 156 |
-
with gr.Row():
|
| 157 |
-
image_url_input = gr.Textbox(label="Enter URL for Screenshot:")
|
| 158 |
with gr.Row():
|
| 159 |
screenshot_output = gr.Image(label="Screenshot")
|
| 160 |
title_output = gr.Textbox(label="Page Title")
|
| 161 |
|
| 162 |
-
btn2 = gr.Button("Take Screenshot")
|
| 163 |
-
btn2.click(take_webdata, inputs=image_url_input, outputs=[screenshot_output, title_output])
|
| 164 |
-
|
| 165 |
# Launch the Gradio interface
|
| 166 |
demo.launch()
|
|
|
|
| 97 |
for item in data:
|
| 98 |
jsonData.append(item.to_json())
|
| 99 |
|
| 100 |
+
return jsonData, data, urls[0]
|
| 101 |
|
| 102 |
except Exception as err:
|
| 103 |
return "An Error Occurred. Contact Developer" + str(err), "Error Occured. Boom"
|
|
|
|
| 140 |
|
| 141 |
# Create the Gradio interface
|
| 142 |
with gr.Blocks(theme="sudeepshouche/minimalist") as demo:
|
| 143 |
+
extracted_url = gr.State() # Use gr.State() to store the URL
|
| 144 |
+
|
| 145 |
gr.Markdown("# The Big Scraper")
|
| 146 |
with gr.Tab("Scraped"):
|
| 147 |
with gr.Row():
|
| 148 |
+
with gr.Column():
|
| 149 |
+
url_input = gr.Textbox(label="Enter your comma separated URLs here")
|
| 150 |
+
loader_dropdown = gr.Dropdown(choices=choices, label="Pick your Loader from here")
|
| 151 |
+
with gr.Column():
|
| 152 |
+
json_output = gr.JSON(label="Extracted Data (JSON)")
|
| 153 |
+
text_output = gr.Textbox(label="Extracted Data (Text)")
|
| 154 |
|
| 155 |
btn = gr.Button("Extract Data")
|
| 156 |
+
btn.click(extractDataFromUrls, inputs=[url_input, loader_dropdown], outputs=[json_output, text_output, extracted_url]) \
|
| 157 |
+
.then(take_webdata, inputs=extracted_url, outputs=[screenshot_output, title_output])
|
| 158 |
|
| 159 |
with gr.Tab("Images"):
|
|
|
|
|
|
|
| 160 |
with gr.Row():
|
| 161 |
screenshot_output = gr.Image(label="Screenshot")
|
| 162 |
title_output = gr.Textbox(label="Page Title")
|
| 163 |
|
|
|
|
|
|
|
|
|
|
| 164 |
# Launch the Gradio interface
|
| 165 |
demo.launch()
|