im committed on
Commit ·
bceab41
1
Parent(s): 14feef8
remove possible query parameters from the link
Browse files
app.py
CHANGED
|
@@ -18,6 +18,7 @@ from langchain.schema import (
|
|
| 18 |
SystemMessage
|
| 19 |
)
|
| 20 |
import random
|
|
|
|
| 21 |
|
| 22 |
set_api_key(st.secrets["ELEVENLABS_API_KEY"])
|
| 23 |
crawling_api_key = st.secrets["CRAWLING_API_KEY"]
|
|
@@ -40,14 +41,13 @@ def get_llm(model_name, model_temperature, api_key, max_tokens=None):
|
|
| 40 |
openai_api_key=api_key)
|
| 41 |
|
| 42 |
|
| 43 |
-
def is_valid_web_link(
|
| 44 |
-
|
| 45 |
-
|
| 46 |
-
|
| 47 |
-
|
| 48 |
-
|
| 49 |
-
|
| 50 |
-
return bool(url_pattern.match(text))
|
| 51 |
|
| 52 |
|
| 53 |
@st.cache_data
|
|
@@ -182,7 +182,7 @@ def get_query_params():
|
|
| 182 |
if 'web_url' in params:
|
| 183 |
web_url = params['web_url'][0]
|
| 184 |
if len(web_url) > 0:
|
| 185 |
-
if is_valid_web_link(web_url):
|
| 186 |
st.session_state.web_url = web_url
|
| 187 |
|
| 188 |
|
|
@@ -216,16 +216,16 @@ def main() -> None:
|
|
| 216 |
st.caption(description)
|
| 217 |
st.divider()
|
| 218 |
|
| 219 |
-
|
| 220 |
label_visibility='collapsed',
|
| 221 |
placeholder='Paste your link, e.g. https://expresso.today')
|
| 222 |
col1, _, _, _, col2 = st.columns(5)
|
| 223 |
col1.button("Doodle")
|
| 224 |
if col2.button("Random Page"):
|
| 225 |
-
|
| 226 |
-
if len(
|
| 227 |
-
if is_valid_web_link(
|
| 228 |
-
st.session_state.web_url =
|
| 229 |
st.experimental_rerun()
|
| 230 |
else:
|
| 231 |
st.warning(
|
|
|
|
| 18 |
SystemMessage
|
| 19 |
)
|
| 20 |
import random
|
| 21 |
+
from urllib.parse import urlparse, urlunparse
|
| 22 |
|
| 23 |
set_api_key(st.secrets["ELEVENLABS_API_KEY"])
|
| 24 |
crawling_api_key = st.secrets["CRAWLING_API_KEY"]
|
|
|
|
| 41 |
openai_api_key=api_key)
|
| 42 |
|
| 43 |
|
| 44 |
+
def is_valid_web_link(url):
|
| 45 |
+
parsed_url = urlparse(url)
|
| 46 |
+
cleaned_url = parsed_url._replace(query='')._replace(params='')
|
| 47 |
+
if parsed_url.scheme and parsed_url.netloc:
|
| 48 |
+
return urlunparse(cleaned_url)
|
| 49 |
+
else:
|
| 50 |
+
return None
|
|
|
|
| 51 |
|
| 52 |
|
| 53 |
@st.cache_data
|
|
|
|
| 182 |
if 'web_url' in params:
|
| 183 |
web_url = params['web_url'][0]
|
| 184 |
if len(web_url) > 0:
|
| 185 |
+
if web_url := is_valid_web_link(web_url):
|
| 186 |
st.session_state.web_url = web_url
|
| 187 |
|
| 188 |
|
|
|
|
| 216 |
st.caption(description)
|
| 217 |
st.divider()
|
| 218 |
|
| 219 |
+
web_url = st.text_input(label='Paste your link, e.g. https://expresso.today',
|
| 220 |
label_visibility='collapsed',
|
| 221 |
placeholder='Paste your link, e.g. https://expresso.today')
|
| 222 |
col1, _, _, _, col2 = st.columns(5)
|
| 223 |
col1.button("Doodle")
|
| 224 |
if col2.button("Random Page"):
|
| 225 |
+
web_url = get_random_page()
|
| 226 |
+
if len(web_url) > 0:
|
| 227 |
+
if web_url := is_valid_web_link(web_url):
|
| 228 |
+
st.session_state.web_url = web_url
|
| 229 |
st.experimental_rerun()
|
| 230 |
else:
|
| 231 |
st.warning(
|