Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -292,6 +292,18 @@ if st.session_state.status_message:
|
|
| 292 |
chunks = manager.get_chunks()
|
| 293 |
if not chunks:
|
| 294 |
st.write("Process a URL to begin editing content chunks, or adjust settings in the sidebar.")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 295 |
else:
|
| 296 |
chunk_ids = [c['id'] for c in chunks]
|
| 297 |
if st.session_state.selected_chunk_id not in chunk_ids:
|
|
|
|
| 292 |
chunks = manager.get_chunks()
|
| 293 |
if not chunks:
|
| 294 |
st.write("Process a URL to begin editing content chunks, or adjust settings in the sidebar.")
|
| 295 |
+
with st.expander("Chunking Strategy Examples"):
|
| 296 |
+
st.write("See how different websites structure their content, affecting chunking quality.")
|
| 297 |
+
st.error("**Bad Chunking Example (Few Structural Headers)**")
|
| 298 |
+
st.markdown("""
|
| 299 |
+
* [Wikipedia: Markdown](https://en.wikipedia.org/wiki/Markdown)
|
| 300 |
+
""")
|
| 301 |
+
st.success("**Good Chunking Examples (Clear, Hierarchical Headers)**")
|
| 302 |
+
st.markdown("""
|
| 303 |
+
* [The Blog Starter](https://www.theblogstarter.com/)
|
| 304 |
+
* [Google Safety Blog](https://blog.google/technology/safety-security/google-survey-digital-security-2025/)
|
| 305 |
+
* [HubSpot: What is a Blog?](https://blog.hubspot.com/marketing/what-is-a-blog)
|
| 306 |
+
""")
|
| 307 |
else:
|
| 308 |
chunk_ids = [c['id'] for c in chunks]
|
| 309 |
if st.session_state.selected_chunk_id not in chunk_ids:
|