Em4e committed on
Commit
a1361c0
·
verified ·
1 Parent(s): e6e0447

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -0
app.py CHANGED
@@ -292,6 +292,18 @@ if st.session_state.status_message:
292
  chunks = manager.get_chunks()
293
  if not chunks:
294
  st.write("Process a URL to begin editing content chunks, or adjust settings in the sidebar.")
 
 
 
 
 
 
 
 
 
 
 
 
295
  else:
296
  chunk_ids = [c['id'] for c in chunks]
297
  if st.session_state.selected_chunk_id not in chunk_ids:
 
292
  chunks = manager.get_chunks()
293
  if not chunks:
294
  st.write("Process a URL to begin editing content chunks, or adjust settings in the sidebar.")
295
+ with st.expander("Chunking Strategy Examples"):
296
+ st.write("See how different websites structure their content, affecting chunking quality.")
297
+ st.error("**Bad Chunking Example (Few Structural Headers)**")
298
+ st.markdown("""
299
+ * [Wikipedia: Markdown](https://en.wikipedia.org/wiki/Markdown)
300
+ """)
301
+ st.success("**Good Chunking Examples (Clear, Hierarchical Headers)**")
302
+ st.markdown("""
303
+ * [The Blog Starter](https://www.theblogstarter.com/)
304
+ * [Google Safety Blog](https://blog.google/technology/safety-security/google-survey-digital-security-2025/)
305
+ * [HubSpot: What is a Blog?](https://blog.hubspot.com/marketing/what-is-a-blog)
306
+ """)
307
  else:
308
  chunk_ids = [c['id'] for c in chunks]
309
  if st.session_state.selected_chunk_id not in chunk_ids: