awacke1 commited on
Commit
e081c7c
·
verified ·
1 Parent(s): 3d5a413

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +64 -69
app.py CHANGED
@@ -59,8 +59,8 @@ if 'model_loaded' not in st.session_state:
59
  st.session_state['model_loaded'] = False
60
  if 'processing' not in st.session_state:
61
  st.session_state['processing'] = {}
62
- if 'pdf_checkboxes' not in st.session_state:
63
- st.session_state['pdf_checkboxes'] = {}
64
  if 'downloaded_pdfs' not in st.session_state:
65
  st.session_state['downloaded_pdfs'] = {}
66
 
@@ -329,7 +329,7 @@ def get_model_files(model_type="causal_lm"):
329
  path = "models/*" if model_type == "causal_lm" else "diffusion_models/*"
330
  return [d for d in glob.glob(path) if os.path.isdir(d)]
331
 
332
- def get_gallery_files(file_types=["png"]):
333
  return sorted([f for ext in file_types for f in glob.glob(f"*.{ext}")])
334
 
335
  def get_pdf_files():
@@ -367,11 +367,11 @@ async def process_pdf_snapshot(pdf_path, mode="single"):
367
  output_file = generate_filename(f"twopage_{i}", "png")
368
  pix.save(output_file)
369
  output_files.append(output_file)
370
- elif mode == "allthumbs":
371
  for i in range(len(doc)):
372
  page = doc[i]
373
- pix = page.get_pixmap(matrix=fitz.Matrix(0.5, 0.5))
374
- output_file = generate_filename(f"thumb_{i}", "png")
375
  pix.save(output_file)
376
  output_files.append(output_file)
377
  doc.close()
@@ -506,19 +506,56 @@ def calculate_cargo_travel_time(origin_coords: Tuple[float, float], destination_
506
  st.title("AI Vision & SFT Titans 🚀")
507
 
508
  st.sidebar.header("Captured Files 📜")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
509
  gallery_size = st.sidebar.slider("Gallery Size", 1, 10, 2)
510
  def update_gallery():
511
- media_files = get_gallery_files(["png"])
512
- pdf_files = get_pdf_files()
513
- if media_files or pdf_files:
514
- st.sidebar.subheader("Images 📸")
515
  cols = st.sidebar.columns(2)
516
- for idx, file in enumerate(media_files[:gallery_size * 2]):
517
  with cols[idx % 2]:
518
- st.image(Image.open(file), caption=os.path.basename(file), use_container_width=True)
519
- st.sidebar.subheader("PDF Downloads 📖")
520
- for pdf_file in pdf_files[:gallery_size * 2]:
521
- st.markdown(get_download_link(pdf_file, "application/pdf", f"📥 Grab {os.path.basename(pdf_file)}"), unsafe_allow_html=True)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
522
  update_gallery()
523
 
524
  st.sidebar.subheader("Model Management 🗂️")
@@ -625,44 +662,12 @@ with tab2:
625
  status_text.text("Robo-Download complete! 🚀")
626
  update_gallery()
627
 
628
- st.subheader("PDF Gallery 📖")
629
- downloaded_pdfs = list(st.session_state['downloaded_pdfs'].values())
630
- if downloaded_pdfs:
631
- cols_per_row = 3
632
- for i in range(0, len(downloaded_pdfs), cols_per_row):
633
- cols = st.columns(cols_per_row)
634
- for j, pdf_path in enumerate(downloaded_pdfs[i:i + cols_per_row]):
635
- with cols[j]:
636
- doc = fitz.open(pdf_path)
637
- page = doc[0]
638
- pix = page.get_pixmap(matrix=fitz.Matrix(0.5, 0.5))
639
- img = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)
640
- st.image(img, caption=os.path.basename(pdf_path), use_container_width=True)
641
- checkbox_key = f"pdf_{pdf_path}"
642
- st.session_state['pdf_checkboxes'][checkbox_key] = st.checkbox(
643
- "Use for SFT/Input",
644
- value=st.session_state['pdf_checkboxes'].get(checkbox_key, False),
645
- key=checkbox_key
646
- )
647
- st.markdown(get_download_link(pdf_path, "application/pdf", "Snag It! 📥"), unsafe_allow_html=True)
648
- if st.button("Zap It! 🗑️", key=f"delete_{pdf_path}"):
649
- os.remove(pdf_path)
650
- url_key = next((k for k, v in st.session_state['downloaded_pdfs'].items() if v == pdf_path), None)
651
- if url_key:
652
- del st.session_state['downloaded_pdfs'][url_key]
653
- del st.session_state['pdf_checkboxes'][checkbox_key]
654
- st.success(f"PDF {os.path.basename(pdf_path)} vaporized! 💨")
655
- st.rerun()
656
- doc.close()
657
- else:
658
- st.info("No PDFs captured yet. Feed the robo-downloader some URLs! 🤖")
659
-
660
- mode = st.selectbox("Snapshot Mode", ["Single Page (High-Res)", "Two Pages (High-Res)", "All Pages (Thumbnails)"], key="download_mode")
661
  if st.button("Snapshot Selected 📸"):
662
- selected_pdfs = [path for key, path in st.session_state['downloaded_pdfs'].items() if st.session_state['pdf_checkboxes'].get(f"pdf_{path}", False)]
663
  if selected_pdfs:
664
  for pdf_path in selected_pdfs:
665
- mode_key = {"Single Page (High-Res)": "single", "Two Pages (High-Res)": "twopage", "All Pages (Thumbnails)": "allthumbs"}[mode]
666
  snapshots = asyncio.run(process_pdf_snapshot(pdf_path, mode_key))
667
  for snapshot in snapshots:
668
  st.image(Image.open(snapshot), caption=snapshot, use_container_width=True)
@@ -727,12 +732,9 @@ with tab4:
727
  st.markdown(get_download_link(zip_path, "application/zip", "Download Fine-Tuned Titan"), unsafe_allow_html=True)
728
  st.rerun()
729
  elif isinstance(st.session_state['builder'], DiffusionBuilder):
730
- captured_files = get_gallery_files(["png"])
731
- selected_pdfs = [path for key, path in st.session_state['downloaded_pdfs'].items() if st.session_state['pdf_checkboxes'].get(f"pdf_{path}", False)]
732
- if len(captured_files) + len(selected_pdfs) >= 2:
733
- demo_data = [{"image": img, "text": f"Superhero {os.path.basename(img).split('.')[0]}"} for img in captured_files]
734
- for pdf_path in selected_pdfs:
735
- demo_data.append({"image": pdf_path, "text": f"PDF {os.path.basename(pdf_path)}"})
736
  edited_data = st.data_editor(pd.DataFrame(demo_data), num_rows="dynamic")
737
  if st.button("Fine-Tune with Dataset 🔄"):
738
  images = [Image.open(row["image"]) if row["image"].endswith('.png') else Image.frombytes("RGB", fitz.open(row["image"])[0].get_pixmap(matrix=fitz.Matrix(2.0, 2.0)).size, fitz.open(row["image"])[0].get_pixmap(matrix=fitz.Matrix(2.0, 2.0)).samples) for _, row in edited_data.iterrows()]
@@ -785,7 +787,6 @@ with tab5:
785
  status_container.empty()
786
  elif isinstance(st.session_state['builder'], DiffusionBuilder):
787
  test_prompt = st.text_area("Enter Test Prompt", "Neon Batman")
788
- selected_pdfs = [path for key, path in st.session_state['downloaded_pdfs'].items() if st.session_state['pdf_checkboxes'].get(f"pdf_{path}", False)]
789
  if st.button("Run Test ▶️"):
790
  image = st.session_state['builder'].generate(test_prompt)
791
  output_file = generate_filename("diffusion_test", "png")
@@ -828,9 +829,7 @@ with tab6:
828
 
829
  with tab7:
830
  st.header("Test OCR 🔍")
831
- captured_files = get_gallery_files(["png"])
832
- selected_pdfs = [path for key, path in st.session_state['downloaded_pdfs'].items() if st.session_state['pdf_checkboxes'].get(f"pdf_{path}", False)]
833
- all_files = captured_files + selected_pdfs
834
  if all_files:
835
  selected_file = st.selectbox("Select Image or PDF", all_files, key="ocr_select")
836
  if selected_file:
@@ -853,13 +852,11 @@ with tab7:
853
  st.success(f"OCR output saved to {output_file}")
854
  st.session_state['processing']['ocr'] = False
855
  else:
856
- st.warning("No images or PDFs captured yet. Use Camera Snap or Download PDFs first!")
857
 
858
  with tab8:
859
  st.header("Test Image Gen 🎨")
860
- captured_files = get_gallery_files(["png"])
861
- selected_pdfs = [path for key, path in st.session_state['downloaded_pdfs'].items() if st.session_state['pdf_checkboxes'].get(f"pdf_{path}", False)]
862
- all_files = captured_files + selected_pdfs
863
  if all_files:
864
  selected_file = st.selectbox("Select Image or PDF", all_files, key="gen_select")
865
  if selected_file:
@@ -883,14 +880,12 @@ with tab8:
883
  st.success(f"Image saved to {output_file}")
884
  st.session_state['processing']['gen'] = False
885
  else:
886
- st.warning("No images or PDFs captured yet. Use Camera Snap or Download PDFs first!")
887
 
888
  with tab9:
889
  st.header("Custom Diffusion 🎨🤓")
890
  st.write("Unleash your inner artist with our tiny diffusion models!")
891
- captured_files = get_gallery_files(["png"])
892
- selected_pdfs = [path for key, path in st.session_state['downloaded_pdfs'].items() if st.session_state['pdf_checkboxes'].get(f"pdf_{path}", False)]
893
- all_files = captured_files + selected_pdfs
894
  if all_files:
895
  st.subheader("Select Images or PDFs to Train")
896
  selected_files = st.multiselect("Pick Images or PDFs", all_files, key="diffusion_select")
@@ -929,6 +924,6 @@ with tab9:
929
  st.success(f"Image saved to {output_file}")
930
  st.session_state['processing']['diffusion'] = False
931
  else:
932
- st.warning("No images or PDFs captured yet. Use Camera Snap or Download PDFs first!")
933
 
934
  update_gallery()
 
59
  st.session_state['model_loaded'] = False
60
  if 'processing' not in st.session_state:
61
  st.session_state['processing'] = {}
62
+ if 'asset_checkboxes' not in st.session_state:
63
+ st.session_state['asset_checkboxes'] = {}
64
  if 'downloaded_pdfs' not in st.session_state:
65
  st.session_state['downloaded_pdfs'] = {}
66
 
 
329
  path = "models/*" if model_type == "causal_lm" else "diffusion_models/*"
330
  return [d for d in glob.glob(path) if os.path.isdir(d)]
331
 
332
+ def get_gallery_files(file_types=["png", "pdf"]):
333
  return sorted([f for ext in file_types for f in glob.glob(f"*.{ext}")])
334
 
335
  def get_pdf_files():
 
367
  output_file = generate_filename(f"twopage_{i}", "png")
368
  pix.save(output_file)
369
  output_files.append(output_file)
370
+ elif mode == "allpages":
371
  for i in range(len(doc)):
372
  page = doc[i]
373
+ pix = page.get_pixmap(matrix=fitz.Matrix(2.0, 2.0))
374
+ output_file = generate_filename(f"page_{i}", "png")
375
  pix.save(output_file)
376
  output_files.append(output_file)
377
  doc.close()
 
506
  st.title("AI Vision & SFT Titans 🚀")
507
 
508
  st.sidebar.header("Captured Files 📜")
509
+ cols = st.sidebar.columns(2)
510
+ with cols[0]:
511
+ if st.button("Zip All 🤐"):
512
+ zip_path = f"all_assets_{int(time.time())}.zip"
513
+ with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zipf:
514
+ for file in get_gallery_files():
515
+ zipf.write(file, os.path.basename(file))
516
+ st.sidebar.markdown(get_download_link(zip_path, "application/zip", "Download All Assets"), unsafe_allow_html=True)
517
+ with cols[1]:
518
+ if st.button("Zap All! 🗑️"):
519
+ for file in get_gallery_files():
520
+ os.remove(file)
521
+ st.session_state['asset_checkboxes'].clear()
522
+ st.session_state['downloaded_pdfs'].clear()
523
+ st.sidebar.success("All assets vaporized! 💨")
524
+ st.rerun()
525
+
526
  gallery_size = st.sidebar.slider("Gallery Size", 1, 10, 2)
527
  def update_gallery():
528
+ all_files = get_gallery_files()
529
+ if all_files:
530
+ st.sidebar.subheader("Asset Gallery 📸📖")
 
531
  cols = st.sidebar.columns(2)
532
+ for idx, file in enumerate(all_files[:gallery_size * 2]):
533
  with cols[idx % 2]:
534
+ if file.endswith('.png'):
535
+ st.image(Image.open(file), caption=os.path.basename(file), use_container_width=True)
536
+ else:
537
+ doc = fitz.open(file)
538
+ pix = doc[0].get_pixmap(matrix=fitz.Matrix(0.5, 0.5))
539
+ img = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)
540
+ st.image(img, caption=os.path.basename(file), use_container_width=True)
541
+ doc.close()
542
+ checkbox_key = f"asset_{file}"
543
+ st.session_state['asset_checkboxes'][checkbox_key] = st.checkbox(
544
+ "Use for SFT/Input",
545
+ value=st.session_state['asset_checkboxes'].get(checkbox_key, False),
546
+ key=checkbox_key
547
+ )
548
+ mime_type = "image/png" if file.endswith('.png') else "application/pdf"
549
+ st.markdown(get_download_link(file, mime_type, "Snag It! 📥"), unsafe_allow_html=True)
550
+ if st.button("Zap It! 🗑️", key=f"delete_{file}"):
551
+ os.remove(file)
552
+ del st.session_state['asset_checkboxes'][checkbox_key]
553
+ if file.endswith('.pdf'):
554
+ url_key = next((k for k, v in st.session_state['downloaded_pdfs'].items() if v == file), None)
555
+ if url_key:
556
+ del st.session_state['downloaded_pdfs'][url_key]
557
+ st.sidebar.success(f"Asset {os.path.basename(file)} vaporized! 💨")
558
+ st.rerun()
559
  update_gallery()
560
 
561
  st.sidebar.subheader("Model Management 🗂️")
 
662
  status_text.text("Robo-Download complete! 🚀")
663
  update_gallery()
664
 
665
+ mode = st.selectbox("Snapshot Mode", ["Single Page (High-Res)", "Two Pages (High-Res)", "All Pages (High-Res)"], key="download_mode")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
666
  if st.button("Snapshot Selected 📸"):
667
+ selected_pdfs = [path for path in get_gallery_files() if path.endswith('.pdf') and st.session_state['asset_checkboxes'].get(f"asset_{path}", False)]
668
  if selected_pdfs:
669
  for pdf_path in selected_pdfs:
670
+ mode_key = {"Single Page (High-Res)": "single", "Two Pages (High-Res)": "twopage", "All Pages (High-Res)": "allpages"}[mode]
671
  snapshots = asyncio.run(process_pdf_snapshot(pdf_path, mode_key))
672
  for snapshot in snapshots:
673
  st.image(Image.open(snapshot), caption=snapshot, use_container_width=True)
 
732
  st.markdown(get_download_link(zip_path, "application/zip", "Download Fine-Tuned Titan"), unsafe_allow_html=True)
733
  st.rerun()
734
  elif isinstance(st.session_state['builder'], DiffusionBuilder):
735
+ selected_files = [path for path in get_gallery_files() if st.session_state['asset_checkboxes'].get(f"asset_{path}", False)]
736
+ if len(selected_files) >= 2:
737
+ demo_data = [{"image": file, "text": f"Asset {os.path.basename(file).split('.')[0]}"} for file in selected_files]
 
 
 
738
  edited_data = st.data_editor(pd.DataFrame(demo_data), num_rows="dynamic")
739
  if st.button("Fine-Tune with Dataset 🔄"):
740
  images = [Image.open(row["image"]) if row["image"].endswith('.png') else Image.frombytes("RGB", fitz.open(row["image"])[0].get_pixmap(matrix=fitz.Matrix(2.0, 2.0)).size, fitz.open(row["image"])[0].get_pixmap(matrix=fitz.Matrix(2.0, 2.0)).samples) for _, row in edited_data.iterrows()]
 
787
  status_container.empty()
788
  elif isinstance(st.session_state['builder'], DiffusionBuilder):
789
  test_prompt = st.text_area("Enter Test Prompt", "Neon Batman")
 
790
  if st.button("Run Test ▶️"):
791
  image = st.session_state['builder'].generate(test_prompt)
792
  output_file = generate_filename("diffusion_test", "png")
 
829
 
830
  with tab7:
831
  st.header("Test OCR 🔍")
832
+ all_files = [path for path in get_gallery_files() if st.session_state['asset_checkboxes'].get(f"asset_{path}", False)]
 
 
833
  if all_files:
834
  selected_file = st.selectbox("Select Image or PDF", all_files, key="ocr_select")
835
  if selected_file:
 
852
  st.success(f"OCR output saved to {output_file}")
853
  st.session_state['processing']['ocr'] = False
854
  else:
855
+ st.warning("No images or PDFs selected yet. Check some boxes in the sidebar gallery!")
856
 
857
  with tab8:
858
  st.header("Test Image Gen 🎨")
859
+ all_files = [path for path in get_gallery_files() if st.session_state['asset_checkboxes'].get(f"asset_{path}", False)]
 
 
860
  if all_files:
861
  selected_file = st.selectbox("Select Image or PDF", all_files, key="gen_select")
862
  if selected_file:
 
880
  st.success(f"Image saved to {output_file}")
881
  st.session_state['processing']['gen'] = False
882
  else:
883
+ st.warning("No images or PDFs selected yet. Check some boxes in the sidebar gallery!")
884
 
885
  with tab9:
886
  st.header("Custom Diffusion 🎨🤓")
887
  st.write("Unleash your inner artist with our tiny diffusion models!")
888
+ all_files = [path for path in get_gallery_files() if st.session_state['asset_checkboxes'].get(f"asset_{path}", False)]
 
 
889
  if all_files:
890
  st.subheader("Select Images or PDFs to Train")
891
  selected_files = st.multiselect("Pick Images or PDFs", all_files, key="diffusion_select")
 
924
  st.success(f"Image saved to {output_file}")
925
  st.session_state['processing']['diffusion'] = False
926
  else:
927
+ st.warning("No images or PDFs selected yet. Check some boxes in the sidebar gallery!")
928
 
929
  update_gallery()