File size: 1,121 Bytes
d78fda0
621bb5d
d78fda0
 
ae103bc
a3766e8
ae103bc
106eff3
ae103bc
621bb5d
 
 
 
 
d78fda0
 
ae103bc
 
 
 
a3766e8
24e5396
ae103bc
 
 
 
 
a3766e8
24e5396
ae103bc
a3766e8
 
ae103bc
24e5396
fb9ccfe
ae103bc
 
fb9ccfe
 
d78fda0
fb9ccfe
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
import streamlit as st
from transformers import pipeline
from PIL import Image

# --- Page setup -------------------------------------------------------------
st.set_page_config(page_title="TinyLLaVA Snapshot Q&A", layout="centered")
st.title("πŸ“Έ TinyLLaVA β€” Snapshot Q&A (Spaces Safe)")


# --- Model -------------------------------------------------------------------
@st.cache_resource(show_spinner="Loading TinyLLaVA model...")
def _load_pipeline():
    """Build the image-to-text pipeline exactly once per server process.

    Streamlit re-runs this entire script on every widget interaction;
    without ``st.cache_resource`` the multi-GB model would be re-downloaded
    and re-instantiated on every rerun, making the app unusable.

    Returns:
        A ``transformers`` image-to-text pipeline running on CPU
        (device_map="cpu" keeps it within the Spaces free-tier limits).
    """
    return pipeline(
        task="image-to-text",
        model="bczhou/tiny-llava-v1-hf",
        trust_remote_code=True,
        device_map="cpu",
    )


pipe = _load_pipeline()

# πŸ‘‡ Clear info so the widget tree is stable
st.markdown("Use your **webcam** OR upload a file:")

# Try webcam first
image = st.camera_input("πŸ“· Take a snapshot")

# Fallback uploader
if not image:
    image = st.file_uploader("πŸ“‚ Or upload an image", type=["jpg", "png", "jpeg"])

# Prompt
prompt = st.text_input("πŸ’¬ Your question:", value="Describe this scene.")

# Run TinyLLaVA
if image is not None and prompt:
    img = Image.open(image).convert("RGB")
    # NOTE(review): use_column_width is deprecated in recent Streamlit in
    # favor of use_container_width — kept as-is for older-version compat.
    st.image(img, caption="Your Image", use_column_width=True)

    # LLaVA chat template: the <image> token marks where pixels are injected.
    query = f"USER: <image>\n{prompt}\nASSISTANT:"

    with st.spinner("Generating..."):
        # BUG FIX: ImageToTextPipeline takes the image as its first argument
        # and the text via the `prompt=` keyword. The original call
        # `pipe(query, img)` passed the prompt string where the image goes,
        # so the pipeline would try to load the question text as an
        # image path/URL and crash.
        result = pipe(img, prompt=query)
        answer = result[0]["generated_text"]

    st.subheader("πŸ“ Answer")
    st.write(answer)