Spaces:
Running on CPU Upgrade

File size: 2,051 Bytes
a225caf
7360ef0
2064a53
7360ef0
a225caf
 
 
ae9601e
 
 
 
7360ef0
ae9601e
 
7360ef0
a225caf
ae9601e
257403d
 
 
 
 
 
7360ef0
a225caf
 
7360ef0
a225caf
 
7360ef0
a225caf
 
7360ef0
 
a225caf
 
7360ef0
a225caf
 
7360ef0
a225caf
 
 
2064a53
 
 
 
 
a225caf
7360ef0
a225caf
7360ef0
a225caf
7360ef0
a225caf
7360ef0
a225caf
7360ef0
 
 
a225caf
7360ef0
a225caf
7360ef0
 
a225caf
7360ef0
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
import gradio as gr
from gradio_client import Client, handle_file

# Maps the display name offered in the model dropdown to the identifier handed
# to `Client(...)` in `set_client_for_session` (presumably a Hugging Face Space
# id -- confirm against the gradio_client docs).
MODELS = {"SmolVLM-Instruct": "akhaliq/SmolVLM-Instruct"}


def create_chat_fn(client):
    """Build a chat callback that forwards each turn to a remote ``/chat`` endpoint.

    Args:
        client: Object exposing ``predict(**kwargs)``. In this file it is the
            ``Client`` instance produced by ``set_client_for_session``.

    Returns:
        A ``chat(message, history)`` function that returns whatever
        ``client.predict`` returns.
    """

    def chat(message, history):
        """Send one user turn to the remote endpoint and return its reply.

        Args:
            message: Either a mapping with optional ``"text"`` and ``"files"``
                entries, or a plain string that is treated as text with no
                attachments.
            history: Accepted to match the callback signature; it is not
                forwarded to the remote endpoint.
        """
        if isinstance(message, str):
            # Text-only callers pass a bare string rather than a mapping.
            text, files = message, []
        else:
            # `or` (instead of a `.get` default) also covers keys that are
            # present but set to None, which would otherwise break iteration.
            text = message.get("text") or ""
            files = message.get("files") or []

        # Wrap each upload so the client can transfer it to the remote app.
        processed_files = [handle_file(f) for f in files]

        response = client.predict(
            message={"text": text, "files": processed_files},
            system_prompt="You are a helpful AI assistant.",
            temperature=0.7,
            max_new_tokens=1024,
            top_k=40,
            repetition_penalty=1.1,
            top_p=0.95,
            api_name="/chat",
        )
        return response

    return chat


def set_client_for_session(model_name, request: gr.Request):
    """Create a ``Client`` for the chosen model, passing along the caller's IP token.

    Args:
        model_name: Key into ``MODELS`` selecting which remote app to connect to.
        request: Incoming request object; its ``x-ip-token`` header, when
            present and non-empty, is forwarded as ``X-IP-Token``.

    Returns:
        A ``Client`` bound to ``MODELS[model_name]``.

    Raises:
        KeyError: If ``model_name`` is not a key of ``MODELS``.
    """
    # Only read headers when a request object that actually carries them was supplied.
    has_headers = request and hasattr(request, "headers")
    ip_token = request.headers.get("x-ip-token") if has_headers else None

    # No token (missing or empty) means no extra headers at all.
    forwarded = {"X-IP-Token": ip_token} if ip_token else {}
    return Client(MODELS[model_name], headers=forwarded)


def safe_chat_fn(message, history, client):
    """Run one chat turn, turning any failure into an error string.

    Args:
        message: The user's message, passed through to the chat callback.
        history: Prior conversation, passed through to the chat callback.
        client: The remote client to use, or ``None`` if none has been set up.

    Returns:
        The chat callback's result on success; otherwise a human-readable
        error message (also printed when an exception was caught).
    """
    if client is not None:
        try:
            chat = create_chat_fn(client)
            return chat(message, history)
        except Exception as exc:
            # Surface the failure in the chat window instead of raising.
            failure = f"Error during chat: {str(exc)}"
            print(failure)
            return failure

    return "Error: Client not initialized. Please refresh the page."


# UI definition: a model selector plus a multimodal chat whose callback is
# `safe_chat_fn`. Components are created in display order inside the Blocks
# context, so the statement order below matters.
with gr.Blocks() as demo:

    # State slot for the remote Client. It is written by the two
    # `set_client_for_session` hooks below and handed to `safe_chat_fn` as an
    # extra input; presumably None until the load hook has run, which
    # `safe_chat_fn` reports as "Client not initialized".
    client = gr.State()

    # Choices are the keys of MODELS; the initial value is given as a literal.
    model_dropdown = gr.Dropdown(
        choices=list(MODELS.keys()), value="SmolVLM-Instruct", label="Select Model", interactive=True
    )

    # `additional_inputs=[client]` supplies the third argument of `safe_chat_fn`.
    chat_interface = gr.ChatInterface(fn=safe_chat_fn, additional_inputs=[client], multimodal=True)

    # Update client when model changes
    model_dropdown.change(fn=set_client_for_session, inputs=[model_dropdown], outputs=[client])

    # Initialize client on page load
    # NOTE(review): the input is a fresh State holding the default model name
    # rather than the dropdown itself, so this literal must be kept in sync
    # with the dropdown's `value` above.
    demo.load(fn=set_client_for_session, inputs=[gr.State("SmolVLM-Instruct")], outputs=[client])

# Start the app only when the file is executed as a script.
if __name__ == "__main__":
    demo.launch()