Skip to content

Commit a71753e

Browse files
committed
feat: added minikube, oke deployment, standard k8s readme, and updated local rag agent with more debug options
1 parent ac1a470 commit a71753e

File tree

1 file changed

+24
-13
lines changed

1 file changed

+24
-13
lines changed

agentic_rag/gradio_app.py

Lines changed: 24 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -319,27 +319,35 @@ def create_interface():
319319
Choose your preferred model for the conversation.
320320
""")
321321

322-
model_dropdown = gr.Dropdown(
323-
choices=model_choices,
324-
value=default_model,
325-
label="Select Model",
326-
info="Choose the model to use for the conversation"
327-
)
322+
with gr.Row():
323+
with gr.Column():
324+
model_dropdown = gr.Dropdown(
325+
choices=model_choices,
326+
value=default_model,
327+
label="Select Model",
328+
info="Choose the model to use for the conversation"
329+
)
330+
download_button = gr.Button("Download Selected Model")
331+
model_status = gr.Textbox(
332+
label="Download Status",
333+
placeholder="Select a model and click Download to begin...",
334+
interactive=False
335+
)
328336

329337
# Add model FAQ section
330338
gr.Markdown("""
331339
## Model FAQ
332340
333341
| Model | Parameters | Size | Download Command |
334342
|-------|------------|------|------------------|
335-
| qwq | 7B | 4.1GB | qwq:latest |
336-
| gemma3 | 7B | 4.1GB | gemma3:latest |
337-
| llama3.3 | 7B | 4.1GB | llama3.3:latest |
338-
| phi4 | 7B | 4.1GB | phi4:latest |
343+
| qwq | 32B | 20GB | qwq:latest |
344+
| gemma3 | 4B | 3.3GB | gemma3:latest |
345+
| llama3.3 | 70B | 43GB | llama3.3:latest |
346+
| phi4 | 14B | 9.1GB | phi4:latest |
339347
| mistral | 7B | 4.1GB | mistral:latest |
340-
| llava | 7B | 4.1GB | llava:latest |
341-
| phi3 | 7B | 4.1GB | phi3:latest |
342-
| deepseek-r1 | 7B | 4.1GB | deepseek-r1:latest |
348+
| llava | 7B | 4.5GB | llava:latest |
349+
| phi3 | 4B | 4.0GB | phi3:latest |
350+
| deepseek-r1 | 7B | 4.7GB | deepseek-r1:latest |
343351
344352
Note: All models are available through Ollama. Make sure Ollama is running on your system.
345353
""")
@@ -434,6 +442,9 @@ def create_interface():
434442
url_button.click(process_url, inputs=[url_input], outputs=[url_output])
435443
repo_button.click(process_repo, inputs=[repo_input], outputs=[repo_output])
436444

445+
# Model download event handler
446+
download_button.click(download_model, inputs=[model_dropdown], outputs=[model_status])
447+
437448
# Standard chat handlers
438449
standard_msg.submit(
439450
chat,

0 commit comments

Comments
 (0)