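More bug fixes: bump the llm-apps image tag from v2-202602120526 to v2-202602120535 in the embeddings, llm, stt, and tts deployments; in llm.py, drop the `type="messages"` arguments and `show_copy_button` from the chat UI and wrap each ChatInterface example in its own list.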

This commit is contained in:
2026-02-12 05:36:15 -05:00
parent 72681217ef
commit b2d2252342
5 changed files with 8 additions and 11 deletions

View File

@@ -20,7 +20,7 @@ spec:
spec: spec:
containers: containers:
- name: gradio - name: gradio
image: ghcr.io/billy-davies-2/llm-apps:v2-202602120526 image: ghcr.io/billy-davies-2/llm-apps:v2-202602120535
imagePullPolicy: Always imagePullPolicy: Always
command: ["python", "embeddings.py"] command: ["python", "embeddings.py"]
ports: ports:

11
llm.py
View File

@@ -218,18 +218,15 @@ Chat with **Llama 3.1 70B** (AWQ INT4) served via vLLM on AMD Strix Halo (ROCm).
with gr.TabItem("💬 Chat"): with gr.TabItem("💬 Chat"):
chatbot = gr.ChatInterface( chatbot = gr.ChatInterface(
fn=chat_stream, fn=chat_stream,
type="messages",
additional_inputs=[system_prompt, temperature, max_tokens, top_p], additional_inputs=[system_prompt, temperature, max_tokens, top_p],
examples=[ examples=[
"Hello! What can you tell me about yourself?", ["Hello! What can you tell me about yourself?"],
"Explain how a GPU executes a matrix multiplication.", ["Explain how a GPU executes a matrix multiplication."],
"Write a Python function to compute the Fibonacci sequence.", ["Write a Python function to compute the Fibonacci sequence."],
"What are the pros and cons of running LLMs on AMD GPUs?", ["What are the pros and cons of running LLMs on AMD GPUs?"],
], ],
chatbot=gr.Chatbot( chatbot=gr.Chatbot(
height=520, height=520,
type="messages",
show_copy_button=True,
placeholder="Type a message to start chatting...", placeholder="Type a message to start chatting...",
), ),
) )

View File

@@ -20,7 +20,7 @@ spec:
spec: spec:
containers: containers:
- name: gradio - name: gradio
image: ghcr.io/billy-davies-2/llm-apps:v2-202602120526 image: ghcr.io/billy-davies-2/llm-apps:v2-202602120535
imagePullPolicy: Always imagePullPolicy: Always
command: ["python", "llm.py"] command: ["python", "llm.py"]
ports: ports:

View File

@@ -20,7 +20,7 @@ spec:
spec: spec:
containers: containers:
- name: gradio - name: gradio
image: ghcr.io/billy-davies-2/llm-apps:v2-202602120526 image: ghcr.io/billy-davies-2/llm-apps:v2-202602120535
imagePullPolicy: Always imagePullPolicy: Always
command: ["python", "stt.py"] command: ["python", "stt.py"]
ports: ports:

View File

@@ -20,7 +20,7 @@ spec:
spec: spec:
containers: containers:
- name: gradio - name: gradio
image: ghcr.io/billy-davies-2/llm-apps:v2-202602120526 image: ghcr.io/billy-davies-2/llm-apps:v2-202602120535
imagePullPolicy: Always imagePullPolicy: Always
command: ["python", "tts.py"] command: ["python", "tts.py"]
ports: ports: