Austin Stockbridge committed on
Commit
122221c
·
verified ·
1 Parent(s): bf9137e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +53 -11
app.py CHANGED
@@ -1,10 +1,11 @@
1
  from huggingface_hub import hf_hub_list, hf_hub_download
2
  from transformers import AutoModel, AutoTokenizer
 
3
 
4
- # Hugging Face model repository
5
  model_repo = "mradermacher/Qwen2-2B-RepleteCoder-DHM-GGUF"
6
 
7
- # Find files containing 'Q2_K'
8
  def find_q2_k_files(repo_id):
9
  files = hf_hub_list(repo_id)
10
  q2_k_files = [file for file in files if "Q2_K" in file.filename and file.filename.endswith(".gguf")]
@@ -12,16 +13,57 @@ def find_q2_k_files(repo_id):
12
  raise ValueError(f"No files containing 'Q2_K' found in the repository {repo_id}.")
13
  return q2_k_files
14
 
15
- # Download and load the desired model
16
- def load_q2_k_model(repo_id):
17
- q2_k_files = find_q2_k_files(repo_id)
18
- # For simplicity, load the first matching file
19
- chosen_file = q2_k_files[0]
20
- print(f"Loading model from: {chosen_file.filename}")
21
- model_path = hf_hub_download(repo_id, chosen_file.filename)
22
  model = AutoModel.from_pretrained(model_path)
23
  tokenizer = AutoTokenizer.from_pretrained(model_path)
24
  return model, tokenizer
25
 
26
- # Initialize the model
27
- model, tokenizer = load_q2_k_model(model_repo)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  from huggingface_hub import hf_hub_list, hf_hub_download
2
  from transformers import AutoModel, AutoTokenizer
3
+ import gradio as gr
4
 
5
+ # Hugging Face repository
6
  model_repo = "mradermacher/Qwen2-2B-RepleteCoder-DHM-GGUF"
7
 
8
# Step 1: List and filter GGUF files with 'Q2_K'
def find_q2_k_files(repo_id):
    """Return the repo files whose names contain 'Q2_K' and end in '.gguf'.

    Each entry is a lightweight object exposing a ``filename`` attribute so
    existing callers that read ``file.filename`` keep working.

    Raises:
        ValueError: if no matching file exists in the repository.
    """
    # hf_hub_list does not exist in huggingface_hub; list_repo_files is the
    # supported API and returns plain path strings, so we wrap each match to
    # preserve the .filename access pattern used elsewhere in this file.
    from huggingface_hub import list_repo_files
    from types import SimpleNamespace

    names = list_repo_files(repo_id)
    q2_k_files = [
        SimpleNamespace(filename=name)
        for name in names
        if "Q2_K" in name and name.endswith(".gguf")
    ]
    # Guard restored: the diff view dropped this line, leaving an
    # unconditional raise that would fire even when matches were found.
    if not q2_k_files:
        raise ValueError(f"No files containing 'Q2_K' found in the repository {repo_id}.")
    return q2_k_files
15
 
16
# Step 2: Load model and tokenizer
def load_q2_k_model(repo_id, filename):
    """Load the GGUF checkpoint *filename* from *repo_id*.

    Args:
        repo_id: Hugging Face repository id.
        filename: name of a .gguf file inside that repository.

    Returns:
        ``(model, tokenizer)`` tuple.
    """
    # from_pretrained cannot load a bare downloaded .gguf path (it looks for
    # config.json next to it); transformers' GGUF support takes the repo id
    # plus a gguf_file argument and handles the download itself, so the
    # explicit hf_hub_download step is unnecessary.
    model = AutoModel.from_pretrained(repo_id, gguf_file=filename)
    tokenizer = AutoTokenizer.from_pretrained(repo_id, gguf_file=filename)
    return model, tokenizer
22
 
23
# Step 3: Chatbot logic
def chat(messages, model, tokenizer):
    """Generate one assistant reply for a chat history.

    Args:
        messages: list of ``{"role": ..., "content": ...}`` dicts.
        model: a model exposing ``generate(**encoded)``.
        tokenizer: a tokenizer callable returning tensors and exposing
            ``decode``.

    Returns:
        The decoded generation as a string.
    """
    # Assemble the ChatML-style prompt; inject a default system turn when
    # the history does not start with one.
    pieces = []
    if messages and messages[0]['role'] != 'system':
        pieces.append("<|im_start|>system You are a helpful assistant<|im_end|> ")
    for turn in messages:
        pieces.append(f"<|im_start|>{turn['role']} {turn['content']}<|im_end|> ")
    pieces.append("<|im_start|>assistant ")
    prompt = "".join(pieces)

    encoded = tokenizer(prompt, return_tensors="pt")
    generated = model.generate(**encoded)
    return tokenizer.decode(generated[0], skip_special_tokens=True)
37
+
38
# Step 4: Gradio Interface
def chatbot_interface(selected_file, chat_history):
    """Produce the assistant's next turn and append it to the history.

    Returns the history twice: once for the Chatbot display and once for
    the State component.
    """
    # The model is (re)loaded on every call so the dropdown selection
    # always takes effect.
    model, tokenizer = load_q2_k_model(model_repo, selected_file)
    reply = chat(chat_history, model, tokenizer)
    assistant_turn = {"role": "assistant", "content": reply}
    chat_history.append(assistant_turn)
    return chat_history, chat_history
45
+
46
# Step 5: Build the UI
q2_k_files = find_q2_k_files(model_repo)
file_options = [file.filename for file in q2_k_files]

with gr.Blocks() as demo:
    gr.Markdown("# Hugging Face Q2_K Chatbot")
    model_selector = gr.Dropdown(choices=file_options, label="Select Model File")
    chat_history = gr.State([])
    # type="messages" makes gr.Chatbot accept the {"role", "content"} dicts
    # this app stores in chat_history; the default tuple format would not
    # render them. (Requires a gradio version that supports the type kwarg.)
    chatbot = gr.Chatbot(type="messages")
    user_input = gr.Textbox(label="Your Message")
    send_button = gr.Button("Send")

    # Append the user's turn, then delegate to chatbot_interface, which
    # loads the selected model and appends the assistant reply.
    def update_chat(history, user_message, selected_file):
        history.append({"role": "user", "content": user_message})
        return chatbot_interface(selected_file, history)

    send_button.click(
        update_chat,
        inputs=[chat_history, user_input, model_selector],
        outputs=[chatbot, chat_history],
    )

demo.launch()