Spaces:

AI-RESEARCHER-2024
/

CHAT-PDF

Build error

App Files Files Community

AI-RESEARCHER-2024 committed on Oct 31, 2024

Commit

bcc34fe

verified ·

1 Parent(s): f29c5c3

Update app.py

Browse files

Files changed (1) hide show

app.py +35 -20

app.py CHANGED Viewed

@@ -21,12 +21,21 @@ class RAGInterface:
             embedding_function=self.embeddings
         )
-        # Initialize LLM
-        self.llm = Llama.from_pretrained(
-            repo_id="bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
-            filename="Meta-Llama-3.1-8B-Instruct-Q4_K_M.gguf",
-            n_ctx=2048
-        )
         # Define RAG prompt template
         self.template = """Answer the question based only on the following context:
@@ -43,7 +52,20 @@ class RAGInterface:
         """
         self.prompt = PromptTemplate.from_template(self.template)
-    def respond(self, message, history, system_message, temperature,max_tokens=2048):
         # Build messages list
         messages = [{"role": "system", "content": system_message}]
         for user_msg, assistant_msg in history:
@@ -161,14 +183,12 @@ class RAGInterface:
                     label="System Message",
                     elem_classes="control-panel"
                 ),
-                # gr.Slider(
-                #     minimum=1,
-                #     maximum=2048,
-                #     value=512,
-                #     step=1,
-                #     label="Max New Tokens",
-                #     elem_classes="control-panel"
-                # ),
                 gr.Slider(
                     minimum=0.1,
                     maximum=1.0,
@@ -180,11 +200,6 @@ class RAGInterface:
             ],
             title="",  # Title is handled in custom HTML
             description="Ask questions about Computers and get AI-powered answers.",
-            # examples=[
-            #     "What is a Computer?",
-            #     "How does machine learning work?",
-            #     "Explain artificial intelligence.",
-            # ],
             theme=gr.themes.Default(),
         )

             embedding_function=self.embeddings
         )
+        # Model configurations
+        self.model_configs = {
+            "Llama 3.2 3B (Fast, Less Accurate)": {
+                "repo_id": "bartowski/Llama-3.2-3B-Instruct-GGUF",
+                "filename": "Llama-3.2-3B-Instruct-Q6_K.gguf",
+            },
+            "Llama 3.1 8B (Slower, More Accurate)": {
+                "repo_id": "bartowski/Meta-Llama-3.1-8B-Instruct-GGUF",
+                "filename": "Meta-Llama-3.1-8B-Instruct-Q4_K_M.gguf",
+            }
+        }
+        # Initialize with default model
+        self.current_model = "Llama 3.1 8B (Slower, More Accurate)"
+        self.load_model(self.current_model)
         # Define RAG prompt template
         self.template = """Answer the question based only on the following context:
         """
         self.prompt = PromptTemplate.from_template(self.template)
+    def load_model(self, model_name):
+        config = self.model_configs[model_name]
+        self.llm = Llama.from_pretrained(
+            repo_id=config["repo_id"],
+            filename=config["filename"],
+            n_ctx=2048
+        )
+        self.current_model = model_name
+    def respond(self, message, history, system_message, model_choice, temperature, max_tokens=2048):
+        # Load new model if different from current
+        if model_choice != self.current_model:
+            self.load_model(model_choice)
         # Build messages list
         messages = [{"role": "system", "content": system_message}]
         for user_msg, assistant_msg in history:
                     label="System Message",
                     elem_classes="control-panel"
                 ),
+                gr.Dropdown(
+                    choices=list(self.model_configs.keys()),
+                    value=self.current_model,
+                    label="Select Model",
+                    elem_classes="control-panel"
+                ),
                 gr.Slider(
                     minimum=0.1,
                     maximum=1.0,
             ],
             title="",  # Title is handled in custom HTML
             description="Ask questions about Computers and get AI-powered answers.",
             theme=gr.themes.Default(),
         )