Spaces: Reality123b committed "Update app.py"

app.py CHANGED
@@ -29,8 +29,8 @@ class XylariaChat:
             raise ValueError("HuggingFace token not found in environment variables")
 
         self.client = InferenceClient(
-            model="Qwen/
-
+            model="Qwen/Qwen-32B-Preview", # Corrected model name
+            token=self.hf_token # Changed api_key to token
         )
 
         self.image_api_url = "https://api-inference.huggingface.co/models/Salesforce/blip-image-captioning-large"
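The fix here is twofold: `InferenceClient` authenticates through its `token` parameter (the old code passed `api_key`), and the model id is pinned. A minimal sketch of the resulting setup, assuming the token is exported in an environment variable (`HF_TOKEN` is illustrative; the app reads its own variable):

```python
import os
from huggingface_hub import InferenceClient

# Mirrors the hunk above: `token=` is the auth parameter InferenceClient accepts.
client = InferenceClient(
    model="Qwen/Qwen-32B-Preview",  # model id exactly as written in the commit
    token=os.environ["HF_TOKEN"],   # assumed env var name, for illustration
)
```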
@@ -442,6 +442,14 @@ class XylariaChat:
         if response.status_code == 200:
             image_bytes = response.content
             return image_bytes
+        elif response.status_code == 503:
+            error_message = response.json().get("error", "Unknown error")
+            if "estimated_time" in response.json():
+                estimated_time = response.json()["estimated_time"]
+                error_message += f" Estimated time to complete: {estimated_time:.2f} seconds"
+            else:
+                error_message += " The model is currently loading, please try again later"
+            return f"Error: {error_message}"
         else:
             return f"Error generating image: {response.status_code} - {response.text}"
 
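The new 503 branch surfaces the Inference API's "model loading" state, including the optional `estimated_time` field from its JSON body. A caller could instead wait out that window and retry; a hypothetical wrapper (not part of the commit, all names illustrative):

```python
import time
import requests

def generate_with_retry(api_url, headers, payload, max_retries=2):
    """Retry a generation request, sleeping through 503 'model loading' windows."""
    response = requests.post(api_url, headers=headers, json=payload)
    for _ in range(max_retries):
        if response.status_code != 503:
            break
        # A 503 body may include "estimated_time" (seconds) until the model is ready.
        wait = response.json().get("estimated_time", 10.0)
        time.sleep(wait)
        response = requests.post(api_url, headers=headers, json=payload)
    return response
```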
@@ -521,14 +529,17 @@ class XylariaChat:
         max_new_tokens = 16384 - input_tokens - 50
 
         max_new_tokens = min(max_new_tokens, 10020)
+
+        formatted_messages = self.messages_to_prompt(messages)
 
-        stream = self.client.
-
-
+        stream = self.client.text_generation(
+            prompt=formatted_messages,
+            max_new_tokens=max_new_tokens,
             temperature=0.7,
-            max_tokens=max_new_tokens,
             top_p=0.9,
-            stream=True
+            stream=True,
+            details=True,
+            do_sample=True
         )
 
         return stream
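`text_generation` takes a flat prompt string rather than a message list, hence the new `self.messages_to_prompt(messages)` call. That helper is not shown in this diff; a plausible sketch using Qwen's ChatML-style turn markers (a guess at the author's implementation, not code from the commit):

```python
def messages_to_prompt(self, messages):
    """Flatten OpenAI-style message dicts into one ChatML-style prompt string."""
    parts = []
    for msg in messages:
        parts.append(f"<|im_start|>{msg['role']}\n{msg['content']}<|im_end|>")
    parts.append("<|im_start|>assistant\n")  # cue the model to answer next
    return "\n".join(parts)
```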
@@ -615,35 +626,64 @@ class XylariaChat:
 
     def create_interface(self):
         def streaming_response(message, chat_history, image_filepath, math_ocr_image_path):
+            # Placeholder for image generation
+            loading_svg = """<svg width="256" height="256" viewBox="0 0 256 256" xmlns="http://www.w3.org/2000/svg">
+            <style>
+                rect {
+                    animation: fillAnimation 3s ease-in-out infinite;
+                }
+                @keyframes fillAnimation {
+                    0% { fill: #626262; }
+                    50% { fill: #111111; }
+                    100% { fill: #626262; }
+                }
+                text {
+                    font-family: 'Helvetica Neue', Arial, sans-serif;
+                    font-weight: 300;
+                    text-shadow: 0px 2px 4px rgba(0, 0, 0, 0.4);
+                }
+            </style>
+            <rect width="256" height="256" rx="20" fill="#888888" />
+            <text x="50%" y="50%" dominant-baseline="middle" text-anchor="middle" font-size="24" fill="white" opacity="0.8">
+                <tspan>creating your image</tspan>
+                <tspan x="50%" dy="1.2em">with xylaria iris</tspan>
+            </text>
+            </svg>"""
+
             if message.strip().lower().startswith("/image"):
                 image_prompt = message.strip().lower()[len("/image"):].strip()
                 if not image_prompt:
                     image_prompt = "A realistic image"
 
+                chat_history.append([message, ""])
+                chat_history.append(("", loading_svg))
+                yield "", chat_history, None, None, None
+
                 image_bytes = self.generate_image(image_prompt)
 
                 if isinstance(image_bytes, bytes):
                     base64_image = base64.b64encode(image_bytes).decode("utf-8")
                     image_html = f'<img src="data:image/png;base64,{base64_image}" alt="Generated Image" style="max-width: 100%; max-height: 400px;">'
 
-                    chat_history
-                    chat_history.append(["", image_html])
+                    chat_history[-1] = ("", image_html)
 
                     self.conversation_history.append(ChatMessage(role="user", content=message).to_dict())
                     self.conversation_history.append(ChatMessage(role="assistant", content=image_html).to_dict())
 
                     self.save_chat()
                     all_chats = self.load_all_chats()
                     chat_titles = [f"{chat['timestamp']}: {chat['conversation'][0]['content'][:30]}..." if len(chat['conversation']) > 0 and chat['conversation'][0]['content'] else f"{chat['timestamp']}: Empty Chat" for chat in all_chats]
 
                     yield "", chat_history, None, None, gr.update(choices=chat_titles, visible=True)
                 else:
-
+                    chat_history[-1] = ("", image_bytes)
                     yield "", chat_history, None, None, None
                 return
 
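The `/image` branch now yields twice: first to paint the animated SVG placeholder, then again after `generate_image` returns, overwriting the placeholder row in place. A minimal standalone sketch of this two-yield Gradio pattern (`respond` and the sleep are illustrative, not from the app):

```python
import time
import gradio as gr

def respond(message, history):
    history = history + [[message, "working..."]]  # interim placeholder row
    yield "", history                              # first paint: placeholder
    time.sleep(1)                                  # stand-in for the slow API call
    history[-1][1] = f"done: {message}"            # overwrite the same row
    yield "", history                              # second paint: final result

with gr.Blocks() as demo:
    chatbot = gr.Chatbot()
    textbox = gr.Textbox()
    textbox.submit(respond, [textbox, chatbot], [textbox, chatbot])

demo.launch()
```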
@@ -669,18 +709,30 @@ class XylariaChat:
 
             full_response = ""
             updated_history = chat_history + [[message, ""]]
+
+            if isinstance(response_stream, str):
+                updated_history = chat_history + [[message, response_stream]]
+                yield "", updated_history, None, None, None
+                return
 
             try:
                 for chunk in response_stream:
-
-
-                    full_response +=
-
+                    if not chunk.token.special:
+                        full_response += chunk.token.text
                     updated_history[-1][1] = full_response
+
+                self.conversation_history.append(ChatMessage(role="user", content=message).to_dict())
+                self.conversation_history.append(ChatMessage(role="assistant", content=full_response).to_dict())
+
                 yield "", updated_history, None, None, None
             except Exception as e:
                 print(f"Streaming error: {e}")
                 updated_history[-1][1] = f"Error during response: {e}"
                 yield "", updated_history, None, None, None
                 return
 
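With `details=True`, each chunk yielded by `text_generation(stream=True, ...)` is a `TextGenerationStreamOutput` whose `.token` carries `.text` and a `.special` flag, which is what the filter above checks. A minimal consumption sketch (model id, token, and prompt are placeholders):

```python
from huggingface_hub import InferenceClient

client = InferenceClient(model="Qwen/Qwen-32B-Preview", token="hf_...")  # placeholder token
text = ""
for chunk in client.text_generation(
    "Hello", max_new_tokens=32, stream=True, details=True
):
    if not chunk.token.special:  # skip control tokens such as end-of-text
        text += chunk.token.text
print(text)
```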
@@ -732,7 +784,7 @@ class XylariaChat:
             all_chats = self.load_all_chats()
             chat_titles = [f"{chat['timestamp']}: {chat['conversation'][0]['content'][:30]}..." if len(chat['conversation']) > 0 and chat['conversation'][0]['content'] else f"{chat['timestamp']}: Empty Chat" for chat in all_chats]
             yield "", updated_history, None, None, gr.update(choices=chat_titles, visible=True)
-
+
         def load_selected_chat(chat_index, evt: gr.SelectData):
             if chat_index is not None:
                 loaded_chat = self.load_chat(evt.index)