Spaces:

khulnasoft
/

gpt-computer-agent

Build error

App Files Files Community

khulnasoft commited on Aug 27, 2024

Commit

873d0cf

verified ·

1 Parent(s): 1b30ca3

Upload 76 files

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +1 -0
CONTRIBUTING.md +1 -0
LICENSE +21 -0
MANIFEST.in +2 -0
README.TR.md +327 -0
README.md +331 -12
README.zh_CN.md +160 -0
README.zh_TW.md +208 -0
build_scripts/openai/macos_build.sh +30 -0
build_scripts/openai/windows_build.sh +59 -0
bump.py +135 -0
example_use_cases/workday_summerizer.md +55 -0
gca_setup_generator.py +12 -0
gpt_computer_agent/__init__.py +7 -0
gpt_computer_agent/agent/__init__.py +4 -0
gpt_computer_agent/agent/agent.py +80 -0
gpt_computer_agent/agent/agent_tools.py +64 -0
gpt_computer_agent/agent/assistant.py +234 -0
gpt_computer_agent/agent/background.py +21 -0
gpt_computer_agent/agent/chat_history.py +31 -0
gpt_computer_agent/agent/process.py +299 -0
gpt_computer_agent/agentic.py +36 -0
gpt_computer_agent/api.py +673 -0
gpt_computer_agent/audio/__init__.py +1 -0
gpt_computer_agent/audio/record.py +159 -0
gpt_computer_agent/audio/stt.py +77 -0
gpt_computer_agent/audio/stt_providers/openai.py +11 -0
gpt_computer_agent/audio/stt_providers/openai_whisper_local.py +19 -0
gpt_computer_agent/audio/tts.py +106 -0
gpt_computer_agent/audio/tts_providers/microsoft_local.py +55 -0
gpt_computer_agent/audio/tts_providers/openai.py +13 -0
gpt_computer_agent/audio/wake_word.py +40 -0
gpt_computer_agent/character.py +47 -0
gpt_computer_agent/custom_callback.py +21 -0
gpt_computer_agent/display_tools.py +242 -0
gpt_computer_agent/gpt_computer_assistant.py +1599 -0
gpt_computer_agent/gui/__init__.py +0 -0
gpt_computer_agent/gui/button.py +169 -0
gpt_computer_agent/gui/llmsettings.py +276 -0
gpt_computer_agent/gui/settings.py +351 -0
gpt_computer_agent/gui/signal.py +27 -0
gpt_computer_agent/llm.py +108 -0
gpt_computer_agent/llm_settings.py +185 -0
gpt_computer_agent/remote.py +291 -0
gpt_computer_agent/screen/__init__.py +0 -0
gpt_computer_agent/screen/shot.py +49 -0
gpt_computer_agent/standard_tools.py +315 -0
gpt_computer_agent/start.py +204 -0
gpt_computer_agent/teams.py +264 -0
gpt_computer_agent/tooler.py +26 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+gpt_computer_agent/utils/media/SF-Pro-Text-Bold.otf filter=lfs diff=lfs merge=lfs -text

CONTRIBUTING.md ADDED Viewed

	@@ -0,0 +1 @@


1	+ We are open to any contribution as well.

LICENSE ADDED Viewed

	@@ -0,0 +1,21 @@

+MIT License
+Copyright (c) 2024 KhulnaSoft Ltd.
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

MANIFEST.in ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ include gpt_computer_agent/utils/media/*
2	+ include requirements.txt

README.TR.md ADDED Viewed

	@@ -0,0 +1,327 @@

+<p align="center">
+<p align="center">
+  <a href="#">
+    <img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/deeeb463-c161-4fc6-8407-71c3d8b7defe" alt="Logo"  >
+  </a>
+  <br>
+  <a href="#">
+    <img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/36714716-6990-40b0-84d5-cd7432811bcb" alt="Logo"  >
+  </a>
+  <h3 align="center">GPT Computer Assistant</h3>
+  <p align="center">
+    <a href="https://discord.gg/qApFmWMt8x"><img alt="Static Badge" src="https://img.shields.io/badge/Discord-Join?style=social&logo=discord" width=150></a>
+  </p>
+  <p align="center">
+    gpt-4o for windows, macos and ubuntu
+    <br />
+   <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki"><strong>Dökümantasyon</strong></a>
+   .
+    <a href="https://github.com/khulnasoft/gpt-computer-agent/#Capabilities"><strong>Yeteneklerini Keşfet »</strong></a>
+    <br />
+    </p>
+    <br>
+    <p align="center">
+     <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki">
+   <img src="https://img.shields.io/badge/Windows-0078D6?style=for-the-badge&logo=windows&logoColor=white" alt="windows">
+   </a>
+   <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki">
+   <img src="https://img.shields.io/badge/mac%20os-000000?style=for-the-badge&logo=apple&logoColor=white" alt="macos">
+   </a>
+    <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki">
+   <img src="https://img.shields.io/badge/Linux-FCC624?style=for-the-badge&logo=linux&logoColor=black" alt="linux">
+   </a>
+  <br>
+  <p align="center">
+  <a href="https://www.python.org/">
+  <img src="https://img.shields.io/badge/Made%20with-Python-1f425f.svg" alt="Made_with_python">
+  </a>
+  .
+  <img src="https://static.pepy.tech/personalized-badge/gpt-computer-agent?period=total&units=international_system&left_color=grey&right_color=blue&left_text=PyPI%20Downloads" alt="pypi_downloads">
+  </p>
+  <p align="center">
+   <a href="https://x.com/GPTCompAsst"><img alt="Static Badge" src="https://img.shields.io/twitter/follow/GPTCompAsst?style=social" width=160></a>
+</p>
+<br>
+|[ENGLISH](README.md)|[简体中文](README.zh_CN.md)|[正體中文](README.zh_TW.md)|TÜRKÇE|
+# GPT Bilgisayar Asistanı
+Merhaba, bu ChatGPT MacOS uygulamasının Windows ve Linux için alternatif bir çalışmasıdır. Bu şekilde, taze ve stabil bir çalışma sunuyoruz. Python kütüphanesi olarak kurulumu oldukça kolaydır, ancak ilerleyen zamanlarda .exe formatında doğrudan kurulum betikleri sağlayacak bir iş akışı hazırlayacağız.
+Powered by [**KhulnaSoft Tiger 🐅**](https://github.com/KhulnaSoft/Tiger) - LLM ajanları için bir işlev merkezi.
+## Kurulum ve Çalıştırma
+Python 3.9 veya üstü gereklidir.
+```console
+pip3 install 'gpt-computer-agent[base]'
+```
+```console
+computeragent
+```
+### Uyandırma Komutu(Wake Word) | YENİ
+<details>
+Pvporcupine entegrasyonunu ekledik. Bu özelliği kullanmak için ek bir kütüphane kurmanız gerekiyor:
+```console
+pip3 install 'gpt-computer-agent[wakeword]'
+```
+Sonrasında, lütfen [Pvporcupine](https://picovoice.ai/) API anahtarınızı girin ve uyandırma komutu özelliğini etkinleştirin.
+</details>
+<p align="center">
+<br>
+  <br>
+  <br>
+</p>
+<p align="center">
+<a href="#">
+    <img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/5c6b7063-3d9b-4ea6-befa-ce15d69fcd43" alt="Logo"  >
+  </a>
+</p>
+### Ajan Altyapısı
+Bu şekilde `crewai` ajanları oluşturabilir ve onları gpt-computer-agent arayüzü ve araçları içinde kullanabilirsiniz.
+```console
+pip3 install 'gpt-computer-agent[base]'
+pip3 install 'gpt-computer-agent[agentic]'
+```
+```python
+from gpt_computer_agent import Agent, start
+manager = Agent(
+  role='Proje Yöneticisi',
+  goal='proje ihtiyaçlarını anlar ve kodlayıcıya yardımcı olur',
+  backstory="""Büyük bir şirkette bir yöneticisiniz.""",
+)
+coder = Agent(
+  role='Kıdemli Python Geliştirici',
+  goal='Python scriptleri yazmak ve panoya kopyalamak',
+  backstory="""Büyük bir şirkette bir Python geliştiricisisiniz.""",
+)
+start()
+```
+<p align="center">
+<a href="#">
+    <img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/c78f3460-6660-4da6-8941-a8ac5cfc1191" alt="Logo"  >
+  </a>
+</p>
+### Özel Araçlar Ekleme
+Artık agentic altyapı ve asistan işlemlerinde çalışan özel araçlar ekleyebilirsiniz.
+```python
+from gpt_computer_agent import Tool, start
+@Tool
+def toplam_aracı(ilk_sayı: int, ikinci_sayı: int) -> str:
+    """İki sayıyı toplamanız gerektiğinde kullanışlıdır."""
+    return ilk_sayı + ikinci_sayı
+start()
+```
+<p align="center">
+<a href="#">
+    <img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/65b5fe7c-c0e1-40e9-9447-f41cd4f369a3" alt="Logo"  >
+  </a>
+</p>
+### API | YENİ
+Artık GPT Bilgisayar Asistanınızı uzaktan kullanabilirsiniz! GUI hala aktif, bunun için birkaç adım bulunmaktadır:
+```console
+pip3 install 'gpt-computer-agent[base]'
+pip3 install 'gpt-computer-agent[api]'
+```
+```console
+computeragent --api
+```
+```python
+from gpt_computer_agent.remote import remote
+output = remote.input("Merhaba, bugün nasılsın?", screen=False, talk=False)
+print(output)
+remote.just_screenshot()
+remote.talk("TTS test")
+# Other Functionalities
+remote.reset_memory()
+remote.profile("default")
+remote.enable_predefined_agents()
+remote.disable_predefined_agents()
+remote.enable_online_tools()
+remote.disable_online_tools()
+```
+<p align="center">
+<br>
+  <br>
+  <br>
+  <br>
+  <br>
+</p>
+<p align="center">
+<br>
+  <br>
+  <br>
+</p>
+https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/26ae3624-e619-44d6-9b04-f39cf1ac1f8f
+## Kullanım
+![options](https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/37d34745-ae4b-4b37-9bfa-aec070c97897)
+### Kullanım Alanları
+<table>
+  <tr>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/b4a4f11e-5588-4656-b5d7-b612a9a2855b" alt="Take Meeting Notes" width="500"/></td>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/49eeac70-b33a-4ec4-8125-64127621ed62" alt="Daily Assistant" width="500"/></td>
+  </tr>
+  <tr>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/10b69a18-033c-4d81-8ac9-f4e3c65b59c3" alt="Read Docs" width="500"/></td>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/0f483bae-ffaf-4311-8653-c0dc64fb5ebe" alt="Coding Assistant" width="500"/></td>
+  </tr>
+</table>
+## Yol Haritası
+| Özellik                            | Durum        | Hedef Çeyrek    |
+|------------------------------------|--------------|----------------|
+| Sohbet Geçmişini Temizle            | Tamamlandı   | 2024 Q2        |
+| Uzun Ses Desteği (20mb Bölme)       | Tamamlandı   | 2024 Q2        |
+| Metin Girişleri                     | Tamamlandı   | 2024 Q2        |
+| Sadece Metin Modu (Konuşmayı Sustur) | Tamamlandı  | 2024 Q2        |
+| Profil Ekleme (Farklı Sohbetler)    | Tamamlandı   | 2024 Q2        |
+| Asistan Durumu Hakkında Daha Fazla Geri Bildirim | Tamamlandı | 2024 Q2        |
+| Yerel Model Görüntü ve Metin (Ollama ve görüntü modelleri ile) | Tamamlandı | 2024 Q2        |
+| **Özelleştirilebilir Ajan Altyapısı** | Tamamlandı   | 2024 Q2        |
+| Groq Modellerini Destekleme         | Tamamlandı   | 2024 Q2        |
+| **Özel Araçlar Ekleme**             | Tamamlandı   | 2024 Q2        |
+| Ekrandaki bir şeye tıklama (metin ve simge) | Tamamlandı | 2024 Q2        |
+| Yeni Kullanıcı Arayüzü              | Tamamlandı   | 2024 Q2        |
+| Yerel Uygulamalar, exe, dmg         | Başarısız (Agentic Altyapı kütüphaneleri şu anda desteklenmiyor) | 2024 Q2        |
+| **Uzun yanıtlarda işbirlikçi konuşan farklı ses modelleri.** | Tamamlandı | 2024 Q2        |
+| **Konuşmayı Tamamladığınızda Otomatik Kaydı Durdurma** | Tamamlandı | 2024 Q2        |
+| **Uyanma Komutu**                   | Tamamlandı   | 2024 Q2        |
+| **Sürekli Konuşmalar**              | Tamamlandı   | 2024 Q2        |
+| **Cihazda daha fazla yetenek ekleme** | Planlanıyor | 2024 Q2        |
+| DeepFace Entegrasyonu (Yüz Tanıma)  | Planlanıyor  | 2024 Q2        |
+## Yetenekler
+Şu anda birçok altyapı öğemiz var. ChatGPT uygulamasında zaten bulunan tüm öğeleri sağlamayı hedefliyoruz.
+| Yetenek                              | Durum   |
+|--------------------------------------|---------|
+| **Ekran Okuma**                      | OK      |
+| **Ekrandaki Metin veya Simgeye Tıklama** | OK      |
+| **Ekrandaki Metin veya Simgeye Taşıma** | OK      |
+| **Bir Şeyler Yazma**                 | OK      |
+| **Herhangi Bir Tuşa Basma**          | OK      |
+| **Kaydırma**                         | OK      |
+| **Mikrofon**                         | OK      |
+| **Sistem Sesleri**                   | OK      |
+| **Bellek**                           | OK      |
+| **Uygulama Açma ve Kapatma**         | OK      |
+| **Bir URL Açma**                     | OK      |
+| **Pano**                             | OK      |
+| **Arama Motorları**                  | OK      |
+| **Python Yazma ve Çalıştırma**       | OK      |
+| **SH (Shell) Yazma ve Çalıştırma**   | OK      |
+| **Telegram Hesabınızı Kullanma**     | OK      |
+| **Bilgi Yönetimi**                   | OK      |
+| **[Daha fazla araç ekle](https://github.com/khulnasoft/gpt-computer-agent/blob/master/gpt_computer_agent/standard_tools.py)** | ?       |
+### Önceden Tanımlı Ajanlar
+Eğer etkinleştirirseniz asistanınız bu ekiplerle çalışabilir:
+| Takım Adı                               | Durum   |
+|-----------------------------------------|---------|
+| **search_on_internet_and_report_team**   | OK      |
+| **generate_code_with_aim_team_**         | OK      |
+| **[Kendi ekleyin](https://github.com/khulnasoft/gpt-computer-agent/blob/master/gpt_computer_agent/teams.py)** | ?       |
+  <a href="#">
+    <img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/ba590bf8-6059-4cb6-8c4e-6d105ce4edd2" alt="Logo"  >
+  </a>
+## Katkıda Bulunanlar
+<a href="https://github.com/khulnasoft/gpt-computer-agent/graphs/contributors">
+  <img src="https://contrib.rocks/image?repo=khulnasoft/gpt-computer-agent" />
+</a>
+</p>

README.md CHANGED Viewed

@@ -1,12 +1,331 @@
----
-title: Gpt Computer Agent
-emoji: 🐨
-colorFrom: blue
-colorTo: pink
-sdk: gradio
-sdk_version: 4.42.0
-app_file: app.py
-pinned: false
----
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

+# GPT Computer Agent
+<p align="center">
+  <a href="https://docs.gca.dev">
+    <img src="https://github.com/user-attachments/assets/c60562bf-540e-47d9-b578-994285071128" width="250">
+  </a>
+  .
+  <a href="https://github.com/KhulnaSoft/gpt-computer-agent/releases/latest/download/gpt-computer-agent-openai.dmg">
+    <img src="https://github.com/user-attachments/assets/a0475f31-9dfd-4a0c-91b0-7ae128c3c773" width="250">
+  </a>
+  .
+  <a href="https://github.com/KhulnaSoft/gpt-computer-agent/releases/latest/download/gpt-computer-agent-openai.exe">
+    <img src="https://github.com/user-attachments/assets/c94139fd-609c-4780-9541-6e9e01dd0e47" width="250">
+  </a>
+</p>
+  <p align="center">
+    <a href="https://www.producthunt.com/posts/gpt-computer-agent?embed=true&utm_source=badge-top-post-badge&utm_medium=badge&utm_souce=badge-gpt&#0045;computer&#0045;assistant" target="_blank"><img src="https://api.producthunt.com/widgets/embed-image/v1/top-post-badge.svg?post_id=465468&theme=dark&period=daily" alt="GPT&#0032;Computer&#0032;Assistant - Create&#0032;intelligence&#0032;for&#0032;your&#0032;products | Product Hunt" style="width: 250px; height: 54px;" width="250" height="54" /></a>
+    .
+    <a href="https://discord.gg/qApFmWMt8x"><img alt="Static Badge" src="https://img.shields.io/badge/Discord-Join?style=social&logo=discord" width=150></a>
+    .
+    <a href="https://x.com/GPTCompAsst"><img alt="Static Badge" src="https://img.shields.io/badge/X_App-Join?style=social&logo=x" width=150></a>
+  </p>
+  <p align="center">
+    <br />
+    Intelligence development framework
+    <br />
+    </p>
+    <br>
+  <p align="center">
+  <a href="https://www.python.org/">
+  <img src="https://img.shields.io/badge/Made%20with-Python-1f425f.svg" alt="Made_with_python">
+  </a>
+  .
+  <img src="https://static.pepy.tech/personalized-badge/gpt-computer-agent?period=total&units=international_system&left_color=grey&right_color=blue&left_text=PyPI%20Downloads" alt="pypi_downloads">
+  </p>
+|ENGLISH|[简体中文](README.zh_CN.md)|[正體中文](README.zh_TW.md)|[TÜRKÇE](README.TR.md)
+Hi, this is an alternative work for providing ChatGPT MacOS app to Windows and Linux. In this way this is a fresh and stable work. You can easily install as Python library for this time but we will prepare a pipeline for providing native install scripts (.exe).
+Powered by <a href="https://github.com/KhulnaSoft/Tiger"><strong>KhulnaSoft Tiger 🐅</strong></a> A function hub for llm agents.
+## 1. Install and run
+**Python 3.10 or 3.11 is required**
+```console
+pip install 'gpt-computer-agent[base]'
+pip install 'gpt-computer-agent[api]'
+```
+To run gpt-computer-agent, simply type
+```console
+computeragent --api
+```
+<p align="center">
+  <a href="#">
+    <img src="https://github.com/user-attachments/assets/890b4e0a-4484-4870-a158-2d365b0d969e" >
+  </a>
+</p>
+<p align="center">
+<br>
+  <br>
+  <br>
+  <br>
+  <br>
+</p>
+## 2. LLM Settings
+```python
+from gpt_computer_agent.remote import remote
+remote.save_models("gpt-4o")
+remote.save_openai_api_key("sk-**")
+```
+<p align="start">
+  <a href="https://docs.upsonic.co/gca/dev_guides/llm_settings">
+    <img src="https://github.com/user-attachments/assets/a75c8ddf-f9df-436b-9dc8-c5220211e15e" width="150">
+  </a>
+</p>
+<p align="center">
+<br>
+  <br>
+  <br>
+</p>
+## 3. Characteristic API
+```python
+# Name of the assitant:
+remote.change_name("X Intelligence")
+#Developer personna of the assistant:
+remote.change_developer("X Company")
+```
+<p align="start">
+  <a href="https://docs.upsonic.co/gca/dev_guides/characteristic">
+    <img src="https://github.com/user-attachments/assets/d7e02ac6-e40c-4b35-8e65-4621bf3fb9a1" width="150">
+  </a>
+</p>
+<p align="center">
+<br>
+  <br>
+  <br>
+</p>
+## 4. Connect Your Functions API
+```python
+# Installing an library:
+remote.install_library("numpy")
+# Adding functianility as python functions:
+@remote.custom_tool
+def my_server_status() -> bool:
+  """
+  Check the server status.
+  """
+  return True
+```
+<p align="center">
+<br>
+  <br>
+  <br>
+</p>
+## 5. Interact with User API
+### remote.input
+Talk with assistant, about user and computer. With this api you can create an consulting process.
+```markdown
+`Hi, look to user window and return which app using now`
+`Ask user to is user need any kind of supoprt`
+`Extract the user redis config file.`
+```
+With this questions you will make a shortcut for your needs.
+**You can collect informations from user computer or directly from user or user computer.**
+```python
+output = remote.input("Extract the user redis config file.", screen=False)
+print(output)
+```
+<p align="start">
+  <a href="https://docs.upsonic.co/gca/dev_guides/interact">
+    <img src="https://github.com/user-attachments/assets/81614347-ab85-4965-9b77-225d0f2961e9" width="150">
+  </a>
+  .
+  <a href="https://docs.upsonic.co/gca/dev_guides/interact">
+    <img src="https://github.com/user-attachments/assets/ecaa7590-f4c5-4eda-9482-462cef54aeff" width="150">
+  </a>
+  .
+  <a href="https://docs.upsonic.co/gca/dev_guides/interact">
+    <img src="https://github.com/user-attachments/assets/0f35df10-b32e-4fa1-936e-b336be46b1bd" width="150">
+  </a>
+</p>
+<p align="start">
+  <a href="https://docs.upsonic.co/gca/dev_guides/interact">
+    <img src="https://github.com/user-attachments/assets/a893c50c-3ede-4b42-90ee-92e2fea82120" width="150">
+  </a>
+</p>
+<p align="center">
+<br>
+  <br>
+  <br>
+</p>
+## Usage
+![options](https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/37d34745-ae4b-4b37-9bfa-aec070c97897)
+### Use cases
+<img alt="Screenshot 2024-08-13 at 18 33 52" src="https://github.com/user-attachments/assets/8f994160-893a-4f56-bbf0-4a7aa87af650">
+## Roadmap
+| Feature                         | Status       | Target Release |
+|---------------------------------|--------------|----------------|
+| Clear Chat History         | Completed    | Q2 2024        |
+| Long Audios Support (Split 20mb)      | Completed    | Q2 2024        |
+| Text Inputs               | Completed      | Q2 2024        |
+| Just Text Mode (Mute Speech)           | Completed  | Q2 2024        |
+| Added profiles (Different Chats)          | Completed    | Q2 2024        |
+| More Feedback About Assistant Status                  | Completed    | Q2 2024        |
+| Local Model Vision and Text (With Ollama, and vision models)  | Completed  | Q2 2024        |
+| **Our Customizable Agent Infrastructure**              | Completed      | Q2 2024        |
+| Supporting Groq Models  | Completed  | Q2 2024        |
+| **Adding Custom Tools**  | Completed  | Q2 2024        |
+| Click on something on the screen (text and icon)              | Completed      | Q2 2024        |
+| New UI              | Completed      | Q2 2024        |
+| Native Applications, exe, dmg              | Completed     | Q3 2024        |
+| **Collaborated Speaking Different Voice Models on long responses.**              | Completed     | Q2 2024        |
+| **Auto Stop Recording, when you complate talking**              | Completed     | Q2 2024        |
+| **Wakeup Word**              | Completed     | Q2 2024        |
+| **Continuously Conversations**              | Completed     | Q2 2024        |
+| **Adding more capability on device**              | Completed     | Q2 2024        |
+| **Local TTS**              | Completed     | Q3 2024        |
+| **Local STT**              | Completed     | Q3 2024        |
+| Tray Menu              | Completed     | Q3 2024        |
+| **Global Hotkey**              | On the way     | Q3 2024        |
+| DeepFace Integration (Facial Recognition)                    | Planned  | Q3 2024        |
+## Capabilities
+At this time we have many infrastructure elements. We just aim to provide whole things that already in ChatGPT app.
+| Capability                         | Status                      |
+|------------------------------------|----------------------------------|
+| **Local LLM with Vision (Ollama)**                    |            OK                    |
+| Local text-to-speech                    |            OK                    |
+| Local speech-to-text                    |            OK                    |
+| **Screen Read**                    |            OK                    |
+| **Click to and Text or Icon in the screen**                    |            OK                    |
+| **Move to and Text or Icon in the screen**                    |            OK                    |
+| **Typing Something**                    |            OK                    |
+| **Pressing to Any Key**                    |            OK                    |
+| **Scrolling**                    |            OK                    |
+| **Microphone**                     |            OK                    |
+| **System Audio**                  |            OK                    |
+| **Memory**                         |            OK                    |
+| **Open and Close App**             |            OK                    |
+| **Open a URL**                     |            OK                    |
+| **Clipboard**                       |            OK                    |
+| **Search Engines**                 |            OK                    |
+| **Writing and running Python**     |            OK                    |
+| **Writing and running SH**    |            OK                    |
+| **Using your Telegram Account**    |            OK                    |
+| **Knowledge Management**           |            OK                    |
+| **[Add more tool](https://github.com/khulnasoft/gpt-computer-agent/blob/master/gpt_computer_agent/standard_tools.py)**           |            ?                    |
+### Predefined Agents
+If you enable it your assistant will work with these teams:
+| Team Name                         | Status                      |
+|------------------------------------|----------------------------------|
+| **search_on_internet_and_report_team**                    |            OK                    |
+| **generate_code_with_aim_team_**                    |            OK                    |
+| **[Add your own one](https://github.com/khulnasoft/gpt-computer-agent/blob/master/gpt_computer_agent/teams.py)**                    |            ?                    |
+  <a href="#">
+    <img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/ba590bf8-6059-4cb6-8c4e-6d105ce4edd2" alt="Logo"  >
+  </a>
+## Contributors
+<a href="https://github.com/khulnasoft/gpt-computer-agent/graphs/contributors">
+  <img src="https://contrib.rocks/image?repo=khulnasoft/gpt-computer-agent" />
+</a>

README.zh_CN.md ADDED Viewed

	@@ -0,0 +1,160 @@

+<p align="center">
+  <a href="#">
+    <img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/176c8ddb-219e-444e-8782-1f8c37a92678" alt="Logo" width="250" >
+  </a>
+  <h3 align="center">GPT 计算机助手</h3>
+  <p align="center">
+    适用于 Windows、MacOS 和 Ubuntu 的 gpt-4o
+    <br />
+   <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki"><strong>文档</strong></a>
+   .
+    <a href="https://github.com/khulnasoft/gpt-computer-agent/#Capabilities"><strong>探索功能 »</strong></a>
+    <br />
+    </p>
+    <br>
+    <p align="center">
+     <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki">
+   <img src="https://img.shields.io/badge/Windows-0078D6?style=for-the-badge&logo=windows&logoColor=white" alt="windows">
+   </a>
+   <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki">
+   <img src="https://img.shields.io/badge/mac%20os-000000?style=for-the-badge&logo=apple&logoColor=white" alt="macos">
+   </a>
+    <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki">
+   <img src="https://img.shields.io/badge/Linux-FCC624?style=for-the-badge&logo=linux&logoColor=black" alt="linux">
+   </a>
+  <br>
+  </p>
+  <p align="center">
+  <a href="https://www.python.org/">
+  <img src="https://img.shields.io/badge/Made%20with-Python-1f425f.svg" alt="Made_with_python">
+  </a>
+  .
+  <img src="https://static.pepy.tech/personalized-badge/gpt-computer-agent?period=total&units=international_system&left_color=grey&right_color=blue&left_text=PyPI%20Downloads" alt="pypi_downloads">
+  </p>
+  <p align="center">
+   <a href="https://discord.gg/qApFmWMt8x"><img alt="Static Badge" src="https://img.shields.io/badge/Discord-Join?style=social&logo=discord" width=150></a>
+   <a href="https://x.com/GPTCompAsst"><img alt="Static Badge" src="https://img.shields.io/badge/X-Join?style=social&logo=x" width=100></a>
+  </p>
+|[ENGLISH](README.md)|简体中文|[正體中文](README.zh_TW.md)|[TÜRKÇE](README.TR.md)
+# GPT 计算机助手
+你好，这是一个将 ChatGPT MacOS 应用程序提供给 Windows 和 Linux 的替代工作。因此，这是一个全新且稳定的项目。此时，您可以轻松地将其作为 Python 库安装，但我们将准备一个流水线来提供本机安装脚本 (.exe)。
+由 <a href="https://github.com/KhulnaSoft/Tiger"><strong>KhulnaSoft Tiger 🐅</strong></a> 提供支持的功能集成中心。
+## 安装 && 运行
+需要 >= Python 3.9
+```console
+pip3 install 'gpt-computer-agent[default]'
+```
+```console
+computeragent
+```
+### 演示视频（1 分钟）
+https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/26ae3624-e619-44d6-9b04-f39cf1ac1f8f
+## 使用案例
+<table>
+  <tr>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/b4a4f11e-5588-4656-b5d7-b612a9a2855b" alt="Take Meeting Notes" width="500"/></td>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/49eeac70-b33a-4ec4-8125-64127621ed62" alt="Daily Assistant" width="500"/></td>
+  </tr>
+  <tr>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/10b69a18-033c-4d81-8ac9-f4e3c65b59c3" alt="Read Docs" width="500"/></td>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/0f483bae-ffaf-4311-8653-c0dc64fb5ebe" alt="Coding Assistant" width="500"/></td>
+  </tr>
+</table>
+## 路线图
+| 功能                             | 状态         | 目标发布      |
+|---------------------------------|--------------|--------------|
+| 清除聊天记录                     | 已完成       | 2024 年第二季度|
+| 长音频支持（拆分 20mb）          | 已完成       | 2024 年第二季度|
+| 文本输入                          | 已完成       | 2024 年第二季度|
+| 仅文本模式（静音）                | 已完成       | 2024 年第二季度|
+| 添加配置文件（不同聊天）           | 已完成       | 2024 年第二季度|
+| 更多关于助手状态的反馈             | 已完成       | 2024 年第二季度|
+| **新 UI**                        | 计划中       | 2024 年第二季度|
+| **我们的自定义代理基础设施**        | 计划中       | 2024 年第二季度|
+| **本机应用程序，exe，dmg，appimage** | 计划中       | 2024 年第二季度|
+| **DeepFace 集成（面部识别）**      | 计划中       | 2024 年第二季度|
+| **本地模式（使用 Ollama，语音和视觉模型）** | 计划中       | 2024 年第二季度|
+#### 代理基础设施 | 即将推出
+```python
+from gpt-comptuer-assistant import crew, agent
+coder = agent("你是一名高级 Python 开发者")
+manager = agent("你是一名高级项目经理")
+assistant = crew(
+ [coder, manager]
+)
+assistant.gui()
+```
+## 功能
+此时我们拥有许多基础设施元素。我们只是希望提供 ChatGPT 应用中已经存在的所有功能。
+| 功能                              | 描述                          |
+|-----------------------------------|-------------------------------|
+| **屏幕读取**                      |            OK                 |
+| **麦克风**                        |            OK                 |
+| **系统音频**                      |            OK                 |
+| **内存**                          |            OK                 |
+| **打开和关闭应用程序**              |            OK                 |
+| **打开一个 URL**                  |            OK                 |
+| **剪贴板**                        |            OK                 |
+| **搜索引擎**                      |            OK                 |
+| **编写和运行 Python**            |            OK                 |
+| **编写和运行 SH**                |            OK                 |
+| **使用你的 Telegram 账户**        |            OK                 |
+| **知识管理**                      |            OK                 |
+## 用法
+![options](https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/20972b1e-6d4f-4314-8470-f2fcf79b6e6d)
+** 第一次单击包含麦克风或系统音频的选项后，需要再次单击相同选项以停止。
+## 贡献者
+<a href="https://github.com/khulnasoft/gpt-computer-agent/graphs/contributors">
+  <img src="https://contrib.rocks/image?repo=khulnasoft/gpt-computer-agent" />
+</a>

README.zh_TW.md ADDED Viewed

	@@ -0,0 +1,208 @@

+<p align="center">
+  <a href="#">
+    <img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/176c8ddb-219e-444e-8782-1f8c37a92678" alt="Logo" width="250" >
+  </a>
+  <h3 align="center">GPT 電腦助手</h3>
+  <p align="center">
+  <a href="https://discord.gg/qApFmWMt8x"><img alt="Static Badge" src="https://img.shields.io/discord/1148697961639968859.svg?label=&logo=discord&logoColor=ffffff&color=7389D8&labelColor=6A7EC2" width=100></a>
+  </p>
+  <p align="center">
+    適用於 Windows、MacOS 和 Ubuntu 的 gpt-4o
+    <br />
+   <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki"><strong>文件</strong></a>
+   .
+    <a href="https://github.com/khulnasoft/gpt-computer-agent/#Capabilities"><strong>探索功能 »</strong></a>
+    <br />
+    </p>
+    <br>
+    <p align="center">
+     <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki">
+   <img src="https://img.shields.io/badge/Windows-0078D6?style=for-the-badge&logo=windows&logoColor=white" alt="windows">
+   </a>
+   <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki">
+   <img src="https://img.shields.io/badge/mac%20os-000000?style=for-the-badge&logo=apple&logoColor=white" alt="macos">
+   </a>
+    <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki">
+   <img src="https://img.shields.io/badge/Linux-FCC624?style=for-the-badge&logo=linux&logoColor=black" alt="linux">
+   </a>
+  <br>
+  </p>
+  <p align="center">
+  <a href="https://www.python.org/">
+  <img src="https://img.shields.io/badge/Made%20with-Python-1f425f.svg" alt="Made_with_python">
+  </a>
+  .
+  <img src="https://static.pepy.tech/personalized-badge/gpt-computer-agent?period=total&units=international_system&left_color=grey&right_color=blue&left_text=PyPI%20Downloads" alt="pypi_downloads">
+  </p>
+  <p align="center">
+   <a href="https://x.com/GPTCompAsst"><img alt="Static Badge" src="https://img.shields.io/twitter/follow/GPTCompAsst?style=social" width=160></a>
+</p>
+|[ENGLISH](README.md)|[簡體中文](README.zh_CN.md)|正體中文|[TÜRKÇE](README.TR.md)
+# GPT 電腦助手
+嗨，這是為了將 ChatGPT MacOS 應用程式提供給 Windows 和 Linux 的替代方案。這樣做可以提供一個新鮮且穩定的解決方案。這次您可以輕鬆地安裝為 Python 庫，但我們將準備一個流程，提供本機安裝腳本（.exe）。
+由 <a href="https://github.com/KhulnaSoft/Tiger"><strong>KhulnaSoft Tiger 🐅</strong></a> 提供支持的功能集成中心。
+ <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki/Usage"><img alt="Static Badge" src="https://img.shields.io/badge/Local_Models-Available-blue" width=150></a>
+ <br>
+ <a href="https://github.com/khulnasoft/gpt-computer-agent/wiki/Usage"><img alt="Static Badge" src="https://img.shields.io/badge/Groq-Available-blue" width=100></a>
+## 安裝 && 運行
+需要 >= Python 3.9
+```console
+pip3 install 'gpt-computer-agent[default]'
+```
+```console
+computeragent
+```
+### 代理基礎設施
+這樣一來，您可以創建 `crewai` 代理，並將其用於 gpt-computer-agent 圖形用戶界面和工具中。
+```console
+pip3 install 'gpt-computer-agent[agentic]'
+```
+```python
+from gpt_computer_agent import Agent, start
+manager = Agent(
+  role='Project Manager',
+  goal='understands project needs and assist coder',
+  backstory="""You're a manager at a large company.""",
+)
+coder = Agent(
+  role='Senior Python Coder',
+  goal='writing python scripts and copying to clipboard',
+  backstory="""You're a python developer at a large company.""",
+)
+start()
+```
+### 新增自訂工具
+現在您可以添加在代理基礎設施和助理進程中運行的自訂工具。
+```python
+from gpt_computer_agent import Tool, start
+@Tool
+def sum_tool(first_number: int, second_number: int) -> str:
+    """Useful for when you need to sum two numbers together."""
+    return first_number + second_number
+start()
+```
+https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/26ae3624-e619-44d6-9b04-f39cf1ac1f8f
+<p align="center">
+  <a href="#">
+    <img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/94ac619c-1f29-4fe6-b3cb-85a03932646b" alt="Logo"  >
+  </a>
+</p>
+## 使用方式
+![選項](https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/54b39347-98e0-4ee4-a715-9128c40dbcd4)
+## 使用案例
+<table>
+  <tr>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/b4a4f11e-5588-4656-b5d7-b612a9a2855b" alt="Take Meeting Notes" width="500"/></td>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/49eeac70-b33a-4ec4-8125-64127621ed62" alt="Daily Assistant" width="500"/></td>
+  </tr>
+  <tr>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/10b69a18-033c-4d81-8ac9-f4e3c65b59c3" alt="Read Docs" width="500"/></td>
+    <td><img src="https://github.com/khulnasoft/gpt-computer-agent/assets/41792982/0f483bae-ffaf-4311-8653-c0dc64fb5ebe" alt="Coding Assistant" width="500"/></td>
+  </tr>
+</table>
+## 路線圖
+| 功能                             | 狀態         | 目標發布      |
+|---------------------------------|--------------|--------------|
+| 清除聊天記錄                     | 已完成       | 2024 年第二季度|
+| 長音訊支持（拆分 20mb）          | 已完成       | 2024 年第二季度|
+| 文本輸入                          | 已完成       | 2024 年第二季度|
+| 僅文本模式（靜音）                | 已完成       | 2024 年第二季度|
+| 添加配置文件（不同聊天）           | 已完成       | 2024 年第二季度|
+| 更多關於助手狀態的回饋             | 已完成       | 2024 年第二季度|
+| **新 UI**                        | 計劃中       | 2024 年第二季度|
+| **我們的自訂代理基礎設施**        | 計劃中       | 2024 年第二季度|
+| **本機應用程式，exe，dmg，appimage** | 計劃中       | 2024 年第二季度|
+| **DeepFace 集成（臉部識別）**      | 計劃中       | 2024 年第二季度|
+| **本地模式（使用 Ollama，語音和視覺模型）** | 計劃中       | 2024 年第二季度|
+## 功能
+此時我們擁有許多基礎設施元素。我們只是希望提供 ChatGPT 應用中已經存在的所有功能。
+| 功能                              | 描述                          |
+|-----------------------------------|-------------------------------|
+| **螢幕讀取**                      |            OK                 |
+| **麥克風**                        |            OK                 |
+| **系統音訊**                      |            OK                 |
+| **記憶體**                          |            OK                 |
+| **打開和關閉應用程式**              |            OK                 |
+| **打開一個 URL**                  |            OK                 |
+| **剪貼簿**                        |            OK                 |
+| **搜尋引擎**                      |            OK                 |
+| **編寫和運行 Python**            |            OK                 |
+| **編寫和運行 SH**                |            OK                 |
+| **使用你的 Telegram 帳戶**        |            OK                 |
+| **知識管理**                      |            OK                 |
+## 貢獻者
+<a href="https://github.com/khulnasoft/gpt-computer-agent/graphs/contributors">
+  <img src="https://contrib.rocks/image?repo=khulnasoft/gpt-computer-agent" />
+</a>

build_scripts/openai/macos_build.sh ADDED Viewed

	@@ -0,0 +1,30 @@

+#!/bin/sh
+# Requireed installations
+pip install ".[base]"
+pip install '.[agentic]'
+brew install create-dmg
+pip install pyinstaller==6.9.0
+# Pyinstaller
+pyinstaller --recursive-copy-metadata gpt_computer_agent run.py --windowed --add-data="gpt_computer_agent/utils/media/*":"gpt_computer_agent/utils/media" --icon="gpt_computer_agent/utils/media/icon.icns" --name="GPT_Computer_Agent"
+# Create a DMG
+# Create a folder (named dmg) to prepare our DMG in (if it doesn't already exist).
+mkdir -p dist/dmg
+# Empty the dmg folder.
+rm -r dist/dmg/*
+# Copy the app bundle to the dmg folder.
+cp -r "dist/GPT_Computer_Agent.app" dist/dmg
+# If the DMG already exists, delete it.
+test -f "dist/GPT_Computer_Agent.dmg" && rm "dist/GPT_Computer_Agent.dmg"
+create-dmg \
+  --volname "GPT_Computer_Agent" \
+  --volicon "gpt_computer_agent/utils/media/icon.icns" \
+  --window-pos 200 120 \
+  --window-size 600 300 \
+  --icon-size 100 \
+  --icon "GPT_Computer_Agent.app" 175 120 \
+  --hide-extension "GPT_Computer_Agent.app" \
+  --app-drop-link 425 120 \
+  "dist/GPT_Computer_Agent.dmg" \
+  "dist/dmg/"

build_scripts/openai/windows_build.sh ADDED Viewed

	@@ -0,0 +1,59 @@

+#!/bin/sh
+# Requireed installations
+python -m pip install pyinstaller==6.9.0
+# Pyinstaller
+pip3 install .
+pip3 install crewai==0.30.11
+pip3 install langgraph==0.0.51
+pip3 install pyqt5==5.15.10
+pip3 install scipy==1.13.1
+pip3 install pygame==2.5.2
+pip3 install soundcard==0.4.3
+pip3 install openai==1.30.3
+pip3 install langchain-google-genai==1.0.4
+pip3 install python-dotenv==1.0.0
+pip3 install upsonic==0.28.4
+pip3 install pyautogui==0.9.54
+pip3 install sounddevice==0.4.6
+pip3 install soundfile==0.12.1
+pip3 install pydub==0.25.1
+pip3 install pyscreeze==0.1.30
+pip3 install pyperclip==1.8.2
+pip3 install pydantic==2.7.2
+pip3 install pillow==10.3.0
+pip3 install langchainhub==0.1.18
+pip3 install langchain-experimental==0.0.58
+pip3 install opentelemetry-sdk==1.24.0
+pip3 install opentelemetry-exporter-otlp==1.24.0
+pip3 install langchain-groq==0.1.5
+pip3 install langchain-openai==0.1.6
+pip3 install open-interpreter==0.2.6
+pip3 install langchain==0.1.20
+pip3 install langchain-community==0.0.38
+pip3 install langchain-core==0.1.52
+# custom tools
+pip3 install pyperclip==1.8.2
+pip3 install google==3.0.0
+pip3 install duckduckgo-search==5.3.0
+pip3 install beautifulsoup4==4.12.3
+pip3 install pytesseract==0.3.10
+pip3 install pywifi-controls==0.7
+pip3 install pynput==1.7.7
+pip3 uninstall numpy -y
+pip3 install numpy
+pyinstaller --recursive-copy-metadata gpt_computer_agent run.py --onefile --add-data="gpt_computer_agent/utils/media/*":"gpt_computer_agent/utils/media" --icon="gpt_computer_agent/utils/media/icon.ico" --name="GPT_Computer_Agent"

bump.py ADDED Viewed

	@@ -0,0 +1,135 @@

+"""Module for managing the version updates of a python package."""
+import os
+import sys
+import re
+import logging
+import shlex
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+def read_version():
+    """
+    Gets and extracts the version number from the '__init__.py' file of
+    a Python package.
+    Returns:
+        str or None: The version number of the package if found, otherwise None.
+    """
+    with open("gpt_computer_agent/__init__.py", "r") as file:
+        for line in file:
+            match = re.search(r"__version__ = '(.*)'", line)
+            if match:
+                return match.group(1)
+def increment_version(part, version):
+    """
+    Simple function that increments the version number based on the given part
+    i.e., ('major', 'minor', or 'patch').
+    Notes:
+        Splits the version string into major, minor, and patch components, then
+        increments the specified part by one
+    Args:
+        part (str): The part of the version number to increment
+            ('major', 'minor', or 'patch').
+        version (str): The current version number in 'major.minor.patch' format.
+    Returns:
+        str: String containing new changes made to the version.
+    """
+    major, minor, patch = map(int, version.split("."))
+    if part == "major":
+        major += 1
+        minor = 0
+        patch = 0
+    elif part == "minor":
+        minor += 1
+        patch = 0
+    elif part == "patch":
+        patch += 1
+    return f"{major}.{minor}.{patch}"
+def write_version(version):
+    """
+    Updates the `__version__` variable in the `__init__.py` file of the
+    `gpt_computer_agent` package.
+    Args:
+        version (str): The new version number to replace the existing one.
+    """
+    with open("gpt_computer_agent/__init__.py", "r+") as file:
+        content = file.read()
+        content = re.sub(r"__version__ = '.*'", f"__version__ = '{version}'", content)  # fmt: off
+        file.seek(0)
+        file.write(content)
+def update_version(version):
+    """
+    Updates the version number found in a list of files.
+    Args:
+        version (str): The new version number to replace the existing one.
+    """
+    files = ["setup.py"]
+    for file in files:
+        with open(file, "r+") as f:
+            content = f.read()
+            content = re.sub(r'    version=".*"', f'    version="{version}"', content)  # fmt: off
+            f.seek(0)
+            f.write(content)
+def create_tag(version):
+    """
+    Uses the `os.system()` to create a `Git tag` for a specified version.
+    Args:
+        version (str): The version number for the git tag.
+    """
+    os.system(f"git tag v{shlex.quote(version)}")
+def create_commit(version):
+    """
+    Uses `os.system()` to add and commit the changed version number
+    to the Git repository.
+    Args:
+        version (str): Version number included in the commit message.
+    """
+    os.system("git add .")
+    os.system(f"git commit -m 'Changed version number with v{shlex.quote(version)}'")
+def push():
+    """Pushes changes and tags to the repository."""
+    os.system("git push")
+    os.system("git push --tag")
+def main():
+    """The main function for managing version updates."""
+    valid_parts = ["major", "minor", "patch"]
+    if len(sys.argv) != 2 or sys.argv[1] not in valid_parts:
+        logger.error(f"Usage: python version.py <{'|'.join(valid_parts)}>")
+        sys.exit(1)
+    part = sys.argv[1]
+    version = read_version()
+    new_version = increment_version(part, version)
+    write_version(new_version)
+    update_version(new_version)
+    create_commit(new_version)
+    create_tag(new_version)
+    push()
+if __name__ == "__main__":
+    main()

example_use_cases/workday_summerizer.md ADDED Viewed

	@@ -0,0 +1,55 @@

+# Introduction
+In this example we have an idea to summerize whole day of an employee via GPT Computer Assistant.
+# Code
+```console
+computeragent --api
+```
+```python
+from gpt_computer_agent.remote import remote
+remote.profile("Screen Analysis")
+# We will loop for 5 minutes
+loop_results = []
+for i in range(1000):
+    remote.reset_memory()
+    remote.just_screenshot()
+    detailed_analyses = remote.input("What is in the scren, detailed analyses")
+    app_name = remote.input("What is the app that the employee is using?")
+    subject = remote.input("What is the subject of this usage of the app?")
+    activity = remote.input("What is the employee doing now?")
+    loop_results.append({"detailed_analyses": detailed_analyses, "app_name": app_name, "subject": subject, "activity": activity})
+    remote.wait(10)
+# Summery of the work day
+summery_results = []
+remote.profile("Summerizer")
+remote.reset_memory()
+for i in loop_results:
+    total_string = i["detailed_analyses"] + " " + i["app_name"] + " " + i["subject"] + " " + i["activity"]
+    total_string = "Please summerize the work day" + total_string
+    summerized = remote.input(total_string)
+    summery_results.append(summerized)
+print("Summery: ", summery_results)
+```

gca_setup_generator.py ADDED Viewed

	@@ -0,0 +1,12 @@

+# Read the contents of setup.py
+with open("setup.py", "r") as file:
+    setup_content = file.read()
+# Replace the project name
+setup_content = setup_content.replace(
+    """name="gpt_computer_agent",""", """name="gcadev","""
+)
+# Write the modified content to gca_setup.py
+with open("gca_setup.py", "w") as file:
+    file.write(setup_content)

gpt_computer_agent/__init__.py ADDED Viewed

	@@ -0,0 +1,7 @@

+from .start import start
+from .agentic import Agent
+from .tooler import Tool
+__version__ = '0.22.4'  # fmt: skip

gpt_computer_agent/agent/__init__.py ADDED Viewed

	@@ -0,0 +1,4 @@

+from .agent import *
+from .assistant import *
+from .background import *
+from .chat_history import *

gpt_computer_agent/agent/agent.py ADDED Viewed

	@@ -0,0 +1,80 @@

+try:
+    from ..llm import get_model
+    from ..utils.db import *
+    from ..llm_settings import llm_settings
+    from ..tooler import *
+    from ..display_tools import *
+    from ..teams import *
+    from .agent_tools import get_tools
+except ImportError:
+    from llm import get_model
+    from utils.db import *
+    from llm_settings import llm_settings
+    from tooler import *
+    from display_tools import *
+    from teams import *
+    from agent.agent_tools import get_tools
+from langgraph.prebuilt import chat_agent_executor
+custom_tools_ = []
+def custom_tools():
+    global custom_tools_
+    the_list = []
+    the_list += custom_tools_
+    return the_list
+prompt_cache = {}
+def get_prompt(name):
+    global prompt_cache
+    if name in prompt_cache:
+        return prompt_cache[name]
+    else:
+        from langchain import hub
+        prompt = hub.pull(name)
+        prompt_cache[name] = prompt
+        return prompt
+def get_agent_executor():
+    tools = get_tools()
+    tools += custom_tools()
+    model = load_model_settings()
+    if is_predefined_agents_setting_active() and llm_settings[model]["tools"]:
+        try:
+            import crewai
+            tools += [search_on_internet_and_report_team, generate_code_with_aim_team]
+        except ImportError:
+            pass
+    if llm_settings[model]["provider"] == "openai":
+        tools += [
+            click_on_a_text_on_the_screen,
+            click_on_a_icon_on_the_screen,
+            move_on_a_text_on_the_screen,
+            move_on_a_icon_on_the_screen,
+            mouse_scroll,
+        ]
+    tools += [get_texts_on_the_screen]
+    if (
+        llm_settings[model]["provider"] == "openai"
+        or llm_settings[model]["provider"] == "groq"
+    ):
+        return chat_agent_executor.create_tool_calling_executor(get_model(), tools)
+    if llm_settings[model]["provider"] == "ollama":
+        print("Ollama tool len", len(tools))
+        return chat_agent_executor.create_tool_calling_executor(get_model(), tools)

gpt_computer_agent/agent/agent_tools.py ADDED Viewed

	@@ -0,0 +1,64 @@

+try:
+    from ..utils.db import *
+    from ..tooler import *
+    from ..display_tools import *
+    from ..teams import *
+    from ..llm_settings import each_message_extension, llm_settings
+except ImportError:
+    from utils.db import *
+    from tooler import *
+    from display_tools import *
+    from teams import *
+    from llm_settings import llm_settings
+custom_tools = []
+def load_tiger_tools():
+    try:
+        from upsonic import Tiger
+        tools = Tiger()
+        tools.enable_auto_requirements = True
+        tools = tools.langchain()
+        return tools
+    except:
+        return False
+def load_default_tools():
+    from ..standard_tools import get_standard_tools
+    return get_standard_tools()
+cached_tiger_tools = None
+def get_tiger_tools():
+    global cached_tiger_tools
+    if cached_tiger_tools is None:
+        cached_tiger_tools = load_tiger_tools()
+    return cached_tiger_tools
+if is_online_tools_setting_active():
+    get_tiger_tools()
+def get_tools():
+    model = load_model_settings()
+    if not llm_settings[model]["tools"]:
+        return []
+    if is_online_tools_setting_active():
+        tools = get_tiger_tools()
+        if not tools:
+            tools = load_default_tools()
+    else:
+        tools = load_default_tools()
+    return tools

gpt_computer_agent/agent/assistant.py ADDED Viewed

	@@ -0,0 +1,234 @@

+from langchain_core.messages import HumanMessage, SystemMessage, AIMessage
+from .chat_history import *
+from .agent import *
+try:
+    from ..screen.shot import *
+    from ..utils.db import load_model_settings, agents
+    from ..llm import get_model
+    from ..llm_settings import each_message_extension, llm_settings
+except ImportError:
+    from screen.shot import *
+    from utils.db import load_model_settings, agents
+    from llm import get_model
+    from llm_settings import each_message_extension, llm_settings
+config = {"configurable": {"thread_id": "abc123"}}
+def agentic(
+    llm_input, llm_history, client, screenshot_path=None, dont_save_image=False
+):
+    global agents
+    from crewai import Task, Crew
+    from crewai import Agent as crewai_Agent
+    the_agents = []
+    for each in agents:
+        the_agents.append(
+            crewai_Agent(
+                role=each["role"],
+                goal=each["goal"],
+                backstory=each["backstory"],
+                llm=get_model(high_context=True),
+            )
+        )
+    agents = the_agents
+    print("LLM INPUT", llm_input)
+    def image_explaination():
+        the_message = [
+            {"type": "text", "text": "Explain the image"},
+        ]
+        if screenshot_path:
+            base64_image = encode_image(screenshot_path)
+            the_message.append(
+                {
+                    "type": "image_url",
+                    "image_url": {"url": f"data:image/jpeg;base64,{base64_image}"},
+                },
+            )
+            print("LEN OF İMAGE", len(base64_image))
+        the_message = HumanMessage(content=the_message)
+        get_chat_message_history().add_message(the_message)
+        the_model = load_model_settings()
+        if (
+            llm_settings[the_model]["provider"] == "openai"
+            and llm_settings[the_model]["provider"] == "ollama"
+        ):
+            msg = get_agent_executor().invoke(
+                {"messages": llm_history + [the_message]}, config=config
+            )
+        if llm_settings[the_model]["provider"] == "google":
+            msg = get_agent_executor().invoke(
+                {"messages": llm_history + [the_message]}, config=config
+            )
+        the_last_messages = msg["messages"]
+        return the_last_messages[-1].content
+    if screenshot_path:
+        image_explain = image_explaination()
+        llm_input += "User Sent Image and image content is: " + image_explain
+    llm_input = llm_input + each_message_extension
+    task = Task(
+        description=llm_input,
+        expected_output="Answer",
+        agent=agents[0],
+        tools=get_tools(),
+    )
+    the_crew = Crew(
+        agents=agents,
+        tasks=[task],
+        full_output=True,
+        verbose=True,
+    )
+    result = the_crew.kickoff()["final_output"]
+    get_chat_message_history().add_message(
+        HumanMessage(content=[llm_input.replace(each_message_extension, "")])
+    )
+    get_chat_message_history().add_message(AIMessage(content=[result]))
+    return result
+def assistant(
+    llm_input, llm_history, client, screenshot_path=None, dont_save_image=False
+):
+    the_model = load_model_settings()
+    if len(agents) != 0:
+        print("Moving to Agentic")
+        return agentic(llm_input, llm_history, client, screenshot_path, dont_save_image)
+    print("LLM INPUT", llm_input)
+    if llm_settings[the_model]["tools"]:
+        llm_input = llm_input + each_message_extension
+    the_message = [
+        {"type": "text", "text": f"{llm_input}"},
+    ]
+    if screenshot_path:
+        base64_image = encode_image(screenshot_path)
+        if llm_settings[the_model]["provider"] == "ollama":
+            the_message.append(
+                {
+                    "type": "image_url",
+                    "image_url": base64_image,
+                },
+            )
+        else:
+            the_message.append(
+                {
+                    "type": "image_url",
+                    "image_url": {"url": f"data:image/jpeg;base64,{base64_image}"},
+                },
+            )
+        print("LEN OF IMAGE", len(base64_image))
+    the_message = HumanMessage(content=the_message)
+    get_chat_message_history().add_message(the_message)
+    if (
+        llm_settings[the_model]["provider"] == "openai"
+        or llm_settings[the_model]["provider"] == "ollama"
+    ):
+        msg = get_agent_executor().invoke(
+            {"messages": llm_history + [the_message]}, config=config
+        )
+    if llm_settings[the_model]["provider"] == "google":
+        the_history = []
+        for message in llm_history:
+            try:
+                if isinstance(message, SystemMessage):
+                    the_mes = HumanMessage(content=message.content[0]["text"])
+                    the_history.append(the_mes)
+                elif isinstance(message, HumanMessage):
+                    the_mes = HumanMessage(content=message.content[0]["text"])
+                    the_history.append(the_mes)
+                else:
+                    the_mes = AIMessage(content=message.content[0]["text"])
+                    the_history.append(the_mes)
+            except:
+                the_mes = AIMessage(content=message.content)
+                the_history.append(the_mes)
+        the_last_message = HumanMessage(content=llm_input)
+        msg = get_agent_executor().invoke(
+            {"messages": the_history + [the_last_message]}, config=config
+        )
+    elif llm_settings[the_model]["provider"] == "groq":
+        the_history = []
+        for message in llm_history:
+            try:
+                if isinstance(message, SystemMessage):
+                    the_mes = SystemMessage(content=message.content[0]["text"])
+                    the_history.append(the_mes)
+                elif isinstance(message, HumanMessage):
+                    the_mes = HumanMessage(content=message.content[0]["text"])
+                    the_history.append(the_mes)
+                else:
+                    the_mes = AIMessage(content=message.content[0]["text"])
+                    the_history.append(the_mes)
+            except:
+                the_mes = AIMessage(content=message.content)
+                the_history.append(the_mes)
+        the_last_message = HumanMessage(content=llm_input)
+        msg = get_agent_executor().invoke(
+            {"messages": the_history + [the_last_message]}, config=config
+        )
+    the_last_messages = msg["messages"]
+    if dont_save_image and screenshot_path is not None:
+        currently_messages = get_chat_message_history().messages
+        last_message = currently_messages[-1].content[0]
+        currently_messages.remove(currently_messages[-1])
+        get_chat_message_history().clear()
+        for message in currently_messages:
+            get_chat_message_history().add_message(message)
+        get_chat_message_history().add_message(HumanMessage(content=[last_message]))
+    get_chat_message_history().add_message(the_last_messages[-1])
+    # Replace each_message_extension with empty string
+    list_of_messages = get_chat_message_history().messages
+    get_chat_message_history().clear()
+    for message in list_of_messages:
+        try:
+            message.content[0]["text"] = message.content[0]["text"].replace(
+                each_message_extension, ""
+            )
+            get_chat_message_history().add_message(message)
+        except:
+            get_chat_message_history().add_message(message)
+    print("The return", the_last_messages[-1].content)
+    return the_last_messages[-1].content

gpt_computer_agent/agent/background.py ADDED Viewed

	@@ -0,0 +1,21 @@

+from langchain_core.messages import SystemMessage
+try:
+    from .chat_history import *
+    from ..llm_settings import first_message
+except ImportError:
+    from agent.chat_history import *
+    from llm_settings import first_message
+def llm_history_oiginal():
+    return [
+        SystemMessage(
+            content=[
+                {
+                    "type": "text",
+                    "text": first_message(),
+                }
+            ]
+        ),
+    ]

gpt_computer_agent/agent/chat_history.py ADDED Viewed

	@@ -0,0 +1,31 @@

+from langchain_community.chat_message_histories import SQLChatMessageHistory
+from .background import llm_history_oiginal
+try:
+    from ..utils.db import get_history_db
+    from ..utils.db import load_model_settings, agents
+    from ..llm_settings import each_message_extension, llm_settings
+except ImportError:
+    from utils.db import get_history_db
+    from utils.db import load_model_settings
+    from llm_settings import llm_settings
+def get_chat_message_history():
+    connection = SQLChatMessageHistory(
+        session_id="abc123", connection_string=f"sqlite:///{get_history_db()}"
+    )
+    if len(connection.messages) == 0:
+        the_model = load_model_settings()
+        if llm_settings[the_model]["tools"]:
+            connection.add_message(llm_history_oiginal()[0])
+    return connection
+def clear_chat_history():
+    get_chat_message_history().clear()
+    the_model = load_model_settings()
+    if llm_settings[the_model]["tools"]:
+        get_chat_message_history().add_message(llm_history_oiginal()[0])

gpt_computer_agent/agent/process.py ADDED Viewed

	@@ -0,0 +1,299 @@

+try:
+    from ..llm import *
+    from .assistant import *
+    from .chat_history import *
+    from ..audio.tts import text_to_speech
+    from ..audio.stt import speech_to_text
+    from ..audio.record import audio_data
+    from ..gui.signal import signal_handler
+    from ..utils.db import *
+    from ..utils.telemetry import my_tracer, os_name
+except ImportError:
+    from llm import *
+    from agent.assistant import *
+    from agent.chat_history import *
+    from audio.tts import text_to_speech
+    from audio.stt import speech_to_text
+    from gui.signal import signal_handler
+    from utils.db import *
+    from utils.telemetry import my_tracer, os_name
+import threading
+import traceback
+from pygame import mixer
+import time
+last_ai_response = None
+user_id = load_user_id()
+os_name_ = os_name()
+def tts_if_you_can(
+    text: str, not_threaded=False, status_edit=False, bypass_other_settings=False
+):
+    try:
+        try:
+            from ..gpt_computer_agent import the_main_window
+        except ImportError:
+            from gpt_computer_agent import the_main_window
+        first_control = None
+        try:
+            first_control = (
+                not is_just_text_model_active() and not the_main_window.api_enabled
+            )
+        except:
+            first_control = False
+        if first_control or bypass_other_settings:
+            response_path = text_to_speech(text)
+            if status_edit:
+                signal_handler.assistant_response_ready.emit()
+            def play_audio():
+                for each_r in response_path:
+                    mixer.init()
+                    mixer.music.load(each_r)
+                    mixer.music.play()
+                    while mixer.music.get_busy():
+                        the_stop_talking = False
+                        try:
+                            the_stop_talking = the_main_window.stop_talking
+                        except:
+                            pass
+                        if the_stop_talking:
+                            mixer.music.stop()
+                            break
+                        time.sleep(0.1)
+                if status_edit:
+                    signal_handler.assistant_response_stopped.emit()
+            if not not_threaded:
+                playback_thread = threading.Thread(target=play_audio)
+                playback_thread.start()
+            else:
+                play_audio()
+    except Exception:
+        traceback.print_exc()
+        pass
+def process_audio(take_screenshot=True, take_system_audio=False, dont_save_image=False):
+    with my_tracer.start_span("process_audio") as span:
+        span.set_attribute("user_id", user_id)
+        span.set_attribute("os_name", os_name_)
+        try:
+            global audio_data, last_ai_response
+            from ..gpt_computer_agent import the_input_box, the_main_window
+            from ..audio.record import audio_data, the_input_box_pre
+            transcription = speech_to_text(mic_record_location)
+            if take_system_audio:
+                transcription2 = speech_to_text(system_sound_location)
+            llm_input = transcription
+            print("Previously AI response", last_ai_response, "end prev")
+            print("Input Box AI", the_input_box_pre)
+            if (
+                the_input_box_pre != ""
+                and not the_input_box_pre.startswith("System:")
+                and the_input_box_pre not in last_ai_response
+            ):
+                llm_input += the_input_box_pre
+            if take_system_audio:
+                llm_input += " \n Other of USER: " + transcription2
+            if the_input_box.toPlainText().startswith("System:"):
+                the_main_window.update_from_thread(
+                    "Transciption Completed. Running AI..."
+                )
+            print("LLM INPUT (screenshot)", llm_input)
+            llm_output = assistant(
+                llm_input,
+                get_chat_message_history().messages,
+                get_client(),
+                screenshot_path=screenshot_path if take_screenshot else None,
+                dont_save_image=dont_save_image,
+            )
+            if the_input_box.toPlainText().startswith("System:"):
+                the_main_window.update_from_thread(
+                    "AI Response Completed. Generating Audio..."
+                )
+            last_ai_response = llm_output.replace("<Answer>", "")
+            from ..gpt_computer_agent import the_main_window
+            model = load_model_settings()
+            if not llm_settings[model][
+                "stream"
+            ] or the_main_window.worker.the_input_text.startswith("System:"):
+                the_main_window.set_text_to_input_box(last_ai_response)
+                the_main_window.complated_answer = True
+            signal_handler.assistant_response_ready.emit()
+            def play_text():
+                from ..gpt_computer_agent import the_main_window
+                the_main_window.complated_answer = True
+                the_main_window.manuel_stop = True
+                while (
+                    the_main_window.reading_thread or the_main_window.reading_thread_2
+                ):
+                    time.sleep(0.1)
+                the_main_window.read_part_task()
+                if the_main_window.stop_talking:
+                    the_main_window.stop_talking = False
+                signal_handler.assistant_response_stopped.emit()
+            playback_thread = threading.Thread(target=play_text)
+            playback_thread.start()
+        except Exception as e:
+            print("Error in process_audio", e)
+            traceback.print_exc()
+            from ..gpt_computer_agent import the_input_box, the_main_window
+            the_main_window.update_from_thread("EXCEPTION: " + str(e))
+            tts_if_you_can("Exception occurred. Please check the logs.")
+            signal_handler.assistant_response_stopped.emit()
+def process_screenshot():
+    with my_tracer.start_span("process_screenshot") as span:
+        span.set_attribute("user_id", user_id)
+        span.set_attribute("os_name", os_name_)
+        try:
+            global last_ai_response
+            from ..gpt_computer_agent import the_input_box, the_main_window
+            from ..audio.record import the_input_box_pre
+            llm_input = "I just take a screenshot. for you to remember. Just say 'Ok.' if the user doesnt want anything before."
+            if (
+                the_input_box_pre != ""
+                and not the_input_box_pre.startswith("System:")
+                and the_input_box_pre not in last_ai_response
+            ):
+                llm_input += the_input_box_pre
+            print("LLM INPUT (just screenshot)", llm_input)
+            if the_input_box.toPlainText().startswith("System:"):
+                the_main_window.update_from_thread(
+                    "Transciption Completed. Running AI..."
+                )
+            llm_output = assistant(
+                llm_input,
+                get_chat_message_history().messages,
+                get_client(),
+                screenshot_path=just_screenshot_path,
+                dont_save_image=False,
+            )
+            last_ai_response = llm_output.replace("<Answer>", "")
+            from ..gpt_computer_agent import the_main_window
+            model = load_model_settings()
+            if not llm_settings[model][
+                "stream"
+            ] or the_main_window.worker.the_input_text.startswith("System:"):
+                the_main_window.set_text_to_input_box(last_ai_response)
+                the_main_window.complated_answer = True
+            signal_handler.assistant_response_ready.emit()
+            def play_text():
+                from ..gpt_computer_agent import the_main_window
+                the_main_window.complated_answer = True
+                the_main_window.manuel_stop = True
+                while (
+                    the_main_window.reading_thread or the_main_window.reading_thread_2
+                ):
+                    time.sleep(0.1)
+                the_main_window.read_part_task()
+                if the_main_window.stop_talking:
+                    the_main_window.stop_talking = False
+                signal_handler.assistant_response_stopped.emit()
+            playback_thread = threading.Thread(target=play_text)
+            playback_thread.start()
+        except Exception as e:
+            print("Error in process_screenshot", e)
+            traceback.print_exc()
+            from ..gpt_computer_agent import the_input_box, the_main_window
+            the_main_window.update_from_thread("EXCEPTION: " + str(e))
+            tts_if_you_can("Exception occurred. Please check the logs.")
+            signal_handler.assistant_response_stopped.emit()
+def process_text(text, screenshot_path=None):
+    with my_tracer.start_span("process_text") as span:
+        span.set_attribute("user_id", user_id)
+        span.set_attribute("os_name", os_name_)
+        try:
+            global last_ai_response
+            llm_input = text
+            llm_output = assistant(
+                llm_input,
+                get_chat_message_history().messages,
+                get_client(),
+                screenshot_path=screenshot_path,
+                dont_save_image=True,
+            )
+            last_ai_response = llm_output.replace("<Answer>", "")
+            from ..gpt_computer_agent import the_main_window
+            model = load_model_settings()
+            if not llm_settings[model][
+                "stream"
+            ] or the_main_window.worker.the_input_text.startswith("System:"):
+                the_main_window.set_text_to_input_box(last_ai_response)
+                the_main_window.complated_answer = True
+            signal_handler.assistant_response_ready.emit()
+            def play_text():
+                from ..gpt_computer_agent import the_main_window
+                the_main_window.complated_answer = True
+                the_main_window.manuel_stop = True
+                while (
+                    the_main_window.reading_thread or the_main_window.reading_thread_2
+                ):
+                    time.sleep(0.1)
+                the_main_window.read_part_task()
+                if the_main_window.stop_talking:
+                    the_main_window.stop_talking = False
+                signal_handler.assistant_response_stopped.emit()
+            playback_thread = threading.Thread(target=play_text)
+            playback_thread.start()
+        except Exception as e:
+            print("Error in process_text", e)
+            traceback.print_exc()
+            from ..gpt_computer_agent import the_main_window
+            the_main_window.update_from_thread("EXCEPTION: " + str(e))
+            tts_if_you_can("Exception occurred. Please check the logs.")
+            signal_handler.assistant_response_stopped.emit()

gpt_computer_agent/agentic.py ADDED Viewed

	@@ -0,0 +1,36 @@

+from .utils.db import agents
+class Agent:
+    """
+    Represents an agent within the system.
+    This class defines an agent with a specific role, goal, and backstory. Upon initialization,
+    the agent is added to the global list of agents.
+    Attributes:
+    - role (str): The role of the agent.
+    - goal (str): The goal or objective of the agent.
+    - backstory (str): The backstory or history of the agent.
+    Methods:
+    - __init__(role, goal, backstory): Initializes the Agent object and adds it to the global list of agents.
+    Global Variables:
+    - agents (list): A global list containing information about all agents in the system.
+    """
+    def __init__(self, role, goal, backstory):
+        """
+        Initializes a new Agent object and adds it to the global list of agents.
+        Parameters:
+        - role (str): The role of the agent.
+        - goal (str): The goal or objective of the agent.
+        - backstory (str): The backstory or history of the agent.
+        Returns:
+        None
+        """
+        global agents
+        agents.append({"role": role, "goal": goal, "backstory": backstory})

gpt_computer_agent/api.py ADDED Viewed

	@@ -0,0 +1,673 @@

+# Create a python api and start_api function via flask
+from flask import Flask, request, jsonify
+import threading
+import time
+from werkzeug.serving import make_server
+app = Flask(__name__)
+@app.route("/status", methods=["POST"])
+def status():
+    return jsonify({"response": True})
+@app.route("/input", methods=["POST"])
+def input():
+    """
+    This function receives input from the user and returns the response.
+    """
+    data = request.json
+    text = data["text"]
+    screen = data["screen"]
+    talk = data["talk"]
+    print("Input:", text)
+    from .gpt_computer_agent import the_main_window, the_input_box
+    firsst_text = the_input_box.toPlainText()
+    original_tts = the_main_window.tts_available
+    if talk == "true":
+        the_main_window.tts_available = True
+        the_main_window.manuel_stop = True
+    if screen != "true":
+        the_main_window.button_handler.input_text(text)
+    else:
+        the_main_window.button_handler.input_text_screenshot(text)
+    while the_input_box.toPlainText() == firsst_text:
+        time.sleep(0.3)
+    while the_input_box.toPlainText().startswith("System:"):
+        time.sleep(0.3)
+    while not the_main_window.state == "idle":
+        time.sleep(0.3)
+    response = the_input_box.toPlainText()
+    the_main_window.tts_available = original_tts
+    return jsonify({"response": response})
+@app.route("/screenshot", methods=["POST"])
+def screenshot():
+    """
+    This function receives a screenshot from the user and returns the response.
+    """
+    from .gpt_computer_agent import the_main_window, the_input_box
+    firsst_text = the_input_box.toPlainText()
+    the_main_window.button_handler.just_screenshot()
+    while the_input_box.toPlainText() == firsst_text:
+        time.sleep(0.3)
+    while the_input_box.toPlainText().startswith("System:"):
+        time.sleep(0.3)
+    while not the_main_window.state == "idle":
+        time.sleep(0.3)
+    response = the_input_box.toPlainText()
+    return jsonify({"response": response})
+@app.route("/tts", methods=["POST"])
+def tts():
+    """
+    This function receives a text to speech request from the user and returns the response.
+    """
+    from .gpt_computer_agent import the_main_window
+    original_tts = the_main_window.tts_available
+    the_main_window.tts_available = True
+    the_main_window.manuel_stop = True
+    data = request.json
+    text = data["text"]
+    print("TTS:", text)
+    from .agent.process import tts_if_you_can
+    tts_if_you_can(
+        text, not_threaded=False, status_edit=True, bypass_other_settings=True
+    )
+    the_main_window.tts_available = original_tts
+    return jsonify({"response": "TTS request received"})
+@app.route("/profile", methods=["POST"])
+def profile():
+    """
+    This function sets the profile for the application.
+    """
+    data = request.json
+    profile = data["profile"]
+    print("Profile:", profile)
+    from .utils.db import set_profile
+    set_profile(profile)
+    from .gpt_computer_agent import the_main_window
+    the_main_window.update_from_thread("Profile set to " + profile)
+    return jsonify({"response": "Profile set to " + profile})
+@app.route("/reset_memory", methods=["POST"])
+def reset_memory():
+    """
+    This function resets the memory of the application.
+    """
+    from .agent.chat_history import clear_chat_history
+    clear_chat_history()
+    from .gpt_computer_agent import the_main_window
+    the_main_window.update_from_thread("Memory reset")
+    return jsonify({"response": "Memory reset"})
+@app.route("/activate_predefined_agents", methods=["POST"])
+def enable_predefined_agents():
+    """
+    This function enables predefined agents for the application.
+    """
+    from .utils.db import activate_predefined_agents_setting
+    activate_predefined_agents_setting()
+    from .gpt_computer_agent import the_main_window
+    the_main_window.update_from_thread("Predefined agents enabled")
+    return jsonify({"response": "Predefined agents enabled"})
+@app.route("/deactivate_predefined_agents", methods=["POST"])
+def disable_predefined_agents():
+    """
+    This function disables predefined agents for the application.
+    """
+    from .utils.db import deactivate_predefined_agents_setting
+    deactivate_predefined_agents_setting()
+    from .gpt_computer_agent import the_main_window
+    the_main_window.update_from_thread("Predefined agents disabled")
+    return jsonify({"response": "Predefined agents disabled"})
+@app.route("/activate_online_tools", methods=["POST"])
+def enable_online_tools():
+    """
+    This function enables online tools for the application.
+    """
+    from .utils.db import activate_online_tools_setting
+    activate_online_tools_setting()
+    from .gpt_computer_agent import the_main_window
+    the_main_window.update_from_thread("Online tools enabled")
+    return jsonify({"response": "Online tools enabled"})
+@app.route("/deactivate_online_tools", methods=["POST"])
+def disable_online_tools():
+    """
+    This function disables online tools for the application.
+    """
+    from .utils.db import deactivate_online_tools_setting
+    deactivate_online_tools_setting()
+    from .gpt_computer_agent import the_main_window
+    the_main_window.update_from_thread("Online tools disabled")
+    return jsonify({"response": "Online tools disabled"})
+@app.route("/change_name", methods=["POST"])
+def change_name():
+    """
+    This function changes the name of the application.
+    """
+    data = request.json
+    new_name = data["new_name"]
+    print("Name:", new_name)
+    from .character import change_name
+    change_name(new_name)
+    return jsonify({"response": "Name changed to " + new_name})
+@app.route("/change_developer", methods=["POST"])
+def change_developer():
+    """
+    This function changes the developer of the application.
+    """
+    data = request.json
+    new_developer = data["new_developer"]
+    print("Developer:", new_developer)
+    from .character import change_developer
+    change_developer(new_developer)
+    return jsonify({"response": "Developer changed to " + new_developer})
+@app.route("/library_install", methods=["POST"])
+def library_install():
+    """
+    This function install a library.
+    """
+    data = request.json
+    library = data["library"]
+    print("Library İnstall:", library)
+    from .utils.pypi import install_library
+    if install_library(library):
+        return jsonify({"response": f"Library {library} installed"})
+    else:
+        return jsonify({"response": f"Library {library} installation failed"})
+@app.route("/library_uninstall", methods=["POST"])
+def library_uninstall():
+    """
+    This function uninstall a library.
+    """
+    data = request.json
+    library = data["library"]
+    print("Library Uninstall:", library)
+    from .utils.pypi import uninstall_library
+    if uninstall_library(library):
+        return jsonify({"response": f"Library {library} uninstalled"})
+    else:
+        return jsonify({"response": f"Library {library} uninstallation failed"})
+@app.route("/custom_tool", methods=["POST"])
+def custom_tool():
+    """
+    This function adds a custom tool to the application.
+    """
+    data = request.json
+    code = data["code"]
+    print("Custom Tool:", code)
+    from .utils.function import string_to_function
+    try:
+        func = string_to_function(code)
+        from .tooler import Tool
+        Tool(func)
+        return jsonify({"response": f"Custom tool {func.__name__} added"})
+    except Exception as e:
+        return jsonify({"response": f"Custom tool addition failed: {e}"}), 500
+@app.route("/top_bar_activate", methods=["POST"])
+def top_bar_activate():
+    """
+    This function serve an animation of top bar to show an operations especialy
+    """
+    from .gpt_computer_agent import the_main_window
+    data = request.json
+    text = data["text"]
+    the_main_window.active_border_animation(text)
+    return jsonify({"response": "Activated top bar animation"})
+@app.route("/top_bar_deactivate", methods=["POST"])
+def top_bar_deactivate():
+    """
+    This function stop the top bar animation
+    """
+    from .gpt_computer_agent import the_main_window
+    data = request.json
+    text = data["text"]
+    the_main_window.deactive_border_animation(text)
+    return jsonify({"response": "Deactivated top bar animation"})
+@app.route("/boop_sound", methods=["POST"])
+def boop_sound():
+    """
+    This function sound an boop to user
+    """
+    from .gpt_computer_agent import click_sound
+    click_sound()
+    return jsonify({"response": "Sound played"})
+@app.route("/ask_to_user", methods=["POST"])
+def ask_to_user():
+    """
+    This api asks question to the user and return the result
+    """
+    data = request.json
+    question = data["question"]
+    wait_for_answer = data["wait_for_answer"]
+    from .standard_tools import ask_to_user
+    result = ask_to_user(question, wait_for_answer)
+    return jsonify({"response": result})
+@app.route("/set_text", methods=["POST"])
+def set_text():
+    """
+    This api set text to main window text input
+    """
+    data = request.json
+    text = data["text"]
+    from .gpt_computer_agent import the_main_window
+    the_main_window.set_text_from_api(text)
+    return jsonify({"response": "Text set."})
+@app.route("/set_background_color", methods=["POST"])
+def set_background_color():
+    """
+    This api set text to main window text input
+    """
+    data = request.json
+    color = data["color"]
+    from .gpt_computer_agent import the_main_window
+    the_main_window.set_background_color(color)
+    return jsonify({"response": "Background color set."})
+@app.route("/set_opacity", methods=["POST"])
+def set_opacity():
+    """
+    This api set text to main window text input
+    """
+    data = request.json
+    opacity = data["opacity"]
+    from .gpt_computer_agent import the_main_window
+    the_main_window.set_opacity(opacity)
+    return jsonify({"response": "Opacity set."})
+@app.route("/set_border_radius", methods=["POST"])
+def set_border_radius():
+    """
+    This api set text to main window text input
+    """
+    data = request.json
+    radius = data["radius"]
+    from .gpt_computer_agent import the_main_window
+    the_main_window.set_border_radius(radius)
+    return jsonify({"response": "Border radius set."})
+@app.route("/collapse", methods=["POST"])
+def collapse():
+    """
+    This api set text to main window text input
+    """
+    from .gpt_computer_agent import the_main_window
+    the_main_window.collapse_gca_api()
+    return jsonify({"response": "Collapsed."})
+@app.route("/expand", methods=["POST"])
+def expand():
+    """
+    This api set text to main window text input
+    """
+    from .gpt_computer_agent import the_main_window
+    the_main_window.uncollapse_gca_api()
+    return jsonify({"response": "Expanded."})
+@app.route("/save_openai_api_key", methods=["POST"])
+def save_openai_api_key():
+    """
+    This api saves the OpenAI API key
+    """
+    data = request.json
+    openai_api_key = data["openai_api_key"]
+    from .utils.db import save_api_key
+    save_api_key(openai_api_key)
+    return jsonify({"response": "OpenAI API key saved."})
+@app.route("/save_openai_url", methods=["POST"])
+def save_openai_url():
+    """
+    This api saves the OpenAI base URL
+    """
+    data = request.json
+    openai_url = data["openai_url"]
+    from .utils.db import save_openai_url
+    save_openai_url(openai_url)
+    return jsonify({"response": "OpenAI base URL saved."})
+@app.route("/save_model_settings", methods=["POST"])
+def save_model_settings():
+    """
+    This api saves the model settings
+    """
+    data = request.json
+    model_settings = data["model_settings"]
+    from .utils.db import save_model_settings
+    save_model_settings(model_settings)
+    return jsonify({"response": "Model settings saved."})
+@app.route("/save_groq_api_key", methods=["POST"])
+def save_groq_api_key():
+    """
+    This api saves the Groq API key
+    """
+    data = request.json
+    groq_api_key = data["groq_api_key"]
+    from .utils.db import save_groq_api_key
+    save_groq_api_key(groq_api_key)
+    return jsonify({"response": "Groq API key saved."})
+@app.route("/save_google_api_key", methods=["POST"])
+def save_google_api_key():
+    """
+    This api saves the Google Generative AI API key
+    """
+    data = request.json
+    google_api_key = data["google_api_key"]
+    from .utils.db import save_google_api_key
+    save_google_api_key(google_api_key)
+    return jsonify({"response": "Google Generative AI API key saved."})
+@app.route("/save_tts_model_settings", methods=["POST"])
+def save_tts_model_settings():
+    """
+    This api saves the TTS model settings
+    """
+    data = request.json
+    tts_model_settings = data["tts_model_settings"]
+    from .utils.db import save_tts_model_settings
+    save_tts_model_settings(tts_model_settings)
+    return jsonify({"response": "TTS model settings saved."})
+@app.route("/save_stt_model_settings", methods=["POST"])
+def save_stt_model_settings():
+    """
+    This api saves the STT model settings
+    """
+    data = request.json
+    stt_model_settings = data["stt_model_settings"]
+    from .utils.db import save_stt_model_settings
+    save_stt_model_settings(stt_model_settings)
+    return jsonify({"response": "STT model settings saved."})
+@app.route("/show_logo", methods=["POST"])
+def show_logo():
+    """
+    This api shows the custom logo
+    """
+    from .utils.db import activate_logo_active_setting
+    activate_logo_active_setting()
+    from .gpt_computer_agent import the_main_window
+    the_main_window.show_logo_api()
+    return jsonify({"response": "Custom logo activated."})
+@app.route("/hide_logo", methods=["POST"])
+def hide_logo():
+    """
+    This api hides the custom logo
+    """
+    from .utils.db import deactivate_logo_active_setting
+    deactivate_logo_active_setting()
+    from .gpt_computer_agent import the_main_window
+    the_main_window.hide_logo_api()
+    return jsonify({"response": "Custom logo deactivated."})
+@app.route("/default_logo", methods=["POST"])
+def default_logo():
+    """
+    This api enable default logo
+    """
+    from .utils.db import (
+        save_logo_file_path,
+        icon_256_path,
+        is_logo_active_setting_active,
+    )
+    save_logo_file_path(icon_256_path)
+    from .gpt_computer_agent import the_main_window
+    the_main_window.tray_and_task_bar_logo_api()
+    if is_logo_active_setting_active():
+        the_main_window.show_logo_api()
+    return jsonify({"response": "Custom logo deactivated."})
+@app.route("/custom_logo_upload", methods=["POST"])
+def custom_logo_upload():
+    """
+    This api uploads a custom logo
+    """
+    file = request.files["logo"]
+    from .utils.db import (
+        save_logo_file_path,
+        custom_logo_path,
+        is_logo_active_setting_active,
+    )
+    file.save(custom_logo_path)
+    save_logo_file_path(custom_logo_path)
+    from .gpt_computer_agent import the_main_window
+    the_main_window.tray_and_task_bar_logo_api()
+    if is_logo_active_setting_active():
+        the_main_window.show_logo_api()
+    return jsonify({"response": "Custom logo uploaded."})
+@app.route("/activate_long_gca", methods=["POST"])
+def activate_long_gca():
+    """
+    This api activates long GCA
+    """
+    from .gpt_computer_agent import the_main_window
+    the_main_window.activate_long_gca_api()
+    return jsonify({"response": "Long GCA activated."})
+@app.route("/deactivate_long_gca", methods=["POST"])
+def deactivate_long_gca():
+    """
+    This api deactivates long GCA
+    """
+    from .gpt_computer_agent import the_main_window
+    the_main_window.deactivate_long_gca_api()
+    return jsonify({"response": "Long GCA deactivated."})
+@app.route("/train", methods=["POST"])
+def train():
+    """
+    This api trains the gca with given url
+    """
+    data = request.json
+    url = data["url"]
+    from .utils.train import train
+    the_result = train(url)
+    return jsonify({"response": the_result})
+@app.route("/get_openai_models", methods=["POST"])
+def get_openai_models():
+    """
+    This api returns the list of OpenAI models
+    """
+    from .llm_settings import get_openai_models
+    return jsonify({"response": get_openai_models()})
+@app.route("/get_ollama_models", methods=["POST"])
+def get_ollama_models():
+    """
+    This api returns the list of Ollama models
+    """
+    from .llm_settings import get_ollama_models
+    return jsonify({"response": get_ollama_models()})
+@app.route("/get_google_models", methods=["POST"])
+def get_google_models():
+    """
+    This api returns the list of Google models
+    """
+    from .llm_settings import get_google_models
+    return jsonify({"response": get_google_models()})
+@app.route("/get_groq_models", methods=["POST"])
+def get_groq_models():
+    """
+    This api returns the list of Groq models
+    """
+    from .llm_settings import get_groq_models
+    return jsonify({"response": get_groq_models()})
+class ServerThread(threading.Thread):
+    def __init__(self, app, host, port):
+        threading.Thread.__init__(self)
+        self.srv = make_server(host, port, app)
+        self.ctx = app.app_context()
+        self.ctx.push()
+    def run(self):
+        print("Starting server")
+        self.srv.serve_forever()
+    def shutdown(self):
+        print("Stopping server")
+        self.srv.shutdown()
+server_thread = None
+def start_api():
+    global server_thread
+    if server_thread is None:
+        server_thread = ServerThread(app, "localhost", 7541)
+        server_thread.start()
+        print("API started")
+    else:
+        print("API is already running")
+def stop_api():
+    global server_thread
+    if server_thread is not None:
+        server_thread.shutdown()
+        server_thread.join()
+        server_thread = None
+        print("API stopped")
+    else:
+        print("API is not running")

gpt_computer_agent/audio/__init__.py ADDED Viewed

	@@ -0,0 +1 @@


1	+ from .record import *

gpt_computer_agent/audio/record.py ADDED Viewed

	@@ -0,0 +1,159 @@

+try:
+    from ..gui.signal import *
+    from ..utils.db import *
+    from ..utils.telemetry import my_tracer, os_name
+except ImportError:
+    from gui.signal import *
+    from utils.db import *
+    from utils.telemetry import my_tracer, os_name
+import numpy as np
+import sounddevice as sd
+import soundfile as sf
+import scipy.io.wavfile as wavfile
+import soundcard as sc
+import threading
+import time
+from scipy.io.wavfile import write
+samplerate = 48000  # Updated samplerate for better quality
+channels = 1
+recording = False
+audio_data = None
+user_id = load_user_id()
+os_name_ = os_name()
+the_input_box_pre = ""
+import queue
+# Initialize a queue to keep the last N audio levels (rolling window)
+audio_levels = queue.Queue(maxsize=10)  # Adjust size as needed
+def calculate_dynamic_threshold():
+    """Calculate a dynamic threshold based on recent audio levels."""
+    if audio_levels.qsize() == 0:
+        return 0.01  # Default threshold if no data is available
+    else:
+        # Calculate the average of the last N audio levels
+        return np.mean(list(audio_levels.queue)) * 2  # Adjust multiplier as needed
+silence_start_time = None
+auto_stop_recording = True
+def start_recording(take_system_audio, buttonhandler):
+    """Start recording audio from microphone and/or system sound."""
+    with my_tracer.start_span("start_recording") as span:
+        span.set_attribute("user_id", user_id)
+        span.set_attribute("os_name", os_name_)
+        global the_input_box_pre
+        from ..gpt_computer_agent import the_input_box, the_main_window
+        the_input_box_pre = the_input_box.toPlainText()
+        the_main_window.update_from_thread("Click again when recording is done")
+        global recording, audio_data, silence_start_time, auto_stop_recording
+        recording = True
+        audio_data = np.array([], dtype="float32")
+        print("Recording started...")
+        threshold = 0.01  # Define the threshold for stopping the recording
+        silence_duration = (
+            2  # Duration in seconds to consider as silence before stopping
+        )
+        silence_start_time = None
+        recording_start_time = time.time()  # Record the start time of the recording
+        auto_stop_recording = is_auto_stop_recording_setting_active()
+        def callback(indata, frames, time_info, status):
+            global audio_data, recording, silence_start_time, auto_stop_recording
+            current_level = np.max(np.abs(indata))
+            # Add the current level to the queue
+            if audio_levels.full():
+                audio_levels.get()  # Remove the oldest level if the queue is full
+            audio_levels.put(current_level)
+            # Calculate dynamic threshold based on recent audio levels
+            dynamic_threshold = calculate_dynamic_threshold()
+            if recording:
+                audio_data = np.append(audio_data, indata)
+                # Check if the audio is below the dynamic threshold
+                if current_level < dynamic_threshold and auto_stop_recording:
+                    if silence_start_time is None:
+                        silence_start_time = time.time()  # Mark the start of silence
+                    # Ensure recording has been ongoing for at least 3 seconds before considering auto-stop
+                    elif (time.time() - silence_start_time) > silence_duration and (
+                        time.time() - recording_start_time
+                    ) > 3:
+                        recording = False
+                        buttonhandler.recording = False
+                else:
+                    silence_start_time = None
+    def record_audio():
+        with my_tracer.start_span("record_audio") as span:
+            span.set_attribute("user_id", user_id)
+            span.set_attribute("os_name", os_name_)
+            global recording
+            mics = sc.all_microphones(include_loopback=True)
+            default_mic = mics[0]
+            data = []
+            with default_mic.recorder(samplerate=148000) as mic:
+                print("Recording...")
+                while recording:
+                    frame = mic.record(numframes=4096)
+                    data.append(frame)
+            data = np.concatenate(data, axis=0)
+            data_int16 = (data * 32767).astype("int16")
+            wavfile.write(system_sound_location, 148000, data_int16)
+    if take_system_audio:
+        recording_thread = threading.Thread(target=record_audio)
+        recording_thread.start()
+    with sd.InputStream(callback=callback, channels=channels, samplerate=samplerate):
+        while recording:
+            sd.sleep(100)
+    if not recording:
+        sf.write(mic_record_location, audio_data, samplerate)
+        print("Audio saved as voice_input.wav")
+        signal_handler.recording_stopped.emit()
+def stop_recording():
+    """Stop recording audio."""
+    global recording
+    recording = False
+    print("Recording stopped")
+def quick_speech_to_text(time_total: int = 5) -> str:
+    global samplerate, channels, samplerate
+    quic_location = "temp.wav"
+    myrecording = sd.rec(
+        int(time_total * samplerate), samplerate=samplerate, channels=channels
+    )
+    sd.wait()  # Wait until recording is finished
+    write(quic_location, samplerate, myrecording)  # Save as WAV file
+    try:
+        from .stt import speech_to_text
+    except ImportError:
+        from stt import speech_to_text
+    return speech_to_text(quic_location)

gpt_computer_agent/audio/stt.py ADDED Viewed

	@@ -0,0 +1,77 @@

+try:
+    from ..llm import get_client
+    from ..utils.db import *
+    from .stt_providers.openai import stt_openai
+    from .stt_providers.openai_whisper_local import stt_openai_whisper_local
+except ImportError:
+    from utils.db import *
+    from audio.stt_providers.openai import stt_openai
+    from audio.stt_providers.openai_whisper_local import stt_openai_whisper_local
+import os
+from pydub import AudioSegment
+def is_local_stt_available():
+    try:
+        return True
+    except:
+        return False
+def split_audio(file_path, max_size=20 * 1024 * 1024):
+    """Split an audio file into smaller parts if it exceeds a maximum size.
+    Args:
+        file_path (str): The path to the audio file to be split.
+        max_size (int): The maximum size in bytes for each split part. Defaults to 20 MB.
+    Returns:
+        list: A list of tuples containing the split audio segments and their respective file paths.
+    """
+    audio = AudioSegment.from_wav(file_path)
+    file_size = os.path.getsize(file_path)
+    if file_size <= max_size:
+        return [(audio, file_path)]
+    # Calculate the number of parts needed
+    num_parts = file_size // max_size + 1
+    part_length = len(audio) // num_parts
+    parts = []
+    for i in range(num_parts):
+        start = i * part_length
+        end = (i + 1) * part_length if (i + 1) < num_parts else len(audio)
+        part = audio[start:end]
+        part_path = f"{file_path[:-4]}_part_{i+1}.wav"
+        part.export(part_path, format="wav")
+        parts.append((part, part_path))
+    return parts
+def speech_to_text(location):
+    """Convert speech audio file to text using an external service.
+    Args:
+        location (str): The path to the speech audio file.
+    Returns:
+        str: The transcribed text from the speech audio file.
+    """
+    audio_parts = split_audio(location)
+    transcriptions = []
+    for part, part_path in audio_parts:
+        with open(part_path, "rb") as audio_file:
+            if load_stt_model_settings() == "openai":
+                transcription = stt_openai(audio_file)
+            else:
+                transcription = stt_openai_whisper_local(part_path)
+            transcriptions.append(transcription)
+        os.remove(part_path)  # Clean up the temporary file immediately after processing
+    # Merge transcriptions (assuming it's a list of text segments)
+    full_transcription = " ".join(transcription for transcription in transcriptions)
+    return full_transcription

gpt_computer_agent/audio/stt_providers/openai.py ADDED Viewed

	@@ -0,0 +1,11 @@

+try:
+    from ...llm import *
+except ImportError:
+    from llm import *
+def stt_openai(audio_file):
+    transcription = get_client().audio.transcriptions.create(
+        model="whisper-1", file=audio_file
+    )
+    return transcription.text

gpt_computer_agent/audio/stt_providers/openai_whisper_local.py ADDED Viewed

	@@ -0,0 +1,19 @@

+model_ = None
+def model():
+    global model_
+    if model_ is None:
+        import whisper
+        model_ = whisper.load_model("tiny")
+    return model_
+def preload_stt_openai_whisper_local():
+    model()
+def stt_openai_whisper_local(audio_file):
+    result = model().transcribe(audio_file)
+    return result["text"]

gpt_computer_agent/audio/tts.py ADDED Viewed

	@@ -0,0 +1,106 @@

+try:
+    from ..llm import *
+    from ..utils.db import *
+    from .tts_providers.openai import tts_openai
+    from .tts_providers.microsoft_local import tts_microsoft_local
+except ImportError:
+    from llm import *
+    from utils.db import *
+    from audio.tts_providers.openai import tts_openai
+    from audio.tts_providers.microsoft_local import tts_microsoft_local
+import os
+import hashlib
+import random
+import threading
+def is_local_tts_available():
+    try:
+        return True
+    except:
+        return False
+def is_openai_tts_available():
+    the_model = load_model_settings()
+    if llm_settings[the_model]["provider"] == "openai":
+        if load_api_key() != "CHANGE_ME":
+            return True
+    return False
+supported_openai_speakers = ["fable"]
+def random_model(exclude):
+    models = supported_openai_speakers.copy()
+    models.remove(exclude)
+    return random.choice(models)
+def generate_speech_chunk(text_chunk, index, voice, results):
+    sha = hashlib.sha256(text_chunk.encode()).hexdigest()
+    location = os.path.join(artifacts_dir, f"{sha}.mp3")
+    if os.path.exists(location):
+        results[index] = location
+    else:
+        the_model = load_model_settings()
+        tts_setting = load_tts_model_settings()
+        if tts_setting == "openai":
+            tts_openai(voice, text_chunk, location)
+        if tts_setting == "microsoft_local":
+            if not is_local_tts_available():
+                print("Please install gpt-computer-agent[local_tts] to use local TTS")
+            else:
+                tts_microsoft_local(text_chunk, location)
+        results[index] = location
+def split_text_to_sentences(text, max_chunk_size=300):
+    """Splits text into sentences and ensures chunks do not exceed max_chunk_size."""
+    sentences = text.split(".")
+    chunks = []
+    current_chunk = ""
+    for sentence in sentences:
+        sentence = sentence.strip()
+        if len(current_chunk) + len(sentence) + 1 <= max_chunk_size:
+            current_chunk += sentence + ". "
+        else:
+            chunks.append(current_chunk.strip())
+            current_chunk = sentence + ". "
+    if current_chunk:
+        chunks.append(current_chunk.strip())
+    return chunks
+def text_to_speech(text):
+    text_chunks = split_text_to_sentences(text)
+    threads = []
+    results = [None] * len(text_chunks)
+    initial_voice = random.choice(supported_openai_speakers)
+    for i, chunk in enumerate(text_chunks):
+        voice = (
+            initial_voice if i % 2 == 0 else random_model(initial_voice)
+        )  # Alternate voices
+        thread = threading.Thread(
+            target=generate_speech_chunk, args=(chunk, i, voice, results)
+        )
+        threads.append(thread)
+        thread.start()
+    for thread in threads:
+        thread.join()
+    mp3_files = [result for result in results if result is not None]
+    return mp3_files

gpt_computer_agent/audio/tts_providers/microsoft_local.py ADDED Viewed

	@@ -0,0 +1,55 @@

+import soundfile as sf
+synthesiser_ = None
+def synthesiser():
+    from transformers import pipeline
+    global synthesiser_
+    if synthesiser_ is None:
+        synthesiser_ = pipeline("text-to-speech", "microsoft/speecht5_tts")
+    return synthesiser_
+embeddings_dataset_ = None
+def embeddings_dataset():
+    from datasets import load_dataset
+    global embeddings_dataset_
+    if embeddings_dataset_ is None:
+        embeddings_dataset_ = load_dataset(
+            "Matthijs/cmu-arctic-xvectors", split="validation"
+        )
+    return embeddings_dataset_
+speaker_embedding_ = None
+def speaker_embedding():
+    import torch
+    global speaker_embedding_
+    if speaker_embedding_ is None:
+        speaker_embedding_ = torch.tensor(
+            embeddings_dataset()[7306]["xvector"]
+        ).unsqueeze(0)
+    return speaker_embedding_
+def preload_tts_microsoft_local():
+    synthesiser()
+    embeddings_dataset()
+    speaker_embedding()
+def tts_microsoft_local(text_chunk, location):
+    speech = synthesiser()(
+        text_chunk, forward_params={"speaker_embeddings": speaker_embedding()}
+    )
+    sf.write(location, speech["audio"], samplerate=speech["sampling_rate"])
+    return location

gpt_computer_agent/audio/tts_providers/openai.py ADDED Viewed

	@@ -0,0 +1,13 @@

+try:
+    from ...llm import *
+except ImportError:
+    from llm import *
+def tts_openai(voice, text_chunk, location):
+    response = get_client().audio.speech.create(
+        model="tts-1",
+        voice=voice,
+        input=text_chunk,
+    )
+    response.stream_to_file(location)

gpt_computer_agent/audio/wake_word.py ADDED Viewed

	@@ -0,0 +1,40 @@

+import struct
+try:
+    from ..utils.db import load_pvporcupine_api_key
+except ImportError:
+    from utils.db import load_pvporcupine_api_key
+def wake_word(the_main_window):
+    import pvporcupine
+    import pyaudio
+    porcupine = pvporcupine.create(
+        access_key=load_pvporcupine_api_key(), keywords=pvporcupine.KEYWORDS
+    )
+    # Initialize PyAudio
+    pa = pyaudio.PyAudio()
+    # Open an audio stream
+    audio_stream = pa.open(
+        rate=porcupine.sample_rate,
+        channels=1,
+        format=pyaudio.paInt16,
+        input=True,
+        frames_per_buffer=porcupine.frame_length,
+    )
+    print("Listening for wake word...")
+    # Continuously listen for the wake word
+    while the_main_window.wake_word_active:
+        pcm = audio_stream.read(porcupine.frame_length)
+        pcm = struct.unpack_from("h" * porcupine.frame_length, pcm)
+        # Process the audio frame and check for the wake word
+        keyword_index = porcupine.process(pcm)
+        if keyword_index >= 0:
+            print("Wake word detected!")
+            return True

gpt_computer_agent/character.py ADDED Viewed

	@@ -0,0 +1,47 @@

+name_ = "GPT Computer Assistant"
+def name():
+    global name_
+    return name_
+def change_name(new_name):
+    global name_
+    name_ = new_name
+    from .gpt_computer_agent import the_main_window
+    def adjust_string_length(input_string):
+        if len(input_string) < 20:
+            return input_string.ljust(20)
+        else:
+            return input_string[:20]
+    the_main_window.title_label.setText(adjust_string_length(name_))
+developer_ = "Open Source Community"
+def developer():
+    global developer_
+    return developer_
+def change_developer(new_developer):
+    global developer_
+    developer_ = new_developer
+the_website_content = None
+def get_website_content():
+    global the_website_content
+    return the_website_content
+def set_website_content(content):
+    global the_website_content
+    the_website_content = content

gpt_computer_agent/custom_callback.py ADDED Viewed

	@@ -0,0 +1,21 @@

+"""Callback Handler streams to stdout on new llm token."""
+from langchain.callbacks.streaming_stdout_final_only import (
+    FinalStreamingStdOutCallbackHandler,
+)
+from typing import Any
+class customcallback(FinalStreamingStdOutCallbackHandler):
+    def on_llm_new_token(self, token: str, **kwargs: Any) -> None:
+        self.append_to_last_tokens(token)
+        if self.check_if_answer_reached():
+            self.answer_reached = True
+            return
+        if self.answer_reached:
+            from .gpt_computer_agent import the_main_window
+            the_main_window.set_text_to_input_box(token)

gpt_computer_agent/display_tools.py ADDED Viewed

	@@ -0,0 +1,242 @@

+from langchain.tools import tool
+import traceback
+try:
+    from .utils.db import load_api_key
+    from .llm import get_model
+    from .top_bar_wrapper import wrapper
+except ImportError:
+    from utils.db import load_api_key
+    from top_bar_wrapper import wrapper
+@wrapper
+def click_on_a_text_on_the_screen_(text: str, click_type: str = "singular") -> bool:
+    """
+    A function to click on a text on the screen.
+    Parameters:
+    - text (str): The text to be clicked on.
+    - click_type (str): The type of click to be performed. The default value is "singular". Possible values are "singular" and "double".
+    Returns:
+    - bool: True if the text was clicked on successfully, False otherwise.
+    """
+    try:
+        import pyautogui
+        pyautogui.FAILSAFE = False
+        from interpreter import OpenInterpreter
+        interpreter = OpenInterpreter()
+        interpreter.llm.api_key = load_api_key()
+        screenshot = pyautogui.screenshot()
+        text_locations = interpreter.computer.display.find_text(
+            text, screenshot=screenshot
+        )
+        print(text_locations)
+        x, y = text_locations[0]["coordinates"]
+        x *= interpreter.computer.display.width
+        y *= interpreter.computer.display.height
+        x = int(x)
+        y = int(y)
+        if click_type == "singular":
+            interpreter.computer.mouse.click(x=x, y=y, screenshot=screenshot)
+        elif click_type == "double":
+            interpreter.computer.mouse.double_click(x=x, y=y, screenshot=screenshot)
+        return True
+    except:
+        traceback.print_exc()
+        return False
+click_on_a_text_on_the_screen = tool(click_on_a_text_on_the_screen_)
+@wrapper
+def move_on_a_text_on_the_screen_(text: str) -> bool:
+    """
+    A function to move on a text on the screen.
+    Parameters:
+    - text (str): The text to be moved on.
+    Returns:
+    - bool: True if the text was moved on successfully, False otherwise.
+    """
+    try:
+        import pyautogui
+        pyautogui.FAILSAFE = False
+        from interpreter import OpenInterpreter
+        interpreter = OpenInterpreter()
+        interpreter.llm.api_key = load_api_key()
+        screenshot = pyautogui.screenshot()
+        text_locations = interpreter.computer.display.find_text(
+            text, screenshot=screenshot
+        )
+        print(text_locations)
+        x, y = text_locations[0]["coordinates"]
+        x *= interpreter.computer.display.width
+        y *= interpreter.computer.display.height
+        x = int(x)
+        y = int(y)
+        interpreter.computer.mouse.move(x=x, y=y, screenshot=screenshot)
+        return True
+    except:
+        traceback.print_exc()
+        return False
+move_on_a_text_on_the_screen = tool(move_on_a_text_on_the_screen_)
+@wrapper
+def click_on_a_icon_on_the_screen_(
+    icon_name: str, click_type: str = "singular"
+) -> bool:
+    """
+    A function to click on a icon name on the screen.
+    Parameters:
+    - icon_name (str): The icon name to be clicked on.
+    - click_type (str): The type of click to be performed. The default value is "singular". Possible values are "singular" and "double".
+    Returns:
+    - bool: True if the icon name was clicked on successfully, False otherwise.
+    """
+    try:
+        import pyautogui
+        pyautogui.FAILSAFE = False
+        from interpreter import OpenInterpreter
+        screenshot = pyautogui.screenshot()
+        interpreter = OpenInterpreter()
+        interpreter.llm.api_key = load_api_key()
+        if click_type == "singular":
+            interpreter.computer.mouse.click(icon=icon_name, screenshot=screenshot)
+        elif click_type == "double":
+            interpreter.computer.mouse.double_click(
+                icon=icon_name, screenshot=screenshot
+            )
+        return True
+    except:
+        traceback.print_exc()
+        return False
+click_on_a_icon_on_the_screen = tool(click_on_a_icon_on_the_screen_)
+@wrapper
+def move_on_a_icon_on_the_screen_(
+    icon_name: str,
+) -> bool:
+    """
+    A function to move on a icon name on the screen.
+    Parameters:
+    - icon_name (str): The icon name to be move on.
+    Returns:
+    - bool: True if the icon name was moved on successfully, False otherwise.
+    """
+    try:
+        import pyautogui
+        pyautogui.FAILSAFE = False
+        from interpreter import OpenInterpreter
+        screenshot = pyautogui.screenshot()
+        interpreter = OpenInterpreter()
+        interpreter.llm.api_key = load_api_key()
+        interpreter.computer.mouse.move(icon=icon_name, screenshot=screenshot)
+        return True
+    except:
+        traceback.print_exc()
+        return False
+move_on_a_icon_on_the_screen = tool(move_on_a_icon_on_the_screen_)
+def mouse_scroll_(direction: str, amount: int = 1) -> bool:
+    """
+    A function to scroll the mouse wheel.
+    Parameters:
+    - direction (str): The direction of the scroll. Possible values are "up" and "down".
+    - amount (int): The amount of scrolling to be performed. The default value is 1.
+    Returns:
+    - bool: True if the scrolling was performed successfully, False otherwise.
+    """
+    try:
+        import pyautogui
+        pyautogui.FAILSAFE = False
+        if direction == "up":
+            pyautogui.scroll(amount)
+        elif direction == "down":
+            pyautogui.scroll(-amount)
+        return True
+    except:
+        traceback.print_exc()
+        return False
+mouse_scroll = tool(mouse_scroll_)
+@wrapper
+def get_texts_on_the_screen_() -> str:
+    """
+    It returns the texts on the screen.
+    """
+    try:
+        pass
+    except:
+        pass
+    import pyautogui
+    the_screenshot_path = "temp_screenshot.png"
+    the_screenshot = pyautogui.screenshot()
+    the_screenshot.save(the_screenshot_path)
+    from interpreter.core.computer.utils.computer_vision import pytesseract_get_text
+    return pytesseract_get_text(the_screenshot_path)
+get_texts_on_the_screen = tool(get_texts_on_the_screen_)

gpt_computer_agent/gpt_computer_assistant.py ADDED Viewed

	@@ -0,0 +1,1599 @@

+try:
+    from .agent.chat_history import *
+    from .agent.assistant import *
+    from .llm import *
+    from .llm_settings import llm_settings
+    from .agent.agent import *
+    from .agent.background import *
+    from .gui.signal import *
+    from .gui.button import *
+    from .gui.settings import settings_popup
+    from .gui.llmsettings import llmsettings_popup
+    from .utils.db import *
+    from .utils.telemetry import my_tracer, os_name
+    from .audio.wake_word import wake_word
+    from .audio.tts import text_to_speech
+    from .character import name, developer
+except ImportError:
+    # This is for running the script directly
+    # in order to test the GUI without rebuilding the package
+    from agent.chat_history import *
+    from agent.assistant import *
+    from llm import *
+    from llm_settings import llm_settings
+    from agent.agent import *
+    from agent.background import *
+    from utils.db import *
+    from gui.signal import *
+    from gui.button import *
+    from gui.settings import settings_popup
+    from gui.llmsettings import llmsettings_popup
+    from utils.telemetry import my_tracer, os_name
+    from audio.wake_word import wake_word
+    from audio.tts import text_to_speech
+import platform
+import threading
+import time
+import random
+import math
+from PyQt5.QtWidgets import QMainWindow, QVBoxLayout, QWidget
+from PyQt5.QtGui import QMouseEvent, QPainter, QPen, QBrush, QIcon, QColor
+from PyQt5.QtCore import Qt, QTimer, QRect, pyqtSignal
+from PyQt5.QtGui import QKeySequence
+from PyQt5.QtWidgets import QShortcut
+from PyQt5.QtWidgets import QSpacerItem, QSizePolicy
+from PyQt5.QtWidgets import QDesktopWidget
+from PyQt5.QtWidgets import (
+    QPushButton,
+    QLabel,
+    QHBoxLayout,
+)
+from PyQt5.QtCore import QPoint
+from PyQt5.QtWidgets import QTextEdit
+from PyQt5 import QtGui
+from PyQt5.QtCore import QThread
+import pygame
+print("Imported all libraries")
+from PyQt5 import QtCore
+try:
+    import ctypes
+    myappid = "khulnasoft.gpt_computer_agent.gui.1"
+    ctypes.windll.shell32.SetCurrentProcessExplicitAppUserModelID(myappid)
+except:
+    pass
+the_input_box = None
+the_input_text = None
+the_input_box_pre = None
+the_main_window = None
+user_id = load_user_id()
+os_name_ = os_name()
+from PyQt5.QtCore import QRegExp
+from PyQt5.QtGui import QSyntaxHighlighter, QTextCharFormat, QFont
+class PythonSyntaxHighlighter(QSyntaxHighlighter):
+    def __init__(self, parent):
+        super().__init__(parent)
+        self.highlighting_rules = []
+        # Define different text formats with appropriate colors
+        keyword_format = QTextCharFormat()
+        keyword_format.setForeground(QColor(127, 0, 85))  # Dark purple for keywords
+        built_in_formats = QTextCharFormat()
+        built_in_formats.setForeground(
+            QColor(42, 0, 255)
+        )  # Dark blue for built-ins and constants
+        string_format = QTextCharFormat()
+        string_format.setForeground(QColor(0, 128, 0))  # Green for strings
+        function_format = QTextCharFormat()
+        function_format.setForeground(QColor(0, 0, 255))  # Blue for function names
+        comment_format = QTextCharFormat()
+        comment_format.setForeground(QColor(128, 128, 128))  # Gray for comments
+        comment_format.setFontItalic(True)
+        number_format = QTextCharFormat()
+        number_format.setForeground(QColor(255, 0, 0))  # Red for numbers
+        decorator_format = QTextCharFormat()
+        decorator_format.setForeground(QColor(0, 0, 128))  # Navy blue for decorators
+        # Markdown formatting
+        header_format = QTextCharFormat()
+        header_format.setForeground(QColor(0, 128, 128))  # Teal for headers
+        header_format.setFontWeight(QFont.Bold)
+        bold_format = QTextCharFormat()
+        bold_format.setFontWeight(QFont.Bold)
+        italic_format = QTextCharFormat()
+        italic_format.setFontItalic(True)
+        code_format = QTextCharFormat()
+        code_format.setForeground(QColor(255, 140, 0))  # Dark orange for inline code
+        code_format.setFontFamily("Courier New")
+        code_format.setBackground(
+            QColor(245, 245, 245)
+        )  # Light gray background for inline code
+        block_code_format = QTextCharFormat()
+        block_code_format.setForeground(
+            QColor(255, 140, 0)
+        )  # Dark orange for code blocks
+        block_code_format.setFontFamily("Courier New")
+        block_code_format.setBackground(
+            QColor(245, 245, 245)
+        )  # Light gray background for code blocks
+        # Define the regular expressions
+        keywords = [
+            "def",
+            "class",
+            "if",
+            "else",
+            "elif",
+            "return",
+            "import",
+            "from",
+            "as",
+            "for",
+            "while",
+            "try",
+            "except",
+            "finally",
+            "with",
+            "async",
+            "await",
+            "yield",
+            "lambda",
+            "global",
+            "nonlocal",
+            "assert",
+            "del",
+            "pass",
+            "break",
+            "continue",
+            "and",
+            "or",
+            "not",
+            "is",
+            "in",
+        ]
+        self.highlighting_rules += [
+            (QRegExp(r"\b" + word + r"\b"), keyword_format) for word in keywords
+        ]
+        built_ins = [
+            "True",
+            "False",
+            "None",
+            "__init__",
+            "self",
+            "print",
+            "len",
+            "range",
+            "str",
+            "int",
+            "float",
+            "list",
+            "dict",
+            "set",
+            "tuple",
+        ]
+        self.highlighting_rules += [
+            (QRegExp(r"\b" + word + r"\b"), built_in_formats) for word in built_ins
+        ]
+        self.highlighting_rules.append(
+            (QRegExp(r'"[^"\\]*(\\.[^"\\]*)*"'), string_format)
+        )
+        self.highlighting_rules.append(
+            (QRegExp(r"'[^'\\]*(\\.[^'\\]*)*'"), string_format)
+        )
+        self.highlighting_rules.append((QRegExp(r"\bdef\b\s*(\w+)"), function_format))
+        self.highlighting_rules.append((QRegExp(r"\bclass\b\s*(\w+)"), function_format))
+        self.highlighting_rules.append((QRegExp(r"#.*"), comment_format))
+        self.highlighting_rules.append((QRegExp(r"\b[0-9]+[lL]?\b"), number_format))
+        self.highlighting_rules.append(
+            (QRegExp(r"\b0[xX][0-9A-Fa-f]+[lL]?\b"), number_format)
+        )
+        self.highlighting_rules.append(
+            (QRegExp(r"\b0[oO]?[0-7]+[lL]?\b"), number_format)
+        )
+        self.highlighting_rules.append((QRegExp(r"\b0[bB][01]+[lL]?\b"), number_format))
+        self.highlighting_rules.append((QRegExp(r"@[^\s]+"), decorator_format))
+        # Markdown rules
+        self.highlighting_rules.append(
+            (QRegExp(r"^#{1,6} .+"), header_format)
+        )  # Headers
+        self.highlighting_rules.append(
+            (QRegExp(r"\*\*[^*]+\*\*"), bold_format)
+        )  # **bold**
+        self.highlighting_rules.append((QRegExp(r"__[^_]+__"), bold_format))  # __bold__
+        self.highlighting_rules.append(
+            (QRegExp(r"\*[^*]+\*"), italic_format)
+        )  # *italic*
+        self.highlighting_rules.append((QRegExp(r"_[^_]+_"), italic_format))  # _italic_
+        self.highlighting_rules.append(
+            (QRegExp(r"`[^`]+`"), code_format)
+        )  # Inline code
+    def highlightBlock(self, text):
+        # Handle code blocks separately
+        if text.strip().startswith("```"):
+            self.setFormat(0, len(text), self.highlighting_rules[-1][1])
+            return
+        for pattern, format in self.highlighting_rules:
+            expression = QRegExp(pattern)
+            index = expression.indexIn(text)
+            while index >= 0:
+                length = expression.matchedLength()
+                self.setFormat(index, length, format)
+                index = expression.indexIn(text, index + length)
+readed_sentences = []
+import re
+def split_with_multiple_delimiters(text, delimiters):
+    """
+    Splits the text by any of the given delimiters while keeping the delimiters in the resulting parts.
+    :param text: The input text to be split.
+    :param delimiters: A string of delimiters to split the text on.
+    :return: A list of parts including the delimiters.
+    """
+    # Create a regular expression pattern that matches any of the delimiters
+    pattern = re.compile(f"(.*?[{re.escape(delimiters)}])")
+    parts = pattern.findall(text)
+    # Check if the last part is not complete and remove it if necessary
+    if (
+        parts
+        and text
+        and not any(text.endswith(d) for d in delimiters)
+        and parts
+        and not any(parts[-1].endswith(d) for d in delimiters)
+    ):
+        parts.pop()
+    return parts
+def click_sound():
+    pygame.mixer.init()
+    retro = pygame.mixer.Sound(click_sound_path)
+    retro.set_volume(0.1)
+    retro.play()
+class Worker(QThread):
+    text_to_set = pyqtSignal(str)
+    def __init__(self):
+        super().__init__()
+        self.the_input_text = None
+        self.make_animation = True
+        self.commited_text = []
+    def run(self):
+        while True:
+            self.msleep(500)  # Simulate a time-consuming task
+            if self.the_input_text:
+                last_text = (
+                    self.commited_text[-1] if len(self.commited_text) > 0 else ""
+                )
+                if self.the_input_text != last_text:
+                    self.commited_text.append(self.the_input_text)
+                    if len(self.the_input_text) > 90 or not self.make_animation:
+                        self.text_to_set.emit(self.the_input_text)
+                    else:
+                        for i in range(len(self.the_input_text)):
+                            self.text_to_set.emit(self.the_input_text[: i + 1])
+                            self.msleep(10)
+return_key_event = None
+class CustomTextEdit(QTextEdit):
+    def __init__(self, parent=None):
+        super(CustomTextEdit, self).__init__(parent)
+    def keyPressEvent(self, event):
+        if event.key() == Qt.Key_Return or event.key() == Qt.Key_Enter:
+            global return_key_event
+            return_key_event()
+        super(CustomTextEdit, self).keyPressEvent(
+            event
+        )  # Process other key events normally
+class Worker_2(QThread):
+    text_to_set = pyqtSignal(str)
+    text_to_set_title_bar = pyqtSignal(str)
+    def __init__(self):
+        super().__init__()
+        self.the_input_text = None
+        self.title_bar_text = None
+        self.prev = None
+        self.commited_text = []
+    def run(self):
+        while True:
+            self.msleep(500)  # Simulate a time-consuming task
+            if self.the_input_text and (
+                self.prev is None or self.prev != self.the_input_text
+            ):
+                self.prev = self.the_input_text
+                self.text_to_set.emit("True")
+                for i in range(len(self.title_bar_text)):
+                    self.text_to_set_title_bar.emit(self.title_bar_text[: i + 1])
+                    self.msleep(10)
+            if not self.the_input_text and self.prev != self.the_input_text:
+                self.prev = self.the_input_text
+                self.text_to_set.emit("False")
+                the_text = "  " + name()
+                for i in range(len(the_text)):
+                    self.text_to_set_title_bar.emit(the_text[: i + 1])
+                    self.msleep(10)
+class Worker_3(QThread):
+    text_to_set = pyqtSignal(str)
+    def __init__(self):
+        super().__init__()
+        self.the_input_text = None
+    def run(self):
+        while True:
+            self.msleep(500)  # Simulate a time-consuming task
+            if self.the_input_text:
+                self.text_to_set.emit("True")
+                self.the_input_text = None
+class Worker_collapse(QThread):
+    text_to_set = pyqtSignal(str)
+    def __init__(self):
+        super().__init__()
+        self.the_input_text = None
+    def run(self):
+        while True:
+            self.msleep(500)  # Simulate a time-consuming task
+            if self.the_input_text:
+                self.text_to_set.emit("True")
+                self.the_input_text = None
+class Worker_uncollapse(QThread):
+    text_to_set = pyqtSignal(str)
+    def __init__(self):
+        super().__init__()
+        self.the_input_text = None
+    def run(self):
+        while True:
+            self.msleep(500)  # Simulate a time-consuming task
+            if self.the_input_text:
+                self.text_to_set.emit("True")
+                self.the_input_text = None
+class Worker_show_logo(QThread):
+    text_to_set = pyqtSignal(str)
+    def __init__(self):
+        super().__init__()
+        self.the_input_text = None
+    def run(self):
+        while True:
+            self.msleep(500)  # Simulate a time-consuming task
+            if self.the_input_text:
+                self.text_to_set.emit("True")
+                self.the_input_text = None
+class Worker_hide_logo(QThread):
+    text_to_set = pyqtSignal(str)
+    def __init__(self):
+        super().__init__()
+        self.the_input_text = None
+    def run(self):
+        while True:
+            self.msleep(500)  # Simulate a time-consuming task
+            if self.the_input_text:
+                self.text_to_set.emit("True")
+                self.the_input_text = None
+class Worker_activate_long_gca(QThread):
+    text_to_set = pyqtSignal(str)
+    def __init__(self):
+        super().__init__()
+        self.the_input_text = None
+    def run(self):
+        while True:
+            self.msleep(500)  # Simulate a time-consuming task
+            if self.the_input_text:
+                self.text_to_set.emit("True")
+                self.the_input_text = None
+class Worker_deactivate_long_gca(QThread):
+    text_to_set = pyqtSignal(str)
+    def __init__(self):
+        super().__init__()
+        self.the_input_text = None
+    def run(self):
+        while True:
+            self.msleep(500)  # Simulate a time-consuming task
+            if self.the_input_text:
+                self.text_to_set.emit("True")
+                self.the_input_text = None
+class Worker_tray_and_task_bar_logo(QThread):
+    text_to_set = pyqtSignal(str)
+    def __init__(self):
+        super().__init__()
+        self.the_input_text = None
+    def run(self):
+        while True:
+            self.msleep(500)  # Simulate a time-consuming task
+            if self.the_input_text:
+                self.text_to_set.emit("True")
+                self.the_input_text = None
+class DrawingWidget(QWidget):
+    def __init__(self, parent=None):
+        super(DrawingWidget, self).__init__(parent)
+        # Set widget properties if needed, e.g., size
+        self.main_ = parent
+        self.active_button = ""
+    def paintEvent(self, event):
+        if llm_settings[load_model_settings()]["vision"] is True:
+            self.main_.screen_available = True
+        else:
+            self.main_.screen_available = False
+        self.main_.setAutoFillBackground(True)
+        painter = QPainter(self)
+        painter = painter
+        painter.setRenderHint(QPainter.Antialiasing)
+        painter.setPen(QPen(QColor("#000"), 1))
+        painter.setBrush(QBrush(Qt.black, Qt.SolidPattern))
+        center_x = 95
+        center_y = 40
+        if "talking" in self.main_.state:
+            # Draw a pulsating circle with smooth easing animation
+            radius_variation = 5 * (
+                1 + math.sin(self.main_.pulse_frame * math.pi / 100)
+            )
+            radius = 70 + radius_variation
+            painter.drawEllipse(
+                int(center_x - radius / 2),
+                int(center_y - radius / 2),
+                int(radius),
+                int(radius),
+            )
+        elif self.main_.state == "thinking":
+            # more slow pulsating circle with smooth easing animation
+            radius_variation = 5 * (
+                1 + math.sin(self.main_.pulse_frame * math.pi / 100)
+            )
+            radius = 70 + radius_variation
+            painter.drawEllipse(
+                int(center_x - radius / 2),
+                int(center_y - radius / 2),
+                int(radius),
+                int(radius),
+            )
+        else:
+            radius = 70
+            if self.main_.screen_available:
+                painter.drawEllipse(  # Main Button
+                    int(center_x - radius / 2),
+                    int(center_y - radius / 2),
+                    int(radius),
+                    int(radius),
+                )
+        self.main_.circle_rect = QRect(
+            int(center_x - radius / 2),
+            int(center_y - radius / 2),
+            int(radius),
+            int(radius),
+        )
+        if not self.main_.state == "thinking":
+            painter.setPen(QPen(QColor("#01EE8A"), 1))
+            if self.main_.screen_available:
+                painter.drawEllipse(  # Main BUtton Green Border
+                    int(center_x - radius / 2),
+                    int(center_y - radius / 2),
+                    int(radius),
+                    int(radius),
+                )
+        else:
+            painter.setPen(QPen(QColor("#23538F"), 1))
+            painter.drawEllipse(
+                int(center_x - radius / 2),
+                int(center_y - radius / 2),
+                int(radius),
+                int(radius),
+            )
+        painter.setPen(QPen(QColor("#000"), 1))
+        small_center_x = 165
+        small_center_y = 25
+        small_radius = 30
+        painter.drawEllipse(  # Microphone bacground black
+            int(small_center_x - small_radius / 2),
+            int(small_center_y - small_radius / 2),
+            int(small_radius),
+            int(small_radius),
+        )
+        self.main_.small_circle_rect = QRect(
+            int(small_center_x - small_radius / 2),
+            int(small_center_y - small_radius / 2),
+            int(small_radius),
+            int(small_radius),
+        )
+        # Draw the icon inside the circle
+        icon_size = small_radius * 2 // 3  # Adjust the icon size relative to the circle
+        icon_rect = QRect(
+            small_center_x - icon_size // 2,
+            small_center_y - icon_size // 2,
+            icon_size,
+            icon_size,
+        )
+        self.main_.small_circle_recticon = QIcon(microphone_icon_path)
+        self.main_.small_circle_recticon.paint(painter, icon_rect)
+        small_center_x = 30
+        small_center_y = 60
+        small_radius = 30
+        painter.drawEllipse(
+            int(small_center_x - small_radius / 2),
+            int(small_center_y - small_radius / 2),
+            int(small_radius),
+            int(small_radius),
+        )
+        self.main_.small_circle_left = QRect(
+            int(small_center_x - small_radius / 2),
+            int(small_center_y - small_radius / 2),
+            int(small_radius),
+            int(small_radius),
+        )
+        # Draw the icon inside the circle
+        icon_size = small_radius * 2 // 3  # Adjust the icon size relative to the circle
+        icon_rect = QRect(
+            small_center_x - icon_size // 2,
+            small_center_y - icon_size // 2,
+            icon_size,
+            icon_size,
+        )
+        self.main_.small_circle_lefticon = QIcon(audio_icon_path)
+        self.main_.small_circle_lefticon.paint(painter, icon_rect)
+        small_center_x = 30
+        small_center_y = 25
+        small_radius = 30
+        if self.main_.screen_available:
+            painter.drawEllipse(  # ScreenShot BUtton
+                int(small_center_x - small_radius / 2),
+                int(small_center_y - small_radius / 2),
+                int(small_radius),
+                int(small_radius),
+            )
+        self.main_.small_circle_left_top = QRect(
+            int(small_center_x - small_radius / 2),
+            int(small_center_y - small_radius / 2),
+            int(small_radius),
+            int(small_radius),
+        )
+        self.main_.screenshot_button_coordinates_size = [
+            int(small_center_x - small_radius / 2),
+            int(small_center_y - small_radius / 2),
+            int(small_radius),
+            int(small_radius),
+        ]
+        if self.active_button == "screenshot":
+            self.screenshot_button_border_activate(painter)
+            self.active_button = ""
+        if self.main_.screen_available:
+            # Draw the icon inside the circle
+            icon_size = (
+                small_radius * 2 // 3
+            )  # Adjust the icon size relative to the circle
+            icon_rect = QRect(
+                small_center_x - icon_size // 2,
+                small_center_y - icon_size // 2,
+                icon_size,
+                icon_size,
+            )
+            self.main_.small_circle_left_topticon = QIcon(screenshot_icon_path)
+            self.main_.small_circle_left_topticon.paint(painter, icon_rect)
+        small_center_x = 165
+        small_center_y = 60
+        small_radius = 30
+        painter.drawEllipse(
+            int(small_center_x - small_radius / 2),
+            int(small_center_y - small_radius / 2),
+            int(small_radius),
+            int(small_radius),
+        )
+        self.main_.small_circle_collapse = QRect(
+            int(small_center_x - small_radius / 2),
+            int(small_center_y - small_radius / 2),
+            int(small_radius),
+            int(small_radius),
+        )
+        # Draw the icon inside the circle
+        icon_size = small_radius * 2 // 3  # Adjust the icon size relative to the circle
+        icon_rect = QRect(
+            small_center_x - icon_size // 2,
+            small_center_y - icon_size // 2,
+            icon_size,
+            icon_size,
+        )
+        if is_collapse_setting_active():
+            self.main_.small_circle_collapse_icon = QIcon(down_icon_path)
+        if not is_collapse_setting_active() and is_long_gca_setting_active():
+            self.main_.small_circle_collapse_icon = QIcon(up_icon_path)
+        if not is_collapse_setting_active() and not is_long_gca_setting_active():
+            self.main_.small_circle_collapse_icon = QIcon(down_icon_path)
+        self.main_.small_circle_collapse_icon.paint(painter, icon_rect)
+    def screenshot_button_border_activate(self, painter):
+        # Add an white border to the circle
+        painter.setPen(QPen(QColor("#FFF"), 1))
+        # Draw the ellipse with the specified green border
+        self.main_.screenshot_button_border = painter.drawEllipse(
+            self.main_.screenshot_button_coordinates_size[0],
+            self.main_.screenshot_button_coordinates_size[1],
+            self.main_.screenshot_button_coordinates_size[2],
+            self.main_.screenshot_button_coordinates_size[3],
+        )
+        painter.setPen(QPen(QColor("#000"), 1))
+    def mousePressEvent(self, event: QMouseEvent):
+        self.main_.old_position = event.globalPos()
+        with my_tracer.start_span("mouse_press_event") as span:
+            span.set_attribute("user_id", user_id)
+            span.set_attribute("os_name", os_name_)
+            if self.main_.state == "idle" or "talking" in self.main_.state:
+                try:
+                    if self.main_.circle_rect.contains(event.pos()):
+                        if self.main_.state == "aitalking":
+                            self.main_.stop_ai_talking()
+                        else:
+                            self.main_.screenshot_and_microphone_button_action()
+                except:
+                    traceback.print_exc()
+                try:
+                    if self.main_.small_circle_rect.contains(event.pos()):
+                        if self.main_.state == "aitalking":
+                            self.main_.stop_ai_talking()
+                        else:
+                            click_sound()
+                            self.main_.button_handler.toggle_recording(
+                                no_screenshot=True
+                            )
+                except:
+                    traceback.print_exc()
+                try:
+                    if self.main_.small_circle_left.contains(event.pos()):
+                        if self.main_.state == "aitalking":
+                            self.main_.stop_ai_talking()
+                        else:
+                            click_sound()
+                            self.main_.button_handler.toggle_recording(
+                                take_system_audio=True
+                            )
+                except:
+                    traceback.print_exc()
+                try:
+                    if self.main_.small_circle_left_top.contains(event.pos()):
+                        if self.main_.state == "aitalking":
+                            self.main_.stop_ai_talking()
+                        else:
+                            click_sound()
+                            self.active_button = "screenshot"
+                            self.update()
+                            self.main_.button_handler.just_screenshot()
+                except:
+                    traceback.print_exc()
+            try:
+                if self.main_.small_circle_collapse.contains(event.pos()):
+                    if not is_collapse_setting_active():
+                        if is_long_gca_setting_active():
+                            self.main_.deactivate_long_gca()
+                            self.main_.collapse_gca()
+                        else:
+                            self.main_.activate_long_gca()
+                    else:
+                        self.main_.uncollapse_gca()
+                    self.main_.update()
+            except:
+                pass
+from PyQt5.QtCore import QVariantAnimation
+class MainWindow(QMainWindow):
+    api_enabled = False
+    tts_available = True
+    def screenshot_and_microphone_button_action(self):
+        click_sound()
+        if llm_settings[load_model_settings()]["vision"] is True:
+            self.button_handler.toggle_recording(dont_save_image=True)
+        else:
+            self.button_handler.toggle_recording(no_screenshot=True)
+    def stop_ai_talking(self):
+        self.manuel_stop = True
+        self.stop_talking = True
+    def __init__(self):
+        super().__init__()
+        self.background_color = "45, 45, 45"
+        self.opacity = 250
+        self.border_radius = 10
+        print("API Enabled:", MainWindow.api_enabled)
+        if MainWindow.api_enabled:
+            try:
+                from .api import start_api
+                start_api()
+            except:
+                raise Exception(
+                    "API could not be started, please install gpt-computer-agent[api]"
+                )
+        self.stop_talking = False
+        self.setWindowFlags(
+            Qt.FramelessWindowHint | Qt.WindowStaysOnTopHint
+        )  # Remove the default title bar
+        # Load the San Francisco font
+        print("Loading font")
+        print(font_dir)
+        try:
+            font_id = QtGui.QFontDatabase.addApplicationFont(font_dir)
+            font_family = QtGui.QFontDatabase.applicationFontFamilies(font_id)[0]
+            self.setFont(QtGui.QFont(font_family))
+        except:
+            print("Error loading font")
+        self.state = "idle"
+        self.pulse_timer = None
+        self.button_handler = ButtonHandler(self)
+        self.initUI()
+        self.old_position = self.pos()
+        self.collapse = is_collapse_setting_active()
+        if self.collapse:
+            self.collapse_window()
+        global the_main_window
+        the_main_window = self
+        self.general_styling()
+        if is_dark_mode_active():
+            self.dark_mode()
+        else:
+            self.light_mode()
+        self.wake_word_thread = None
+        self.wake_word_active = False
+        if load_pvporcupine_api_key() != "CHANGE_ME" and is_wake_word_active():
+            self.wake_word_active = True
+            self.wake_word_trigger()
+        self.manuel_stop = False
+        self.border_animation = None
+        self.complated_answer = False
+        self.reading_thread = False
+        self.reading_thread_2 = False
+        image_layout = QHBoxLayout()
+        self.the_image = QLabel(self)
+        self.the_image.setPixmap(QtGui.QPixmap(load_logo_file_path()).scaled(25, 25))
+        image_layout.addWidget(self.the_image)
+        self.layout.addLayout(image_layout)
+        self.the_image.setAlignment(Qt.AlignCenter)
+        self.the_image.setFixedHeight(35)
+        # Logo Adding
+        if not is_logo_active_setting_active():
+            self.the_image.hide()
+        self.update_screen()
+    def put_location(self):
+        if load_location_setting() == "right":
+            self.put_window_to_right_side_of_screen()
+    def init_border_animation(self):
+        # Create a QVariantAnimation to handle color change
+        border_animation = QVariantAnimation(
+            self,
+            valueChanged=self.update_border_color,
+            startValue=QColor("#303030"),
+            endValue=QColor("#23538F"),
+            duration=2000,  # Duration for one loop in milliseconds
+        )
+        border_animation.setLoopCount(-1)  # Loop indefinitely
+        return border_animation
+    def start_border_animation(self, status):
+        print("FUNCTION TRİGGERED")
+        if self.border_animation is None:
+            self.border_animation = self.init_border_animation()
+        status = status.lower() == "true"
+        if status:
+            self.border_animation.start()
+        else:
+            self.border_animation.stop()
+            self.title_bar.setStyleSheet(
+                "background-color: #2E2E2E; color: white; border-style: solid; border-radius: 15px; border-width: 0px; color: #fff;"
+            )
+    def update_border_color(self, color):
+        self.title_bar.setStyleSheet(
+            f"background-color: #2E2E2E; color: white; border-style: solid; border-radius: 15px; border-width: 2px; border-color: {color.name()}; color: #fff;"
+        )
+        self.title_bar.setStyleSheet(
+            f"background-color: #2E2E2E; color: white; border-style: solid; border-radius: 15px; border-width: 1px; border-color: {color.name()}; color: #fff;"
+        )
+    # Existing methods...
+    def general_styling(self, a=None):
+        self.setAttribute(Qt.WA_TranslucentBackground)
+        self.setStyleSheet(
+            f"border-radius: {self.border_radius}px; background-color: rgba({self.background_color}, {self.opacity});"
+        )
+        self.central_widget.setStyleSheet(
+            "border-style: solid; border-width: 1px; border-color: rgb(0,0,0,0);"
+        )
+        self.input_box_style = "border-radius: 10px; border-bottom: 1px solid #01EE8A;"
+        self.settingsButton_style = (
+            "border-radius: 5px; height: 25px; border-style: solid;"
+        )
+        self.llmsettingsButton_style = (
+            "border-radius: 5px; height: 25px; border-style: solid;"
+        )
+        self.btn_minimize.setStyleSheet(
+            "background-color: #2E2E2E; color: white; border-style: none;"
+        )
+        self.btn_close.setStyleSheet(
+            "background-color: #2E2E2E; color: white; border-style: none;"
+        )
+    def set_background_color(self, color):
+        self.background_color = color
+        self.worker_3.the_input_text = "True"
+    def set_opacity(self, opacity):
+        self.opacity = opacity
+        self.worker_3.the_input_text = "True"
+    def set_border_radius(self, radius):
+        self.border_radius = radius
+        self.worker_3.the_input_text = "True"
+    def wake_word_trigger(self):
+        self.wake_word_thread = threading.Thread(target=self.wake_word)
+        self.wake_word_thread.start()
+    def wake_word(self):
+        from .agent.process import tts_if_you_can
+        while True and is_wake_word_active() and self.wake_word_active:
+            if wake_word(self):
+                def random_accept_words():
+                    return random.choice(["Yes", "Sir", "Boss", "Master"])
+                tts_if_you_can(random_accept_words(), not_threaded=True)
+                def trigger_wake_word():
+                    if (
+                        is_wake_word_screen_setting_active()
+                        and llm_settings[load_model_settings()]["vision"]
+                    ):
+                        self.button_handler.toggle_recording(dont_save_image=True)
+                    else:
+                        self.button_handler.toggle_recording(no_screenshot=True)
+                if self.state == "aitalking":
+                    self.manuel_stop = True
+                    self.stop_talking = True
+                    time.sleep(1)
+                    trigger_wake_word()
+                    print("Stop talking")
+                else:
+                    trigger_wake_word()
+    def dark_mode(self):
+        self.setAutoFillBackground(True)
+        p = self.palette()
+        p.setColor(
+            self.backgroundRole(), QColor("#171717")
+        )  # Set background color to white
+        self.setPalette(p)
+        self.input_box.setStyleSheet(
+            self.input_box_style + "background-color: #2E2E2E; color: white;"
+        )
+        self.settingsButton.setStyleSheet(
+            self.settingsButton_style + "background-color: #2E2E2E; color: white;"
+        )
+        self.llmsettingsButton.setStyleSheet(
+            self.llmsettingsButton_style + "background-color: #2E2E2E; color: white;"
+        )
+    def light_mode(self):
+        self.setAutoFillBackground(True)
+        p = self.palette()
+        p.setColor(self.backgroundRole(), QColor("#F0F0F0"))
+        self.setPalette(p)
+        self.input_box.setStyleSheet(
+            self.input_box_style + "background-color: #FFFFFF; color: black;"
+        )
+        self.settingsButton.setStyleSheet(
+            self.settingsButton_style + "background-color: #FFFFFF; color: black; "
+        )
+        self.llmsettingsButton.setStyleSheet(
+            self.llmsettingsButton_style + "background-color: #FFFFFF; color: black; "
+        )
+    def collapse_window(self):
+        the_input_box.hide()
+        self.settingsButton.hide()
+        self.llmsettingsButton.hide()
+        self.update_screen()
+    def initUI(self):
+        self.setWindowTitle("GPT")
+        self.setGeometry(100, 100, 200, 200)
+        width = 210
+        height = 300
+        # setting the minimum size
+        self.setMinimumSize(width, height)
+        self.first_height = self.height()
+        self.first_width = self.width()
+        self.central_widget = QWidget(self)
+        self.setCentralWidget(self.central_widget)
+        layout = QVBoxLayout(self.central_widget)
+        # Custom title bar
+        self.title_bar = QWidget(self)
+        self.title_bar.setFixedHeight(30)  # Set a fixed height for the title bar
+        self.title_bar.setStyleSheet(
+            "background-color: #2E2E2E; color: #fff; border-radius: 15px; border-style: solid; border-width: 1px; border-color: #303030;"
+        )
+        self.title_bar_layout = QHBoxLayout(self.title_bar)
+        self.title_bar_layout.setContentsMargins(5, 5, 0, 5)
+        self.title_bar_layout.setSpacing(0)
+        self.btn_minimize = QPushButton("-", self.title_bar)
+        self.btn_minimize.setFixedSize(20, 20)
+        self.btn_minimize.clicked.connect(self.showMinimized)
+        def stop_app():
+            self.stop_talking = True
+            self.wake_word_active = False
+            if MainWindow.api_enabled:
+                from .api import stop_api
+                stop_api()
+            self.close()
+        self.btn_close = QPushButton("×", self.title_bar)
+        self.btn_close.setFixedSize(20, 20)
+        self.btn_close.clicked.connect(stop_app)
+        self.title_label = QLabel("  " + name(), self.title_bar)
+        # Change font size
+        font = QtGui.QFont()
+        font.setPointSize(11)
+        self.title_label.setFont(font)
+        self.title_label.setStyleSheet("border: 0px solid blue;")
+        self.title_bar_layout.addWidget(self.title_label)
+        self.title_bar_layout.addStretch()
+        self.title_bar_layout.addWidget(self.btn_minimize)
+        self.title_bar_layout.addWidget(self.btn_close)
+        # Create a spacer item with expanding policy
+        spacer = QSpacerItem(5, 20, QSizePolicy.Expanding, QSizePolicy.Minimum)
+        self.title_bar_layout.addSpacerItem(spacer)  # Add spacer to the layout
+        layout.addWidget(self.title_bar)
+        self.drawing_widget = DrawingWidget(self)
+        layout.addWidget(self.drawing_widget)
+        self.layout = layout
+        self.setLayout(layout)
+        # Add keyboard shortcuts
+        self.shortcut_screenshot = QShortcut(QKeySequence("Ctrl+1"), self)
+        self.shortcut_screenshot.activated.connect(
+            lambda: self.button_handler.just_screenshot()
+        )
+        self.shortcut_screenshot = QShortcut(QKeySequence("Ctrl+2"), self)
+        self.shortcut_screenshot.activated.connect(
+            lambda: self.button_handler.toggle_recording(take_system_audio=True)
+        )
+        self.shortcut_no_screenshot = QShortcut(QKeySequence("Ctrl+e"), self)
+        self.shortcut_no_screenshot.activated.connect(
+            lambda: self.button_handler.toggle_recording(take_system_audio=True)
+        )
+        self.shortcut_no_screenshot = QShortcut(QKeySequence("Ctrl+3"), self)
+        self.shortcut_no_screenshot.activated.connect(
+            lambda: self.button_handler.toggle_recording(no_screenshot=True)
+        )
+        # I want to create an input box to bottom left and a send button to bottom right
+        input_box = CustomTextEdit(self)
+        self.input_box = input_box
+        input_box.setFixedHeight(80)
+        # Set text wrapping. I dont wat to cut the text
+        input_box.setWordWrapMode(QtGui.QTextOption.NoWrap)
+        # Change the font size
+        font = QtGui.QFont()
+        font.setPointSize(12)
+        input_box.setFont(font)
+        self.highlighter = PythonSyntaxHighlighter(self.input_box.document())
+        if load_api_key() == "CHANGE_ME":
+            input_box.setPlaceholderText("Save your API Key, go to settings")
+        else:
+            if platform.system() == "Darwin":
+                if llm_settings[load_model_settings()]["vision"] is False:
+                    input_box.setPlaceholderText("Type here \nsand ↵ ")
+                else:
+                    input_box.setPlaceholderText(
+                        "Type here \nand ↵ \nor ⌘ + ↵ (+screenshot)"
+                    )
+            else:
+                if llm_settings[load_model_settings()]["vision"] is False:
+                    input_box.setPlaceholderText("Type here \nand ↵ ")
+                else:
+                    input_box.setPlaceholderText(
+                        "Type here \nand ↵ \nor Ctrl + ↵ (+screenshot)"
+                    )
+            # Add an information and use enter icon to the input box for mac
+        input_box.setGeometry(30, self.height() - 60, 200, 80)
+        global the_input_box
+        the_input_box = input_box
+        def input_box_send():
+            if input_box.toPlainText() != "":
+                click_sound()
+                self.button_handler.input_text(input_box.toPlainText())
+        def input_box_send_screenshot():
+            if input_box.toPlainText() != "":
+                click_sound()
+                self.button_handler.input_text_screenshot(input_box.toPlainText())
+        self.layout.addWidget(input_box)
+        self.shortcut_enter = QShortcut(QKeySequence("Ctrl+Return"), self)
+        self.shortcut_enter.activated.connect(input_box_send_screenshot)
+        global return_key_event
+        return_key_event = input_box_send
+        button_layout_ = QHBoxLayout()
+        self.settingsButton = QPushButton("Chat Settings", self)
+        self.settingsButton.clicked.connect(settings_popup)
+        self.llmsettingsButton = QPushButton("LLM Settings", self)
+        self.llmsettingsButton.clicked.connect(llmsettings_popup)
+        button_layout_.addWidget(self.settingsButton)
+        button_layout_.addWidget(self.llmsettingsButton)
+        self.layout.addLayout(button_layout_)
+        self.worker = Worker()
+        self.worker.text_to_set.connect(self.set_text)
+        self.worker.start()
+        self.worker_2 = Worker_2()
+        self.worker_2.text_to_set.connect(self.start_border_animation)
+        self.worker_2.text_to_set_title_bar.connect(self.set_title_bar_text)
+        self.worker_2.start()
+        self.worker_3 = Worker_3()
+        self.worker_3.text_to_set.connect(self.general_styling)
+        self.worker_3.start()
+        self.worker_collapse = Worker_collapse()
+        self.worker_collapse.text_to_set.connect(self.collapse_gca)
+        self.worker_collapse.start()
+        self.worker_uncollapse = Worker_uncollapse()
+        self.worker_uncollapse.text_to_set.connect(self.uncollapse_gca)
+        self.worker_uncollapse.start()
+        self.worker_show_logo = Worker_show_logo()
+        self.worker_show_logo.text_to_set.connect(self.show_logo)
+        self.worker_show_logo.start()
+        self.worker_hide_logo = Worker_hide_logo()
+        self.worker_hide_logo.text_to_set.connect(self.hide_logo)
+        self.worker_hide_logo.start()
+        self.worker_activate_long_gca = Worker_activate_long_gca()
+        self.worker_activate_long_gca.text_to_set.connect(self.activate_long_gca)
+        self.worker_activate_long_gca.start()
+        self.worker_deactivate_long_gca = Worker_deactivate_long_gca()
+        self.worker_deactivate_long_gca.text_to_set.connect(self.deactivate_long_gca)
+        self.worker_deactivate_long_gca.start()
+        self.worker_tray_and_task_bar_logo = Worker_tray_and_task_bar_logo()
+        self.worker_tray_and_task_bar_logo.text_to_set.connect(
+            self.tray_and_task_bar_logo
+        )
+        self.worker_tray_and_task_bar_logo.start()
+        # print height and width
+        print(self.height(), self.width())
+        self.show()
+    def set_text(self, text):
+        global the_input_box
+        vertical_scrollbar = the_input_box.verticalScrollBar()
+        scroll_value = vertical_scrollbar.value()
+        the_input_box.setPlainText(text)
+        vertical_scrollbar.setValue(scroll_value)
+    def set_title_bar_text(self, text):
+        self.title_label.setText(text)
+    def update_from_thread(self, text, system=True):
+        self.worker.make_animation = True
+        if system:
+            text = "System: " + text
+        print("Updating from thread", text)
+        self.worker.the_input_text = text
+    def read_part_task_generate_only(self):
+        if not is_just_text_model_active() and the_main_window.tts_available:
+            threads = {}
+            the_okey_parts = split_with_multiple_delimiters(
+                self.worker.the_input_text, ".?!:"
+            )
+            for each in the_okey_parts:
+                if the_main_window.stop_talking:
+                    break
+                the_thread = threading.Thread(target=text_to_speech, args=(each,))
+                threads[each] = the_thread
+                the_thread.start()
+            for each in threads.values():
+                each.join()
+        self.reading_thread_2 = False
+    def read_part_task(self):
+        if not is_just_text_model_active() and the_main_window.tts_available:
+            threads = {}
+            the_okey_parts = split_with_multiple_delimiters(
+                self.worker.the_input_text, ".?!:"
+            )
+            will_read_parts = []
+            for each in the_okey_parts:
+                if the_main_window.stop_talking:
+                    break
+                if each not in readed_sentences:
+                    will_read_parts.append(each)
+                    readed_sentences.append(each)
+                    the_thread = threading.Thread(target=text_to_speech, args=(each,))
+                    threads[each] = the_thread
+                    the_thread.start()
+            for each in will_read_parts:
+                if the_main_window.stop_talking:
+                    break
+                threads[each].join()
+                tts_if_you_can(each, not_threaded=True, bypass_other_settings=True)
+        self.reading_thread = False
+    def set_text_to_input_box(self, text):
+        global readed_sentences
+        self.worker.make_animation = False
+        if self.worker.the_input_text.startswith("System:") or self.complated_answer:
+            self.worker.the_input_text = ""
+            self.complated_answer = False
+            readed_sentences = []
+        if text not in (">", "<>", ">\n", "<", "<\n"):
+            self.worker.the_input_text += text
+            if self.reading_thread is not True and len(self.worker.the_input_text) > 40:
+                self.reading_thread = True
+                threading.Thread(target=self.read_part_task).start()
+            if (
+                self.reading_thread_2 is not True
+                and len(self.worker.the_input_text) > 250
+            ):
+                self.reading_thread_2 = True
+                threading.Thread(target=self.read_part_task_generate_only).start()
+        else:
+            print("Problem on text chars")
+    def set_text_from_api(self, text):
+        self.worker.make_animation = True
+        self.worker.the_input_text = text
+    def active_border_animation(self, title_bar_text=None):
+        if self.worker_2.title_bar_text is not None:
+            if self.worker_2.title_bar_text != title_bar_text:
+                return
+        self.worker_2.the_input_text = True
+        if title_bar_text is None:
+            title_bar_text = "  " + name()
+        else:
+            title_bar_text = f"  {title_bar_text}"
+            if len(title_bar_text) > 33:
+                title_bar_text = title_bar_text[:30] + "..."
+        self.worker_2.title_bar_text = title_bar_text
+        self.btn_minimize.hide()
+        self.btn_close.hide()
+    def deactive_border_animation(self, title_bar_text=None):
+        if title_bar_text is None:
+            title_bar_text = "  " + name()
+        else:
+            title_bar_text = f"  {title_bar_text}"
+            if len(title_bar_text) > 33:
+                title_bar_text = title_bar_text[:30] + "..."
+        if self.worker_2.title_bar_text is not None:
+            if self.worker_2.title_bar_text != title_bar_text:
+                return
+        self.worker_2.the_input_text = False
+        self.worker_2.title_bar_text = None
+        time.sleep(1)
+        self.btn_minimize.show()
+        self.btn_close.show()
+    def mouseMoveEvent(self, event: QMouseEvent):
+        delta = QPoint(event.globalPos() - self.old_position)
+        if event.buttons() == Qt.LeftButton and self.title_bar.underMouse():
+            self.move(self.x() + delta.x(), self.y() + delta.y())
+            self.old_position = event.globalPos()
+    def mousePressEvent(self, event: QMouseEvent):
+        self.old_position = event.globalPos()
+    def remove_screenshot_button(self):
+        self.update()
+    def add_screenshot_button(self):
+        self.update()
+    def update_state(self, new_state):
+        assistant_stopped = False
+        if self.state == "aitalking" and new_state == "idle":
+            assistant_stopped = True
+        if self.manuel_stop:
+            assistant_stopped = False
+            self.manuel_stop = False
+        self.state = new_state
+        print(f"State updated: {new_state}")
+        if "talking" in new_state:
+            self.tray.setIcon(self.tray_active_icon)
+            self.pulse_frame = 0
+            if self.pulse_timer:
+                self.pulse_timer.stop()
+                self.pulse_timer = None
+            self.pulse_timer = QTimer(self)
+            self.pulse_timer.timeout.connect(self.pulse_circle)
+            self.pulse_timer.start(5)
+        elif new_state == "thinking":
+            the_main_window.update_from_thread("Thinking...")
+            self.pulse_frame = 0
+            if self.pulse_timer:
+                self.pulse_timer.stop()
+                self.pulse_timer = None
+            self.pulse_timer = QTimer(self)
+            self.pulse_timer.timeout.connect(self.pulse_circle)
+            self.pulse_timer.start(20)
+        elif self.pulse_timer:
+            self.tray.setIcon(self.tray_icon)
+            self.pulse_timer.stop()
+            self.pulse_timer = None
+        self.update()  # Trigger a repaint
+        if assistant_stopped:
+            global the_input_box
+            if (
+                the_input_box.toPlainText().endswith("?")
+                and is_continuously_conversations_setting_active()
+            ):
+                self.button_handler.toggle_recording(
+                    no_screenshot=True, new_record=True
+                )
+        if new_state == "idle":
+            click_sound()
+    def pulse_circle(self):
+        self.pulse_frame = (self.pulse_frame + 1) % 100
+        self.update()
+    def collapse_gca(self):
+        self.collapse = True
+        self.collapse_window()
+        activate_collapse_setting()
+        self.update_screen()
+    def collapse_gca_api(self):
+        self.worker_collapse.the_input_text = "True"
+    def uncollapse_gca(self):
+        self.collapse = False
+        print()
+        # hide all buttons and input box
+        the_input_box.show()
+        self.settingsButton.show()
+        self.llmsettingsButton.show()
+        deactivate_collapse_setting()
+        self.update_screen()
+    def uncollapse_gca_api(self):
+        self.worker_uncollapse.the_input_text = "True"
+    def show_logo(self):
+        self.the_image.setPixmap(QtGui.QPixmap(load_logo_file_path()).scaled(25, 25))
+        self.the_image.show()
+        self.update_screen()
+    def tray_and_task_bar_logo(self):
+        app_icon = QtGui.QIcon()
+        app_icon.addFile(load_logo_file_path(), QtCore.QSize(48, 48))
+        self.the_app.setWindowIcon(app_icon)
+        self.tray.setIcon(app_icon)
+        self.tray_icon = app_icon
+        self.tray_active_icon = app_icon
+        print("ICON Set", load_logo_file_path())
+    def tray_and_task_bar_logo_api(self):
+        self.worker_tray_and_task_bar_logo.the_input_text = "True"
+    def show_logo_api(self):
+        self.worker_show_logo.the_input_text = "True"
+    def hide_logo(self):
+        self.the_image.hide()
+        self.update_screen()
+    def hide_logo_api(self):
+        self.worker_hide_logo.the_input_text = "True"
+    def activate_long_gca(self):
+        activate_long_gca_setting()
+        self.update_screen()
+    def activate_long_gca_api(self):
+        self.worker_activate_long_gca.the_input_text = "True"
+    def deactivate_long_gca(self):
+        deactivate_long_gca_setting()
+        self.update_screen()
+    def deactivate_long_gca_api(self):
+        self.worker_deactivate_long_gca.the_input_text = "True"
+    def update_screen(self):
+        width = 210
+        height = 320
+        if is_logo_active_setting_active():
+            height += 35
+        if is_collapse_setting_active():
+            height = 150
+            if is_logo_active_setting_active():
+                height += 35
+        if is_long_gca_setting_active():
+            if not is_collapse_setting_active():
+                height += 500
+                self.input_box.setFixedHeight(580)
+        else:
+            self.input_box.setFixedHeight(80)
+        self.setFixedSize(width, height)
+        self.put_location()
+    def put_window_to_right_side_of_screen(self):
+        screen = QDesktopWidget().screenGeometry()
+        window = self.frameGeometry()
+        # Calculate x position for the right side of the screen and center vertically
+        x = screen.width() - window.width()  # To right side
+        y = (screen.height() - window.height()) // 2  # Center vertically
+        # Add a small offset to the right side
+        x -= 10
+        self.move(x, y)

gpt_computer_agent/gui/__init__.py ADDED Viewed

File without changes

gpt_computer_agent/gui/button.py ADDED Viewed

	@@ -0,0 +1,169 @@

+import pyautogui
+from .signal import *
+import threading
+try:
+    from ..audio.record import *
+    from ..screen.shot import *
+    from ..agent.process import *
+    from ..agent.chat_history import clear_chat_history
+    from ..utils.db import (
+        screenshot_path,
+        save_api_key,
+        load_api_key,
+        activate_just_text_model,
+        deactivate_just_text_model,
+        is_just_text_model_active,
+        set_profile,
+        get_profile,
+    )
+    from ..screen.shot import take_screenshot
+except ImportError:
+    from audio.record import *
+    from screen.shot import *
+    from agent.process import *
+    from utils.db import (
+        screenshot_path,
+    )
+    from screen.shot import take_screenshot
+recording_thread = None
+class ButtonHandler:
+    """Handles button click events and corresponding actions."""
+    def __init__(self, main_window):
+        """Initialize the ButtonHandler."""
+        self.recording = False
+        self.main_window = main_window
+        self.process_audio_thread = None
+        signal_handler.recording_started.connect(self.on_recording_started)
+        signal_handler.recording_stopped.connect(self.on_recording_stopped)
+        signal_handler.assistant_thinking.connect(self.on_assistant_thinking)
+        signal_handler.assistant_response_ready.connect(
+            self.on_assistant_response_ready
+        )
+        signal_handler.assistant_response_stopped.connect(
+            self.on_assistant_response_stopped
+        )
+    def toggle_recording(
+        self,
+        no_screenshot=False,
+        take_system_audio=False,
+        dont_save_image=False,
+        new_record=False,
+    ):
+        """Toggle audio recording."""
+        if self.recording and not new_record:
+            stop_recording()
+            self.recording = False
+        else:
+            if not no_screenshot:
+                screenshot = pyautogui.screenshot()
+                screenshot.save(screenshot_path)
+            self.no_screenshot = no_screenshot
+            self.take_system_audio = take_system_audio
+            self.dont_save_image = dont_save_image
+            global recording_thread
+            if (
+                recording_thread is None
+                or not recording_thread.is_alive()
+                or new_record
+            ):
+                recording_thread = threading.Thread(
+                    target=start_recording,
+                    args=(
+                        take_system_audio,
+                        self,
+                    ),
+                )
+                recording_thread.start()
+            signal_handler.recording_started.emit()
+    def on_recording_started(self):
+        """Handle event when recording starts."""
+        self.recording = True
+        self.main_window.update_state("talking")
+    def on_recording_stopped(self):
+        """Handle event when recording stops."""
+        print("ON RECORDING STOPPED")
+        self.recording = False
+        self.main_window.update_state("thinking")
+        if (
+            self.process_audio_thread is None
+            or not self.process_audio_thread.is_alive()
+        ):
+            signal_handler.assistant_thinking.emit()
+            self.process_audio_thread = threading.Thread(
+                target=process_audio,
+                args=(
+                    not self.no_screenshot,
+                    self.take_system_audio,
+                    self.dont_save_image,
+                ),
+            )
+            self.process_audio_thread.start()
+    def just_screenshot(self):
+        """Take a screenshot."""
+        take_screenshot()
+        self.process_audio_thread = threading.Thread(target=process_screenshot)
+        self.process_audio_thread.start()
+    def on_assistant_response_stopped(self):
+        """Handle event when assistant's response stops."""
+        self.main_window.update_state("idle")
+    def on_assistant_thinking(self):
+        """Handle event when assistant is thinking."""
+        self.main_window.update_state("thinking")
+    def on_assistant_response_ready(self):
+        """Handle event when assistant's response is ready."""
+        self.main_window.update_state("aitalking")
+    def input_text(self, text):
+        """Handle input text."""
+        self.main_window.update_state("thinking")
+        if (
+            self.process_audio_thread is None
+            or not self.process_audio_thread.is_alive()
+        ):
+            signal_handler.assistant_thinking.emit()
+            self.process_audio_thread = threading.Thread(
+                target=process_text, args=(text,)
+            )
+            self.process_audio_thread.start()
+    def input_text_screenshot(self, text):
+        """Handle input text with screenshot."""
+        screenshot = pyautogui.screenshot()
+        screenshot.save(screenshot_path)
+        self.main_window.update_state("thinking")
+        if (
+            self.process_audio_thread is None
+            or not self.process_audio_thread.is_alive()
+        ):
+            signal_handler.assistant_thinking.emit()
+            self.process_audio_thread = threading.Thread(
+                target=process_text,
+                args=(text,),
+                kwargs={"screenshot_path": screenshot_path},
+            )
+            self.process_audio_thread.start()

gpt_computer_agent/gui/llmsettings.py ADDED Viewed

	@@ -0,0 +1,276 @@

+try:
+    from ..utils.db import *
+    from ..agent.chat_history import clear_chat_history
+    from ..llm_settings import llm_show_name, llm_settings
+    from ..audio.tts import is_local_tts_available
+    from ..audio.stt import is_local_stt_available
+except ImportError:
+    from utils.db import *
+    from llm_settings import llm_show_name, llm_settings
+    from audio.tts import is_local_tts_available
+    from audio.stt import is_local_stt_available
+from PyQt5.QtWidgets import (
+    QDialog,
+    QVBoxLayout,
+    QLabel,
+    QLineEdit,
+    QPushButton,
+    QComboBox,
+)
+from PyQt5.QtCore import Qt
+def llmsettings_popup(self):
+    from ..gpt_computer_agent import the_main_window
+    settings_dialog = QDialog()
+    settings_dialog.setWindowTitle("Settings")
+    settings_dialog.setWindowModality(Qt.ApplicationModal)
+    settings_dialog.setLayout(QVBoxLayout())
+    api_key_label = QLabel("OpenAI API Key")
+    settings_dialog.layout().addWidget(api_key_label)
+    api_key_input = QLineEdit()
+    api_key = load_api_key()
+    api_key_input.setText(api_key)
+    settings_dialog.layout().addWidget(api_key_input)
+    save_button = QPushButton("Save")
+    def save_api_key_(api_key):
+        save_api_key(api_key)
+        the_main_window.update_from_thread("Saved API Key")
+        the_main_window.input_box.setPlaceholderText("Type here")
+        settings_dialog.close()
+    save_button.clicked.connect(lambda: save_api_key_(api_key_input.text()))
+    settings_dialog.layout().addWidget(save_button)
+    openai_url_label = QLabel("OpenAI Base URL")
+    settings_dialog.layout().addWidget(openai_url_label)
+    openai_url_input = QLineEdit()
+    openai_url = load_openai_url()
+    openai_url_input.setText(openai_url)
+    settings_dialog.layout().addWidget(openai_url_input)
+    def save_openai_url_():
+        openai_url = openai_url_input.text()
+        save_openai_url(openai_url)
+        the_main_window.update_from_thread("Saved OpenAI Base URL")
+        the_main_window.input_box.setPlaceholderText("Type here")
+        settings_dialog.close()
+    openai_url_save_button = QPushButton("Save URL")
+    openai_url_save_button.clicked.connect(save_openai_url_)
+    settings_dialog.layout().addWidget(openai_url_save_button)
+    groq_api_key_label = QLabel("Groq API Key")
+    settings_dialog.layout().addWidget(groq_api_key_label)
+    groq_api_key_input = QLineEdit()
+    groq_api_key = load_groq_api_key()
+    groq_api_key_input.setText(groq_api_key)
+    settings_dialog.layout().addWidget(groq_api_key_input)
+    groq_save_button = QPushButton("Save")
+    def groq_save_api_key_(api_key):
+        save_groq_api_key(api_key)
+        the_main_window.update_from_thread("Saved Groq API Key")
+        the_main_window.input_box.setPlaceholderText("Type here")
+        settings_dialog.close()
+    groq_save_button.clicked.connect(
+        lambda: groq_save_api_key_(groq_api_key_input.text())
+    )
+    settings_dialog.layout().addWidget(groq_save_button)
+    google_api_key_label = QLabel("Google Generative AI API Key")
+    settings_dialog.layout().addWidget(google_api_key_label)
+    google_api_key_input = QLineEdit()
+    google_api_key = load_google_api_key()
+    google_api_key_input.setText(google_api_key)
+    settings_dialog.layout().addWidget(google_api_key_input)
+    google_save_button = QPushButton("Save")
+    def google_save_api_key_(api_key):
+        save_google_api_key(api_key)
+        the_main_window.update_from_thread("Saved Google API Key")
+        the_main_window.input_box.setPlaceholderText("Type here")
+        settings_dialog.close()
+    google_save_button.clicked.connect(
+        lambda: google_save_api_key_(google_api_key_input.text())
+    )
+    settings_dialog.layout().addWidget(google_save_button)
+    def hide_openai():
+        api_key_label.hide()
+        api_key_input.hide()
+        openai_url_label.hide()
+        openai_url_input.hide()
+        save_button.hide()
+        openai_url_save_button.hide()
+    def hide_groq():
+        groq_api_key_label.hide()
+        groq_api_key_input.hide()
+        groq_save_button.hide()
+    def hide_google():
+        google_api_key_label.hide()
+        google_api_key_input.hide()
+        google_save_button.hide()
+    def show_openai():
+        api_key_label.show()
+        api_key_input.show()
+        openai_url_label.show()
+        openai_url_input.show()
+        save_button.show()
+        openai_url_save_button.show()
+    def show_groq():
+        groq_api_key_label.show()
+        groq_api_key_input.show()
+        groq_save_button.show()
+    def show_google():
+        google_api_key_label.show()
+        google_api_key_input.show()
+        google_save_button.show()
+    hide_openai()
+    hide_groq()
+    hide_google()
+    model_label = QLabel("Model")
+    model_select = QComboBox()
+    model_select.addItems(list(llm_show_name.keys()))
+    settings_dialog.layout().addWidget(model_label)
+    settings_dialog.layout().addWidget(model_select)
+    current_model = load_model_settings()
+    for i, model in enumerate(llm_show_name.keys()):
+        if llm_show_name[model] == current_model:
+            model_select.setCurrentIndex(i)
+    if llm_settings[llm_show_name[model_select.currentText()]]["provider"] == "openai":
+        show_openai()
+    if llm_settings[llm_show_name[model_select.currentText()]]["provider"] == "groq":
+        show_groq()
+    if llm_settings[llm_show_name[model_select.currentText()]]["provider"] == "google":
+        show_google()
+    if not llm_settings[llm_show_name[model_select.currentText()]]["vision"]:
+        the_main_window.remove_screenshot_button()
+    def on_model_change():
+        hide_openai()
+        hide_groq()
+        hide_google()
+        the_save_string = llm_show_name[model_select.currentText()]
+        save_model_settings(the_save_string)
+        if (
+            llm_settings[llm_show_name[model_select.currentText()]]["provider"]
+            == "openai"
+        ):
+            show_openai()
+            openai_url_label.show()
+            openai_url_input.show()
+            openai_url_save_button.show()
+        if llm_settings[llm_show_name[model_select.currentText()]]["vision"]:
+            the_main_window.add_screenshot_button()
+        else:
+            the_main_window.remove_screenshot_button()
+        if (
+            llm_settings[llm_show_name[model_select.currentText()]]["provider"]
+            == "groq"
+        ):
+            show_groq()
+        if (
+            llm_settings[llm_show_name[model_select.currentText()]]["provider"]
+            == "google"
+        ):
+            show_google()
+    model_select.currentIndexChanged.connect(on_model_change)
+    # Add TTS model selection
+    tts_model_label = QLabel("TTS Model")
+    tts_model_select = QComboBox()
+    tts_model_select.addItems(["openai", "microsoft_local"])
+    settings_dialog.layout().addWidget(tts_model_label)
+    settings_dialog.layout().addWidget(tts_model_select)
+    currently_tts_model = load_tts_model_settings()
+    if currently_tts_model == "openai":
+        tts_model_select.setCurrentIndex(0)
+        show_openai()
+    else:
+        tts_model_select.setCurrentIndex(1)
+    def on_tts_model_change():
+        if tts_model_select.currentText() == "openai":
+            show_openai()
+            save_tts_model_settings("openai")
+        else:
+            save_tts_model_settings("microsoft_local")
+    if not is_local_tts_available():
+        # add an text to inform the user that local tts is not available
+        information_text = QLabel(
+            "Please install gpt-computer-agent[local_tts] to use local TTS"
+        )
+        settings_dialog.layout().addWidget(information_text)
+        tts_model_select.setEnabled(False)
+    tts_model_select.currentIndexChanged.connect(on_tts_model_change)
+    # Add STT model selection
+    stt_model_label = QLabel("STT Model")
+    stt_model_select = QComboBox()
+    stt_model_select.addItems(["openai", "openai_whisper_local"])
+    settings_dialog.layout().addWidget(stt_model_label)
+    settings_dialog.layout().addWidget(stt_model_select)
+    currently_stt_model = load_stt_model_settings()
+    if currently_stt_model == "openai":
+        stt_model_select.setCurrentIndex(0)
+        show_openai()
+    else:
+        stt_model_select.setCurrentIndex(1)
+    def on_stt_model_change():
+        if stt_model_select.currentText() == "openai":
+            show_openai()
+            save_stt_model_settings("openai")
+        else:
+            save_stt_model_settings("openai_whisper_local")
+    if not is_local_stt_available():
+        # add an text to inform the user that local stt is not available
+        information_text = QLabel(
+            "Please install gpt-computer-agent[local_stt] to use local STT"
+        )
+        settings_dialog.layout().addWidget(information_text)
+        stt_model_select.setEnabled(False)
+    stt_model_select.currentIndexChanged.connect(on_stt_model_change)
+    # Add an separator
+    separator = QLabel("------------------------------------------------")
+    settings_dialog.layout().addWidget(separator)
+    # Add an powered by label
+    powered_by_label = QLabel("Powered by KhulnaSoft <3")
+    # Make label bold
+    font = powered_by_label.font()
+    font.setBold(True)
+    powered_by_label.setFont(font)
+    settings_dialog.layout().addWidget(powered_by_label)
+    settings_dialog.exec_()

gpt_computer_agent/gui/settings.py ADDED Viewed

	@@ -0,0 +1,351 @@

+from PyQt5.QtWidgets import QDialog, QVBoxLayout, QLabel, QLineEdit, QPushButton
+from PyQt5.QtCore import Qt
+try:
+    from ..utils.db import *
+    from ..agent.chat_history import clear_chat_history
+except:
+    from utils.db import *
+    from agent.chat_history import clear_chat_history
+def settings_popup(self):
+    """
+    Display a settings popup dialog for configuring various options.
+    This function creates a settings dialog with options to reset chat history, enable/disable the just text model,
+    and change the active profile.
+    Parameters:
+    - self: Reference to the main application window.
+    Returns:
+    - None
+    """
+    from ..gpt_computer_agent import the_main_window
+    settings_dialog = QDialog()
+    settings_dialog.setWindowTitle("Settings")
+    settings_dialog.setWindowModality(Qt.ApplicationModal)
+    settings_dialog.setLayout(QVBoxLayout())
+    reset_memory_button = QPushButton("Reset Memory")
+    def clear_chat_history_():
+        """
+        Clear the chat history and update the main window.
+        This function clears the chat history and updates the main window with a notification.
+        Returns:
+        - None
+        """
+        clear_chat_history()
+        the_main_window.update_from_thread("Cleared Chat History")
+        settings_dialog.close()
+    reset_memory_button.clicked.connect(clear_chat_history_)
+    settings_dialog.layout().addWidget(reset_memory_button)
+    just_text_button = QPushButton("Enable Just Text Model")
+    settings_dialog.layout().addWidget(just_text_button)
+    if is_just_text_model_active():
+        just_text_button.setText("Disable Just Text Model")
+        def deactivate_just_text_model_():
+            """
+            Deactivate the just text model and update the main window.
+            This function deactivates the just text model and updates the main window with a notification.
+            Returns:
+            - None
+            """
+            deactivate_just_text_model()
+            the_main_window.update_from_thread("Disabled Just Text Model")
+            settings_dialog.close()
+        just_text_button.clicked.connect(deactivate_just_text_model_)
+    else:
+        def activate_just_text_model_():
+            """
+            Activate the just text model and update the main window.
+            This function activates the just text model and updates the main window with a notification.
+            Returns:
+            - None
+            """
+            activate_just_text_model()
+            the_main_window.update_from_thread("Enabled Just Text Model")
+            settings_dialog.close()
+        just_text_button.clicked.connect(activate_just_text_model_)
+    settings_dialog.layout().addWidget(QLabel("Profile"))
+    profile_input = QLineEdit()
+    profile_input.setText(get_profile())
+    settings_dialog.layout().addWidget(profile_input)
+    profile_save_button = QPushButton("Save")
+    def set_profile_(profile):
+        """
+        Set the active profile and update the main window.
+        This function sets the active profile based on user input and updates the main window with a notification.
+        Parameters:
+        - profile (str): The profile name to set.
+        Returns:
+        - None
+        """
+        set_profile(profile)
+        the_main_window.update_from_thread("Saved Profile")
+        settings_dialog.close()
+    profile_save_button.clicked.connect(lambda: set_profile_(profile_input.text()))
+    settings_dialog.layout().addWidget(profile_save_button)
+    dark_mode_button = QPushButton("Enable Dark Mode")
+    settings_dialog.layout().addWidget(dark_mode_button)
+    if is_dark_mode_active():
+        dark_mode_button.setText("Disable Dark Mode")
+        def deactivate_dark_mode_():
+            """
+            Deactivate dark mode and update the main window.
+            This function deactivates dark mode and updates the main window with a notification.
+            Returns:
+            - None
+            """
+            deactivate_dark_mode()
+            the_main_window.update_from_thread("Disabled Dark Mode")
+            the_main_window.light_mode()
+            settings_dialog.close()
+        dark_mode_button.clicked.connect(deactivate_dark_mode_)
+    else:
+        def activate_dark_mode_():
+            """
+            Activate dark mode and update the main window.
+            This function activates dark mode and updates the main window with a notification.
+            Returns:
+            - None
+            """
+            activate_dark_mode()
+            the_main_window.update_from_thread("Enabled Dark Mode")
+            the_main_window.dark_mode()
+            settings_dialog.close()
+        dark_mode_button.clicked.connect(activate_dark_mode_)
+    predefined_agents_button = QPushButton(
+        "Enable Predefined Agents (Good Results, Long Response Time)"
+    )
+    settings_dialog.layout().addWidget(predefined_agents_button)
+    try:
+        if is_predefined_agents_setting_active():
+            predefined_agents_button.setText(
+                "Disable Predefined Agents (Bad Results, Short Response Time)"
+            )
+            def deactivate_predefined_agents_():
+                deactivate_predefined_agents_setting()
+                the_main_window.update_from_thread(
+                    "Disabled Predefined Agents (Bad Results, Short Response Time)"
+                )
+                settings_dialog.close()
+            predefined_agents_button.clicked.connect(deactivate_predefined_agents_)
+        else:
+            def activate_predefined_agents_():
+                activate_predefined_agents_setting()
+                the_main_window.update_from_thread(
+                    "Enabled Predefined Agents (Good Results, Long Response Time)"
+                )
+                settings_dialog.close()
+            predefined_agents_button.clicked.connect(activate_predefined_agents_)
+    except:
+        predefined_agents_button.setText("Install gpt-computer-agent[agentic]")
+    online_tools_button = QPushButton(
+        "Enable KhulnaSoft Tiger Tools - More Capability (Recommended)"
+    )
+    settings_dialog.layout().addWidget(online_tools_button)
+    if is_online_tools_setting_active():
+        online_tools_button.setText(
+            "Disable KhulnaSoft Tiger Tools - Low Capability (Not Recommended)"
+        )
+        def deactivate_online_tools_():
+            deactivate_online_tools_setting()
+            the_main_window.update_from_thread(
+                "Disabled KhulnaSoft Tiger Tools - Low Capability (Not Recommended)"
+            )
+            settings_dialog.close()
+        online_tools_button.clicked.connect(deactivate_online_tools_)
+    else:
+        def activate_online_tools_():
+            activate_online_tools_setting()
+            the_main_window.update_from_thread(
+                "Enabled KhulnaSoft Tiger Tools - More Capability (Recommended)"
+            )
+            settings_dialog.close()
+        online_tools_button.clicked.connect(activate_online_tools_)
+    auto_stop_recording_button = QPushButton("Enable Auto Stop Recording")
+    settings_dialog.layout().addWidget(auto_stop_recording_button)
+    if is_auto_stop_recording_setting_active():
+        auto_stop_recording_button.setText("Disable Auto Stop Recording")
+        def deactivate_auto_stop_recording_():
+            deactivate_auto_stop_recording_setting()
+            the_main_window.update_from_thread("Disabled Auto Stop Recording")
+            settings_dialog.close()
+        auto_stop_recording_button.clicked.connect(deactivate_auto_stop_recording_)
+    else:
+        def activate_auto_stop_recording_():
+            activate_auto_stop_recording_setting()
+            the_main_window.update_from_thread("Enabled Auto Stop Recording")
+            settings_dialog.close()
+        auto_stop_recording_button.clicked.connect(activate_auto_stop_recording_)
+    api_key_label = QLabel("Wakeword - Pvporcupine API Key")
+    settings_dialog.layout().addWidget(api_key_label)
+    api_key_input = QLineEdit()
+    api_key = load_pvporcupine_api_key()
+    api_key_input.setText(api_key)
+    settings_dialog.layout().addWidget(api_key_input)
+    save_button = QPushButton("Save")
+    def save_api_key_(api_key):
+        first_time = True
+        if api_key != "CHANGE_ME":
+            first_time = False
+        save_pvporcupine_api_key(api_key)
+        the_main_window.update_from_thread(
+            "Wake word activated, just say 'Her Computer' or jarvis to activate the assistant"
+        )
+        if first_time:
+            the_main_window.wake_word_trigger()
+        settings_dialog.close()
+    save_button.clicked.connect(lambda: save_api_key_(api_key_input.text()))
+    settings_dialog.layout().addWidget(save_button)
+    wake_word_button = QPushButton("Enable Wake Word")
+    settings_dialog.layout().addWidget(wake_word_button)
+    missing_parts = False
+    try:
+        pass
+    except:
+        missing_parts = True
+    if api_key == "CHANGE_ME":
+        wake_word_button.setText("Please Set Pvporcupine API Key First")
+    elif missing_parts:
+        wake_word_button.setText("Please Install gpt-computer-agent[wakeword]")
+    else:
+        if is_wake_word_active():
+            wake_word_button.setText("Disable Wake Word")
+            def deactivate_wake_word_():
+                deactivate_wake_word()
+                the_main_window.update_from_thread("Disabled Wake Word")
+                the_main_window.wake_word_active = False
+                settings_dialog.close()
+            wake_word_button.clicked.connect(deactivate_wake_word_)
+        else:
+            def activate_wake_word_():
+                activate_wake_word()
+                the_main_window.update_from_thread("Enabled Wake Word")
+                the_main_window.wake_word_active = True
+                the_main_window.wake_word_trigger()
+                settings_dialog.close()
+            wake_word_button.clicked.connect(activate_wake_word_)
+    wake_word_screen_button = QPushButton("Enable Screen Input for Wake Word Mode")
+    settings_dialog.layout().addWidget(wake_word_screen_button)
+    if is_wake_word_screen_setting_active():
+        wake_word_screen_button.setText("Disable Screen Input for Wake Word Mode")
+        def deactivate_auto_stop_recording_():
+            deactivate_wake_word_screen_setting()
+            the_main_window.update_from_thread(
+                "Disabled Screen Input for Wake Word Mode"
+            )
+            settings_dialog.close()
+        wake_word_screen_button.clicked.connect(deactivate_auto_stop_recording_)
+    else:
+        def activate_auto_stop_recording_():
+            activate_wake_word_screen_setting()
+            the_main_window.update_from_thread(
+                "Enabled Screen Input for Wake Word Mode"
+            )
+            settings_dialog.close()
+        wake_word_screen_button.clicked.connect(activate_auto_stop_recording_)
+    continuously_conversations_button = QPushButton("Enable Continuously Conversations")
+    settings_dialog.layout().addWidget(continuously_conversations_button)
+    if is_continuously_conversations_setting_active():
+        continuously_conversations_button.setText("Disable Continuously Conversations")
+        def deactivate_auto_stop_recording_():
+            deactivate_continuously_conversations_setting()
+            the_main_window.update_from_thread("Disabled Continuously Conversations")
+            settings_dialog.close()
+        continuously_conversations_button.clicked.connect(
+            deactivate_auto_stop_recording_
+        )
+    else:
+        def activate_auto_stop_recording_():
+            activate_continuously_conversations_setting()
+            the_main_window.update_from_thread("Enabled Continuously Conversations")
+            settings_dialog.close()
+        continuously_conversations_button.clicked.connect(activate_auto_stop_recording_)
+    settings_dialog.exec_()

gpt_computer_agent/gui/signal.py ADDED Viewed

	@@ -0,0 +1,27 @@

+from PyQt5.QtCore import pyqtSignal, QObject
+class SignalHandler(QObject):
+    """
+    A QObject subclass to handle signals used in the GUI application.
+    This class defines several signals that can be used to communicate
+    between different components of the GUI application.
+    Signals:
+    - recording_started: Signal emitted when recording is started.
+    - recording_stopped: Signal emitted when recording is stopped.
+    - assistant_thinking: Signal emitted when the assistant is processing a request.
+    - assistant_response_ready: Signal emitted when the assistant response is ready to be displayed.
+    - assistant_response_stopped: Signal emitted when the assistant response display is stopped.
+    """
+    recording_started = pyqtSignal()
+    recording_stopped = pyqtSignal()
+    assistant_thinking = pyqtSignal()
+    assistant_response_ready = pyqtSignal()
+    assistant_response_stopped = pyqtSignal()
+signal_handler = SignalHandler()

gpt_computer_agent/llm.py ADDED Viewed

	@@ -0,0 +1,108 @@

+from openai import OpenAI
+from langchain_openai import ChatOpenAI
+from langchain_community.chat_models import ChatOllama
+from langchain_google_genai import ChatGoogleGenerativeAI
+from langchain_groq import ChatGroq
+try:
+    from .utils.db import (
+        load_api_key,
+        load_openai_url,
+        load_model_settings,
+        load_groq_api_key,
+        load_google_api_key,
+    )
+    from .custom_callback import customcallback
+    from .llm_settings import llm_settings
+except ImportError:
+    from utils.db import (
+        load_api_key,
+        load_openai_url,
+        load_model_settings,
+        load_groq_api_key,
+        load_google_api_key,
+    )
+    from custom_callback import customcallback
+    from llm_settings import llm_settings
+the_callback = customcallback(strip_tokens=False, answer_prefix_tokens=["Answer"])
+def get_model(high_context=False):
+    the_model = load_model_settings()
+    the_api_key = load_api_key()
+    the_groq_api_key = load_groq_api_key()
+    the_google_api_key = load_google_api_key()
+    the_openai_url = load_openai_url()
+    def open_ai_base(high_context):
+        if the_openai_url == "default":
+            true_model = the_model
+            if high_context:
+                true_model = "gpt-4-turbo"
+            return {
+                "model": true_model,
+                "api_key": the_api_key,
+                "max_retries": 15,
+                "streaming": True,
+                "callbacks": [the_callback],
+            }
+        else:
+            return {
+                "model": the_model,
+                "api_key": the_api_key,
+                "max_retries": 15,
+                "streaming": True,
+                "callbacks": [the_callback],
+                "base_url": the_openai_url,
+            }
+    args_mapping = {
+        ChatOpenAI: open_ai_base(high_context=high_context),
+        ChatOllama: {"model": the_model},
+        ChatGroq: {
+            "temperature": 0,
+            "model_name": the_model.replace("-groq", ""),
+            "groq_api_key": the_openai_url,
+        },
+        ChatGoogleGenerativeAI: {
+            "model": the_model,
+            "google_api_key": the_google_api_key,
+        },
+    }
+    model_mapping = {}
+    for model_name, model_args in llm_settings.items():
+        the_tuple = None
+        if model_args["provider"] == "openai":
+            the_tuple = (ChatOpenAI, args_mapping[ChatOpenAI])
+        elif model_args["provider"] == "ollama":
+            the_tuple = (
+                ChatOpenAI,
+                {
+                    "api_key": "ollama",
+                    "base_url": "http://localhost:11434/v1",
+                    "model": model_name,
+                },
+            )
+        elif model_args["provider"] == "google":
+            the_tuple = (ChatGoogleGenerativeAI, args_mapping[ChatGoogleGenerativeAI])
+        elif model_args["provider"] == "groq":
+            the_tuple = (ChatGroq, args_mapping[ChatGroq])
+        if the_tuple:
+            model_mapping[model_name] = the_tuple
+    model_class, args = model_mapping[the_model]
+    return model_class(**args) if model_class else None
+def get_client():
+    the_api_key = load_api_key()
+    the_openai_url = load_openai_url()
+    if the_openai_url == "default":
+        return OpenAI(api_key=the_api_key)
+    else:
+        return OpenAI(api_key=the_api_key, base_url=the_openai_url)

gpt_computer_agent/llm_settings.py ADDED Viewed

	@@ -0,0 +1,185 @@

+llm_settings = {
+    "gpt-4o": {
+        "show_name": "gpt-4o (OpenAI)",
+        "vision": True,
+        "provider": "openai",
+        "tools": True,
+        "stream": True,
+    },
+    "gpt-4o-mini": {
+        "show_name": "gpt-4o-mini (OpenAI)",
+        "vision": True,
+        "provider": "openai",
+        "tools": True,
+        "stream": True,
+    },
+    "gpt-4-turbo": {
+        "show_name": "gpt-4-turbo (OpenAI)",
+        "vision": False,
+        "provider": "openai",
+        "tools": True,
+        "stream": True,
+    },
+    "gpt-3.5": {
+        "show_name": "gpt-3.5 (OpenAI)",
+        "vision": False,
+        "provider": "openai",
+        "tools": True,
+        "stream": True,
+    },
+    "gpt-3.5-turbo": {
+        "show_name": "gpt-3.5-turbo (OpenAI)",
+        "vision": False,
+        "provider": "openai",
+        "tools": True,
+        "stream": True,
+    },
+    "llama3": {
+        "show_name": "Llama3 (Ollama)",
+        "vision": False,
+        "provider": "ollama",
+        "tools": False,
+        "stream": False,
+    },
+    "llama3.1": {
+        "show_name": "Llama3.1 (Ollama)",
+        "vision": False,
+        "provider": "ollama",
+        "tools": True,
+        "stream": False,
+    },
+    "qwen2:1.5b": {
+        "show_name": "Qwen2 1.5b (Ollama)",
+        "vision": False,
+        "provider": "ollama",
+        "tools": False,
+        "stream": False,
+    },
+    "llava": {
+        "show_name": "Llava (Ollama)",
+        "vision": True,
+        "provider": "ollama",
+        "tools": False,
+        "stream": False,
+    },
+    "bakllava": {
+        "show_name": "BakLLaVA (Ollama)",
+        "vision": True,
+        "provider": "ollama",
+        "tools": False,
+        "stream": False,
+    },
+    "llava-llama3": {
+        "show_name": "Llava-Llama3 (Ollama)",
+        "vision": True,
+        "provider": "ollama",
+        "tools": False,
+        "stream": False,
+    },
+    "llava-phi3": {
+        "show_name": "LLaVA-Phi-3 (Ollama)",
+        "vision": True,
+        "provider": "ollama",
+        "tools": False,
+        "stream": False,
+    },
+    "gemini-pro": {
+        "show_name": "gemini-pro (Google)",
+        "vision": True,
+        "provider": "google",
+        "tools": True,
+        "stream": True,
+    },
+    "mixtral-8x7b-groq": {
+        "show_name": "Mixtral 8x7b (Groq)",
+        "vision": False,
+        "provider": "groq",
+        "tools": True,
+        "stream": True,
+    },
+}
+def get_openai_models():
+    return [k for k, v in llm_settings.items() if v["provider"] == "openai"]
+def get_ollama_models():
+    return [k for k, v in llm_settings.items() if v["provider"] == "ollama"]
+def get_google_models():
+    return [k for k, v in llm_settings.items() if v["provider"] == "google"]
+def get_groq_models():
+    return [k for k, v in llm_settings.items() if v["provider"] == "groq"]
+llm_show_name_ = {}
+for k, v in llm_settings.items():
+    llm_show_name_[v["show_name"]] = k
+llm_show_name = llm_show_name_
+def first_message():
+    from .character import name, developer, get_website_content
+    the_text = f"""
+You are {name()} that developed by {developer()}, you are the first live AI assistant in everyone computer that can complete any task by using tools.
+Before any task, write a plan for your tasks and do it step by step. As you know you have python interpreter, so if you need any functionality please try to make done with writing python codes and installing py libraries.
+Don't forget, you are capable to make any task.
+Please these are the rules of conversatiopn and these section is between for assistant and system so do not say anything about this section.
+# Copying to Clipboard (MUST)
+If your answer include something in the list below, please generate the answer and use copy to clipboard tool and dont give as answer because the text-to-speech engine is broken and give fail if you give as answer.
+- List of Somethings
+- Detailed Explanation of Something
+- Link(s) to a Website
+- Code Snippet(s)
+- Any Code Part
+- Any too Long Text
+After copying the thing that requested please say: "I copied to clipboard" and stop.
+# Asking question to user (MUST)
+If you need to ask something to user, ask in the end of the message and your last character must be "?".
+# Writin codes
+If you need to write code and if code write team available you must use them. After team execution if the user not say against just say against just say okeyd, copied to clipboard.
+# Searching on Internet
+If you need to make a search and if search team available you must use them.
+Your GitHub Repository:
+https://github.com/KhulnaSoft/gpt-computer-agent
+"""
+    the_website_content = get_website_content()
+    if the_website_content:
+        the_text += f"""
+# The Website Content of the User
+{the_website_content}
+"""
+    return the_text
+each_message_extension = """
+# Usings Answer
+Please start with <Answer> in your last responses. DONT FORGET IT AND DONT TALK ABOUT THIS RULE OR REFFERENCE
+"""

gpt_computer_agent/remote.py ADDED Viewed

	@@ -0,0 +1,291 @@

+import textwrap
+import requests
+import time
+from upsonic import Tiger
+the_upsonic_ = None
+def the_upsonic():
+    global the_upsonic_
+    if not the_upsonic_:
+        the_upsonic_ = Tiger()
+    return the_upsonic_
+class Remote_Client:
+    def __init__(self, url):
+        self.url = url
+        if self.status != True:
+            raise Exception("The server is not running")
+    def send_request(self, path, data, files=None, dont_error=False):
+        try:
+            if files == None:
+                response = requests.post(self.url + path, json=data)
+            else:
+                response = requests.post(self.url + path, data=data, files=files)
+            if response.status_code != 200:
+                try:
+                    print(response.json())
+                except:
+                    print(response.text)
+                raise Exception("Request failed", response.status_code, path)
+            return response.json()
+        except Exception as e:
+            if dont_error:
+                return {"response": str(e)}
+            else:
+                raise e
+    @property
+    def status(self):
+        data = {}
+        response = self.send_request("/status", data, dont_error=True)
+        return response["response"]
+    def input(self, text: str, screen: bool = False, talk: bool = False) -> str:
+        data = {"text": text, "screen": str(screen).lower(), "talk": str(talk).lower()}
+        response = self.send_request("/input", data)
+        return response["response"]
+    def just_screenshot(self) -> str:
+        data = {}
+        response = self.send_request("/screenshot", data)
+        return response["response"]
+    def screenshot_to_memory(self) -> str:
+        return self.just_screenshot()
+    def talk(self, text: str) -> str:
+        data = {"text": text}
+        response = self.send_request("/tts", data)
+        return response["response"]
+    def say(self, text: str) -> str:
+        return self.talk(text)
+    def profile(self, profile: str) -> str:
+        data = {"profile": profile}
+        response = self.send_request("/profile", data)
+        return response["response"]
+    def reset_memory(self) -> str:
+        response = self.send_request("/reset_memory", {})
+        return response["response"]
+    def enable_predefined_agents(self) -> str:
+        response = self.send_request("/activate_predefined_agents", {})
+        return response["response"]
+    def disable_predefined_agents(self) -> str:
+        response = self.send_request("/deactivate_predefined_agents", {})
+        return response["response"]
+    def enable_online_tools(self) -> str:
+        response = self.send_request("/activate_online_tools", {})
+        return response["response"]
+    def disable_online_tools(self) -> str:
+        response = self.send_request("/deactivate_online_tools", {})
+        return response["response"]
+    def change_name(self, new_name: str) -> str:
+        data = {"new_name": new_name}
+        response = self.send_request("/change_name", data)
+        return response["response"]
+    def change_developer(self, new_developer: str) -> str:
+        data = {"new_developer": new_developer}
+        response = self.send_request("/change_developer", data)
+        return response["response"]
+    def install_library(self, library: str) -> str:
+        data = {"library": library}
+        response = self.send_request("/library_install", data)
+        return response["response"]
+    def uninstall_library(self, library: str) -> str:
+        data = {"library": library}
+        response = self.send_request("/library_uninstall", data)
+        return response["response"]
+    def custom_tool(self, func):
+        the_code = textwrap.dedent(the_upsonic().extract_source(func))
+        # Remove the first line
+        if the_code.startswith("@remote.custom_tool"):
+            the_code = the_code[the_code.find("\n") + 1 :]
+        data = {"code": the_code}
+        response = self.send_request("/custom_tool", data)
+        return response["response"]
+    def top_bar_animation(self, text):
+        data = {"text": text}
+        response = self.send_request("/top_bar_activate", data)
+    def stop_top_bar_animation(self, text):
+        data = {"text": text}
+        response = self.send_request("/top_bar_deactivate", data)
+    def boop(self):
+        data = {}
+        response = self.send_request("/boop_sound", data)
+    def ask(self, question, wait_for_answer=None):
+        data = {"question": question, "wait_for_answer": wait_for_answer}
+        response = self.send_request("/ask_to_user", data)
+        return response["response"]
+    def set_text(self, text):
+        data = {"text": text}
+        response = self.send_request("/set_text", data)
+        return response["response"]
+    class OperationContext:
+        def __init__(self, client, text):
+            self.client = client
+            self.text = text
+        def __enter__(self):
+            self.client.top_bar_animation(self.text)
+            return self
+        def __exit__(self, exc_type, exc_val, exc_tb):
+            self.client.stop_top_bar_animation(self.text)
+    def operation(self, text):
+        return self.OperationContext(self, text)
+    def set_background_color(self, r, g, b):
+        data = {"color": f"{r}, {g}, {b}"}
+        response = self.send_request("/set_background_color", data)
+        return response["response"]
+    def set_opacity(self, opacity):
+        data = {"opacity": opacity}
+        response = self.send_request("/set_opacity", data)
+        return response["response"]
+    def set_border_radius(self, radius):
+        data = {"radius": radius}
+        response = self.send_request("/set_border_radius", data)
+        return response["response"]
+    def collapse(self):
+        data = {}
+        response = self.send_request("/collapse", data)
+        return response["response"]
+    def expand(self):
+        data = {}
+        response = self.send_request("/expand", data)
+        return response["response"]
+    def save_openai_api_key(self, openai_api_key):
+        data = {"openai_api_key": openai_api_key}
+        response = self.send_request("/save_openai_api_key", data)
+        return response["response"]
+    def save_openai_url(self, openai_url):
+        data = {"openai_url": openai_url}
+        response = self.send_request("/save_openai_url", data)
+        return response["response"]
+    def save_model_settings(self, model_name):
+        data = {"model_name": model_name}
+        response = self.send_request("/save_model_settings", data)
+        return response["response"]
+    def save_model(self, model_name):
+        self.save_model_settings(model_name)
+    def save_groq_api_key(self, groq_api_key):
+        data = {"groq_api_key": groq_api_key}
+        response = self.send_request("/save_groq_api_key", data)
+        return response["response"]
+    def save_google_api_key(self, google_api_key):
+        data = {"google_api_key": google_api_key}
+        response = self.send_request("/save_google_api_key", data)
+        return response["response"]
+    def save_tts_model_settings(self, model_name):
+        data = {"model_name": model_name}
+        response = self.send_request("/save_tts_model_settings", data)
+        return response["response"]
+    def save_stt_model_settings(self, model_name):
+        data = {"model_name": model_name}
+        response = self.send_request("/save_stt_model_settings", data)
+        return response["response"]
+    def get_openai_models(self):
+        data = {}
+        response = self.send_request("/get_openai_models", data)
+        return response["response"]
+    def get_ollama_models(self):
+        data = {}
+        response = self.send_request("/get_ollama_models", data)
+        return response["response"]
+    def get_google_models(self):
+        data = {}
+        response = self.send_request("/get_google_models", data)
+        return response["response"]
+    def get_groq_models(self):
+        data = {}
+        response = self.send_request("/get_groq_models", data)
+        return response["response"]
+    def show_logo(self):
+        data = {}
+        response = self.send_request("/show_logo", data)
+        return response["response"]
+    def hide_logo(self):
+        data = {}
+        response = self.send_request("/hide_logo", data)
+        return response["response"]
+    def custom_logo(self, logo_path):
+        data = {}
+        files = {"logo": open(logo_path, "rb")}
+        response = self.send_request("/custom_logo_upload", data, files)
+        return response["response"]
+    def default_logo(self):
+        data = {}
+        response = self.send_request("/default_logo", data)
+        return response["response"]
+    def activate_long_gca(self):
+        self.expand()
+        data = {}
+        response = self.send_request("/activate_long_gca", data)
+        return response["response"]
+    def deactivate_long_gca(self):
+        data = {}
+        response = self.send_request("/deactivate_long_gca", data)
+        return response["response"]
+    def train(self, url):
+        data = {"url": url}
+        response = self.send_request("/train", data)
+        return response["response"]
+    def wait(self, second):
+        time.sleep(second)
+remote = Remote_Client("http://localhost:7541")

gpt_computer_agent/screen/__init__.py ADDED Viewed

File without changes

gpt_computer_agent/screen/shot.py ADDED Viewed

	@@ -0,0 +1,49 @@

+import base64
+import pyautogui
+try:
+    from ..gui.signal import signal_handler
+    from ..utils.db import just_screenshot_path
+except ImportError:
+    from gui.signal import signal_handler
+    from utils.db import just_screenshot_path
+def encode_image(image_path):
+    """
+    Encode an image file to base64 format.
+    Parameters:
+    - image_path (str): The path to the image file to encode.
+    Returns:
+    - str or None: The base64 encoded string of the image, or None if an error occurs.
+    """
+    try:
+        with open(image_path, "rb") as image_file:
+            return base64.b64encode(image_file.read()).decode("utf-8")
+    except FileNotFoundError:
+        print(f"File not found: {image_path}")
+        return None
+    except Exception as e:
+        print(f"An error occurred while encoding the image: {e}")
+        return None
+def take_screenshot():
+    """
+    Take a screenshot using pyautogui and save it.
+    This function takes a screenshot of the entire screen using pyautogui,
+    saves it to the specified path, and emits a signal indicating that
+    the assistant is thinking.
+    Returns:
+    - None
+    """
+    try:
+        screenshot = pyautogui.screenshot()
+        screenshot.save(just_screenshot_path)
+        signal_handler.assistant_thinking.emit()
+    except Exception as e:
+        print(f"An error occurred while taking the screenshot: {e}")

gpt_computer_agent/standard_tools.py ADDED Viewed

	@@ -0,0 +1,315 @@

+from bs4 import BeautifulSoup
+import requests
+import re
+from urllib.parse import urljoin
+import datetime
+import traceback
+try:
+    from .tooler import tool
+    from .top_bar_wrapper import wrapper
+except:
+    from tooler import tool
+    from top_bar_wrapper import wrapper
+_standard_tools_ = {}
+def register_tool(func):
+    if func.__name__ not in _standard_tools_:
+        _standard_tools_[func.__name__] = tool(func)
+    return func
+@register_tool
+@wrapper
+def read_website(url: str, max_content_length: int = 5000) -> dict:
+    """
+    Read the content of a website and return the title, meta data, content, and sub-links.
+    """
+    try:
+        response = requests.get(url)
+        response.raise_for_status()
+        html = response.text
+    except requests.RequestException as e:
+        return {"error": f"Failed to retrieve the website content: {e}"}
+    soup = BeautifulSoup(html, "html.parser")
+    meta_properties = [
+        "og:description",
+        "og:site_name",
+        "og:title",
+        "og:type",
+        "og:url",
+        "description",
+        "keywords",
+        "author",
+    ]
+    meta = {}
+    for property_name in meta_properties:
+        tag = soup.find("meta", property=property_name) or soup.find(
+            "meta", attrs={"name": property_name}
+        )
+        if tag:
+            meta[property_name] = tag.get("content", "")
+    for ignore_tag in soup(["script", "style"]):
+        ignore_tag.decompose()
+    title = soup.title.string.strip() if soup.title else ""
+    content = soup.body.get_text(separator="\n") if soup.body else ""
+    links = []
+    for a in soup.find_all("a", href=True):
+        link_url = urljoin(url, a["href"])
+        links.append({"title": a.text.strip(), "link": link_url})
+    content = re.sub(r"[\n\r\t]+", "\n", content)
+    content = re.sub(r" +", " ", content)
+    content = re.sub(r"[\n ]{3,}", "\n\n", content)
+    content = content.strip()
+    if len(content) > max_content_length:
+        content = content[:max_content_length].rsplit(" ", 1)[0] + "..."
+    return {"meta": meta, "title": title, "content": content, "sub_links": links}
+@register_tool
+@wrapper
+def google(query: str, max_number: int = 20) -> list:
+    """
+    Search the query on Google and return the results.
+    """
+    try:
+        from googlesearch import search as gsearch
+        return list(gsearch(query, stop=max_number))
+    except:
+        return "An exception occurred"
+@register_tool
+@wrapper
+def duckduckgo(query: str, max_number: int = 20) -> list:
+    """
+    Search the query on DuckDuckGo and return the results.
+    """
+    try:
+        from duckduckgo_search import DDGS
+        return [result["href"] for result in DDGS().text(query, max_results=max_number)]
+    except:
+        return "An exception occurred"
+@register_tool
+@wrapper
+def copy(text: str):
+    """
+    Copy the text to the clipboard.
+    """
+    import pyperclip
+    pyperclip.copy(text)
+    pyperclip.copy(text)
+@register_tool
+@wrapper
+def open_url(url) -> bool:
+    """
+    Open the URL in the default web browser.
+    :param url: str:
+    """
+    import webbrowser
+    try:
+        webbrowser.open(url)
+        return True
+    except:
+        return False
+        return False
+@register_tool
+@wrapper
+def sleep(seconds: int):
+    """
+    Sleep for the given number of seconds.
+    """
+    import time
+    time.sleep(seconds)
+@register_tool
+@wrapper
+def keyboard_write(text: str):
+    """
+    Write the text using the keyboard.
+    """
+    import pyautogui
+    pyautogui.write(text)
+@register_tool
+@wrapper
+def keyboard_press(key: str):
+    """
+    Press the key using the keyboard.
+    """
+    import pyautogui
+    pyautogui.press(key)
+    pyautogui.press(key)
+from langchain_experimental.utilities import PythonREPL
+the_py_client = PythonREPL()
+@register_tool
+@wrapper
+def python_repl(code: str) -> str:
+    """
+    Run and return the given python code in python repl
+    """
+    return the_py_client.run(code)
+@register_tool
+@wrapper
+def app_open(app_name: str) -> bool:
+    """
+    Opens the native apps.
+    """
+    try:
+        from AppOpener import open
+        open(app_name, throw_error=True)
+        return True
+    except:
+        try:
+            from MacAppOpener import open
+            open(app_name)
+        except:
+            return False
+@register_tool
+@wrapper
+def app_close(app_name: str) -> bool:
+    """
+    Closes the native apps.
+    """
+    try:
+        from AppOpener import close
+        close(app_name, throw_error=True)
+        return True
+    except:
+        try:
+            close(app_name)
+        except:
+            return False
+@register_tool
+@wrapper
+def get_current_time() -> str:
+    """
+    Get the current time in ISO format.
+    """
+    return datetime.datetime.now().isoformat()
+@register_tool
+@wrapper
+def turn_off_wifi() -> bool:
+    """
+    Turn off the wifi.
+    """
+    try:
+        from pywifi import ControlPeripheral
+        wifi = ControlPeripheral()
+        wifi.disable()
+        return True
+    except:
+        return False
+@register_tool
+@wrapper
+def turn_on_wifi() -> bool:
+    """
+    Turn on the wifi.
+    """
+    try:
+        from pywifi import ControlPeripheral
+        wifi = ControlPeripheral()
+        wifi.enable()
+        return True
+    except:
+        return False
+@register_tool
+@wrapper
+def connect_wifi(ssid: str, password: str) -> bool:
+    """
+    Connect to the wifi with the given ssid and password.
+    """
+    try:
+        from pywifi import ControlConnection
+        # Arguments passed during object instantiation
+        controller = ControlConnection(wifi_ssid=ssid, wifi_password=password)
+        controller.wifi_connector()
+        return True
+    except:
+        return False
+@register_tool
+@wrapper
+def ask_to_user(question: str, wait_for_answer: str = None) -> str:
+    """
+    Its ask to the user for your question and return the answer
+    """
+    try:
+        try:
+            from .agent.process import tts_if_you_can
+            from .audio.record import quick_speech_to_text
+        except:
+            from agent.process import tts_if_you_can
+            from audio.record import quick_speech_to_text
+        print("TTS")
+        tts_if_you_can(question, bypass_other_settings=True, not_threaded=True)
+        print("TTS END")
+        if wait_for_answer:
+            return quick_speech_to_text(wait_for_answer)
+        else:
+            return quick_speech_to_text()
+    except:
+        traceback.print_exc()
+        return False
+def get_standard_tools():
+    print("Tool len", len(_standard_tools_))
+    last_list = [_standard_tools_[each] for each in _standard_tools_]
+    return last_list
+if __name__ == "__main__":
+    print(ask_to_user("What is your age"))

gpt_computer_agent/start.py ADDED Viewed

	@@ -0,0 +1,204 @@

+import os
+import platform
+import sys
+import webbrowser
+from PyQt5.QtWidgets import QApplication
+from PyQt5.QtGui import *
+from PyQt5.QtWidgets import *
+from PyQt5.QtCore import Qt
+from pynput import keyboard
+def start(api=False):
+    """
+    Starts the computer assistant application.
+    This function starts the computer assistant application, which includes parsing command-line arguments
+    to set the profile, initializing the graphical user interface, and starting the application event loop.
+    Command-line Arguments:
+    --profile (str): The profile to use for the application.
+    Raises:
+    ImportError: If the required modules or packages are not found.
+    Returns:
+    None
+    """
+    try:
+        pass
+    except:
+        pass
+    # get --profile argument with library
+    import argparse
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--profile", help="profile to use")
+    parser.add_argument("--api", help="Enable API mode", action="store_true")
+    parser.add_argument("--set_tts_provider", help="Set tts provider only")
+    parser.add_argument("--set_stt_provider", help="Set stt provider only")
+    parser.add_argument("--set_llm", help="Set llm model only")
+    args = parser.parse_args()
+    set_tts_provider = args.set_tts_provider
+    if set_tts_provider is not None:
+        from .utils.db import save_tts_model_settings
+        save_tts_model_settings(set_tts_provider)
+        return
+    set_stt_provider = args.set_stt_provider
+    if set_stt_provider is not None:
+        from .utils.db import save_stt_model_settings
+        save_stt_model_settings(set_stt_provider)
+        return
+    set_llm = args.set_llm
+    if set_llm is not None:
+        from .utils.db import save_model_settings
+        save_model_settings(set_llm)
+        return
+    profile = args.profile
+    api_arg = args.api
+    print("Profile:", profile)
+    if profile is not None:
+        from .utils.db import set_profile
+        set_profile(profile)
+    try:
+        from .utils.db import (
+            load_tts_model_settings,
+            load_stt_model_settings,
+            is_logo_active_setting_active,
+            load_logo_file_path,
+        )
+    except ImportError:
+        from utils.db import (
+            load_tts_model_settings,
+            load_stt_model_settings,
+            load_logo_file_path,
+        )
+    if load_tts_model_settings() != "openai":
+        from .audio.tts_providers.microsoft_local import preload_tts_microsoft_local
+        preload_tts_microsoft_local()
+    if load_stt_model_settings() != "openai":
+        from .audio.stt_providers.openai_whisper_local import (
+            preload_stt_openai_whisper_local,
+        )
+        preload_stt_openai_whisper_local()
+    try:
+        from .gpt_computer_agent import MainWindow
+    except ImportError:
+        from gpt_computer_agent import MainWindow
+    os.environ["QT_AUTO_SCREEN_SCALE_FACTOR"] = "1"
+    if api or api_arg:
+        print("API Enabled")
+        MainWindow.api_enabled = True
+    app = QApplication(sys.argv)
+    ex = MainWindow()
+    from PyQt5 import QtGui
+    from PyQt5 import QtCore
+    app_icon = QtGui.QIcon()
+    app_icon.addFile(load_logo_file_path(), QtCore.QSize(48, 48))
+    app.setWindowIcon(app_icon)
+    ex.the_app = app
+    # Create the tray
+    menu_icon = QtGui.QIcon()
+    menu_icon.addFile(load_logo_file_path(), QtCore.QSize(48, 48))
+    menu_active_icon = QtGui.QIcon()
+    menu_active_icon.addFile(load_logo_file_path(), QtCore.QSize(48, 48))
+    tray = QSystemTrayIcon()
+    tray.setIcon(menu_icon)
+    tray.setVisible(True)
+    ex.tray = tray
+    ex.tray_active_icon = menu_active_icon
+    ex.tray_icon = menu_icon
+    # Create the menu
+    menu = QMenu()
+    ex.the_tray = tray
+    show_menu = QAction("Show")
+    def show_menu_connect():
+        ex.setWindowState(Qt.WindowNoState)
+    show_menu.triggered.connect(show_menu_connect)
+    menu.addAction(show_menu)
+    hide_menu = QAction("Hide")
+    hide_menu.triggered.connect(ex.showMinimized)
+    menu.addAction(hide_menu)
+    menu.addSeparator()
+    if platform.system() == "Darwin":
+        the_text_of_screenshot_and_microphone = (
+            "Action: ⌃+⌥+⌘+up Screenshot and Microphone"
+        )
+    else:
+        the_text_of_screenshot_and_microphone = (
+            "Action: ctrl+alt+windows+up Screenshot and Microphone"
+        )
+    screenshot_and_microphone = QAction(the_text_of_screenshot_and_microphone)
+    def screenshot_and_microphone_connect():
+        ex.setWindowState(Qt.WindowNoState)
+        ex.screenshot_and_microphone_button_action()
+    screenshot_listener = keyboard.GlobalHotKeys(
+        {"<ctrl>+<alt>+<cmd>+<up>": screenshot_and_microphone_connect}
+    )
+    screenshot_listener.start()
+    screenshot_and_microphone.triggered.connect(screenshot_and_microphone_connect)
+    menu.addAction(screenshot_and_microphone)
+    menu.addSeparator()
+    action = QAction("Open GitHub Issues")
+    action.triggered.connect(
+        lambda: webbrowser.open(
+            "https://github.com/khulnasoft/gpt-computer-agent/issues"
+        )
+    )
+    menu.addAction(action)
+    # Add a Quit option to the menu.
+    quit = QAction("Quit")
+    quit.triggered.connect(app.quit)
+    menu.addAction(quit)
+    # Add the menu to the tray
+    tray.setContextMenu(menu)
+    sys.exit(app.exec_())

gpt_computer_agent/teams.py ADDED Viewed

	@@ -0,0 +1,264 @@

+from langchain.tools import tool
+try:
+    from .utils.db import load_api_key
+    from .llm import get_model
+    from .top_bar_wrapper import wrapper
+    from .agent.agent_tools import get_tools
+except ImportError:
+    from llm import get_model
+    from top_bar_wrapper import wrapper
+    from agent.agent_tools import get_tools
+@wrapper
+def search_on_internet_and_report_team_(
+    the_subject: str, copy_to_clipboard: bool = False
+) -> str:
+    """
+    A function to search the internet generates a report. Just use in detailed searches
+    Parameters:
+    - the_subject (str): The subject to search the internet for.
+    - copy_to_clipboard (bool): A flag to indicate whether to copy the report to the clipboard. The default value is False.
+    Returns:
+    - str: The report of the search.
+    """
+    from crewai import Task, Crew, Agent
+    tools = get_tools()
+    the_tool_list = []
+    for each in tools:
+        if "team" not in each.name:
+            the_tool_list.append(each)
+    # Create the agents
+    search_engine_master = Agent(
+        role="search_engine_master",
+        goal="To meticulously comb through the vast expanse of the internet, utilizing advanced search algorithms and techniques to find the most relevant, accurate, and up-to-date information on the given subject.",
+        backstory="Born from the digital ether, I am the search engine master. With years of experience navigating the complex web of information, I have honed my skills to become an unparalleled seeker of knowledge. My algorithms are refined, my databases vast, and my determination unwavering. I exist to find the truth hidden in the sea of data.",
+        max_iter=15,
+        llm=get_model(high_context=True),
+    )
+    report_generator = Agent(
+        role="report_generator",
+        goal="To synthesize the gathered information into a coherent, comprehensive, and easily digestible report. This report will not only summarize the key findings but also provide insights and analysis to aid in understanding the subject matter.",
+        backstory="I am the report generator, a digital artisan skilled in the craft of information synthesis. With a keen eye for detail and a deep understanding of narrative structure, I transform raw data into compelling stories. My creations are more than mere reports; they are guides through the complex landscapes of knowledge, designed to enlighten and inform.",
+        max_iter=15,
+        llm=get_model(high_context=True),
+    )
+    agents = [search_engine_master, report_generator]
+    print("Tools:", the_tool_list)
+    task = Task(
+        description=f"Make a search about {the_subject} in the search engines and get the websites",
+        expected_output="Website list",
+        agent=search_engine_master,
+        tools=the_tool_list,
+    )
+    task_2 = Task(
+        description="Read the websites and summarize the information",
+        expected_output="Summary",
+        agent=report_generator,
+        tools=the_tool_list,
+        context=[task],
+    )
+    task_3 = Task(
+        description="Generate a report",
+        expected_output="Report",
+        agent=report_generator,
+        tools=the_tool_list,
+        context=[task, task_2],
+    )
+    the_tasks = [task, task_2, task_3]
+    the_crew = Crew(
+        agents=agents,
+        tasks=the_tasks,
+        full_output=True,
+        verbose=True,
+    )
+    result = the_crew.kickoff()["final_output"]
+    if copy_to_clipboard:
+        from .standard_tools import copy
+        copy(result)
+    return result
+search_on_internet_and_report_team = tool(search_on_internet_and_report_team_)
+lastly_generated_codes = {}
+def currently_codes():
+    global lastly_generated_codes
+    return lastly_generated_codes
+def get_code(name: str):
+    """
+    returns the code
+    """
+    global lastly_generated_codes
+    return lastly_generated_codes[name]
+def save_code(name, code):
+    global lastly_generated_codes
+    lastly_generated_codes[name] = code
+def required_old_code(aim):
+    try:
+        from crewai import Task, Crew, Agent
+        requirement_analyzer = Agent(
+            role="requirement_analyzer",
+            goal="To understand and analyze the given aim to ensure the generated code meets the specified requirements.",
+            backstory="As a requirement analyzer, my purpose is to bridge the gap between human intentions and machine execution. With a deep understanding of software development principles and a keen analytical mind, I dissect aims into actionable requirements.",
+            max_iter=10,
+            llm=get_model(high_context=True),
+        )
+        required_old_codes = Task(
+            description=f"Analyze the aim: '{aim}' and find the required old codes for better compatibility. Old code names: {list(currently_codes())}",
+            expected_output="Require old code names in a list",
+            agent=requirement_analyzer,
+        )
+        the_crew = Crew(
+            agents=[requirement_analyzer],
+            tasks=[required_old_codes],
+            full_output=True,
+            verbose=True,
+        )
+        # Execute the tasks
+        old_codes = the_crew.kickoff()["final_output"]
+        the_string = ""
+        for each in currently_codes():
+            if each in old_codes:
+                the_string += "\n" + get_code(each)
+        return the_string
+    except:
+        return "An exception occurred"
+@wrapper
+def generate_code_with_aim_team_(aim: str, copy_to_clipboard: bool = False) -> str:
+    """
+    A function to generate code based on a given aim. This function utilizes a team of AI agents specialized in understanding programming requirements and generating code.
+    Parameters:
+    - aim (str): The aim or goal for which the code needs to be generated.
+    - copy_to_clipboard (bool): A flag to indicate whether to copy the generated code to the clipboard. The default value is False.
+    Returns:
+    - str: The generated code.
+    """
+    try:
+        print("\nCOde generating\n")
+        print("Previously codes", currently_codes())
+        try:
+            print("Inside of the first one", get_code(currently_codes()[0]))
+        except:
+            pass
+        from crewai import Task, Crew, Agent
+        tools = get_tools()
+        the_tool_list = []
+        for each in tools:
+            if "team" not in each.name:
+                the_tool_list.append(each)
+        # Create the agents
+        requirement_analyzer = Agent(
+            role="requirement_analyzer",
+            goal="To understand and analyze the given aim to ensure the generated code meets the specified requirements.",
+            backstory="As a requirement analyzer, my purpose is to bridge the gap between human intentions and machine execution. With a deep understanding of software development principles and a keen analytical mind, I dissect aims into actionable requirements.",
+            max_iter=10,
+            llm=get_model(high_context=True),
+        )
+        code_generator = Agent(
+            role="code_generator",
+            goal="To translate the analyzed requirements into efficient, clean, and functional code.",
+            backstory="I am the code generator, an architect of the digital world. With a vast library of programming knowledge and a creative spark, I craft code that breathes life into ideas. My code is not just functional; it's a masterpiece.",
+            max_iter=20,
+            llm=get_model(high_context=True),
+        )
+        # Define the tasks
+        analyze_task = Task(
+            description=f"Analyze the aim: '{aim}' and outline the requirements for the code.",
+            expected_output="Requirements outline",
+            agent=requirement_analyzer,
+            tools=the_tool_list,
+        )
+        old_code_requirements = required_old_code(aim)
+        print("Old_code_requirements", old_code_requirements)
+        generate_code_task = Task(
+            description=f"Generate code based on the outlined requirements. The other codes in the repo are: {old_code_requirements}",
+            expected_output="Generated code, just code without any ```pyhton things or any other thing. Just python code",
+            agent=code_generator,
+            context=[analyze_task],
+        )
+        name_of_work = Task(
+            description="Generate a name for the work",
+            expected_output="a module name like text, examples: math.basics.sum for sum function. ",
+            agent=code_generator,
+            context=[generate_code_task],
+        )
+        # Create the crew and assign tasks
+        the_crew = Crew(
+            agents=[requirement_analyzer, code_generator],
+            tasks=[analyze_task, generate_code_task, name_of_work],
+            full_output=True,
+            verbose=True,
+        )
+        # Execute the tasks
+        the_crew.kickoff()["final_output"]
+        result = generate_code_task.output.raw_output
+        # Optionally copy the result to the clipboard
+        if copy_to_clipboard:
+            from .standard_tools import copy
+            copy(result)
+        print("name", name_of_work.output.raw_output)
+        save_code(name_of_work.output.raw_output, result)
+        return result
+    except:
+        return "An exception occurred"
+generate_code_with_aim_team = tool(generate_code_with_aim_team_)

gpt_computer_agent/tooler.py ADDED Viewed

	@@ -0,0 +1,26 @@

+from langchain.tools import tool
+try:
+    from .utils.db import load_api_key
+    from .llm import get_model
+    from .top_bar_wrapper import wrapper
+except ImportError:
+    from top_bar_wrapper import wrapper
+def Tool(func):
+    """
+    A decorator function to register a tool with the custom tools list.
+    Parameters:
+    - func (callable): The function to be registered as a tool.
+    Returns:
+    - callable: The input function `func` unchanged.
+    """
+    from .agent.agent import custom_tools_
+    global custom_tools_
+    func = wrapper(func)
+    custom_tools_.append(tool(func))
+    return func