Spaces:

akra35567
/

akira

Running

App Files Files Community

akra35567 committed on Mar 14

Commit

bc6d235

verified ·

1 Parent(s): 11ebde4

Upload 19 files

Browse files

Files changed (8) hide show

.env +45 -0
RELATORIO_TECNICO_OTIMIZACAO.md +44 -0
debug_mistral.py +56 -0
requirements.txt +2 -2
test_direct_mistral.py +50 -0
test_integration_mistral.py +64 -0
test_keys.py +113 -0
test_mistral.py +51 -0

.env ADDED Viewed

	@@ -0,0 +1,45 @@

+# .env.example — Copie para .env e preencha suas chaves
+# ============================================================================
+# 🔥 CHAVES DE API — OBTENHA EM:
+# ============================================================================
+# MISTRAL (https://console.mistral.ai/)
+# Limite: 60k tokens/mês grátis
+MISTRAL_API_KEY=sua_chave_aqui
+# GOOGLE GEMINI (https://aistudio.google.com/app/apikey)
+# Limite: 1.5M tokens/mês grátis
+GEMINI_API_KEY=sua_chave_aqui
+# GROQ (https://console.groq.com/keys)
+# Limite: ~10k tokens/dia grátis
+GROQ_API_KEY=sua_chave_aqui
+# COHERE (https://dashboard.cohere.com/api-keys)
+# Limite: 1k gerações/mês grátis
+COHERE_API_KEY=sua_chave_aqui
+# TOGETHER AI (https://api.together.xyz/settings/api-keys)
+# Limite: $25 créditos iniciais grátis
+TOGETHER_API_KEY=sua_chave_aqui
+# HUGGING FACE (https://huggingface.co/settings/tokens)
+# Limite: Ilimitado com rate limit
+HF_API_KEY=hf_sua_chave_aqui
+# ============================================================================
+# 🌐 CONFIGURAÇÕES DE SERVIDOR (OPCIONAL)
+# ============================================================================
+API_HOST=0.0.0.0
+API_PORT=7860
+# ============================================================================
+# 📝 NOTAS
+# ============================================================================
+#
+# 1. Copie este arquivo: cp .env.example .env
+# 2. Preencha PELO MENOS Mistral + Gemini (mínimo 2 APIs)
+# 3. Adicione .env ao .gitignore (NUNCA commite chaves!)
+# 4. Para Hugging Face Spaces: adicione chaves em Repository Secrets
+#

RELATORIO_TECNICO_OTIMIZACAO.md ADDED Viewed

	@@ -0,0 +1,44 @@

+# Relatório Técnico: Otimização AKIRA AI para Hugging Face Spaces
+Este documento descreve detalhadamente a transição técnica do sistema AKIRA de uma execução local pesada para uma arquitetura híbrida focada em Cloud, visando a estabilidade no plano Free do Hugging Face (HF).
+## 1. Contexto e Problema
+O projeto AKIRA utilizava o `llama-cpp-python` para rodar modelos GGUF (como TinyLlama) localmente. No entanto:
+- **Build Timeouts**: A compilação nativa do `llama.cpp` no Docker demorava mais de 30 minutos, excedendo os limites do HF Spaces.
+- **Consumo de RAM**: Carregar um modelo na RAM (mesmo 1.1B) em conjunto com o `BART` (Emotion Analyzer) e `BERT` causava instabilidade no limite de 16GB.
+- **Alucinações**: O modelo local excessivamente quantizado apresentava respostas inconsistentes.
+## 2. Solução Implementada: Arquitetura Cloud-First
+A estratégia foi migrar o fallback de "Local Offline" para "Cloud API Fallback".
+### 2.1 Alterações no Dockerfile
+- **Remoção de Compiladores**: Eliminamos `cmake`, `build-essential`, `libopenblas-dev`.
+- **Simplificação do Pip**: Removida a flag `CMAKE_ARGS` e a biblioteca `llama-cpp-python`.
+- **Resultado**: O build agora é instantâneo (apenas instala pacotes binários prontos).
+### 2.2 Reestruturação do `local_llm.py`
+O módulo foi transformado num "Proxy de Emergência":
+- **Variáveis Chave**:
+  - `_hf_client`: Instância do `InferenceClient` da Hugging Face.
+  - `_is_hf_inference_mode`: Flag que indica que o sistema está em modo Cloud.
+- **Fluxo Lógico**:
+  1. O sistema tenta as APIs principais (Groq, Google, etc.).
+  2. Se falharem, o `local_llm.py` é acionado.
+  3. Em vez de abrir um ficheiro `.gguf`, ele faz uma chamada rápida ao modelo `TinyLlama-1.1B-Chat-v1.0` através da API de Inferência Gratuita da Hugging Face.
+  4. Isso garante **zero uso de RAM local** para o LLM e **zero uso de CPU** para inferência.
+### 2.3 Manutenção do Emotion Analyzer
+Apesar da remoção do LLM local, mantivemos as dependências `torch` e `transformers` no `requirements.txt` a pedido do utilizador. Isso permite que o módulo de análise emocional (baseado em BART) continue funcionando localmente, já que é um modelo muito menor e crítico para a persona.
+## 3. Ferramentas Utilizadas
+- **Hugging Face Inference API**: Para o fallback final sem custo de hardware.
+- **Docker (Slim Python)**: Para manter a imagem leve.
+- **Loguru**: Monitorização em tempo real de falhas nas APIs.
+## 4. Benefícios
+- **Escalabilidade**: O bot pode crescer sem medo de exceder a RAM.
+- **Velocidade**: Sem compilações pesadas no deploy.
+- **Estabilidade**: Sem alucinações causadas por falta de recursos locais.
+---
+**Assinado:** Antigravity AI Engineer | Google Deepmind Team

debug_mistral.py ADDED Viewed

	@@ -0,0 +1,56 @@

+import os
+from pathlib import Path
def _read_mistral_key_from_dotenv(env_path):
    """Return the raw ``MISTRAL_API_KEY`` value found in *env_path*.

    Returns ``None`` when the file does not exist or has no such entry.
    The value is whatever follows the first ``=`` on the first matching
    line, with only the line's outer whitespace removed (quotes are kept
    so the caller can report on them).
    """
    if not env_path.exists():
        return None
    with open(env_path, "r", encoding="utf-8") as f:
        for line in f:
            entry = line.strip()
            if entry.startswith("MISTRAL_API_KEY="):
                return entry.split("=", 1)[1]
    return None


def debug_mistral_key():
    """Print diagnostics about the Mistral API key and probe ``/v1/models``.

    The key is taken from the ``MISTRAL_API_KEY`` environment variable, or,
    when that is empty, read directly from ``.env`` in the current working
    directory. The function prints the key length, its first/last four
    characters and the code points of its first ten characters, then issues
    one authenticated GET request and prints the outcome.

    Returns:
        None. All results are reported on stdout. Returns early, before any
        network access, when no key can be found.
    """
    print("--- Debug Detalhado Mistral Key ---")

    # Prefer the process environment.
    key = os.getenv("MISTRAL_API_KEY", "")
    if not key:
        # Fall back to reading .env by hand to see what is actually in it.
        found = _read_mistral_key_from_dotenv(Path(".env"))
        if found is not None:
            key = found
            print("Encontrada no .env via leitura manual.")

    if not key:
        print("❌ Chave não encontrada em lugar nenhum.")
        return

    print(f"Comprimento da chave: {len(key)}")
    print(f"Primeiros 4 caracteres: {key[:4]}")
    print(f"Últimos 4 caracteres: {key[-4:]}")

    # Surface invisible characters or stray whitespace.
    if key != key.strip():
        print("⚠️ A chave tem espaços no início ou fim!")
    print(f"Representação da chave (primeiros 10): {[hex(ord(c)) for c in key[:10]]}")

    # Sanitize the key before using it: drop outer whitespace and any quotes.
    clean_key = key.strip().replace('"', '').replace("'", "")

    # Imported here so the "no key" path above works without requests installed.
    import requests

    # Simple connectivity check: listing models needs only a valid key.
    url = "https://api.mistral.ai/v1/models"
    headers = {"Authorization": f"Bearer {clean_key}"}
    try:
        print("\nTestando listagem de modelos (Endpoint /v1/models)...")
        res = requests.get(url, headers=headers, timeout=10)
        print(f"Status: {res.status_code}")
        if res.status_code == 200:
            models = res.json().get('data', [])
            print(f"✅ Sucesso! Modelos disponíveis: {[m['id'] for m in models[:5]]}")
        else:
            print(f"❌ Falha: {res.text}")
    except Exception as e:
        # Deliberate catch-all: this is a diagnostic script and any failure
        # (network, JSON decoding, unexpected payload shape) is just reported.
        print(f"💥 Erro: {e}")


if __name__ == "__main__":
    debug_mistral_key()

requirements.txt CHANGED Viewed

@@ -39,8 +39,8 @@ huggingface-hub>=0.23.0,<0.27.0
 # Transformers core (BERT, BART, etc.) - MANTIDO A PEDIDO DO UTILIZADOR
 transformers>=4.38.0,<4.50.0
-# 🦙 Llama.cpp Python - REMOVIDO POR INCOMPATIBILIDADE COM BUILD FREE TIER
-# llama-cpp-python>=0.2.56
 # PyTorch - versão estável e compatível - MANTIDO A PEDIDO
 torch>=2.1.0,<2.6.0

 # Transformers core (BERT, BART, etc.) - MANTIDO A PEDIDO DO UTILIZADOR
 transformers>=4.38.0,<4.50.0
+llama-cpp-python>=0.2.56
 # PyTorch - versão estável e compatível - MANTIDO A PEDIDO
 torch>=2.1.0,<2.6.0

test_direct_mistral.py ADDED Viewed

	@@ -0,0 +1,50 @@

+import os
+import requests
+from dotenv import load_dotenv
# Output settings
RESULT_FILE = "mistral_status.txt"


def test_direct_mistral():
    """Send one chat request straight to the Mistral API and log the outcome.

    Loads ``.env`` through ``load_dotenv()``, reads ``MISTRAL_API_KEY`` and
    posts a short prompt to the chat-completions endpoint. Every result
    (missing key, transport failure, non-200 status, malformed body, success)
    is written to ``RESULT_FILE``, which is truncated on each run.

    Returns:
        None. The log file is the only output besides a start banner on stdout.
    """
    print("Iniciando teste direto Mistral...")

    with open(RESULT_FILE, "w", encoding="utf-8") as f:
        f.write("=== STATUS MISTRAL DIRECT ===\n")

        # 1. Load .env
        load_dotenv()
        # Trim whitespace and stray quotes so a sloppy value does not turn
        # into a confusing authentication failure.
        key = (os.getenv("MISTRAL_API_KEY") or "").strip().strip("\"'")

        if not key:
            f.write("❌ MISTRAL_API_KEY não encontrada no .env\n")
            return

        f.write(f"🔑 Chave detectada: {key[:5]}...{key[-5:]}\n")

        # 2. Issue the request
        url = "https://api.mistral.ai/v1/chat/completions"
        headers = {
            "Authorization": f"Bearer {key}",
            "Content-Type": "application/json",
        }
        payload = {
            "model": "mistral-small-latest",
            "messages": [{"role": "user", "content": "Olá, você é a IA Akira? Responda em uma frase curta."}],
            "max_tokens": 100,
        }

        try:
            response = requests.post(url, json=payload, headers=headers, timeout=15)
        except requests.RequestException as e:
            # Only genuine transport problems are reported as connection errors.
            f.write(f"❌ ERRO CONEXÃO: {str(e)}\n")
            return

        if response.status_code != 200:
            f.write(f"❌ ERRO API: Status {response.status_code}\n")
            f.write(f"🔍 DETALHES: {response.text}\n")
            return

        try:
            content = response.json()['choices'][0]['message']['content']
        except (ValueError, KeyError, IndexError, TypeError) as e:
            # A 200 with an unexpected body is a payload problem, not a
            # connectivity one; keep the raw body for inspection.
            f.write(f"❌ ERRO RESPOSTA: formato inesperado ({e!r})\n")
            f.write(f"🔍 DETALHES: {response.text}\n")
            return

        f.write("✅ SUCESSO! Mistral respondeu.\n")
        f.write(f"🤖 RESPOSTA: {content}\n")


if __name__ == "__main__":
    test_direct_mistral()
    print("Teste finalizado.")

test_integration_mistral.py ADDED Viewed

	@@ -0,0 +1,64 @@

+import os
+import sys
+import json
# Add the current working directory to sys.path so the project modules import.
sys.path.append(os.getcwd())

# Try to load the project's config and API modules. Failures are recorded
# rather than raised so run_test() can report them in the log file.
CONFIG_ERROR = ""  # always bound, even when the imports succeed
try:
    from modules.config import load_dotenv, validate_config, logger
    from modules.api import AkiraAPI
    CONFIG_OK = True
except Exception as e:
    # Deliberate catch-all: any import-time failure is reported, not raised.
    CONFIG_OK = False
    CONFIG_ERROR = str(e)

OUTPUT_FILE = "mistral_test_results.txt"


def run_test():
    """Run the AkiraAPI integration check and write a log to ``OUTPUT_FILE``.

    Steps: validate the configuration, instantiate ``AkiraAPI``, send a
    prompt asking for the sentinel ``IA_MISTRAL_ONLINE`` and record which
    provider answered. Mistral is declared working only when the sentinel
    comes back AND the reported provider is Mistral; a sentinel echoed by
    another provider is logged as a warning instead.

    Returns:
        None. All results, including tracebacks, go to ``OUTPUT_FILE``,
        which is truncated on each run.
    """
    with open(OUTPUT_FILE, "w", encoding="utf-8") as f:
        f.write("=== LOG DE TESTE MISTRAL ===\n")

        if not CONFIG_OK:
            f.write(f"❌ Erro ao importar módulos: {CONFIG_ERROR}\n")
            return

        try:
            # 1. Validate configuration
            warnings = validate_config()
            f.write(f"✅ Configuração validada. Avisos: {warnings}\n")

            # 2. Initialise the API
            api = AkiraAPI()
            f.write(f"✅ Provedores ativos: {api.provedores_ativos}\n")

            if 'mistral' not in api.provedores_ativos:
                # Informational only: the request below is still attempted.
                f.write("❌ Mistral não está entre os provedores ativos nos logs da API.\n")

            # 3. Exercise a real request
            prompt = "Responda apenas: 'IA_MISTRAL_ONLINE'. Não diga mais nada."
            f.write(f"🚀 Enviando prompt: {prompt}\n")

            response_data = api.processar_requisicao(prompt, usuario_id="tester_888")

            resposta = response_data.get("resposta", "")
            provedor = response_data.get("provedor", "desconhecido")

            f.write(f"✅ Resposta recebida do provedor: {provedor}\n")
            f.write(f"🤖 RESPOSTA: {resposta}\n")

            # NOTE(review): assumes the "provedor" field uses the same
            # identifiers as api.provedores_ativos (e.g. 'mistral') — confirm
            # against AkiraAPI.
            answered_by_mistral = "mistral" in str(provedor).lower()

            if "IA_MISTRAL_ONLINE" not in resposta:
                f.write("\n⚠️ Resposta recebida, mas não contém a senha esperada. Verifique os logs.")
            elif answered_by_mistral:
                f.write("\n✨ CONCLUSÃO: MISTRAL ESTÁ FUNCIONANDO PERFEITAMENTE!")
            else:
                # The sentinel came back, but from a fallback provider, so it
                # proves nothing about Mistral itself.
                f.write(f"\n⚠️ Senha recebida, mas o provedor que respondeu foi '{provedor}', não o Mistral. Verifique os logs.")

        except Exception as e:
            # Top-level boundary of a diagnostic script: log everything.
            f.write(f"❌ Erro crítico no teste: {str(e)}\n")
            import traceback
            f.write(traceback.format_exc())


if __name__ == "__main__":
    run_test()
    print(f"Teste concluído. Resultado em {OUTPUT_FILE}")

test_keys.py ADDED Viewed

	@@ -0,0 +1,113 @@

+import os
+import requests
+import sys
+from pathlib import Path
+# Tentativa 1: python-dotenv
+try:
+    from dotenv import load_dotenv
+    loaded = load_dotenv()
+    print(f"INFO: python-dotenv carregou .env? {'Sim' if loaded else 'Não (arquivo não encontrado ou erro)'}")
+except ImportError:
+    print("INFO: python-dotenv não instalado. Vou tentar ler .env manualmente.")
# Attempt 2: manual loading (fallback)
def manual_load_env():
    """Load ``KEY=VALUE`` pairs from ``./.env`` into ``os.environ``.

    Blank lines, ``#`` comment lines, lines without ``=`` and lines with an
    empty variable name are skipped. Names and values are trimmed, and one
    pair of matching surrounding quotes is removed from the value. Variables
    that already hold a non-empty value in the process environment are left
    untouched, so the real environment wins over the file.

    Returns:
        True if ``.env`` exists in the current working directory (whether or
        not it set anything), False otherwise.
    """
    env_path = Path(".env")
    if not env_path.exists():
        return False

    print(f"INFO: Carregando {env_path.absolute()} manualmente...")
    # utf-8-sig drops a leading BOM, which would otherwise become part of
    # the first variable name.
    with open(env_path, "r", encoding="utf-8-sig") as f:
        for raw_line in f:
            line = raw_line.strip()
            if not line or line.startswith("#") or "=" not in line:
                continue

            name, value = line.split("=", 1)
            name = name.strip()
            value = value.strip()
            if not name:
                # "=value" has no usable name; setting it would raise.
                continue

            # Remove one pair of matching quotes: KEY="abc" -> abc
            if len(value) >= 2 and value[0] == value[-1] and value[0] in "\"'":
                value = value[1:-1]

            # Only fill in variables that are unset or empty.
            if not os.environ.get(name):
                os.environ[name] = value
    return True


if not os.getenv("MISTRAL_API_KEY"):
    manual_load_env()

print(f"CWD: {os.getcwd()}")
print(f"Arquivos no CWD: {os.listdir('.')}")
def _get_api_key(*names):
    """Return the first usable API key among the environment variables *names*.

    Each candidate is trimmed and has one pair of matching surrounding quotes
    removed. Returns "" when none of the variables holds a non-empty key.
    """
    for name in names:
        value = (os.getenv(name) or "").strip()
        if (value.startswith('"') and value.endswith('"')) or (
            value.startswith("'") and value.endswith("'")
        ):
            value = value[1:-1].strip()
        if value:
            return value
    return ""


def _post_and_report(label, url, payload, headers=None):
    """POST *payload* as JSON to *url* and print a one-line verdict for *label*."""
    try:
        response = requests.post(url, headers=headers, json=payload, timeout=10)
        if response.status_code == 200:
            print(f"✅ {label} OK!")
        else:
            print(f"❌ {label} erro {response.status_code}: {response.text}")
    except Exception as e:
        # Deliberate catch-all: a diagnostic script reports every failure.
        print(f"💥 Erro na requisição {label}: {e}")


def test_mistral():
    """Check that ``MISTRAL_API_KEY`` is accepted by the Mistral chat endpoint.

    Prints the result to stdout. Returns None, and makes no request when no
    key is configured.
    """
    print("\n--- Testando Mistral ---")
    key = _get_api_key("MISTRAL_API_KEY")
    if not key:
        print("❌ MISTRAL_API_KEY não encontrada no ambiente.")
        return

    print(f"Chave encontrada (prefixo): {key[:6]}...")

    url = "https://api.mistral.ai/v1/chat/completions"
    headers = {"Authorization": f"Bearer {key}", "Content-Type": "application/json"}
    payload = {
        "model": "mistral-large-latest",
        "messages": [{"role": "user", "content": "Oi"}],
        "max_tokens": 10,
    }
    _post_and_report("Mistral", url, payload, headers)


def test_gemini():
    """Check that the Gemini key is accepted by the ``generateContent`` endpoint.

    The key comes from ``GEMINI_API_KEY`` or, when that is unset or blank,
    from ``GOOGLE_API_KEY``. It is sent in the ``x-goog-api-key`` header
    rather than the query string, so it cannot appear in the request-error
    messages this script prints. Returns None, and makes no request when no
    key is configured.
    """
    print("\n--- Testando Gemini ---")
    key = _get_api_key("GEMINI_API_KEY", "GOOGLE_API_KEY")
    if not key:
        print("❌ Chave Gemini/Google não encontrada.")
        return

    print(f"Chave encontrada (prefixo): {key[:6]}...")

    # Uses the stable v1 endpoint.
    url = "https://generativelanguage.googleapis.com/v1/models/gemini-2.0-flash:generateContent"
    headers = {"x-goog-api-key": key, "Content-Type": "application/json"}
    payload = {"contents": [{"parts": [{"text": "Oi"}]}]}
    _post_and_report("Gemini", url, payload, headers)


def test_groq():
    """Check that ``GROQ_API_KEY`` is accepted by Groq's chat endpoint.

    Prints the result to stdout. Returns None, and makes no request when no
    key is configured.
    """
    print("\n--- Testando Groq ---")
    key = _get_api_key("GROQ_API_KEY")
    if not key:
        print("❌ GROQ_API_KEY não encontrada.")
        return

    url = "https://api.groq.com/openai/v1/chat/completions"
    headers = {"Authorization": f"Bearer {key}", "Content-Type": "application/json"}
    payload = {
        "model": "llama-3.3-70b-versatile",
        "messages": [{"role": "user", "content": "Oi"}],
        "max_tokens": 10,
    }
    _post_and_report("Groq", url, payload, headers)


if __name__ == "__main__":
    print(f"Python: {sys.version}")
    test_mistral()
    test_gemini()
    test_groq()

test_mistral.py ADDED Viewed

	@@ -0,0 +1,51 @@

+import os
+import requests
+from dotenv import load_dotenv
def test_mistral():
    """Verify the local ``.env`` setup and make one real call to Mistral.

    Steps:
      1. Require ``.env`` in the current working directory and load it.
      2. Require ``MISTRAL_API_KEY`` to be set to something other than the
         template placeholder ``sua_chave_aqui``.
      3. Post a short prompt to the chat-completions endpoint and print the
         reply, or a description of what went wrong.

    Returns:
        None. All results are printed to stdout; the function returns early
        (before any network access) when step 1 or 2 fails.
    """
    print("--- Teste de Ambiente AKIRA ---")

    # 1. Check that .env can be loaded
    dotenv_path = os.path.join(os.getcwd(), ".env")
    if not os.path.exists(dotenv_path):
        print("❌ Arquivo .env NÃO encontrado no diretório atual.")
        return
    load_dotenv(dotenv_path)
    print(f"✅ Arquivo .env encontrado em: {dotenv_path}")

    # Trim so stray whitespace neither defeats the placeholder check nor
    # ends up inside the Authorization header.
    mistral_key = (os.getenv("MISTRAL_API_KEY") or "").strip()
    if not mistral_key or mistral_key == "sua_chave_aqui":
        print("❌ MISTRAL_API_KEY não configurada corretamente no .env")
        return
    print(f"✅ MISTRAL_API_KEY carregada (Início: {mistral_key[:5]}...)")

    # 2. Make a real call to Mistral
    print("\n--- Testando API Mistral ---")
    url = "https://api.mistral.ai/v1/chat/completions"
    headers = {
        "Content-Type": "application/json",
        "Authorization": f"Bearer {mistral_key}",
    }
    data = {
        "model": "mistral-tiny",
        "messages": [{"role": "user", "content": "Oi, você está funcionando? Responda curto."}],
        "max_tokens": 50,
    }

    try:
        response = requests.post(url, headers=headers, json=data, timeout=10)
    except requests.RequestException as e:
        # Only transport-level failures are reported as connection errors.
        print(f"❌ Erro ao conectar com API Mistral: {e}")
        return

    if response.status_code != 200:
        print(f"❌ Erro na API Mistral: Status {response.status_code}")
        print(f"🔍 Detalhes: {response.text}")
        return

    try:
        message = response.json()['choices'][0]['message']['content']
    except (ValueError, KeyError, IndexError, TypeError) as e:
        # A 200 with an unexpected body is a payload problem, not connectivity.
        print(f"❌ Resposta inesperada da API Mistral: {e!r}")
        print(f"🔍 Detalhes: {response.text}")
        return

    print("✅ API Mistral respondendo com sucesso!")
    print(f"💬 Resposta: {message}")


if __name__ == "__main__":
    test_mistral()