mirror of
https://github.com/xtekky/gpt4free.git
synced 2025-12-06 02:30:41 -08:00
* Update model configurations, provider implementations, and documentation - Updated model names and aliases for Qwen QVQ 72B and Qwen 2 72B (@TheFirstNoob) - Revised HuggingSpace class configuration, added default_image_model - Added llama-3.2-70b alias for Llama 3.2 70B model in AutonomousAI - Removed BlackboxCreateAgent class - Added gpt-4o alias for Copilot model - Moved api_key to Mhystical class attribute - Added models property with default_model value for Free2GPT - Simplified Jmuz class implementation - Improved image generation and model handling in DeepInfra - Standardized default models and removed aliases in Gemini - Replaced model aliases with direct model list in GlhfChat (@TheFirstNoob) - Removed trailing slash from image generation URL in PollinationsAI (https://github.com/xtekky/gpt4free/issues/2571) - Updated llama and qwen model configurations - Enhanced provider documentation and model details * Removed from (g4f/models.py) 'Yqcloud' provider from Default due to error 'ResponseStatusError: Response 429: 文字过长,请删减后重试。' * Update docs/providers-and-models.md * refactor(g4f/Provider/DDG.py): Add error handling and rate limiting to DDG provider - Add custom exception classes for rate limits, timeouts, and conversation limits - Implement rate limiting with sleep between requests (0.75s minimum delay) - Add model validation method to check supported models - Add proper error handling for API responses with custom exceptions - Improve session cookie handling for conversation persistence - Clean up User-Agent string and remove redundant code - Add proper error propagation through async generator Breaking changes: - New custom exceptions may require updates to error handling code - Rate limiting affects request timing and throughput - Model validation is now stricter Related: - Adds error handling similar to standard API clients - Improves reliability and robustness of chat interactions * Update g4f/models.py g4f/Provider/PollinationsAI.py * Update 
g4f/models.py * Restored provider which was not working and was disabled (g4f/Provider/DeepInfraChat.py) * Fixing a bug with Streaming Completions * Update g4f/Provider/PollinationsAI.py * Update g4f/Provider/Blackbox.py g4f/Provider/DDG.py * Added another model for generating images 'ImageGeneration2' to the 'Blackbox' provider * Update docs/providers-and-models.md * Update g4f/models.py g4f/Provider/Blackbox.py * Added a new OIVSCode provider from the Text Models and Vision (Image Upload) model * Update docs/providers-and-models.md * docs: add Conversation Memory class with context handling requested by @TheFirstNoob * Simplified README.md documentation added new docs/configuration.md documentation * Update add README.md docs/configuration.md * Update README.md * Update docs/providers-and-models.md g4f/models.py g4f/Provider/PollinationsAI.py * Added new model deepseek-r1 to Blackbox provider. @TheFirstNoob * Fixed bugs and updated docs/providers-and-models.md etc/unittest/client.py g4f/models.py g4f/Provider/. --------- Co-authored-by: kqlio67 <> Co-authored-by: H Lohaus <hlohaus@users.noreply.github.com>
206 lines
8.8 KiB
Python
206 lines
8.8 KiB
Python
from __future__ import annotations
|
|
|
|
import time
|
|
from aiohttp import ClientSession, ClientTimeout
|
|
import json
|
|
import asyncio
|
|
import random
|
|
|
|
from ..typing import AsyncResult, Messages, Cookies
|
|
from ..requests.raise_for_status import raise_for_status
|
|
from .base_provider import AsyncGeneratorProvider, ProviderModelMixin
|
|
from .helper import format_prompt
|
|
from ..providers.response import FinishReason, JsonConversation
|
|
|
|
class DuckDuckGoSearchException(Exception):
    """Root of the exception hierarchy used by the DuckDuckGo provider.

    The rate-limit, timeout and conversation-limit exceptions in this module
    all derive from this class, so catching it catches every one of them.
    """
|
|
|
|
class RatelimitException(DuckDuckGoSearchException):
    """Signals that an API request was rejected because a rate limit was hit."""
|
|
|
|
class TimeoutException(DuckDuckGoSearchException):
    """Signals that an API request did not complete within the allowed time."""
|
|
|
|
class ConversationLimitException(DuckDuckGoSearchException):
    """Signals that the AI endpoint reported its conversation limit was reached."""
|
|
|
|
class Conversation(JsonConversation):
    """Per-chat state carried between successive requests of the DDG provider.

    Attributes:
        vqd: Token sent in the ``x-vqd-4`` request header; ``None`` until one
            has been fetched.
        message_history: Messages sent as the ``messages`` field of the chat
            request payload.
        cookies: Cookie name/value pairs reused when the conversation is
            resumed in a new HTTP session.
        model: Model name this conversation was created for.
    """

    vqd: str = None
    message_history: Messages
    cookies: dict

    def __init__(self, model: str):
        """Create an empty conversation bound to ``model``."""
        self.model = model
        # These containers are created per instance on purpose. As class-level
        # ``[]`` / ``{}`` defaults they would be one object shared by every
        # conversation, and the provider appends to ``message_history`` in
        # place, which would leak messages from one chat into all the others.
        self.message_history = []
        self.cookies = {}
|
|
|
|
class DDG(AsyncGeneratorProvider, ProviderModelMixin):
    """Streaming chat provider backed by the DuckDuckGo AI Chat HTTP endpoints.

    A chat needs a VQD token, which is read from the ``x-vqd-4`` response
    header of ``status_url`` and then sent back in the ``x-vqd-4`` request
    header of every POST to ``api_endpoint``. Requests issued through this
    class are spaced at least ``min_request_interval`` seconds apart.
    """

    label = "DuckDuckGo AI Chat"
    url = "https://duckduckgo.com/aichat"
    api_endpoint = "https://duckduckgo.com/duckchat/v1/chat"
    status_url = "https://duckduckgo.com/duckchat/v1/status"

    working = True
    supports_stream = True
    supports_system_message = True
    supports_message_history = True

    default_model = "gpt-4o-mini"
    models = [default_model, "claude-3-haiku-20240307", "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo", "mistralai/Mixtral-8x7B-Instruct-v0.1"]

    # Short names accepted in place of the full model identifiers above.
    model_aliases = {
        "gpt-4": "gpt-4o-mini",
        "claude-3-haiku": "claude-3-haiku-20240307",
        "llama-3.1-70b": "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
        "mixtral-8x7b": "mistralai/Mixtral-8x7B-Instruct-v0.1",
    }

    # Minimum number of seconds between two consecutive requests.
    min_request_interval = 0.75
    # ``time.time()`` of the most recent request; 0 means "no request yet".
    last_request_time = 0

    @classmethod
    def validate_model(cls, model: str) -> str:
        """Resolve ``model`` to one of the supported model identifiers.

        Args:
            model: A full model identifier, one of the keys of
                ``model_aliases``, or an empty value to select
                ``default_model``.

        Returns:
            The full model identifier.

        Raises:
            ValueError: If the resolved name is not listed in ``models``.
        """
        if not model:
            # An empty name means "no preference": use the default model.
            return cls.default_model
        model = cls.model_aliases.get(model, model)
        if model not in cls.models:
            raise ValueError(f"Model {model} not supported. Available models: {cls.models}")
        return model

    @classmethod
    async def sleep(cls):
        """Wait until ``min_request_interval`` has passed since the last request."""
        if cls.last_request_time > 0:
            elapsed = time.time() - cls.last_request_time
            delay = cls.min_request_interval - elapsed
            if delay > 0:
                await asyncio.sleep(delay)
        # Take the timestamp AFTER any wait. Recording the pre-sleep time
        # would make the next caller think more time had passed than really
        # did, shortening the spacing between requests.
        cls.last_request_time = time.time()

    @classmethod
    async def fetch_vqd(cls, session: ClientSession, max_retries: int = 3, proxy: str = None) -> str:
        """Fetch the VQD token required to start a chat, retrying on failure.

        Args:
            session: Open aiohttp session used for the status request.
            max_retries: Maximum number of attempts.
            proxy: Optional proxy URL forwarded to the status request.

        Returns:
            The non-empty value of the ``x-vqd-4`` response header.

        Raises:
            Exception: If no token could be obtained within ``max_retries``
                attempts. The last underlying error is chained as the cause.
        """
        headers = {
            "accept": "text/event-stream",
            "content-type": "application/json",
            "x-vqd-accept": "1",
            "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36"
        }

        for attempt in range(max_retries):
            is_last_attempt = attempt >= max_retries - 1
            try:
                await cls.sleep()
                async with session.get(cls.status_url, headers=headers, proxy=proxy) as response:
                    if response.status == 200:
                        vqd = response.headers.get("x-vqd-4", "")
                        if vqd:
                            return vqd
                    elif response.status == 429 and not is_last_attempt:
                        # Rate limited: back off with a randomized delay that
                        # grows with the attempt number, then try again.
                        await asyncio.sleep(random.uniform(1, 3) * (attempt + 1))
                        continue
                    # Reached for any other status, a 200 without the token
                    # header, or a 429 on the final attempt.
                    response_text = await response.text()
                    raise Exception(f"Failed to fetch VQD token: {response.status} {response_text}")
            except Exception as e:
                if is_last_attempt:
                    raise Exception(f"Failed to fetch VQD token after {max_retries} attempts: {str(e)}") from e
                await asyncio.sleep(random.uniform(1, 3) * (attempt + 1))

        # Only reachable when the loop never ran (max_retries <= 0).
        raise Exception("Failed to fetch VQD token: Maximum retries exceeded")

    @classmethod
    async def create_async_generator(
        cls,
        model: str,
        messages: Messages,
        proxy: str = None,
        timeout: int = 30,
        cookies: Cookies = None,
        conversation: Conversation = None,
        return_conversation: bool = False,
        **kwargs
    ) -> AsyncResult:
        """Send a chat request and stream the response.

        Args:
            model: Model identifier or alias (see ``validate_model``).
            messages: Chat messages. For a new conversation they are flattened
                into one user prompt; for an existing conversation only the
                last message is appended to its history.
            proxy: Optional proxy URL used for all HTTP requests.
            timeout: Total timeout in seconds for the HTTP session.
            cookies: Cookies for the HTTP session. When omitted, the cookies
                stored on ``conversation`` are used.
            conversation: State of an earlier exchange to continue, or
                ``None`` to start a new one.
            return_conversation: If true, the assistant reply, VQD token and
                cookies are stored on the conversation, which is yielded last.

        Yields:
            Text chunks of the reply, then a ``FinishReason`` if any message
            event was seen, then the conversation if ``return_conversation``.

        Raises:
            ValueError: If ``model`` is not supported.
            RatelimitException: The stream reported an error with status 429.
            ConversationLimitException: The stream reported
                ``ERR_CONVERSATION_LIMIT`` with status 429.
            TimeoutException: The request timed out.
            DuckDuckGoSearchException: Any other failure.
        """
        model = cls.validate_model(model)

        if cookies is None and conversation is not None:
            cookies = conversation.cookies

        try:
            async with ClientSession(timeout=ClientTimeout(total=timeout), cookies=cookies) as session:
                if conversation is None:
                    conversation = Conversation(model)
                    conversation.vqd = await cls.fetch_vqd(session, proxy=proxy)
                    conversation.message_history = [{"role": "user", "content": format_prompt(messages)}]
                else:
                    conversation.message_history.append(messages[-1])

                headers = {
                    "accept": "text/event-stream",
                    "content-type": "application/json",
                    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36",
                    "x-vqd-4": conversation.vqd,
                }

                data = {
                    "model": model,
                    "messages": conversation.message_history,
                }

                await cls.sleep()
                async with session.post(cls.api_endpoint, json=data, headers=headers, proxy=proxy) as response:
                    await raise_for_status(response)
                    reason = None
                    chunks = []

                    async for line in response.content:
                        line = line.decode("utf-8").strip()
                        if not line.startswith("data:"):
                            continue
                        try:
                            message = json.loads(line[5:].strip())
                        except json.JSONDecodeError:
                            # Payloads that are not JSON are skipped.
                            continue
                        if not isinstance(message, dict):
                            # Valid JSON that is not an object has no fields
                            # to inspect.
                            continue

                        if message.get("action") == "error":
                            error_type = message.get("type", "")
                            if message.get("status") == 429:
                                if error_type == "ERR_CONVERSATION_LIMIT":
                                    raise ConversationLimitException(error_type)
                                raise RatelimitException(error_type)
                            raise DuckDuckGoSearchException(error_type)

                        if "message" in message:
                            if message["message"]:
                                yield message["message"]
                                chunks.append(message["message"])
                                # Stays "length" unless an empty message event
                                # later marks the reply as complete.
                                reason = "length"
                            else:
                                reason = "stop"

                    if return_conversation:
                        conversation.message_history.append({"role": "assistant", "content": "".join(chunks)})
                        conversation.vqd = response.headers.get("x-vqd-4", conversation.vqd)
                        conversation.cookies = {
                            n: c.value
                            for n, c in session.cookie_jar.filter_cookies(cls.url).items()
                        }

                    if reason is not None:
                        yield FinishReason(reason)

                    if return_conversation:
                        yield conversation

        except DuckDuckGoSearchException:
            # Already one of this module's exceptions. Re-raise untouched so
            # the specific subclass (rate limit, conversation limit, timeout)
            # reaches the caller and the message is not wrapped a second time.
            raise
        except asyncio.TimeoutError as e:
            raise TimeoutException(f"Request timed out: {str(e)}") from e
        except Exception as e:
            # NOTE(review): substring heuristic kept for backward
            # compatibility; it also matches unrelated messages that merely
            # contain "time".
            if "time" in str(e).lower():
                raise TimeoutException(f"Request timed out: {str(e)}") from e
            raise DuckDuckGoSearchException(f"Request failed: {str(e)}") from e
|