gpt4free/g4f/providers/response.py
hlohaus e83282fc4b feat: add EdgeTTS audio provider and global image→media refactor
- **Docs**
  - `docs/file.md`: update upload instructions to use inline `bucket` content parts instead of `tool_calls/bucket_tool`.
  - `docs/media.md`: add asynchronous audio transcription example, detailed explanation, and notes.

- **New audio provider**
  - Add `g4f/Provider/audio/EdgeTTS.py` implementing Edge Text‑to‑Speech (`EdgeTTS`).
  - Create `g4f/Provider/audio/__init__.py` for provider export.
  - Register provider in `g4f/Provider/__init__.py`.

- **Refactor image → media**
  - Introduce `generated_media/` directory and `get_media_dir()` helper in `g4f/image/copy_images.py`; add `ensure_media_dir()`; keep back‑compat with legacy `generated_images/`.
  - Replace `images_dir` references with `get_media_dir()` across:
    - `g4f/api/__init__.py`
    - `g4f/client/stubs.py`
    - `g4f/gui/server/api.py`
    - `g4f/gui/server/backend_api.py`
    - `g4f/image/copy_images.py`
  - Rename CLI/API config field/flag from `image_provider` to `media_provider` (`g4f/cli.py`, `g4f/api/__init__.py`, `g4f/client/__init__.py`).
  - Extend `g4f/image/__init__.py`
    - add `MEDIA_TYPE_MAP`, `get_extension()`
    - revise `is_allowed_extension()`, `to_input_audio()` to support wider media types.

- **Provider adjustments**
  - `g4f/Provider/ARTA.py`: swap `raise_error()` parameter order.
  - `g4f/Provider/Cloudflare.py`: drop unused `MissingRequirementsError` import; move `get_args_from_nodriver()` inside try; handle `FileNotFoundError`.

- **Core enhancements**
  - `g4f/providers/any_provider.py`: use `default_model` instead of literal `"default"`; broaden model/provider matching; update model list cleanup.
  - `g4f/models.py`: safeguard provider count logic when model name is falsy.
  - `g4f/providers/base_provider.py`: catch `json.JSONDecodeError` when reading auth cache, delete corrupted file.
  - `g4f/providers/response.py`: allow `AudioResponse` to accept extra kwargs.

- **Misc**
  - Remove obsolete `g4f/image.py`.
  - `g4f/Provider/Cloudflare.py`, `g4f/client/types.py`: minor whitespace and import tidy‑ups.
2025-04-19 03:20:57 +02:00

366 lines
11 KiB
Python

from __future__ import annotations
import re
import base64
from typing import Union, Dict, List, Optional
from abc import abstractmethod
from urllib.parse import quote_plus, unquote_plus
def quote_url(url: str) -> str:
"""
Quote parts of a URL while preserving the domain structure.
Args:
url: The URL to quote
Returns:
str: The properly quoted URL
"""
# Only unquote if needed to avoid double-unquoting
if '%' in url:
url = unquote_plus(url)
url_parts = url.split("//", maxsplit=1)
# If there is no "//" in the URL, then it is a relative URL
if len(url_parts) == 1:
return quote_plus(url_parts[0], '/?&=#')
protocol, rest = url_parts
domain_parts = rest.split("/", maxsplit=1)
# If there is no "/" after the domain, then it is a domain URL
if len(domain_parts) == 1:
return f"{protocol}//{domain_parts[0]}"
domain, path = domain_parts
return f"{protocol}//{domain}/{quote_plus(path, '/?&=#')}"
def quote_title(title: str) -> str:
"""
Normalize whitespace in a title.
Args:
title: The title to normalize
Returns:
str: The title with normalized whitespace
"""
return " ".join(title.split()) if title else ""
def format_link(url: str, title: Optional[str] = None) -> str:
"""
Format a URL and title as a markdown link.
Args:
url: The URL to link to
title: The title to display. If None, extracts from URL
Returns:
str: The formatted markdown link
"""
if title is None:
try:
title = unquote_plus(url.split("//", maxsplit=1)[1].split("?")[0].replace("www.", ""))
except IndexError:
title = url
return f"[{quote_title(title)}]({quote_url(url)})"
def format_image(image: str, alt: str, preview: Optional[str] = None) -> str:
"""
Formats the given image as a markdown string.
Args:
image: The image to format.
alt: The alt text for the image.
preview: The preview URL format. Defaults to the original image.
Returns:
str: The formatted markdown string.
"""
preview_url = preview.replace('{image}', image) if preview else image
return f"[![{quote_title(alt)}]({quote_url(preview_url)})]({quote_url(image)})"
def format_images_markdown(images: Union[str, List[str]], alt: str,
preview: Union[str, List[str]] = None) -> str:
"""
Formats the given images as a markdown string.
Args:
images: The image or list of images to format.
alt: The alt text for the images.
preview: The preview URL format or list of preview URLs.
If not provided, original images are used.
Returns:
str: The formatted markdown string.
"""
if isinstance(images, list) and len(images) == 1:
images = images[0]
if isinstance(images, str):
result = format_image(images, alt, preview)
else:
result = "\n".join(
format_image(
image,
f"#{idx+1} {alt}",
preview[idx] if isinstance(preview, list) and idx < len(preview) else preview
)
for idx, image in enumerate(images)
)
start_flag = "<!-- generated images start -->\n"
end_flag = "<!-- generated images end -->\n"
return f"\n{start_flag}{result}\n{end_flag}\n"
class ResponseType:
@abstractmethod
def __str__(self) -> str:
"""Convert the response to a string representation."""
raise NotImplementedError
class JsonMixin:
def __init__(self, **kwargs) -> None:
"""Initialize with keyword arguments as attributes."""
for key, value in kwargs.items():
setattr(self, key, value)
def get_dict(self) -> Dict:
"""Return a dictionary of non-private attributes."""
return {
key: value
for key, value in self.__dict__.items()
if not key.startswith("__")
}
def reset(self) -> None:
"""Reset all attributes."""
self.__dict__ = {}
class RawResponse(ResponseType, JsonMixin):
pass
class HiddenResponse(ResponseType):
def __str__(self) -> str:
"""Hidden responses return an empty string."""
return ""
class FinishReason(JsonMixin, HiddenResponse):
def __init__(self, reason: str) -> None:
"""Initialize with a reason."""
self.reason = reason
class ToolCalls(HiddenResponse):
def __init__(self, list: List) -> None:
"""Initialize with a list of tool calls."""
self.list = list
def get_list(self) -> List:
"""Return the list of tool calls."""
return self.list
class Usage(JsonMixin, HiddenResponse):
pass
class AuthResult(JsonMixin, HiddenResponse):
pass
class TitleGeneration(HiddenResponse):
def __init__(self, title: str) -> None:
"""Initialize with a title."""
self.title = title
class DebugResponse(HiddenResponse):
def __init__(self, log: str) -> None:
"""Initialize with a log message."""
self.log = log
class Reasoning(ResponseType):
def __init__(
self,
token: Optional[str] = None,
label: Optional[str] = None,
status: Optional[str] = None,
is_thinking: Optional[str] = None
) -> None:
"""Initialize with token, status, and thinking state."""
self.token = token
self.label = label
self.status = status
self.is_thinking = is_thinking
def __str__(self) -> str:
"""Return string representation based on available attributes."""
if self.is_thinking is not None:
return self.is_thinking
if self.token is not None:
return self.token
if self.status is not None:
if self.label is not None:
return f"{self.label}: {self.status}\n"
return f"{self.status}\n"
return ""
def __eq__(self, other: Reasoning):
return (self.token == other.token and
self.status == other.status and
self.is_thinking == other.is_thinking)
def get_dict(self) -> Dict:
"""Return a dictionary representation of the reasoning."""
if self.label is not None:
return {"label": self.label, "status": self.status}
if self.is_thinking is None:
if self.status is None:
return {"token": self.token}
return {"token": self.token, "status": self.status}
return {"token": self.token, "status": self.status, "is_thinking": self.is_thinking}
class Sources(ResponseType):
def __init__(self, sources: List[Dict[str, str]]) -> None:
"""Initialize with a list of source dictionaries."""
self.list = []
for source in sources:
self.add_source(source)
def add_source(self, source: Union[Dict[str, str], str]) -> None:
"""Add a source to the list, cleaning the URL if necessary."""
source = source if isinstance(source, dict) else {"url": source}
url = source.get("url", source.get("link", None))
if url is not None:
url = re.sub(r"[&?]utm_source=.+", "", url)
source["url"] = url
self.list.append(source)
def __str__(self) -> str:
"""Return formatted sources as a string."""
if not self.list:
return ""
return "\n\n\n\n" + ("\n>\n".join([
f"> [{idx}] {format_link(link['url'], link.get('title', None))}"
for idx, link in enumerate(self.list)
]))
class SourceLink(ResponseType):
def __init__(self, title: str, url: str) -> None:
self.title = title
self.url = url
def __str__(self) -> str:
title = f"[{self.title}]"
return f" {format_link(self.url, title)}"
class YouTube(HiddenResponse):
def __init__(self, ids: List[str]) -> None:
"""Initialize with a list of YouTube IDs."""
self.ids = ids
def to_string(self) -> str:
"""Return YouTube embeds as a string."""
if not self.ids:
return ""
return "\n\n" + ("\n".join([
f'<iframe type="text/html" src="https://www.youtube.com/embed/{id}"></iframe>'
for id in self.ids
]))
class AudioResponse(ResponseType):
def __init__(self, data: Union[bytes, str], **kwargs) -> None:
"""Initialize with audio data bytes."""
self.data = data
self.options = kwargs
def to_uri(self) -> str:
if isinstance(self.data, str):
return self.data
"""Return audio data as a base64-encoded data URI."""
data_base64 = base64.b64encode(self.data).decode()
return f"data:audio/mpeg;base64,{data_base64}"
def __str__(self) -> str:
"""Return audio as html element."""
return f'<audio controls src="{self.to_uri()}"></audio>'
class BaseConversation(ResponseType):
def __str__(self) -> str:
"""Return an empty string by default."""
return ""
class JsonConversation(BaseConversation, JsonMixin):
pass
class SynthesizeData(HiddenResponse, JsonMixin):
def __init__(self, provider: str, data: Dict) -> None:
"""Initialize with provider and data."""
self.provider = provider
self.data = data
class SuggestedFollowups(HiddenResponse):
def __init__(self, suggestions: list[str]):
self.suggestions = suggestions
class RequestLogin(HiddenResponse):
def __init__(self, label: str, login_url: str) -> None:
"""Initialize with label and login URL."""
self.label = label
self.login_url = login_url
def to_string(self) -> str:
"""Return formatted login link as a string."""
return format_link(self.login_url, f"[Login to {self.label}]") + "\n\n"
class MediaResponse(ResponseType):
def __init__(
self,
urls: Union[str, List[str]],
alt: str,
options: Dict = {},
**kwargs
) -> None:
"""Initialize with images, alt text, and options."""
self.urls = kwargs.get("images", urls)
self.alt = alt
self.options = options
def get(self, key: str) -> any:
"""Get an option value by key."""
return self.options.get(key)
def get_list(self) -> List[str]:
"""Return images as a list."""
return [self.urls] if isinstance(self.urls, str) else self.urls
class ImageResponse(MediaResponse):
def __str__(self) -> str:
"""Return images as markdown."""
return format_images_markdown(self.urls, self.alt, self.get("preview"))
class VideoResponse(MediaResponse):
def __str__(self) -> str:
"""Return videos as html elements."""
return "\n".join([f'<video controls src="{video}"></video>' for video in self.get_list()])
class ImagePreview(ImageResponse):
def __str__(self) -> str:
"""Return an empty string for preview."""
return ""
def to_string(self) -> str:
"""Return images as markdown."""
return super().__str__()
class PreviewResponse(HiddenResponse):
def __init__(self, data: str) -> None:
"""Initialize with data."""
self.data = data
def to_string(self) -> str:
"""Return data as a string."""
return self.data
class Parameters(ResponseType, JsonMixin):
def __str__(self) -> str:
"""Return an empty string."""
return ""
class ProviderInfo(JsonMixin, HiddenResponse):
pass