gradio/client/python/gradio_client/utils.py

255 lines
7.0 KiB
Python
Raw Normal View History

from __future__ import annotations
import base64
import json
import mimetypes
import os
import pkgutil
import shutil
import tempfile
from pathlib import Path
from typing import Any, Callable, Dict, Tuple
import fsspec.asyn
import requests
from websockets.legacy.protocol import WebSocketCommonProtocol
API_URL = "{}/api/predict/"
WS_URL = "{}/queue/join"
__version__ = (pkgutil.get_data(__name__, "version.txt") or b"").decode("ascii").strip()
class TooManyRequestsError(Exception):
"""Raised when the API returns a 429 status code."""
pass
class QueueError(Exception):
"""Raised when the queue is full or there is an issue adding a job to the queue."""
pass
class InvalidAPIEndpointError(Exception):
"""Raised when the API endpoint is invalid."""
pass
########################
# Network utils
########################
def is_valid_url(possible_url: str) -> bool:
headers = {"User-Agent": "gradio (https://gradio.app/; team@gradio.app)"}
try:
head_request = requests.head(possible_url, headers=headers)
if head_request.status_code == 405:
return requests.get(possible_url, headers=headers).ok
return head_request.ok
except Exception:
return False
async def get_pred_from_ws(
websocket: WebSocketCommonProtocol, data: str, hash_data: str
) -> Dict[str, Any]:
completed = False
resp = {}
while not completed:
msg = await websocket.recv()
resp = json.loads(msg)
if resp["msg"] == "queue_full":
raise QueueError("Queue is full! Please try again.")
if resp["msg"] == "send_hash":
await websocket.send(hash_data)
elif resp["msg"] == "send_data":
await websocket.send(data)
completed = resp["msg"] == "process_completed"
return resp["output"]
########################
# Data processing utils
########################
def download_tmp_copy_of_file(
url_path: str, hf_token: str | None = None, dir: str | None = None
) -> tempfile._TemporaryFileWrapper:
if dir is not None:
os.makedirs(dir, exist_ok=True)
headers = {"Authorization": "Bearer " + hf_token} if hf_token else {}
prefix = Path(url_path).stem
suffix = Path(url_path).suffix
file_obj = tempfile.NamedTemporaryFile(
delete=False,
prefix=prefix,
suffix=suffix,
dir=dir,
)
with requests.get(url_path, headers=headers, stream=True) as r:
with open(file_obj.name, "wb") as f:
shutil.copyfileobj(r.raw, f)
return file_obj
def create_tmp_copy_of_file(
file_path: str, dir: str | None = None
) -> tempfile._TemporaryFileWrapper:
if dir is not None:
os.makedirs(dir, exist_ok=True)
prefix = Path(file_path).stem
suffix = Path(file_path).suffix
file_obj = tempfile.NamedTemporaryFile(
delete=False,
prefix=prefix,
suffix=suffix,
dir=dir,
)
shutil.copy2(file_path, file_obj.name)
return file_obj
def get_mimetype(filename: str) -> str | None:
mimetype = mimetypes.guess_type(filename)[0]
if mimetype is not None:
mimetype = mimetype.replace("x-wav", "wav").replace("x-flac", "flac")
return mimetype
def get_extension(encoding: str) -> str | None:
encoding = encoding.replace("audio/wav", "audio/x-wav")
type = mimetypes.guess_type(encoding)[0]
if type == "audio/flac": # flac is not supported by mimetypes
return "flac"
elif type is None:
return None
extension = mimetypes.guess_extension(type)
if extension is not None and extension.startswith("."):
extension = extension[1:]
return extension
def encode_file_to_base64(f):
with open(f, "rb") as file:
encoded_string = base64.b64encode(file.read())
base64_str = str(encoded_string, "utf-8")
mimetype = get_mimetype(f)
return (
"data:"
+ (mimetype if mimetype is not None else "")
+ ";base64,"
+ base64_str
)
def encode_url_to_base64(url):
encoded_string = base64.b64encode(requests.get(url).content)
base64_str = str(encoded_string, "utf-8")
mimetype = get_mimetype(url)
return (
"data:" + (mimetype if mimetype is not None else "") + ";base64," + base64_str
)
def encode_url_or_file_to_base64(path: str | Path):
path = str(path)
if is_valid_url(path):
return encode_url_to_base64(path)
else:
return encode_file_to_base64(path)
def decode_base64_to_binary(encoding) -> Tuple[bytes, str | None]:
extension = get_extension(encoding)
try:
data = encoding.split(",")[1]
except IndexError:
data = ""
return base64.b64decode(data), extension
def strip_invalid_filename_characters(filename: str, max_bytes: int = 200) -> str:
"""Strips invalid characters from a filename and ensures that the file_length is less than `max_bytes` bytes."""
filename = "".join([char for char in filename if char.isalnum() or char in "._- "])
filename_len = len(filename.encode())
if filename_len > max_bytes:
while filename_len > max_bytes:
if len(filename) == 0:
break
filename = filename[:-1]
filename_len = len(filename.encode())
return filename
def decode_base64_to_file(encoding, file_path=None, dir=None, prefix=None):
if dir is not None:
os.makedirs(dir, exist_ok=True)
data, extension = decode_base64_to_binary(encoding)
if file_path is not None and prefix is None:
filename = Path(file_path).name
prefix = filename
if "." in filename:
prefix = filename[0 : filename.index(".")]
extension = filename[filename.index(".") + 1 :]
if prefix is not None:
prefix = strip_invalid_filename_characters(prefix)
if extension is None:
file_obj = tempfile.NamedTemporaryFile(delete=False, prefix=prefix, dir=dir)
else:
file_obj = tempfile.NamedTemporaryFile(
delete=False,
prefix=prefix,
suffix="." + extension,
dir=dir,
)
file_obj.write(data)
file_obj.flush()
return file_obj
def dict_or_str_to_json_file(jsn, dir=None):
if dir is not None:
os.makedirs(dir, exist_ok=True)
file_obj = tempfile.NamedTemporaryFile(
delete=False, suffix=".json", dir=dir, mode="w+"
)
if isinstance(jsn, str):
jsn = json.loads(jsn)
json.dump(jsn, file_obj)
file_obj.flush()
return file_obj
def file_to_json(file_path: str | Path) -> Dict:
with open(file_path) as f:
return json.load(f)
########################
# Misc utils
########################
def synchronize_async(func: Callable, *args, **kwargs) -> Any:
"""
Runs async functions in sync scopes. Can be used in any scope.
Example:
if inspect.iscoroutinefunction(block_fn.fn):
predictions = utils.synchronize_async(block_fn.fn, *processed_input)
Args:
func:
*args:
**kwargs:
"""
return fsspec.asyn.sync(fsspec.asyn.get_loop(), func, *args, **kwargs) # type: ignore