|
"""This module should not be used directly as its API is subject to change. Instead, |
|
use the `gr.Blocks.load()` or `gr.Interface.load()` functions.""" |
|
|
|
from __future__ import annotations |
|
|
|
import json |
|
import re |
|
import uuid |
|
import warnings |
|
from copy import deepcopy |
|
from typing import TYPE_CHECKING, Callable, Dict |
|
|
|
import requests |
|
|
|
import gradio |
|
from gradio import components, utils |
|
from gradio.exceptions import TooManyRequestsError |
|
from gradio.external_utils import ( |
|
cols_to_rows, |
|
encode_to_base64, |
|
get_tabular_examples, |
|
get_ws_fn, |
|
postprocess_label, |
|
rows_to_cols, |
|
streamline_spaces_interface, |
|
use_websocket, |
|
) |
|
from gradio.processing_utils import to_binary |
|
|
|
if TYPE_CHECKING: |
|
from gradio.blocks import Blocks |
|
from gradio.interface import Interface |
|
|
|
|
|
def load_blocks_from_repo( |
|
name: str, |
|
src: str | None = None, |
|
api_key: str | None = None, |
|
alias: str | None = None, |
|
**kwargs, |
|
) -> Blocks: |
|
"""Creates and returns a Blocks instance from a Hugging Face model or Space repo.""" |
|
if src is None: |
|
|
|
tokens = name.split("/") |
|
assert ( |
|
len(tokens) > 1 |
|
), "Either `src` parameter must be provided, or `name` must be formatted as {src}/{repo name}" |
|
src = tokens[0] |
|
name = "/".join(tokens[1:]) |
|
|
|
factory_methods: Dict[str, Callable] = { |
|
|
|
"huggingface": from_model, |
|
"models": from_model, |
|
"spaces": from_spaces, |
|
} |
|
assert src.lower() in factory_methods, "parameter: src must be one of {}".format( |
|
factory_methods.keys() |
|
) |
|
|
|
blocks: gradio.Blocks = factory_methods[src](name, api_key, alias, **kwargs) |
|
return blocks |
|
|
|
|
|
def from_model(model_name: str, api_key: str | None, alias: str | None, **kwargs): |
|
model_url = "https://huggingface.co/{}".format(model_name) |
|
api_url = "https://api-inference.huggingface.co/models/{}".format(model_name) |
|
print("Fetching model from: {}".format(model_url)) |
|
|
|
headers = {"Authorization": f"Bearer {api_key}"} if api_key is not None else {} |
|
|
|
|
|
response = requests.request("GET", api_url, headers=headers) |
|
assert ( |
|
response.status_code == 200 |
|
), f"Could not find model: {model_name}. If it is a private or gated model, please provide your Hugging Face access token (https://huggingface.co/settings/tokens) as the argument for the `api_key` parameter." |
|
p = response.json().get("pipeline_tag") |
|
|
|
pipelines = { |
|
"audio-classification": { |
|
|
|
"inputs": components.Audio(source="upload", type="filepath", label="Input"), |
|
"outputs": components.Label(label="Class"), |
|
"preprocess": lambda i: to_binary, |
|
"postprocess": lambda r: postprocess_label( |
|
{i["label"].split(", ")[0]: i["score"] for i in r.json()} |
|
), |
|
}, |
|
"audio-to-audio": { |
|
|
|
"inputs": components.Audio(source="upload", type="filepath", label="Input"), |
|
"outputs": components.Audio(label="Output"), |
|
"preprocess": to_binary, |
|
"postprocess": encode_to_base64, |
|
}, |
|
"automatic-speech-recognition": { |
|
|
|
"inputs": components.Audio(source="upload", type="filepath", label="Input"), |
|
"outputs": components.Textbox(label="Output"), |
|
"preprocess": to_binary, |
|
"postprocess": lambda r: r.json()["text"], |
|
}, |
|
"feature-extraction": { |
|
|
|
"inputs": components.Textbox(label="Input"), |
|
"outputs": components.Dataframe(label="Output"), |
|
"preprocess": lambda x: {"inputs": x}, |
|
"postprocess": lambda r: r.json()[0], |
|
}, |
|
"fill-mask": { |
|
"inputs": components.Textbox(label="Input"), |
|
"outputs": components.Label(label="Classification"), |
|
"preprocess": lambda x: {"inputs": x}, |
|
"postprocess": lambda r: postprocess_label( |
|
{i["token_str"]: i["score"] for i in r.json()} |
|
), |
|
}, |
|
"image-classification": { |
|
|
|
"inputs": components.Image(type="filepath", label="Input Image"), |
|
"outputs": components.Label(label="Classification"), |
|
"preprocess": to_binary, |
|
"postprocess": lambda r: postprocess_label( |
|
{i["label"].split(", ")[0]: i["score"] for i in r.json()} |
|
), |
|
}, |
|
"question-answering": { |
|
|
|
"inputs": [ |
|
components.Textbox(lines=7, label="Context"), |
|
components.Textbox(label="Question"), |
|
], |
|
"outputs": [ |
|
components.Textbox(label="Answer"), |
|
components.Label(label="Score"), |
|
], |
|
"preprocess": lambda c, q: {"inputs": {"context": c, "question": q}}, |
|
"postprocess": lambda r: (r.json()["answer"], {"label": r.json()["score"]}), |
|
}, |
|
"summarization": { |
|
|
|
"inputs": components.Textbox(label="Input"), |
|
"outputs": components.Textbox(label="Summary"), |
|
"preprocess": lambda x: {"inputs": x}, |
|
"postprocess": lambda r: r.json()[0]["summary_text"], |
|
}, |
|
"text-classification": { |
|
|
|
"inputs": components.Textbox(label="Input"), |
|
"outputs": components.Label(label="Classification"), |
|
"preprocess": lambda x: {"inputs": x}, |
|
"postprocess": lambda r: postprocess_label( |
|
{i["label"].split(", ")[0]: i["score"] for i in r.json()[0]} |
|
), |
|
}, |
|
"text-generation": { |
|
|
|
"inputs": components.Textbox(label="Input"), |
|
"outputs": components.Textbox(label="Output"), |
|
"preprocess": lambda x: {"inputs": x}, |
|
"postprocess": lambda r: r.json()[0]["generated_text"], |
|
}, |
|
"text2text-generation": { |
|
|
|
"inputs": components.Textbox(label="Input"), |
|
"outputs": components.Textbox(label="Generated Text"), |
|
"preprocess": lambda x: {"inputs": x}, |
|
"postprocess": lambda r: r.json()[0]["generated_text"], |
|
}, |
|
"translation": { |
|
"inputs": components.Textbox(label="Input"), |
|
"outputs": components.Textbox(label="Translation"), |
|
"preprocess": lambda x: {"inputs": x}, |
|
"postprocess": lambda r: r.json()[0]["translation_text"], |
|
}, |
|
"zero-shot-classification": { |
|
|
|
"inputs": [ |
|
components.Textbox(label="Input"), |
|
components.Textbox(label="Possible class names (" "comma-separated)"), |
|
components.Checkbox(label="Allow multiple true classes"), |
|
], |
|
"outputs": components.Label(label="Classification"), |
|
"preprocess": lambda i, c, m: { |
|
"inputs": i, |
|
"parameters": {"candidate_labels": c, "multi_class": m}, |
|
}, |
|
"postprocess": lambda r: postprocess_label( |
|
{ |
|
r.json()["labels"][i]: r.json()["scores"][i] |
|
for i in range(len(r.json()["labels"])) |
|
} |
|
), |
|
}, |
|
"sentence-similarity": { |
|
|
|
"inputs": [ |
|
components.Textbox( |
|
value="That is a happy person", label="Source Sentence" |
|
), |
|
components.Textbox( |
|
lines=7, |
|
placeholder="Separate each sentence by a newline", |
|
label="Sentences to compare to", |
|
), |
|
], |
|
"outputs": components.Label(label="Classification"), |
|
"preprocess": lambda src, sentences: { |
|
"inputs": { |
|
"source_sentence": src, |
|
"sentences": [s for s in sentences.splitlines() if s != ""], |
|
} |
|
}, |
|
"postprocess": lambda r: postprocess_label( |
|
{f"sentence {i}": v for i, v in enumerate(r.json())} |
|
), |
|
}, |
|
"text-to-speech": { |
|
|
|
"inputs": components.Textbox(label="Input"), |
|
"outputs": components.Audio(label="Audio"), |
|
"preprocess": lambda x: {"inputs": x}, |
|
"postprocess": encode_to_base64, |
|
}, |
|
"text-to-image": { |
|
|
|
"inputs": components.Textbox(label="Input"), |
|
"outputs": components.Image(label="Output"), |
|
"preprocess": lambda x: {"inputs": x}, |
|
"postprocess": encode_to_base64, |
|
}, |
|
"token-classification": { |
|
|
|
"inputs": components.Textbox(label="Input"), |
|
"outputs": components.HighlightedText(label="Output"), |
|
"preprocess": lambda x: {"inputs": x}, |
|
"postprocess": lambda r: r, |
|
}, |
|
} |
|
|
|
if p in ["tabular-classification", "tabular-regression"]: |
|
example_data = get_tabular_examples(model_name) |
|
col_names, example_data = cols_to_rows(example_data) |
|
example_data = [[example_data]] if example_data else None |
|
|
|
pipelines[p] = { |
|
"inputs": components.Dataframe( |
|
label="Input Rows", |
|
type="pandas", |
|
headers=col_names, |
|
col_count=(len(col_names), "fixed"), |
|
), |
|
"outputs": components.Dataframe( |
|
label="Predictions", type="array", headers=["prediction"] |
|
), |
|
"preprocess": rows_to_cols, |
|
"postprocess": lambda r: { |
|
"headers": ["prediction"], |
|
"data": [[pred] for pred in json.loads(r.text)], |
|
}, |
|
"examples": example_data, |
|
} |
|
|
|
if p is None or not (p in pipelines): |
|
raise ValueError("Unsupported pipeline type: {}".format(p)) |
|
|
|
pipeline = pipelines[p] |
|
|
|
def query_huggingface_api(*params): |
|
|
|
data = pipeline["preprocess"](*params) |
|
if isinstance( |
|
data, dict |
|
): |
|
data.update({"options": {"wait_for_model": True}}) |
|
data = json.dumps(data) |
|
response = requests.request("POST", api_url, headers=headers, data=data) |
|
if not (response.status_code == 200): |
|
errors_json = response.json() |
|
errors, warns = "", "" |
|
if errors_json.get("error"): |
|
errors = f", Error: {errors_json.get('error')}" |
|
if errors_json.get("warnings"): |
|
warns = f", Warnings: {errors_json.get('warnings')}" |
|
raise ValueError( |
|
f"Could not complete request to HuggingFace API, Status Code: {response.status_code}" |
|
+ errors |
|
+ warns |
|
) |
|
if ( |
|
p == "token-classification" |
|
): |
|
ner_groups = response.json() |
|
input_string = params[0] |
|
response = utils.format_ner_list(input_string, ner_groups) |
|
output = pipeline["postprocess"](response) |
|
return output |
|
|
|
if alias is None: |
|
query_huggingface_api.__name__ = model_name |
|
else: |
|
query_huggingface_api.__name__ = alias |
|
|
|
interface_info = { |
|
"fn": query_huggingface_api, |
|
"inputs": pipeline["inputs"], |
|
"outputs": pipeline["outputs"], |
|
"title": model_name, |
|
"examples": pipeline.get("examples"), |
|
} |
|
|
|
kwargs = dict(interface_info, **kwargs) |
|
kwargs["_api_mode"] = True |
|
interface = gradio.Interface(**kwargs) |
|
return interface |
|
|
|
|
|
def from_spaces( |
|
space_name: str, api_key: str | None, alias: str | None, **kwargs |
|
) -> Blocks: |
|
space_url = "https://huggingface.co/spaces/{}".format(space_name) |
|
|
|
print("Fetching Space from: {}".format(space_url)) |
|
|
|
headers = {} |
|
if api_key is not None: |
|
headers["Authorization"] = f"Bearer {api_key}" |
|
|
|
iframe_url = ( |
|
requests.get( |
|
f"https://huggingface.co/api/spaces/{space_name}/host", headers=headers |
|
) |
|
.json() |
|
.get("host") |
|
) |
|
|
|
if iframe_url is None: |
|
raise ValueError( |
|
f"Could not find Space: {space_name}. If it is a private or gated Space, please provide your Hugging Face access token (https://huggingface.co/settings/tokens) as the argument for the `api_key` parameter." |
|
) |
|
|
|
r = requests.get(iframe_url, headers=headers) |
|
|
|
result = re.search( |
|
r"window.gradio_config = (.*?);[\s]*</script>", r.text |
|
) |
|
try: |
|
config = json.loads(result.group(1)) |
|
except AttributeError: |
|
raise ValueError("Could not load the Space: {}".format(space_name)) |
|
if "allow_flagging" in config: |
|
return from_spaces_interface( |
|
space_name, config, alias, api_key, iframe_url, **kwargs |
|
) |
|
else: |
|
if kwargs: |
|
warnings.warn( |
|
"You cannot override parameters for this Space by passing in kwargs. " |
|
"Instead, please load the Space as a function and use it to create a " |
|
"Blocks or Interface locally. You may find this Guide helpful: " |
|
"https://gradio.app/using_blocks_like_functions/" |
|
) |
|
return from_spaces_blocks(config, api_key, iframe_url) |
|
|
|
|
|
def from_spaces_blocks(config: Dict, api_key: str | None, iframe_url: str) -> Blocks: |
|
api_url = "{}/api/predict/".format(iframe_url) |
|
|
|
headers = {"Content-Type": "application/json"} |
|
if api_key is not None: |
|
headers["Authorization"] = f"Bearer {api_key}" |
|
ws_url = "{}/queue/join".format(iframe_url).replace("https", "wss") |
|
|
|
ws_fn = get_ws_fn(ws_url, headers) |
|
|
|
fns = [] |
|
for d, dependency in enumerate(config["dependencies"]): |
|
if dependency["backend_fn"]: |
|
|
|
def get_fn(outputs, fn_index, use_ws): |
|
def fn(*data): |
|
data = json.dumps({"data": data, "fn_index": fn_index}) |
|
hash_data = json.dumps( |
|
{"fn_index": fn_index, "session_hash": str(uuid.uuid4())} |
|
) |
|
if use_ws: |
|
result = utils.synchronize_async(ws_fn, data, hash_data) |
|
output = result["data"] |
|
else: |
|
response = requests.post(api_url, headers=headers, data=data) |
|
result = json.loads(response.content.decode("utf-8")) |
|
try: |
|
output = result["data"] |
|
except KeyError: |
|
if "error" in result and "429" in result["error"]: |
|
raise TooManyRequestsError( |
|
"Too many requests to the Hugging Face API" |
|
) |
|
raise KeyError( |
|
f"Could not find 'data' key in response from external Space. Response received: {result}" |
|
) |
|
if len(outputs) == 1: |
|
output = output[0] |
|
return output |
|
|
|
return fn |
|
|
|
fn = get_fn( |
|
deepcopy(dependency["outputs"]), d, use_websocket(config, dependency) |
|
) |
|
fns.append(fn) |
|
else: |
|
fns.append(None) |
|
return gradio.Blocks.from_config(config, fns, iframe_url) |
|
|
|
|
|
def from_spaces_interface( |
|
model_name: str, |
|
config: Dict, |
|
alias: str | None, |
|
api_key: str | None, |
|
iframe_url: str, |
|
**kwargs, |
|
) -> Interface: |
|
|
|
config = streamline_spaces_interface(config) |
|
api_url = "{}/api/predict/".format(iframe_url) |
|
headers = {"Content-Type": "application/json"} |
|
if api_key is not None: |
|
headers["Authorization"] = f"Bearer {api_key}" |
|
|
|
|
|
def fn(*data): |
|
data = json.dumps({"data": data}) |
|
response = requests.post(api_url, headers=headers, data=data) |
|
result = json.loads(response.content.decode("utf-8")) |
|
try: |
|
output = result["data"] |
|
except KeyError: |
|
if "error" in result and "429" in result["error"]: |
|
raise TooManyRequestsError("Too many requests to the Hugging Face API") |
|
raise KeyError( |
|
f"Could not find 'data' key in response from external Space. Response received: {result}" |
|
) |
|
if ( |
|
len(config["outputs"]) == 1 |
|
): |
|
output = output[0] |
|
if len(config["outputs"]) == 1 and isinstance( |
|
output, list |
|
): |
|
output = output[0] |
|
return output |
|
|
|
fn.__name__ = alias if (alias is not None) else model_name |
|
config["fn"] = fn |
|
|
|
kwargs = dict(config, **kwargs) |
|
kwargs["_api_mode"] = True |
|
interface = gradio.Interface(**kwargs) |
|
return interface |
|
|