Hugging Face Inference API
Run ML models via the Hugging Face Inference API for text generation, classification, and embeddings.
import os

import httpx
from typing import Any

HF_TOKEN = os.environ["HF_TOKEN"]  # hf_... token, read from the environment
API_URL = "https://api-inference.huggingface.co/models"

async def hf_inference(
    model: str,
    inputs: str | list[str],
    parameters: dict[str, Any] | None = None,
) -> Any:
    async with httpx.AsyncClient() as client:
        response = await client.post(
            f"{API_URL}/{model}",
            headers={"Authorization": f"Bearer {HF_TOKEN}"},
            json={
                "inputs": inputs,
                **({"parameters": parameters} if parameters else {}),
            },
            timeout=30.0,
        )
        response.raise_for_status()
        return response.json()
# Text generation
# result = await hf_inference(
#     "mistralai/Mistral-7B-Instruct-v0.2",
#     "Explain quantum computing in one sentence.",
#     {"max_new_tokens": 100, "temperature": 0.7},
# )
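For text-generation models the API typically returns a list of objects with a `generated_text` field. A small helper (a sketch, assuming that response shape) pulls out the first completion instead of indexing inline:

```python
from typing import Any

def first_generated_text(result: Any) -> str:
    # Text-generation responses look like [{"generated_text": "..."}].
    if isinstance(result, list) and result and "generated_text" in result[0]:
        return result[0]["generated_text"]
    raise ValueError(f"unexpected response shape: {result!r}")

# Example against a canned payload:
sample = [{"generated_text": "Quantum computing uses qubits."}]
print(first_generated_text(sample))  # Quantum computing uses qubits.
```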
# Sentiment analysis
# result = await hf_inference(
#     "distilbert-base-uncased-finetuned-sst-2-english",
#     "I love this product!",
# )
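The same endpoint also serves feature-extraction models for the document-embeddings use case below. The model name here is one common sentence-transformers checkpoint (an assumption, not prescribed by this snippet), and the cosine-similarity helper is a plain stdlib sketch for comparing the returned vectors:

```python
import math

def cosine_similarity(a: list[float], b: list[float]) -> float:
    # Cosine similarity between two embedding vectors.
    dot = sum(x * y for x, y in zip(a, b))
    norm = math.sqrt(sum(x * x for x in a)) * math.sqrt(sum(x * x for x in b))
    return dot / norm

# Document embeddings (feature-extraction task; model name is an assumption):
# vectors = await hf_inference(
#     "sentence-transformers/all-MiniLM-L6-v2",
#     ["first document", "second document"],
# )
# score = cosine_similarity(vectors[0], vectors[1])

print(cosine_similarity([1.0, 0.0], [1.0, 0.0]))  # 1.0
```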
Use Cases
- Text classification
- Sentiment analysis
- Document embeddings