
Module: hf_inference_client_workflow

Hugging Face Inference Client Workflow

This workflow uses the Hugging Face Inference Client library to run models hosted on the Hugging Face Hub.

Supported Tasks

  • "text_generation"
  • "text_classification"
  • "token_classification"
  • "summarization"

Example Classification Inference

from infernet_ml.utils.hf_types import HFClassificationInferenceInput
from infernet_ml.workflows.inference.hf_inference_client_workflow import (
    HFInferenceClientWorkflow,
)


def main():
    # Initialize the workflow
    workflow = HFInferenceClientWorkflow().setup()

    # Run the inference

    output_data = workflow.inference(
        HFClassificationInferenceInput(
            text="Decentralizing AI using crypto is awesome!",
        )
    )

    print(output_data)


if __name__ == "__main__":
    main()

Outputs:

{'output': [TextClassificationOutputElement(label='POSITIVE', score=0.9997395873069763), TextClassificationOutputElement(label='NEGATIVE', score=0.00026040704688057303)]}
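The client response is wrapped under the "output" key; based on the output above, the top-scoring label can be read back like so:

# Pick the highest-scoring label from the wrapped response.
top = max(output_data["output"], key=lambda element: element.score)
print(top.label, top.score)  # e.g. POSITIVE 0.9997...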

Example Text Generation Inference

from infernet_ml.utils.hf_types import HFTextGenerationInferenceInput
from infernet_ml.workflows.inference.hf_inference_client_workflow import (
    HFInferenceClientWorkflow,
)


def main():
    # Initialize the workflow
    workflow = HFInferenceClientWorkflow().setup()

    # Run the inference

    output_data = workflow.inference(
        HFTextGenerationInferenceInput(
            prompt="Decentralizing AI using crypto is awesome!",
        )
    )

    print(output_data)


if __name__ == "__main__":
    main()

Outputs:

{'output': '\n\nDecentralized AI is the future of AI. It will enable the creation of more'}
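Generation can be tuned through extra fields on the input model. A minimal sketch, assuming HFTextGenerationInferenceInput mirrors InferenceClient.text_generation parameters such as max_new_tokens and temperature (verify the exact field names in infernet_ml.utils.hf_types):

from infernet_ml.utils.hf_types import HFTextGenerationInferenceInput
from infernet_ml.workflows.inference.hf_inference_client_workflow import (
    HFInferenceClientWorkflow,
)

workflow = HFInferenceClientWorkflow().setup()

# max_new_tokens and temperature are assumed field names mirroring
# InferenceClient.text_generation; check hf_types before relying on them.
output_data = workflow.inference(
    HFTextGenerationInferenceInput(
        prompt="Decentralizing AI using crypto is awesome!",
        max_new_tokens=64,
        temperature=0.7,
    )
)
print(output_data)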

Example Summarization Inference

from infernet_ml.workflows.inference.hf_inference_client_workflow import (
    HFInferenceClientWorkflow,
)
from infernet_ml.utils.hf_types import (
    HFSummarizationInferenceInput,
    HFSummarizationConfig,
)


def main():
    # Initialize the workflow
    workflow = HFInferenceClientWorkflow().setup()

    # Run the inference

    min_length_tokens = 28
    max_length_tokens = 56
    summarization_config = HFSummarizationConfig(
        min_length=min_length_tokens,
        max_length=max_length_tokens,
    )
    input_text = "Artificial Intelligence has the capacity to positively "
    "impact humanity but the infrastructure in which it is being"
    "developed is not yet ready for the future. Decentralizing AI using "
    "crypto is awesome!"

    input_data = HFSummarizationInferenceInput(
        text=input_text,
        parameters=summarization_config,
    )
    output_data = workflow.inference(input_data)

    print(output_data)


if __name__ == "__main__":
    main()

Outputs:

{'output': SummarizationOutput(summary_text=' Artificial Intelligence has the capacity to positively impact artificial intelligence, says AI expert . Artificial Intelligence can be positively beneficial to society, he says .')}

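Example Token Classification Inference

Token classification follows the same pattern. A minimal sketch, assuming HFTokenClassificationInferenceInput takes a text field like its classification counterpart:

from infernet_ml.utils.hf_types import HFTokenClassificationInferenceInput
from infernet_ml.workflows.inference.hf_inference_client_workflow import (
    HFInferenceClientWorkflow,
)


def main():
    # Initialize the workflow
    workflow = HFInferenceClientWorkflow().setup()

    # Run the inference; the `text` field is assumed to mirror
    # HFClassificationInferenceInput.
    output_data = workflow.inference(
        HFTokenClassificationInferenceInput(
            text="Decentralizing AI using crypto is awesome!",
        )
    )

    print(output_data)


if __name__ == "__main__":
    main()

Outputs a dict of the form {'output': [TokenClassificationOutputElement(...), ...]}, with one element per entity recognized in the input text.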

Input Formats

The input is an instance of the HFInferenceClientInput Pydantic model, via one of four task-specific subclasses (recapped in the sketch after this list):

  1. HFClassificationInferenceInput
  2. HFTokenClassificationInferenceInput
  3. HFTextGenerationInferenceInput
  4. HFSummarizationInferenceInput
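All four appear in the examples above; as a compact recap (field names taken from those examples, with the token-classification text field an assumption mirroring the classification input):

from infernet_ml.utils.hf_types import (
    HFClassificationInferenceInput,
    HFSummarizationConfig,
    HFSummarizationInferenceInput,
    HFTextGenerationInferenceInput,
    HFTokenClassificationInferenceInput,
)

# Each subclass binds the request to one supported task:
classification = HFClassificationInferenceInput(text="...")   # "text_classification"
tokens = HFTokenClassificationInferenceInput(text="...")      # "token_classification"
generation = HFTextGenerationInferenceInput(prompt="...")     # "text_generation"
summary = HFSummarizationInferenceInput(
    text="...",
    parameters=HFSummarizationConfig(min_length=28, max_length=56),
)                                                             # "summarization"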

HFInferenceClientWorkflow

Bases: BaseInferenceWorkflow

Inference workflow for models available through Huggingface Hub.

Source code in src/infernet_ml/workflows/inference/hf_inference_client_workflow.py
class HFInferenceClientWorkflow(BaseInferenceWorkflow):
    """
    Inference workflow for models available through Huggingface Hub.
    """

    def __init__(
        self,
        token: Optional[str] = None,
        *args: Any,
        **kwargs: Any,
    ) -> None:
        """
        Initialize the Huggingface Inference Workflow object

        Args:
            token (Optional[str]): API token for the inference client.
                Defaults to None.

        """
        self.token = token
        super().__init__(*args, **kwargs)

    def setup(self) -> "HFInferenceClientWorkflow":
        """
        Setup the inference client. Overriding the base class setup method to add
        typing annotations
        """
        return cast(HFInferenceClientWorkflow, super().setup())

    def do_setup(self) -> "HFInferenceClientWorkflow":
        """
        Setup the inference client
        """
        self.client = InferenceClient(token=self.token)
        return self

    def do_stream(self, preprocessed_input: Any) -> Iterator[Any]:
        raise NotImplementedError

    def inference(self, input_data: HFInferenceClientInput) -> HFInferenceClientOutput:
        """
        Overriding the inference method to add typing annotations

        Args:
            input_data (HFInferenceClientInput): Input data for the inference call

        Returns:
            Dict[str, Any]: output data from the inference call
        """
        return cast(HFInferenceClientOutput, super().inference(input_data))

    def do_run_model(self, hf_input: HFInferenceClientInput) -> HFInferenceClientOutput:
        """
        Perform inference on the hf_input data

        Args:
            hf_input (HFInferenceClientInput): Input data for the inference call

        Returns:
            HFInferenceClientOutput: Output data from the inference call
        """

        attr_lookup = {
            HFTaskId.TEXT_CLASSIFICATION: "text_classification",
            HFTaskId.SUMMARIZATION: "summarization",
            HFTaskId.TEXT_GENERATION: "text_generation",
            HFTaskId.TOKEN_CLASSIFICATION: "token_classification",
        }

        # check if the task_id is supported
        if hf_input.task_id not in SUPPORTED_TASKS:
            raise ValueError(f"Task ID {hf_input.task_id} is not supported")

        task = self.client.__getattribute__(attr_lookup.get(hf_input.task_id))
        args = hf_input.model_dump()
        del args["task_id"]
        output = task(**args)

        logger.debug(f"Output from inference call: {output}")

        return {"output": output}

    def do_postprocessing(
        self, input_data: Any, output: dict[str, Any]
    ) -> dict[str, Any]:
        # Postprocessing logic here
        return output

    def do_generate_proof(self) -> Any:
        raise NotImplementedError

__init__(token=None, *args, **kwargs)

Initialize the Huggingface Inference Workflow object

Parameters:

    token (Optional[str]): API token for the inference client. Defaults to None.
Source code in src/infernet_ml/workflows/inference/hf_inference_client_workflow.py
def __init__(
    self,
    token: Optional[str] = None,
    *args: Any,
    **kwargs: Any,
) -> None:
    """
    Initialize the Huggingface Inference Workflow object

    Args:
        token (Optional[str]): API token for the inference client.
            Defaults to None.

    """
    self.token = token
    super().__init__(*args, **kwargs)
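
For gated models or higher rate limits, pass a Hugging Face API token; a minimal sketch, with the HF_TOKEN environment variable as an assumed convention:

import os

from infernet_ml.workflows.inference.hf_inference_client_workflow import (
    HFInferenceClientWorkflow,
)

# The token is forwarded to huggingface_hub.InferenceClient in do_setup().
workflow = HFInferenceClientWorkflow(token=os.environ.get("HF_TOKEN")).setup()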

do_run_model(hf_input)

Perform inference on the hf_input data

Parameters:

    hf_input (HFInferenceClientInput): Input data for the inference call. Required.

Returns:

    HFInferenceClientOutput: Output data from the inference call.

Source code in src/infernet_ml/workflows/inference/hf_inference_client_workflow.py
def do_run_model(self, hf_input: HFInferenceClientInput) -> HFInferenceClientOutput:
    """
    Perform inference on the hf_input data

    Args:
        hf_input (HFInferenceClientInput): Input data for the inference call

    Returns:
        HFInferenceClientOutput: Output data from the inference call
    """

    attr_lookup = {
        HFTaskId.TEXT_CLASSIFICATION: "text_classification",
        HFTaskId.SUMMARIZATION: "summarization",
        HFTaskId.TEXT_GENERATION: "text_generation",
        HFTaskId.TOKEN_CLASSIFICATION: "token_classification",
    }

    # check if the task_id is supported
    if hf_input.task_id not in SUPPORTED_TASKS:
        raise ValueError(f"Task ID {hf_input.task_id} is not supported")

    task = self.client.__getattribute__(attr_lookup.get(hf_input.task_id))
    args = hf_input.model_dump()
    del args["task_id"]
    output = task(**args)

    logger.debug(f"Output from inference call: {output}")

    return {"output": output}

do_setup()

Setup the inference client

Source code in src/infernet_ml/workflows/inference/hf_inference_client_workflow.py
def do_setup(self) -> "HFInferenceClientWorkflow":
    """
    Setup the inference client
    """
    self.client = InferenceClient(token=self.token)
    return self

inference(input_data)

Overriding the inference method to add typing annotations

Parameters:

    input_data (HFInferenceClientInput): Input data for the inference call. Required.

Returns:

    HFInferenceClientOutput: Output data from the inference call.

Source code in src/infernet_ml/workflows/inference/hf_inference_client_workflow.py
def inference(self, input_data: HFInferenceClientInput) -> HFInferenceClientOutput:
    """
    Overriding the inference method to add typing annotations

    Args:
        input_data (HFInferenceClientInput): Input data for the inference call

    Returns:
        Dict[str, Any]: output data from the inference call
    """
    return cast(HFInferenceClientOutput, super().inference(input_data))

setup()

Setup the inference client. Overriding the base class setup method to add typing annotations

Source code in src/infernet_ml/workflows/inference/hf_inference_client_workflow.py
def setup(self) -> "HFInferenceClientWorkflow":
    """
    Setup the inference client. Overriding the base class setup method to add
    typing annotations
    """
    return cast(HFInferenceClientWorkflow, super().setup())