unitxt.inference module

class unitxt.inference.HFPipelineBasedInferenceEngine(__tags__: Dict[str, str] = {}, model_name: str, max_new_tokens: int)

Bases: InferenceEngine, PackageRequirementsMixin

class unitxt.inference.IbmGenAiInferenceEngine(__tags__: Dict[str, str] = {}, label: str = 'ibm_genai', model_name: str, parameters: IbmGenAiInferenceEngineParams = IbmGenAiInferenceEngineParams(decoding_method=None, max_new_tokens=None, min_new_tokens=None, random_seed=None, repetition_penalty=None, stop_sequences=None, temperature=None, top_k=None, top_p=None, typical_p=None))

Bases: InferenceEngine, PackageRequirementsMixin

parameters: IbmGenAiInferenceEngineParams = IbmGenAiInferenceEngineParams(decoding_method=None, max_new_tokens=None, min_new_tokens=None, random_seed=None, repetition_penalty=None, stop_sequences=None, temperature=None, top_k=None, top_p=None, typical_p=None)

class unitxt.inference.IbmGenAiInferenceEngineParams(decoding_method: str = None, max_new_tokens: int | NoneType = None, min_new_tokens: int | NoneType = None, random_seed: int | NoneType = None, repetition_penalty: float | NoneType = None, stop_sequences: List[str] | NoneType = None, temperature: float | NoneType = None, top_k: int | NoneType = None, top_p: float | NoneType = None, typical_p: float | NoneType = None)

Bases: object

class unitxt.inference.InferenceEngine(__tags__: Dict[str, str] = {})

Bases: ABC, Artifact

Abstract base class for inference.

class unitxt.inference.OpenAiInferenceEngine(__tags__: Dict[str, str] = {}, label: str = 'openai', model_name: str, parameters: OpenAiInferenceEngineParams = OpenAiInferenceEngineParams(frequency_penalty=None, presence_penalty=None, max_tokens=None, seed=None, stop=None, temperature=None, top_p=None))

Bases: InferenceEngine, PackageRequirementsMixin

parameters: OpenAiInferenceEngineParams = OpenAiInferenceEngineParams(frequency_penalty=None, presence_penalty=None, max_tokens=None, seed=None, stop=None, temperature=None, top_p=None)

class unitxt.inference.OpenAiInferenceEngineParams(frequency_penalty: float | NoneType = None, presence_penalty: float | NoneType = None, max_tokens: int | NoneType = None, seed: int | NoneType = None, stop: str | NoneType | List[str] = None, temperature: float | NoneType = None, top_p: float | NoneType = None)

Bases: object