
mistral_common.protocol.transcription.request

TranscriptionRequest(**data)

Bases: BaseCompletionRequest

A class representing a request for audio transcription.

This class holds the audio data and parameters of a transcription request and includes methods to convert the request to and from the OpenAI API format.

Attributes:

    id (Optional[str]): An optional identifier for the transcription request.
    model (Optional[str]): The model to be used for transcription.
    audio (RawAudio): The audio data to be transcribed.
    language (Optional[LanguageAlpha2]): The language of the input audio, in ISO 639-1 format (optional).
    strict_audio_validation (bool): Whether to perform strict validation of the audio data.

Source code in .venv/lib/python3.13/site-packages/pydantic/main.py
def __init__(self, /, **data: Any) -> None:
    """Create a new model by parsing and validating input data from keyword arguments.

    Raises [`ValidationError`][pydantic_core.ValidationError] if the input data cannot be
    validated to form a valid model.

    `self` is explicitly positional-only to allow `self` as a field name.
    """
    # `__tracebackhide__` tells pytest and some other tools to omit this function from tracebacks
    __tracebackhide__ = True
    validated_self = self.__pydantic_validator__.validate_python(data, self_instance=self)
    if self is not validated_self:
        warnings.warn(
            'A custom validator is returning a value other than `self`.\n'
            "Returning anything other than `self` from a top level model validator isn't supported when validating via `__init__`.\n"
            'See the `model_validator` docs (https://docs.pydantic.dev/latest/concepts/validators/#model-validators) for more details.',
            stacklevel=2,
        )
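
A minimal usage sketch (not part of the library docs) for constructing a TranscriptionRequest directly. The import path for Audio and RawAudio (assumed here to be mistral_common.audio), the file path, and the model name are assumptions; adjust them to your installed version. Audio.from_bytes and to_base64 are used exactly as in the from_openai source below.

from mistral_common.audio import Audio, RawAudio  # assumed import path
from mistral_common.protocol.transcription.request import TranscriptionRequest

# Read raw bytes from a local file (hypothetical path) and wrap them as RawAudio.
with open("speech.wav", "rb") as f:
    audio = Audio.from_bytes(f.read(), strict=False)

request = TranscriptionRequest(
    model="voxtral-mini-latest",  # hypothetical model name
    audio=RawAudio(data=audio.to_base64(audio.format), format=audio.format),
    language="en",
)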

from_openai(openai_request, strict=False) classmethod

Create a TranscriptionRequest instance from an OpenAI request dictionary.

This method converts an OpenAI request dictionary into a TranscriptionRequest instance, handling the conversion of audio data and other parameters.

Parameters:

    openai_request (Dict[str, Any]): The OpenAI request dictionary. Required.
    strict (bool): Whether to perform strict validation of the audio data. Defaults to False.

Returns:

    TranscriptionRequest: An instance of TranscriptionRequest.

Source code in src/mistral_common/protocol/transcription/request.py
@classmethod
def from_openai(cls, openai_request: Dict[str, Any], strict: bool = False) -> "TranscriptionRequest":
    r"""Create a TranscriptionRequest instance from an OpenAI request dictionary.

    This method converts an OpenAI request dictionary into a TranscriptionRequest instance,
    handling the conversion of audio data and other parameters.

    Args:
        openai_request: The OpenAI request dictionary.
        strict: A flag indicating whether to perform strict validation of the audio data.

    Returns:
       An instance of TranscriptionRequest.
    """
    file = openai_request.get("file")
    seed = openai_request.get("seed")
    converted_dict = {
        k: v
        for k, v in openai_request.items()
        if (k in cls.model_fields and not (v is None and k in ["temperature", "top_p"]))
    }

    assert file is not None, file
    if isinstance(file, io.BytesIO):
        audio_bytes = file.getvalue()
    else:
        # for example if file is UploadFile, this should work
        audio_bytes = file.file.read()

    audio = Audio.from_bytes(audio_bytes, strict=strict)
    audio_str = audio.to_base64(audio.format)
    raw_audio = RawAudio(data=audio_str, format=audio.format)

    converted_dict["audio"] = raw_audio
    converted_dict["random_seed"] = seed
    return cls(**converted_dict)
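
As a usage sketch (not part of the library docs), the dictionary below mimics an OpenAI-style transcription payload; the file path and model name are hypothetical. Per the source above, "file" may be an io.BytesIO (or an UploadFile-like object exposing a .file attribute), and "seed" is mapped to random_seed.

import io

from mistral_common.protocol.transcription.request import TranscriptionRequest

with open("speech.wav", "rb") as f:  # hypothetical local file
    payload = {
        "file": io.BytesIO(f.read()),
        "model": "voxtral-mini-latest",  # hypothetical model name
        "language": "en",
        "seed": 42,  # becomes random_seed on the TranscriptionRequest
    }

request = TranscriptionRequest.from_openai(payload, strict=False)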

to_openai(exclude=(), **kwargs)

Convert the transcription request into the OpenAI format.

This method prepares the transcription request data for compatibility with the OpenAI API. It handles the conversion of audio data and additional parameters into the required format.

Parameters:

    exclude (tuple): Fields to exclude from the conversion. Defaults to ().
    kwargs (Any): Additional parameters to be added to the request. Defaults to {}.

Returns:

    Dict[str, List[Dict[str, Any]]]: The request in the OpenAI format.

Raises:

    ImportError: If the required soundfile library is not installed.

Source code in src/mistral_common/protocol/transcription/request.py
def to_openai(self, exclude: tuple = (), **kwargs: Any) -> Dict[str, List[Dict[str, Any]]]:
    r"""Convert the transcription request into the OpenAI format.

    This method prepares the transcription request data for compatibility with the OpenAI API.
    It handles the conversion of audio data and additional parameters into the required format.

    Args:
        exclude: Fields to exclude from the conversion.
        kwargs: Additional parameters to be added to the request.

    Returns:
        The request in the OpenAI format.

    Raises:
        ImportError: If the required soundfile library is not installed.
    """
    openai_request: Dict[str, Any] = self.model_dump(exclude={"audio"})

    assert_soundfile_installed()

    if isinstance(self.audio.data, bytes):
        buffer = io.BytesIO(self.audio.data)
    else:
        assert isinstance(self.audio.data, str)
        audio = Audio.from_base64(self.audio.data)

        buffer = io.BytesIO()
        sf.write(buffer, audio.audio_array, audio.sampling_rate, format=audio.format)
        # reset cursor to beginning
        buffer.seek(0)

    openai_request["file"] = buffer
    openai_request["seed"] = openai_request.pop("random_seed")
    openai_request.update(kwargs)

    # remove mistral-specific
    default_exclude = ("id", "max_tokens", "strict_audio_validation")
    default_exclude += exclude
    for k in default_exclude:
        openai_request.pop(k, None)

    return openai_request
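
A short round-trip sketch continuing from the from_openai example above, assuming the optional soundfile dependency is installed. The client call in the comment is only illustrative of an OpenAI-compatible SDK.

openai_kwargs = request.to_openai()

# openai_kwargs now holds a "file" BytesIO buffer and a "seed" key (renamed from
# "random_seed"); mistral-specific fields such as id, max_tokens and
# strict_audio_validation have been stripped. It can be forwarded to an
# OpenAI-compatible client, e.g.:
#   client.audio.transcriptions.create(**openai_kwargs)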