diff --git a/api-reference/v2/pre-recorded/init.mdx b/api-reference/v2/pre-recorded/init.mdx index 413e335..d1ba3e7 100644 --- a/api-reference/v2/pre-recorded/init.mdx +++ b/api-reference/v2/pre-recorded/init.mdx @@ -2,4 +2,8 @@ title: Initiate a transcription description: Initiate a pre-recorded transcription job. Use the returned `id` and the [GET /v2/pre-recorded/:id](/api-reference/v2/pre-recorded/get) endpoint to obtain the results. openapi: POST /v2/pre-recorded ---- \ No newline at end of file +--- + +import ChooseModel from "/snippets/choose-model.mdx"; + + \ No newline at end of file diff --git a/chapters/live-stt/quickstart.mdx b/chapters/live-stt/quickstart.mdx index 983a13a..23168e2 100644 --- a/chapters/live-stt/quickstart.mdx +++ b/chapters/live-stt/quickstart.mdx @@ -7,6 +7,10 @@ import Samples from '/snippets/samples.mdx'; import PartialsTip from '/snippets/partials-tip.mdx'; import WhyPostToOpenWebSocket from '/snippets/why-post-to-open-websocket.mdx'; + +Live transcription supports **`"solaria-1"` only**. + + diff --git a/chapters/pre-recorded-stt/quickstart.mdx b/chapters/pre-recorded-stt/quickstart.mdx index 20e59b4..2b2478c 100644 --- a/chapters/pre-recorded-stt/quickstart.mdx +++ b/chapters/pre-recorded-stt/quickstart.mdx @@ -5,6 +5,7 @@ description: How to transcribe pre-recorded audio with Gladia's speech-to-text ( import GetTranscriptionResult from "/snippets/get-transcription-result.mdx"; import Samples from "/snippets/samples.mdx"; +import ChooseModel from "/snippets/choose-model.mdx"; @@ -13,6 +14,8 @@ The SDK simplifies pre-recorded speech-to-text by abstracting upload, job creati - A `transcribe()` for an end-to-end flow - Individual steps when you need control over each step. 
+ + ## Install the SDK @@ -73,9 +76,9 @@ const gladiaClient = new GladiaClient({ apiKey: "YOUR_GLADIA_API_KEY" }); const transcription = await gladiaClient.preRecorded().transcribe( "YOUR_AUDIO_URL_OR_LOCAL_PATH", { + model: "solaria-3", language_config: { - languages: ["en", "fr"], - code_switching: true, + languages: ["fr"], }, custom_vocabulary: true, custom_vocabulary_config: { @@ -93,9 +96,9 @@ gladia_client = GladiaClient(api_key="YOUR_GLADIA_API_KEY").prerecorded() transcription = gladia_client.transcribe( "YOUR_AUDIO_URL_OR_LOCAL_PATH", { + "model": "solaria-3", "language_config": { - "languages": ["en", "fr"], - "code_switching": True, + "languages": ["fr"], }, "custom_vocabulary": True, "custom_vocabulary_config": { @@ -106,6 +109,10 @@ transcription = gladia_client.transcribe( ``` + + With `"solaria-3"`, set **one language** in `language_config.languages` — for example `["fr"]`. Do not pass multiple languages or enable code switching. + + Want to go further? See [Audio Intelligence](/chapters/pre-recorded-stt/audio-intelligence) for add-ons like: - [Speaker diarization](/chapters/audio-intelligence/speaker-diarization): separate the speakers across the conversation @@ -174,9 +181,9 @@ const gladiaClient = new GladiaClient({ apiKey: "YOUR_GLADIA_API_KEY" }); const job = await gladiaClient.preRecorded().createUntyped({ audio_url: "YOUR_AUDIO_URL", + model: "solaria-3", language_config: { - languages: ["en", "fr"], - code_switching: true, + languages: ["fr"], }, custom_vocabulary: true, custom_vocabulary_config: { @@ -193,9 +200,9 @@ gladia_client = GladiaClient(api_key="YOUR_GLADIA_API_KEY").prerecorded() job = gladia_client.create( { "audio_url": "YOUR_AUDIO_URL", + "model": "solaria-3", "language_config": { - "languages": ["en", "fr"], - "code_switching": True, + "languages": ["fr"], }, "custom_vocabulary": True, "custom_vocabulary_config": { @@ -219,6 +226,8 @@ job = gladia_client.create( + + ## Individual steps Upload audio, create a transcription job, 
then poll until the job is done (or use webhooks or a callback URL). @@ -270,9 +279,9 @@ const response = await fetch("https://api.gladia.io/v2/pre-recorded", { }, body: JSON.stringify({ audio_url: "YOUR_AUDIO_URL", + model: "solaria-3", language_config: { - languages: [], - code_switching: false, + languages: ["fr"], }, diarization: true, diarization_config: { @@ -311,9 +320,9 @@ curl --request POST \ --header 'x-gladia-key: YOUR_GLADIA_API_KEY' \ --data '{ "audio_url": "YOUR_AUDIO_URL", + "model": "solaria-3", "language_config": { - "languages": [], - "code_switching": false + "languages": ["fr"] }, "diarization": true, "diarization_config": { diff --git a/snippets/choose-model.mdx b/snippets/choose-model.mdx new file mode 100644 index 0000000..7b57d01 --- /dev/null +++ b/snippets/choose-model.mdx @@ -0,0 +1,16 @@ + +Pass `model` to choose the transcription model: + +**`"solaria-3"`** — our latest model: highest accuracy on European real-world audio. +- **Async (pre-recorded) only** — not available for live transcription. +- **Languages:** English, French, German, Spanish, Italian. +- **Single language only** — pass exactly one language in `language_config.languages` (no code switching). +- All Audio Intelligence add-ons available. + +**`"solaria-1"`** — our generalist model: maximum language coverage across any domain. +- Available for async and live. +- Code switching and multi-language configuration (100+ languages covered). +- All Audio Intelligence add-ons available. + +If omitted, the API uses the default model, `"solaria-1"`. +