MiniMax Speech 2.8 HD

# Queue a MiniMax Speech 2.8 HD text-to-speech generation.
# The JSON body is sent exactly as written between the single quotes.
curl -X POST \
  -H 'Authorization: Bearer <token>' \
  -H 'Content-Type: application/json' \
  -d '
{
  "prompt": "<string>"
}
' \
  https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd

import requests

# Endpoint that accepts a MiniMax Speech 2.8 HD text-to-speech generation request.
url = "https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd"

# "prompt" (the text to convert to speech) is the only required body field.
payload = { "prompt": "<string>" }
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# requests applies no timeout by default, so a stalled connection would block
# this script indefinitely; cap the wait at 30 seconds.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw body: the generation record on success, or the error JSON.
print(response.text)

// Queue a MiniMax Speech 2.8 HD text-to-speech generation and log the parsed
// JSON response; any rejection in the chain is logged as an error.
const endpoint = 'https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd';

const headers = {
  Authorization: 'Bearer <token>',
  'Content-Type': 'application/json'
};

const options = {
  method: 'POST',
  headers,
  body: JSON.stringify({prompt: '<string>'})
};

const parseJson = (res) => res.json();
const logBody = (body) => console.log(body);
const logError = (err) => console.error(err);

fetch(endpoint, options)
  .then(parseJson)
  .then(logBody)
  .catch(logError);

<?php

// Queue a MiniMax Speech 2.8 HD text-to-speech generation and echo either the
// raw response body or the cURL transport error.
$endpoint = "https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd";

$requestBody = json_encode([
  'prompt' => '<string>'
]);

$requestHeaders = [
  "Authorization: Bearer <token>",
  "Content-Type: application/json"
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => $endpoint,
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => $requestBody,
  CURLOPT_HTTPHEADER => $requestHeaders,
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// A non-empty error string means the transfer itself failed.
echo $err ? "cURL Error #:" . $err : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main submits a text-to-speech generation request to the MiniMax Speech 2.8 HD
// endpoint and prints the raw response body.
//
// Each failure (building the request, sending it, reading the body) is
// reported and ends the program; previously the errors were discarded, so a
// failed send dereferenced a nil response.
func main() {

	url := "https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd"

	payload := strings.NewReader("{\n  \"prompt\": \"<string>\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so it must not be touched on this path.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response:", err)
		return
	}

	// Non-2xx responses still carry a JSON error body, so flag the status and
	// print the body anyway.
	if res.StatusCode < 200 || res.StatusCode > 299 {
		fmt.Println("unexpected status:", res.Status)
	}

	fmt.Println(string(body))

}

// Queue a MiniMax Speech 2.8 HD text-to-speech generation and keep the raw
// response body as a String.
String endpoint = "https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd";
String jsonBody = "{\n  \"prompt\": \"<string>\"\n}";

HttpResponse<String> response = Unirest.post(endpoint)
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body(jsonBody)
  .asString();

require 'uri'
require 'net/http'

# Queue a MiniMax Speech 2.8 HD text-to-speech generation and print the raw
# response body.
url = URI("https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd")

# Headers are supplied up front as the request's initial header set.
request = Net::HTTP::Post.new(url, {
  "Authorization" => 'Bearer <token>',
  "Content-Type" => 'application/json'
})
request.body = "{\n  \"prompt\": \"<string>\"\n}"

# The endpoint is HTTPS, so TLS is switched on before the request is sent.
http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

response = http.request(request)
puts response.read_body

import Foundation

// Queue a MiniMax Speech 2.8 HD text-to-speech generation and print the raw
// response body decoded as UTF-8.
let url = URL(string: "https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd")!

// Serialize the JSON body first so an encoding failure surfaces before any
// network work starts.
let parameters = ["prompt": "<string>"] as [String : Any?]
let postData = try JSONSerialization.data(withJSONObject: parameters, options: [])

var request = URLRequest(url: url)
request.httpMethod = "POST"
request.timeoutInterval = 10
request.setValue("Bearer <token>", forHTTPHeaderField: "Authorization")
request.setValue("application/json", forHTTPHeaderField: "Content-Type")
request.httpBody = postData

let (data, _) = try await URLSession.shared.data(for: request)
print(String(decoding: data, as: UTF8.self))

{
  "id": "gen_123",
  "status": "IN_QUEUE",
  "input": {
    "prompt": "Hello world! Welcome to MiniMax's new text to speech model <#0.1#> Speech 2.8 HD (laughs) now available on Fal!"
  },
  "usage": {
    "total": 20,
    "subscription": 20,
    "permanent": 0
  }
}

{
  "error": "TTS_GENERATION_INVALID_INPUT",
  "code": "TTS_GENERATION_INVALID_INPUT",
  "message": "'prompt' parameter is required"
}

{
  "error": "UNAUTHORIZED",
  "code": "UNAUTHORIZED",
  "message": "Unauthorized"
}

{
  "error": "INSUFFICIENT_CREDITS",
  "code": "TTS_GENERATION_INSUFFICIENT_CREDITS",
  "message": "Insufficient credits for this generation."
}

{
  "error": "WORKSPACE_FORBIDDEN",
  "code": "WORKSPACE_FORBIDDEN",
  "message": "You do not have access to this workspace."
}

{
  "error": "TEMPLATE_NOT_FOUND",
  "code": "TEMPLATE_NOT_FOUND",
  "message": "Template not found."
}

{
  "error": "TTS_GENERATION_CONTENT_REJECTED",
  "code": "TTS_GENERATION_CONTENT_REJECTED",
  "message": "Request content was rejected by the moderation policy."
}

{
  "error": "TTS_GENERATION_RATE_LIMITED",
  "code": "TTS_GENERATION_RATE_LIMITED",
  "message": "Rate limit exceeded. Please retry later."
}

{
  "error": "TTS_GENERATION_FAILED",
  "code": "TTS_GENERATION_FAILED",
  "message": "Generation failed."
}

{
  "error": "TTS_GENERATION_FAILED",
  "code": "TTS_GENERATION_FAILED",
  "message": "Generation failed."
}

{
  "error": "TTS_GENERATION_PROVIDER_UNAVAILABLE",
  "code": "TTS_GENERATION_PROVIDER_UNAVAILABLE",
  "message": "Upstream generation provider is temporarily unavailable."
}

{
  "error": "TTS_GENERATION_TIMEOUT",
  "code": "TTS_GENERATION_TIMEOUT",
  "message": "Generation timed out."
}

POST

generation

fal-ai

minimax

speech-2.8-hd

MiniMax Speech 2.8 HD

# Queue a MiniMax Speech 2.8 HD text-to-speech generation.
# The JSON body is sent exactly as written between the single quotes.
curl -X POST \
  -H 'Authorization: Bearer <token>' \
  -H 'Content-Type: application/json' \
  -d '
{
  "prompt": "<string>"
}
' \
  https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd

import requests

# Endpoint that accepts a MiniMax Speech 2.8 HD text-to-speech generation request.
url = "https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd"

# "prompt" (the text to convert to speech) is the only required body field.
payload = { "prompt": "<string>" }
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# requests applies no timeout by default, so a stalled connection would block
# this script indefinitely; cap the wait at 30 seconds.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw body: the generation record on success, or the error JSON.
print(response.text)

// Queue a MiniMax Speech 2.8 HD text-to-speech generation and log the parsed
// JSON response; any rejection in the chain is logged as an error.
const endpoint = 'https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd';

const headers = {
  Authorization: 'Bearer <token>',
  'Content-Type': 'application/json'
};

const options = {
  method: 'POST',
  headers,
  body: JSON.stringify({prompt: '<string>'})
};

const parseJson = (res) => res.json();
const logBody = (body) => console.log(body);
const logError = (err) => console.error(err);

fetch(endpoint, options)
  .then(parseJson)
  .then(logBody)
  .catch(logError);

<?php

// Queue a MiniMax Speech 2.8 HD text-to-speech generation and echo either the
// raw response body or the cURL transport error.
$endpoint = "https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd";

$requestBody = json_encode([
  'prompt' => '<string>'
]);

$requestHeaders = [
  "Authorization: Bearer <token>",
  "Content-Type: application/json"
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => $endpoint,
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => $requestBody,
  CURLOPT_HTTPHEADER => $requestHeaders,
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// A non-empty error string means the transfer itself failed.
echo $err ? "cURL Error #:" . $err : $response;

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main submits a text-to-speech generation request to the MiniMax Speech 2.8 HD
// endpoint and prints the raw response body.
//
// Each failure (building the request, sending it, reading the body) is
// reported and ends the program; previously the errors were discarded, so a
// failed send dereferenced a nil response.
func main() {

	url := "https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd"

	payload := strings.NewReader("{\n  \"prompt\": \"<string>\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so it must not be touched on this path.
		fmt.Println("sending request:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response:", err)
		return
	}

	// Non-2xx responses still carry a JSON error body, so flag the status and
	// print the body anyway.
	if res.StatusCode < 200 || res.StatusCode > 299 {
		fmt.Println("unexpected status:", res.Status)
	}

	fmt.Println(string(body))

}

// Queue a MiniMax Speech 2.8 HD text-to-speech generation and keep the raw
// response body as a String.
String endpoint = "https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd";
String jsonBody = "{\n  \"prompt\": \"<string>\"\n}";

HttpResponse<String> response = Unirest.post(endpoint)
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body(jsonBody)
  .asString();

require 'uri'
require 'net/http'

# Queue a MiniMax Speech 2.8 HD text-to-speech generation and print the raw
# response body.
url = URI("https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd")

# Headers are supplied up front as the request's initial header set.
request = Net::HTTP::Post.new(url, {
  "Authorization" => 'Bearer <token>',
  "Content-Type" => 'application/json'
})
request.body = "{\n  \"prompt\": \"<string>\"\n}"

# The endpoint is HTTPS, so TLS is switched on before the request is sent.
http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

response = http.request(request)
puts response.read_body

import Foundation

// Queue a MiniMax Speech 2.8 HD text-to-speech generation and print the raw
// response body decoded as UTF-8.
let url = URL(string: "https://open.skills.video/api/v1/generation/fal-ai/minimax/speech-2.8-hd")!

// Serialize the JSON body first so an encoding failure surfaces before any
// network work starts.
let parameters = ["prompt": "<string>"] as [String : Any?]
let postData = try JSONSerialization.data(withJSONObject: parameters, options: [])

var request = URLRequest(url: url)
request.httpMethod = "POST"
request.timeoutInterval = 10
request.setValue("Bearer <token>", forHTTPHeaderField: "Authorization")
request.setValue("application/json", forHTTPHeaderField: "Content-Type")
request.httpBody = postData

let (data, _) = try await URLSession.shared.data(for: request)
print(String(decoding: data, as: UTF8.self))

{
  "id": "gen_123",
  "status": "IN_QUEUE",
  "input": {
    "prompt": "Hello world! Welcome to MiniMax's new text to speech model <#0.1#> Speech 2.8 HD (laughs) now available on Fal!"
  },
  "usage": {
    "total": 20,
    "subscription": 20,
    "permanent": 0
  }
}

{
  "error": "TTS_GENERATION_INVALID_INPUT",
  "code": "TTS_GENERATION_INVALID_INPUT",
  "message": "'prompt' parameter is required"
}

{
  "error": "UNAUTHORIZED",
  "code": "UNAUTHORIZED",
  "message": "Unauthorized"
}

{
  "error": "INSUFFICIENT_CREDITS",
  "code": "TTS_GENERATION_INSUFFICIENT_CREDITS",
  "message": "Insufficient credits for this generation."
}

{
  "error": "WORKSPACE_FORBIDDEN",
  "code": "WORKSPACE_FORBIDDEN",
  "message": "You do not have access to this workspace."
}

{
  "error": "TEMPLATE_NOT_FOUND",
  "code": "TEMPLATE_NOT_FOUND",
  "message": "Template not found."
}

{
  "error": "TTS_GENERATION_CONTENT_REJECTED",
  "code": "TTS_GENERATION_CONTENT_REJECTED",
  "message": "Request content was rejected by the moderation policy."
}

{
  "error": "TTS_GENERATION_RATE_LIMITED",
  "code": "TTS_GENERATION_RATE_LIMITED",
  "message": "Rate limit exceeded. Please retry later."
}

{
  "error": "TTS_GENERATION_FAILED",
  "code": "TTS_GENERATION_FAILED",
  "message": "Generation failed."
}

{
  "error": "TTS_GENERATION_FAILED",
  "code": "TTS_GENERATION_FAILED",
  "message": "Generation failed."
}

{
  "error": "TTS_GENERATION_PROVIDER_UNAVAILABLE",
  "code": "TTS_GENERATION_PROVIDER_UNAVAILABLE",
  "message": "Upstream generation provider is temporarily unavailable."
}

{
  "error": "TTS_GENERATION_TIMEOUT",
  "code": "TTS_GENERATION_TIMEOUT",
  "message": "Generation timed out."
}

High-quality text-to-speech with multilingual voices and controllable voice/audio settings.

Authorizations

Authorization

string

header

required

API Key for API endpoints

Body

prompt

string

required

Text to convert to speech. Use <#x#> for pauses (x = 0.01-99.99 seconds). Supports interjection tags: (laughs), (sighs), (coughs), (clears throat), (gasps), (sniffs), (groans), (yawns).

Required string length: 1 - 10000

Example:

"Hello world! Welcome to MiniMax's new text to speech model <#0.1#> Speech 2.8 HD (laughs) now available on Fal!"

voice_id

enum<string>

default:Wise_Woman

Predefined voice ID or preset name.

Available options:

Wise_Woman,

Friendly_Person,

Inspirational_girl,

Deep_Voice_Man,

Calm_Woman,

Casual_Guy,

Lively_Girl,

Patient_Man,

Young_Knight,

Determined_Man,

Lovely_Girl,

Decent_Boy,

Imposing_Manner,

Elegant_Man,

Abbess,

Sweet_Girl_2,

Exuberant_Girl

Examples:

"Wise_Woman"

"Friendly_Person"

"Calm_Woman"

speed

number

default:1

Speech speed (0.5 - 2.0).

Required range: 0.5 <= x <= 2

vol

number

default:1

Volume (0.01 - 10).

Required range: 0.01 <= x <= 10

pitch

integer

default:0

Voice pitch (-12 to 12).

Required range: -12 <= x <= 12

emotion

enum<string>

Emotion style of generated speech.

Available options:

happy,

sad,

angry,

fearful,

disgusted,

surprised,

neutral

english_normalization

boolean

default:false

Enables English text normalization to improve number reading performance, with a slight increase in latency.

language_boost

enum<string>

default:auto

Enhance recognition of specified languages and dialects.

Available options:

auto,

Chinese,

Chinese,Yue,

English,

Arabic,

Russian,

Spanish,

French,

Portuguese,

German,

Turkish,

Dutch,

Ukrainian,

Vietnamese,

Indonesian,

Japanese,

Italian,

Korean,

Thai,

Polish,

Romanian,

Greek,

Czech,

Finnish,

Hindi,

Bulgarian,

Danish,

Hebrew,

Malay,

Slovak,

Swedish,

Croatian,

Hungarian,

Norwegian,

Slovenian,

Catalan,

Nynorsk,

Afrikaans

audio_sample_rate

default:32000

Sample rate of generated audio.

audio_bitrate

default:128000

Bitrate of generated audio.

audio_format

enum<string>

default:mp3

Audio format.

Available options:

mp3,

pcm,

flac

audio_channel

default:1

Number of audio channels (1=mono, 2=stereo).

normalization_enabled

boolean

default:true

Enable loudness normalization for the audio.

target_loudness

number

default:-18

Target loudness in LUFS (default -18.0).

Required range: -70 <= x <= -10

target_range

number

default:8

Target loudness range in LU (default 8.0).

Required range: 0 <= x <= 20

target_peak

number

default:-0.5

Target peak level in dBTP (default -0.5).

Required range: -3 <= x <= 0

voice_modify_pitch

integer

default:0

Pitch adjustment in semitones. Range: -100 to 100. Positive values raise pitch, negative values lower it.

Required range: -100 <= x <= 100

voice_modify_intensity

integer

default:0

Intensity or energy of the voice. Range: -100 to 100. Higher values create more energetic speech.

Required range: -100 <= x <= 100

voice_modify_timbre

integer

default:0

Timbre adjustment. Range: -100 to 100. Affects the tonal quality of the voice.

Required range: -100 <= x <= 100

Response

Generation submission accepted

id

string

required

Generation id.

status

enum<string>

required

Queue status

Available options:

IN_QUEUE,

IN_PROGRESS,

COMPLETED,

FAILED,

CANCELED

input

MiniMax Speech 2.8 HD Input · object

required

Normalized input payload for the generation task.

Show child attributes

usage

object

required

Credit usage breakdown for the request

Show child attributes

code

string

Machine-readable generation error code. Present when status is FAILED.

message

string

Sanitized human-readable failure message. Present when status is FAILED.

Generate TTS audio (synchronous)

MiniMax Speech 2.8 HD

Get started

Billing

APIs

MiniMax Speech 2.8 HD

Authorizations

Body

Response