创建语音

POST

audio

speech

Python

import os
from openai import OpenAI

# Client pointed at CometAPI's OpenAI-compatible endpoint; the key is read
# from the COMETAPI_KEY environment variable (KeyError if it is unset).
client = OpenAI(
    api_key=os.environ["COMETAPI_KEY"],
    base_url="https://api.cometapi.com/v1",
)

# Use the streaming-response variant: calling stream_to_file() on the plain
# (non-streaming) response is deprecated in the OpenAI SDK because it buffers
# the whole body instead of streaming it.
with client.audio.speech.with_streaming_response.create(
    model="tts-1",
    voice="alloy",
    input="The quick brown fox jumped over the lazy dog.",
) as response:
    # The body is binary audio, not JSON; write it straight to disk.
    response.stream_to_file("output.mp3")

import OpenAI from "openai";
import fs from "fs";

// Client configured for CometAPI's OpenAI-compatible endpoint; the key comes
// from the COMETAPI_KEY environment variable.
const client = new OpenAI({
  baseURL: "https://api.cometapi.com/v1",
  apiKey: process.env.COMETAPI_KEY,
});

// Minimal request: model, voice and the text to speak.
const speechParams = {
  model: "tts-1",
  voice: "alloy",
  input: "The quick brown fox jumped over the lazy dog.",
};
const response = await client.audio.speech.create(speechParams);

// The body is binary audio, not JSON; write the raw bytes to disk unchanged.
const audioBytes = await response.arrayBuffer();
fs.writeFileSync("output.mp3", Buffer.from(audioBytes));

# Synthesize speech through CometAPI and save the returned audio as output.mp3.
# The API key is taken from the COMETAPI_KEY environment variable.
curl --request POST \
  --url https://api.cometapi.com/v1/audio/speech \
  --header "Authorization: Bearer $COMETAPI_KEY" \
  --header "Content-Type: application/json" \
  --output output.mp3 \
  --data '{
    "model": "tts-1",
    "input": "The quick brown fox jumped over the lazy dog.",
    "voice": "alloy"
  }'

<?php

// Request speech synthesis from CometAPI and save the returned binary audio
// to output.mp3.

// Read the API key from the environment rather than hard-coding it.
$apiKey = getenv('COMETAPI_KEY');
if ($apiKey === false || $apiKey === '') {
  fwrite(STDERR, "COMETAPI_KEY is not set\n");
  exit(1);
}

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.cometapi.com/v1/audio/speech",
  // Return the body from curl_exec() instead of printing it directly.
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'model' => 'tts-1',
    'input' => 'The quick brown fox jumped over the lazy dog.',
    'voice' => 'alloy'
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer " . $apiKey,
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);
$status = curl_getinfo($curl, CURLINFO_RESPONSE_CODE);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} elseif ($status !== 200) {
  // A non-200 body is not audio; report it instead of saving it as an .mp3.
  fwrite(STDERR, "Request failed with HTTP " . $status . ": " . $response . "\n");
  exit(1);
} else {
  // The successful body is binary audio, so write it to a file rather than
  // echoing raw bytes to the terminal.
  file_put_contents("output.mp3", $response);
}

package main

import (
	"fmt"
	"io"
	"net/http"
	"os"
	"strings"
)

// main runs the text-to-speech request and exits non-zero on any failure.
func main() {
	if err := run(); err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
}

// run posts a speech request to CometAPI and writes the returned audio bytes
// to output.mp3. The API key is read from the COMETAPI_KEY environment
// variable. It returns an error if the request cannot be built or sent, if
// the server does not answer 200 OK, or if the file cannot be written.
func run() error {
	url := "https://api.cometapi.com/v1/audio/speech"

	payload := strings.NewReader("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		return fmt.Errorf("build request: %w", err)
	}

	req.Header.Add("Authorization", "Bearer "+os.Getenv("COMETAPI_KEY"))
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil here, so it must not be touched.
		return fmt.Errorf("send request: %w", err)
	}
	defer res.Body.Close()

	if res.StatusCode != http.StatusOK {
		// A non-200 body is not audio; surface it instead of saving it.
		body, _ := io.ReadAll(res.Body)
		return fmt.Errorf("request failed: %s: %s", res.Status, body)
	}

	out, err := os.Create("output.mp3")
	if err != nil {
		return fmt.Errorf("create output file: %w", err)
	}

	// Copy the binary audio straight to disk; converting it to a string and
	// printing it would garble the data.
	if _, err := io.Copy(out, res.Body); err != nil {
		out.Close()
		return fmt.Errorf("write audio: %w", err)
	}

	return out.Close()
}

HttpResponse<String> response = Unirest.post("https://api.cometapi.com/v1/audio/speech")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")
  .asString();

require 'uri'
require 'net/http'

# Request speech synthesis from CometAPI and save the returned binary audio
# to output.mp3.

url = URI("https://api.cometapi.com/v1/audio/speech")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
# Read the API key from the environment; ENV.fetch raises KeyError if unset.
request["Authorization"] = "Bearer #{ENV.fetch('COMETAPI_KEY')}"
request["Content-Type"] = 'application/json'
request.body = "{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}"

response = http.request(request)

if response.is_a?(Net::HTTPSuccess)
  # The body is binary audio: write it in binary mode instead of printing it
  # (puts would also append a newline to the data).
  File.binwrite("output.mp3", response.read_body)
else
  # A failed response is not audio; report it instead of saving it.
  abort "Request failed: #{response.code} #{response.read_body}"
end

"<string>"

使用此端点可通过兼容 OpenAI 的音频 API 将文本转换为音频文件。它适用于旁白、简短语音提示、朗读功能，以及其他你的应用已经有文本并需要语音输出的工作流。

首次请求

从三个字段开始：model、input 和 voice。保持首次请求简短，这样你就可以在调整速度或输出格式之前，先验证认证、音频格式和文件处理是否正常。

读取响应

响应是二进制音频，而不是 JSON。在 SDK 示例中，将响应写入文件，例如 output.mp3。在直接使用 HTTP 客户端时，保存响应体，并将文件扩展名设置为与你请求的 response_format 一致。

后续步骤

当你需要将语音转换回文本时，请使用创建转录。
当你需要从非英语音频中获取英文文本时，请使用创建翻译。

授权

Authorization

string

header

必填

Bearer token authentication. Use your CometAPI key.

请求体

application/json

model

string

默认值:tts-1

必填

The TTS model to use. Choose a current speech model from the Models page.

input

string

必填

The text to generate audio for. Maximum length is 4096 characters.

Maximum string length: 4096

voice

enum<string>

默认值:alloy

必填

The voice to use for speech synthesis.

可用选项:

alloy,

ash,

ballad,

coral,

echo,

fable,

onyx,

nova,

sage,

shimmer

response_format

enum<string>

默认值:mp3

The audio output format.

可用选项:

mp3,

opus,

aac,

flac,

wav,

pcm

speed

number

默认值:1

The speed of the generated audio. Select a value between 0.25 and 4.0.

必填范围: 0.25 <= x <= 4

响应

200 - audio/mpeg

The audio file content.

The response is of type file.

音频 API

创建转录

Python

import os
from openai import OpenAI

# Client pointed at CometAPI's OpenAI-compatible endpoint; the key is read
# from the COMETAPI_KEY environment variable (KeyError if it is unset).
client = OpenAI(
    api_key=os.environ["COMETAPI_KEY"],
    base_url="https://api.cometapi.com/v1",
)

# Use the streaming-response variant: calling stream_to_file() on the plain
# (non-streaming) response is deprecated in the OpenAI SDK because it buffers
# the whole body instead of streaming it.
with client.audio.speech.with_streaming_response.create(
    model="tts-1",
    voice="alloy",
    input="The quick brown fox jumped over the lazy dog.",
) as response:
    # The body is binary audio, not JSON; write it straight to disk.
    response.stream_to_file("output.mp3")

import OpenAI from "openai";
import fs from "fs";

// Client configured for CometAPI's OpenAI-compatible endpoint; the key comes
// from the COMETAPI_KEY environment variable.
const client = new OpenAI({
  baseURL: "https://api.cometapi.com/v1",
  apiKey: process.env.COMETAPI_KEY,
});

// Minimal request: model, voice and the text to speak.
const speechParams = {
  model: "tts-1",
  voice: "alloy",
  input: "The quick brown fox jumped over the lazy dog.",
};
const response = await client.audio.speech.create(speechParams);

// The body is binary audio, not JSON; write the raw bytes to disk unchanged.
const audioBytes = await response.arrayBuffer();
fs.writeFileSync("output.mp3", Buffer.from(audioBytes));

# Synthesize speech through CometAPI and save the returned audio as output.mp3.
# The API key is taken from the COMETAPI_KEY environment variable.
curl --request POST \
  --url https://api.cometapi.com/v1/audio/speech \
  --header "Authorization: Bearer $COMETAPI_KEY" \
  --header "Content-Type: application/json" \
  --output output.mp3 \
  --data '{
    "model": "tts-1",
    "input": "The quick brown fox jumped over the lazy dog.",
    "voice": "alloy"
  }'

<?php

// Request speech synthesis from CometAPI and save the returned binary audio
// to output.mp3.

// Read the API key from the environment rather than hard-coding it.
$apiKey = getenv('COMETAPI_KEY');
if ($apiKey === false || $apiKey === '') {
  fwrite(STDERR, "COMETAPI_KEY is not set\n");
  exit(1);
}

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.cometapi.com/v1/audio/speech",
  // Return the body from curl_exec() instead of printing it directly.
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'model' => 'tts-1',
    'input' => 'The quick brown fox jumped over the lazy dog.',
    'voice' => 'alloy'
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer " . $apiKey,
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);
$status = curl_getinfo($curl, CURLINFO_RESPONSE_CODE);

curl_close($curl);

if ($err) {
  echo "cURL Error #:" . $err;
} elseif ($status !== 200) {
  // A non-200 body is not audio; report it instead of saving it as an .mp3.
  fwrite(STDERR, "Request failed with HTTP " . $status . ": " . $response . "\n");
  exit(1);
} else {
  // The successful body is binary audio, so write it to a file rather than
  // echoing raw bytes to the terminal.
  file_put_contents("output.mp3", $response);
}

package main

import (
	"fmt"
	"io"
	"net/http"
	"os"
	"strings"
)

// main runs the text-to-speech request and exits non-zero on any failure.
func main() {
	if err := run(); err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
}

// run posts a speech request to CometAPI and writes the returned audio bytes
// to output.mp3. The API key is read from the COMETAPI_KEY environment
// variable. It returns an error if the request cannot be built or sent, if
// the server does not answer 200 OK, or if the file cannot be written.
func run() error {
	url := "https://api.cometapi.com/v1/audio/speech"

	payload := strings.NewReader("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		return fmt.Errorf("build request: %w", err)
	}

	req.Header.Add("Authorization", "Bearer "+os.Getenv("COMETAPI_KEY"))
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil here, so it must not be touched.
		return fmt.Errorf("send request: %w", err)
	}
	defer res.Body.Close()

	if res.StatusCode != http.StatusOK {
		// A non-200 body is not audio; surface it instead of saving it.
		body, _ := io.ReadAll(res.Body)
		return fmt.Errorf("request failed: %s: %s", res.Status, body)
	}

	out, err := os.Create("output.mp3")
	if err != nil {
		return fmt.Errorf("create output file: %w", err)
	}

	// Copy the binary audio straight to disk; converting it to a string and
	// printing it would garble the data.
	if _, err := io.Copy(out, res.Body); err != nil {
		out.Close()
		return fmt.Errorf("write audio: %w", err)
	}

	return out.Close()
}

HttpResponse<String> response = Unirest.post("https://api.cometapi.com/v1/audio/speech")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")
  .asString();

require 'uri'
require 'net/http'

# Request speech synthesis from CometAPI and save the returned binary audio
# to output.mp3.

url = URI("https://api.cometapi.com/v1/audio/speech")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
# Read the API key from the environment; ENV.fetch raises KeyError if unset.
request["Authorization"] = "Bearer #{ENV.fetch('COMETAPI_KEY')}"
request["Content-Type"] = 'application/json'
request.body = "{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}"

response = http.request(request)

if response.is_a?(Net::HTTPSuccess)
  # The body is binary audio: write it in binary mode instead of printing it
  # (puts would also append a newline to the data).
  File.binwrite("output.mp3", response.read_body)
else
  # A failed response is not audio; report it instead of saving it.
  abort "Request failed: #{response.code} #{response.read_body}"
end

"<string>"

内容审核

API 密钥

首次请求

读取响应

后续步骤

授权

请求体

响应

首次请求

读取响应

后续步骤

授权

请求体

响应

首次请求

读取响应

后续步骤