建立語音

POST

audio

speech

Python

import os
from openai import OpenAI

# Point the OpenAI SDK at CometAPI's OpenAI-compatible endpoint; the key is
# read from the COMETAPI_KEY environment variable (KeyError if it is unset).
client = OpenAI(
    api_key=os.environ["COMETAPI_KEY"],
    base_url="https://api.cometapi.com/v1",
)

# The response body is binary audio, not JSON. with_streaming_response writes
# it to disk as it arrives and releases the HTTP connection when the block
# exits; calling stream_to_file() on a plain create() result is deprecated in
# the SDK because it does not actually stream.
with client.audio.speech.with_streaming_response.create(
    model="tts-1",
    voice="alloy",
    input="The quick brown fox jumped over the lazy dog.",
) as response:
    response.stream_to_file("output.mp3")

import OpenAI from "openai";
import fs from "fs";

// SDK client bound to CometAPI's OpenAI-compatible endpoint; the key is taken
// from the COMETAPI_KEY environment variable.
const openai = new OpenAI({
  apiKey: process.env.COMETAPI_KEY,
  baseURL: "https://api.cometapi.com/v1",
});

// The three fields used for a first request.
const speechRequest = {
  model: "tts-1",
  voice: "alloy",
  input: "The quick brown fox jumped over the lazy dog.",
};

const speech = await openai.audio.speech.create(speechRequest);

// The body is binary audio: collect the bytes, then write them to disk.
const audioBytes = await speech.arrayBuffer();
fs.writeFileSync("output.mp3", Buffer.from(audioBytes));

# Request speech for one sentence and save the binary response as output.mp3.
curl --request POST \
  --url https://api.cometapi.com/v1/audio/speech \
  --header "Authorization: Bearer $COMETAPI_KEY" \
  --header "Content-Type: application/json" \
  --output output.mp3 \
  --data '{
    "model": "tts-1",
    "input": "The quick brown fox jumped over the lazy dog.",
    "voice": "alloy"
  }'

<?php

// Read the key from the environment, like the SDK and curl samples, instead
// of sending a hard-coded placeholder token.
$apiKey = getenv('COMETAPI_KEY');
if ($apiKey === false || $apiKey === '') {
  fwrite(STDERR, "COMETAPI_KEY is not set\n");
  exit(1);
}

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.cometapi.com/v1/audio/speech",
  // Return the body from curl_exec() so it can be saved to a file below.
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'model' => 'tts-1',
    'input' => 'The quick brown fox jumped over the lazy dog.',
    'voice' => 'alloy'
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer " . $apiKey,
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);
$status = curl_getinfo($curl, CURLINFO_HTTP_CODE);

curl_close($curl);

if ($response === false) {
  // Transport-level failure (DNS, TLS, timeout, ...).
  fwrite(STDERR, "cURL Error #:" . $err . "\n");
  exit(1);
}

if ($status !== 200) {
  // Only a 200 response is documented to carry audio; show anything else as
  // an error instead of saving it as an .mp3 file.
  fwrite(STDERR, "Request failed with HTTP " . $status . ": " . $response . "\n");
  exit(1);
}

// The body is binary audio, so write it to a file rather than echoing it.
if (file_put_contents("output.mp3", $response) === false) {
  fwrite(STDERR, "Could not write output.mp3\n");
  exit(1);
}

package main

import (
	"fmt"
	"io"
	"net/http"
	"os"
	"strings"
)

// run sends the text-to-speech request and saves the returned audio to
// output.mp3. It returns an error instead of exiting so that deferred
// cleanup (closing the response body and the file) always runs.
func run() error {
	url := "https://api.cometapi.com/v1/audio/speech"

	payload := strings.NewReader("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		return fmt.Errorf("build request: %w", err)
	}

	// Read the key from the environment, like the SDK and curl samples.
	req.Header.Add("Authorization", "Bearer "+os.Getenv("COMETAPI_KEY"))
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		return fmt.Errorf("send request: %w", err)
	}
	defer res.Body.Close()

	if res.StatusCode != http.StatusOK {
		// Only a 200 response is documented to carry audio; surface anything
		// else as an error rather than saving it as an .mp3 file.
		body, _ := io.ReadAll(res.Body)
		return fmt.Errorf("request failed: %s: %s", res.Status, body)
	}

	out, err := os.Create("output.mp3")
	if err != nil {
		return fmt.Errorf("create output file: %w", err)
	}
	defer out.Close()

	// The body is binary audio: copy the bytes to disk instead of printing
	// them as a string.
	if _, err := io.Copy(out, res.Body); err != nil {
		return fmt.Errorf("write audio: %w", err)
	}
	return nil
}

func main() {
	if err := run(); err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
}

HttpResponse<String> response = Unirest.post("https://api.cometapi.com/v1/audio/speech")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")
  .asString();

require 'uri'
require 'net/http'

url = URI("https://api.cometapi.com/v1/audio/speech")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
# Read the key from the environment, like the SDK and curl samples;
# ENV.fetch raises KeyError when COMETAPI_KEY is not set.
request["Authorization"] = "Bearer #{ENV.fetch('COMETAPI_KEY')}"
request["Content-Type"] = 'application/json'
request.body = "{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}"

response = http.request(request)

# Anything other than a 2xx response is reported as an error instead of
# being saved as an .mp3 file.
abort("Request failed: #{response.code} #{response.body}") unless response.is_a?(Net::HTTPSuccess)

# The body is binary audio: write it in binary mode rather than printing it.
File.binwrite("output.mp3", response.body)

"<string>"

使用此端點可透過與 OpenAI 相容的音訊 API，將文字轉換為音訊檔案。它適合用於旁白、簡短語音提示、朗讀功能，以及其他你的應用程式已經有文字內容且需要語音輸出的工作流程。

First request

先從三個欄位開始：model、input 和 voice。請讓第一次請求保持簡短，以便在調整速度或輸出格式之前，先確認身分驗證、音訊格式與檔案處理都能正常運作。

Read the response

回應是二進位音訊，而非 JSON。在 SDK 範例中，請將回應寫入檔案，例如 output.mp3。直接使用 HTTP 用戶端時，請以二進位方式儲存回應主體（不要當成文字輸出），並讓副檔名與請求的 response_format 相符，例如 response_format 為 wav 時存成 output.wav。

Next steps

當你需要將語音轉回文字時，請使用建立轉錄。
當你需要從非英文音訊取得英文文字時，請使用建立翻譯。

授權

Authorization

string

header

必填

Bearer token authentication. Use your CometAPI key.

主體

application/json

model

string

預設值:tts-1

必填

The TTS model to use. Choose a current speech model from the Models page.

input

string

必填

The text to generate audio for. Maximum length is 4096 characters.

Maximum string length: 4096

voice

enum<string>

預設值:alloy

必填

The voice to use for speech synthesis.

可用選項:

alloy,

ash,

ballad,

coral,

echo,

fable,

onyx,

nova,

sage,

shimmer

response_format

enum<string>

預設值:mp3

The audio output format.

可用選項:

mp3,

opus,

aac,

flac,

wav,

pcm

speed

number

預設值:1

The speed of the generated audio. Select a value between 0.25 and 4.0.

必填範圍: 0.25 <= x <= 4

回應

200 - audio/mpeg

The audio file content.

The response is of type file.

音訊 API

建立轉錄

Python

import os
from openai import OpenAI

# Point the OpenAI SDK at CometAPI's OpenAI-compatible endpoint; the key is
# read from the COMETAPI_KEY environment variable (KeyError if it is unset).
client = OpenAI(
    api_key=os.environ["COMETAPI_KEY"],
    base_url="https://api.cometapi.com/v1",
)

# The response body is binary audio, not JSON. with_streaming_response writes
# it to disk as it arrives and releases the HTTP connection when the block
# exits; calling stream_to_file() on a plain create() result is deprecated in
# the SDK because it does not actually stream.
with client.audio.speech.with_streaming_response.create(
    model="tts-1",
    voice="alloy",
    input="The quick brown fox jumped over the lazy dog.",
) as response:
    response.stream_to_file("output.mp3")

import OpenAI from "openai";
import fs from "fs";

// SDK client bound to CometAPI's OpenAI-compatible endpoint; the key is taken
// from the COMETAPI_KEY environment variable.
const openai = new OpenAI({
  apiKey: process.env.COMETAPI_KEY,
  baseURL: "https://api.cometapi.com/v1",
});

// The three fields used for a first request.
const speechRequest = {
  model: "tts-1",
  voice: "alloy",
  input: "The quick brown fox jumped over the lazy dog.",
};

const speech = await openai.audio.speech.create(speechRequest);

// The body is binary audio: collect the bytes, then write them to disk.
const audioBytes = await speech.arrayBuffer();
fs.writeFileSync("output.mp3", Buffer.from(audioBytes));

# Request speech for one sentence and save the binary response as output.mp3.
curl --request POST \
  --url https://api.cometapi.com/v1/audio/speech \
  --header "Authorization: Bearer $COMETAPI_KEY" \
  --header "Content-Type: application/json" \
  --output output.mp3 \
  --data '{
    "model": "tts-1",
    "input": "The quick brown fox jumped over the lazy dog.",
    "voice": "alloy"
  }'

<?php

// Read the key from the environment, like the SDK and curl samples, instead
// of sending a hard-coded placeholder token.
$apiKey = getenv('COMETAPI_KEY');
if ($apiKey === false || $apiKey === '') {
  fwrite(STDERR, "COMETAPI_KEY is not set\n");
  exit(1);
}

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.cometapi.com/v1/audio/speech",
  // Return the body from curl_exec() so it can be saved to a file below.
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'model' => 'tts-1',
    'input' => 'The quick brown fox jumped over the lazy dog.',
    'voice' => 'alloy'
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer " . $apiKey,
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);
$status = curl_getinfo($curl, CURLINFO_HTTP_CODE);

curl_close($curl);

if ($response === false) {
  // Transport-level failure (DNS, TLS, timeout, ...).
  fwrite(STDERR, "cURL Error #:" . $err . "\n");
  exit(1);
}

if ($status !== 200) {
  // Only a 200 response is documented to carry audio; show anything else as
  // an error instead of saving it as an .mp3 file.
  fwrite(STDERR, "Request failed with HTTP " . $status . ": " . $response . "\n");
  exit(1);
}

// The body is binary audio, so write it to a file rather than echoing it.
if (file_put_contents("output.mp3", $response) === false) {
  fwrite(STDERR, "Could not write output.mp3\n");
  exit(1);
}

package main

import (
	"fmt"
	"io"
	"net/http"
	"os"
	"strings"
)

// run sends the text-to-speech request and saves the returned audio to
// output.mp3. It returns an error instead of exiting so that deferred
// cleanup (closing the response body and the file) always runs.
func run() error {
	url := "https://api.cometapi.com/v1/audio/speech"

	payload := strings.NewReader("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		return fmt.Errorf("build request: %w", err)
	}

	// Read the key from the environment, like the SDK and curl samples.
	req.Header.Add("Authorization", "Bearer "+os.Getenv("COMETAPI_KEY"))
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		return fmt.Errorf("send request: %w", err)
	}
	defer res.Body.Close()

	if res.StatusCode != http.StatusOK {
		// Only a 200 response is documented to carry audio; surface anything
		// else as an error rather than saving it as an .mp3 file.
		body, _ := io.ReadAll(res.Body)
		return fmt.Errorf("request failed: %s: %s", res.Status, body)
	}

	out, err := os.Create("output.mp3")
	if err != nil {
		return fmt.Errorf("create output file: %w", err)
	}
	defer out.Close()

	// The body is binary audio: copy the bytes to disk instead of printing
	// them as a string.
	if _, err := io.Copy(out, res.Body); err != nil {
		return fmt.Errorf("write audio: %w", err)
	}
	return nil
}

func main() {
	if err := run(); err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
}

HttpResponse<String> response = Unirest.post("https://api.cometapi.com/v1/audio/speech")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")
  .asString();

require 'uri'
require 'net/http'

url = URI("https://api.cometapi.com/v1/audio/speech")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
# Read the key from the environment, like the SDK and curl samples;
# ENV.fetch raises KeyError when COMETAPI_KEY is not set.
request["Authorization"] = "Bearer #{ENV.fetch('COMETAPI_KEY')}"
request["Content-Type"] = 'application/json'
request.body = "{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}"

response = http.request(request)

# Anything other than a 2xx response is reported as an error instead of
# being saved as an .mp3 file.
abort("Request failed: #{response.code} #{response.body}") unless response.is_a?(Net::HTTPSuccess)

# The body is binary audio: write it in binary mode rather than printing it.
File.binwrite("output.mp3", response.body)

"<string>"

內容審核

API 金鑰

First request

Read the response

Next steps

授權

主體

回應

First request

Read the response

Next steps

授權

主體

回應

First request

Read the response

Next steps