音声生成

POST

audio

speech

Python

import os
from openai import OpenAI

# Read the key from the environment so it never lands in source control.
client = OpenAI(
    api_key=os.environ["COMETAPI_KEY"],
    base_url="https://api.cometapi.com/v1",
)

# The endpoint returns binary audio, not JSON. Use the SDK's streaming-response
# helper so the bytes are written to disk as they arrive; calling
# stream_to_file() on the plain create() result is deprecated in openai-python.
with client.audio.speech.with_streaming_response.create(
    model="tts-1",
    voice="alloy",
    input="The quick brown fox jumped over the lazy dog.",
) as response:
    response.stream_to_file("output.mp3")

import OpenAI from "openai";
import fs from "fs";

const client = new OpenAI({
  apiKey: process.env.COMETAPI_KEY,
  baseURL: "https://api.cometapi.com/v1"
});

const response = await client.audio.speech.create({
  model: "tts-1",
  voice: "alloy",
  input: "The quick brown fox jumped over the lazy dog."
});

const buffer = Buffer.from(await response.arrayBuffer());
fs.writeFileSync("output.mp3", buffer);

# Request speech for a short sentence and save the binary audio to output.mp3.
curl --request POST \
  --url https://api.cometapi.com/v1/audio/speech \
  --header "Authorization: Bearer $COMETAPI_KEY" \
  --header "Content-Type: application/json" \
  --data '{
    "model": "tts-1",
    "input": "The quick brown fox jumped over the lazy dog.",
    "voice": "alloy"
  }' \
  --output output.mp3

<?php

// Send a text-to-speech request and save the returned audio to output.mp3.
// The endpoint answers with binary audio (not JSON), so the body is written
// to a file instead of being echoed.

// Read the key from the environment rather than hard-coding it.
$apiKey = getenv("COMETAPI_KEY");
if ($apiKey === false || $apiKey === "") {
  echo "COMETAPI_KEY is not set";
  exit(1);
}

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.cometapi.com/v1/audio/speech",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'model' => 'tts-1',
    'input' => 'The quick brown fox jumped over the lazy dog.',
    'voice' => 'alloy'
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer " . $apiKey,
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);
$status = curl_getinfo($curl, CURLINFO_RESPONSE_CODE);

curl_close($curl);

if ($response === false) {
  // Transport-level failure (DNS, TLS, timeout, ...).
  echo "cURL Error #:" . $err;
  exit(1);
}

if ($status !== 200) {
  // On failure the body is not audio, so it is safe to print it.
  echo "Request failed with HTTP " . $status . ": " . $response;
  exit(1);
}

// Success: the body is raw audio bytes.
if (file_put_contents("output.mp3", $response) === false) {
  echo "Could not write output.mp3";
  exit(1);
}

package main

import (
	"fmt"
	"io"
	"net/http"
	"os"
	"strings"
)

// main runs the text-to-speech example and exits non-zero on failure.
func main() {
	if err := run(); err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
}

// run posts a text-to-speech request and streams the binary audio response
// into output.mp3. It returns an error instead of ignoring failures, so a
// failed request can no longer cause a nil-pointer panic on res.Body.
func run() error {
	url := "https://api.cometapi.com/v1/audio/speech"

	payload := strings.NewReader("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		return fmt.Errorf("build request: %w", err)
	}

	// Read the key from the environment rather than hard-coding it.
	req.Header.Add("Authorization", "Bearer "+os.Getenv("COMETAPI_KEY"))
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		return fmt.Errorf("send request: %w", err)
	}
	defer res.Body.Close()

	if res.StatusCode != http.StatusOK {
		// On failure the body is not audio, so include it in the error.
		body, _ := io.ReadAll(res.Body)
		return fmt.Errorf("request failed: %s: %s", res.Status, body)
	}

	out, err := os.Create("output.mp3")
	if err != nil {
		return fmt.Errorf("create output file: %w", err)
	}
	defer out.Close()

	// The body is raw audio bytes; copy it to disk rather than printing it.
	if _, err := io.Copy(out, res.Body); err != nil {
		return fmt.Errorf("write audio: %w", err)
	}
	return nil
}

HttpResponse<String> response = Unirest.post("https://api.cometapi.com/v1/audio/speech")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")
  .asString();

require 'uri'
require 'net/http'

# Send a text-to-speech request and save the returned audio to output.mp3.
url = URI("https://api.cometapi.com/v1/audio/speech")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
# Read the key from the environment; ENV.fetch raises KeyError if it is unset.
request["Authorization"] = "Bearer #{ENV.fetch('COMETAPI_KEY')}"
request["Content-Type"] = 'application/json'
request.body = "{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}"

response = http.request(request)

if response.is_a?(Net::HTTPSuccess)
  # The body is raw audio bytes, so write it in binary mode instead of printing it.
  File.binwrite("output.mp3", response.read_body)
else
  # On failure the body is not audio, so it is safe to show it.
  abort "Request failed: #{response.code} #{response.message}\n#{response.read_body}"
end

"<string>"

このエンドポイントを使用すると、OpenAI 互換の音声 API を通じてテキストを音声ファイルに変換できます。ナレーション、短い音声プロンプト、読み上げ機能、その他、アプリにすでにテキストがあり音声出力が必要なワークフローに適しています。

First request

まずは model、input、voice の 3 つのフィールドから始めます。speed や出力形式を調整する前に、最初のリクエストは短くして、認証、音声形式、ファイル処理を確認できるようにしてください。

Read the response

レスポンスは JSON ではなくバイナリ音声です。SDK の例では、レスポンスを output.mp3 のようなファイルに書き込みます。直接 HTTP クライアントを使う場合は、レスポンスボディを保存し、要求した response_format に合わせてファイル拡張子を設定してください。

Next steps

音声を再びテキストに変換する必要がある場合は、文字起こしを使用します。
英語以外の音声から英語テキストが必要な場合は、翻訳を使用します。

認証

Authorization

string

header

必須

Bearer token authentication. Use your CometAPI key.

ボディ

application/json

model

string

デフォルト:tts-1

必須

The TTS model to use. Choose a current speech model from the Models page.

input

string

必須

The text to generate audio for. Maximum length is 4096 characters.

Maximum string length: 4096

voice

enum<string>

デフォルト:alloy

必須

The voice to use for speech synthesis.

利用可能なオプション:

alloy,

ash,

ballad,

coral,

echo,

fable,

onyx,

nova,

sage,

shimmer

response_format

enum<string>

デフォルト:mp3

The audio output format.

利用可能なオプション:

mp3,

opus,

aac,

flac,

wav,

pcm

speed

number

デフォルト:1

The speed of the generated audio. Select a value between 0.25 and 4.0.

必須範囲: 0.25 <= x <= 4

レスポンス

200 - audio/mpeg

The audio file content.

The response is of type file.

音声 API

文字起こし

Python

import os
from openai import OpenAI

# Read the key from the environment so it never lands in source control.
client = OpenAI(
    api_key=os.environ["COMETAPI_KEY"],
    base_url="https://api.cometapi.com/v1",
)

# The endpoint returns binary audio, not JSON. Use the SDK's streaming-response
# helper so the bytes are written to disk as they arrive; calling
# stream_to_file() on the plain create() result is deprecated in openai-python.
with client.audio.speech.with_streaming_response.create(
    model="tts-1",
    voice="alloy",
    input="The quick brown fox jumped over the lazy dog.",
) as response:
    response.stream_to_file("output.mp3")

import OpenAI from "openai";
import fs from "fs";

const client = new OpenAI({
  apiKey: process.env.COMETAPI_KEY,
  baseURL: "https://api.cometapi.com/v1"
});

const response = await client.audio.speech.create({
  model: "tts-1",
  voice: "alloy",
  input: "The quick brown fox jumped over the lazy dog."
});

const buffer = Buffer.from(await response.arrayBuffer());
fs.writeFileSync("output.mp3", buffer);

# Request speech for a short sentence and save the binary audio to output.mp3.
curl --request POST \
  --url https://api.cometapi.com/v1/audio/speech \
  --header "Authorization: Bearer $COMETAPI_KEY" \
  --header "Content-Type: application/json" \
  --data '{
    "model": "tts-1",
    "input": "The quick brown fox jumped over the lazy dog.",
    "voice": "alloy"
  }' \
  --output output.mp3

<?php

// Send a text-to-speech request and save the returned audio to output.mp3.
// The endpoint answers with binary audio (not JSON), so the body is written
// to a file instead of being echoed.

// Read the key from the environment rather than hard-coding it.
$apiKey = getenv("COMETAPI_KEY");
if ($apiKey === false || $apiKey === "") {
  echo "COMETAPI_KEY is not set";
  exit(1);
}

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.cometapi.com/v1/audio/speech",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode([
    'model' => 'tts-1',
    'input' => 'The quick brown fox jumped over the lazy dog.',
    'voice' => 'alloy'
  ]),
  CURLOPT_HTTPHEADER => [
    "Authorization: Bearer " . $apiKey,
    "Content-Type: application/json"
  ],
]);

$response = curl_exec($curl);
$err = curl_error($curl);
$status = curl_getinfo($curl, CURLINFO_RESPONSE_CODE);

curl_close($curl);

if ($response === false) {
  // Transport-level failure (DNS, TLS, timeout, ...).
  echo "cURL Error #:" . $err;
  exit(1);
}

if ($status !== 200) {
  // On failure the body is not audio, so it is safe to print it.
  echo "Request failed with HTTP " . $status . ": " . $response;
  exit(1);
}

// Success: the body is raw audio bytes.
if (file_put_contents("output.mp3", $response) === false) {
  echo "Could not write output.mp3";
  exit(1);
}

package main

import (
	"fmt"
	"io"
	"net/http"
	"os"
	"strings"
)

// main runs the text-to-speech example and exits non-zero on failure.
func main() {
	if err := run(); err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
}

// run posts a text-to-speech request and streams the binary audio response
// into output.mp3. It returns an error instead of ignoring failures, so a
// failed request can no longer cause a nil-pointer panic on res.Body.
func run() error {
	url := "https://api.cometapi.com/v1/audio/speech"

	payload := strings.NewReader("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		return fmt.Errorf("build request: %w", err)
	}

	// Read the key from the environment rather than hard-coding it.
	req.Header.Add("Authorization", "Bearer "+os.Getenv("COMETAPI_KEY"))
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		return fmt.Errorf("send request: %w", err)
	}
	defer res.Body.Close()

	if res.StatusCode != http.StatusOK {
		// On failure the body is not audio, so include it in the error.
		body, _ := io.ReadAll(res.Body)
		return fmt.Errorf("request failed: %s: %s", res.Status, body)
	}

	out, err := os.Create("output.mp3")
	if err != nil {
		return fmt.Errorf("create output file: %w", err)
	}
	defer out.Close()

	// The body is raw audio bytes; copy it to disk rather than printing it.
	if _, err := io.Copy(out, res.Body); err != nil {
		return fmt.Errorf("write audio: %w", err)
	}
	return nil
}

HttpResponse<String> response = Unirest.post("https://api.cometapi.com/v1/audio/speech")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}")
  .asString();

require 'uri'
require 'net/http'

# Send a text-to-speech request and save the returned audio to output.mp3.
url = URI("https://api.cometapi.com/v1/audio/speech")

http = Net::HTTP.new(url.host, url.port)
http.use_ssl = true

request = Net::HTTP::Post.new(url)
# Read the key from the environment; ENV.fetch raises KeyError if it is unset.
request["Authorization"] = "Bearer #{ENV.fetch('COMETAPI_KEY')}"
request["Content-Type"] = 'application/json'
request.body = "{\n  \"model\": \"tts-1\",\n  \"input\": \"The quick brown fox jumped over the lazy dog.\",\n  \"voice\": \"alloy\"\n}"

response = http.request(request)

if response.is_a?(Net::HTTPSuccess)
  # The body is raw audio bytes, so write it in binary mode instead of printing it.
  File.binwrite("output.mp3", response.read_body)
else
  # On failure the body is not audio, so it is safe to show it.
  abort "Request failed: #{response.code} #{response.message}\n#{response.read_body}"
end

"<string>"

コンテンツモデレーション

APIキー

First request

Read the response

Next steps

認証

ボディ

レスポンス

First request

Read the response

Next steps

認証

ボディ

レスポンス

First request

Read the response

Next steps