voicevoxcorego

package module

v0.0.5 Latest Latest Go to latest Published: Jun 30, 2023 License: MIT Imports: 5 Imported by: 0

Details

Valid go.mod file
Redistributable license
Tagged version
Stable version
Learn more about best practices

Repository

github.com/sh1ma/voicevoxcore.go

Links

Open Source Insights

README ¶

voicevoxcore.go

voicevoxcore.go は voicevox_core を Go 言語から利用するためのラッパーです。FFI を用いて voicevox_core の C API を呼び出しています。

例

以下は本ライブラリを使用して Text to Speech を行う例です。


//go:build ignore

package main

import (
	"fmt"
	"os"

	voicevoxcorego "github.com/sh1ma/voicevoxcore.go"
)

// main synthesizes speech for the text given as the first command-line
// argument and writes the resulting WAV bytes to out.wav.
//
// Every step that returns an error is checked; on failure the error is
// printed to standard error and the process exits with status 1, so a
// failed run never leaves behind an empty or partial out.wav written from
// an invalid result.
func main() {
	args := os.Args
	if len(args) < 2 {
		fmt.Println("usage:\n\tgo run tts.go [ text ]")
		os.Exit(127)
	}
	text := args[1]

	// Untyped constant so it fits both LoadModel (uint) and Tts (int).
	const speakerID = 1

	// New is the constructor exported by the package as of v0.0.5.
	core := voicevoxcorego.New()
	initializeOptions := voicevoxcorego.NewVoicevoxInitializeOptions(0, 0, false, "./open_jtalk_dic_utf_8-1.11")
	exitOnError(core.Initialize(initializeOptions))

	exitOnError(core.LoadModel(speakerID))

	ttsOptions := voicevoxcorego.NewVoicevoxTtsOptions(false, true)
	result, err := core.Tts(text, speakerID, ttsOptions)
	exitOnError(err)

	// os.WriteFile creates/truncates the file, writes the data and closes the
	// handle, reporting any error from those steps. 0o666 matches the
	// permission bits os.Create would have used.
	exitOnError(os.WriteFile("out.wav", result, 0o666))
}

// exitOnError prints err to standard error and terminates the process with
// status 1. It does nothing when err is nil.
func exitOnError(err error) {
	if err == nil {
		return
	}
	fmt.Fprintln(os.Stderr, err)
	os.Exit(1)
}

Documentation ¶

Index ¶

type AccentPharase
type AudioQuery
- func NewAudioQueryFromJson(queryJson []byte) (*AudioQuery, error)
- func (q *AudioQuery) ToJson() ([]byte, error)
- func (q *AudioQuery) ToJsonString() (string, error)
type Mora
type RawVoicevoxCore
type VoicevoxAudioQueryOptions
- func NewVoicevoxAudioQueryOptions(kana bool) *VoicevoxAudioQueryOptions
- func (o *VoicevoxAudioQueryOptions) UpdateKana(kana bool)
type VoicevoxCore
- func New() (core *VoicevoxCore)
- func (r *VoicevoxCore) AudioQuery(text string, speakerID uint, options *VoicevoxAudioQueryOptions) (*AudioQuery, error)
- func (r *VoicevoxCore) Decode(speakerID uint, phonemeSize int, f0 []float32, phonemeVector []float32) ([]float32, error)
- func (r *VoicevoxCore) ErrorResultToMessage(resultCode int) string
- func (r *VoicevoxCore) Finalize()
- func (r *VoicevoxCore) GetCoreVersion() string
- func (r *VoicevoxCore) GetMetasJson() string
- func (r *VoicevoxCore) GetSupportedDevicesJson() string
- func (r *VoicevoxCore) Initialize(options *VoicevoxInitializeOptions) error
- func (r *VoicevoxCore) IsGpuMode() bool
- func (r *VoicevoxCore) IsModelLoaded(speakerID uint) bool
- func (r *VoicevoxCore) LoadModel(speakerID uint) error
- func (r *VoicevoxCore) MakeDefaultAudioQueryOotions() *VoicevoxAudioQueryOptions
- func (r *VoicevoxCore) MakeDefaultInitializeOptions() *VoicevoxInitializeOptions
- func (r *VoicevoxCore) MakeDefaultSynthesisOotions() *VoicevoxSynthesisOptions
- func (r *VoicevoxCore) MakeDefaultTtsOotions() *VoicevoxTtsOptions
- func (r *VoicevoxCore) PredictDuration(speakerID int, phonemeVector []int64) ([]float32, error)
- func (r *VoicevoxCore) PredictIntonation(speakerID int, vowelPhonemeVector, consonantPhonemeVector []int64, ...) ([]float32, error)
- func (r *VoicevoxCore) Synthesis(audioQuery *AudioQuery, speakerID int, options *VoicevoxSynthesisOptions) ([]byte, error)
- func (r *VoicevoxCore) Tts(text string, speakerID int, options *VoicevoxTtsOptions) ([]byte, error)
type VoicevoxInitializeOptions
- func NewVoicevoxInitializeOptions(accelerationMode int, cpuNumThreads int, loadAllModels bool, ...) *VoicevoxInitializeOptions
- func (o *VoicevoxInitializeOptions) UpdateAccelerationMode(accelerationMode int)
- func (o *VoicevoxInitializeOptions) UpdateCpuNumThreads(cpuNumThreads int)
- func (o *VoicevoxInitializeOptions) UpdateLoadAllModels(loadAllModels bool)
- func (o *VoicevoxInitializeOptions) UpdateOpenJtalkDictDir(openJtalkDictDir string)
type VoicevoxSynthesisOptions
- func NewVoicevoxSynthesisOptions(enableInterrogativeUpspeak bool) *VoicevoxSynthesisOptions
- func (o *VoicevoxSynthesisOptions) UpdateInterrogativeUpspeak(kana bool)
type VoicevoxTtsOptions
- func NewVoicevoxTtsOptions(kana bool, enableInterrogativeUpspeak bool) *VoicevoxTtsOptions
- func (o *VoicevoxTtsOptions) UpdateInterrogativeUpspeak(kana bool)
- func (o *VoicevoxTtsOptions) UpdateKana(kana bool)

Constants ¶

This section is empty.

Variables ¶

This section is empty.

Functions ¶

This section is empty.

Types ¶

type AccentPharase ¶ added in v0.0.2

// AccentPharase represents an accent phrase.
type AccentPharase struct {
	// Moras holds the array of moras.
	Moras           []Mora `json:"moras"`
	// Accent is the accent position.
	Accent          uint32 `json:"accent"`
	// PauseMora is the pause mora.
	// NOTE(review): if this struct is marshaled with encoding/json, omitempty
	// has no effect on a non-pointer struct field, so "pause_mora" would always
	// be emitted — confirm this is intended.
	PauseMora       Mora   `json:"pause_mora,omitempty"`
	// IsInterrogative indicates whether this is an interrogative (question).
	IsInterrogative bool   `json:"is_interrogative"`
}

アクセント句を表す構造体

`moras`にはモーラの配列を格納する。

`accent`はアクセント位置を表す。

`pause_mora`はポーズのモーラを表す。

`is_interrogative`は疑問文かどうかを表す。

type AudioQuery ¶ added in v0.0.2

// AudioQuery represents an audio query.
type AudioQuery struct {
	// AccentPharases holds the array of accent phrases.
	AccentPharases     []AccentPharase `json:"accent_phrases"`
	// SpeedScale is the speech speed multiplier.
	SpeedScale         float32         `json:"speed_scale"`
	// PitchScale is the pitch multiplier.
	PitchScale         float32         `json:"pitch_scale"`
	// IntonationScale is the intonation multiplier.
	IntonationScale    float32         `json:"intonation_scale"`
	// VolumeScale is the volume multiplier.
	VolumeScale        float32         `json:"volume_scale"`
	// PrePhonemeLength is the length of silence before speech starts.
	PrePhonemeLength   float32         `json:"pre_phoneme_length"`
	// PostPhonemeLength is the length of silence after speech ends.
	PostPhonemeLength  float32         `json:"post_phoneme_length"`
	// OutputSamplingRate is the sampling rate of the output audio.
	OutputSamplingRate float32         `json:"output_sampling_rate"`
	// OutputStereo indicates whether the output audio is stereo.
	OutputStereo       bool            `json:"output_stereo"`
	// Kana is the reading (kana) of the text.
	Kana               string          `json:"kana"`
}

オーディオクエリを表す構造体

`accent_phrases`にはアクセント句の配列を格納する。

`speed_scale`は発話速度の倍率を表す。

`pitch_scale`は音高の倍率を表す。

`intonation_scale`はイントネーションの倍率を表す。

`volume_scale`は音量の倍率を表す。

`pre_phoneme_length`は発声開始前の無音の長さを表す。

`post_phoneme_length`は発声終了後の無音の長さを表す。

`output_sampling_rate`は出力音声のサンプリングレートを表す。

`output_stereo`は出力音声がステレオかどうかを表す。

`kana`は読み仮名を表す。

func NewAudioQueryFromJson ¶ added in v0.0.3

func NewAudioQueryFromJson(queryJson []byte) (*AudioQuery, error)

Jsonのバイト列からAudioQuery構造体を生成する

func (*AudioQuery) ToJson ¶ added in v0.0.3

func (q *AudioQuery) ToJson() ([]byte, error)

AudioQuery構造体をJsonのバイト列に変換する

func (*AudioQuery) ToJsonString ¶ added in v0.0.3

func (q *AudioQuery) ToJsonString() (string, error)

AudioQuery構造体をJson文字列に変換する

type Mora ¶ added in v0.0.2

// Mora represents a mora.
type Mora struct {
	// Text is the string of the mora.
	Text            string  `json:"text"`
	// Consonant is the consonant.
	Consonant       string  `json:"consonant,omitempty"`
	// ConsonantLength is the length of the consonant.
	ConsonantLength float32 `json:"consonant_length,omitempty"`
	// Vowel is the vowel.
	Vowel           string  `json:"vowel"`
	// VowelLength is the length of the vowel.
	VowelLength     float32 `json:"vowel_length"`
	// Pitch is the pitch.
	Pitch           float32 `json:"pitch"`
}

モーラを表す構造体

`text`はモーラの文字列を表す。

`consonant`は子音を表す。

`consonant_length`は子音の長さを表す。

`vowel`は母音を表す。

`vowel_length`は母音の長さを表す。

`pitch`は音高を表す。

type RawVoicevoxCore ¶

type RawVoicevoxCore struct{}

RawVoicevoxCore is a function group that wraps the C API

type VoicevoxAudioQueryOptions ¶

type VoicevoxAudioQueryOptions struct {
	// contains filtered or unexported fields
}

`AudioQuery()`を実行する際のオプションを表す構造体

func NewVoicevoxAudioQueryOptions ¶

func NewVoicevoxAudioQueryOptions(kana bool) *VoicevoxAudioQueryOptions

`AudioQuery()`の初期化オプションを生成する関数

func (*VoicevoxAudioQueryOptions) UpdateKana ¶ added in v0.0.4

func (o *VoicevoxAudioQueryOptions) UpdateKana(kana bool)

`AudioQuery()`のオプションの`kana`をアップデートする関数

type VoicevoxCore ¶

type VoicevoxCore struct {
	*RawVoicevoxCore
	// contains filtered or unexported fields
}

VoicevoxCore is top-level API Wrapper instance

func New ¶ added in v0.0.5

func New() (core *VoicevoxCore)

VoicevoxCore のコンストラクタ関数

func (*VoicevoxCore) AudioQuery ¶

func (r *VoicevoxCore) AudioQuery(text string, speakerID uint, options *VoicevoxAudioQueryOptions) (*AudioQuery, error)

オーディオクエリを発行する

func (*VoicevoxCore) Decode ¶

func (r *VoicevoxCore) Decode(speakerID uint, phonemeSize int, f0 []float32, phonemeVector []float32) ([]float32, error)

phonemeVectorを元にデコードする

func (*VoicevoxCore) ErrorResultToMessage ¶

func (r *VoicevoxCore) ErrorResultToMessage(resultCode int) string

ErrorResultCode をメッセージに変換する

func (*VoicevoxCore) Finalize ¶

func (r *VoicevoxCore) Finalize()

ファイナライズ

func (*VoicevoxCore) GetCoreVersion ¶

func (r *VoicevoxCore) GetCoreVersion() string

Coreのバージョンを取得する

func (*VoicevoxCore) GetMetasJson ¶

func (r *VoicevoxCore) GetMetasJson() string

メタ情報のjsonを取得する

func (*VoicevoxCore) GetSupportedDevicesJson ¶

func (r *VoicevoxCore) GetSupportedDevicesJson() string

サポートしているデバイス一覧のjsonを取得する

func (*VoicevoxCore) Initialize ¶

func (r *VoicevoxCore) Initialize(options *VoicevoxInitializeOptions) error

C APIを通じてVoicevox_coreを初期化する関数

func (*VoicevoxCore) IsGpuMode ¶

func (r *VoicevoxCore) IsGpuMode() bool

Gpuモードが有効になっているか確認する

func (*VoicevoxCore) IsModelLoaded ¶

func (r *VoicevoxCore) IsModelLoaded(speakerID uint) bool

モデルがロードされているか確認する

func (*VoicevoxCore) LoadModel ¶

func (r *VoicevoxCore) LoadModel(speakerID uint) error

音声合成モデルをロードする関数

func (*VoicevoxCore) MakeDefaultAudioQueryOotions ¶

func (r *VoicevoxCore) MakeDefaultAudioQueryOotions() *VoicevoxAudioQueryOptions

`AudioQuery()` のデフォルトオプションを生成する

func (*VoicevoxCore) MakeDefaultInitializeOptions ¶

func (r *VoicevoxCore) MakeDefaultInitializeOptions() *VoicevoxInitializeOptions

`Initialize()` のデフォルトオプションを生成する

func (*VoicevoxCore) MakeDefaultSynthesisOotions ¶

func (r *VoicevoxCore) MakeDefaultSynthesisOotions() *VoicevoxSynthesisOptions

`Synthesis()` のデフォルトオプションを生成する

func (*VoicevoxCore) MakeDefaultTtsOotions ¶

func (r *VoicevoxCore) MakeDefaultTtsOotions() *VoicevoxTtsOptions

`Tts()` のデフォルトオプションを生成する

func (*VoicevoxCore) PredictDuration ¶

func (r *VoicevoxCore) PredictDuration(speakerID int, phonemeVector []int64) ([]float32, error)

音素長を取得

func (*VoicevoxCore) PredictIntonation ¶

func (r *VoicevoxCore) PredictIntonation(
	speakerID int,
	vowelPhonemeVector, consonantPhonemeVector []int64,
	startAccentVector, endAccentVector []int64,
	startAccentPhraseVector, endAccentPhraseVector []int64,
) ([]float32, error)

モーラごとのF0を推論する

func (*VoicevoxCore) Synthesis ¶

func (r *VoicevoxCore) Synthesis(
	audioQuery *AudioQuery,
	speakerID int,
	options *VoicevoxSynthesisOptions,
) ([]byte, error)

Audio Queryを基に音声合成を実行する関数。実行結果はwavファイルフォーマットのバイト列。

Sample: https://github.com/sh1ma/sample-synthesis

func (*VoicevoxCore) Tts ¶

func (r *VoicevoxCore) Tts(text string, speakerID int, options *VoicevoxTtsOptions) ([]byte, error)

Text to Speechを実行する関数。実行結果はwavファイルフォーマットのバイト列。

Sample: https://github.com/sh1ma/sample-tts

type VoicevoxInitializeOptions ¶

type VoicevoxInitializeOptions struct {
	// contains filtered or unexported fields
}

`VoicevoxCore`を初期化する際のオプションを表す構造体

func NewVoicevoxInitializeOptions ¶

func NewVoicevoxInitializeOptions(accelerationMode int, cpuNumThreads int, loadAllModels bool, openJtalkDictDir string) *VoicevoxInitializeOptions

`VoicevoxCore`の初期化オプションを生成する関数

func (*VoicevoxInitializeOptions) UpdateAccelerationMode ¶ added in v0.0.4

func (o *VoicevoxInitializeOptions) UpdateAccelerationMode(accelerationMode int)

初期化オプションの`accelerationMode`をアップデートする関数

func (*VoicevoxInitializeOptions) UpdateCpuNumThreads ¶ added in v0.0.4

func (o *VoicevoxInitializeOptions) UpdateCpuNumThreads(cpuNumThreads int)

初期化オプションの`cpuNumThreads`をアップデートする関数

func (*VoicevoxInitializeOptions) UpdateLoadAllModels ¶ added in v0.0.4

func (o *VoicevoxInitializeOptions) UpdateLoadAllModels(loadAllModels bool)

初期化オプションの`loadAllModels`をアップデートする関数

func (*VoicevoxInitializeOptions) UpdateOpenJtalkDictDir ¶ added in v0.0.4

func (o *VoicevoxInitializeOptions) UpdateOpenJtalkDictDir(openJtalkDictDir string)

初期化オプションの`openJtalkDictDir`をアップデートする関数

type VoicevoxSynthesisOptions ¶

type VoicevoxSynthesisOptions struct {
	// contains filtered or unexported fields
}

`Synthesis()`を実行する際のオプションを表す構造体

func NewVoicevoxSynthesisOptions ¶

func NewVoicevoxSynthesisOptions(enableInterrogativeUpspeak bool) *VoicevoxSynthesisOptions

`Synthesis()`の初期化オプションを生成する関数

func (*VoicevoxSynthesisOptions) UpdateInterrogativeUpspeak ¶ added in v0.0.4

func (o *VoicevoxSynthesisOptions) UpdateInterrogativeUpspeak(kana bool)

`Synthesis()`のオプションの`enableInterrogativeUpspeak`をアップデートする関数

type VoicevoxTtsOptions ¶

type VoicevoxTtsOptions struct {
	// contains filtered or unexported fields
}

`Tts()`を実行する際のオプションを表す構造体

func NewVoicevoxTtsOptions ¶

func NewVoicevoxTtsOptions(kana bool, enableInterrogativeUpspeak bool) *VoicevoxTtsOptions

`Tts()`の初期化オプションを生成する関数

func (*VoicevoxTtsOptions) UpdateInterrogativeUpspeak ¶ added in v0.0.4

func (o *VoicevoxTtsOptions) UpdateInterrogativeUpspeak(kana bool)

`Tts()`のオプションの`enableInterrogativeUpspeak`をアップデートする関数

func (*VoicevoxTtsOptions) UpdateKana ¶ added in v0.0.4

func (o *VoicevoxTtsOptions) UpdateKana(kana bool)

`Tts()`のオプションの`kana`をアップデートする関数

Source Files ¶

View all Source files

Directories ¶

Path	Synopsis
examples
text-to-phoneme_id
scripts
resolve-phonemeid

?	: This menu
/	: Search site
f or F	: Jump to
y or Y	: Canonical URL

README ¶

voicevoxcore.go

例

おすすめの環境構築方法 (Linux / MacOS)

1. voicevox_core のダウンロード

2. voicevox_core を配置する

3. シンボリックリンクを張る

Documentation ¶

Index ¶

Constants ¶

Variables ¶

Functions ¶

Types ¶

type AccentPharase ¶ added in v0.0.2

type AudioQuery ¶ added in v0.0.2

func NewAudioQueryFromJson ¶ added in v0.0.3

func (*AudioQuery) ToJson ¶ added in v0.0.3

func (*AudioQuery) ToJsonString ¶ added in v0.0.3

type Mora ¶ added in v0.0.2

type RawVoicevoxCore ¶

type VoicevoxAudioQueryOptions ¶

func NewVoicevoxAudioQueryOptions ¶

func (*VoicevoxAudioQueryOptions) UpdateKana ¶ added in v0.0.4

type VoicevoxCore ¶

func New ¶ added in v0.0.5

func (*VoicevoxCore) AudioQuery ¶

func (*VoicevoxCore) Decode ¶

func (*VoicevoxCore) ErrorResultToMessage ¶

func (*VoicevoxCore) Finalize ¶

func (*VoicevoxCore) GetCoreVersion ¶

func (*VoicevoxCore) GetMetasJson ¶

func (*VoicevoxCore) GetSupportedDevicesJson ¶

func (*VoicevoxCore) Initialize ¶

func (*VoicevoxCore) IsGpuMode ¶

func (*VoicevoxCore) IsModelLoaded ¶

func (*VoicevoxCore) LoadModel ¶

func (*VoicevoxCore) MakeDefaultAudioQueryOotions ¶

func (*VoicevoxCore) MakeDefaultInitializeOptions ¶

func (*VoicevoxCore) MakeDefaultSynthesisOotions ¶

func (*VoicevoxCore) MakeDefaultTtsOotions ¶

func (*VoicevoxCore) PredictDuration ¶

func (*VoicevoxCore) PredictIntonation ¶

func (*VoicevoxCore) Synthesis ¶

func (*VoicevoxCore) Tts ¶

type VoicevoxInitializeOptions ¶

func NewVoicevoxInitializeOptions ¶

func (*VoicevoxInitializeOptions) UpdateAccelerationMode ¶ added in v0.0.4

func (*VoicevoxInitializeOptions) UpdateCpuNumThreads ¶ added in v0.0.4

func (*VoicevoxInitializeOptions) UpdateLoadAllModels ¶ added in v0.0.4

func (*VoicevoxInitializeOptions) UpdateOpenJtalkDictDir ¶ added in v0.0.4

type VoicevoxSynthesisOptions ¶

func NewVoicevoxSynthesisOptions ¶

func (*VoicevoxSynthesisOptions) UpdateInterrogativeUpspeak ¶ added in v0.0.4

type VoicevoxTtsOptions ¶

func NewVoicevoxTtsOptions ¶

func (*VoicevoxTtsOptions) UpdateInterrogativeUpspeak ¶ added in v0.0.4

func (*VoicevoxTtsOptions) UpdateKana ¶ added in v0.0.4

Source Files ¶

Directories ¶