voicevoxcorego

package module

v0.0.5 Latest Latest Go to latest Published: Jun 30, 2023 License: MIT Imports: 5 Imported by: 0

Details

Valid go.mod file

The Go module system was introduced in Go 1.11 and is the official dependency management solution for Go.
Redistributable license

Redistributable licenses place minimal restrictions on how software can be used, modified, and redistributed.
Tagged version

Modules with tagged versions give importers more predictable builds.
Stable version

When a project reaches major version v1 it is considered stable.
Learn more about best practices

Repository

github.com/sh1ma/voicevoxcore.go

Links

Open Source Insights

README ¶

voicevoxcore.go

voicevoxcore.go は voicevox_core を Go 言語から使うためのラッパーです。FFI を用いて voicevox_core の C API を呼び出しています。

例

以下は本ライブラリを使用して Text to Speech を行う例です。


//go:build ignore

package main

import (
	"fmt"
	"os"

	voicevoxcorego "github.com/sh1ma/voicevoxcore.go"
)

// main synthesizes the text given as the first command-line argument and
// writes the resulting WAV data to out.wav in the current directory.
func main() {
	if len(os.Args) < 2 {
		fmt.Println("usage:\n\tgo run tts.go [ text ]")
		os.Exit(127)
	}

	if err := run(os.Args[1]); err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
}

// run performs the text-to-speech pipeline for text: it initializes the core,
// loads the model for speaker 1, runs Tts and stores the result in out.wav.
// It returns the first error encountered, so a failure at any step never
// produces an empty or partial out.wav.
func run(text string) error {
	// New is the constructor exposed by the package as of v0.0.5.
	core := voicevoxcorego.New()

	initializeOptions := voicevoxcorego.NewVoicevoxInitializeOptions(0, 0, false, "./open_jtalk_dic_utf_8-1.11")
	if err := core.Initialize(initializeOptions); err != nil {
		return fmt.Errorf("initializing voicevox_core: %w", err)
	}
	// NOTE(review): Finalize is assumed to release what Initialize set up — confirm.
	defer core.Finalize()

	if err := core.LoadModel(1); err != nil {
		return fmt.Errorf("loading model for speaker 1: %w", err)
	}

	ttsOptions := voicevoxcorego.NewVoicevoxTtsOptions(false, true)
	result, err := core.Tts(text, 1, ttsOptions)
	if err != nil {
		return fmt.Errorf("running tts: %w", err)
	}

	// os.WriteFile creates, writes and closes the file in one call, so the
	// file handle cannot leak and creation errors are not ignored.
	if err := os.WriteFile("out.wav", result, 0o644); err != nil {
		return fmt.Errorf("writing out.wav: %w", err)
	}
	return nil
}

Documentation ¶

Index ¶

type AccentPharase
type AudioQuery
- func NewAudioQueryFromJson(queryJson []byte) (*AudioQuery, error)
- func (q *AudioQuery) ToJson() ([]byte, error)
- func (q *AudioQuery) ToJsonString() (string, error)
type Mora
type RawVoicevoxCore
type VoicevoxAudioQueryOptions
- func NewVoicevoxAudioQueryOptions(kana bool) *VoicevoxAudioQueryOptions
- func (o *VoicevoxAudioQueryOptions) UpdateKana(kana bool)
type VoicevoxCore
- func New() (core *VoicevoxCore)
- func (r *VoicevoxCore) AudioQuery(text string, speakerID uint, options *VoicevoxAudioQueryOptions) (*AudioQuery, error)
- func (r *VoicevoxCore) Decode(speakerID uint, phonemeSize int, f0 []float32, phonemeVector []float32) ([]float32, error)
- func (r *VoicevoxCore) ErrorResultToMessage(resultCode int) string
- func (r *VoicevoxCore) Finalize()
- func (r *VoicevoxCore) GetCoreVersion() string
- func (r *VoicevoxCore) GetMetasJson() string
- func (r *VoicevoxCore) GetSupportedDevicesJson() string
- func (r *VoicevoxCore) Initialize(options *VoicevoxInitializeOptions) error
- func (r *VoicevoxCore) IsGpuMode() bool
- func (r *VoicevoxCore) IsModelLoaded(speakerID uint) bool
- func (r *VoicevoxCore) LoadModel(speakerID uint) error
- func (r *VoicevoxCore) MakeDefaultAudioQueryOotions() *VoicevoxAudioQueryOptions
- func (r *VoicevoxCore) MakeDefaultInitializeOptions() *VoicevoxInitializeOptions
- func (r *VoicevoxCore) MakeDefaultSynthesisOotions() *VoicevoxSynthesisOptions
- func (r *VoicevoxCore) MakeDefaultTtsOotions() *VoicevoxTtsOptions
- func (r *VoicevoxCore) PredictDuration(speakerID int, phonemeVector []int64) ([]float32, error)
- func (r *VoicevoxCore) PredictIntonation(speakerID int, vowelPhonemeVector, consonantPhonemeVector []int64, ...) ([]float32, error)
- func (r *VoicevoxCore) Synthesis(audioQuery *AudioQuery, speakerID int, options *VoicevoxSynthesisOptions) ([]byte, error)
- func (r *VoicevoxCore) Tts(text string, speakerID int, options *VoicevoxTtsOptions) ([]byte, error)
type VoicevoxInitializeOptions
- func NewVoicevoxInitializeOptions(accelerationMode int, cpuNumThreads int, loadAllModels bool, ...) *VoicevoxInitializeOptions
- func (o *VoicevoxInitializeOptions) UpdateAccelerationMode(accelerationMode int)
- func (o *VoicevoxInitializeOptions) UpdateCpuNumThreads(cpuNumThreads int)
- func (o *VoicevoxInitializeOptions) UpdateLoadAllModels(loadAllModels bool)
- func (o *VoicevoxInitializeOptions) UpdateOpenJtalkDictDir(openJtalkDictDir string)
type VoicevoxSynthesisOptions
- func NewVoicevoxSynthesisOptions(enableInterrogativeUpspeak bool) *VoicevoxSynthesisOptions
- func (o *VoicevoxSynthesisOptions) UpdateInterrogativeUpspeak(kana bool)
type VoicevoxTtsOptions
- func NewVoicevoxTtsOptions(kana bool, enableInterrogativeUpspeak bool) *VoicevoxTtsOptions
- func (o *VoicevoxTtsOptions) UpdateInterrogativeUpspeak(kana bool)
- func (o *VoicevoxTtsOptions) UpdateKana(kana bool)

Constants ¶

This section is empty.

Variables ¶

This section is empty.

Functions ¶

This section is empty.

Types ¶

type AccentPharase ¶ added in v0.0.2

// AccentPharase represents an accent phrase.
//
// Moras holds the array of moras (JSON key "moras").
// Accent is the accent position (JSON key "accent").
// PauseMora is the pause mora (JSON key "pause_mora").
// IsInterrogative tells whether the phrase is a question (JSON key
// "is_interrogative").
//
// NOTE(review): encoding/json does not treat a struct value as empty, so the
// omitempty option on PauseMora presumably never omits the field — confirm
// whether a pointer type was intended.
type AccentPharase struct {
	Moras           []Mora `json:"moras"`
	Accent          uint32 `json:"accent"`
	PauseMora       Mora   `json:"pause_mora,omitempty"`
	IsInterrogative bool   `json:"is_interrogative"`
}

アクセント句を表す構造体

`moras`にはモーラの配列を格納する。

`accent`はアクセント位置を表す。

`pause_mora`はポーズのモーラを表す。

`is_interrogative`は疑問文かどうかを表す。

type AudioQuery ¶ added in v0.0.2

// AudioQuery represents an audio query.
//
// AccentPharases holds the array of accent phrases (JSON key "accent_phrases").
// SpeedScale is the speech speed multiplier (JSON key "speed_scale").
// PitchScale is the pitch multiplier (JSON key "pitch_scale").
// IntonationScale is the intonation multiplier (JSON key "intonation_scale").
// VolumeScale is the volume multiplier (JSON key "volume_scale").
// PrePhonemeLength is the length of the silence before speech starts
// (JSON key "pre_phoneme_length").
// PostPhonemeLength is the length of the silence after speech ends
// (JSON key "post_phoneme_length").
// OutputSamplingRate is the sampling rate of the output audio
// (JSON key "output_sampling_rate").
// OutputStereo tells whether the output audio is stereo
// (JSON key "output_stereo").
// Kana is the kana reading (JSON key "kana").
type AudioQuery struct {
	AccentPharases     []AccentPharase `json:"accent_phrases"`
	SpeedScale         float32         `json:"speed_scale"`
	PitchScale         float32         `json:"pitch_scale"`
	IntonationScale    float32         `json:"intonation_scale"`
	VolumeScale        float32         `json:"volume_scale"`
	PrePhonemeLength   float32         `json:"pre_phoneme_length"`
	PostPhonemeLength  float32         `json:"post_phoneme_length"`
	OutputSamplingRate float32         `json:"output_sampling_rate"`
	OutputStereo       bool            `json:"output_stereo"`
	Kana               string          `json:"kana"`
}

オーディオクエリを表す構造体

`accent_phrases`にはアクセント句の配列を格納する。

`speed_scale`は発話速度の倍率を表す。

`pitch_scale`は音高の倍率を表す。

`intonation_scale`はイントネーションの倍率を表す。

`volume_scale`は音量の倍率を表す。

`pre_phoneme_length`は発声開始前の無音の長さを表す。

`post_phoneme_length`は発声終了後の無音の長さを表す。

`output_sampling_rate`は出力音声のサンプリングレートを表す。

`output_stereo`は出力音声がステレオかどうかを表す。

`kana`は読み仮名を表す。

func NewAudioQueryFromJson ¶ added in v0.0.3

func NewAudioQueryFromJson(queryJson []byte) (*AudioQuery, error)

Jsonのバイト列からAudioQuery構造体を生成する

func (*AudioQuery) ToJson ¶ added in v0.0.3

func (q *AudioQuery) ToJson() ([]byte, error)

AudioQuery構造体をJsonのバイト列に変換する

func (*AudioQuery) ToJsonString ¶ added in v0.0.3

func (q *AudioQuery) ToJsonString() (string, error)

AudioQuery構造体をJson文字列に変換する

type Mora ¶ added in v0.0.2

// Mora represents a single mora.
//
// Text is the text of the mora (JSON key "text").
// Consonant is the consonant; omitted from JSON when empty
// (JSON key "consonant").
// ConsonantLength is the length of the consonant; omitted from JSON when zero
// (JSON key "consonant_length").
// Vowel is the vowel (JSON key "vowel").
// VowelLength is the length of the vowel (JSON key "vowel_length").
// Pitch is the pitch (JSON key "pitch").
type Mora struct {
	Text            string  `json:"text"`
	Consonant       string  `json:"consonant,omitempty"`
	ConsonantLength float32 `json:"consonant_length,omitempty"`
	Vowel           string  `json:"vowel"`
	VowelLength     float32 `json:"vowel_length"`
	Pitch           float32 `json:"pitch"`
}

モーラを表す構造体

`text`はモーラの文字列を表す。

`consonant`は子音を表す。

`consonant_length`は子音の長さを表す。

`vowel`は母音を表す。

`vowel_length`は母音の長さを表す。

`pitch`は音高を表す。

type RawVoicevoxCore ¶

// RawVoicevoxCore is a function group that wraps the C API.
type RawVoicevoxCore struct{}

RawVoicevoxCore is a function group that wraps the C API

type VoicevoxAudioQueryOptions ¶

type VoicevoxAudioQueryOptions struct {
	// contains filtered or unexported fields
}

`AudioQuery()`を実行する際のオプションを表す構造体

func NewVoicevoxAudioQueryOptions ¶

func NewVoicevoxAudioQueryOptions(kana bool) *VoicevoxAudioQueryOptions

`AudioQuery()`の初期化オプションを生成する関数

func (*VoicevoxAudioQueryOptions) UpdateKana ¶ added in v0.0.4

func (o *VoicevoxAudioQueryOptions) UpdateKana(kana bool)

`AudioQuery()`のオプションの`kana`をアップデートする関数

type VoicevoxCore ¶

type VoicevoxCore struct {
	*RawVoicevoxCore
	// contains filtered or unexported fields
}

VoicevoxCore is top-level API Wrapper instance

func New ¶ added in v0.0.5

func New() (core *VoicevoxCore)

VoicevoxCore のコンストラクタ関数

func (*VoicevoxCore) AudioQuery ¶

func (r *VoicevoxCore) AudioQuery(text string, speakerID uint, options *VoicevoxAudioQueryOptions) (*AudioQuery, error)

オーディオクエリを発行する

func (*VoicevoxCore) Decode ¶

func (r *VoicevoxCore) Decode(speakerID uint, phonemeSize int, f0 []float32, phonemeVector []float32) ([]float32, error)

phonemeVectorを元にデコードする

func (*VoicevoxCore) ErrorResultToMessage ¶

func (r *VoicevoxCore) ErrorResultToMessage(resultCode int) string

ErrorResultCode をメッセージに変換する

func (*VoicevoxCore) Finalize ¶

func (r *VoicevoxCore) Finalize()

ファイナライズ

func (*VoicevoxCore) GetCoreVersion ¶

func (r *VoicevoxCore) GetCoreVersion() string

Coreのバージョンを取得する

func (*VoicevoxCore) GetMetasJson ¶

func (r *VoicevoxCore) GetMetasJson() string

メタ情報のjsonを取得する

func (*VoicevoxCore) GetSupportedDevicesJson ¶

func (r *VoicevoxCore) GetSupportedDevicesJson() string

サポートしているデバイス一覧のjsonを取得する

func (*VoicevoxCore) Initialize ¶

func (r *VoicevoxCore) Initialize(options *VoicevoxInitializeOptions) error

C APIを通じてVoicevox_coreを初期化する関数

func (*VoicevoxCore) IsGpuMode ¶

func (r *VoicevoxCore) IsGpuMode() bool

Gpuモードが有効になっているか確認する

func (*VoicevoxCore) IsModelLoaded ¶

func (r *VoicevoxCore) IsModelLoaded(speakerID uint) bool

モデルがロードされているか確認する

func (*VoicevoxCore) LoadModel ¶

func (r *VoicevoxCore) LoadModel(speakerID uint) error

音声合成モデルをロードする関数

func (*VoicevoxCore) MakeDefaultAudioQueryOotions ¶

func (r *VoicevoxCore) MakeDefaultAudioQueryOotions() *VoicevoxAudioQueryOptions

`AudioQuery()` のデフォルトオプションを生成する

func (*VoicevoxCore) MakeDefaultInitializeOptions ¶

func (r *VoicevoxCore) MakeDefaultInitializeOptions() *VoicevoxInitializeOptions

`Initialize()` のデフォルトオプションを生成する

func (*VoicevoxCore) MakeDefaultSynthesisOotions ¶

func (r *VoicevoxCore) MakeDefaultSynthesisOotions() *VoicevoxSynthesisOptions

`Synthesis()` のデフォルトオプションを生成する

func (*VoicevoxCore) MakeDefaultTtsOotions ¶

func (r *VoicevoxCore) MakeDefaultTtsOotions() *VoicevoxTtsOptions

`Tts()` のデフォルトオプションを生成する

func (*VoicevoxCore) PredictDuration ¶

func (r *VoicevoxCore) PredictDuration(speakerID int, phonemeVector []int64) ([]float32, error)

音素長を取得

func (*VoicevoxCore) PredictIntonation ¶

func (r *VoicevoxCore) PredictIntonation(
	speakerID int,
	vowelPhonemeVector, consonantPhonemeVector []int64,
	startAccentVector, endAccentVector []int64,
	startAccentPhraseVector, endAccentPhraseVector []int64,
) ([]float32, error)

モーラごとのF0を推論する

func (*VoicevoxCore) Synthesis ¶

func (r *VoicevoxCore) Synthesis(
	audioQuery *AudioQuery,
	speakerID int,
	options *VoicevoxSynthesisOptions,
) ([]byte, error)

Audio Queryを基に音声合成を実行する関数。実行結果はwavファイルフォーマットのバイト列。

Sample: https://github.com/sh1ma/sample-synthesis

func (*VoicevoxCore) Tts ¶

func (r *VoicevoxCore) Tts(text string, speakerID int, options *VoicevoxTtsOptions) ([]byte, error)

Text to Speechを実行する関数。実行結果はwavファイルフォーマットのバイト列。

Sample: https://github.com/sh1ma/sample-tts

type VoicevoxInitializeOptions ¶

type VoicevoxInitializeOptions struct {
	// contains filtered or unexported fields
}

`VoicevoxCore`を初期化する際のオプションを表す構造体

func NewVoicevoxInitializeOptions ¶

func NewVoicevoxInitializeOptions(accelerationMode int, cpuNumThreads int, loadAllModels bool, openJtalkDictDir string) *VoicevoxInitializeOptions

`VoicevoxCore`の初期化オプションを生成する関数

func (*VoicevoxInitializeOptions) UpdateAccelerationMode ¶ added in v0.0.4

func (o *VoicevoxInitializeOptions) UpdateAccelerationMode(accelerationMode int)

初期化オプションの`accelerationMode`をアップデートする関数

func (*VoicevoxInitializeOptions) UpdateCpuNumThreads ¶ added in v0.0.4

func (o *VoicevoxInitializeOptions) UpdateCpuNumThreads(cpuNumThreads int)

初期化オプションの`cpuNumThreads`をアップデートする関数

func (*VoicevoxInitializeOptions) UpdateLoadAllModels ¶ added in v0.0.4

func (o *VoicevoxInitializeOptions) UpdateLoadAllModels(loadAllModels bool)

初期化オプションの`loadAllModels`をアップデートする関数

func (*VoicevoxInitializeOptions) UpdateOpenJtalkDictDir ¶ added in v0.0.4

func (o *VoicevoxInitializeOptions) UpdateOpenJtalkDictDir(openJtalkDictDir string)

初期化オプションの`openJtalkDictDir`をアップデートする関数

type VoicevoxSynthesisOptions ¶

type VoicevoxSynthesisOptions struct {
	// contains filtered or unexported fields
}

`Synthesis()`を実行する際のオプションを表す構造体

func NewVoicevoxSynthesisOptions ¶

func NewVoicevoxSynthesisOptions(enableInterrogativeUpspeak bool) *VoicevoxSynthesisOptions

`Synthesis()`の初期化オプションを生成する関数

func (*VoicevoxSynthesisOptions) UpdateInterrogativeUpspeak ¶ added in v0.0.4

func (o *VoicevoxSynthesisOptions) UpdateInterrogativeUpspeak(kana bool)

`Synthesis()`のオプションの`enableInterrogativeUpspeak`をアップデートする関数

type VoicevoxTtsOptions ¶

type VoicevoxTtsOptions struct {
	// contains filtered or unexported fields
}

`Tts()`を実行する際のオプションを表す構造体

func NewVoicevoxTtsOptions ¶

func NewVoicevoxTtsOptions(kana bool, enableInterrogativeUpspeak bool) *VoicevoxTtsOptions

`Tts()`の初期化オプションを生成する関数

func (*VoicevoxTtsOptions) UpdateInterrogativeUpspeak ¶ added in v0.0.4

func (o *VoicevoxTtsOptions) UpdateInterrogativeUpspeak(kana bool)

`Tts()`のオプションの`enableInterrogativeUpspeak`をアップデートする関数

func (*VoicevoxTtsOptions) UpdateKana ¶ added in v0.0.4

func (o *VoicevoxTtsOptions) UpdateKana(kana bool)

`Tts()`のオプションの`kana`をアップデートする関数

Source Files ¶

View all Source files

Directories ¶

Path	Synopsis
examples
text-to-phoneme_id
scripts
resolve-phonemeid

?	: This menu
/	: Search site
f or F	: Jump to
y or Y	: Canonical URL

README ¶

voicevoxcore.go

例

おすすめの環境構築方法 (Linux / MacOS)

1. voicevox_core のダウンロード

2. voicevox_core を配置する

3. シンボリックリンクを張る

Documentation ¶

Index ¶

Constants ¶

Variables ¶

Functions ¶

Types ¶

type AccentPharase ¶ added in v0.0.2

type AudioQuery ¶ added in v0.0.2

func NewAudioQueryFromJson ¶ added in v0.0.3

func (*AudioQuery) ToJson ¶ added in v0.0.3

func (*AudioQuery) ToJsonString ¶ added in v0.0.3

type Mora ¶ added in v0.0.2

type RawVoicevoxCore ¶

type VoicevoxAudioQueryOptions ¶

func NewVoicevoxAudioQueryOptions ¶

func (*VoicevoxAudioQueryOptions) UpdateKana ¶ added in v0.0.4

type VoicevoxCore ¶

func New ¶ added in v0.0.5

func (*VoicevoxCore) AudioQuery ¶

func (*VoicevoxCore) Decode ¶

func (*VoicevoxCore) ErrorResultToMessage ¶

func (*VoicevoxCore) Finalize ¶

func (*VoicevoxCore) GetCoreVersion ¶

func (*VoicevoxCore) GetMetasJson ¶

func (*VoicevoxCore) GetSupportedDevicesJson ¶

func (*VoicevoxCore) Initialize ¶

func (*VoicevoxCore) IsGpuMode ¶

func (*VoicevoxCore) IsModelLoaded ¶

func (*VoicevoxCore) LoadModel ¶

func (*VoicevoxCore) MakeDefaultAudioQueryOotions ¶

func (*VoicevoxCore) MakeDefaultInitializeOptions ¶

func (*VoicevoxCore) MakeDefaultSynthesisOotions ¶

func (*VoicevoxCore) MakeDefaultTtsOotions ¶

func (*VoicevoxCore) PredictDuration ¶

func (*VoicevoxCore) PredictIntonation ¶

func (*VoicevoxCore) Synthesis ¶

func (*VoicevoxCore) Tts ¶

type VoicevoxInitializeOptions ¶

func NewVoicevoxInitializeOptions ¶

func (*VoicevoxInitializeOptions) UpdateAccelerationMode ¶ added in v0.0.4

func (*VoicevoxInitializeOptions) UpdateCpuNumThreads ¶ added in v0.0.4

func (*VoicevoxInitializeOptions) UpdateLoadAllModels ¶ added in v0.0.4

func (*VoicevoxInitializeOptions) UpdateOpenJtalkDictDir ¶ added in v0.0.4

type VoicevoxSynthesisOptions ¶

func NewVoicevoxSynthesisOptions ¶

func (*VoicevoxSynthesisOptions) UpdateInterrogativeUpspeak ¶ added in v0.0.4

type VoicevoxTtsOptions ¶

func NewVoicevoxTtsOptions ¶

func (*VoicevoxTtsOptions) UpdateInterrogativeUpspeak ¶ added in v0.0.4

func (*VoicevoxTtsOptions) UpdateKana ¶ added in v0.0.4

Source Files ¶

Directories ¶