Inheritance diagram for ailiaVoice.AiliaVoiceModel:

Collaboration diagram for ailiaVoice.AiliaVoiceModel:

Public Member Functions
int	GetEnvironmentId (bool is_gpu)
	Get the environment ID. More...

string	GetEnvironmentName ()
	Get the environment name. More...

bool	Create (int env_id, int flag)
	Create an instance. More...

bool	SetUserDictionary (string dict_path, int dict_type)
	Set user dictionary file. More...

bool	OpenDictionary (string dict_path, int dict_type)
	Set dictionary path. More...

bool	OpenModel (string encoder, string decoder1, string decoder2, string wave, string ssl, int model_type, int cleaner_type)

bool	OpenTacotron2ModelFile (string encoder, string decoder1, string decoder2, string wave, int cleaner_type)
	Open Tacotron2 model. More...

bool	OpenGPTSoVITSV1ModelFile (string encoder, string decoder1, string decoder2, string wave, string ssl)
	Open GPT-SoVITS V1 model. More...

bool	OpenGPTSoVITSV2ModelFile (string encoder, string decoder1, string decoder2, string wave, string ssl, string chinese_bert, string vocab)
	Open GPT-SoVITS V2 model. More...

bool	OpenGPTSoVITSV3ModelFile (string encoder, string decoder1, string decoder2, string ssl, string vq, string cfm, string bigvgan, string chinese_bert, string vocab)
	Open GPT-SoVITS V3 model. More...

bool	OpenGPTSoVITSV2ProModelFile (string encoder, string decoder1, string decoder2, string ssl, string vits, string sv, string chinese_bert, string vocab)
	Open GPT-SoVITS V2-Pro model. More...

bool	SetSampleSteps (int steps)
	Set CFM sampling steps. More...

bool	SetSpeed (float speed)
	Set the speech speed for synthesis. More...

bool	SetModelType (int model_type)
	Set the model type for G2P processing. More...

virtual void	Close ()
	Destroys instance. More...

virtual void	Dispose ()
	Release resources. More...

string	G2P (string utf8, int g2p_type)
	Get features. More...

bool	SetReference (AudioClip ref_audio, string ref_text)
	Set reference audio. More...

bool	Inference (string feature)
	Perform inference. More...

AudioClip	GetAudioClip ()
	Get audio clip. More...

Protected Member Functions
virtual void	Dispose (bool disposing)

Member Function Documentation

◆ Close()

virtual void ailiaVoice.AiliaVoiceModel.Close ( )

inlinevirtual

Destroys instance.

Destroys and initializes the instance.

     {
         if (net != IntPtr.Zero){
             AiliaVoice.ailiaVoiceDestroy(net);
             net = IntPtr.Zero;
         }
     }

◆ Create()

bool ailiaVoice.AiliaVoiceModel.Create	(	int	env_id,
		int	flag
	)

inline

Create an instance.

Parameters

env_id	Environment ID of ailia
flag	OR of flags (AiliaVoice.AILIA_VOICE_FLAG_*)

Returns: If this function is successful, it returns true , or false otherwise.

                                             {
         if (net != null){
             Close();
         }
  
         AiliaVoice.AILIAVoiceApiCallback callback = AiliaVoice.GetCallback();
  
         int memory_mode = Ailia.AILIA_MEMORY_REDUCE_CONSTANT | Ailia.AILIA_MEMORY_REDUCE_CONSTANT_WITH_INPUT_INITIALIZER | Ailia.AILIA_MEMORY_REUSE_INTERSTAGE;
         int status = AiliaVoice.ailiaVoiceCreate(ref net, env_id, Ailia.AILIA_MULTITHREAD_AUTO, memory_mode, flag, callback, AiliaVoice.AILIA_VOICE_API_CALLBACK_VERSION);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceCreate failed " + status);
             }
             return false;
         }
  
         return true;
     }

◆ Dispose() [1/2]

virtual void ailiaVoice.AiliaVoiceModel.Dispose ( )

inlinevirtual

Release resources.

     {
         // Public entry point: forwards to Dispose(bool) with disposing = true.
         Dispose(true);
     }

◆ Dispose() [2/2]

virtual void ailiaVoice.AiliaVoiceModel.Dispose ( bool disposing )

inlineprotectedvirtual

     {
         // 'disposing' is true when this is reached through the parameterless Dispose().
         if (disposing){
             // release managed resource (nothing is released in this branch)
         }
         // Close() destroys the native instance if one exists and resets the handle.
         Close(); // release unmanaged resource
     }

◆ G2P()

string ailiaVoice.AiliaVoiceModel.G2P	(	string	utf8,
		int	g2p_type
	)

inline

Get features.

Parameters

utf8	Input string
g2p_type	G2P type

Returns: The feature string if this function is successful, or an empty string otherwise.

                                                 {
         byte[] text = System.Text.Encoding.UTF8.GetBytes(utf8+"\u0000");
         //Debug.Log(text[text.Length - 1]);
         GCHandle handle = GCHandle.Alloc(text, GCHandleType.Pinned);
         IntPtr input = handle.AddrOfPinnedObject();
         int status = AiliaVoice.ailiaVoiceGraphemeToPhoneme(net, input, g2p_type);
         handle.Free();
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceGraphemeToPhoneme faield " + status);
             }
             return "";
         }
         uint count = 0;
         status = AiliaVoice.ailiaVoiceGetFeatureLength(net, ref count);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceGetFeatureLength faield " + status);
             }
             return "";
         }
         byte[] texts = new byte [count];
         handle = GCHandle.Alloc(texts, GCHandleType.Pinned);
         IntPtr output = handle.AddrOfPinnedObject();
         status = AiliaVoice.ailiaVoiceGetFeatures(net, output, count);
         handle.Free();
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceGetFeatures faield " + status);
             }
             return "";
         }
         return System.Text.Encoding.UTF8.GetString(texts);
     }

◆ GetAudioClip()

AudioClip ailiaVoice.AiliaVoiceModel.GetAudioClip ( )

inline

Get audio clip.

Returns: If this function is successful, it returns AudioClip , or null otherwise.

     {
         AudioClip audioClip = AudioClip.Create(audio_clip_name, audio_data.Length, (int)channels, (int)sampling_rate, false);
         audioClip.SetData(audio_data, 0);
         return audioClip;
     }

◆ GetEnvironmentId()

int ailiaVoice.AiliaVoiceModel.GetEnvironmentId ( bool is_gpu )

inline

Get the environment ID.

Parameters

is_gpu Whether to use GPU

Returns: env_id

                                             {
         int env_id = Ailia.AILIA_ENVIRONMENT_ID_AUTO;
         if (is_gpu) { // GPU
             int count = 0;
             Ailia.ailiaGetEnvironmentCount(ref count);
             for (int i = 0; i < count; i++){
                 IntPtr env_ptr = IntPtr.Zero;
                 Ailia.ailiaGetEnvironment(ref env_ptr, (uint)i, Ailia.AILIA_ENVIRONMENT_VERSION);
                 Ailia.AILIAEnvironment env = (Ailia.AILIAEnvironment)Marshal.PtrToStructure(env_ptr, typeof(Ailia.AILIAEnvironment));
  
                 if (env.backend == Ailia.AILIA_ENVIRONMENT_BACKEND_MPS || env.backend == Ailia.AILIA_ENVIRONMENT_BACKEND_CUDA || env.backend == Ailia.AILIA_ENVIRONMENT_BACKEND_VULKAN){
                     env_id = env.id;
                     env_name = Marshal.PtrToStringAnsi(env.name);
                 }
             }
         } else {
             env_name = "cpu";
         }
         return env_id;
     }

◆ GetEnvironmentName()

string ailiaVoice.AiliaVoiceModel.GetEnvironmentName ( )

inline

Get the environment name.

Returns: env_name

                                       {
         // env_name is assigned by GetEnvironmentId(): "cpu" for the non-GPU path,
         // or the name of the selected GPU environment.
         return env_name;
     }

◆ Inference()

bool ailiaVoice.AiliaVoiceModel.Inference ( string feature )

inline

Perform inference.

Parameters

feature Input feature string

Returns: If this function is successful, it returns true , or false otherwise.

     {
         byte[] text = System.Text.Encoding.UTF8.GetBytes(feature);
         GCHandle handle = GCHandle.Alloc(text, GCHandleType.Pinned);
         IntPtr input = handle.AddrOfPinnedObject();
         int status = AiliaVoice.ailiaVoiceInference(net, input);
         handle.Free();
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceInference faield " + status);
             }
             return false;
         }
         status = AiliaVoice.ailiaVoiceGetWaveInfo(net, ref samples, ref channels, ref sampling_rate);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceGetWaveInfo faield " + status);
             }
             return false;
         }
  
         uint count = samples * channels;
         audio_data = new float [count];
         handle = GCHandle.Alloc(audio_data, GCHandleType.Pinned);
         IntPtr output = handle.AddrOfPinnedObject();
         status = AiliaVoice.ailiaVoiceGetWave(net, output, count * sizeof(float));
         handle.Free();
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceGetWave faield " + status);
             }
             return false;
         }
  
         audio_clip_name = feature;
  
         return true;
     }

◆ OpenDictionary()

bool ailiaVoice.AiliaVoiceModel.OpenDictionary	(	string	dict_path,
		int	dict_type
	)

inline

Set dictionary path.

Parameters

dict_path	The path name to the dictionary folder
dict_type	AILIA_VOICE_DICTIONARY_TYPE_*

Returns: If this function is successful, it returns true , or false otherwise.

                                                                {
         int status = AiliaVoice.ailiaVoiceOpenDictionaryFile(net, dict_path, dict_type);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceOpenDictionaryFile faield " + status);
             }
             return false;
         }
         return true;
     }

◆ OpenGPTSoVITSV1ModelFile()

bool ailiaVoice.AiliaVoiceModel.OpenGPTSoVITSV1ModelFile	(	string	encoder,
		string	decoder1,
		string	decoder2,
		string	wave,
		string	ssl
	)

inline

Open GPT-SoVITS V1 model.

Parameters

encoder	The path name to the onnx file
decoder1	The path name to the onnx file
decoder2	The path name to the onnx file
wave	The path name to the onnx file
ssl	The path name to the onnx file

Returns: If this function is successful, it returns true , or false otherwise.

                                                                                                                    {
         AiliaLicense.CheckAndDownloadLicense();
  
         int status = AiliaVoice.ailiaVoiceOpenGPTSoVITSV1ModelFile(net, encoder, decoder1, decoder2, wave, ssl);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceOpenGPTSoVITSV1ModelFile failed " + status);
             }
             return false;
         }
         return true;
     }

◆ OpenGPTSoVITSV2ModelFile()

bool ailiaVoice.AiliaVoiceModel.OpenGPTSoVITSV2ModelFile	(	string	encoder,
		string	decoder1,
		string	decoder2,
		string	wave,
		string	ssl,
		string	chinese_bert,
		string	vocab
	)

inline

Open GPT-SoVITS V2 model.

Parameters

encoder	The path name to the onnx file
decoder1	The path name to the onnx file
decoder2	The path name to the onnx file
wave	The path name to the onnx file
ssl	The path name to the onnx file
chinese_bert	The path name to the chinese-roberta.onnx file (null to disable Chinese BERT)
vocab	The path name to the vocab.txt file (null to disable Chinese BERT)

Returns: If this function is successful, it returns true , or false otherwise.

                                                                                                                                                       {
         AiliaLicense.CheckAndDownloadLicense();
  
         int status = AiliaVoice.ailiaVoiceOpenGPTSoVITSV2ModelFile(net, encoder, decoder1, decoder2, wave, ssl, chinese_bert, vocab);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceOpenGPTSoVITSV2ModelFile failed " + status);
             }
             return false;
         }
         return true;
     }

◆ OpenGPTSoVITSV2ProModelFile()

bool ailiaVoice.AiliaVoiceModel.OpenGPTSoVITSV2ProModelFile	(	string	encoder,
		string	decoder1,
		string	decoder2,
		string	ssl,
		string	vits,
		string	sv,
		string	chinese_bert,
		string	vocab
	)

inline

Open GPT-SoVITS V2-Pro model.

Parameters

encoder	The path name to the onnx file
decoder1	The path name to the onnx file
decoder2	The path name to the onnx file
ssl	The path name to the onnx file
vits	The path name to the onnx file
sv	The path name to the onnx file
chinese_bert	The path name to the chinese-roberta.onnx file (null to disable Chinese BERT)
vocab	The path name to the vocab.txt file (null to disable Chinese BERT)

Returns: If this function is successful, it returns true , or false otherwise.

                                                                                                                                                                     {
         AiliaLicense.CheckAndDownloadLicense();
  
         int status = AiliaVoice.ailiaVoiceOpenGPTSoVITSV2ProModelFile(net, encoder, decoder1, decoder2, ssl, vits, sv, chinese_bert, vocab);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceOpenGPTSoVITSV2ProModelFile failed " + status);
             }
             return false;
         }
         return true;
     }

◆ OpenGPTSoVITSV3ModelFile()

bool ailiaVoice.AiliaVoiceModel.OpenGPTSoVITSV3ModelFile	(	string	encoder,
		string	decoder1,
		string	decoder2,
		string	ssl,
		string	vq,
		string	cfm,
		string	bigvgan,
		string	chinese_bert,
		string	vocab
	)

inline

Open GPT-SoVITS V3 model.

Parameters

encoder	The path name to the onnx file
decoder1	The path name to the onnx file
decoder2	The path name to the onnx file
ssl	The path name to the onnx file
vq	The path name to the onnx file
cfm	The path name to the onnx file
bigvgan	The path name to the onnx file
chinese_bert	The path name to the chinese-roberta.onnx file (null to disable Chinese BERT)
vocab	The path name to the vocab.txt file (null to disable Chinese BERT)

Returns: If this function is successful, it returns true , or false otherwise.

                                                                                                                                                                                 {
         AiliaLicense.CheckAndDownloadLicense();
  
         int status = AiliaVoice.ailiaVoiceOpenGPTSoVITSV3ModelFile(net, encoder, decoder1, decoder2, ssl, vq, cfm, bigvgan, chinese_bert, vocab);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceOpenGPTSoVITSV3ModelFile failed " + status);
             }
             return false;
         }
         return true;
     }

◆ OpenModel()

bool ailiaVoice.AiliaVoiceModel.OpenModel	(	string	encoder,
		string	decoder1,
		string	decoder2,
		string	wave,
		string	ssl,
		int	model_type,
		int	cleaner_type
	)

inline

Parameters

encoder	The path name to the onnx file
decoder1	The path name to the onnx file
decoder2	The path name to the onnx file
wave	The path name to the onnx file
ssl	The path name to the onnx file
model_type	AILIA_VOICE_MODEL_TYPE_*
cleaner_type	AILIA_VOICE_CLEANER_TYPE_*

Returns: If this function is successful, it returns true , or false otherwise.

                                                                                                                                       {
         AiliaLicense.CheckAndDownloadLicense();
  
         int status = AiliaVoice.ailiaVoiceOpenModelFile(net, encoder, decoder1, decoder2, wave, ssl, model_type, cleaner_type);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceOpenModelFile faield " + status);
             }
             return false;
         }
         return true;
     }

◆ OpenTacotron2ModelFile()

bool ailiaVoice.AiliaVoiceModel.OpenTacotron2ModelFile	(	string	encoder,
		string	decoder1,
		string	decoder2,
		string	wave,
		int	cleaner_type
	)

inline

Open Tacotron2 model.

Parameters

encoder	The path name to the onnx file
decoder1	The path name to the onnx file
decoder2	The path name to the onnx file
wave	The path name to the onnx file
cleaner_type	AILIA_VOICE_CLEANER_TYPE_*

Returns: If this function is successful, it returns true , or false otherwise.

                                                                                                                        {
         AiliaLicense.CheckAndDownloadLicense();
  
         int status = AiliaVoice.ailiaVoiceOpenTacotron2ModelFile(net, encoder, decoder1, decoder2, wave, cleaner_type);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceOpenTacotron2ModelFile failed " + status);
             }
             return false;
         }
         return true;
     }

◆ SetModelType()

bool ailiaVoice.AiliaVoiceModel.SetModelType ( int model_type )

inline

Set the model type for G2P processing.

Parameters

model_type AILIA_VOICE_MODEL_TYPE_*

Returns: If this function is successful, it returns true , or false otherwise.

Sets the model type when using G2P standalone without loading model files. Automatically set when OpenModel or OpenGPTSoVITSV3ModelFile is called.

                                             {
         int status = AiliaVoice.ailiaVoiceSetModelType(net, model_type);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceSetModelType failed " + status);
             }
             return false;
         }
         return true;
     }

◆ SetReference()

bool ailiaVoice.AiliaVoiceModel.SetReference	(	AudioClip	ref_audio,
		string	ref_text
	)

inline

Set reference audio.

Parameters

ref_audio	Reference audio
ref_text	Reference text

Returns: If this function is successful, it returns true , or false otherwise.

     {
         float[] audio_data = new float[ref_audio.samples * ref_audio.channels];
         ref_audio.GetData(audio_data, 0);
  
         GCHandle audio_handle = GCHandle.Alloc(audio_data, GCHandleType.Pinned);
         IntPtr audio_input = audio_handle.AddrOfPinnedObject();
  
         byte[] text = System.Text.Encoding.UTF8.GetBytes(ref_text);
         GCHandle text_handle = GCHandle.Alloc(text, GCHandleType.Pinned);
         IntPtr text_input = text_handle.AddrOfPinnedObject();
         int status = AiliaVoice.ailiaVoiceSetReference(net, audio_input, (uint)(ref_audio.samples * ref_audio.channels * 4), (uint)(ref_audio.channels), (uint)(ref_audio.frequency), text_input);
         text_handle.Free();
         audio_handle.Free();
  
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceSetReference faield " + status);
             }
             return false;
         }
  
         return true;
     }

◆ SetSampleSteps()

bool ailiaVoice.AiliaVoiceModel.SetSampleSteps ( int steps )

inline

Set CFM sampling steps.

Parameters

steps Number of sampling steps

Returns: If this function is successful, it returns true , or false otherwise.

                                          {
         int status = AiliaVoice.ailiaVoiceSetSampleSteps(net, steps);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceSetSampleSteps failed " + status);
             }
             return false;
         }
         return true;
     }

◆ SetSpeed()

bool ailiaVoice.AiliaVoiceModel.SetSpeed ( float speed )

inline

Set the speech speed for synthesis.

Parameters

speed Speed value (default 1.0, must be greater than 0)

Returns: If this function is successful, it returns true , or false otherwise.

Supported by GPT-SoVITS V2 and V3. Not effective for V1.

                                      {
         int status = AiliaVoice.ailiaVoiceSetSpeed(net, speed);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceSetSpeed failed " + status);
             }
             return false;
         }
         return true;
     }

◆ SetUserDictionary()

bool ailiaVoice.AiliaVoiceModel.SetUserDictionary	(	string	dict_path,
		int	dict_type
	)

inline

Set user dictionary file.

Parameters

dict_path	The path name to the user dictionary file
dict_type	AILIA_VOICE_DICTIONARY_TYPE_*

Returns: If this function is successful, it returns true , or false otherwise.

This function must be called before OpenDictionary.

                                                                   {
         int status = AiliaVoice.ailiaVoiceSetUserDictionaryFile(net, dict_path, dict_type);
         if (status != 0){
             if (debug_log){
                 Debug.Log("ailiaVoiceSetUserDictionaryFile faield " + status);
             }
             return false;
         }
         return true;
     }

The documentation for this class was generated from the following file:

AiliaVoiceModel.cs

Public Member Functions

Protected Member Functions

Member Function Documentation

◆ Close()

◆ Create()

◆ Dispose() [1/2]

◆ Dispose() [2/2]

◆ G2P()

◆ GetAudioClip()

◆ GetEnvironmentId()

◆ GetEnvironmentName()

◆ Inference()

◆ OpenDictionary()

◆ OpenGPTSoVITSV1ModelFile()

◆ OpenGPTSoVITSV2ModelFile()

◆ OpenGPTSoVITSV2ProModelFile()

◆ OpenGPTSoVITSV3ModelFile()

◆ OpenModel()

◆ OpenTacotron2ModelFile()

◆ SetModelType()

◆ SetReference()

◆ SetSampleSteps()

◆ SetSpeed()

◆ SetUserDictionary()