一、創建自己的應用
百度智能云控制臺網址:https://console.bce.baidu.com/
1、創建應用
2、獲取APIKey和SecretKey
3、Api調試
調試網址:https://console.bce.baidu.com/support/?timestamp=1750317430400#/api?product=AI&project=%E8%AF%AD%E9%9F%B3%E6%8A%80%E6%9C%AF&parent=%E9%89%B4%E6%9D%83%E8%AE%A4%E8%AF%81%E6%9C%BA%E5%88%B6&api=oauth%2F2.0%2Ftoken&method=post
二、在Unity中進行調用
1、相關參數說明
(1)短文本個性化語音生成相關參數
(2)長文本個性化語音生成相關參數
2、完整代碼
using Newtonsoft.Json;
using System;
using System.Collections;
using System.Collections.Generic;
using System.IO;
using System.Text;
using UnityEngine;
using UnityEngine.Networking;
using UnityEngine.UI;
public class TTS : MonoBehaviour
{#region 相關參數[Header("鑒權相關參數")][SerializeField] private string apiKey = "LFfK6DTaswy6LLtBqvHO86w0";[SerializeField] private string secretKey = "vj6JmKd7zBylDVGW2WmTNPWl9eKxxZEL";[SerializeField] private string accessToken = null;[Space][Header("長文本語音合成參數設置")][SerializeField] private string format = "mp3-16k"; // 或者 wav[SerializeField] private int voice = 0; // 語音人:0-女,1-男等[SerializeField] private string lang = "zh";[SerializeField] private int speed = 5; // 0~15[SerializeField] private int pitch = 5; // 0~15[SerializeField] private int volume = 5; // 0~15[SerializeField] private int enable_subtitle = 0;[Space][Header("短文本語音合成參數設置")][SerializeField] private string cuid = "240a906f2b88794fd0426442c4136a5a57bf5c01";[SerializeField] private string ctp = "1";[SerializeField] private string lan = "zh";[SerializeField] private string spd = "5";[SerializeField] private string pit = "5";[SerializeField] private string vol = "10";[SerializeField] private string per = "1";[SerializeField] private string aue = "3";[Space][Header("UI界面相關")]public InputField inputFieldText;public Button buttonStartTTS;//開始合成按鈕public Button buttonPlay;//播放合成的語音按鈕public AudioSource audioSource;//播放音頻組件#endregion// Start is called before the first frame updatevoid Start(){//一開始就進行鑒權StartCoroutine(GetAccessToken());//語音合成buttonStartTTS.onClick.AddListener(()=> {StartTTS(inputFieldText.text, audioSource);});//播放語音buttonPlay.onClick.AddListener(() =>{if (audioSource.clip != null){audioSource.Play();}});}/// <summary>/// 長短語音合成方法/// </summary>/// <param name="text">要合成的文本內容</param>/// <param name="audioSource">語音組件</param>public void StartTTS(string text,AudioSource audioSource){if (text.Length<60){print("開始短文本語音合成");//短文本語音合成StartCoroutine(ShortTTS(text, response => {audioSource.clip = response.clip;print("短文本語音合成結束,請播放");}));}else{print("開始長文本語音合成");//長文本語音合成StartCoroutine(LongTTS(text, clip=> { audioSource.clip = clip;print("長文本語音合成結束,請播放");}));}}#region 鑒權相關/// <summary>/// 鑒權方法/// </summary>/// <returns></returns>/// <summary>/// 獲取百度 AccessToken(已使用 using 自動釋放資源)/// </summary>public IEnumerator GetAccessToken(){string url = "https://aip.baidubce.com/oauth/2.0/token";WWWForm form = new WWWForm();form.AddField("grant_type", "client_credentials");form.AddField("client_id", apiKey);form.AddField("client_secret", secretKey);using (UnityWebRequest request = UnityWebRequest.Post(url, form)){yield return request.SendWebRequest();if (request.result == UnityWebRequest.Result.Success){try{var tokenResponse = JsonConvert.DeserializeObject<TokenResponse>(request.downloadHandler.text);accessToken = tokenResponse.access_token;Debug.Log("? 獲取語音合成 AccessToken 成功: " + accessToken);}catch (Exception ex){Debug.LogError("? 語音合成AccessToken 解析失敗: " + ex.Message);}}else{Debug.LogError("? 獲取 語音合成AccessToken 失敗: " + request.error);}}}#endregion#region 短文本語音合成相關/// <summary>/// 請求短文本語音合成(MP3格式)/// </summary>/// <param name="text">需要合成的文本</param>/// <param name="callback">返回結果回調</param>public IEnumerator ShortTTS(string text, Action<TtsResponse> callback){string url = "http://tsn.baidu.com/text2audio";var param = new Dictionary<string, string>{{ "tex", text },{ "tok", accessToken },{ "cuid", cuid},{ "ctp", ctp},{ "lan", lan},{ "spd", spd},{ "pit", pit},{ "vol", vol},{ "per", per},{ "aue", aue} // 固定為 MP3 格式};// 構建請求 URLint i = 0;foreach (var p in param){url += i != 0 ? "&" : "?";url += p.Key + "=" + UnityWebRequest.EscapeURL(p.Value);i++;}using (UnityWebRequest www = UnityWebRequestMultimedia.GetAudioClip(url, AudioType.MPEG)){//Debug.Log("[TTS] 請求URL: " + www.url);//測試使用yield return www.SendWebRequest();if (www.result != UnityWebRequest.Result.Success){Debug.LogError("[TTS] 請求失敗: " + www.error);callback?.Invoke(new TtsResponse{error_index = -1,error_msg = www.error});}else{string type = www.GetResponseHeader("Content-Type");//Debug.Log("[TTS] Content-Type: " + type);//測試使用if (!string.IsNullOrEmpty(type) && type.Contains("audio")){AudioClip clip = DownloadHandlerAudioClip.GetContent(www);callback?.Invoke(new TtsResponse { clip = clip });}else{string errorText = Encoding.UTF8.GetString(www.downloadHandler.data);Debug.LogError("[TTS] 文本響應錯誤: " + errorText);callback?.Invoke(new TtsResponse{error_index = -2,error_msg = errorText});}}}}/// <summary>/// 返回的語音合成結果/// </summary>public class TtsResponse{public int error_index;public string error_msg;public string sn;public int idx;public bool Success => error_index == 0;public AudioClip clip;}#endregion#region 長文本語音合成相關/// <summary>/// 按順序執行長語音合成對應的方法/// </summary>/// <param name="text">需要合成的文本</param>/// <param name="callback">回調函數,返回合成的clip</param>/// <returns></returns>IEnumerator LongTTS(String text, Action<AudioClip> callback){string taskId = null;//語音合成任務創建成功返回的id//創建語音合成任務yield return StartCoroutine(CreateTTSTask(text,TaskId => { taskId = TaskId; },errorMsg => { Debug.LogError("? 合成失敗: " + errorMsg); }));if (taskId != null && accessToken != null){string audioUrl = null;//語音合成任務合成成功返回的語音下載鏈接//查詢語音合成任務yield return StartCoroutine(QueryTTSTaskStatus(accessToken, taskId,AudioAddress => { audioUrl = AudioAddress; },errorMsg => {Debug.LogError("? 查詢失敗:" + errorMsg);}));//下載語音,并賦值給指定的AudioSource組件if (audioUrl != null){yield return StartCoroutine(DownloadAudio(audioUrl, clip =>{if (clip != null){callback?.Invoke(clip);}else{Debug.LogError("下載的音頻 Clip 為 null");}}));}}}/// <summary>/// 創建語音合成任務/// </summary>/// <returns>TaskId</returns>public IEnumerator CreateTTSTask(string text, Action<string> onSuccess, Action<string> onError){string url = $"https://aip.baidubce.com/rpc/2.0/tts/v1/create?access_token={accessToken}";var bodyObj = new{text = text,format = format,voice = voice,lang = lang,speed = speed,pitch = pitch,volume = volume,enable_subtitle = enable_subtitle};string jsonBody = JsonConvert.SerializeObject(bodyObj);using (UnityWebRequest request = new UnityWebRequest(url, "POST")){byte[] bodyRaw = Encoding.UTF8.GetBytes(jsonBody);request.uploadHandler = new UploadHandlerRaw(bodyRaw);request.downloadHandler = new DownloadHandlerBuffer();request.SetRequestHeader("Content-Type", "application/json");request.SetRequestHeader("Accept", "application/json");yield return request.SendWebRequest();if (request.result == UnityWebRequest.Result.Success){string responseText = request.downloadHandler.text;Debug.Log("? 創建語音任務返回:" + responseText);if (responseText.Contains("task_id")){var response = JsonConvert.DeserializeObject<TTSTaskSuccessResponse>(responseText);onSuccess?.Invoke(response.TaskId);}else if (responseText.Contains("error_code")){var error = JsonConvert.DeserializeObject<TTSTaskErrorResponse>(responseText);onError?.Invoke(error.ErrorMsg);}else{onError?.Invoke("無法識別的返回內容");}}else{Debug.LogError("? 網絡請求失敗:" + request.error);onError?.Invoke(request.error);}}}/// <summary>/// 語音合成任務查詢/// </summary>/// <param name="accessToken">accessToken</param>/// <param name="taskId">合成任務id</param>/// <param name="onSuccess">合成成功返回音頻鏈接</param>/// <param name="onError">合成失敗返回錯誤碼</param>/// <returns></returns>public IEnumerator QueryTTSTaskStatus(string accessToken, string taskId, Action<string> onSuccess, Action<string> onError){string url = $"https://aip.baidubce.com/rpc/2.0/tts/v1/query?access_token={accessToken}";string jsonBody = JsonConvert.SerializeObject(new { task_ids = new string[] { taskId } });float delaySeconds = 2f;while (true){using (UnityWebRequest request = new UnityWebRequest(url, "POST")){request.uploadHandler = new UploadHandlerRaw(Encoding.UTF8.GetBytes(jsonBody));request.downloadHandler = new DownloadHandlerBuffer();request.SetRequestHeader("Content-Type", "application/json");request.SetRequestHeader("Accept", "application/json");yield return request.SendWebRequest();if (request.result == UnityWebRequest.Result.Success){string json = request.downloadHandler.text;var root = JsonConvert.DeserializeObject<TTSQueryResponse>(json);if (root.TasksInfo != null && root.TasksInfo.Count > 0){var task = root.TasksInfo[0];switch (task.TaskStatus){case "Success":if (!string.IsNullOrEmpty(task.TaskResult?.SpeechUrl))onSuccess?.Invoke(task.TaskResult.SpeechUrl);elseonError?.Invoke("合成成功但未返回語音地址");yield break;case "Failure":onError?.Invoke(task.TaskResult?.ErrMsg ?? "未知錯誤");yield break;case "Running":Debug.Log("🎙 正在合成...");yield return new WaitForSeconds(delaySeconds);continue;default:onError?.Invoke("未知狀態:" + task.TaskStatus);yield break;}}else{onError?.Invoke("未找到任務信息");yield break;}}else{onError?.Invoke("網絡錯誤:" + request.error);yield break;}}}}/// <summary>/// 下載音頻,并將音頻賦給指定的AudioSource/// </summary>/// <param name="url">音頻下載鏈接</param>/// <param name="audioSource">要賦給的音頻播放組件</param>/// <returns></returns>public IEnumerator DownloadAudio(string url, Action<AudioClip> onComplete){using (UnityWebRequest request = UnityWebRequestMultimedia.GetAudioClip(url, AudioType.MPEG)){yield return request.SendWebRequest();if (request.result == UnityWebRequest.Result.Success){AudioClip clip = DownloadHandlerAudioClip.GetContent(request);if (clip != null){Debug.Log("? 音頻合成結束,等待播放");onComplete?.Invoke(clip); // ? 返回 clip}else{Debug.LogError("? 無法解析音頻 Clip");onComplete?.Invoke(null);}}else{Debug.LogError("? 下載音頻失敗:" + request.error);onComplete?.Invoke(null);}}}[Serializable]public class TokenResponse{/// <summary>/// 鑒權返回的數據JSON結構/// </summary>public string access_token;public int expires_in;}[Serializable]public class TTSTaskSuccessResponse{/// <summary>/// 創建語音合成成功返回的數據JSON結構/// </summary>[JsonProperty("log_id")]public long LogId { get; set; }[JsonProperty("task_id")]public string TaskId { get; set; }[JsonProperty("task_status")]public string TaskStatus { get; set; } // "Running"}[Serializable]public class TTSTaskErrorResponse{/// <summary>/// 創建語音合成成功返回的數據JSON結構/// </summary>[JsonProperty("error_code")]public int ErrorCode { get; set; }[JsonProperty("error_msg")]public string ErrorMsg { get; set; }[JsonProperty("log_id")]public long LogId { get; set; }}[Serializable]public class TTSQueryResponse{[JsonProperty("log_id")]public long LogId { get; set; }[JsonProperty("tasks_info")]public List<TTSQueryTaskInfo> TasksInfo { get; set; }}[Serializable]public class TTSQueryTaskInfo{[JsonProperty("task_id")]public string TaskId { get; set; }[JsonProperty("task_status")]public string TaskStatus { get; set; }[JsonProperty("task_result")]public TTSQueryTaskResult TaskResult { get; set; }}[Serializable]public class TTSQueryTaskResult{[JsonProperty("speech_url")]public string SpeechUrl { get; set; }[JsonProperty("err_no")]public int ErrNo { get; set; }[JsonProperty("err_msg")]public string ErrMsg { get; set; }[JsonProperty("sn")]public string Sn { get; set; }}#endregion}