OkGoDoIt
diff --git a/‎OpenAI_API/Audio/ITextToSpeechEndpoint.cs
Lines changed: 57 additions & 0 deletions b/‎OpenAI_API/Audio/ITextToSpeechEndpoint.cs
Lines changed: 57 additions & 0 deletions
diff --git a/‎OpenAI_API/Audio/TextToSpeechEndpoint.cs
Lines changed: 106 additions & 0 deletions b/‎OpenAI_API/Audio/TextToSpeechEndpoint.cs
Lines changed: 106 additions & 0 deletions
diff --git a/‎OpenAI_API/Audio/TextToSpeechRequest.cs
Lines changed: 78 additions & 0 deletions b/‎OpenAI_API/Audio/TextToSpeechRequest.cs
Lines changed: 78 additions & 0 deletions
diff --git a/‎OpenAI_API/Chat/ChatRequest.cs
Lines changed: 1 addition & 1 deletion b/‎OpenAI_API/Chat/ChatRequest.cs
Lines changed: 1 addition & 1 deletion
@@ -0,0 +1,57 @@
+using System.IO;
+using System.Threading.Tasks;
+using OpenAI_API.Models;
+
+namespace OpenAI_API.Audio
+{
+	/// <summary>
+	/// The Endpoint for the Text to Speech API.  This allows you to generate audio from text.  See <seealso href="https://platform.openai.com/docs/guides/text-to-speech"/>
+	/// </summary>
+	public interface ITextToSpeechEndpoint
+	{
+		/// <summary>
+		/// This allows you to set default parameters for every request, for example to set a default voice or model.  For every request, if you do not have a parameter set on the request but do have it set here as a default, the request will automatically pick up the default value.
+		/// </summary>
+		TextToSpeechRequest DefaultTTSRequestArgs { get; set; }
+
+		/// <summary>
+		/// Calls the API to create speech from text, and returns the raw stream of the audio file.
+		/// </summary>
+		/// <param name="request">The text to speech request to submit to the API</param>
+		/// <returns>A stream of the audio file in the requested format.</returns>
+		Task<Stream> GetSpeechAsStreamAsync(TextToSpeechRequest request);
+
+		/// <summary>
+		/// Calls the API to create speech from text, and returns the raw stream of the audio file.
+		/// </summary>
+		/// <param name="input">The text to generate audio for. The maximum length is 4096 characters.</param>
+		/// <param name="voice">The voice to use when generating the audio. Supported voices can be found in <see cref="TextToSpeechRequest.Voices"/>.</param>
+		/// <param name="speed">The speed of the generated audio. Select a value from 0.25 to 4.0. 1.0 is the default.</param>
+		/// <param name="responseFormat">The default response format is "mp3", but other formats are available in <see cref="TextToSpeechRequest.ResponseFormats"/>.  See <seealso href="https://platform.openai.com/docs/guides/text-to-speech/supported-output-formats"/></param>
+		/// <param name="model">TTS is an AI model that converts text to natural sounding spoken text. OpenAI offers two different model variates, <see cref="Model.TTS_Speed"/> is optimized for real time text to speech use cases and <see cref="Model.TTS_HD"/> is optimized for quality.</param>
+		/// <returns>A stream of the audio file in the requested format.</returns>
+		Task<Stream> GetSpeechAsStreamAsync(string input, string voice = null, decimal? speed = null, string responseFormat = null, Model model = null);
+
+		/// <summary>
+		/// Calls the API to create speech from text, and saves the audio file to disk.
+		/// </summary>
+		/// <param name="request">The text to speech request to submit to the API</param>
+		/// <param name="localPath">The local path to save the audio file to.</param>
+		/// <returns>A <see cref="FileInfo"/> representing the saved speech file.</returns>
+		Task<FileInfo> SaveSpeechToFileAsync(TextToSpeechRequest request, string localPath);
+
+		/// <summary>
+		/// Calls the API to create speech from text, and saves the audio file to disk.
+		/// </summary>
+		/// <param name="input">The text to generate audio for. The maximum length is 4096 characters.</param>
+		/// <param name="localPath">The local path to save the audio file to.</param>
+		/// <param name="voice">The voice to use when generating the audio. Supported voices can be found in <see cref="TextToSpeechRequest.Voices"/>.</param>
+		/// <param name="speed">The speed of the generated audio. Select a value from 0.25 to 4.0. 1.0 is the default.</param>
+		/// <param name="responseFormat">The default response format is "mp3", but other formats are available in <see cref="TextToSpeechRequest.ResponseFormats"/>.  See <seealso href="https://platform.openai.com/docs/guides/text-to-speech/supported-output-formats"/></param>
+		/// <param name="model">TTS is an AI model that converts text to natural sounding spoken text. OpenAI offers two different model variates, <see cref="Model.TTS_Speed"/> is optimized for real time text to speech use cases and <see cref="Model.TTS_HD"/> is optimized for quality.</param>
+		/// <returns>A <see cref="FileInfo"/> representing the saved speech file.</returns>
+		Task<FileInfo> SaveSpeechToFileAsync(string input, string localPath, string voice = null, decimal? speed = null, string responseFormat = null, Model model = null);
+
+		
+	}
+}
@@ -0,0 +1,106 @@
+using System;
+using System.Collections.Generic;
+using System.IO;
+using System.Net.Http;
+using System.Text;
+using System.Threading.Tasks;
+using OpenAI_API.Chat;
+using OpenAI_API.Models;
+using static System.Net.WebRequestMethods;
+
+namespace OpenAI_API.Audio
+{
+	/// <summary>
+	/// The Endpoint for the Text to Speech API.  This allows you to generate audio from text.  See <seealso href="https://platform.openai.com/docs/guides/text-to-speech"/>
+	/// </summary>
+	public class TextToSpeechEndpoint : EndpointBase, ITextToSpeechEndpoint
+	{
+		/// <inheritdoc/>
+		protected override string Endpoint => "audio/speech";
+
+		/// <summary>
+		/// This allows you to set default parameters, for example a default voice or model.  The overloads that take individual parameters fall back to the values set here for any voice, speed, response format or model passed as null.  A <see cref="TextToSpeechRequest"/> passed in directly is submitted as-is.
+		/// </summary>
+		public TextToSpeechRequest DefaultTTSRequestArgs { get; set; } = new TextToSpeechRequest();
+
+		/// <summary>
+		/// Constructor of the api endpoint.  Rather than instantiating this yourself, access it through an instance of <see cref="OpenAIAPI"/>.
+		/// </summary>
+		/// <param name="api">Pass in the instance of the api</param>
+		internal TextToSpeechEndpoint(OpenAIAPI api) : base(api) { }
+
+		/// <summary>
+		/// Calls the API to create speech from text, and returns the raw stream of the audio file.
+		/// </summary>
+		/// <param name="request">The text to speech request to submit to the API</param>
+		/// <returns>A stream of the audio file in the requested format.</returns>
+		public async Task<Stream> GetSpeechAsStreamAsync(TextToSpeechRequest request)
+		{
+			return await HttpRequest(verb: HttpMethod.Post, postData: request);
+		}
+
+		/// <summary>
+		/// Calls the API to create speech from text, and returns the raw stream of the audio file.
+		/// </summary>
+		/// <param name="input">The text to generate audio for. The maximum length is 4096 characters.</param>
+		/// <param name="voice">The voice to use when generating the audio. Supported voices can be found in <see cref="TextToSpeechRequest.Voices"/>.</param>
+		/// <param name="speed">The speed of the generated audio. Select a value from 0.25 to 4.0. 1.0 is the default.</param>
+		/// <param name="responseFormat">The default response format is "mp3", but other formats are available in <see cref="TextToSpeechRequest.ResponseFormats"/>.  See <seealso href="https://platform.openai.com/docs/guides/text-to-speech/supported-output-formats"/></param>
+		/// <param name="model">TTS is an AI model that converts text to natural sounding spoken text. OpenAI offers two different model variates, <see cref="Model.TTS_Speed"/> is optimized for real time text to speech use cases and <see cref="Model.TTS_HD"/> is optimized for quality.</param>
+		/// <returns>A stream of the audio file in the requested format.</returns>
+		public async Task<Stream> GetSpeechAsStreamAsync(string input, string voice = null, decimal? speed = null, string responseFormat = null, Model model = null)
+		{
+			return await GetSpeechAsStreamAsync(BuildRequest(input, voice, speed, responseFormat, model));
+		}
+
+		/// <summary>
+		/// Calls the API to create speech from text, and saves the audio file to disk.
+		/// </summary>
+		/// <param name="request">The text to speech request to submit to the API</param>
+		/// <param name="localPath">The local path to save the audio file to.  An existing file at this path is overwritten.</param>
+		/// <returns>A <see cref="FileInfo"/> representing the saved speech file.</returns>
+		/// <exception cref="ArgumentNullException">Thrown when <paramref name="localPath"/> is null.  This is checked before the API is called.</exception>
+		public async Task<FileInfo> SaveSpeechToFileAsync(TextToSpeechRequest request, string localPath)
+		{
+			// Fail before calling the API: without a path the generated audio could not be saved anyway.
+			if (localPath == null)
+			{
+				throw new ArgumentNullException(nameof(localPath));
+			}
+
+			using (var stream = await GetSpeechAsStreamAsync(request))
+			using (var outputFileStream = new FileStream(localPath, FileMode.Create))
+			{
+				await stream.CopyToAsync(outputFileStream);
+			}
+			return new FileInfo(localPath);
+		}
+
+		/// <summary>
+		/// Calls the API to create speech from text, and saves the audio file to disk.
+		/// </summary>
+		/// <param name="input">The text to generate audio for. The maximum length is 4096 characters.</param>
+		/// <param name="localPath">The local path to save the audio file to.  An existing file at this path is overwritten.</param>
+		/// <param name="voice">The voice to use when generating the audio. Supported voices can be found in <see cref="TextToSpeechRequest.Voices"/>.</param>
+		/// <param name="speed">The speed of the generated audio. Select a value from 0.25 to 4.0. 1.0 is the default.</param>
+		/// <param name="responseFormat">The default response format is "mp3", but other formats are available in <see cref="TextToSpeechRequest.ResponseFormats"/>.  See <seealso href="https://platform.openai.com/docs/guides/text-to-speech/supported-output-formats"/></param>
+		/// <param name="model">TTS is an AI model that converts text to natural sounding spoken text. OpenAI offers two different model variates, <see cref="Model.TTS_Speed"/> is optimized for real time text to speech use cases and <see cref="Model.TTS_HD"/> is optimized for quality.</param>
+		/// <returns>A <see cref="FileInfo"/> representing the saved speech file.</returns>
+		public async Task<FileInfo> SaveSpeechToFileAsync(string input, string localPath, string voice = null, decimal? speed = null, string responseFormat = null, Model model = null)
+		{
+			return await SaveSpeechToFileAsync(BuildRequest(input, voice, speed, responseFormat, model), localPath);
+		}
+
+		/// <summary>
+		/// Builds a request for the given input, using the matching value from <see cref="DefaultTTSRequestArgs"/> for every other argument that is null.
+		/// </summary>
+		private TextToSpeechRequest BuildRequest(string input, string voice, decimal? speed, string responseFormat, Model model) => new TextToSpeechRequest()
+		{
+			Input = input,
+			Voice = voice ?? DefaultTTSRequestArgs.Voice,
+			Speed = speed ?? DefaultTTSRequestArgs.Speed,
+			Model = model ?? DefaultTTSRequestArgs.Model,
+			ResponseFormat = responseFormat ?? DefaultTTSRequestArgs.ResponseFormat
+		};
+	}
+}
@@ -0,0 +1,78 @@
+using System;
+using System.Collections.Generic;
+using System.Text;
+using Newtonsoft.Json;
+
+namespace OpenAI_API.Audio
+{
+	/// <summary>
+	/// The parameters of a single Text to Speech request.  Each property is mapped to the JSON field named in its <see cref="JsonPropertyAttribute"/>.
+	/// </summary>
+	public class TextToSpeechRequest
+	{
+		/// <summary>
+		/// The model to use for this request.  Starts out as <see cref="OpenAI_API.Models.Model.DefaultTTSModel"/>.
+		/// </summary>
+		[JsonProperty("model")]
+		public string Model { get; set; } = OpenAI_API.Models.Model.DefaultTTSModel;
+
+		/// <summary>
+		/// The text to generate audio for. The maximum length is 4096 characters.
+		/// </summary>
+		[JsonProperty("input")]
+		public string Input { get; set; }
+
+		/// <summary>
+		/// The voice to use when generating the audio.  Starts out as <see cref="Voices.Alloy"/>; the supported voices can be found in <see cref="Voices"/>.
+		/// </summary>
+		[JsonProperty("voice")]
+		public string Voice { get; set; } = Voices.Alloy;
+
+		/// <summary>
+		/// The format of the generated audio.  The default response format is "mp3", but other formats are available in <see cref="TextToSpeechRequest.ResponseFormats"/>.  Not serialized while null.  See <seealso href="https://platform.openai.com/docs/guides/text-to-speech/supported-output-formats"/>
+		/// </summary>
+		[JsonProperty("response_format", DefaultValueHandling = DefaultValueHandling.Ignore)]
+		public string ResponseFormat { get; set; }
+
+		/// <summary>
+		/// The speed of the generated audio. Select a value from 0.25 to 4.0. 1.0 is the default.  Not serialized while null.
+		/// </summary>
+		[JsonProperty("speed", DefaultValueHandling = DefaultValueHandling.Ignore)]
+		public decimal? Speed { get; set; }
+
+		/// <summary>
+		/// Supported voices are alloy, echo, fable, onyx, nova, and shimmer. Previews of the voices are available in the Text to speech guide. See <seealso href="https://platform.openai.com/docs/guides/text-to-speech/voice-options"/>.
+		/// </summary>
+		public static class Voices
+		{
+#pragma warning disable CS1591 // Missing XML comment for publicly visible type or member
+			public const string Alloy = "alloy";
+			public const string Echo = "echo";
+			public const string Fable = "fable";
+			public const string Onyx = "onyx";
+			public const string Nova = "nova";
+			public const string Shimmer = "shimmer";
+#pragma warning restore CS1591 // Missing XML comment for publicly visible type or member
+		}
+
+		/// <summary>
+		/// The format to return for the generated audio.  See <seealso href="https://platform.openai.com/docs/guides/text-to-speech/supported-output-formats"/>
+		/// </summary>
+		public static class ResponseFormats
+		{
+			/// <summary>
+			/// The default, industry-standard audio format
+			/// </summary>
+			public const string MP3 = "mp3";
+			/// <summary>
+			/// For lossless audio compression, favored by audio enthusiasts for archiving
+			/// </summary>
+			public const string FLAC = "flac";
+			/// <summary>
+			/// For digital audio compression, preferred by YouTube, Android, iOS
+			/// </summary>
+			public const string AAC = "aac";
+			/// <summary>
+			/// For internet streaming and communication, low latency.
+			/// </summary>
+			public const string OPUS = "opus";
+		}
+	}
+}
@@ -20,7 +20,7 @@ public class ChatRequest
 		/// The model to use for this request
 		/// </summary>
 		[JsonProperty("model")]
-		public string Model { get; set; } = OpenAI_API.Models.Model.ChatGPTTurbo;
+		public string Model { get; set; } = OpenAI_API.Models.Model.DefaultChatModel;
 
 		/// <summary>
 		/// The messages to send with this Chat Request