Skip to content

Commit

Permalink
Merge pull request #5 from kojix2/transcription
Browse files Browse the repository at this point in the history
Rename audio classes to transcription
  • Loading branch information
stakach authored Nov 3, 2024
2 parents 7ee8d51 + f4a4ced commit 8c8358e
Show file tree
Hide file tree
Showing 3 changed files with 12 additions and 12 deletions.
4 changes: 2 additions & 2 deletions spec/audio_spec.cr
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,7 @@ module OpenAI
HTTP::Client::Response.new(200, body: AUDIO_RES)
end

req = AudioRequest.new(AUDIO_SAMPLE)
req = TranscriptionRequest.new(AUDIO_SAMPLE)
res = client.transcription(req)
res.text.should_not be_nil
end
Expand All @@ -35,7 +35,7 @@ module OpenAI
HTTP::Client::Response.new(200, body: AUDIO_RES)
end

req = AudioRequest.new(AUDIO_SAMPLE)
req = TranscriptionRequest.new(AUDIO_SAMPLE)
res = client.translation(req)
res.text.should_not be_nil
end
Expand Down
12 changes: 6 additions & 6 deletions src/openai/api/audio.cr
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@ require "file"

module OpenAI
# Whisper response formats. Whisper uses JSON format by default
enum AudioRespFormat
enum TranscriptionRespFormat
JSON
TEXT
SRT
Expand All @@ -16,8 +16,8 @@ module OpenAI
end
end

# AudioRequest represents a request structure for audio API
class AudioRequest
# TranscriptionRequest represents a request structure for audio API
class TranscriptionRequest
include JSON::Serializable

# The audio file object to transcribe, in one of these formats: flac, mp3, mp4, mpeg, mpga, m4a, ogg, wav, or webm.
Expand All @@ -31,7 +31,7 @@ module OpenAI
property prompt : String?

# The format of the transcript output, in one of these options: json, text, srt, verbose_json, or vtt.
property response_format : AudioRespFormat
property response_format : TranscriptionRespFormat

# The sampling temperature, between 0 and 1. Higher values like 0.8 will make the output more random, while lower values like 0.2 will make it
# more focused and deterministic. If set to 0, the model will use log probability to automatically increase the temperature until certain thresholds are hit.
Expand All @@ -40,7 +40,7 @@ module OpenAI
# The language of the input audio. Supplying the input language in ISO-639-1 format will improve accuracy and latency.
property language : String?

def initialize(@file, @model = "whisper-1", @prompt = nil, @response_format = AudioRespFormat::JSON, @temperature = 0.0, @language = nil)
def initialize(@file, @model = "whisper-1", @prompt = nil, @response_format = TranscriptionRespFormat::JSON, @temperature = 0.0, @language = nil)
end

def build_metada(builder : HTTP::FormData::Builder)
Expand All @@ -65,7 +65,7 @@ module OpenAI
include JSON::Serializable
end

record AudioResponse, task : String?, language : String?, duration : Float64?, segments : Array(Segment)?, text : String? do
record TranscriptionResponse, task : String?, language : String?, duration : Float64?, segments : Array(Segment)?, text : String? do
include JSON::Serializable
end
end
8 changes: 4 additions & 4 deletions src/openai/client.cr
Original file line number Diff line number Diff line change
Expand Up @@ -36,15 +36,15 @@ module OpenAI
#######################

# API call to transcribe audio into the input language.
def transcription(req : AudioRequest) : AudioResponse
multipart_api("/audio/transcriptions", req.model.to_s, AudioResponse) { |builder|
def transcription(req : TranscriptionRequest) : TranscriptionResponse
multipart_api("/audio/transcriptions", req.model.to_s, TranscriptionResponse) { |builder|
req.build_metada(builder)
}
end

# API call to translate audio into English.
def translation(req : AudioRequest) : AudioResponse
multipart_api("/audio/translations", req.model.to_s, AudioResponse) { |builder|
def translation(req : TranscriptionRequest) : TranscriptionResponse
multipart_api("/audio/translations", req.model.to_s, TranscriptionResponse) { |builder|
req.build_metada(builder)
}
end
Expand Down

0 comments on commit 8c8358e

Please sign in to comment.