Add whisper 1 support (#117)
* Add whisper 1 support * Resolve linting issues for audio source files
This commit is contained in:
100
audio.go
Normal file
100
audio.go
Normal file
@@ -0,0 +1,100 @@
|
||||
package gogpt
|
||||
|
||||
import (
|
||||
"bytes"
|
||||
"context"
|
||||
"fmt"
|
||||
"io"
|
||||
"mime/multipart"
|
||||
"net/http"
|
||||
"os"
|
||||
)
|
||||
|
||||
// Models provided by OpenAI to use when processing audio.
const (
	// Whisper1 is the identifier of the "whisper-1" model.
	Whisper1 = "whisper-1"
)
|
||||
|
||||
// AudioRequest represents a request structure for audio API.
type AudioRequest struct {
	// Model is the name of the model to use (for example Whisper1); it is
	// sent as the "model" field of the multipart form.
	Model string
	// FilePath is the path of the audio file to upload; the file is opened
	// and its contents are sent as the "file" field of the multipart form.
	FilePath string
}
|
||||
|
||||
// AudioResponse represents a response structure for audio API.
type AudioResponse struct {
	// Text is populated from the "text" key of the JSON response.
	Text string `json:"text"`
}
|
||||
|
||||
// CreateTranscription — API call to create a transcription. Returns transcribed text.
|
||||
func (c *Client) CreateTranscription(
|
||||
ctx context.Context,
|
||||
request AudioRequest,
|
||||
) (response AudioResponse, err error) {
|
||||
response, err = c.callAudioAPI(ctx, request, "transcriptions")
|
||||
return
|
||||
}
|
||||
|
||||
// CreateTranscription — API call to create a transcription. Returns transcribed text.
|
||||
func (c *Client) CreateTranslation(
|
||||
ctx context.Context,
|
||||
request AudioRequest,
|
||||
) (response AudioResponse, err error) {
|
||||
response, err = c.callAudioAPI(ctx, request, "translations")
|
||||
return
|
||||
}
|
||||
|
||||
// callAudioAPI — API call to an audio endpoint.
|
||||
func (c *Client) callAudioAPI(
|
||||
ctx context.Context,
|
||||
request AudioRequest,
|
||||
endpointSuffix string,
|
||||
) (response AudioResponse, err error) {
|
||||
var formBody bytes.Buffer
|
||||
w := multipart.NewWriter(&formBody)
|
||||
|
||||
if err = audioMultipartForm(request, w); err != nil {
|
||||
return
|
||||
}
|
||||
|
||||
urlSuffix := fmt.Sprintf("/audio/%s", endpointSuffix)
|
||||
req, err := http.NewRequestWithContext(ctx, http.MethodPost, c.fullURL(urlSuffix), &formBody)
|
||||
if err != nil {
|
||||
return
|
||||
}
|
||||
req.Header.Add("Content-Type", w.FormDataContentType())
|
||||
|
||||
err = c.sendRequest(req, &response)
|
||||
return
|
||||
}
|
||||
|
||||
// audioMultipartForm creates a form with audio file contents and the name of the model to use for
|
||||
// audio processing.
|
||||
func audioMultipartForm(request AudioRequest, w *multipart.Writer) error {
|
||||
f, err := os.Open(request.FilePath)
|
||||
if err != nil {
|
||||
return fmt.Errorf("opening audio file: %w", err)
|
||||
}
|
||||
|
||||
fw, err := w.CreateFormFile("file", f.Name())
|
||||
if err != nil {
|
||||
return fmt.Errorf("creating form file: %w", err)
|
||||
}
|
||||
|
||||
if _, err = io.Copy(fw, f); err != nil {
|
||||
return fmt.Errorf("reading from opened audio file: %w", err)
|
||||
}
|
||||
|
||||
fw, err = w.CreateFormField("model")
|
||||
if err != nil {
|
||||
return fmt.Errorf("creating form field: %w", err)
|
||||
}
|
||||
|
||||
modelName := bytes.NewReader([]byte(request.Model))
|
||||
if _, err = io.Copy(fw, modelName); err != nil {
|
||||
return fmt.Errorf("writing model name: %w", err)
|
||||
}
|
||||
w.Close()
|
||||
|
||||
return nil
|
||||
}
|
||||
Reference in New Issue
Block a user