-
-
Notifications
You must be signed in to change notification settings - Fork 17
/
Copy pathopenai-audio.el
115 lines (97 loc) · 4.57 KB
/
openai-audio.el
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
;;; openai-audio.el --- Create audio with OpenAI API -*- lexical-binding: t; -*-
;; Copyright (C) 2023-2025 Shen, Jen-Chieh
;; This file is not part of GNU Emacs.
;; This program is free software: you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation, either version 3 of the License, or
;; (at your option) any later version.
;; This program is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.
;; You should have received a copy of the GNU General Public License
;; along with this program. If not, see <https://www.gnu.org/licenses/>.
;;; Commentary:
;;
;; Create audio with OpenAI API.
;;
;; See https://platform.openai.com/docs/api-reference/audio
;;
;;; Code:
(require 'openai)
;;
;;; API
;;;###autoload
(cl-defun openai-audio-create-transcription (file callback
                                             &key
                                             (base-url openai-base-url)
                                             (parameters openai-parameters)
                                             (content-type "application/json")
                                             (key openai-key)
                                             org-id
                                             (model "whisper-1")
                                             prompt
                                             response-format
                                             temperature
                                             language)
  "Request a transcription of the audio FILE.

FILE is the audio to transcribe, in one of these formats: mp3, mp4, mpeg,
mpga, m4a, wav, or webm.  CALLBACK is called with the response data once
the request completes.

BASE-URL, PARAMETERS, CONTENT-TYPE, KEY and ORG-ID default to the global
options; pass a value explicitly to override one for this request only.

MODEL (default \"whisper-1\"), PROMPT, RESPONSE-FORMAT, TEMPERATURE and
LANGUAGE are placed in the request body as the fields `model', `prompt',
`response_format', `temperature' and `language'.  See the OpenAI API
reference page for their meaning."
  ;; NOTE(review): FILE is embedded in the JSON body exactly as given.  The
  ;; OpenAI audio endpoints are documented as multipart/form-data uploads;
  ;; confirm against `openai-request' whether a JSON body is accepted here.
  (openai-request (concat base-url "/audio/transcriptions")
    :type "POST"
    :params parameters
    :headers (openai--headers content-type key org-id)
    :data (openai--json-encode
           (list (cons "model" model)
                 (cons "file" file)
                 (cons "prompt" prompt)
                 (cons "response_format" response-format)
                 (cons "temperature" temperature)
                 (cons "language" language)))
    :parser 'json-read
    ;; Forward only the response data to the caller's CALLBACK.
    :complete (cl-function
               (lambda (&key ((:data response-data)) &allow-other-keys)
                 (funcall callback response-data)))))
;;;###autoload
(cl-defun openai-audio-create-translation (file callback
                                           &key
                                           (base-url openai-base-url)
                                           (parameters openai-parameters)
                                           (content-type "application/json")
                                           (key openai-key)
                                           org-id
                                           (model "whisper-1")
                                           prompt
                                           response-format
                                           temperature)
  "Request a translation of the audio FILE.

FILE is the audio to translate, in one of these formats: mp3, mp4, mpeg,
mpga, m4a, wav, or webm.  CALLBACK is called with the response data once
the request completes.

BASE-URL, PARAMETERS, CONTENT-TYPE, KEY and ORG-ID default to the global
options; pass a value explicitly to override one for this request only.

MODEL (default \"whisper-1\"), PROMPT, RESPONSE-FORMAT and TEMPERATURE are
placed in the request body as the fields `model', `prompt',
`response_format' and `temperature'.  See the OpenAI API reference page
for their meaning."
  ;; NOTE(review): FILE is embedded in the JSON body exactly as given.  The
  ;; OpenAI audio endpoints are documented as multipart/form-data uploads;
  ;; confirm against `openai-request' whether a JSON body is accepted here.
  (openai-request (concat base-url "/audio/translations")
    :type "POST"
    :params parameters
    :headers (openai--headers content-type key org-id)
    :data (openai--json-encode
           (list (cons "model" model)
                 (cons "file" file)
                 (cons "prompt" prompt)
                 (cons "response_format" response-format)
                 (cons "temperature" temperature)))
    :parser 'json-read
    ;; Forward only the response data to the caller's CALLBACK.
    :complete (cl-function
               (lambda (&key ((:data response-data)) &allow-other-keys)
                 (funcall callback response-data)))))
(provide 'openai-audio)
;;; openai-audio.el ends here