-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathtranscribe.py
69 lines (56 loc) · 2.1 KB
/
transcribe.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
from enum import Enum
from urllib.parse import urljoin
import requests
class ModelNames(str, Enum):
    """Names of the Whisper models that can be requested.

    The ``str`` mixin makes every member a string as well, so a member
    compares equal to its plain-text value (``ModelNames.tiny == "tiny"``).
    """

    # Tiny / base / small / medium, each with an English-only ("_en") variant.
    tiny = "tiny"
    tiny_en = "tiny_en"
    base = "base"
    base_en = "base_en"
    small = "small"
    small_en = "small_en"
    medium = "medium"
    medium_en = "medium_en"

    # Large model family.
    large_v1 = "large_v1"
    large_v2 = "large_v2"
    large_v3 = "large_v3"
    large = "large"

    # Turbo variants.
    large_v3_turbo = "large_v3_turbo"
    turbo = "turbo"
class Transcriber:
    """Client for an HTTP transcription service.

    Audio is sent to the ``transcribe`` endpoint below ``api_url``, either as
    a URL string in a JSON body or as an uploaded local file.
    """

    def __init__(self, api_url):
        """Remember the base URL of the service.

        Args:
            api_url: Base URL of the API, with or without a trailing slash.
        """
        self.api_url = api_url

    @property
    def transcribe_endpoint(self):
        """Return the full URL of the ``transcribe`` endpoint."""
        # urljoin() replaces the last path segment of a base that does not
        # end in "/", so "http://host/api" would become
        # "http://host/transcribe". Normalising the trailing slash keeps any
        # path prefix in the base URL intact.
        base = self.api_url.rstrip('/') + '/'
        return urljoin(base, 'transcribe')

    def is_remote_url(self, file):
        """Return True if ``file`` is a string starting with http:// or https://.

        The full scheme prefix is required so that a local file whose name
        merely begins with "http" (e.g. ``http_call.mp3``) is not treated as
        a URL. The comparison ignores case.
        """
        if not isinstance(file, str):
            return False
        return file.lower().startswith(('http://', 'https://'))

    @staticmethod
    def _model_name(model):
        """Return the plain value for ``model``, given as an Enum member or a string."""
        return model.value if isinstance(model, Enum) else model

    def transcribe(self, file, model=ModelNames.tiny):
        """Transcribe ``file`` and return the decoded JSON response.

        Args:
            file: An http(s) URL, or a path to a local audio file.
            model: Model to use, as a ``ModelNames`` member or its string
                value.

        Returns:
            The JSON body of the server response, decoded.

        Raises:
            requests.HTTPError: If the server answers with an error status.
        """
        if self.is_remote_url(file):
            return self.transcribe_remote(file, model)
        return self.transcribe_local(file, model)

    def transcribe_remote(self, url, model):
        """Send ``url`` to the transcribe endpoint as JSON and return the decoded reply."""
        json_data = {'file': url, 'model': self._model_name(model)}
        response = requests.post(self.transcribe_endpoint, json=json_data)
        response.raise_for_status()
        return response.json()

    def transcribe_local(self, file_path, model):
        """Upload the file at ``file_path`` and return the decoded reply."""
        # The request must be made while the file is still open, because
        # requests reads the upload from the file handle.
        with open(file_path, 'rb') as file:
            files = {'file': file}
            data = {'model': self._model_name(model)}
            response = requests.post(self.transcribe_endpoint, files=files, data=data)
        response.raise_for_status()
        return response.json()
if __name__ == "__main__":
    # Base URL of the API. When running in Colab, use your ngrok URL
    # instead, e.g. https://YOUR-URL.ngrok-free.app/
    API_URL = "http://127.0.0.1:8008/"
    transcriber = Transcriber(API_URL)

    # Remote file example: pass a URL and pick the model explicitly.
    sample_url = 'https://storage.googleapis.com/aai-web-samples/Custom-Home-Builder.mp3'
    remote_result = transcriber.transcribe(sample_url, ModelNames.medium)
    print("Remote transcription:", remote_result)

    # Local file example: pass a file path; no model is given, so the
    # default of transcribe() is used.
    sample_path = 'Custom-Home-Builder.mp3'
    local_result = transcriber.transcribe(sample_path)
    print("Local transcription:", local_result)