-
Notifications
You must be signed in to change notification settings - Fork 11
/
Copy pathlong_audio_recognition.py
48 lines (37 loc) · 1.61 KB
/
long_audio_recognition.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
import os
import time
from sys import argv
from speechkit import RecognitionLongAudio, Session
from speechkit.auth import generate_jwt
# Environment variables that must be set (and non-empty) before the script can run.
REQUIRED_ENV_VARS = ('YANDEX_KEY_ID', 'SERVICE_ACCOUNT_ID', 'BUCKET_NAME', 'YANDEX_PRIVATE_KEY')

# Seconds to wait between two polls for the recognition result.
POLL_INTERVAL_SECONDS = 2


def missing_env_vars(environ):
    """Return the names in REQUIRED_ENV_VARS that are unset or empty in *environ*.

    *environ* is any mapping with a ``get`` method (normally ``os.environ``).
    The result keeps the order of REQUIRED_ENV_VARS; it is empty when the
    configuration is complete.
    """
    return [name for name in REQUIRED_ENV_VARS if not environ.get(name)]


def decode_private_key(raw_key):
    """Convert a private key stored on a single line into bytes.

    Every literal backslash-n pair in *raw_key* is replaced by a real newline
    character, then the string is encoded to bytes.
    """
    return raw_key.replace('\\n', '\n').encode()


def main():
    """Send the audio file named on the command line for recognition and print the result.

    Reads the file name from ``argv`` and the credentials from the environment
    variables listed in REQUIRED_ENV_VARS.

    Raises:
        SystemExit: with an explanatory message (non-zero exit status) when the
            command-line argument or a required environment variable is missing.
    """
    if len(argv) != 2:
        raise SystemExit("Specify exactly one argument: the path of the audio file to recognize.")
    filename = argv[1]

    # Validate before touching any value: calling `.replace()` on an unset
    # variable would fail with AttributeError instead of a readable message.
    missing = missing_env_vars(os.environ)
    if missing:
        raise SystemExit(
            "Specify {} environment variables.".format(
                ", ".join("`{}`".format(name) for name in missing)
            )
        )

    bucket_name = os.environ['BUCKET_NAME']
    service_account_id = os.environ['SERVICE_ACCOUNT_ID']
    key_id = os.environ['YANDEX_KEY_ID']
    private_key = decode_private_key(os.environ['YANDEX_PRIVATE_KEY'])

    jwt = generate_jwt(service_account_id, key_id, private_key)
    session = Session.from_jwt(jwt)

    # Maybe you want to create the AWS S3 key only once.
    # In that case, from version 2.2.0 you can request it explicitly:
    access_key_id, secret = RecognitionLongAudio.get_aws_credentials(session, service_account_id)

    # ...and then pass it in:
    recognize_long_audio = RecognitionLongAudio(
        session, service_account_id, bucket_name,
        aws_access_key_id=access_key_id, aws_secret=secret
    )

    # Or you can let the class obtain the credentials automatically:
    # recognize_long_audio = RecognitionLongAudio(session, service_account_id, bucket_name)

    print("Sending file for recognition...")
    recognize_long_audio.send_for_recognition(
        filename, audioEncoding='LINEAR16_PCM', sampleRateHertz='48000',
        audioChannelCount=1, rawResults=False
    )

    # Poll until get_recognition_results() returns a truthy value.
    while True:
        time.sleep(POLL_INTERVAL_SECONDS)
        if recognize_long_audio.get_recognition_results():
            break
        print("Recognizing...")

    data = recognize_long_audio.get_data()
    print("DATA:\n\n", data)

    text = recognize_long_audio.get_raw_text()
    print("TEXT:\n\n", text)


if __name__ == '__main__':
    main()