forked from nagaoka252510/dsc_readup
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathvoice.py
115 lines (91 loc) · 3.36 KB
/
voice.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
# ソースはこちらから引用・改修 http://blog.cgfm.jp/garyu/archives/3396
import json
import os
import sys
import datetime
import argparse
import subprocess
import requests
import aiohttp
import asyncio
import async_timeout
import pprint
# config
# ===========================================
with open('token.json') as f:
df = json.load(f)
#Docomo 音声合成 API
API_KEY = df['docomo']
url = "https://api.apigw.smt.docomo.ne.jp/aiTalk/v1/textToSpeech?APIKEY="+API_KEY
async def fetch(session, url, data_fm, headers):
with async_timeout.timeout(10):
async with session.post(url, data=data_fm, headers=headers) as response:
if response.status != 200 :
print("Error API : " + str(response.status))
exit()
return await response.read()
async def knockApi(makemsg, msger, speed, r_range, pitch, group):
#バイナリデータの一時保存場所
tmp = "./cache/{}/".format(group)
if not os.path.isdir(tmp):
os.makedirs(tmp)
# aitalk パラメーター設定
# ===========================================
"""
参考)音声合成 | docomo Developer support
https://dev.smt.docomo.ne.jp/?p=docs.api.page&api_name=text_to_speech&p_name=api_1#tag01
'speaker' : "nozomi"、"seiji"、"akari"、"anzu"、"hiroshi"、"kaho"、"koutarou"、"maki"、"nanako"、"osamu"、"sumire"
'pitch' : ベースライン・ピッチ。 基準値:1.0、範囲:0.50~2.00
'range' : ピッチ・レンジ。基準値:1.0、範囲:0.00~2.00
'rate' : 読み上げる速度。基準値:1.0、範囲:0.50~4.00
'volume' : 音量。基準値:1.0、範囲:0.00~2.00
"""
prm = {
'speaker' : msger,
'pitch' : str(pitch),
'range' : str(r_range),
'rate' : str(speed),
'volume' : '2'
}
# パラメーター受取
# ===========================================
#%% arguments
"""
parser = argparse.ArgumentParser()
parser.add_argument('--text', type=str, required=True)
args = parser.parse_args()
text = args.text
"""
text = makemsg
# SSML生成
# ===========================================
xml = u'<?xml version="1.0" encoding="utf-8" ?>'
voice = '<voice name="' + prm["speaker"] + '">'
prosody = '<prosody rate="'+ prm['rate'] +'" pitch="'+ prm['pitch'] +'" range="'+ prm['range'] +'">'
xml += '<speak version="1.1">'+ voice + prosody + text + '</prosody></voice></speak>'
# utf-8にエンコード
xml = xml.encode("UTF-8")
# Docomo APIアクセス
# ===========================================
#print("Start API")
async with aiohttp.ClientSession() as session:
response = await fetch(session,
url,
data_fm=xml,
headers={
'Content-Type': 'application/ssml+xml',
'Accept' : 'audio/L16',
'Content-Length' : str(len(xml))
}
)
#現在日時を取得
now = datetime.datetime.now()
tstr = datetime.datetime.strftime(now, '%Y%m%d-%H%M%S%f')
#保存するファイル名
rawFile = tstr + ".raw"
#バイナリデータを保存
fp = open(tmp + rawFile, 'wb')
fp.write(response)
fp.close()
# PCM名を返す
return rawFile