main
HuangHai 3 months ago
parent 13b8b26f0c
commit 570a6406b5

@ -0,0 +1,180 @@
#coding=utf-8
'''
Requires Python 3.6 or later.
asyncio is part of the Python standard library and does not need to be installed.
pip install websockets
'''
import asyncio
import copy
import gzip
import json
import os
import uuid

import websockets
# Lookup tables that turn the 4-bit header fields of a server frame into
# human-readable text. Keys are the raw nibble values found in the header.

# Message type (high nibble of header byte 1).
MESSAGE_TYPES = {
    0xb: "audio-only server response",
    0xc: "frontend server response",
    0xf: "error message from server",
}

# Message-type-specific flags (low nibble of header byte 1).
MESSAGE_TYPE_SPECIFIC_FLAGS = {
    0x0: "no sequence number",
    0x1: "sequence number > 0",
    0x2: "last message from server (seq < 0)",
    0x3: "sequence number < 0",
}

# Payload serialization method (high nibble of header byte 2).
MESSAGE_SERIALIZATION_METHODS = {
    0x0: "no serialization",
    0x1: "JSON",
    0xf: "custom type",
}

# Payload compression (low nibble of header byte 2).
MESSAGE_COMPRESSIONS = {
    0x0: "no compression",
    0x1: "gzip",
    0xf: "custom compression method",
}
# Q1: Where can the following parameters be obtained: appid, cluster, token,
# authorization_type, secret_key?
# https://www.volcengine.com/docs/6561/196768#q1%EF%BC%9A%E5%93%AA%E9%87%8C%E5%8F%AF%E4%BB%A5%E8%8E%B7%E5%8F%96%E5%88%B0%E4%BB%A5%E4%B8%8B%E5%8F%82%E6%95%B0appid%EF%BC%8Ccluster%EF%BC%8Ctoken%EF%BC%8Cauthorization-type%EF%BC%8Csecret-key-%EF%BC%9F
# https://www.volcengine.com/docs/6561/1257544
#
# Each setting below can be overridden through an environment variable; the
# literal is only the fallback, so behaviour is unchanged when none is set.
# NOTE(review): the fallback token is a credential committed to source
# control -- rotate it and supply the real value through VOLC_TTS_TOKEN.
appid = os.environ.get("VOLC_TTS_APPID", "2258132518")
token = os.environ.get("VOLC_TTS_TOKEN", "kwC-THR8FyGqwCfhSvQI0nqB_VBS9mGW")
cluster = os.environ.get("VOLC_TTS_CLUSTER", "volcano_tts")
# Voice "Wanwan Xiaohe"
voice_type = os.environ.get("VOLC_TTS_VOICE_TYPE", "zh_female_wanwanxiaohe_moon_bigtts")
host = "openspeech.bytedance.com"
# Websocket endpoint that test_submit / test_query connect to.
api_url = f"wss://{host}/api/v1/tts/ws_binary"
# Fixed 4-byte header placed in front of every client request. Each of the
# first three bytes packs two 4-bit fields (high nibble | low nibble):
#   byte 0 = 0x11: protocol version b0001      | header size b0001
#   byte 1 = 0x10: message type b0001 (full client request)
#                                              | type-specific flags b0000 (none)
#   byte 2 = 0x11: serialization b0001 (JSON)  | compression b0001 (gzip)
#   byte 3 = 0x00: reserved
default_header = bytearray([0x11, 0x10, 0x11, 0x00])
# Template for the JSON request body. test_submit / test_query deep-copy it
# and overwrite the "xxx" placeholders before sending.
request_json = {
    "app": {
        "appid": appid,
        # Literal placeholder string; the real token is sent in the
        # Authorization header built by test_submit / test_query.
        "token": "access_token",
        "cluster": cluster,
    },
    "user": {
        "uid": "388808087185088",
    },
    "audio": {
        "voice_type": "xxx",  # placeholder, replaced with voice_type
        "encoding": "mp3",
        "speed_ratio": 1.0,
        "volume_ratio": 1.0,
        "pitch_ratio": 1.0,
    },
    "request": {
        "reqid": "xxx",  # placeholder, replaced with a fresh UUID per request
        "text": "字节跳动语音合成。",
        "text_type": "plain",
        "operation": "xxx",  # placeholder, replaced with "submit" or "query"
    },
}
async def test_submit():
    """Send a "submit" request and save the returned audio to test_submit.mp3.

    The request body is a deep copy of ``request_json`` with the voice type,
    a fresh UUID request id and the "submit" operation filled in. It is
    JSON-encoded, gzip-compressed and framed as
    ``default_header + 4-byte big-endian payload length + payload``.

    Every frame received from the server is passed to ``parse_response``,
    which writes audio bytes to the output file; reading stops as soon as
    ``parse_response`` returns a truthy value.
    """
    submit_request_json = copy.deepcopy(request_json)
    submit_request_json["audio"]["voice_type"] = voice_type
    submit_request_json["request"]["reqid"] = str(uuid.uuid4())
    submit_request_json["request"]["operation"] = "submit"

    payload_bytes = json.dumps(submit_request_json).encode()
    payload_bytes = gzip.compress(payload_bytes)  # if no compression, comment this line

    full_client_request = bytearray(default_header)
    full_client_request.extend(len(payload_bytes).to_bytes(4, 'big'))  # payload size (4 bytes)
    full_client_request.extend(payload_bytes)  # payload

    print("\n------------------------ test 'submit' -------------------------")
    print("request json: ", submit_request_json)
    print("\nrequest bytes: ", full_client_request)

    header = {"Authorization": f"Bearer; {token}"}
    # The context manager guarantees the output file is closed even when
    # connecting, receiving or parsing raises.
    with open("test_submit.mp3", "wb") as file_to_save:
        # NOTE(review): recent websockets releases name this keyword
        # `additional_headers` instead of `extra_headers` -- confirm against
        # the installed version.
        async with websockets.connect(api_url, extra_headers=header, ping_interval=None) as ws:
            await ws.send(full_client_request)
            while True:
                res = await ws.recv()
                if parse_response(res, file_to_save):
                    break
            print("\nclosing the connection...")
async def test_query():
    """Send a "query" request and save the single response to test_query.mp3.

    The request body is a deep copy of ``request_json`` with the voice type,
    a fresh UUID request id and the "query" operation filled in. It is
    JSON-encoded, gzip-compressed and framed as
    ``default_header + 4-byte big-endian payload length + payload``.

    Exactly one frame is read from the server and handed to
    ``parse_response``; its return value is ignored.
    """
    query_request_json = copy.deepcopy(request_json)
    query_request_json["audio"]["voice_type"] = voice_type
    query_request_json["request"]["reqid"] = str(uuid.uuid4())
    query_request_json["request"]["operation"] = "query"

    payload_bytes = json.dumps(query_request_json).encode()
    payload_bytes = gzip.compress(payload_bytes)  # if no compression, comment this line

    full_client_request = bytearray(default_header)
    full_client_request.extend(len(payload_bytes).to_bytes(4, 'big'))  # payload size (4 bytes)
    full_client_request.extend(payload_bytes)  # payload

    print("\n------------------------ test 'query' -------------------------")
    print("request json: ", query_request_json)
    print("\nrequest bytes: ", full_client_request)

    header = {"Authorization": f"Bearer; {token}"}
    # The context manager guarantees the output file is closed even when
    # connecting, receiving or parsing raises.
    with open("test_query.mp3", "wb") as file_to_save:
        # NOTE(review): recent websockets releases name this keyword
        # `additional_headers` instead of `extra_headers` -- confirm against
        # the installed version.
        async with websockets.connect(api_url, extra_headers=header, ping_interval=None) as ws:
            await ws.send(full_client_request)
            res = await ws.recv()
            parse_response(res, file_to_save)
            print("\nclosing the connection...")
def parse_response(res, file):
    """Decode one binary server frame, print its fields and store any audio.

    Frame layout as read here: byte 0 holds protocol version (high nibble)
    and header size in 4-byte units (low nibble); byte 1 holds message type
    and type-specific flags; byte 2 holds serialization method and
    compression; byte 3 is reserved. Everything after ``header_size * 4``
    bytes is the payload.

    Args:
        res: Raw frame bytes received from the websocket.
        file: Writable binary file-like object; audio bytes are written to it.

    Returns:
        True when the caller should stop reading: an audio frame with a
        negative sequence number, an error frame, or an unrecognised
        message type. False otherwise (ACK, intermediate audio chunk,
        frontend message).
    """
    print("--------------------------- response ---------------------------")
    protocol_version = res[0] >> 4
    header_size = res[0] & 0x0f
    message_type = res[1] >> 4
    message_type_specific_flags = res[1] & 0x0f
    serialization_method = res[2] >> 4
    message_compression = res[2] & 0x0f
    reserved = res[3]
    header_extensions = res[4:header_size * 4]
    payload = res[header_size * 4:]

    # Use .get() so an unexpected nibble value is reported as "unknown"
    # instead of raising KeyError before the message can be handled.
    message_type_name = MESSAGE_TYPES.get(message_type, "unknown")
    flags_name = MESSAGE_TYPE_SPECIFIC_FLAGS.get(message_type_specific_flags, "unknown")
    serialization_name = MESSAGE_SERIALIZATION_METHODS.get(serialization_method, "unknown")
    compression_name = MESSAGE_COMPRESSIONS.get(message_compression, "unknown")

    print(f" Protocol version: {protocol_version:#x} - version {protocol_version}")
    print(f" Header size: {header_size:#x} - {header_size * 4} bytes ")
    print(f" Message type: {message_type:#x} - {message_type_name}")
    print(f" Message type specific flags: {message_type_specific_flags:#x} - {flags_name}")
    print(f"Message serialization method: {serialization_method:#x} - {serialization_name}")
    print(f" Message compression: {message_compression:#x} - {compression_name}")
    print(f" Reserved: {reserved:#04x}")
    if header_size != 1:
        print(f" Header extensions: {header_extensions}")

    if message_type == 0xb:  # audio-only server response
        if message_type_specific_flags == 0:  # no sequence number as ACK
            print(" Payload size: 0")
            return False
        # Payload = signed 4-byte sequence number, 4-byte size, audio bytes.
        sequence_number = int.from_bytes(payload[:4], "big", signed=True)
        payload_size = int.from_bytes(payload[4:8], "big", signed=False)
        payload = payload[8:]
        print(f" Sequence number: {sequence_number}")
        print(f" Payload size: {payload_size} bytes")
        file.write(payload)
        # A negative sequence number marks the final audio chunk.
        return sequence_number < 0

    if message_type == 0xf:  # error message from server
        code = int.from_bytes(payload[:4], "big", signed=False)
        msg_size = int.from_bytes(payload[4:8], "big", signed=False)
        error_msg = payload[8:]
        if message_compression == 1:
            error_msg = gzip.decompress(error_msg)
        error_msg = str(error_msg, "utf-8")
        print(f" Error message code: {code}")
        print(f" Error message size: {msg_size} bytes")
        print(f" Error message: {error_msg}")
        return True

    if message_type == 0xc:  # frontend server response
        payload = payload[4:]  # skip the 4-byte message size
        if message_compression == 1:
            payload = gzip.decompress(payload)
        print(f" Frontend message: {payload}")
        # Explicitly falsy so the caller keeps reading.
        return False

    print("undefined message type!")
    return True
if __name__ == '__main__':
    # Create the event loop explicitly: calling asyncio.get_event_loop() with
    # no running loop is deprecated and fails on the newest Python releases.
    # new_event_loop() keeps the script usable on Python 3.6 as well.
    loop = asyncio.new_event_loop()
    asyncio.set_event_loop(loop)
    try:
        loop.run_until_complete(test_submit())
        loop.run_until_complete(test_query())
    finally:
        # Release the loop's resources even if one of the demos raised.
        loop.close()
Loading…
Cancel
Save