所需文件下载地址
链接:https://pan.baidu.com/s/1Dzbv8gPUZJ3T8Fe02hOJvg
提取码:zbgt
Python 源文件(共两个,文件名标注在各自代码之后)
from flask import Flask, jsonify,send_file
from flask import render_template
from flask import request
from uuid import uuid4
from other import audio2text, text2audio, my_nlp

app = Flask(__name__)


@app.route("/")
def index():
    """Render the front-end page (``WebToy.html``)."""
    return render_template("WebToy.html")


@app.route("/upload", methods=["POST"])
def upload():
    """Answer one uploaded voice recording with text and synthesized speech.

    The file in the ``reco`` form field is saved under a random ``.wav``
    name and passed through ``audio2text`` -> ``my_nlp`` -> ``text2audio``.

    Returns:
        A JSON response with ``filename`` (the value returned by
        ``text2audio``), ``content`` (the reply text) and ``code`` 0.
        When the request carries no ``reco`` file, a JSON body with
        ``code`` 1 is returned together with HTTP status 400.
    """
    recording = request.files.get("reco")
    if recording is None:
        # Without this guard the ``save`` call below raises AttributeError
        # and the client only sees an opaque HTTP 500.
        return jsonify({"code": 1, "msg": "missing uploaded file 'reco'"}), 400

    wav_name = f"{uuid4()}.wav"
    recording.save(wav_name)

    question = audio2text(wav_name)
    reply_text = my_nlp(question)
    reply_audio = text2audio(reply_text)

    return jsonify({
        "filename": reply_audio,
        "content": reply_text,
        "code": 0,
    })
@app.route("/get_file/<filename>")
def get_file(filename):
    """Send a previously generated audio file to the client.

    Args:
        filename: File name taken from the URL path.

    Returns:
        The file via ``send_file``; a JSON error body with HTTP status 404
        when ``filename`` is not a bare ``.mp3`` file name.
    """
    # ``filename`` is untrusted URL input.  The names handed out by
    # ``upload`` come from ``text2audio`` and always end in ".mp3", so
    # anything else (source files, nested paths) is refused instead of
    # being served from the application directory.
    is_bare_name = "/" not in filename and "\\" not in filename
    if not (is_bare_name and filename.endswith(".mp3")):
        return jsonify({"code": 1, "msg": "file not found"}), 404
    return send_file(filename)


if __name__ == '__main__':
    # NOTE(review): debug=True enables the interactive debugger while the
    # server listens on every interface (0.0.0.0) -- confirm this entry
    # point is only used for local development.
    app.run('0.0.0.0', 9527, debug=True)
以上代码为 app.py
from aip import AipNlp
from aip import AipSpeech
from uuid import uuid4
import requests
import os

# Credentials passed to the AipSpeech / AipNlp clients.  Each value can be
# overridden through an environment variable; the literals are kept as
# defaults so existing deployments behave exactly as before.
# NOTE(review): these keys are committed in source -- consider rotating them
# and dropping the defaults.
APP_ID = os.environ.get('BAIDU_APP_ID', '')
API_KEY = os.environ.get('BAIDU_API_KEY', 'gBsfoHWw4pOh9n3sNhwoB853')
SECRET_KEY = os.environ.get(
    'BAIDU_SECRET_KEY', '4e0WXxlTo5lMgFu45lLnO490SnnpLQLN')

# Speech client used for both recognition (asr) and synthesis.
client = AipSpeech(APP_ID, API_KEY, SECRET_KEY)
# NLP client used by ``my_nlp`` for short-text similarity (simnet).
nlp_client = AipNlp(APP_ID, API_KEY, SECRET_KEY)

# (reference question, minimum simnet score, canned reply), tried in order.
_CANNED_REPLIES = (
    ("你叫什么名字", 0.58, '我叫人工智障'),
    ("你今年几岁了", 0.75, '永远18岁'),
)


def get_file_content(filePath):
    """Convert an audio file to raw PCM with ffmpeg and return the bytes.

    The converted data is written next to the input as ``<filePath>.pcm``
    (signed 16-bit little-endian, mono, 16000 Hz) and then read back.

    Args:
        filePath: Path of the audio file to convert.

    Returns:
        The contents of the generated ``.pcm`` file as ``bytes``.

    Raises:
        subprocess.CalledProcessError: ffmpeg exited with a non-zero status.
        FileNotFoundError: the ``ffmpeg`` executable is not available.
    """
    # Local import keeps this block self-contained.
    import subprocess

    source_path = str(filePath)
    pcm_path = f"{source_path}.pcm"
    # An argument list (no shell) keeps paths containing spaces or shell
    # metacharacters from being split or interpreted; check=True surfaces a
    # failed conversion instead of reading a missing or stale .pcm file.
    subprocess.run(
        [
            "ffmpeg", "-y", "-i", source_path,
            "-acodec", "pcm_s16le", "-f", "s16le",
            "-ac", "1", "-ar", "16000",
            pcm_path,
        ],
        check=True,
    )
    with open(pcm_path, 'rb') as fp:
        return fp.read()


def audio2text(filePath):
    """Run speech recognition on an audio file and return the top result.

    Args:
        filePath: Path of the audio file; it is converted to PCM first.

    Returns:
        The first entry of the ``result`` list in the recognition response.

    Raises:
        RuntimeError: the response contains no ``result`` entries.
    """
    ret = client.asr(get_file_content(filePath), 'pcm', 16000, {
        'dev_pid': 1536,  # recognition model id -- see the Baidu ASR docs
    })
    candidates = ret.get("result")
    if not candidates:
        # Failed recognitions come back without "result"; report the whole
        # response rather than failing with "'NoneType' is not subscriptable".
        raise RuntimeError(f"speech recognition returned no result: {ret}")
    return candidates[0]


def to_tuling(text, uid):
    """Send ``text`` to the Tuling chatbot API and return its text reply.

    Args:
        text: The user's utterance.
        uid: Identifier sent as ``userInfo.userId``.

    Returns:
        The ``text`` value of the first entry in the response ``results``.

    Raises:
        RuntimeError: the response contains no ``results`` entries.
    """
    data = {
        "perception": {
            "inputText": {
                "text": text,
            },
        },
        "userInfo": {
            "apiKey": "934b6f5ee4c44370bd2daf71ed7b0b77",
            "userId": uid,
        },
    }
    # A timeout keeps a stalled remote service from blocking the caller
    # forever (requests waits indefinitely by default).
    res = requests.post(
        "http://openapi.tuling123.com/openapi/api/v2", json=data, timeout=10)
    payload = res.json()
    results = payload.get('results')
    if not results:
        raise RuntimeError(f"tuling returned no results: {payload}")
    return results[0].get('values').get('text')


def my_nlp(text):
    """Pick a reply for ``text``.

    ``text`` is compared against each canned question with
    ``nlp_client.simnet``; the first one whose score reaches its threshold
    wins.  If none matches, the reply comes from ``to_tuling``.

    Args:
        text: The recognized user utterance.

    Returns:
        The reply text.
    """
    for question, threshold, reply in _CANNED_REPLIES:
        # A response without a score (e.g. an error dict) counts as "no
        # match" instead of raising TypeError on ``None >= float``.
        score = nlp_client.simnet(text, question).get('score') or 0
        if score >= threshold:
            return reply
    return to_tuling(text, 'open123')


def text2audio(text):
    """Synthesize ``text`` to speech and store it in a new ``.mp3`` file.

    Args:
        text: The text to speak.

    Returns:
        The randomly generated ``<uuid4>.mp3`` file name.  The name is
        returned even when synthesis fails, in which case no file is
        written.
    """
    result = client.synthesis(text, 'zh', 1, {
        'vol': 5,
        'spd': 4,
        'pit': 7,
        'per': 4,
    })
    filename = f"{uuid4()}.mp3"
    # On success the call returns the audio as binary data; on failure it
    # returns a dict (see the service's error codes).
    if not isinstance(result, dict):
        with open(filename, 'wb') as f:
            f.write(result)
    return filename
以上代码为 other.py