import io import json import os import traceback from typing import * import soundfile as sf from flask import Flask, make_response, request, send_file from scipy.io.wavfile import write from modules.server.model import VoiceServerModel model: Optional[VoiceServerModel] = None app = Flask(__name__) @app.route('/ping') def ping(): return make_response("server is alive", 200) @app.route('/upload_model', methods=['POST']) def upload_model(): """ input: json: rvc_model_file: str specify rvc model's absolute path (.pt, .pth) faiss_index_file: Optional[str] specify faiss index'S absolute path (.index) """ global model if request.method == "POST": rvc_model_file = request.json["rvc_model_file"] faiss_index_file =request.json["faiss_index_file"] if "faiss_index_file" in request.json else "" try: model = VoiceServerModel(rvc_model_file, faiss_index_file) return make_response("model is load", 200) except: traceback.print_exc() return make_response("model load error", 400) else: return make_response("use post method", 400) @app.route('/convert_sound', methods=['POST']) def convert_sound(): """ input: params: json speaker_id: int default: 0 transpose: int default: 0 pitch_extraction_algo: str default: dio value: ["dio", "harvest", "mangio-crepe", "crepe"] retrieval_feature_ratio: float default: 0 value: 0. ~ 1. input_wav: wav file output: wavfile """ global model if model is None: return make_response("please upload model", 400) print("start") if request.method == "POST": input_buffer = io.BytesIO(request.files["input_wav"].stream.read()) audio, sr = sf.read(input_buffer) req_json = json.load(io.BytesIO(request.files["params"].stream.read())) sid = int(req_json.get("speaker_id", 0)) transpose = int(req_json.get("transpose", 0)) pitch_extraction_algo = req_json.get("pitch_extraction_algo", "dio") if not pitch_extraction_algo in ["dio", "harvest", "mangio-crepe", "crepe"]: return make_response("bad pitch extraction algo", 400) retrieval_feature_ratio = float(req_json.get("retrieval_feature_ratio", 0.)) out_audio = model(audio, sr, sid, transpose, pitch_extraction_algo, retrieval_feature_ratio) output_buffer = io.BytesIO() write(output_buffer, rate=model.tgt_sr, data=out_audio) output_buffer.seek(0) response = make_response(send_file(output_buffer, mimetype="audio/wav"), 200) return response else: return make_response("use post method", 400) if __name__ == "__main__": app.run()