diff --git a/requirements_o2.6.txt b/requirements_o2.6.txt index ae9ac2f..be94820 100644 --- a/requirements_o2.6.txt +++ b/requirements_o2.6.txt @@ -13,6 +13,8 @@ librosa==0.9.0 decord moviepy -# for web +# for web demo +aiofiles==24.1.0 +onnxruntime==1.20.1 fastapi uvicorn diff --git a/web_demos/minicpm-o_2.6/model_server.py b/web_demos/minicpm-o_2.6/model_server.py index 9cfb876..8f37bf8 100644 --- a/web_demos/minicpm-o_2.6/model_server.py +++ b/web_demos/minicpm-o_2.6/model_server.py @@ -54,7 +54,7 @@ app = FastAPI() logger = setup_logger() ap = argparse.ArgumentParser() -ap.add_argument('--port', type=int , default=8088) +ap.add_argument('--port', type=int , default=32550) args = ap.parse_args() @@ -523,13 +523,13 @@ class StreamManager: for r in self.minicpmo_model.streaming_generate( session_id=str(self.session_id), tokenizer=self.minicpmo_tokenizer, - use_tts=True, + generate_audio=True, # enable_regenerate=True, ): if self.stop_response: self.generate_end() return - audio_np, sr, text = r + audio_np, sr, text = r["audio_wav"], r["sampling_rate"], r["text"] output_audio_path = self.savedir + f'/output_audio_log/output_audio_{self.output_audio_id}.wav' self.output_audio_id += 1