| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455 |
- /**
- * Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights
- * Reserved. MIT License (https://opensource.org/licenses/MIT)
- */
- /* 2022-2023 by zhaomingwork */
- // client for websocket, support multiple threads
- // ./funasr-wss-client --server-ip <string>
- // --port <string>
- // --wav-path <string>
- // [--thread-num <int>]
- // [--is-ssl <int>] [--]
- // [--version] [-h]
- // example:
- // ./funasr-wss-client --server-ip 127.0.0.1 --port 10095 --wav-path test.wav --thread-num 1 --is-ssl 1
#define ASIO_STANDALONE 1
#include <websocketpp/client.hpp>
#include <websocketpp/common/thread.hpp>
#include <websocketpp/config/asio_client.hpp>
#ifdef _WIN32
// Needed for SetConsoleOutputCP(). Kept after the websocketpp/asio headers so
// that their winsock2.h include comes first.
#include <windows.h>
#endif
#include <atomic>
#include <chrono>
#include <fstream>
#include <sstream>
#include <string>
#include <thread>
#include <unordered_map>
#include <vector>
#include <glog/logging.h>
#include "util.h"
#include "audio.h"
#include "nlohmann/json.hpp"
#include "tclap/CmdLine.h"
/**
 * Portable helper that pauses the calling thread for a short, fixed time
 * (200 microseconds) between polls of the connection state.
 *
 * Implemented with std::this_thread::sleep_for so that every platform sleeps
 * for the same duration; the platform-specific calls it replaces took their
 * argument in different units (Sleep: milliseconds, usleep: microseconds).
 */
void WaitABit() {
  std::this_thread::sleep_for(std::chrono::microseconds(200));
}
- std::atomic<int> wav_index(0);
- typedef websocketpp::config::asio_client::message_type::ptr message_ptr;
- typedef websocketpp::lib::shared_ptr<websocketpp::lib::asio::ssl::context> context_ptr;
- using websocketpp::lib::bind;
- using websocketpp::lib::placeholders::_1;
- using websocketpp::lib::placeholders::_2;
- context_ptr OnTlsInit(websocketpp::connection_hdl) {
- context_ptr ctx = websocketpp::lib::make_shared<asio::ssl::context>(
- asio::ssl::context::sslv23);
- try {
- ctx->set_options(
- asio::ssl::context::default_workarounds | asio::ssl::context::no_sslv2 |
- asio::ssl::context::no_sslv3 | asio::ssl::context::single_dh_use);
- } catch (std::exception& e) {
- LOG(ERROR) << e.what();
- }
- return ctx;
- }
- // template for tls or not config
- template <typename T>
- class WebsocketClient {
- public:
- // typedef websocketpp::client<T> client;
- // typedef websocketpp::client<websocketpp::config::asio_tls_client>
- // wss_client;
- typedef websocketpp::lib::lock_guard<websocketpp::lib::mutex> scoped_lock;
- WebsocketClient(int is_ssl) : m_open(false), m_done(false) {
- // set up access channels to only log interesting things
- m_client.clear_access_channels(websocketpp::log::alevel::all);
- m_client.set_access_channels(websocketpp::log::alevel::connect);
- m_client.set_access_channels(websocketpp::log::alevel::disconnect);
- m_client.set_access_channels(websocketpp::log::alevel::app);
- // Initialize the Asio transport policy
- m_client.init_asio();
- // Bind the handlers we are using
- using websocketpp::lib::bind;
- using websocketpp::lib::placeholders::_1;
- m_client.set_open_handler(bind(&WebsocketClient::on_open, this, _1));
- m_client.set_close_handler(bind(&WebsocketClient::on_close, this, _1));
- m_client.set_message_handler(
- [this](websocketpp::connection_hdl hdl, message_ptr msg) {
- on_message(hdl, msg);
- });
- m_client.set_fail_handler(bind(&WebsocketClient::on_fail, this, _1));
- m_client.clear_access_channels(websocketpp::log::alevel::all);
- }
- void on_message(websocketpp::connection_hdl hdl, message_ptr msg) {
- const std::string& payload = msg->get_payload();
- switch (msg->get_opcode()) {
- case websocketpp::frame::opcode::text:
- total_recv=total_recv+1;
- LOG(INFO)<< "Thread: " << this_thread::get_id() << ", total_recv=" << total_recv <<", on_message = " << payload;
- std::unique_lock<std::mutex> lock(msg_lock);
- cv.notify_one();
- if(close_client)
- {
- LOG(INFO)<< "Thread: " << this_thread::get_id() << ", close client thread";
- websocketpp::lib::error_code ec;
- m_client.close(m_hdl, websocketpp::close::status::going_away, "", ec);
- if (ec){
- LOG(ERROR)<< "Error closing connection " << ec.message();
- }
- }
- }
- }
- // This method will block until the connection is complete
- void run(const std::string& uri, const std::vector<string>& wav_list, const std::vector<string>& wav_ids,
- int audio_fs, const std::unordered_map<std::string, int>& hws_map, int use_itn=1) {
- // Create a new connection to the given URI
- websocketpp::lib::error_code ec;
- typename websocketpp::client<T>::connection_ptr con =
- m_client.get_connection(uri, ec);
- if (ec) {
- m_client.get_alog().write(websocketpp::log::alevel::app,
- "Get Connection Error: " + ec.message());
- return;
- }
- // Grab a handle for this connection so we can talk to it in a thread
- // safe manor after the event loop starts.
- m_hdl = con->get_handle();
- // Queue the connection. No DNS queries or network connections will be
- // made until the io_service event loop is run.
- m_client.connect(con);
- // Create a thread to run the ASIO io_service event loop
- websocketpp::lib::thread asio_thread(&websocketpp::client<T>::run,
- &m_client);
- bool send_hotword = true;
- while(true){
- int i = wav_index.fetch_add(1);
- if (i >= wav_list.size()) {
- break;
- }
- if (total_send !=0){
- std::unique_lock<std::mutex> lock(msg_lock);
- cv.wait(lock);
- }
- total_send += 1;
- send_wav_data(wav_list[i], wav_ids[i], audio_fs, hws_map, send_hotword, use_itn);
- if(send_hotword){
- send_hotword = false;
- }
- }
- close_client = true;
- asio_thread.join();
- }
- // The open handler will signal that we are ready to start sending data
- void on_open(websocketpp::connection_hdl) {
- m_client.get_alog().write(websocketpp::log::alevel::app,
- "Connection opened, starting data!");
- scoped_lock guard(m_lock);
- m_open = true;
- }
- // The close handler will signal that we should stop sending data
- void on_close(websocketpp::connection_hdl) {
- m_client.get_alog().write(websocketpp::log::alevel::app,
- "Connection closed, stopping data!");
- scoped_lock guard(m_lock);
- m_done = true;
- }
- // The fail handler will signal that we should stop sending data
- void on_fail(websocketpp::connection_hdl) {
- m_client.get_alog().write(websocketpp::log::alevel::app,
- "Connection failed, stopping data!");
- scoped_lock guard(m_lock);
- m_done = true;
- }
- // send wav to server
- void send_wav_data(string wav_path, string wav_id, int audio_fs,
- const std::unordered_map<std::string, int>& hws_map,
- bool send_hotword, bool use_itn) {
- uint64_t count = 0;
- std::stringstream val;
- funasr::Audio audio(1);
- int32_t sampling_rate = audio_fs;
- std::string wav_format = "pcm";
- if (funasr::IsTargetFile(wav_path.c_str(), "wav")) {
- if (!audio.LoadWav(wav_path.c_str(), &sampling_rate, false))
- return;
- } else if(funasr::IsTargetFile(wav_path.c_str(), "pcm")){
- if (!audio.LoadPcmwav(wav_path.c_str(), &sampling_rate, false))
- return ;
- }else{
- wav_format = "others";
- if (!audio.LoadOthers2Char(wav_path.c_str()))
- return ;
- }
- float* buff;
- int len;
- int flag = 0;
- bool wait = false;
- while (1) {
- {
- scoped_lock guard(m_lock);
- // If the connection has been closed, stop generating data
- if (m_done) {
- break;
- }
- // If the connection hasn't been opened yet wait a bit and retry
- if (!m_open) {
- wait = true;
- } else {
- break;
- }
- }
- if (wait) {
- // LOG(INFO) << "wait.." << m_open;
- WaitABit();
- continue;
- }
- }
- websocketpp::lib::error_code ec;
- nlohmann::json jsonbegin;
- nlohmann::json chunk_size = nlohmann::json::array();
- chunk_size.push_back(5);
- chunk_size.push_back(10);
- chunk_size.push_back(5);
- jsonbegin["chunk_size"] = chunk_size;
- jsonbegin["chunk_interval"] = 10;
- jsonbegin["wav_name"] = wav_id;
- jsonbegin["wav_format"] = wav_format;
- jsonbegin["audio_fs"] = sampling_rate;
- jsonbegin["itn"] = true;
- if(use_itn == 0){
- jsonbegin["itn"] = false;
- }
- jsonbegin["is_speaking"] = true;
- if(send_hotword){
- if(!hws_map.empty()){
- LOG(INFO) << "hotwords: ";
- for (const auto& pair : hws_map) {
- LOG(INFO) << pair.first << " : " << pair.second;
- }
- nlohmann::json json_map(hws_map);
- std::string json_map_str = json_map.dump();
- jsonbegin["hotwords"] = json_map_str;
- }
- }
- m_client.send(m_hdl, jsonbegin.dump(), websocketpp::frame::opcode::text,
- ec);
- // fetch wav data use asr engine api
- if(wav_format == "pcm"){
- while (audio.Fetch(buff, len, flag) > 0) {
- short* iArray = new short[len];
- for (size_t i = 0; i < len; ++i) {
- iArray[i] = (short)(buff[i]*32768);
- }
- // send data to server
- int offset = 0;
- int block_size = 102400;
- while(offset < len){
- int send_block = 0;
- if (offset + block_size <= len){
- send_block = block_size;
- }else{
- send_block = len - offset;
- }
- m_client.send(m_hdl, iArray+offset, send_block * sizeof(short),
- websocketpp::frame::opcode::binary, ec);
- offset += send_block;
- }
- LOG(INFO)<< "Thread: " << this_thread::get_id() << ", sended data len=" << len * sizeof(short);
- // The most likely error that we will get is that the connection is
- // not in the right state. Usually this means we tried to send a
- // message to a connection that was closed or in the process of
- // closing. While many errors here can be easily recovered from,
- // in this simple example, we'll stop the data loop.
- if (ec) {
- m_client.get_alog().write(websocketpp::log::alevel::app,
- "Send Error: " + ec.message());
- break;
- }
- delete[] iArray;
- // WaitABit();
- }
- }else{
- int offset = 0;
- int block_size = 204800;
- len = audio.GetSpeechLen();
- char* others_buff = audio.GetSpeechChar();
- while(offset < len){
- int send_block = 0;
- if (offset + block_size <= len){
- send_block = block_size;
- }else{
- send_block = len - offset;
- }
- m_client.send(m_hdl, others_buff+offset, send_block,
- websocketpp::frame::opcode::binary, ec);
- offset += send_block;
- }
- LOG(INFO)<< "Thread: " << this_thread::get_id() << ", sended data len=" << len;
- // The most likely error that we will get is that the connection is
- // not in the right state. Usually this means we tried to send a
- // message to a connection that was closed or in the process of
- // closing. While many errors here can be easily recovered from,
- // in this simple example, we'll stop the data loop.
- if (ec) {
- m_client.get_alog().write(websocketpp::log::alevel::app,
- "Send Error: " + ec.message());
- }
- }
- nlohmann::json jsonresult;
- jsonresult["is_speaking"] = false;
- m_client.send(m_hdl, jsonresult.dump(), websocketpp::frame::opcode::text,
- ec);
- std::this_thread::sleep_for(std::chrono::milliseconds(20));
- }
- websocketpp::client<T> m_client;
- private:
- websocketpp::connection_hdl m_hdl;
- websocketpp::lib::mutex m_lock;
- websocketpp::lib::mutex msg_lock;
- websocketpp::lib::condition_variable cv;
- bool m_open;
- bool m_done;
- bool close_client=false;
- int total_send=0;
- int total_recv=0;
- };
- int main(int argc, char* argv[]) {
- #ifdef _WIN32
- #include <windows.h>
- SetConsoleOutputCP(65001);
- #endif
- google::InitGoogleLogging(argv[0]);
- FLAGS_logtostderr = true;
- TCLAP::CmdLine cmd("funasr-wss-client", ' ', "1.0");
- TCLAP::ValueArg<std::string> server_ip_("", "server-ip", "server-ip", true,
- "127.0.0.1", "string");
- TCLAP::ValueArg<std::string> port_("", "port", "port", true, "10095", "string");
- TCLAP::ValueArg<std::string> wav_path_("", "wav-path",
- "the input could be: wav_path, e.g.: asr_example.wav; pcm_path, e.g.: asr_example.pcm; wav.scp, kaldi style wav list (wav_id \t wav_path)",
- true, "", "string");
- TCLAP::ValueArg<std::int32_t> audio_fs_("", "audio-fs", "the sample rate of audio", false, 16000, "int32_t");
- TCLAP::ValueArg<int> thread_num_("", "thread-num", "thread-num",
- false, 1, "int");
- TCLAP::ValueArg<int> is_ssl_(
- "", "is-ssl", "is-ssl is 1 means use wss connection, or use ws connection",
- false, 1, "int");
- TCLAP::ValueArg<int> use_itn_(
- "", "use-itn",
- "use-itn is 1 means use itn, 0 means not use itn", false, 1, "int");
- TCLAP::ValueArg<std::string> hotword_("", HOTWORD,
- "the hotword file, one hotword perline, Format: Hotword Weight (could be: 阿里巴巴 20)", false, "", "string");
- cmd.add(server_ip_);
- cmd.add(port_);
- cmd.add(wav_path_);
- cmd.add(audio_fs_);
- cmd.add(thread_num_);
- cmd.add(is_ssl_);
- cmd.add(use_itn_);
- cmd.add(hotword_);
- cmd.parse(argc, argv);
- std::string server_ip = server_ip_.getValue();
- std::string port = port_.getValue();
- std::string wav_path = wav_path_.getValue();
- int threads_num = thread_num_.getValue();
- int is_ssl = is_ssl_.getValue();
- int use_itn = use_itn_.getValue();
- std::vector<websocketpp::lib::thread> client_threads;
- std::string uri = "";
- if (is_ssl == 1) {
- uri = "wss://" + server_ip + ":" + port;
- } else {
- uri = "ws://" + server_ip + ":" + port;
- }
- // hotwords
- std::string hotword_path = hotword_.getValue();
- unordered_map<string, int> hws_map;
- if(!hotword_path.empty()){
- LOG(INFO) << "hotword path: " << hotword_path;
- funasr::ExtractHws(hotword_path, hws_map);
- }
- // read wav_path
- std::vector<string> wav_list;
- std::vector<string> wav_ids;
- string default_id = "wav_default_id";
- if(funasr::IsTargetFile(wav_path, "scp")){
- ifstream in(wav_path);
- if (!in.is_open()) {
- printf("Failed to open scp file");
- return 0;
- }
- string line;
- while(getline(in, line))
- {
- istringstream iss(line);
- string column1, column2;
- iss >> column1 >> column2;
- wav_list.emplace_back(column2);
- wav_ids.emplace_back(column1);
- }
- in.close();
- }else{
- wav_list.emplace_back(wav_path);
- wav_ids.emplace_back(default_id);
- }
-
- int audio_fs = audio_fs_.getValue();
- for (size_t i = 0; i < threads_num; i++) {
- client_threads.emplace_back([uri, wav_list, wav_ids, audio_fs, is_ssl, hws_map, use_itn]() {
- if (is_ssl == 1) {
- WebsocketClient<websocketpp::config::asio_tls_client> c(is_ssl);
- c.m_client.set_tls_init_handler(bind(&OnTlsInit, ::_1));
- c.run(uri, wav_list, wav_ids, audio_fs, hws_map, use_itn);
- } else {
- WebsocketClient<websocketpp::config::asio_client> c(is_ssl);
- c.run(uri, wav_list, wav_ids, audio_fs, hws_map, use_itn);
- }
- });
- }
- for (auto& t : client_threads) {
- t.join();
- }
- }
|