Przeglądaj źródła

add function IsPunc

雾聪 2 lata temu
rodzic
commit
049e0c3523

+ 8 - 0
funasr/runtime/onnxruntime/src/tokenizer.cpp

@@ -142,6 +142,14 @@ vector<int> CTokenizer::Punc2Ids(vector<string> input)
 	return result;
 }
 
+// Reports whether Punc is found in m_punc2id: true if present, false otherwise.
+bool CTokenizer::IsPunc(string& Punc)
+{
+	// Lookup only; find() compares equal to end() when there is no match.
+	const bool known = (m_punc2id.find(Punc) != m_punc2id.end());
+	return known;
+}
+
 vector<string> CTokenizer::SplitChineseString(const string & str_info)
 {
 	vector<string> list;

+ 1 - 1
funasr/runtime/onnxruntime/src/tokenizer.h

@@ -30,7 +30,7 @@ public:
 	vector<string> SplitChineseString(const string& str_info);
 	void StrSplit(const string& str, const char split, vector<string>& res);
 	void Tokenize(const char* str_info, vector<string>& str_out, vector<int>& id_out);
-
+	bool IsPunc(string& Punc);
 };
 
 } // namespace funasr