| | |
| | | } |
| | | |
| | | bool TimestampIsPunctuation(U16CHAR_T &u16) { |
| | | // (& ' -) in the dict |
| | | if (u16 == 0x26 || u16 == 0x27 || u16 == 0x2D){ |
| | | return false; |
| | | } |
| | | return (u16 >= 0x21 && u16 <= 0x2F) // 标准ASCII标点 |
| | | || (u16 >= 0x3A && u16 <= 0x40) // 标准ASCII标点 |
| | | || (u16 >= 0x5B && u16 <= 0x60) // 标准ASCII标点 |
| | |
| | | } else{ |
| | | ts_sentences += ts_sent + ","; |
| | | } |
| | | |
| | | // clear |
| | | idx_str++; |
| | | text_seg = ""; |
| | | ts_sent = ""; |
| | | start = 0; |
| | |
| | | text_seg += " " + characters[idx_str]; |
| | | } |
| | | ts_seg.push_back(timestamps[idx_ts]); |
| | | idx_str++; |
| | | idx_ts++; |
| | | } |
| | | idx_str++; |
| | | } |
| | | // for none punc results |
| | | if(ts_seg.size() >0){ |