Add Handling for Dangling Characters in "trimToEndSentence" - utils.js
New: Considered the presence of whitespace or newline characters preceding the punctuation for accurate trimming.
This commit is contained in:
parent
3b739cceed
commit
e4025cb413
|
@ -471,14 +471,18 @@ export function sortByCssOrder(a, b) {
|
|||
* trimToEndSentence('Hello, world! I am from'); // 'Hello, world!'
|
||||
*/
|
||||
export function trimToEndSentence(input, include_newline = false) {
|
||||
const punctuation = new Set(['.', '!', '?', '*', '"', ')', '}', '`', ']', '$', '。', '!', '?', '”', ')', '】', '】', '’', '」', '】']); // extend this as you see fit
|
||||
const punctuation = new Set(['.', '!', '?', '*', '"', ')', '}', '`', ']', '$', '。', '!', '?', '”', ')', '】', '’', '」']); // extend this as you see fit
|
||||
let last = -1;
|
||||
|
||||
for (let i = input.length - 1; i >= 0; i--) {
|
||||
const char = input[i];
|
||||
|
||||
if (punctuation.has(char)) {
|
||||
last = i;
|
||||
if (i > 0 && (input[i - 1] === ' ' || input[i - 1] === '\n')) {
|
||||
last = i - 1;
|
||||
} else {
|
||||
last = i;
|
||||
}
|
||||
break;
|
||||
}
|
||||
|
||||
|
|
Loading…
Reference in New Issue