forked from ashi009/node-fast-html-parser
-
Notifications
You must be signed in to change notification settings - Fork 104
/
text.ts
111 lines (95 loc) · 2.59 KB
/
text.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
import { decode } from 'he';
import HTMLElement from './html';
import Node from './node';
import NodeType from './type';
/**
* TextNode to contain a text element in DOM tree.
* @param {string} value [description]
*/
export default class TextNode extends Node {
public clone(): TextNode {
return new TextNode(this._rawText, null);
}
public constructor(rawText: string, parentNode = null as HTMLElement | null, range?: [number, number]) {
super(parentNode, range);
this._rawText = rawText;
}
/**
* Node Type declaration.
* @type {Number}
*/
public nodeType = NodeType.TEXT_NODE;
private _rawText: string;
private _trimmedRawText?: string;
private _trimmedText?: string;
public get rawText() {
return this._rawText;
}
/**
* Set rawText and invalidate trimmed caches
*/
public set rawText(text: string) {
this._rawText = text;
this._trimmedRawText = void 0;
this._trimmedText = void 0;
}
/**
* Returns raw text with all whitespace trimmed except single leading/trailing non-breaking space
*/
public get trimmedRawText() {
if (this._trimmedRawText !== undefined) return this._trimmedRawText;
this._trimmedRawText = trimText(this.rawText);
return this._trimmedRawText;
}
/**
* Returns text with all whitespace trimmed except single leading/trailing non-breaking space
*/
public get trimmedText() {
if (this._trimmedText !== undefined) return this._trimmedText;
this._trimmedText = trimText(this.text);
return this._trimmedText;
}
/**
* Get unescaped text value of current node and its children.
* @return {string} text content
*/
public get text() {
return decode(this.rawText);
}
/**
* Detect if the node contains only white space.
* @return {boolean}
*/
public get isWhitespace() {
return /^(\s| )*$/.test(this.rawText);
}
public toString() {
return this.rawText;
}
}
/**
* Trim whitespace except single leading/trailing non-breaking space
*/
function trimText(text: string): string {
let i = 0;
let startPos;
let endPos;
while (i >= 0 && i < text.length) {
if (/\S/.test(text[i])) {
if (startPos === undefined) {
startPos = i;
i = text.length;
} else {
endPos = i;
i = void 0;
}
}
if (startPos === undefined) i++;
else i--;
}
if (startPos === undefined) startPos = 0;
if (endPos === undefined) endPos = text.length - 1;
const hasLeadingSpace = startPos > 0 && /[^\S\r\n]/.test(text[startPos - 1]);
const hasTrailingSpace = endPos < (text.length - 1) && /[^\S\r\n]/.test(text[endPos + 1]);
return (hasLeadingSpace ? ' ' : '') + text.slice(startPos, endPos + 1) + (hasTrailingSpace ? ' ' : '');
}