-
Notifications
You must be signed in to change notification settings - Fork 3
/
html.ts
39 lines (31 loc) · 1.02 KB
/
html.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
import { TScrapedData, TSelectors } from "../../types"
import { applyConditions } from "../tools/condition"
/**
 * Reads the string value a selector definition asks for from one element.
 *
 * - When `selector.attribute` is truthy, the value is that attribute's content
 *   (a missing or empty attribute yields `""`).
 * - Otherwise the value is the element's trimmed `textContent`
 *   (null or empty text yields `""`).
 *
 * @param element - The matched DOM element to read from.
 * @param selector - Selector definition; `attribute` and `conditions` are the
 *   only fields read here.
 * @returns The extracted string, or `null` when `selector.conditions` is set
 *   and `applyConditions` returns a falsy result for the extracted value.
 */
const getSelectorValue = (element: Element, selector: any): string | null => {
  let extracted: string
  if (selector.attribute) {
    extracted = element.getAttribute(selector.attribute) || ""
  } else {
    extracted = element.textContent?.trim() || ""
  }

  // No conditions configured: the raw value is always accepted.
  if (!selector.conditions) {
    return extracted
  }

  // A value that fails the conditions is signalled with null, not "".
  return applyConditions(extracted, selector.conditions) ? extracted : null
}
/**
 * Evaluates every entry of `selectors` against `document` and collects the
 * results into a record keyed like `selectors`.
 *
 * For each key the stored value depends on how many elements match
 * `selector.selector`:
 * - none: the empty string;
 * - exactly one: that element's value, or `""` when `getSelectorValue`
 *   returns `null` for it;
 * - more than one: an array of the values, with `null` results dropped
 *   (the array may therefore be empty).
 *
 * @param document - The DOM document to query.
 * @param selectors - Map of output key to selector definition.
 * @returns The scraped values keyed by the same keys as `selectors`.
 */
const extractData = (
  document: Document,
  selectors: TSelectors
): TScrapedData => {
  const data: TScrapedData = {}

  for (const [key, selector] of Object.entries(selectors)) {
    const matches = document.querySelectorAll(selector.selector)

    if (matches.length === 0) {
      data[key] = ""
      continue
    }

    if (matches.length === 1) {
      // A single match is stored as a plain string, never as a one-item array.
      data[key] = getSelectorValue(matches[0], selector) || ""
      continue
    }

    // Several matches: keep only the values that were not rejected (null).
    const accepted: string[] = []
    for (const node of Array.from(matches)) {
      const value = getSelectorValue(node, selector)
      if (value !== null) {
        accepted.push(value)
      }
    }
    data[key] = accepted
  }

  return data
}
// Default export of this module; getSelectorValue is not exported here.
export default extractData