-
Notifications
You must be signed in to change notification settings - Fork 29
/
converter.js
589 lines (531 loc) · 20.8 KB
/
converter.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
import {
replaceAll,
getBeforeRegExp,
substringAfter,
substringBefore,
wrapInSingleQuotes,
getStringInBraces,
} from './string-utils';
import { isExisting } from './array-utils';
import validator from './validator';
import { ADG_SCRIPTLET_MASK, parseRule } from './parse-rule';
import * as scriptletList from '../scriptlets/scriptlets-list';
/**
 * AdGuard scriptlet rule mask.
 * Matches both blocking (`#%#//scriptlet(...)`) and exception (`#@%#//scriptlet(...)`) rules,
 * including the non-empty arguments part in parentheses.
 */
const ADGUARD_SCRIPTLET_MASK_REG = /#@?%#\/\/scriptlet\(.+\)/;
// AdGuard rule templates; `${domains}` and `${args}` are filled by replacePlaceholders()
// eslint-disable-next-line no-template-curly-in-string
const ADGUARD_SCRIPTLET_TEMPLATE = '${domains}#%#//scriptlet(${args})';
// eslint-disable-next-line no-template-curly-in-string
const ADGUARD_SCRIPTLET_EXCEPTION_TEMPLATE = '${domains}#@%#//scriptlet(${args})';
/**
 * uBlock scriptlet rule templates (blocking and exception);
 * `${domains}` and `${args}` are filled by replacePlaceholders()
 */
// eslint-disable-next-line no-template-curly-in-string
const UBO_SCRIPTLET_TEMPLATE = '${domains}##+js(${args})';
// eslint-disable-next-line no-template-curly-in-string
const UBO_SCRIPTLET_EXCEPTION_TEMPLATE = '${domains}#@#+js(${args})';
// prefix which marks uBlock aliases in the scriptlet names list
const UBO_ALIAS_NAME_MARKER = 'ubo-';
// file extension of uBlock scriptlet names
const UBO_SCRIPTLET_JS_ENDING = '.js';
// uBlock `xhr` request type modifier and the AdGuard modifier it is replaced with
// https://github.com/gorhill/uBlock/wiki/Static-filter-syntax#xhr
const UBO_XHR_TYPE = 'xhr';
const ADG_XHR_TYPE = 'xmlhttprequest';
// AdGuard set-constant scriptlet name and its special values
// which are replaced by UBO_SET_CONSTANT_* values during ADG -> UBO conversion
const ADG_SET_CONSTANT_NAME = 'set-constant';
const ADG_SET_CONSTANT_EMPTY_STRING = '';
const ADG_SET_CONSTANT_EMPTY_ARRAY = 'emptyArr';
const ADG_SET_CONSTANT_EMPTY_OBJECT = 'emptyObj';
// uBlock counterparts of the AdGuard set-constant special values above
const UBO_SET_CONSTANT_EMPTY_STRING = '\'\'';
const UBO_SET_CONSTANT_EMPTY_ARRAY = '[]';
const UBO_SET_CONSTANT_EMPTY_OBJECT = '{}';
// AdGuard prevent-fetch scriptlet name and its first-parameter values
// which are replaced by UBO_NO_FETCH_IF_WILDCARD during ADG -> UBO conversion
const ADG_PREVENT_FETCH_NAME = 'prevent-fetch';
const ADG_PREVENT_FETCH_EMPTY_STRING = '';
const ADG_PREVENT_FETCH_WILDCARD = '*';
const UBO_NO_FETCH_IF_WILDCARD = '/^/';
// scriptlet arguments separators: escaped comma is a part of an argument, plain comma splits arguments
const ESCAPED_COMMA_SEPARATOR = '\\,';
const COMMA_SEPARATOR = ',';
// keys of remove-attr and remove-class scriptlets in the scriptlets list
const REMOVE_ATTR_METHOD = 'removeAttr';
const REMOVE_CLASS_METHOD = 'removeClass';
// all known names (including aliases) of remove-attr and remove-class scriptlets
const REMOVE_ATTR_ALIASES = scriptletList[REMOVE_ATTR_METHOD].names;
const REMOVE_CLASS_ALIASES = scriptletList[REMOVE_CLASS_METHOD].names;
// the first item of the names list is used as the AdGuard scriptlet name
const ADG_REMOVE_ATTR_NAME = REMOVE_ATTR_ALIASES[0];
const ADG_REMOVE_CLASS_NAME = REMOVE_CLASS_ALIASES[0];
// flags which are looked for in the last remove-attr/class argument to detect 'applying' parameter
const REMOVE_ATTR_CLASS_APPLYING = ['asap', 'stay', 'complete'];
/**
 * Splits a string into chunks separated by whitespace;
 * a chunk wrapped in single or double quotes is kept whole even if it contains spaces
 *
 * @param {string} str arbitrary string
 * @returns {string[]} result array; empty array if `str` is empty or contains only whitespace
 */
const getSentences = (str) => {
    const reg = /'.*?'|".*?"|\S+/g;
    // String.prototype.match() returns null when nothing is matched,
    // so fall back to an empty array to keep the declared return type
    return str.match(reg) || [];
};
/**
 * Fills `${name}` placeholders of the template with the values from `data`.
 *
 * Note: each value is passed to String.prototype.replace() as a replacement string,
 * so special replacement patterns in it (e.g. `$$`) are interpreted.
 *
 * @param {string} str template string with `${key}` placeholders
 * @param {Object} data placeholder values where keys are placeholders names
 * @returns {string} template with all known placeholders substituted
 */
const replacePlaceholders = (str, data) => {
    let filled = str;
    Object.keys(data).forEach((placeholder) => {
        const placeholderReg = new RegExp(`\\$\\{${placeholder}\\}`, 'g');
        filled = filled.replace(placeholderReg, data[placeholder]);
    });
    return filled;
};
/**
 * Splits scriptlet arguments string by commas and trims every argument.
 * Escaped commas (preceded by a backslash) do not split arguments
 * https://github.com/AdguardTeam/Scriptlets/issues/133
 *
 * @param {string} str arguments string
 * @returns {string[]} array of trimmed arguments, always contains at least one item
 */
const splitArgs = (str) => {
    const chunks = [];
    let chunkStart = 0;
    let commaIndex = str.indexOf(COMMA_SEPARATOR);
    while (commaIndex !== -1) {
        const isEscaped = str[commaIndex - 1] === '\\';
        if (!isEscaped) {
            chunks.push(str.slice(chunkStart, commaIndex).trim());
            chunkStart = commaIndex + 1;
        }
        commaIndex = str.indexOf(COMMA_SEPARATOR, commaIndex + 1);
    }
    // everything after the last unescaped comma is the last argument
    chunks.push(str.slice(chunkStart).trim());
    return chunks;
};
/**
 * Validates remove-attr/class scriptlet args and joins the selector,
 * which may be split into few args by commas, back into one arg
 *
 * @param {string[]} parsedArgs scriptlet arguments: name, value,
 * and optional selector parts and 'applying' flags
 * @returns {string[]} valid args: `[name, value]`, `[name, value, selector]`
 * or `[name, value, selector, applying]`
 * @throws if `document` is available and `document.querySelectorAll()` rejects the selector
 */
const validateRemoveAttrClassArgs = (parsedArgs) => {
    const [name, value, ...restArgs] = parsedArgs;
    // no extra checking if there are only scriptlet name and value
    // https://github.com/AdguardTeam/Scriptlets/issues/235
    if (restArgs.length === 0) {
        return [name, value];
    }

    // remove-attr/class scriptlet might have multiple selectors separated by comma. so we should:
    // 1. check if last arg is 'applying' parameter
    // 2. join 'selector' into one arg
    // 3. combine all args
    // https://github.com/AdguardTeam/Scriptlets/issues/133
    const lastArg = restArgs[restArgs.length - 1];
    // 'applying' consists of space-separated flags, so every whole flag should be a known one;
    // substring matching would treat a selector like 'a.stay' as 'applying' value
    const isApplying = lastArg
        .split(/\s+/)
        .every((flag) => REMOVE_ATTR_CLASS_APPLYING.includes(flag));
    const selectorParts = isApplying
        ? restArgs.slice(0, -1)
        : restArgs;

    const selector = replaceAll(
        selectorParts.join(', '),
        ESCAPED_COMMA_SEPARATOR,
        COMMA_SEPARATOR,
    );
    if (selector.length > 0 && typeof document !== 'undefined') {
        // empty selector is valid for these scriptlets as it applies to all elements,
        // all other selectors should be validated
        // e.g. #%#//scriptlet('ubo-remove-class.js', 'blur', ', html')
        document.querySelectorAll(selector);
    }

    return isApplying
        ? [name, value, selector, lastArg]
        : [name, value, selector];
};
/**
 * Converts UBO scriptlet rule into AdGuard scriptlet rule:
 * scriptlet name gets 'ubo-' prefix (and '.js' ending if it is omitted),
 * every argument is wrapped in single quotes
 *
 * @param {string} rule UBO scriptlet rule
 * @returns {string[]} array with one AdGuard scriptlet rule
 */
export const convertUboScriptletToAdg = (rule) => {
    const domains = getBeforeRegExp(rule, validator.UBO_SCRIPTLET_MASK_REG);
    const mask = rule.match(validator.UBO_SCRIPTLET_MASK_REG)[0];
    const template = mask.includes('@')
        ? ADGUARD_SCRIPTLET_EXCEPTION_TEMPLATE
        : ADGUARD_SCRIPTLET_TEMPLATE;

    const rawArgs = splitArgs(getStringInBraces(rule));
    const uboName = rawArgs[0];
    const scriptletName = uboName.includes(UBO_SCRIPTLET_JS_ENDING)
        ? `ubo-${uboName}`
        : `ubo-${uboName}${UBO_SCRIPTLET_JS_ENDING}`;

    const isRemoveAttrOrClass = REMOVE_ATTR_ALIASES.includes(scriptletName)
        || REMOVE_CLASS_ALIASES.includes(scriptletName);
    const parsedArgs = isRemoveAttrOrClass
        ? validateRemoveAttrClassArgs(rawArgs)
        : rawArgs;

    const args = parsedArgs
        .map((arg, index) => {
            let adgArg;
            if (arg === '$') {
                // for example: example.org##+js(abort-current-inline-script, $, popup)
                adgArg = '$$';
            } else if (index === 0) {
                adgArg = scriptletName;
            } else {
                adgArg = arg;
            }
            return wrapInSingleQuotes(adgArg);
        })
        .join(`${COMMA_SEPARATOR} `);

    return [replacePlaceholders(template, { domains, args })];
};
/**
 * Converts ABP snippet rule into AdGuard scriptlet rules.
 * Every snippet of the rule (snippets are separated by semicolon) becomes a separate AdGuard rule
 * where the snippet name gets 'abp-' prefix and every argument is wrapped in single quotes
 *
 * @param {string} rule ABP snippet rule
 * @returns {Array} array of AdGuard scriptlet rules, one item per snippet of the ABP rule
 */
export const convertAbpSnippetToAdg = (rule) => {
    // semicolon which is followed by an even number of double quotes, i.e. is not inside of them
    const SEMICOLON_DIVIDER = /;(?=(?:(?:[^"]*"){2})*[^"]*$)/g;

    let mask;
    let template;
    if (rule.includes(validator.ABP_SCRIPTLET_MASK)) {
        mask = validator.ABP_SCRIPTLET_MASK;
        template = ADGUARD_SCRIPTLET_TEMPLATE;
    } else {
        mask = validator.ABP_SCRIPTLET_EXCEPTION_MASK;
        template = ADGUARD_SCRIPTLET_EXCEPTION_TEMPLATE;
    }

    const domains = substringBefore(rule, mask);
    const snippets = substringAfter(rule, mask)
        .split(SEMICOLON_DIVIDER)
        // abp-rule may have `;` at the end which makes last array item irrelevant
        // https://github.com/AdguardTeam/Scriptlets/issues/236
        .filter(isExisting);

    const toAdgArgs = (snippet) => getSentences(snippet)
        .map((sentence, index) => {
            const adgArg = index === 0 ? `abp-${sentence}` : sentence;
            return wrapInSingleQuotes(adgArg);
        })
        .join(`${COMMA_SEPARATOR} `);

    return snippets.map((snippet) => {
        const args = toAdgArgs(snippet);
        return replacePlaceholders(template, { domains, args });
    });
};
/**
 * Checks whether the rule is an ADG scriptlet rule with valid syntax and known scriptlet name.
 *
 * IMPORTANT! The method is not very fast as it parses the rule and checks its syntax.
 *
 * @param {string} adgRuleText Single ADG scriptlet rule.
 *
 * @returns {boolean} False if `adgRuleText` is empty, is not an ADG scriptlet rule,
 * or its syntax is not valid.
 */
const isValidAdgScriptletRuleSyntax = (adgRuleText) => {
    // isAdgScriptletRule() detects the rule type but does not check the rule syntax
    const isAdgScriptlet = Boolean(adgRuleText) && validator.isAdgScriptletRule(adgRuleText);
    if (!isAdgScriptlet) {
        return false;
    }

    try {
        // parseRule() throws an error if the rule syntax is not valid
        const { name } = parseRule(adgRuleText);
        return validator.isValidScriptletName(name);
    } catch (e) {
        return false;
    }
};
/**
 * Converts any scriptlet rule into AdGuard syntax rule.
 * Comment is returned as is.
 *
 * @param {string} rule Scriptlet rule.
 *
 * @returns {string[]} Array of AdGuard scriptlet rules: one array item for ADG and UBO or few items for ABP.
 * For the ADG `rule`, validates its syntax and returns an empty array if it is invalid.
 * For a `rule` which is neither a scriptlet rule nor a comment, `undefined` is returned.
 */
export const convertScriptletToAdg = (rule) => {
    if (validator.isUboScriptletRule(rule)) {
        return convertUboScriptletToAdg(rule);
    }
    if (validator.isAbpSnippetRule(rule)) {
        return convertAbpSnippetToAdg(rule);
    }
    if (validator.isAdgScriptletRule(rule)) {
        if (isValidAdgScriptletRuleSyntax(rule)) {
            return [rule];
        }
        // eslint-disable-next-line no-console
        console.log(`Invalid AdGuard scriptlet rule: ${rule}`);
        return [];
    }
    if (validator.isComment(rule)) {
        return [rule];
    }
    return undefined;
};
/**
 * Converts AdGuard scriptlet rule to UBO one
 *
 * @param {string} rule AdGuard scriptlet rule
 * @returns {string|undefined} UBO scriptlet rule, or `undefined` if `rule` is not an AdGuard scriptlet rule,
 * its scriptlet name is unknown, or the scriptlet has no UBO alias
 */
export const convertAdgScriptletToUbo = (rule) => {
    if (!validator.isAdgScriptletRule(rule)) {
        return undefined;
    }

    const { name: parsedName, args: parsedParams } = parseRule(rule);

    let preparedParams;
    if (parsedName === ADG_SET_CONSTANT_NAME
        // https://github.com/AdguardTeam/FiltersCompiler/issues/102
        && parsedParams[1] === ADG_SET_CONSTANT_EMPTY_STRING) {
        preparedParams = [parsedParams[0], UBO_SET_CONSTANT_EMPTY_STRING];
    } else if (parsedName === ADG_SET_CONSTANT_NAME
        // https://github.com/uBlockOrigin/uBlock-issues/issues/2411
        && parsedParams[1] === ADG_SET_CONSTANT_EMPTY_ARRAY) {
        preparedParams = [parsedParams[0], UBO_SET_CONSTANT_EMPTY_ARRAY];
    } else if (parsedName === ADG_SET_CONSTANT_NAME
        && parsedParams[1] === ADG_SET_CONSTANT_EMPTY_OBJECT) {
        preparedParams = [parsedParams[0], UBO_SET_CONSTANT_EMPTY_OBJECT];
    } else if (parsedName === ADG_PREVENT_FETCH_NAME
        // https://github.com/AdguardTeam/Scriptlets/issues/109
        && (parsedParams[0] === ADG_PREVENT_FETCH_WILDCARD
            || parsedParams[0] === ADG_PREVENT_FETCH_EMPTY_STRING)) {
        preparedParams = [UBO_NO_FETCH_IF_WILDCARD];
    } else if ((parsedName === ADG_REMOVE_ATTR_NAME || parsedName === ADG_REMOVE_CLASS_NAME)
        && parsedParams[1] && parsedParams[1].includes(COMMA_SEPARATOR)) {
        preparedParams = [
            parsedParams[0],
            // commas of the selector should be escaped to keep it as a single argument
            // https://github.com/AdguardTeam/Scriptlets/issues/133
            replaceAll(parsedParams[1], COMMA_SEPARATOR, ESCAPED_COMMA_SEPARATOR),
            // args after the selector (e.g. 'applying') should not be lost
            ...parsedParams.slice(2),
        ];
    } else {
        preparedParams = parsedParams;
    }

    // object of name and aliases for the Adg-scriptlet
    const adgScriptletObject = Object
        .keys(scriptletList)
        .map((el) => scriptletList[el])
        .map((s) => {
            const [name, ...aliases] = s.names;
            return { name, aliases };
        })
        .find((el) => (el.name === parsedName
            || el.aliases.includes(parsedName)));
    if (!adgScriptletObject) {
        // unknown scriptlet name, nothing to convert
        return undefined;
    }

    const uboAlias = adgScriptletObject.aliases
        // eslint-disable-next-line no-restricted-properties
        .find((alias) => alias.includes(UBO_ALIAS_NAME_MARKER));
    if (!uboAlias) {
        // the scriptlet has no UBO analog
        return undefined;
    }

    const mask = rule.match(ADGUARD_SCRIPTLET_MASK_REG)[0];
    // matched mask contains scriptlet arguments as well, and they may contain '@',
    // so only the rule marker at the beginning of the match should be checked
    const template = mask.startsWith('#@')
        ? UBO_SCRIPTLET_EXCEPTION_TEMPLATE
        : UBO_SCRIPTLET_TEMPLATE;
    const domains = getBeforeRegExp(rule, ADGUARD_SCRIPTLET_MASK_REG);
    const uboName = uboAlias
        .replace(UBO_ALIAS_NAME_MARKER, '')
        // '.js' in the Ubo scriptlet name can be omitted
        // https://github.com/gorhill/uBlock/wiki/Resources-Library#general-purpose-scriptlets
        .replace(UBO_SCRIPTLET_JS_ENDING, '');

    const args = (preparedParams.length > 0)
        ? `${uboName}, ${preparedParams.join(`${COMMA_SEPARATOR} `)}`
        : uboName;

    return replacePlaceholders(
        template,
        { domains, args },
    );
};
/**
 * Extracts scriptlet name, i.e. the first quoted parameter, from `rule`.
 *
 * @param {string} rule AdGuard syntax scriptlet rule.
 * @returns {string|null} Scriptlet name or null if the name can not be found,
 * e.g. there is nothing after the opening parenthesis or the closing quote of the name is missing.
 */
const getAdgScriptletName = (rule) => {
    // part of the rule which follows the scriptlet mask with opening parenthesis
    const quotedParams = substringAfter(rule, `${ADG_SCRIPTLET_MASK}(`);
    if (!quotedParams) {
        return null;
    }

    // the first char is the quote used for the first scriptlet parameter which is a name
    const nameQuote = quotedParams.charAt(0);
    const paramsWithoutQuote = quotedParams.substring(1);
    if (!paramsWithoutQuote) {
        return null;
    }

    // supposed scriptlet name is everything up to the closing quote
    const name = substringBefore(paramsWithoutQuote, nameQuote);
    if (name === paramsWithoutQuote) {
        // closing quote was not found
        return null;
    }
    return name;
};
/**
 * 1. For ADG scriptlet checks whether the scriptlet syntax and name are valid.
 * 2. For UBO and ABP scriptlet first checks their compatibility with ADG
 * by converting them into ADG syntax, and after that checks the name.
 *
 * ADG or UBO rules are "single-scriptlet", but ABP rule may contain more than one snippet
 * so if at least one of them is not valid — whole `ruleText` rule is not valid too.
 *
 * @param {string} ruleText Any scriptlet rule — ADG or UBO or ABP.
 *
 * @returns {boolean} True if scriptlet name is valid in rule.
 * False for an empty `ruleText` and for a rule which can not be converted into ADG syntax.
 */
export const isValidScriptletRule = (ruleText) => {
    if (!ruleText) {
        return false;
    }

    // `ruleText` with ABP syntax may contain more than one snippet in one rule
    const rulesArray = convertScriptletToAdg(ruleText);

    // convertScriptletToAdg() returns:
    // - undefined for a rule which is neither a scriptlet rule nor a comment,
    // - empty array for ADG rule with invalid syntax
    if (!Array.isArray(rulesArray) || rulesArray.length === 0) {
        return false;
    }

    // checking if each of parsed scriptlets is valid
    // if at least one of them is not valid - whole `ruleText` is not valid too
    return rulesArray.every((rule) => {
        const name = getAdgScriptletName(rule);
        return validator.isValidScriptletName(name);
    });
};
/**
 * Finds redirect resource modifier in UBO/ADG modifiers array.
 * `redirectRuleMarker` is looked for first, `redirectMarker` is checked only if it is not found
 *
 * @param {string[]} modifiers rule modifiers
 * @param {Object} redirectsData validator.REDIRECT_RULE_TYPES.(UBO|ADG)
 * @param {string} rule rule string, used for the error message only
 * @returns {Object} { index, marker } — index of the found modifier and the marker it contains
 * @throws if there is no redirect resource modifier in `modifiers`
 */
const getMarkerData = (modifiers, redirectsData, rule) => {
    const findModifierIndex = (marker) => modifiers.findIndex((m) => m.includes(marker));

    const redirectRuleIndex = findModifierIndex(redirectsData.redirectRuleMarker);
    if (redirectRuleIndex !== -1) {
        return { index: redirectRuleIndex, marker: redirectsData.redirectRuleMarker };
    }

    const redirectIndex = findModifierIndex(redirectsData.redirectMarker);
    if (redirectIndex !== -1) {
        return { index: redirectIndex, marker: redirectsData.redirectMarker };
    }

    throw new Error(`No redirect resource modifier found in rule: ${rule}`);
};
/**
 * Converts Ubo redirect rule to Adg one:
 * redirect resource name is replaced by its Adg analog
 * and `xhr` modifier is replaced by `xmlhttprequest`
 *
 * @param {string} rule ubo redirect rule
 * @returns {string} converted adg rule
 */
export const convertUboRedirectToAdg = (rule) => {
    const firstPartOfRule = substringBefore(rule, '$');
    const uboModifiers = validator.parseModifiers(rule);
    const {
        index: markerIndex,
        marker: uboMarker,
    } = getMarkerData(uboModifiers, validator.REDIRECT_RULE_TYPES.UBO, rule);

    const toAdgModifier = (modifier, index) => {
        if (index !== markerIndex) {
            return modifier === UBO_XHR_TYPE ? ADG_XHR_TYPE : modifier;
        }
        // redirect resource modifier
        const uboName = substringAfter(modifier, uboMarker);
        const adgName = validator.REDIRECT_RULE_TYPES.UBO.compatibility[uboName];
        const isRedirectRule = uboMarker === validator.ADG_UBO_REDIRECT_RULE_MARKER;
        const adgMarker = isRedirectRule
            ? validator.REDIRECT_RULE_TYPES.ADG.redirectRuleMarker
            : validator.REDIRECT_RULE_TYPES.ADG.redirectMarker;
        return `${adgMarker}${adgName}`;
    };

    const adgModifiers = uboModifiers
        .map(toAdgModifier)
        .join(COMMA_SEPARATOR);

    return `${firstPartOfRule}$${adgModifiers}`;
};
/**
 * Converts Abp redirect rule to Adg one:
 * every modifier with Abp redirect marker is replaced by Adg redirect modifier
 * with Adg analog of the resource name
 *
 * @param {string} rule abp redirect rule
 * @returns {string} converted adg rule
 */
export const convertAbpRedirectToAdg = (rule) => {
    const firstPartOfRule = substringBefore(rule, '$');
    const abpModifiers = validator.parseModifiers(rule);

    const toAdgModifier = (modifier) => {
        const abpMarker = validator.REDIRECT_RULE_TYPES.ABP.redirectMarker;
        if (!modifier.includes(abpMarker)) {
            return modifier;
        }
        const abpName = substringAfter(modifier, abpMarker);
        const adgName = validator.REDIRECT_RULE_TYPES.ABP.compatibility[abpName];
        return `${validator.REDIRECT_RULE_TYPES.ADG.redirectMarker}${adgName}`;
    };

    const adgModifiers = abpModifiers
        .map((modifier) => toAdgModifier(modifier))
        .join(COMMA_SEPARATOR);

    return `${firstPartOfRule}$${adgModifiers}`;
};
/**
 * Converts redirect rule to AdGuard one.
 * Valid AdGuard redirect rule is returned as is
 *
 * @param {string} rule redirect rule
 * @returns {string} converted adg rule;
 * `undefined` if `rule` is neither compatible Ubo/Abp redirect rule nor valid Adg redirect rule
 */
export const convertRedirectToAdg = (rule) => {
    if (validator.isUboRedirectCompatibleWithAdg(rule)) {
        return convertUboRedirectToAdg(rule);
    }
    if (validator.isAbpRedirectCompatibleWithAdg(rule)) {
        return convertAbpRedirectToAdg(rule);
    }
    if (validator.isValidAdgRedirectRule(rule)) {
        return rule;
    }
    return undefined;
};
/**
 * Converts Adg redirect rule to Ubo one
 * 1. Checks if there is Ubo analog for Adg rule
 * 2. Parses the rule and checks if there are any source type modifiers which are required by Ubo
 *    and if there are no one we add it manually to the end.
 *    Source types are chosen according to redirect name
 *    e.g. ||ad.com^$redirect=<name>,important  ->>  ||ad.com^$redirect=<name>,important,script
 * 3. Replaces Adg redirect name by Ubo analog
 *
 * @param {string} rule adg rule
 * @returns {string} converted ubo rule
 * @throws on incompatible rule, or if there are no source types to add for the redirect
 */
export const convertAdgRedirectToUbo = (rule) => {
    if (!validator.isAdgRedirectCompatibleWithUbo(rule)) {
        throw new Error(`Unable to convert for uBO - unsupported redirect in rule: ${rule}`);
    }

    const basePart = substringBefore(rule, '$');
    const adgModifiers = validator.parseModifiers(rule);
    const {
        index: markerIndex,
        marker: adgMarker,
    } = getMarkerData(adgModifiers, validator.REDIRECT_RULE_TYPES.ADG, rule);
    const adgRedirectName = adgModifiers[markerIndex].slice(adgMarker.length);

    if (!validator.hasValidContentType(rule)) {
        // add missed source types as content type modifiers
        const sourceTypesData = validator.ABSENT_SOURCE_TYPE_REPLACEMENT
            .find((el) => el.NAME === adgRedirectName);
        if (sourceTypesData === undefined) {
            // eslint-disable-next-line max-len
            throw new Error(`Unable to convert for uBO - no types to add for specific redirect in rule: ${rule}`);
        }
        adgModifiers.push(...sourceTypesData.TYPES);
    }

    const isRedirectRule = adgMarker === validator.ADG_UBO_REDIRECT_RULE_MARKER;
    const uboMarker = isRedirectRule
        ? validator.REDIRECT_RULE_TYPES.UBO.redirectRuleMarker
        : validator.REDIRECT_RULE_TYPES.UBO.redirectMarker;
    const uboRedirectName = validator.REDIRECT_RULE_TYPES.ADG.compatibility[adgRedirectName];

    const uboModifiers = adgModifiers
        .map((modifier, index) => (
            index === markerIndex
                ? `${uboMarker}${uboRedirectName}`
                : modifier
        ))
        .join(COMMA_SEPARATOR);

    return `${basePart}$${uboModifiers}`;
};