/
stringparser.py
80 lines (63 loc) · 2.15 KB
/
stringparser.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
"""A simple file parser that can tell whether the first character of a line
is quoted or not"""
from .languages import _COMMENT
class StringParser:
"""A simple file parser that can tell whether the first character of a line
is quoted or not"""
single = None
triple = None
triple_start = None
def __init__(self, language):
self.ignore = language is None
self.python = language != "R"
self.comment = _COMMENT.get(language)
def is_quoted(self):
"""Is the next line quoted?"""
if self.ignore:
return False
return self.single or self.triple
def read_line(self, line):
"""Read a new line"""
if self.ignore:
return
# Do not search for quotes when the line is commented out (and not quoted)
if (
not self.is_quoted()
and self.comment is not None
and line.startswith(self.comment)
):
return
self.triple_start = -1
for i, char in enumerate(line):
if char not in ['"', "'"]:
continue
# Is the char escaped?
if line[i - 1 : i] == "\\":
continue
if self.single == char:
self.single = None
continue
if self.single is not None:
continue
if not self.python:
continue
if line[i - 2 : i + 1] == 3 * char and i >= self.triple_start + 3:
# End of a triple quote
if self.triple == char:
self.triple = None
self.triple_start = i
continue
# Are we looking for a different triple quote?
if self.triple is not None:
continue
# Triple quote starting
self.triple = char
self.triple_start = i
continue
# Inside a multiline quote
if self.triple is not None:
continue
self.single = char
# Line ended
if self.python:
self.single = None