add: better support for converter tool on Windows

basxsoftwareassociation · Nov 13, 2022 · 0c0a8dc · 0c0a8dc · Eiltherune · Nov 14, 2022
1 parent 68bf97d
commit 0c0a8dc
Show file tree

Hide file tree

Showing 2 changed files with 17 additions and 6 deletions.
diff --git a/htmlgenerator/contrib/convertfromhtml.py b/htmlgenerator/contrib/convertfromhtml.py
@@ -1,4 +1,5 @@
 import codecs
+import os
 
 import black  # type: ignore
 from bs4 import BeautifulSoup, Comment, Doctype, NavigableString, Tag  # type: ignore
@@ -122,10 +123,12 @@ def parsehtml(html, formatting, compact):
 html = hg.BaseElement(""",
     ]
 
-    soup = BeautifulSoup(
-        html,
-        "lxml",
-    )
+    if os.name == "nt":
+        parser = "html.parser"
+    else:
+        parser = "lxml"
+
+    soup = BeautifulSoup(html, parser)
     for subtag in soup.contents:
         tags = convert(subtag, 1, compact)
         if tags:
@@ -146,6 +149,7 @@ def main():
 
     formatflag = "--no-formatting"
     compactflag = "--compact"
+    encodingflag = "--encoding"
 
     files = sys.argv[1:]
     formatting = formatflag not in files
@@ -154,10 +158,15 @@ def main():
         files.remove(formatflag)
     if compactflag in files:
         files.remove(compactflag)
+    if encodingflag in files:
+        encoding = files[files.index(encodingflag) + 1]
+        files.remove(encodingflag)
+        files.remove(encoding)
+
     if not files:
         print(parsehtml(sys.stdin.read(), formatting, compact), end="")
     for _file in files:
-        with open(_file) as rf:
+        with open(_file, encoding=encoding) as rf:
             with open(_file + ".py", "w") as wf:
                 wf.write(parsehtml(rf.read(), formatting, compact))
 

diff --git a/setup.py b/setup.py
@@ -25,7 +25,9 @@
     packages=find_packages(),
     zip_safe=False,
     include_package_data=True,
-    extras_require={"all": ["black", "beautifulsoup4", "lxml"]},
+    extras_require={
+        "all": ["black", "beautifulsoup4", "lxml;platform_system!='Windows'"]
+    },
     entry_points={
         "console_scripts": [
             "convertfromhtml = htmlgenerator.contrib.convertfromhtml:main",