In [55]:
import logging
import re
from bs4 import BeautifulSoup

In [47]:
# Delete any existing example.xml before the following cell writes it;
# -f keeps rm quiet when the file does not exist.
!rm -f example.xml

In [48]:
%%writefile example.xml
<?xml version="1.0" encoding="UTF-8"?>
<xbrl
    xmlns="http://www.xbrl.org/2003/instance"
    xmlns:country="http://xbrl.sec.gov/country/2020-01-31"
    xmlns:dei="http://xbrl.sec.gov/dei/2020-01-31"
    xmlns:iso4217="http://www.xbrl.org/2003/iso4217"
    xmlns:link="http://www.xbrl.org/2003/linkbase"
    xmlns:rfmd="http://www.rfmd.com/20210403"
    xmlns:srt="http://fasb.org/srt/2020-01-31"
    xmlns:us-gaap="http://fasb.org/us-gaap/2020-01-31"
    xmlns:xbrldi="http://xbrl.org/2006/xbrldi"
    xmlns:xlink="http://www.w3.org/1999/xlink"
    xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="en-US">
</xbrl>

Writing example.xml


In [49]:
def load_from_xml(filepath: str, encoding: str = "utf-8") -> str:
    """Load the XML contents from the filepath.

    Args:
        filepath: path to the XML file
        encoding: text encoding used to decode the file. Defaults to UTF-8 so
            the result does not depend on the platform's locale encoding.
    Returns: XML content
    Raises:
        RuntimeError: if the file cannot be opened or read; the original
            OSError is chained as the cause.
        UnicodeDecodeError: if the bytes are not valid in ``encoding``. This
            is not an OSError, so it propagates unchanged.
    """
    try:
        with open(filepath, "r", encoding=encoding) as f:
            content = f.read()
    except OSError as e:
        # Hand the values to logging as arguments instead of pre-formatting
        # the string; the emitted message text is unchanged.
        logging.error("load_from_xml():failed to read [%s] as [%s]", filepath, e)
        raise RuntimeError("load_from_xml()") from e
    return content


In [50]:
# Read the sample document from disk into a single string.
xml = load_from_xml(filepath="./example.xml")

In [51]:
# Parse the document text with BeautifulSoup, selecting its XML parser.
soup = BeautifulSoup(markup=xml, features="xml")

In [52]:
# Sanity check: confirm the soup was built as XML rather than HTML.
soup.is_xml

True

In [53]:
# Show the parsed tree as re-serialized by BeautifulSoup. print() is used so
# the newlines render as line breaks instead of appearing escaped in a repr.
print(soup.prettify())

<?xml version="1.0" encoding="utf-8"?>
<xbrl xml:lang="en-US" xmlns="http://www.xbrl.org/2003/instance" xmlns:country="http://xbrl.sec.gov/country/2020-01-31" xmlns:dei="http://xbrl.sec.gov/dei/2020-01-31" xmlns:iso4217="http://www.xbrl.org/2003/iso4217" xmlns:link="http://www.xbrl.org/2003/linkbase" xmlns:rfmd="http://www.rfmd.com/20210403" xmlns:srt="http://fasb.org/srt/2020-01-31" xmlns:us-gaap="http://fasb.org/us-gaap/2020-01-31" xmlns:xbrldi="http://xbrl.org/2006/xbrldi" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
</xbrl>


In [58]:
# Look up the first tag whose name matches "xbrl", ignoring case.
# NOTE(review): the pattern is unanchored, so a tag name that merely contains
# "xbrl" would presumably match as well — confirm whether "^xbrl$" is intended.
soup.find(re.compile("XBRL", re.I))

<xbrl xml:lang="en-US" xmlns="http://www.xbrl.org/2003/instance" xmlns:country="http://xbrl.sec.gov/country/2020-01-31" xmlns:dei="http://xbrl.sec.gov/dei/2020-01-31" xmlns:iso4217="http://www.xbrl.org/2003/iso4217" xmlns:link="http://www.xbrl.org/2003/linkbase" xmlns:rfmd="http://www.rfmd.com/20210403" xmlns:srt="http://fasb.org/srt/2020-01-31" xmlns:us-gaap="http://fasb.org/us-gaap/2020-01-31" xmlns:xbrldi="http://xbrl.org/2006/xbrldi" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
</xbrl>