In [1]:
# 1. Up to 2021/07/06

import os
import pandas as pd
import xml.etree.ElementTree as ET
from datetime import datetime

def parse_xml_to_df(xml_file):
    """Collect the title and publication date of every English item in one XML file.

    Only ``item`` elements that are direct children of the document root and
    whose ``ns0language`` child has the text ``'en'`` are kept.

    Args:
        xml_file: Path of the XML file; it is read as UTF-8 text.

    Returns:
        A DataFrame with the columns ``Title`` and ``Date``. ``Date`` holds
        ``YYYY-MM-DD`` strings, or ``''`` when the item has no ``pubDate`` or
        the value does not match the expected format. An empty DataFrame
        (without columns) is returned when the file cannot be decoded or
        parsed.
    """
    try:
        with open(xml_file, 'r', encoding='utf-8') as file:
            root = ET.fromstring(file.read())
    except (ET.ParseError, UnicodeDecodeError) as e:
        # A single unreadable file must not abort the whole batch.
        print(f"Error parsing {xml_file}: {e}")
        return pd.DataFrame()

    titles = []
    pub_dates = []

    for item in root.findall('item'):
        # findtext() returns None for a missing element, so this also skips
        # items that carry no language tag at all.
        if item.findtext('ns0language') != 'en':
            continue

        # findtext() gives '' for both a missing and an empty element, so the
        # columns never mix '' and None.
        title = item.findtext('title', default='')
        pub_date = item.findtext('pubDate', default='').strip()

        # Convert pub_date to the desired format (YYYY-MM-DD)
        if pub_date:
            try:
                pub_date = datetime.strptime(
                    pub_date, '%a, %d %b %Y %H:%M:%S %z'
                ).strftime('%Y-%m-%d')
            except ValueError:
                # Keep the item, but treat the date like a missing one instead
                # of letting one odd value crash the run.
                print(f"Unrecognized pubDate {pub_date!r} in {xml_file}; leaving Date empty")
                pub_date = ''

        titles.append(title)
        pub_dates.append(pub_date)

    return pd.DataFrame({
        'Title': titles,
        'Date': pub_dates
    })

def process_all_xml_files(root_folder):
    """Parse every ``.xml`` file one level below ``root_folder`` into a single DataFrame.

    Each sub-directory of ``root_folder`` is scanned (non-recursively) for
    files whose name ends with ``.xml``; every such file is passed to
    ``parse_xml_to_df`` and the non-empty results are concatenated.

    Args:
        root_folder: Directory whose sub-directories hold the XML files.

    Returns:
        The concatenated DataFrame with a fresh integer index, or an empty
        DataFrame with the columns ``Title`` and ``Date`` when no file
        produced any rows.
    """
    all_dfs = []

    # os.listdir() returns names in arbitrary order; sorting makes the row
    # order of the result reproducible between runs and platforms.
    for folder_name in sorted(os.listdir(root_folder)):
        folder_path = os.path.join(root_folder, folder_name)
        if not os.path.isdir(folder_path):
            continue

        for file_name in sorted(os.listdir(folder_path)):
            if not file_name.endswith('.xml'):
                continue
            df = parse_xml_to_df(os.path.join(folder_path, file_name))
            if not df.empty:
                all_dfs.append(df)

    if not all_dfs:
        # pd.concat() raises ValueError on an empty list, so hand back an
        # empty frame with the expected columns instead.
        return pd.DataFrame(columns=['Title', 'Date'])

    return pd.concat(all_dfs, ignore_index=True)

def save_df_to_csv(df, output_file):
    """Write ``df`` to ``output_file`` as UTF-8 encoded CSV without the index column."""
    csv_options = {'index': False, 'encoding': 'utf-8'}
    df.to_csv(output_file, **csv_options)

# Example usage: adjust both paths to the local layout before running.
output_csv_path = 'filtered_news_title_1.csv'  # CSV file that receives the collected rows
root_folder_path = 'data/news'  # Change this to the path of the root folder containing the dated folders

# NOTE(review): process_all_xml_files(root_folder) takes no date bounds, so a
# cutoff date is not applied by this call - confirm that is intended.
final_df = process_all_xml_files(root_folder=root_folder_path)
save_df_to_csv(df=final_df, output_file=output_csv_path)


  from pandas.core.computation.check import NUMEXPR_INSTALLED
  from pandas.core import (


Error parsing data/news\20180927\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20180928\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20180929\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20180930\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181001\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181002\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181003\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181004\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181005\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181007\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/n

Error parsing data/news\20181219\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181220\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181221\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181222\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181223\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181224\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181225\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181226\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181227\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20181228\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/n

Error parsing data/news\20190311\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190312\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190313\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190314\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190315\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190316\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190317\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190318\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190320\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190321\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/n

Error parsing data/news\20190605\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190606\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190607\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190608\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190609\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190610\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190611\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190612\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190613\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190614\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/n

Error parsing data/news\20190828\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190829\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190830\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190831\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190901\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190902\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190903\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190904\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190905\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20190906\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/n

Error parsing data/news\20191125\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20191126\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20191127\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20191128\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20191129\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20191130\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20191201\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20191202\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20191203\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20191204\Rotavirus.xml: no element found: line 4, column 6978
Error parsing data/news\20191204

Error parsing data/news\20200118\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20200119\Food-borne.xml: mismatched tag: line 6, column 2
Error parsing data/news\20200119\Giardiasis.xml: mismatched tag: line 6, column 2
Error parsing data/news\20200119\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20200120\Fasciola.xml: mismatched tag: line 6, column 2
Error parsing data/news\20200120\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20200121\Hookworm.xml: mismatched tag: line 6, column 2
Error parsing data/news\20200121\Hymenolepsis.xml: mismatched tag: line 6, column 2
Error parsing data/news\20200121\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20200122\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Error parsing data/news\20200123\Yersinia Pestis (Plague).xml: mismatched tag: line 1, column 956
Erro

Error parsing data/news\20200305\Yersinia Pestis (Plague).xml: not well-formed (invalid token): line 1, column 129
Error parsing data/news\20200306\Babesiosis.xml: mismatched tag: line 6, column 2
Error parsing data/news\20200306\Yersinia Pestis (Plague).xml: not well-formed (invalid token): line 1, column 129
Error parsing data/news\20200307\Avian flu.xml: mismatched tag: line 6, column 2
Error parsing data/news\20200309\Dengue Fever.xml: mismatched tag: line 6, column 2
Error parsing data/news\20200309\Yersinia Pestis (Plague).xml: not well-formed (invalid token): line 1, column 129
Error parsing data/news\20200310\Brucellosis.xml: mismatched tag: line 6, column 2
Error parsing data/news\20200310\Yersinia Pestis (Plague).xml: not well-formed (invalid token): line 1, column 129
Error parsing data/news\20200312\Yersinia Pestis (Plague).xml: not well-formed (invalid token): line 1, column 129
Error parsing data/news\20200313\Yersinia Pestis (Plague).xml: not well-formed (invalid token):

Error parsing data/news\20200508\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200509\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200510\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200511\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200512\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200513\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200514\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200515\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200516\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200517\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200518\Yersinia Pestis (Plague).xm

Error parsing data/news\20200714\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200715\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 4735
Error parsing data/news\20200715\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200716\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 4735
Error parsing data/news\20200716\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200718\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 4735
Error parsing data/news\20200718\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200719\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 4735
Error parsing data/news\20200719\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200720\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 4735
Error pars

Error parsing data/news\20200826\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 4546
Error parsing data/news\20200826\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200827\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 4546
Error parsing data/news\20200827\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200828\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 4546
Error parsing data/news\20200828\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200829\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 5659
Error parsing data/news\20200829\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20200830\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 5659
Error parsing data/news\20200830\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error pars

Error parsing data/news\20201006\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201007\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 6599
Error parsing data/news\20201007\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201008\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 6599
Error parsing data/news\20201008\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201009\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 6599
Error parsing data/news\20201009\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201010\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 6599
Error parsing data/news\20201010\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201011\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 6599
Error pars

Error parsing data/news\20201217\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201218\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201219\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201220\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201221\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201222\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201223\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201224\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201225\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201226\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20201227\Yersinia Pestis (Plague).xm

Error parsing data/news\20210213\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210214\Fasciolopsiasis.xml: not well-formed (invalid token): line 1, column 1139
Error parsing data/news\20210214\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210215\Fasciolopsiasis.xml: not well-formed (invalid token): line 1, column 1139
Error parsing data/news\20210215\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210216\Fasciolopsiasis.xml: not well-formed (invalid token): line 1, column 1139
Error parsing data/news\20210216\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210217\Fasciolopsiasis.xml: not well-formed (invalid token): line 1, column 1139
Error parsing data/news\20210217\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210218\Fasciolopsiasis.xml: not well-formed (invalid token): line 1, column 

Error parsing data/news\20210428\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210429\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210430\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210501\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210502\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210503\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210504\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210505\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210506\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210507\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210508\Yersinia Pestis (Plague).xm

Error parsing data/news\20210717\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210718\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210719\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210720\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210721\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210722\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210723\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210724\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210725\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210726\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210727\Yersinia Pestis (Plague).xm

Error parsing data/news\20211216\HendraVirus.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Hepatitis A.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Hepatitis B.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Hepatitis C.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Hepatitis E.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Herpes Zoster.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Herpes.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Hookworm.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Hymenolepsis.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Influenza.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Japanese Encephalitis.xml: syntax error: line 1, column 0
Error parsing data/news\20211216\Kaposis Sarcoma.xml: syntax error: line 1, column 0
Error parsing data/ne

In [2]:
import os
import pandas as pd
import xml.etree.ElementTree as ET
from datetime import datetime, timedelta

def parse_xml_to_df(xml_file):
    """Collect the title and publication date of every English item in one XML file.

    Only ``item`` elements that are direct children of the document root and
    whose ``ns1language`` child has the text ``'en'`` are kept.

    Args:
        xml_file: Path of the XML file; it is read as UTF-8 text.

    Returns:
        A DataFrame with the columns ``Title`` and ``Date``. ``Date`` holds
        ``YYYY-MM-DD`` strings, or ``''`` when the item has no ``pubDate`` or
        the value does not match the expected format. An empty DataFrame
        (without columns) is returned when no English item is found or when
        the file cannot be decoded or parsed.
    """
    try:
        with open(xml_file, 'r', encoding='utf-8') as file:
            root = ET.fromstring(file.read())
    except (ET.ParseError, UnicodeDecodeError) as e:
        # A single unreadable file must not abort the whole batch.
        print(f"Error parsing {xml_file}: {e}")
        return pd.DataFrame()

    titles = []
    pub_dates = []

    for item in root.findall('item'):
        # The tag name carries no "prefix:" part, so no namespace mapping is
        # needed for the lookup. findtext() returns None for a missing
        # element, which also skips items without a language tag.
        if item.findtext('ns1language') != 'en':
            continue

        # findtext() gives '' for both a missing and an empty element, so the
        # columns never mix '' and None.
        title = item.findtext('title', default='')
        pub_date = item.findtext('pubDate', default='').strip()

        # Convert pub_date to the desired format (YYYY-MM-DD)
        if pub_date:
            try:
                pub_date = datetime.strptime(
                    pub_date, '%a, %d %b %Y %H:%M:%S %z'
                ).strftime('%Y-%m-%d')
            except ValueError:
                # Keep the item, but treat the date like a missing one instead
                # of letting one odd value crash the run.
                print(f"Unrecognized pubDate {pub_date!r} in {xml_file}; leaving Date empty")
                pub_date = ''

        titles.append(title)
        pub_dates.append(pub_date)

    if not titles:
        return pd.DataFrame()

    return pd.DataFrame({
        'Title': titles,
        'Date': pub_dates
    })

def process_all_xml_files(root_folder, start_date, end_date):
    """Parse the XML files of every dated folder between two dates (inclusive).

    For each day from ``start_date`` through ``end_date`` the folder
    ``root_folder/YYYYMMDD`` is looked up. Missing folders are reported on
    stdout and skipped; every ``.xml`` file in an existing folder is passed to
    ``parse_xml_to_df``.

    Args:
        root_folder: Directory that contains the ``YYYYMMDD`` folders.
        start_date: First day to process.
        end_date: Last day to process.

    Returns:
        The concatenation of all non-empty per-file DataFrames with a fresh
        integer index, or an empty DataFrame with the columns ``Title`` and
        ``Date`` when nothing was collected.
    """
    collected = []

    # Number of one-day steps that stay at or before end_date.
    day_count = (end_date - start_date).days + 1

    for offset in range(day_count):
        folder_name = (start_date + timedelta(days=offset)).strftime('%Y%m%d')
        folder_path = os.path.join(root_folder, folder_name)

        if not os.path.isdir(folder_path):
            print(f"Folder {folder_name} does not exist. Skipping.")
            continue

        xml_names = [name for name in os.listdir(folder_path) if name.endswith('.xml')]
        for xml_name in xml_names:
            frame = parse_xml_to_df(os.path.join(folder_path, xml_name))
            if not frame.empty:
                collected.append(frame)

    if not collected:
        return pd.DataFrame(columns=['Title', 'Date'])

    return pd.concat(collected, ignore_index=True)

def save_df_to_csv(df, output_file):
    """Store ``df`` at ``output_file`` as a UTF-8 CSV file, leaving out the index."""
    df.to_csv(
        output_file,
        encoding='utf-8',
        index=False,
    )

# Example usage: process the folders dated 2021-07-01 through 2023-09-22 (both included).
root_folder_path = 'data/news'  # Change this to the path of the root folder containing the dated folders
output_csv_path = 'filtered_news_title_2.csv'  # CSV file that receives the collected rows
start_date = datetime.strptime('20210701', '%Y%m%d')
end_date = datetime.strptime('20230922', '%Y%m%d')

final_df = process_all_xml_files(
    root_folder=root_folder_path,
    start_date=start_date,
    end_date=end_date,
)
save_df_to_csv(df=final_df, output_file=output_csv_path)


Error parsing data/news\20210701\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210702\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210703\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210704\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210705\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210706\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210707\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210708\Hymenolepsis.xml: not well-formed (invalid token): line 1, column 1007
Error parsing data/news\20210708\SchmallenbergVirus.xml: not well-formed (invalid token): line 1, column 6056
Error parsing data/news\20210708\Yersinia Pestis (Plague).xml: syntax error: line 1, column 0
Error parsing data/news\20210709\H

Error parsing data/news\20220414\Equine encephalitis.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Hanta Fever.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Leishmaniasis.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Leptospirosis.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Malaria.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Measles.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Meningitis.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Mumps.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Nosocomial.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Pneumonia.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Poliomyelitis.xml: no element found: line 1, column 0
Error parsing data/news\20220414\Swine Flu.xml: no element found: lin