In [None]:
import os
import logging
import csv
import xml.etree.ElementTree as ET
from docx_extraction import extract_docx_properties
from docx import Document

def process_folder(folder_path, output_folder):
    """Convert every Word document found under ``folder_path`` into a CSV.

    The tree rooted at ``folder_path`` is walked recursively. Each ``.docx``
    file (extension matched case-insensitively) is handed to
    ``extract_and_save_properties`` together with a target path of
    ``<output_folder>/<file base name>.csv``.

    Args:
        folder_path: Directory to scan for documents.
        output_folder: Directory that receives the CSV files; created
            (including missing parents) when it does not exist.

    Note:
        The CSV name is built from the file's base name only, so two documents
        with the same name in different sub-folders write to the same CSV.
    """
    # exist_ok replaces the check-then-create sequence, which could fail if the
    # directory appeared between the check and the creation.
    os.makedirs(output_folder, exist_ok=True)

    for root, _dirs, files in os.walk(folder_path):
        for file in files:
            # "~$name.docx" files are the owner/lock files Word leaves beside
            # an open document; they are not real documents and would abort
            # the batch when opened.
            if file.startswith('~$'):
                continue
            if not file.lower().endswith('.docx'):
                continue
            input_file_path = os.path.join(root, file)
            output_csv_path = os.path.join(output_folder, os.path.splitext(file)[0] + '.csv')
            extract_and_save_properties(input_file_path, output_csv_path)

def extract_and_save_properties(input_file_path, output_csv_path):
    """Clean one document, extract its properties and write them as CSV.

    The document is opened, stripped of blank paragraphs and saved back over
    ``input_file_path`` (the input file is modified in place). The cleaned
    file is then passed to ``extract_docx_properties``; a truthy result is
    forwarded to ``xml_to_csv``, a falsy one only produces a warning.

    Args:
        input_file_path: Path of the ``.docx`` file to process (overwritten).
        output_csv_path: Path of the CSV file to create.
    """
    logging.info(f"Started to extract the docx properties from {input_file_path}")

    # Clean first, because the extractor reads the file from disk by path.
    document = Document(input_file_path)
    remove_empty_paragraphs(document)
    document.save(input_file_path)

    properties_xml = extract_docx_properties(input_file_path)
    if not properties_xml:
        logging.warning(f"No properties extracted from {input_file_path}")
        return

    logging.info(f"Converting properties XML to CSV: {output_csv_path}")
    xml_to_csv(properties_xml, output_csv_path)

def xml_to_csv(para_properties_xml, output_csv_path):
    """Write the ``ParagraphProperties`` records of an XML string to a CSV file.

    Every ``ParagraphProperties`` element that is a direct child of the XML
    root becomes one CSV row; each of its child elements contributes a column
    named after the child's tag, holding the child's text. If a tag repeats
    inside one record, the last occurrence wins.

    The header is the union of all tags seen across the records, in first-seen
    order. Records that lack a column get an empty cell. (Deriving the header
    from the first record alone made ``csv.DictWriter`` raise ``ValueError``
    as soon as a later record carried an extra tag.)

    Args:
        para_properties_xml: XML document as a string.
        output_csv_path: Destination file; written as UTF-8 with a BOM.

    Raises:
        xml.etree.ElementTree.ParseError: If the XML cannot be parsed.
        OSError: If the output file cannot be opened for writing.
    """
    root = ET.fromstring(para_properties_xml)
    properties_list = [
        {prop.tag: prop.text for prop in para}
        for para in root.findall('ParagraphProperties')
    ]

    # dict.fromkeys de-duplicates while keeping the first-seen column order.
    fieldnames = list(dict.fromkeys(tag for row in properties_list for tag in row))

    with open(output_csv_path, 'w', newline='', encoding='utf-8-sig') as csvfile:
        writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
        writer.writeheader()
        writer.writerows(properties_list)

def remove_empty_paragraphs(doc):
    """Remove every paragraph whose text is empty or whitespace-only.

    The document is modified in place: the XML element of each such paragraph
    is removed from ``doc._element.body``.

    NOTE(review): the check looks at ``para.text`` only, so a paragraph that
    has no text but carries other content would be removed as well. Confirm
    that this is intended.

    Args:
        doc: Document object exposing ``paragraphs`` and ``_element.body``.
    """
    # Decide what to drop before touching the tree, then remove in one pass.
    blank_paragraphs = [
        paragraph for paragraph in doc.paragraphs if not paragraph.text.strip()
    ]
    body = doc._element.body
    for paragraph in blank_paragraphs:
        body.remove(paragraph._element)

if __name__ == "__main__":
    # Batch driver: converts every document under folder_path into a CSV.
    # Both paths are absolute and machine-specific; adjust them before running
    # anywhere else.
    folder_path = '/Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx'
    # The output directory is a sub-folder of the input folder above.
    output_folder = '/Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset'
    process_folder(folder_path, output_folder)


In [9]:
import os
import logging
import csv
import xml.etree.ElementTree as ET
from docx_extraction import extract_docx_properties
from docx import Document

def process_folder(folder_path, output_folder):
    """Convert every Word document found under ``folder_path`` into a CSV.

    The tree rooted at ``folder_path`` is walked recursively. Each ``.docx``
    file (extension matched case-insensitively) is handed to
    ``extract_and_save_properties`` together with a target path of
    ``<output_folder>/<file base name>.csv``. A failure on one file is logged
    as a warning and does not stop the remaining files from being processed.

    Args:
        folder_path: Directory to scan for documents.
        output_folder: Directory that receives the CSV files; created
            (including missing parents) when it does not exist.

    Note:
        The CSV name is built from the file's base name only, so two documents
        with the same name in different sub-folders write to the same CSV.
    """
    # exist_ok replaces the check-then-create sequence, which could fail if the
    # directory appeared between the check and the creation.
    os.makedirs(output_folder, exist_ok=True)

    for root, _dirs, files in os.walk(folder_path):
        for file in files:
            # "~$name.docx" files are the owner/lock files Word leaves beside
            # an open document; they are not real documents, so skip them
            # instead of logging a spurious processing error.
            if file.startswith('~$'):
                continue
            if not file.lower().endswith('.docx'):
                continue
            input_file_path = os.path.join(root, file)
            output_csv_path = os.path.join(output_folder, os.path.splitext(file)[0] + '.csv')
            try:
                extract_and_save_properties(input_file_path, output_csv_path)
            except Exception as e:
                # Best effort: keep going with the next document.
                logging.warning(f"Error processing file {input_file_path}: {str(e)}")

def extract_and_save_properties(input_file_path, output_csv_path):
    """Clean one document, extract its properties and write them as CSV.

    The document is opened, stripped of blank paragraphs and saved back over
    ``input_file_path`` (the input file is modified in place); errors in this
    phase propagate to the caller. The cleaned file is then passed to
    ``extract_docx_properties``; a truthy result is forwarded to
    ``xml_to_csv``, a falsy one only produces a warning. Any exception raised
    during extraction or conversion is logged as a warning and suppressed.

    Args:
        input_file_path: Path of the ``.docx`` file to process (overwritten).
        output_csv_path: Path of the CSV file to create.
    """
    logging.info(f"Started to extract the docx properties from {input_file_path}")

    # Clean first, because the extractor reads the file from disk by path.
    document = Document(input_file_path)
    remove_empty_paragraphs(document)
    document.save(input_file_path)

    try:
        properties_xml = extract_docx_properties(input_file_path)
        if not properties_xml:
            logging.warning(f"No properties extracted from {input_file_path}")
            return
        logging.info(f"Converting properties XML to CSV: {output_csv_path}")
        xml_to_csv(properties_xml, output_csv_path)
    except Exception as error:
        logging.warning(f"Error extracting properties from {input_file_path}: {str(error)}")

def xml_to_csv(para_properties_xml, output_csv_path):
    """Write the ``ParagraphProperties`` records of an XML string to a CSV file.

    Every ``ParagraphProperties`` element that is a direct child of the XML
    root becomes one CSV row; each of its child elements contributes a column
    named after the child's tag, holding the child's text. If a tag repeats
    inside one record, the last occurrence wins.

    The header is the union of all tags seen across the records, in first-seen
    order. Records that lack a column get an empty cell. (Deriving the header
    from the first record alone made ``csv.DictWriter`` fail as soon as a
    later record carried an extra tag, leaving a truncated CSV behind.)

    This function is best-effort: any exception (malformed XML, unwritable
    path, ...) is logged as a warning and suppressed.

    Args:
        para_properties_xml: XML document as a string.
        output_csv_path: Destination file; written as UTF-8 with a BOM.
    """
    try:
        root = ET.fromstring(para_properties_xml)
        properties_list = [
            {prop.tag: prop.text for prop in para}
            for para in root.findall('ParagraphProperties')
        ]

        # dict.fromkeys de-duplicates while keeping the first-seen column order.
        fieldnames = list(dict.fromkeys(tag for row in properties_list for tag in row))

        with open(output_csv_path, 'w', newline='', encoding='utf-8-sig') as csvfile:
            writer = csv.DictWriter(csvfile, fieldnames=fieldnames)
            writer.writeheader()
            writer.writerows(properties_list)
    except Exception as e:
        logging.warning(f"Error converting properties XML to CSV: {str(e)}")

def remove_empty_paragraphs(doc):
    """Remove every paragraph whose text is empty or whitespace-only.

    The document is modified in place: the XML element of each such paragraph
    is removed from ``doc._element.body``.

    NOTE(review): the check looks at ``para.text`` only, so a paragraph that
    has no text but carries other content would be removed as well. Confirm
    that this is intended.

    Args:
        doc: Document object exposing ``paragraphs`` and ``_element.body``.
    """
    # Decide what to drop before touching the tree, then remove in one pass.
    blank_paragraphs = [
        paragraph for paragraph in doc.paragraphs if not paragraph.text.strip()
    ]
    body = doc._element.body
    for paragraph in blank_paragraphs:
        body.remove(paragraph._element)

if __name__ == "__main__":
    # Batch driver: converts every document under folder_path into a CSV.
    # Both paths are absolute and machine-specific; adjust them before running
    # anywhere else.
    folder_path = '/Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx'
    # The output directory is a sub-folder of the input folder above.
    output_folder = '/Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset'
    process_folder(folder_path, output_folder)


2024-02-10 22:08:53 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/ESE_20236882.docx
2024-02-10 22:08:53 INFO     Started creating the docx object
2024-02-10 22:08:53 INFO     Extracting the properties of the document
2024-02-10 22:08:53 INFO     Started processing the components to extract the properties
2024-02-10 22:08:55 INFO     Writing the extracted properties into XML
2024-02-10 22:08:55 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/ESE_20236882.csv
2024-02-10 22:08:55 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/ETJ_230108.docx
2024-02-10 22:08:55 INFO     Started creating the docx object
2024-02-10 22:08:55 INFO     Extracting the properties of the document
2024-02-10 22:08:55 INFO     Started proce

Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from lis

2024-02-10 22:10:08 INFO     Writing the extracted properties into XML
2024-02-10 22:10:08 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/JN_20230505.csv
2024-02-10 22:10:08 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/REP_230067.docx
2024-02-10 22:10:08 INFO     Started creating the docx object
2024-02-10 22:10:08 INFO     Extracting the properties of the document
2024-02-10 22:10:08 INFO     Started processing the components to extract the properties
2024-02-10 22:10:14 INFO     Writing the extracted properties into XML
2024-02-10 22:10:14 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/REP_230067.csv
2024-02-10 22:10:14 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-10 22:20:47 INFO     Writing the extracted properties into XML
2024-02-10 22:20:47 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/CMJ_20220117.csv
2024-02-10 22:20:47 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/OIKOS_oik_09929.docx
2024-02-10 22:20:47 INFO     Started creating the docx object
2024-02-10 22:20:47 INFO     Extracting the properties of the document
2024-02-10 22:20:47 INFO     Started processing the components to extract the properties
2024-02-10 22:20:59 INFO     Writing the extracted properties into XML
2024-02-10 22:20:59 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/OIKOS_oik_09929.csv
2024-02-10 22:20:59 INFO     Started to extract the docx properties from /Users/senthil/Downloads/J

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-10 22:22:29 INFO     Writing the extracted properties into XML
2024-02-10 22:22:29 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/EDM_230088.csv
2024-02-10 22:22:29 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/TJG_20230492.docx
2024-02-10 22:22:29 INFO     Started creating the docx object
2024-02-10 22:22:29 INFO     Extracting the properties of the document
2024-02-10 22:22:29 INFO     Started processing the components to extract the properties
2024-02-10 22:22:32 INFO     Writing the extracted properties into XML
2024-02-10 22:22:32 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/TJG_20230492.csv
2024-02-10 22:22:32 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journ

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-10 22:23:17 INFO     Writing the extracted properties into XML
2024-02-10 22:23:17 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/TJN_20230573.csv
2024-02-10 22:23:17 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/OIKOS_lind_25251.docx
2024-02-10 22:23:17 INFO     Started creating the docx object
2024-02-10 22:23:17 INFO     Extracting the properties of the document
2024-02-10 22:23:17 INFO     Started processing the components to extract the properties
2024-02-10 22:23:19 INFO     Writing the extracted properties into XML
2024-02-10 22:23:19 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/OIKOS_lind_25251.csv
2024-02-10 22:23:19 INFO     Started to extract the docx properties from /Users/senthil/Downloads

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-10 22:25:46 INFO     Writing the extracted properties into XML
2024-02-10 22:25:46 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/OIKOS_oik_09952.csv
2024-02-10 22:25:46 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/AJC_20233695.docx
2024-02-10 22:25:46 INFO     Started creating the docx object
2024-02-10 22:25:46 INFO     Extracting the properties of the document
2024-02-10 22:25:46 INFO     Started processing the components to extract the properties
2024-02-10 22:25:50 INFO     Writing the extracted properties into XML
2024-02-10 22:25:50 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/AJC_20233695.csv
2024-02-10 22:25:50 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/

Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range


2024-02-11 00:06:30 INFO     Writing the extracted properties into XML
2024-02-11 00:06:30 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/TJG_23116.csv
2024-02-11 00:06:30 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/AOTT_20230184.docx
2024-02-11 00:06:30 INFO     Started creating the docx object
2024-02-11 00:06:30 INFO     Extracting the properties of the document
2024-02-11 00:06:30 INFO     Started processing the components to extract the properties
2024-02-11 00:06:31 INFO     Writing the extracted properties into XML
2024-02-11 00:06:31 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/AOTT_20230184.csv
2024-02-11 00:06:31 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/jour

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 00:43:42 INFO     Writing the extracted properties into XML
2024-02-11 00:43:42 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/AJC_20233779.csv
2024-02-11 00:43:42 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/JME_230087.docx
2024-02-11 00:43:42 INFO     Started creating the docx object
2024-02-11 00:43:42 INFO     Extracting the properties of the document
2024-02-11 00:43:42 INFO     Started processing the components to extract the properties
2024-02-11 00:43:47 INFO     Writing the extracted properties into XML
2024-02-11 00:43:47 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/JME_230087.csv
2024-02-11 00:43:47 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journal

Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' object has no attribute 'val'
Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' object has no attribute 'val'
Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' object has no attribute 'val'
Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' object has no attribute 'val'
Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' 

2024-02-11 02:45:48 INFO     Writing the extracted properties into XML
2024-02-11 02:45:48 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/JIAO_20220806.csv
2024-02-11 02:45:48 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/AUJWS_20230033.docx
2024-02-11 02:45:48 INFO     Started creating the docx object
2024-02-11 02:45:48 INFO     Extracting the properties of the document
2024-02-11 02:45:48 INFO     Started processing the components to extract the properties
2024-02-11 02:45:49 INFO     Writing the extracted properties into XML
2024-02-11 02:45:49 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/AUJWS_20230033.csv
2024-02-11 02:45:49 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JP

Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' object has no attribute 'val'
Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' object has no attribute 'val'


2024-02-11 05:49:03 INFO     Writing the extracted properties into XML
2024-02-11 05:49:03 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/JN_20230446.csv
2024-02-11 05:49:03 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/OIKOS_oik_10328.docx
2024-02-11 05:49:03 INFO     Started creating the docx object
2024-02-11 05:49:03 INFO     Extracting the properties of the document
2024-02-11 05:49:03 INFO     Started processing the components to extract the properties
2024-02-11 06:49:46 INFO     Writing the extracted properties into XML
2024-02-11 06:49:46 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/OIKOS_oik_10328.csv
2024-02-11 06:49:46 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JP

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 07:41:02 INFO     Writing the extracted properties into XML
2024-02-11 07:41:02 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/AHSR_20230133.csv
2024-02-11 07:41:02 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/REP_230237.docx
2024-02-11 07:41:02 INFO     Started creating the docx object
2024-02-11 07:41:02 INFO     Extracting the properties of the document
2024-02-11 07:41:02 INFO     Started processing the components to extract the properties
2024-02-11 07:41:08 INFO     Writing the extracted properties into XML
2024-02-11 07:41:08 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/REP_230237.csv
2024-02-11 07:41:08 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journa

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 07:41:28 INFO     Writing the extracted properties into XML
2024-02-11 07:41:28 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/ECC_230472.csv
2024-02-11 07:41:28 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/ENTU_20230338.docx
2024-02-11 07:41:28 INFO     Started creating the docx object
2024-02-11 07:41:28 INFO     Extracting the properties of the document
2024-02-11 07:41:28 INFO     Started processing the components to extract the properties
2024-02-11 07:41:29 INFO     Writing the extracted properties into XML
2024-02-11 07:41:30 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/ENTU_20230338.csv
2024-02-11 07:41:30 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/jou

Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from lis

2024-02-11 07:43:28 INFO     Writing the extracted properties into XML
2024-02-11 07:43:28 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/TJG_20230267.csv
2024-02-11 07:43:28 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/CRDS_20220002.docx
2024-02-11 07:43:28 INFO     Started creating the docx object
2024-02-11 07:43:28 INFO     Extracting the properties of the document
2024-02-11 07:43:28 INFO     Started processing the components to extract the properties
2024-02-11 07:43:31 INFO     Writing the extracted properties into XML
2024-02-11 07:43:31 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/CRDS_20220002.csv
2024-02-11 07:43:31 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/j

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 07:48:00 INFO     Writing the extracted properties into XML
2024-02-11 07:48:00 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/ERP_20230395.csv
2024-02-11 07:48:00 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/EAJM_20230376.docx
2024-02-11 07:48:00 INFO     Started creating the docx object
2024-02-11 07:48:00 INFO     Extracting the properties of the document
2024-02-11 07:48:00 INFO     Started processing the components to extract the properties
2024-02-11 07:48:02 INFO     Writing the extracted properties into XML
2024-02-11 07:48:02 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/EAJM_20230376.csv
2024-02-11 07:48:02 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/j

Error while fetching the list style information from para: list index out of range
Error while fetching the list style information from para: list index out of range


2024-02-11 07:48:17 INFO     Writing the extracted properties into XML
2024-02-11 07:48:17 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/AP_20231223.csv
2024-02-11 07:48:17 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/EAJM_20230360.docx
2024-02-11 07:48:18 INFO     Started creating the docx object
2024-02-11 07:48:18 INFO     Extracting the properties of the document
2024-02-11 07:48:18 INFO     Started processing the components to extract the properties
2024-02-11 07:48:22 INFO     Writing the extracted properties into XML
2024-02-11 07:48:22 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/EAJM_20230360.csv
2024-02-11 07:48:22 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/jo

Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range


2024-02-11 08:03:53 INFO     Writing the extracted properties into XML
2024-02-11 08:03:53 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/TJG_20230116.csv
2024-02-11 08:03:53 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/AJC_20233517.docx
2024-02-11 08:03:53 INFO     Started creating the docx object
2024-02-11 08:03:53 INFO     Extracting the properties of the document
2024-02-11 08:03:53 INFO     Started processing the components to extract the properties
2024-02-11 08:04:03 INFO     Writing the extracted properties into XML
2024-02-11 08:04:03 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/AJC_20233517.csv
2024-02-11 08:04:03 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/jou

Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range


2024-02-11 08:05:36 INFO     Writing the extracted properties into XML
2024-02-11 08:05:36 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/JIAO_20231393.csv
2024-02-11 08:05:36 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/ELECT_220230001.docx
2024-02-11 08:05:36 INFO     Started creating the docx object
2024-02-11 08:05:36 INFO     Extracting the properties of the document
2024-02-11 08:05:36 INFO     Started processing the components to extract the properties
2024-02-11 08:05:40 INFO     Writing the extracted properties into XML
2024-02-11 08:05:40 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/ELECT_220230001.csv
2024-02-11 08:05:40 INFO     Started to extract the docx properties from /Users/senthil/Downloads/

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 08:06:23 INFO     Writing the extracted properties into XML
2024-02-11 08:06:23 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/BENT_20231468.csv
2024-02-11 08:06:23 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/AOTT_20230132.docx
2024-02-11 08:06:23 INFO     Started creating the docx object
2024-02-11 08:06:23 INFO     Extracting the properties of the document
2024-02-11 08:06:23 INFO     Started processing the components to extract the properties
2024-02-11 08:06:27 INFO     Writing the extracted properties into XML
2024-02-11 08:06:27 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/AOTT_20230132.csv
2024-02-11 08:06:27 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 08:18:07 INFO     Writing the extracted properties into XML
2024-02-11 08:18:07 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/TJN_20230605.csv
2024-02-11 08:18:07 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/VSP_20230172.docx
2024-02-11 08:18:08 INFO     Started creating the docx object
2024-02-11 08:18:08 INFO     Extracting the properties of the document
2024-02-11 08:18:08 INFO     Started processing the components to extract the properties
2024-02-11 08:18:09 INFO     Writing the extracted properties into XML
2024-02-11 08:18:09 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/VSP_20230172.csv
2024-02-11 08:18:09 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/jou

Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from lis

2024-02-11 08:19:12 INFO     Writing the extracted properties into XML
2024-02-11 08:19:12 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/Pharmata_20230030.csv
2024-02-11 08:19:12 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/JIRS_20230031.docx
2024-02-11 08:19:13 INFO     Started creating the docx object
2024-02-11 08:19:13 INFO     Extracting the properties of the document
2024-02-11 08:19:13 INFO     Started processing the components to extract the properties
2024-02-11 08:19:13 INFO     Writing the extracted properties into XML
2024-02-11 08:19:13 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/JIRS_20230031.csv
2024-02-11 08:19:13 INFO     Started to extract the docx properties from /Users/senthil/Downloads/

Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range


2024-02-11 08:39:21 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/OIKOS_WLB3_01195.docx
2024-02-11 08:39:21 INFO     Started creating the docx object
2024-02-11 08:39:21 INFO     Extracting the properties of the document
2024-02-11 08:39:21 INFO     Started processing the components to extract the properties
2024-02-11 08:39:27 INFO     Writing the extracted properties into XML
2024-02-11 08:39:27 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/OIKOS_WLB3_01195.csv
2024-02-11 08:39:27 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/OIKOS_njb_04151.docx
2024-02-11 08:39:27 INFO     Started creating the docx object
2024-02-11 08:39:27 INFO     Extracting the properties of the document
2024-02-11 08:39:27 INFO     

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 08:45:57 INFO     Writing the extracted properties into XML
2024-02-11 08:45:57 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/DIE_20230080.csv
2024-02-11 08:45:57 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/ERP_20230339.docx
2024-02-11 08:45:57 INFO     Started creating the docx object
2024-02-11 08:45:57 INFO     Extracting the properties of the document
2024-02-11 08:45:57 INFO     Started processing the components to extract the properties
2024-02-11 08:45:59 INFO     Writing the extracted properties into XML
2024-02-11 08:45:59 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/ERP_20230339.csv
2024-02-11 08:45:59 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/jou

Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range
Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range


2024-02-11 08:57:14 INFO     Writing the extracted properties into XML
2024-02-11 08:57:14 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/REP_230225.csv
2024-02-11 08:57:14 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/TJN_20220442.docx
2024-02-11 08:57:14 INFO     Started creating the docx object
2024-02-11 08:57:14 INFO     Extracting the properties of the document
2024-02-11 08:57:14 INFO     Started processing the components to extract the properties
2024-02-11 08:57:18 INFO     Writing the extracted properties into XML
2024-02-11 08:57:18 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/TJN_20220442.csv
2024-02-11 08:57:18 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journ

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 08:58:03 INFO     Writing the extracted properties into XML
2024-02-11 08:58:03 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/OIKOS_oik_09766.csv
2024-02-11 08:58:03 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/TJG_20230262.docx
2024-02-11 08:58:03 INFO     Started creating the docx object
2024-02-11 08:58:03 INFO     Extracting the properties of the document
2024-02-11 08:58:03 INFO     Started processing the components to extract the properties
2024-02-11 08:58:05 INFO     Writing the extracted properties into XML
2024-02-11 08:58:05 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/TJG_20230262.csv
2024-02-11 08:58:05 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 09:08:16 INFO     Writing the extracted properties into XML
2024-02-11 09:08:16 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/AOTT_20230067.csv
2024-02-11 09:08:16 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/REM_230026.docx
2024-02-11 09:08:16 INFO     Started creating the docx object
2024-02-11 09:08:16 INFO     Extracting the properties of the document
2024-02-11 09:08:16 INFO     Started processing the components to extract the properties
2024-02-11 09:08:24 INFO     Writing the extracted properties into XML
2024-02-11 09:08:24 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/REM_230026.csv
2024-02-11 09:08:24 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journa

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 09:09:44 INFO     Writing the extracted properties into XML
2024-02-11 09:09:44 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/REP_230229.csv
2024-02-11 09:09:44 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/REP_230383.docx
2024-02-11 09:09:44 INFO     Started creating the docx object
2024-02-11 09:09:44 INFO     Extracting the properties of the document
2024-02-11 09:09:44 INFO     Started processing the components to extract the properties
2024-02-11 09:09:49 INFO     Writing the extracted properties into XML
2024-02-11 09:09:49 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/REP_230383.csv
2024-02-11 09:09:49 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 09:37:00 INFO     Writing the extracted properties into XML
2024-02-11 09:37:00 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/OIKOS_oik_10248.csv
2024-02-11 09:37:00 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/ESE_20234977.docx
2024-02-11 09:37:00 INFO     Started creating the docx object
2024-02-11 09:37:00 INFO     Extracting the properties of the document
2024-02-11 09:37:00 INFO     Started processing the components to extract the properties
2024-02-11 09:37:00 INFO     Writing the extracted properties into XML
2024-02-11 09:37:00 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/ESE_20234977.csv
2024-02-11 09:37:01 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/

Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' object has no attribute 'val'
Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' object has no attribute 'val'
Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' object has no attribute 'val'
Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' object has no attribute 'val'
Error while fetching the list style information from para: 'NoneType' object has no attribute 'val'
Error while fetching the left indent information from list para: 'NoneType' 

2024-02-11 09:37:48 INFO     Writing the extracted properties into XML
2024-02-11 09:37:48 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/JOE_230330.csv
2024-02-11 09:37:48 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/CMJ_20230050.docx
2024-02-11 09:37:48 INFO     Started creating the docx object
2024-02-11 09:37:48 INFO     Extracting the properties of the document
2024-02-11 09:37:48 INFO     Started processing the components to extract the properties
2024-02-11 09:37:51 INFO     Writing the extracted properties into XML
2024-02-11 09:37:51 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/CMJ_20230050.csv
2024-02-11 09:37:51 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journ

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 09:53:14 INFO     Writing the extracted properties into XML
2024-02-11 09:53:14 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/AP_20231323.csv
2024-02-11 09:53:14 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/MAH_230015.docx
2024-02-11 09:53:14 INFO     Started creating the docx object
2024-02-11 09:53:14 INFO     Extracting the properties of the document
2024-02-11 09:53:14 INFO     Started processing the components to extract the properties
2024-02-11 09:53:27 INFO     Writing the extracted properties into XML
2024-02-11 09:53:27 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/MAH_230015.csv
2024-02-11 09:53:27 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals

Error while fetching the list style information from para: list index out of range
Error while fetching the left indent information from list para: list index out of range


2024-02-11 09:53:40 INFO     Writing the extracted properties into XML
2024-02-11 09:53:41 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/ETJ_230193.csv
2024-02-11 09:53:41 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/JN_20220249.docx
2024-02-11 09:53:41 INFO     Started creating the docx object
2024-02-11 09:53:41 INFO     Extracting the properties of the document
2024-02-11 09:53:41 INFO     Started processing the components to extract the properties
2024-02-11 09:53:44 INFO     Writing the extracted properties into XML
2024-02-11 09:53:44 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/JN_20220249.csv
2024-02-11 09:53:44 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journal

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 09:54:25 INFO     Writing the extracted properties into XML
2024-02-11 09:54:25 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/ERC_230235.csv
2024-02-11 09:54:25 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/OIKOS_WLB3_01131.docx
2024-02-11 09:54:25 INFO     Started creating the docx object
2024-02-11 09:54:25 INFO     Extracting the properties of the document
2024-02-11 09:54:25 INFO     Started processing the components to extract the properties
2024-02-11 09:54:34 INFO     Writing the extracted properties into XML
2024-02-11 09:54:34 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/OIKOS_WLB3_01131.csv
2024-02-11 09:54:34 INFO     Started to extract the docx properties from /Users/senthil/Downloads/J

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 09:55:28 INFO     Writing the extracted properties into XML
2024-02-11 09:55:28 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/OIKOS_ecog_07041.csv
2024-02-11 09:55:28 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/EOR_230055.docx
2024-02-11 09:55:28 INFO     Started creating the docx object
2024-02-11 09:55:28 INFO     Extracting the properties of the document
2024-02-11 09:55:28 INFO     Started processing the components to extract the properties
2024-02-11 09:55:32 INFO     Writing the extracted properties into XML
2024-02-11 09:55:32 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/EOR_230055.csv
2024-02-11 09:55:32 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/jou

Error while fetching the left indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'
Error while fetching the right indent information from para: '_CharacterStyle' object has no attribute 'paragraph_format'


2024-02-11 09:56:01 INFO     Writing the extracted properties into XML
2024-02-11 09:56:01 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/ESE_202303445.csv
2024-02-11 09:56:01 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/EDM_230086.docx
2024-02-11 09:56:01 INFO     Started creating the docx object
2024-02-11 09:56:01 INFO     Extracting the properties of the document
2024-02-11 09:56:01 INFO     Started processing the components to extract the properties
2024-02-11 09:56:04 INFO     Writing the extracted properties into XML
2024-02-11 09:56:04 INFO     Converting properties XML to CSV: /Users/senthil/Downloads/JPT/journals_data_element_prediction/dataset prep/updated_docx/dataset/EDM_230086.csv
2024-02-11 09:56:04 INFO     Started to extract the docx properties from /Users/senthil/Downloads/JPT/journa