# Source code for preprocessing.main_xml_files
"""
Main method that calls the EVS/ESS/SHARE scripts to generate MCSQ spreadsheet inputs
Author: Danielly Sorato
Author contact: danielly.sorato@gmail.com
"""
import os
import sys
sys.path.insert(0, 'evs_xml_data_extraction')
sys.path.insert(0, 'ess_xml_data_extraction')
sys.path.insert(0, 'share_xml_data_extraction')
import evs_xml_data_extraction
import ess_xml_data_extraction
import share_xml_data_extraction
def main(folder_path):
    """
    Transform every EVS, ESS and SHARE XML file found in a directory.

    This main file calls the transformation algorithms inside the
    evs_xml_data_extraction, ess_xml_data_extraction and
    share_xml_data_extraction scripts:

    * evs_xml_data_extraction is called for files whose name contains 'EVS'
    * ess_xml_data_extraction is called for files whose name contains 'ESS'
    * share_xml_data_extraction is called for files whose name contains 'SHA'

    The algorithm transforms a XML file to a structured spreadsheet format
    with valuable metadata.

    Only directory entries whose name ends with ".xml" are considered; an XML
    file matching none of the three markers is announced but not transformed.
    When a name contains several markers, the first match in the order
    EVS, ESS, SHA wins.

    Call main script using folder_path, for instance:

        reset && python3 main.py /path/to/your/data

    Side effects:
        The process working directory is changed to folder_path and is not
        restored afterwards.

    Args:
        param1 folder_path: the path of the directory containing the files to transform
    """
    # os.chdir() returns None, so its result must not be used as a path.
    # The working directory is changed because the extraction scripts are
    # handed the bare file name only -- presumably they resolve it against
    # the current directory (confirm in the extraction modules).
    os.chdir(folder_path)

    for file in os.listdir('.'):
        if not file.endswith(".xml"):
            continue

        print('Transforming XML file:', file)
        if 'EVS' in file:
            evs_xml_data_extraction.main(file)
        elif 'ESS' in file:
            ess_xml_data_extraction.main(file)
        elif 'SHA' in file:
            share_xml_data_extraction.main(file)
if __name__ == "__main__":
    # The directory to process is the first command-line argument; exit with
    # a usage hint instead of an IndexError traceback when it is missing.
    if len(sys.argv) < 2:
        sys.exit('Usage: python3 {} /path/to/your/data'.format(sys.argv[0]))
    folder_path = sys.argv[1]
    main(folder_path)