PatentSolver / App /run_normal_folder.py
xin's picture
initial commit
22738ca
raw
history blame contribute delete
806 Bytes
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
# @File : run_normal_folder.py
# @Author: nixin
# @Date : 2021/11/11
from App.bin import constants
from App.bin.InputHandler import InputHandler
from App.bin.PatentHandler import PatentHandler
from App.bin.CorpusProcessor import CorpusProcessor
import time
start_time = time.time()
input_folder = constants.DATA_INPUT + 'US_patents'
files_extension = "*." + 'txt'
iInput = InputHandler(input_folder, files_extension)
input_data = iInput.get_input()
pretreat_data = PatentHandler(input_data)
clean_patent_data = pretreat_data.pretreat_data()
process_data = CorpusProcessor(clean_patent_data,input_folder, files_extension)
processed_data = process_data.process_corpus()
print("Process is finished within %s seconds" % round(time.time() - start_time,2))