Spaces:
Build error
Build error
| # -*- coding: utf-8 -*- | |
| #java -mx4g -cp "*" edu.stanford.nlp.pipeline.StanfordCoreNLPServer --port 8080 | |
| import glob | |
| import os | |
class InputHandler(object):
    """Collect the files under a folder tree whose names match a glob pattern.

    The handler stores a root folder and a glob pattern (for example
    ``'*.txt'``) and, on request, returns every matching path found in the
    root folder and in all of its nested subdirectories.
    """

    def __init__(self, folder_path, extension):
        """Remember where to search and which pattern to look for.

        Args:
            folder_path: Root directory of the search; may be absolute or
                relative to the current working directory.
            extension: Glob pattern applied to the entries of every
                directory in the tree (passed to ``glob.glob`` as is).
        """
        self.folder_path = folder_path
        self.extension = extension
        print("Handling Corpus...")

    def _get_dirs(self, base):
        """Return the paths of the immediate subdirectories of ``base``.

        Each returned path already includes ``base`` as its prefix, because
        it comes from globbing ``os.path.join(base, '*')``.
        """
        return [
            entry
            for entry in glob.iglob(os.path.join(base, '*'))
            if os.path.isdir(entry)
        ]

    def get_base_file(self, base, pattern):
        """Recursively list the paths under ``base`` that match ``pattern``.

        Args:
            base: Directory to search.
            pattern: Glob pattern matched against the entries of ``base``
                and of every directory nested below it.

        Returns:
            A list of matching paths: the matches directly inside ``base``
            first, followed by the matches of each subdirectory in turn.
        """
        matches = glob.glob(os.path.join(base, pattern))
        for subdir in self._get_dirs(base):
            # ``subdir`` already carries the ``base`` prefix. Joining it onto
            # ``base`` a second time only works for absolute paths (where
            # os.path.join discards the first component); for a relative
            # ``base`` it yields ``base/base/sub`` and nested files are
            # silently skipped. Recurse into ``subdir`` directly instead.
            matches.extend(self.get_base_file(subdir, pattern))
        return matches

    def get_input(self):
        """Return every file under ``self.folder_path`` matching ``self.extension``."""
        return self.get_base_file(self.folder_path, self.extension)