update folders
This commit is contained in:
@@ -34,7 +34,8 @@ def _load_json_from_path(json_path: str) -> Dict:
|
|||||||
|
|
||||||
def get_raw_english_texts_of_project(project_dirname: str, oracc_site: str = 'oracc.museum.upenn.edu') -> List[Dict]:
|
def get_raw_english_texts_of_project(project_dirname: str, oracc_site: str = 'oracc.museum.upenn.edu') -> List[Dict]:
|
||||||
raw_jsons = list()
|
raw_jsons = list()
|
||||||
all_paths = glob.glob(f'jsons_unzipped/{project_dirname}/**/corpusjson/*.json', recursive=True)
|
all_paths = glob.glob(f'jsons_unzipped/{project_dirname}/**/corpusjson/*.json', recursive=True) + glob.glob(
|
||||||
|
f'jsons_unzipped/{project_dirname}/corpusjson/*.json', recursive=True)
|
||||||
# path = Path(os.path.join(JSONS_DIR, project_dirname, 'catalogue.json'))
|
# path = Path(os.path.join(JSONS_DIR, project_dirname, 'catalogue.json'))
|
||||||
# if not os.path.isfile(path):
|
# if not os.path.isfile(path):
|
||||||
# return raw_jsons
|
# return raw_jsons
|
||||||
|
Reference in New Issue
Block a user