Spaces:
Running
on
Zero
Running
on
Zero
''' | |
THis file is to collect all lang.txt and move to a new directory, this is for the convenience to compress and scp the lang for post-processing | |
''' | |
import os, sys, shutil | |
if __name__ == "__main__": | |
parent_dir = "../datasets_rob" | |
dataset_paths = ["Bridge_v1_TT14", "Bridge_v2_TT14"] | |
store_folder = "../full_text_tmp" | |
# Manage the store folder | |
if os.path.exists(store_folder): | |
shutil.rmtree(store_folder) | |
os.makedirs(store_folder) | |
for dataset_name in dataset_paths: | |
store_path = os.path.join(store_folder, dataset_name) | |
if os.path.exists(store_path): | |
shutil.rmtree(store_path) | |
os.makedirs(store_path) | |
# Iterate all the files | |
for sub_folder_name in os.listdir(os.path.join(parent_dir, dataset_name)): | |
print("We are processing ", sub_folder_name) | |
lang_txt_path = os.path.join(parent_dir, dataset_name, sub_folder_name, "lang.txt") | |
# Store on the new address | |
store_file_path = os.path.join(store_path, sub_folder_name) | |
os.makedirs(store_file_path) | |
shutil.copyfile(lang_txt_path, os.path.join(store_file_path, "lang.txt")) | |