Spaces:
Running
on
Zero
Running
on
Zero
| ''' | |
| This is a script to process Mark's data. | |
| ''' | |
| import os, sys, shutil | |
def _read_first_line(text_path):
    """Return the first line of *text_path* (line ending kept), or None.

    None is returned when the path is not a regular file or the file is empty,
    so callers can treat "no prompt available" uniformly.
    """
    if not os.path.isfile(text_path):
        return None
    with open(text_path, "r") as handle:
        first_line = handle.readline()
    return first_line or None


def reorganize_dataset(file_path, store_path, most_descriptive_prompt_idx, cycle_length=10):
    """Collapse every cycle of ``run_*`` folders into one numbered folder.

    For each group index ``idx`` the folder ``run_<cycle_length * idx>`` is
    copied (except its ``lang.txt``) to ``<store_path>/<idx>``. A new
    ``lang.txt`` is then written there containing the first line of the
    ``lang.txt`` of every run in the cycle, with the prompt at offset
    ``most_descriptive_prompt_idx`` placed first and the others following in
    ascending run order.

    Args:
        file_path: Directory holding the ``run_<n>`` sub-folders.
        store_path: Output directory. It is DELETED and recreated if it exists.
        most_descriptive_prompt_idx: Zero-based offset, inside a cycle, of the
            prompt that must be written first.
        cycle_length: Number of consecutive runs that form one cycle.

    Returns:
        The number of group folders written under ``store_path``.

    Raises:
        ValueError: If ``cycle_length`` is not positive.
    """
    if cycle_length <= 0:
        raise ValueError("cycle_length must be a positive integer")

    # Folder management: always start from an empty output directory.
    if os.path.exists(store_path):
        shutil.rmtree(store_path)
    os.makedirs(store_path)

    # The number of groups is derived from the entry count of file_path.
    # NOTE(review): this presumes file_path holds only contiguous run_<n>
    # folders; stray entries or numbering gaps shift the count - confirm.
    target_length = len(os.listdir(file_path)) // cycle_length

    written_groups = 0
    for idx in range(target_length):
        first_run = cycle_length * idx
        sub_folder_path = os.path.join(file_path, "run_" + str(first_run))
        if not os.path.exists(sub_folder_path):
            continue

        # Prepare the target position
        sub_store_path = os.path.join(store_path, str(idx))
        os.makedirs(sub_store_path)

        # Key prompts by their offset in the cycle rather than appending to a
        # list: a missing lang.txt must not shift the prompts that follow it,
        # otherwise the "most descriptive" lookup picks the wrong run.
        prompts = {}
        for offset in range(cycle_length):
            lang_path = os.path.join(file_path, "run_" + str(first_run + offset), "lang.txt")
            first_line = _read_first_line(lang_path)
            if first_line is not None:
                prompts[offset] = first_line
        print("prompt_content we have num ", len(prompts))

        # Copy the images and data files of the first run of the cycle.
        for file_name in os.listdir(sub_folder_path):
            if file_name == "lang.txt":
                continue
            shutil.copyfile(
                os.path.join(sub_folder_path, file_name),
                os.path.join(sub_store_path, file_name),
            )

        if most_descriptive_prompt_idx not in prompts:
            print(
                "warning: group " + str(idx) + " has no prompt at offset "
                + str(most_descriptive_prompt_idx) + "; writing the remaining prompts only",
                file=sys.stderr,
            )

        # Most descriptive prompt first (False sorts before True), then the
        # rest in ascending run order.
        ordered_offsets = sorted(
            prompts,
            key=lambda offset: (offset != most_descriptive_prompt_idx, offset),
        )

        # sub_store_path was just created, so the file never pre-exists.
        # Each prompt is written exactly as read plus "\n", which keeps the
        # output format of the previous implementation.
        target_lang_txt_path = os.path.join(sub_store_path, "lang.txt")
        with open(target_lang_txt_path, "w") as out:
            out.writelines(prompts[offset] + "\n" for offset in ordered_offsets)

        written_groups += 1

    return written_groups


if __name__ == "__main__":
    file_path = "/nfs/turbo/coe-jjparkcv/datasets/isaac-gym-pick-place/full/dataset_v3_proc"
    store_path = "../datasets_rob/sim_raw"
    most_descriptive_prompt_idx = 6  # Zero-based, i.e. the 7th run of each cycle

    reorganize_dataset(file_path, store_path, most_descriptive_prompt_idx)