Spaces:
Running
Running
import argparse | |
import json | |
import os | |
def parse_args(): | |
parser = argparse.ArgumentParser(description="Convert jsonl to json.") | |
parser.add_argument("--video_folder", type=str, default="", help="The video folder.") | |
parser.add_argument( | |
"--jsonl_load_path", type=str, default=None, help="The path to the video dataset metadata (csv/jsonl)." | |
) | |
parser.add_argument("--save_path", type=str, default=None, help="The save path to the output results.") | |
args = parser.parse_args() | |
return args | |
def main(): | |
args = parse_args() | |
with open(args.jsonl_load_path, "r") as read: | |
_lines = read.readlines() | |
output = [] | |
for line in _lines: | |
try: | |
line = json.loads(line.strip()) | |
videoid, name = line['video_path'], line['summary_caption'] | |
output.append( | |
{ | |
"file_path": os.path.join(args.video_folder, videoid), | |
"text": name, | |
"type": "video", | |
} | |
) | |
except: | |
pass | |
with open(args.save_path, mode="w", encoding="utf-8") as f: | |
json.dump(output, f, indent=2) | |
if __name__ == "__main__": | |
main() |