{
  "architectures": [
    "MotionEncoder"
  ],
  "model_type": "motion_encoder",
  "motion_num_frames": 25,
  "torch_dtype": "bfloat16",
  "transformers_version": "4.47.1",
  "vit_model_name": "google/vivit-b-16x2"
}