End of training
Browse files- .gitattributes +2 -0
- checkpoint-1000/motion_encoder/config.json +10 -0
- checkpoint-1000/motion_encoder/model.safetensors +3 -0
- checkpoint-1000/optimizer.bin +3 -0
- checkpoint-1000/random_states_0.pkl +3 -0
- checkpoint-1000/scheduler.bin +3 -0
- checkpoint-1000/unet/config.json +38 -0
- checkpoint-1000/unet/diffusion_pytorch_model.safetensors +3 -0
- checkpoint-500/motion_encoder/config.json +10 -0
- checkpoint-500/motion_encoder/model.safetensors +3 -0
- checkpoint-500/optimizer.bin +3 -0
- checkpoint-500/random_states_0.pkl +3 -0
- checkpoint-500/scheduler.bin +3 -0
- checkpoint-500/unet/config.json +38 -0
- checkpoint-500/unet/diffusion_pytorch_model.safetensors +3 -0
- diffusion_pytorch_model.safetensors +2 -2
- model.safetensors +1 -1
- validation_images/step_1000_val_cross_0.mp4 +0 -0
- validation_images/step_1000_val_recon_0.mp4 +2 -2
- validation_images/step_1000_val_source_0.mp4 +2 -2
- validation_images/step_1_val_cross_0.mp4 +2 -2
- validation_images/step_1_val_recon_0.mp4 +2 -2
- validation_images/step_1_val_source_0.mp4 +2 -2
- validation_images/step_500_val_cross_0.mp4 +0 -0
- validation_images/step_500_val_recon_0.mp4 +2 -2
- validation_images/step_500_val_source_0.mp4 +2 -2
.gitattributes
CHANGED
@@ -98,3 +98,5 @@ validation_images/step_9500_val_source_0.mp4 filter=lfs diff=lfs merge=lfs -text
|
|
98 |
validation_images/step_17500_val_source_0.mp4 filter=lfs diff=lfs merge=lfs -text
|
99 |
validation_images/step_18500_val_source_0.mp4 filter=lfs diff=lfs merge=lfs -text
|
100 |
validation_images/step_1_val_cross_0.mp4 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
98 |
validation_images/step_17500_val_source_0.mp4 filter=lfs diff=lfs merge=lfs -text
|
99 |
validation_images/step_18500_val_source_0.mp4 filter=lfs diff=lfs merge=lfs -text
|
100 |
validation_images/step_1_val_cross_0.mp4 filter=lfs diff=lfs merge=lfs -text
|
101 |
+
validation_images/step_1000_val_cross_0.mp4 filter=lfs diff=lfs merge=lfs -text
|
102 |
+
validation_images/step_500_val_cross_0.mp4 filter=lfs diff=lfs merge=lfs -text
|
checkpoint-1000/motion_encoder/config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"MotionEncoder"
|
4 |
+
],
|
5 |
+
"model_type": "motion_encoder",
|
6 |
+
"motion_num_frames": 25,
|
7 |
+
"torch_dtype": "bfloat16",
|
8 |
+
"transformers_version": "4.47.1",
|
9 |
+
"vit_model_name": "google/vivit-b-16x2"
|
10 |
+
}
|
checkpoint-1000/motion_encoder/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f0196ed4a201cc36c1f9604318b9acdf774c3a0e9a526e4068b7a88ea5622df
|
3 |
+
size 179679088
|
checkpoint-1000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48a402afc3675cd076a83a9a3cc0dca78ec584d0481b05b90836da09bb3ddfc6
|
3 |
+
size 566968174
|
checkpoint-1000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e68e3048029548bea9cd453742a6ba5a815a8c590dc421ae98b95fb4628c724
|
3 |
+
size 14408
|
checkpoint-1000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1ef945fb67548939f1340070803ddc6f91925dd6d43f8c15ba25d113f03c5ed
|
3 |
+
size 1000
|
checkpoint-1000/unet/config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "MAMUNetSpatioTemporalConditionModel",
|
3 |
+
"_diffusers_version": "0.32.1",
|
4 |
+
"_name_or_path": "/home/suraj_huggingface_co/.cache/huggingface/hub/models--diffusers--svd-xt/snapshots/9703ded20c957c340781ee710b75660826deb487/unet",
|
5 |
+
"addition_time_embed_dim": 256,
|
6 |
+
"block_out_channels": [
|
7 |
+
320,
|
8 |
+
640,
|
9 |
+
1280,
|
10 |
+
1280
|
11 |
+
],
|
12 |
+
"cross_attention_dim": 1024,
|
13 |
+
"down_block_types": [
|
14 |
+
"MAMCrossAttnDownBlockSpatioTemporal",
|
15 |
+
"MAMCrossAttnDownBlockSpatioTemporal",
|
16 |
+
"MAMCrossAttnDownBlockSpatioTemporal",
|
17 |
+
"MAMDownBlockSpatioTemporal"
|
18 |
+
],
|
19 |
+
"in_channels": 8,
|
20 |
+
"layers_per_block": 2,
|
21 |
+
"num_attention_heads": [
|
22 |
+
5,
|
23 |
+
10,
|
24 |
+
20,
|
25 |
+
20
|
26 |
+
],
|
27 |
+
"num_frames": 25,
|
28 |
+
"out_channels": 4,
|
29 |
+
"projection_class_embeddings_input_dim": 768,
|
30 |
+
"sample_size": 96,
|
31 |
+
"transformer_layers_per_block": 1,
|
32 |
+
"up_block_types": [
|
33 |
+
"UpBlockSpatioTemporal",
|
34 |
+
"CrossAttnUpBlockSpatioTemporal",
|
35 |
+
"CrossAttnUpBlockSpatioTemporal",
|
36 |
+
"CrossAttnUpBlockSpatioTemporal"
|
37 |
+
]
|
38 |
+
}
|
checkpoint-1000/unet/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06e846cbb38081ac232011d823389dba3bb2ae2f3bbdfcf51affd3978cbc4e69
|
3 |
+
size 5156265940
|
checkpoint-500/motion_encoder/config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"MotionEncoder"
|
4 |
+
],
|
5 |
+
"model_type": "motion_encoder",
|
6 |
+
"motion_num_frames": 25,
|
7 |
+
"torch_dtype": "bfloat16",
|
8 |
+
"transformers_version": "4.47.1",
|
9 |
+
"vit_model_name": "google/vivit-b-16x2"
|
10 |
+
}
|
checkpoint-500/motion_encoder/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1de23f6ba107e07dcf62f059b050773babc5432f674e667860900c0bbea167c
|
3 |
+
size 179679088
|
checkpoint-500/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0fc6c35163f3a37faf4f29f7547988b585645e4bef2653380f3857e45f407d3
|
3 |
+
size 566968174
|
checkpoint-500/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5170399267664320416714d10028896cf2d6de5c404be1822d85fc2a5502def7
|
3 |
+
size 14408
|
checkpoint-500/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cf34ac8dd2addc454aeb1ee4eaba3267c2841857e117be40ac2ed02cf581c9c
|
3 |
+
size 1000
|
checkpoint-500/unet/config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "MAMUNetSpatioTemporalConditionModel",
|
3 |
+
"_diffusers_version": "0.32.1",
|
4 |
+
"_name_or_path": "/home/suraj_huggingface_co/.cache/huggingface/hub/models--diffusers--svd-xt/snapshots/9703ded20c957c340781ee710b75660826deb487/unet",
|
5 |
+
"addition_time_embed_dim": 256,
|
6 |
+
"block_out_channels": [
|
7 |
+
320,
|
8 |
+
640,
|
9 |
+
1280,
|
10 |
+
1280
|
11 |
+
],
|
12 |
+
"cross_attention_dim": 1024,
|
13 |
+
"down_block_types": [
|
14 |
+
"MAMCrossAttnDownBlockSpatioTemporal",
|
15 |
+
"MAMCrossAttnDownBlockSpatioTemporal",
|
16 |
+
"MAMCrossAttnDownBlockSpatioTemporal",
|
17 |
+
"MAMDownBlockSpatioTemporal"
|
18 |
+
],
|
19 |
+
"in_channels": 8,
|
20 |
+
"layers_per_block": 2,
|
21 |
+
"num_attention_heads": [
|
22 |
+
5,
|
23 |
+
10,
|
24 |
+
20,
|
25 |
+
20
|
26 |
+
],
|
27 |
+
"num_frames": 25,
|
28 |
+
"out_channels": 4,
|
29 |
+
"projection_class_embeddings_input_dim": 768,
|
30 |
+
"sample_size": 96,
|
31 |
+
"transformer_layers_per_block": 1,
|
32 |
+
"up_block_types": [
|
33 |
+
"UpBlockSpatioTemporal",
|
34 |
+
"CrossAttnUpBlockSpatioTemporal",
|
35 |
+
"CrossAttnUpBlockSpatioTemporal",
|
36 |
+
"CrossAttnUpBlockSpatioTemporal"
|
37 |
+
]
|
38 |
+
}
|
checkpoint-500/unet/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82ec21609a3d5e4dc9e6b4ebdc056a8758383e03ea393ec17df249ef22025871
|
3 |
+
size 5156265940
|
diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06e846cbb38081ac232011d823389dba3bb2ae2f3bbdfcf51affd3978cbc4e69
|
3 |
+
size 5156265940
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 179679088
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f0196ed4a201cc36c1f9604318b9acdf774c3a0e9a526e4068b7a88ea5622df
|
3 |
size 179679088
|
validation_images/step_1000_val_cross_0.mp4
CHANGED
Binary files a/validation_images/step_1000_val_cross_0.mp4 and b/validation_images/step_1000_val_cross_0.mp4 differ
|
|
validation_images/step_1000_val_recon_0.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b7d629f8186315d1cda830513bc2c00bd72e4b71ea9f2c4781d59b5be5d1759
|
3 |
+
size 98920
|
validation_images/step_1000_val_source_0.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b67b28e733eb00c1f8ff61632633264e092fca3febd6ad0a13cb0d8086a5261c
|
3 |
+
size 118765
|
validation_images/step_1_val_cross_0.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c264d5f4c7781a16f29d5aa81b213311f0d3665f353ff3aef3a661edfb58a66d
|
3 |
+
size 512781
|
validation_images/step_1_val_recon_0.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8b6b82995f5ae50a6c4058736b698188399406a03940e23bfc735c5501e7d7c
|
3 |
+
size 207469
|
validation_images/step_1_val_source_0.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f0bebd663535aaf7fd1abc93f1abe7ba046d5f9051f8ae069a688f7452e84ab
|
3 |
+
size 124005
|
validation_images/step_500_val_cross_0.mp4
CHANGED
Binary files a/validation_images/step_500_val_cross_0.mp4 and b/validation_images/step_500_val_cross_0.mp4 differ
|
|
validation_images/step_500_val_recon_0.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:723aa176f7fb4f51da06ee6ea2a48686fcc587f78ae35555a6d693f7b332a11f
|
3 |
+
size 106499
|
validation_images/step_500_val_source_0.mp4
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b67b28e733eb00c1f8ff61632633264e092fca3febd6ad0a13cb0d8086a5261c
|
3 |
+
size 118765
|