yevvonlim committed on
Commit
9d68c5d
·
verified ·
1 Parent(s): 43d2365

End of training

Browse files
.gitattributes CHANGED
@@ -98,3 +98,5 @@ validation_images/step_9500_val_source_0.mp4 filter=lfs diff=lfs merge=lfs -text
98
  validation_images/step_17500_val_source_0.mp4 filter=lfs diff=lfs merge=lfs -text
99
  validation_images/step_18500_val_source_0.mp4 filter=lfs diff=lfs merge=lfs -text
100
  validation_images/step_1_val_cross_0.mp4 filter=lfs diff=lfs merge=lfs -text
 
 
 
98
  validation_images/step_17500_val_source_0.mp4 filter=lfs diff=lfs merge=lfs -text
99
  validation_images/step_18500_val_source_0.mp4 filter=lfs diff=lfs merge=lfs -text
100
  validation_images/step_1_val_cross_0.mp4 filter=lfs diff=lfs merge=lfs -text
101
+ validation_images/step_1000_val_cross_0.mp4 filter=lfs diff=lfs merge=lfs -text
102
+ validation_images/step_500_val_cross_0.mp4 filter=lfs diff=lfs merge=lfs -text
checkpoint-1000/motion_encoder/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "MotionEncoder"
4
+ ],
5
+ "model_type": "motion_encoder",
6
+ "motion_num_frames": 25,
7
+ "torch_dtype": "bfloat16",
8
+ "transformers_version": "4.47.1",
9
+ "vit_model_name": "google/vivit-b-16x2"
10
+ }
checkpoint-1000/motion_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f0196ed4a201cc36c1f9604318b9acdf774c3a0e9a526e4068b7a88ea5622df
3
+ size 179679088
checkpoint-1000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48a402afc3675cd076a83a9a3cc0dca78ec584d0481b05b90836da09bb3ddfc6
3
+ size 566968174
checkpoint-1000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e68e3048029548bea9cd453742a6ba5a815a8c590dc421ae98b95fb4628c724
3
+ size 14408
checkpoint-1000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1ef945fb67548939f1340070803ddc6f91925dd6d43f8c15ba25d113f03c5ed
3
+ size 1000
checkpoint-1000/unet/config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "MAMUNetSpatioTemporalConditionModel",
3
+ "_diffusers_version": "0.32.1",
4
+ "_name_or_path": "/home/suraj_huggingface_co/.cache/huggingface/hub/models--diffusers--svd-xt/snapshots/9703ded20c957c340781ee710b75660826deb487/unet",
5
+ "addition_time_embed_dim": 256,
6
+ "block_out_channels": [
7
+ 320,
8
+ 640,
9
+ 1280,
10
+ 1280
11
+ ],
12
+ "cross_attention_dim": 1024,
13
+ "down_block_types": [
14
+ "MAMCrossAttnDownBlockSpatioTemporal",
15
+ "MAMCrossAttnDownBlockSpatioTemporal",
16
+ "MAMCrossAttnDownBlockSpatioTemporal",
17
+ "MAMDownBlockSpatioTemporal"
18
+ ],
19
+ "in_channels": 8,
20
+ "layers_per_block": 2,
21
+ "num_attention_heads": [
22
+ 5,
23
+ 10,
24
+ 20,
25
+ 20
26
+ ],
27
+ "num_frames": 25,
28
+ "out_channels": 4,
29
+ "projection_class_embeddings_input_dim": 768,
30
+ "sample_size": 96,
31
+ "transformer_layers_per_block": 1,
32
+ "up_block_types": [
33
+ "UpBlockSpatioTemporal",
34
+ "CrossAttnUpBlockSpatioTemporal",
35
+ "CrossAttnUpBlockSpatioTemporal",
36
+ "CrossAttnUpBlockSpatioTemporal"
37
+ ]
38
+ }
checkpoint-1000/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06e846cbb38081ac232011d823389dba3bb2ae2f3bbdfcf51affd3978cbc4e69
3
+ size 5156265940
checkpoint-500/motion_encoder/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "MotionEncoder"
4
+ ],
5
+ "model_type": "motion_encoder",
6
+ "motion_num_frames": 25,
7
+ "torch_dtype": "bfloat16",
8
+ "transformers_version": "4.47.1",
9
+ "vit_model_name": "google/vivit-b-16x2"
10
+ }
checkpoint-500/motion_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1de23f6ba107e07dcf62f059b050773babc5432f674e667860900c0bbea167c
3
+ size 179679088
checkpoint-500/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0fc6c35163f3a37faf4f29f7547988b585645e4bef2653380f3857e45f407d3
3
+ size 566968174
checkpoint-500/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5170399267664320416714d10028896cf2d6de5c404be1822d85fc2a5502def7
3
+ size 14408
checkpoint-500/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cf34ac8dd2addc454aeb1ee4eaba3267c2841857e117be40ac2ed02cf581c9c
3
+ size 1000
checkpoint-500/unet/config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "MAMUNetSpatioTemporalConditionModel",
3
+ "_diffusers_version": "0.32.1",
4
+ "_name_or_path": "/home/suraj_huggingface_co/.cache/huggingface/hub/models--diffusers--svd-xt/snapshots/9703ded20c957c340781ee710b75660826deb487/unet",
5
+ "addition_time_embed_dim": 256,
6
+ "block_out_channels": [
7
+ 320,
8
+ 640,
9
+ 1280,
10
+ 1280
11
+ ],
12
+ "cross_attention_dim": 1024,
13
+ "down_block_types": [
14
+ "MAMCrossAttnDownBlockSpatioTemporal",
15
+ "MAMCrossAttnDownBlockSpatioTemporal",
16
+ "MAMCrossAttnDownBlockSpatioTemporal",
17
+ "MAMDownBlockSpatioTemporal"
18
+ ],
19
+ "in_channels": 8,
20
+ "layers_per_block": 2,
21
+ "num_attention_heads": [
22
+ 5,
23
+ 10,
24
+ 20,
25
+ 20
26
+ ],
27
+ "num_frames": 25,
28
+ "out_channels": 4,
29
+ "projection_class_embeddings_input_dim": 768,
30
+ "sample_size": 96,
31
+ "transformer_layers_per_block": 1,
32
+ "up_block_types": [
33
+ "UpBlockSpatioTemporal",
34
+ "CrossAttnUpBlockSpatioTemporal",
35
+ "CrossAttnUpBlockSpatioTemporal",
36
+ "CrossAttnUpBlockSpatioTemporal"
37
+ ]
38
+ }
checkpoint-500/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82ec21609a3d5e4dc9e6b4ebdc056a8758383e03ea393ec17df249ef22025871
3
+ size 5156265940
diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d361bcb77834fc65703901d932485693ca6f2575cc88dc6de478e42f1592ab1
3
- size 7445309980
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06e846cbb38081ac232011d823389dba3bb2ae2f3bbdfcf51affd3978cbc4e69
3
+ size 5156265940
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8057ff9bf263f2c51ca5e1c56aa30fae0d4a7e9a3498bce4a9436a005cce96b2
3
  size 179679088
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f0196ed4a201cc36c1f9604318b9acdf774c3a0e9a526e4068b7a88ea5622df
3
  size 179679088
validation_images/step_1000_val_cross_0.mp4 CHANGED
Binary files a/validation_images/step_1000_val_cross_0.mp4 and b/validation_images/step_1000_val_cross_0.mp4 differ
 
validation_images/step_1000_val_recon_0.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e24fe42f15b2462a85c485e099155c871fec001e0538442b74b82b7f7e7ba0f
3
- size 44191
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b7d629f8186315d1cda830513bc2c00bd72e4b71ea9f2c4781d59b5be5d1759
3
+ size 98920
validation_images/step_1000_val_source_0.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2480d19019e586212350459ba52620ea2216c329e8927c951f835e4d81f42365
3
- size 44943
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b67b28e733eb00c1f8ff61632633264e092fca3febd6ad0a13cb0d8086a5261c
3
+ size 118765
validation_images/step_1_val_cross_0.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d072cec9412389d8f9af33cc286e2fc6016b337584f6f0e2888e4390936d30ad
3
- size 202814
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c264d5f4c7781a16f29d5aa81b213311f0d3665f353ff3aef3a661edfb58a66d
3
+ size 512781
validation_images/step_1_val_recon_0.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87af28ff6573352d98b860ebf714c2d99195381b7f776e34de99c1fdcdd1e388
3
- size 104103
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8b6b82995f5ae50a6c4058736b698188399406a03940e23bfc735c5501e7d7c
3
+ size 207469
validation_images/step_1_val_source_0.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2480d19019e586212350459ba52620ea2216c329e8927c951f835e4d81f42365
3
- size 44943
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f0bebd663535aaf7fd1abc93f1abe7ba046d5f9051f8ae069a688f7452e84ab
3
+ size 124005
validation_images/step_500_val_cross_0.mp4 CHANGED
Binary files a/validation_images/step_500_val_cross_0.mp4 and b/validation_images/step_500_val_cross_0.mp4 differ
 
validation_images/step_500_val_recon_0.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:756f02604b6be17f84d421ef338fde80a48a7554b284818f577feb4f9856b88f
3
- size 41602
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:723aa176f7fb4f51da06ee6ea2a48686fcc587f78ae35555a6d693f7b332a11f
3
+ size 106499
validation_images/step_500_val_source_0.mp4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a31e75ec31d79711c87ec48a40e418b973c91b8638ac5a85c80584066b7cf73
3
- size 43886
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b67b28e733eb00c1f8ff61632633264e092fca3febd6ad0a13cb0d8086a5261c
3
+ size 118765