Spaces:
Running
on
Zero
Running
on
Zero
upload checkpoints
Browse files- results/car_turn/cached_latents/cached_0.pt +3 -0
- results/car_turn/checkpoint/motion_embed.pt +3 -0
- results/car_turn/config.yaml +61 -0
- results/car_turn/source.mp4 +0 -0
- results/dolly_zoom/cached_latents/cached_0.pt +3 -0
- results/dolly_zoom/checkpoint/motion_embed.pt +3 -0
- results/dolly_zoom/config.yaml +61 -0
- results/dolly_zoom/source.mp4 +0 -0
- results/orbit_shot/cached_latents/cached_0.pt +3 -0
- results/orbit_shot/checkpoint/motion_embed.pt +3 -0
- results/orbit_shot/config.yaml +61 -0
- results/orbit_shot/source.mp4 +0 -0
- results/pan_up/cached_latents/cached_0.pt +3 -0
- results/pan_up/checkpoint/motion_embed.pt +3 -0
- results/pan_up/config.yaml +61 -0
- results/pan_up/source.mp4 +0 -0
- results/santa_dance/cached_latents/cached_0.pt +3 -0
- results/santa_dance/checkpoint/motion_embed.pt +3 -0
- results/santa_dance/config.yaml +61 -0
- results/santa_dance/source.mp4 +0 -0
- results/train_ride/cached_latents/cached_0.pt +3 -0
- results/train_ride/checkpoint/motion_embed.pt +3 -0
- results/train_ride/config.yaml +61 -0
- results/train_ride/source.mp4 +0 -0
- results/walk/checkpoint/motion_embed.pt +3 -0
- results/walk/config.yaml +61 -0
- results/walk/source.mp4 +0 -0
results/car_turn/cached_latents/cached_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8df8248bd60072f838fe9ecb16aa483fd3d84a459f83de0f7155f0f178df361f
|
3 |
+
size 54192856
|
results/car_turn/checkpoint/motion_embed.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0221e70227a25ae58f1767fb37d48b4721240aa962aad85f06eff95dbed4d72c
|
3 |
+
size 295737352
|
results/car_turn/config.yaml
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model:
|
2 |
+
type: unet
|
3 |
+
pretrained_model_path: cerspense/zeroscope_v2_576w
|
4 |
+
motion_embeddings:
|
5 |
+
combinations:
|
6 |
+
- - down
|
7 |
+
- 1280
|
8 |
+
- - up
|
9 |
+
- 1280
|
10 |
+
unet: videoCrafter2
|
11 |
+
train:
|
12 |
+
output_dir: results/02
|
13 |
+
validation_steps: 2000
|
14 |
+
checkpointing_steps: 50
|
15 |
+
checkpointing_start: 200
|
16 |
+
train_batch_size: 1
|
17 |
+
max_train_steps: 500
|
18 |
+
gradient_accumulation_steps: 1
|
19 |
+
cache_latents: true
|
20 |
+
cached_latent_dir: null
|
21 |
+
logger_type: tensorboard
|
22 |
+
mixed_precision: fp16
|
23 |
+
use_8bit_adam: false
|
24 |
+
resume_from_checkpoint: null
|
25 |
+
resume_step: null
|
26 |
+
dataset:
|
27 |
+
type:
|
28 |
+
- single_video
|
29 |
+
single_video_path: /tmp/gradio/5048253f30b40909d274ab1248fa8a0bf881ea4976ceab7f4957313b7d15be67/hybrid.mp4
|
30 |
+
single_video_prompt: A car turnaround in a city street
|
31 |
+
width: 576
|
32 |
+
height: 320
|
33 |
+
n_sample_frames: 24
|
34 |
+
fps: 8
|
35 |
+
sample_start_idx: 1
|
36 |
+
frame_step: 1
|
37 |
+
use_bucketing: false
|
38 |
+
use_caption: false
|
39 |
+
loss:
|
40 |
+
type: BaseLoss
|
41 |
+
learning_rate: 0.02
|
42 |
+
lr_scheduler: constant
|
43 |
+
lr_warmup_steps: 0
|
44 |
+
noise_init:
|
45 |
+
type: BlendInit
|
46 |
+
noise_prior: 0.5
|
47 |
+
val:
|
48 |
+
prompt:
|
49 |
+
- A skateboard slides along a city lane
|
50 |
+
negative_prompt: ''
|
51 |
+
sample_preview: true
|
52 |
+
width: 576
|
53 |
+
height: 320
|
54 |
+
num_frames: 24
|
55 |
+
num_inference_steps: 30
|
56 |
+
guidance_scale: 12.0
|
57 |
+
seeds:
|
58 |
+
- 0
|
59 |
+
strategy:
|
60 |
+
vSpatial_frameSubtraction: false
|
61 |
+
removeMFromV: false
|
results/car_turn/source.mp4
ADDED
Binary file (560 kB). View file
|
|
results/dolly_zoom/cached_latents/cached_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d20dc41f61c7d58ad6609566e1ed6eac5d0e52bce494e84e2609b114ddd78c4e
|
3 |
+
size 31362776
|
results/dolly_zoom/checkpoint/motion_embed.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:450e0f53ab4872ba2ade2f3bbe7c651464e39a2cfad9336f4de3d9a1cc8028fd
|
3 |
+
size 277714952
|
results/dolly_zoom/config.yaml
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model:
|
2 |
+
type: unet
|
3 |
+
pretrained_model_path: cerspense/zeroscope_v2_576w
|
4 |
+
motion_embeddings:
|
5 |
+
combinations:
|
6 |
+
- - down
|
7 |
+
- 1280
|
8 |
+
- - up
|
9 |
+
- 1280
|
10 |
+
unet: videoCrafter2
|
11 |
+
train:
|
12 |
+
output_dir: results/04
|
13 |
+
validation_steps: 2000
|
14 |
+
checkpointing_steps: 100
|
15 |
+
checkpointing_start: 200
|
16 |
+
train_batch_size: 1
|
17 |
+
max_train_steps: 400
|
18 |
+
gradient_accumulation_steps: 1
|
19 |
+
cache_latents: true
|
20 |
+
cached_latent_dir: null
|
21 |
+
logger_type: tensorboard
|
22 |
+
mixed_precision: fp16
|
23 |
+
use_8bit_adam: false
|
24 |
+
resume_from_checkpoint: null
|
25 |
+
resume_step: null
|
26 |
+
dataset:
|
27 |
+
type:
|
28 |
+
- single_video
|
29 |
+
single_video_path: /tmp/gradio/a31b567c8f08f688bd0a79e5f3f5af57a7967ba4d054e0f4c5b71f192af241e9/dolly_zoom_out.mp4
|
30 |
+
single_video_prompt: A car turnaround in a city street
|
31 |
+
width: 400
|
32 |
+
height: 400
|
33 |
+
n_sample_frames: 16
|
34 |
+
fps: 8
|
35 |
+
sample_start_idx: 1
|
36 |
+
frame_step: 1
|
37 |
+
use_bucketing: false
|
38 |
+
use_caption: false
|
39 |
+
loss:
|
40 |
+
type: BaseLoss
|
41 |
+
learning_rate: 0.02
|
42 |
+
lr_scheduler: constant
|
43 |
+
lr_warmup_steps: 0
|
44 |
+
noise_init:
|
45 |
+
type: BlendInit
|
46 |
+
noise_prior: 0.5
|
47 |
+
val:
|
48 |
+
prompt:
|
49 |
+
- A skateboard slides along a city lane
|
50 |
+
negative_prompt: ''
|
51 |
+
sample_preview: true
|
52 |
+
width: 400
|
53 |
+
height: 400
|
54 |
+
num_frames: 16
|
55 |
+
num_inference_steps: 30
|
56 |
+
guidance_scale: 12.0
|
57 |
+
seeds:
|
58 |
+
- 0
|
59 |
+
strategy:
|
60 |
+
vSpatial_frameSubtraction: false
|
61 |
+
removeMFromV: false
|
results/dolly_zoom/source.mp4
ADDED
Binary file (38.5 kB). View file
|
|
results/orbit_shot/cached_latents/cached_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20561bf4fc68685f5e1339a9b4c9cc749266a85984ba2284ca309cfc769803b8
|
3 |
+
size 46164696
|
results/orbit_shot/checkpoint/motion_embed.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3006dbf459be771c60d6d4334f2dac63bd845905e61bddfbd98186bf5f2565f
|
3 |
+
size 394041352
|
results/orbit_shot/config.yaml
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model:
|
2 |
+
type: unet
|
3 |
+
pretrained_model_path: cerspense/zeroscope_v2_576w
|
4 |
+
motion_embeddings:
|
5 |
+
combinations:
|
6 |
+
- - down
|
7 |
+
- 1280
|
8 |
+
- - up
|
9 |
+
- 1280
|
10 |
+
unet: videoCrafter2
|
11 |
+
train:
|
12 |
+
output_dir: results/07
|
13 |
+
validation_steps: 2000
|
14 |
+
checkpointing_steps: 100
|
15 |
+
checkpointing_start: 200
|
16 |
+
train_batch_size: 1
|
17 |
+
max_train_steps: 500
|
18 |
+
gradient_accumulation_steps: 1
|
19 |
+
cache_latents: true
|
20 |
+
cached_latent_dir: null
|
21 |
+
logger_type: tensorboard
|
22 |
+
mixed_precision: fp16
|
23 |
+
use_8bit_adam: false
|
24 |
+
resume_from_checkpoint: null
|
25 |
+
resume_step: null
|
26 |
+
dataset:
|
27 |
+
type:
|
28 |
+
- single_video
|
29 |
+
single_video_path: /tmp/gradio/5353948117dc7b8683fe28682a334e8076ba7e9ec45763cc8860b1758fb29b94/orbit_shot.mp4
|
30 |
+
single_video_prompt: A car turnaround in a city street
|
31 |
+
width: 640
|
32 |
+
height: 368
|
33 |
+
n_sample_frames: 16
|
34 |
+
fps: 8
|
35 |
+
sample_start_idx: 1
|
36 |
+
frame_step: 1
|
37 |
+
use_bucketing: false
|
38 |
+
use_caption: false
|
39 |
+
loss:
|
40 |
+
type: BaseLoss
|
41 |
+
learning_rate: 0.02
|
42 |
+
lr_scheduler: constant
|
43 |
+
lr_warmup_steps: 0
|
44 |
+
noise_init:
|
45 |
+
type: BlendInit
|
46 |
+
noise_prior: 0.5
|
47 |
+
val:
|
48 |
+
prompt:
|
49 |
+
- A skateboard slides along a city lane
|
50 |
+
negative_prompt: ''
|
51 |
+
sample_preview: true
|
52 |
+
width: 640
|
53 |
+
height: 368
|
54 |
+
num_frames: 16
|
55 |
+
num_inference_steps: 30
|
56 |
+
guidance_scale: 12.0
|
57 |
+
seeds:
|
58 |
+
- 0
|
59 |
+
strategy:
|
60 |
+
vSpatial_frameSubtraction: false
|
61 |
+
removeMFromV: false
|
results/orbit_shot/source.mp4
ADDED
Binary file (383 kB). View file
|
|
results/pan_up/cached_latents/cached_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c02007a490e09f7f835e48a078e46b5204df7f3eb5ccfbe8000b4867c094ecb
|
3 |
+
size 36129496
|
results/pan_up/checkpoint/motion_embed.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf9b7c679cc3c028f52a688f983de3a9e74a81e86f33423eceaf99189ae67035
|
3 |
+
size 295737352
|
results/pan_up/config.yaml
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model:
|
2 |
+
type: unet
|
3 |
+
pretrained_model_path: cerspense/zeroscope_v2_576w
|
4 |
+
motion_embeddings:
|
5 |
+
combinations:
|
6 |
+
- - down
|
7 |
+
- 1280
|
8 |
+
- - up
|
9 |
+
- 1280
|
10 |
+
unet: videoCrafter2
|
11 |
+
train:
|
12 |
+
output_dir: results/03
|
13 |
+
validation_steps: 2000
|
14 |
+
checkpointing_steps: 50
|
15 |
+
checkpointing_start: 200
|
16 |
+
train_batch_size: 1
|
17 |
+
max_train_steps: 500
|
18 |
+
gradient_accumulation_steps: 1
|
19 |
+
cache_latents: true
|
20 |
+
cached_latent_dir: null
|
21 |
+
logger_type: tensorboard
|
22 |
+
mixed_precision: fp16
|
23 |
+
use_8bit_adam: false
|
24 |
+
resume_from_checkpoint: null
|
25 |
+
resume_step: null
|
26 |
+
dataset:
|
27 |
+
type:
|
28 |
+
- single_video
|
29 |
+
single_video_path: /tmp/gradio/f794a1692f7472c03b0ad36870908f81af7ce5ee7cc61a73ccda287da11f5dfa/camera.mp4
|
30 |
+
single_video_prompt: A car turnaround in a city street
|
31 |
+
width: 576
|
32 |
+
height: 320
|
33 |
+
n_sample_frames: 24
|
34 |
+
fps: 8
|
35 |
+
sample_start_idx: 1
|
36 |
+
frame_step: 1
|
37 |
+
use_bucketing: false
|
38 |
+
use_caption: false
|
39 |
+
loss:
|
40 |
+
type: BaseLoss
|
41 |
+
learning_rate: 0.02
|
42 |
+
lr_scheduler: constant
|
43 |
+
lr_warmup_steps: 0
|
44 |
+
noise_init:
|
45 |
+
type: BlendInit
|
46 |
+
noise_prior: 0.5
|
47 |
+
val:
|
48 |
+
prompt:
|
49 |
+
- A skateboard slides along a city lane
|
50 |
+
negative_prompt: ''
|
51 |
+
sample_preview: true
|
52 |
+
width: 576
|
53 |
+
height: 320
|
54 |
+
num_frames: 24
|
55 |
+
num_inference_steps: 30
|
56 |
+
guidance_scale: 12.0
|
57 |
+
seeds:
|
58 |
+
- 0
|
59 |
+
strategy:
|
60 |
+
vSpatial_frameSubtraction: false
|
61 |
+
removeMFromV: false
|
results/pan_up/source.mp4
ADDED
Binary file (359 kB). View file
|
|
results/santa_dance/cached_latents/cached_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b4347b062704cb98a54d53ac42d63c01e5e37f2b96bdc38a6726aa4f35c1c47
|
3 |
+
size 46164696
|
results/santa_dance/checkpoint/motion_embed.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d499bd32fdfd0b07e61f5c52e4a76ad43fb7c849f245f5a1bb3e33f765fba6aa
|
3 |
+
size 394041352
|
results/santa_dance/config.yaml
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model:
|
2 |
+
type: unet
|
3 |
+
pretrained_model_path: cerspense/zeroscope_v2_576w
|
4 |
+
motion_embeddings:
|
5 |
+
combinations:
|
6 |
+
- - down
|
7 |
+
- 1280
|
8 |
+
- - up
|
9 |
+
- 1280
|
10 |
+
unet: videoCrafter2
|
11 |
+
train:
|
12 |
+
output_dir: results/07
|
13 |
+
validation_steps: 2000
|
14 |
+
checkpointing_steps: 100
|
15 |
+
checkpointing_start: 200
|
16 |
+
train_batch_size: 1
|
17 |
+
max_train_steps: 500
|
18 |
+
gradient_accumulation_steps: 1
|
19 |
+
cache_latents: true
|
20 |
+
cached_latent_dir: null
|
21 |
+
logger_type: tensorboard
|
22 |
+
mixed_precision: fp16
|
23 |
+
use_8bit_adam: false
|
24 |
+
resume_from_checkpoint: null
|
25 |
+
resume_step: null
|
26 |
+
dataset:
|
27 |
+
type:
|
28 |
+
- single_video
|
29 |
+
single_video_path: /tmp/gradio/e9c3bf4f837c93c3246204098c8139985534a94dfef880786ca6fd89c9ff89d1/santa_dance.mp4
|
30 |
+
single_video_prompt: A car turnaround in a city street
|
31 |
+
width: 640
|
32 |
+
height: 368
|
33 |
+
n_sample_frames: 16
|
34 |
+
fps: 8
|
35 |
+
sample_start_idx: 1
|
36 |
+
frame_step: 1
|
37 |
+
use_bucketing: false
|
38 |
+
use_caption: false
|
39 |
+
loss:
|
40 |
+
type: BaseLoss
|
41 |
+
learning_rate: 0.02
|
42 |
+
lr_scheduler: constant
|
43 |
+
lr_warmup_steps: 0
|
44 |
+
noise_init:
|
45 |
+
type: BlendInit
|
46 |
+
noise_prior: 0.5
|
47 |
+
val:
|
48 |
+
prompt:
|
49 |
+
- A skateboard slides along a city lane
|
50 |
+
negative_prompt: ''
|
51 |
+
sample_preview: true
|
52 |
+
width: 640
|
53 |
+
height: 368
|
54 |
+
num_frames: 16
|
55 |
+
num_inference_steps: 30
|
56 |
+
guidance_scale: 12.0
|
57 |
+
seeds:
|
58 |
+
- 0
|
59 |
+
strategy:
|
60 |
+
vSpatial_frameSubtraction: false
|
61 |
+
removeMFromV: false
|
results/santa_dance/source.mp4
ADDED
Binary file (122 kB). View file
|
|
results/train_ride/cached_latents/cached_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52600e72a6e4f5dbfaa02dddfafd68744b59d209398c0b8964ffa797036b8db7
|
3 |
+
size 32115416
|
results/train_ride/checkpoint/motion_embed.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec2ad3186c036c32f25b07c3c978c91a75872b33145c85b1e26a618eec825988
|
3 |
+
size 262969352
|
results/train_ride/config.yaml
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model:
|
2 |
+
type: unet
|
3 |
+
pretrained_model_path: cerspense/zeroscope_v2_576w
|
4 |
+
motion_embeddings:
|
5 |
+
combinations:
|
6 |
+
- - down
|
7 |
+
- 1280
|
8 |
+
- - up
|
9 |
+
- 1280
|
10 |
+
unet: videoCrafter2
|
11 |
+
train:
|
12 |
+
output_dir: results/06
|
13 |
+
validation_steps: 2000
|
14 |
+
checkpointing_steps: 100
|
15 |
+
checkpointing_start: 200
|
16 |
+
train_batch_size: 1
|
17 |
+
max_train_steps: 400
|
18 |
+
gradient_accumulation_steps: 1
|
19 |
+
cache_latents: true
|
20 |
+
cached_latent_dir: null
|
21 |
+
logger_type: tensorboard
|
22 |
+
mixed_precision: fp16
|
23 |
+
use_8bit_adam: false
|
24 |
+
resume_from_checkpoint: null
|
25 |
+
resume_step: null
|
26 |
+
dataset:
|
27 |
+
type:
|
28 |
+
- single_video
|
29 |
+
single_video_path: /tmp/gradio/91dd9b06d279d3b24bced706161c8fe3a911d3e853ed9bb6d92fbd69127e07ac/train_ride.mp4
|
30 |
+
single_video_prompt: A car turnaround in a city street
|
31 |
+
width: 512
|
32 |
+
height: 320
|
33 |
+
n_sample_frames: 16
|
34 |
+
fps: 8
|
35 |
+
sample_start_idx: 1
|
36 |
+
frame_step: 1
|
37 |
+
use_bucketing: false
|
38 |
+
use_caption: false
|
39 |
+
loss:
|
40 |
+
type: BaseLoss
|
41 |
+
learning_rate: 0.02
|
42 |
+
lr_scheduler: constant
|
43 |
+
lr_warmup_steps: 0
|
44 |
+
noise_init:
|
45 |
+
type: BlendInit
|
46 |
+
noise_prior: 0.5
|
47 |
+
val:
|
48 |
+
prompt:
|
49 |
+
- A skateboard slides along a city lane
|
50 |
+
negative_prompt: ''
|
51 |
+
sample_preview: true
|
52 |
+
width: 512
|
53 |
+
height: 320
|
54 |
+
num_frames: 16
|
55 |
+
num_inference_steps: 30
|
56 |
+
guidance_scale: 12.0
|
57 |
+
seeds:
|
58 |
+
- 0
|
59 |
+
strategy:
|
60 |
+
vSpatial_frameSubtraction: false
|
61 |
+
removeMFromV: false
|
results/train_ride/source.mp4
ADDED
Binary file (191 kB). View file
|
|
results/walk/checkpoint/motion_embed.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ed1d3c74c0e870c764550e7b5dea07fa6392e5e9c6851591db24459531f81a4
|
3 |
+
size 262969352
|
results/walk/config.yaml
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model:
|
2 |
+
type: unet
|
3 |
+
pretrained_model_path: cerspense/zeroscope_v2_576w
|
4 |
+
motion_embeddings:
|
5 |
+
combinations:
|
6 |
+
- - down
|
7 |
+
- 1280
|
8 |
+
- - up
|
9 |
+
- 1280
|
10 |
+
unet: videoCrafter2
|
11 |
+
train:
|
12 |
+
output_dir: results/05
|
13 |
+
validation_steps: 2000
|
14 |
+
checkpointing_steps: 100
|
15 |
+
checkpointing_start: 200
|
16 |
+
train_batch_size: 1
|
17 |
+
max_train_steps: 200
|
18 |
+
gradient_accumulation_steps: 1
|
19 |
+
cache_latents: true
|
20 |
+
cached_latent_dir: null
|
21 |
+
logger_type: tensorboard
|
22 |
+
mixed_precision: fp16
|
23 |
+
use_8bit_adam: false
|
24 |
+
resume_from_checkpoint: null
|
25 |
+
resume_step: null
|
26 |
+
dataset:
|
27 |
+
type:
|
28 |
+
- single_video
|
29 |
+
single_video_path: /tmp/gradio/399a0cb64057460050f4db313c05d150200f8a54bbbd783d56f078e74ee64037/walk.mp4
|
30 |
+
single_video_prompt: A car turnaround in a city street
|
31 |
+
width: 512
|
32 |
+
height: 320
|
33 |
+
n_sample_frames: 16
|
34 |
+
fps: 8
|
35 |
+
sample_start_idx: 1
|
36 |
+
frame_step: 1
|
37 |
+
use_bucketing: false
|
38 |
+
use_caption: false
|
39 |
+
loss:
|
40 |
+
type: BaseLoss
|
41 |
+
learning_rate: 0.02
|
42 |
+
lr_scheduler: constant
|
43 |
+
lr_warmup_steps: 0
|
44 |
+
noise_init:
|
45 |
+
type: BlendInit
|
46 |
+
noise_prior: 0.5
|
47 |
+
val:
|
48 |
+
prompt:
|
49 |
+
- A skateboard slides along a city lane
|
50 |
+
negative_prompt: ''
|
51 |
+
sample_preview: true
|
52 |
+
width: 512
|
53 |
+
height: 320
|
54 |
+
num_frames: 16
|
55 |
+
num_inference_steps: 30
|
56 |
+
guidance_scale: 12.0
|
57 |
+
seeds:
|
58 |
+
- 0
|
59 |
+
strategy:
|
60 |
+
vSpatial_frameSubtraction: false
|
61 |
+
removeMFromV: false
|
results/walk/source.mp4
ADDED
Binary file (131 kB). View file
|
|