cocktailpeanut committed on
Commit
cabc97a
1 Parent(s): 9db1345
app.py CHANGED
@@ -202,7 +202,9 @@ pipeline = XoraVideoPipeline(
202
  tokenizer=tokenizer,
203
  scheduler=scheduler,
204
  vae=vae,
205
- ).to(device)
 
 
206
 
207
 
208
  def generate_video_from_text(
 
202
  tokenizer=tokenizer,
203
  scheduler=scheduler,
204
  vae=vae,
205
+ )
206
+ #).to(device)
207
+ pipeline.enable_model_cpu_offload()
208
 
209
 
210
  def generate_video_from_text(
requirements.txt CHANGED
@@ -6,7 +6,7 @@ sentencepiece>=0.1.96
6
  accelerate
7
  einops
8
  matplotlib
9
- opencv-python
10
  beautifulsoup4
11
  ftfy
12
  gradio
 
6
  accelerate
7
  einops
8
  matplotlib
9
+ opencv-python==4.5.5
10
  beautifulsoup4
11
  ftfy
12
  gradio
xora/models/autoencoders/vae_encode.py CHANGED
@@ -127,6 +127,7 @@ def _run_decoder(
127
  *_, fl, hl, wl = latents.shape
128
  temporal_scale, spatial_scale, _ = get_vae_size_scale_factor(vae)
129
  latents = latents.to(vae.dtype)
 
130
  image = vae.decode(
131
  un_normalize_latents(latents, vae, vae_per_channel_normalize),
132
  return_dict=False,
 
127
  *_, fl, hl, wl = latents.shape
128
  temporal_scale, spatial_scale, _ = get_vae_size_scale_factor(vae)
129
  latents = latents.to(vae.dtype)
130
+ vae = vae.to(latents.device, vae.dtype)
131
  image = vae.decode(
132
  un_normalize_latents(latents, vae, vae_per_channel_normalize),
133
  return_dict=False,