Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
|
@@ -44,6 +44,12 @@ base_model_id = "hunyuanvideo-community/HunyuanVideo"
|
|
| 44 |
|
| 45 |
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
|
| 46 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 47 |
def init_predictor():
|
| 48 |
global pipe
|
| 49 |
text_encoder = LlamaModel.from_pretrained(
|
|
@@ -63,26 +69,21 @@ def init_predictor():
|
|
| 63 |
quantize_(transformer, float8_weight_only(), device="cpu")
|
| 64 |
transformer.to("cpu")
|
| 65 |
torch.cuda.empty_cache()
|
| 66 |
-
offload_config=OffloadConfig(
|
| 67 |
-
high_cpu_memory=True,
|
| 68 |
-
parameters_level=True,
|
| 69 |
-
compiler_transformer=False,
|
| 70 |
-
)
|
| 71 |
pipe = SkyreelsVideoPipeline.from_pretrained(
|
| 72 |
base_model_id,
|
| 73 |
transformer=transformer,
|
| 74 |
text_encoder=text_encoder,
|
| 75 |
torch_dtype=torch.bfloat16,
|
| 76 |
).to("cpu")
|
| 77 |
-
Offload.offload(
|
| 78 |
-
pipeline=pipe,
|
| 79 |
-
config=offload_config,
|
| 80 |
-
)
|
| 81 |
|
| 82 |
negative_prompt = "Aerial view, aerial view, overexposed, low quality, deformation, a poor composition, bad hands, bad teeth, bad eyes, bad limbs, distortion"
|
| 83 |
|
| 84 |
@spaces.GPU(duration=60)
|
| 85 |
def generate(segment, image, prompt, size, guidance_scale, num_inference_steps, frames, seed, progress=gr.Progress(track_tqdm=True) ):
|
|
|
|
|
|
|
|
|
|
|
|
|
| 86 |
random.seed(time.time())
|
| 87 |
seed = int(random.randrange(4294967294))
|
| 88 |
if segment==1:
|
|
|
|
| 44 |
|
| 45 |
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
|
| 46 |
|
| 47 |
+
offload_config=OffloadConfig(
|
| 48 |
+
high_cpu_memory=True,
|
| 49 |
+
parameters_level=True,
|
| 50 |
+
compiler_transformer=False,
|
| 51 |
+
)
|
| 52 |
+
|
| 53 |
def init_predictor():
|
| 54 |
global pipe
|
| 55 |
text_encoder = LlamaModel.from_pretrained(
|
|
|
|
| 69 |
quantize_(transformer, float8_weight_only(), device="cpu")
|
| 70 |
transformer.to("cpu")
|
| 71 |
torch.cuda.empty_cache()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 72 |
pipe = SkyreelsVideoPipeline.from_pretrained(
|
| 73 |
base_model_id,
|
| 74 |
transformer=transformer,
|
| 75 |
text_encoder=text_encoder,
|
| 76 |
torch_dtype=torch.bfloat16,
|
| 77 |
).to("cpu")
|
|
|
|
|
|
|
|
|
|
|
|
|
| 78 |
|
| 79 |
negative_prompt = "Aerial view, aerial view, overexposed, low quality, deformation, a poor composition, bad hands, bad teeth, bad eyes, bad limbs, distortion"
|
| 80 |
|
| 81 |
@spaces.GPU(duration=60)
|
| 82 |
def generate(segment, image, prompt, size, guidance_scale, num_inference_steps, frames, seed, progress=gr.Progress(track_tqdm=True) ):
|
| 83 |
+
Offload.offload(
|
| 84 |
+
pipeline=pipe,
|
| 85 |
+
config=offload_config,
|
| 86 |
+
)
|
| 87 |
random.seed(time.time())
|
| 88 |
seed = int(random.randrange(4294967294))
|
| 89 |
if segment==1:
|