Upload handler.py
Browse files
- handler.py +10 -10
handler.py
CHANGED
|
@@ -26,17 +26,17 @@ class EndpointHandler:
|
|
| 26 |
self.pipe.enable_vae_tiling()
|
| 27 |
#self.pipe.transformer.fuse_qkv_projections()
|
| 28 |
#self.pipe.vae.fuse_qkv_projections()
|
| 29 |
-
self.pipe.transformer.to(memory_format=torch.channels_last)
|
| 30 |
-
self.pipe.vae.to(memory_format=torch.channels_last)
|
| 31 |
apply_cache_on_pipe(self.pipe, residual_diff_threshold=0.12)
|
| 32 |
-
self.pipe.transformer = torch.compile(
|
| 33 |
-
    self.pipe.transformer, mode="max-autotune-no-cudagraphs",
|
| 34 |
-
)
|
| 35 |
-
self.pipe.vae = torch.compile(
|
| 36 |
-
    self.pipe.vae, mode="max-autotune-no-cudagraphs",
|
| 37 |
-
)
|
| 38 |
-
|
| 39 |
-
|
| 40 |
|
| 41 |
gc.collect()
|
| 42 |
torch.cuda.empty_cache()
|
|
|
|
| 26 |
self.pipe.enable_vae_tiling()
|
| 27 |
#self.pipe.transformer.fuse_qkv_projections()
|
| 28 |
#self.pipe.vae.fuse_qkv_projections()
|
| 29 |
+
#self.pipe.transformer.to(memory_format=torch.channels_last)
|
| 30 |
+
#self.pipe.vae.to(memory_format=torch.channels_last)
|
| 31 |
apply_cache_on_pipe(self.pipe, residual_diff_threshold=0.12)
|
| 32 |
+
#self.pipe.transformer = torch.compile(
|
| 33 |
+
# self.pipe.transformer, mode="max-autotune-no-cudagraphs",
|
| 34 |
+
#)
|
| 35 |
+
#self.pipe.vae = torch.compile(
|
| 36 |
+
# self.pipe.vae, mode="max-autotune-no-cudagraphs",
|
| 37 |
+
#)
|
| 38 |
+
self.pipe.transformer = autoquant(self.pipe.transformer, error_on_unseen=False)
|
| 39 |
+
self.pipe.vae = autoquant(self.pipe.vae, error_on_unseen=False)
|
| 40 |
|
| 41 |
gc.collect()
|
| 42 |
torch.cuda.empty_cache()
|