English
John6666 committed on
Commit
a5cb0bf
·
verified ·
1 Parent(s): 0880fdf

Upload handler.py

Browse files
Files changed (1) hide show
  1. handler.py +10 -10
handler.py CHANGED
@@ -26,17 +26,17 @@ class EndpointHandler:
26
  self.pipe.enable_vae_tiling()
27
  #self.pipe.transformer.fuse_qkv_projections()
28
  #self.pipe.vae.fuse_qkv_projections()
29
- self.pipe.transformer.to(memory_format=torch.channels_last)
30
- self.pipe.vae.to(memory_format=torch.channels_last)
31
  apply_cache_on_pipe(self.pipe, residual_diff_threshold=0.12)
32
- self.pipe.transformer = torch.compile(
33
- self.pipe.transformer, mode="max-autotune-no-cudagraphs",
34
- )
35
- self.pipe.vae = torch.compile(
36
- self.pipe.vae, mode="max-autotune-no-cudagraphs",
37
- )
38
- #self.pipe.transformer = autoquant(self.pipe.transformer, error_on_unseen=False)
39
- #self.pipe.vae = autoquant(self.pipe.vae, error_on_unseen=False)
40
 
41
  gc.collect()
42
  torch.cuda.empty_cache()
 
26
  self.pipe.enable_vae_tiling()
27
  #self.pipe.transformer.fuse_qkv_projections()
28
  #self.pipe.vae.fuse_qkv_projections()
29
+ #self.pipe.transformer.to(memory_format=torch.channels_last)
30
+ #self.pipe.vae.to(memory_format=torch.channels_last)
31
  apply_cache_on_pipe(self.pipe, residual_diff_threshold=0.12)
32
+ #self.pipe.transformer = torch.compile(
33
+ # self.pipe.transformer, mode="max-autotune-no-cudagraphs",
34
+ #)
35
+ #self.pipe.vae = torch.compile(
36
+ # self.pipe.vae, mode="max-autotune-no-cudagraphs",
37
+ #)
38
+ self.pipe.transformer = autoquant(self.pipe.transformer, error_on_unseen=False)
39
+ self.pipe.vae = autoquant(self.pipe.vae, error_on_unseen=False)
40
 
41
  gc.collect()
42
  torch.cuda.empty_cache()