NoMoreCopyrightOrg
/

flux-test

Model card | Files and versions

John6666 committed on Mar 4

Commit

b883a97

·

verified ·

1 Parent(s): e23cbc1

Upload 2 files

Files changed (2) hide show

handler.py +5 -5
requirements.txt +1 -2

handler.py CHANGED Viewed

@@ -8,7 +8,7 @@ import torch
 #import torch._dynamo
 #torch._dynamo.config.suppress_errors = True
-from huggingface_inference_toolkit.logging import logger
 def compile_pipeline(pipe) -> Any:
     pipe.transformer.fuse_qkv_projections()
@@ -19,8 +19,8 @@ def compile_pipeline(pipe) -> Any:
 class EndpointHandler:
     def __init__(self, path="NoMoreCopyright/FLUX.1-dev-test"):
         is_compile = False
-        #repo_id = "camenduru/FLUX.1-dev-diffusers"
-        repo_id = "NoMoreCopyright/FLUX.1-dev-test"
         dtype = torch.bfloat16
         quantization_config = TorchAoConfig("int4dq")
         vae = AutoencoderKL.from_pretrained(repo_id, subfolder="vae", torch_dtype=dtype)
@@ -29,9 +29,9 @@ class EndpointHandler:
         if is_compile: self.pipeline = compile_pipeline(self.pipeline)
         self.pipeline.to("cuda")
-    @torch.inference_mode()
     def __call__(self, data: Dict[str, Any]) -> Image:
-        logger.info(f"Received incoming request with {data=}")
         if "inputs" in data and isinstance(data["inputs"], str):
             prompt = data.pop("inputs")

 #import torch._dynamo
 #torch._dynamo.config.suppress_errors = True
+#from huggingface_inference_toolkit.logging import logger
 def compile_pipeline(pipe) -> Any:
     pipe.transformer.fuse_qkv_projections()
 class EndpointHandler:
     def __init__(self, path="NoMoreCopyright/FLUX.1-dev-test"):
         is_compile = False
+        repo_id = "camenduru/FLUX.1-dev-diffusers"
+        #repo_id = "NoMoreCopyright/FLUX.1-dev-test"
         dtype = torch.bfloat16
         quantization_config = TorchAoConfig("int4dq")
         vae = AutoencoderKL.from_pretrained(repo_id, subfolder="vae", torch_dtype=dtype)
         if is_compile: self.pipeline = compile_pipeline(self.pipeline)
         self.pipeline.to("cuda")
+    #@torch.inference_mode()
     def __call__(self, data: Dict[str, Any]) -> Image:
+        #logger.info(f"Received incoming request with {data=}")
         if "inputs" in data and isinstance(data["inputs"], str):
             prompt = data.pop("inputs")

requirements.txt CHANGED Viewed

@@ -7,5 +7,4 @@ accelerate
 transformers
 numpy
 scipy
-Pillow
-triton

 transformers
 numpy
 scipy
+Pillow