Spaces: Running on Zero
Commit 4b30dce · Parent: 8fd23f8
app changes
app.py
CHANGED
@@ -28,12 +28,11 @@ EXAMPLES = [
     # ["Portrait of a young woman", "monkey.png", "face, hair, eyes", 456],
 ]
 
-
 pipeline = ConceptAttentionFluxPipeline(model_name="flux-schnell", device="cuda")
 
-
 @spaces.GPU(duration=60)
 def process_inputs(prompt, input_image, word_list, seed):
+    print("Processing inputs")
     prompt = prompt.strip()
     if not word_list.strip():
         return None, "Please enter comma-separated words"
concept_attention/binary_segmentation_baselines/__pycache__/raw_cross_attention.cpython-310.pyc
CHANGED
Binary files a/concept_attention/binary_segmentation_baselines/__pycache__/raw_cross_attention.cpython-310.pyc and b/concept_attention/binary_segmentation_baselines/__pycache__/raw_cross_attention.cpython-310.pyc differ

concept_attention/binary_segmentation_baselines/__pycache__/raw_output_space.cpython-310.pyc
CHANGED
Binary files a/concept_attention/binary_segmentation_baselines/__pycache__/raw_output_space.cpython-310.pyc and b/concept_attention/binary_segmentation_baselines/__pycache__/raw_output_space.cpython-310.pyc differ
concept_attention/flux/src/flux/util.py
CHANGED
@@ -2,6 +2,7 @@ import os
 from dataclasses import dataclass
 
 import torch
+from torch import nn
 from einops import rearrange
 from huggingface_hub import hf_hub_download
 from imwatermark import WatermarkEncoder
@@ -126,6 +127,34 @@ def load_flow_model(name: str, device: str | torch.device = "cuda", hf_download:
 
     return model
 
+
+class T5Embedder(nn.Module):
+    def __init__(self, hf_module, tokenizer, max_length=512, output_key="last_hidden_state"):
+        super().__init__()
+        self.max_length = max_length
+        self.output_key = output_key
+        self.hf_module = hf_module
+        self.tokenizer = tokenizer
+
+    def forward(self, text: list[str]) -> torch.Tensor:
+        batch_encoding = self.tokenizer(
+            text,
+            truncation=True,
+            max_length=self.max_length,
+            return_length=False,
+            return_overflowing_tokens=False,
+            padding="max_length",
+            return_tensors="pt",
+        )
+
+        outputs = self.hf_module(
+            input_ids=batch_encoding["input_ids"].to(self.hf_module.device),
+            attention_mask=None,
+            output_hidden_states=False,
+        )
+        return outputs[self.output_key]
+
+
 def load_t5(device: str | torch.device = "cuda", max_length: int = 512) -> HFEmbedder:
     # Download each of the files
     config_file = hf_hub_download(configs["flux-schnell"].repo_id, "text_encoder_2/config.json")  # File 1: config.json
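
The new T5Embedder is a thin nn.Module wrapper that makes the encoder callable on raw strings: it tokenizes with padding="max_length" and truncation, runs the wrapped T5EncoderModel with attention_mask=None (so pad positions are embedded too, which appears to mirror the HFEmbedder it stands in for), and returns last_hidden_state. A hedged usage sketch, assuming the class as defined in this hunk; loading google/t5-v1_1-xxl is heavy, so this only illustrates the call shape:

import torch
from transformers import T5EncoderModel, T5Tokenizer

# Load the tokenizer and encoder named in the diff (illustrative only).
tokenizer = T5Tokenizer.from_pretrained("google/t5-v1_1-xxl")
encoder = T5EncoderModel.from_pretrained("google/t5-v1_1-xxl", torch_dtype=torch.bfloat16)

embedder = T5Embedder(encoder, tokenizer, max_length=512)
emb = embedder(["a photo of a cat"])  # tensor of shape (1, 512, hidden_size)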
@@ -139,13 +168,20 @@ def load_t5(device: str | torch.device = "cuda", max_length: int = 512) -> HFEmb
     state_dict.update(load_sft(safe_tensor_1, device=str(device)))
     state_dict.update(load_sft(safe_tensor_2, device=str(device)))
     # Load the state dict
-    t5_encoder = T5EncoderModel(config=model_config)
+    t5_encoder = T5EncoderModel(config=model_config).to(torch.bfloat16)
     t5_encoder.load_state_dict(state_dict, strict=False)
 
     # Load the tokenizer
     tokenizer = T5Tokenizer.from_pretrained("google/t5-v1_1-xxl")
     t5_encoder.tokenizer = tokenizer
 
+    # Now make t5 a custom model that tokenizes the input and then passes it through the model
+    return T5Embedder(
+        t5_encoder,
+        tokenizer,
+        max_length=max_length,
+        output_key="last_hidden_state"
+    ).to(device)
     # max length 64, 128, 256 and 512 should work (if your sequence is short enough)
     # Load the safe tensors model
     # ckpt_path = hf_hub_download(configs["name"].repo_id, configs["name"].repo_flow)
@@ -156,8 +192,8 @@ def load_t5(device: str | torch.device = "cuda", max_length: int = 512) -> HFEmb
     # max_length=max_length,
     # torch_dtype=torch.bfloat16,
     # ).to(device)
-
-    return t5_encoder
+    #
+    # return t5_encoder
     # return HFEmbedder("google/t5-v1_1-xxl", max_length=max_length, torch_dtype=torch.bfloat16).to(device)
 
 def load_clip(device: str | torch.device = "cuda") -> HFEmbedder:
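
Net effect of the last two hunks: load_t5 casts the config-built encoder to bfloat16 before loading the safetensors weights (halving memory versus fp32), and returns the T5Embedder moved to the target device instead of the bare T5EncoderModel, whose old return is now commented out. One loose end worth flagging: the signature still annotates the return as HFEmbedder even though a T5Embedder now comes back; presumably the two are call-compatible. The resulting call path, sketched with placeholder inputs:

t5 = load_t5(device="cuda", max_length=512)  # T5Embedder on cuda, bf16 weights
prompt_emb = t5(["A dog by a tree"])         # tokenize + encode in one call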