FramePack / diffusers_helper /clip_vision.py
MohamedRashad's picture
Add initial implementation of helper functions and requirements for diffusers
a252b0c
raw
history blame contribute delete
449 Bytes
import numpy as np
def hf_clip_vision_encode(image: np.ndarray, feature_extractor, image_encoder):
    """Preprocess a 3-channel uint8 image and run it through a vision encoder.

    Args:
        image: A ``numpy.ndarray`` with exactly three dimensions whose last
            axis has size 3 and whose dtype is ``uint8`` (presumably a
            height x width x channel image -- confirm against callers).
        feature_extractor: Object exposing
            ``preprocess(images=..., return_tensors=...)``; the value it
            returns must support ``.to(device=..., dtype=...)`` and be
            unpackable with ``**`` as keyword arguments.
        image_encoder: Callable model exposing ``device`` and ``dtype``
            attributes; it is invoked with the preprocessed keyword arguments.

    Returns:
        Whatever ``image_encoder`` returns for the preprocessed input; the
        output is passed through unchanged.

    Raises:
        AssertionError: If ``image`` is not an ndarray, does not have three
            dimensions with a last axis of size 3, or is not ``uint8``.
    """
    # Explicit raises instead of ``assert`` statements: asserts are stripped
    # when Python runs with -O, which would let malformed input through.
    # AssertionError is kept so the exception type seen by callers is the
    # same as with the original assert-based checks.
    if not isinstance(image, np.ndarray):
        raise AssertionError(
            f"image must be a numpy.ndarray, got {type(image).__name__}"
        )
    if image.ndim != 3 or image.shape[2] != 3:
        raise AssertionError(
            "image must have 3 dimensions with a last axis of size 3, "
            f"got shape {image.shape}"
        )
    if image.dtype != np.uint8:
        raise AssertionError(f"image dtype must be uint8, got {image.dtype}")

    preprocessed = feature_extractor.preprocess(images=image, return_tensors="pt")
    # Move the inputs to the encoder's device and dtype so they match the
    # model before the forward call.
    preprocessed = preprocessed.to(
        device=image_encoder.device,
        dtype=image_encoder.dtype,
    )
    return image_encoder(**preprocessed)