from .clip_model import convert_weights_to_precision, VisionTransformer, LayerNorm
# NOTE: the rest of the ImageEncoder implementation is omitted here.