|
from transformers import PretrainedConfig |
|
|
|
|
|
class MarlinConfig(PretrainedConfig): |
|
model_type = "marlin" |
|
|
|
def __init__(self, **kwargs): |
|
self.img_size = kwargs.pop("img_size", None) |
|
self.patch_size = kwargs.pop("patch_size", None) |
|
self.n_frames = kwargs.pop("n_frames", None) |
|
self.encoder_embed_dim = kwargs.pop("encoder_embed_dim", None) |
|
self.encoder_depth = kwargs.pop("encoder_depth", None) |
|
self.encoder_num_heads = kwargs.pop("encoder_num_heads", None) |
|
self.decoder_embed_dim = kwargs.pop("decoder_embed_dim", None) |
|
self.decoder_depth = kwargs.pop("decoder_depth", None) |
|
self.decoder_num_heads = kwargs.pop("decoder_num_heads", None) |
|
self.mlp_ratio = kwargs.pop("mlp_ratio", None) |
|
self.qkv_bias = kwargs.pop("qkv_bias", None) |
|
self.qk_scale = kwargs.pop("qk_scale", None) |
|
self.drop_rate = kwargs.pop("drop_rate", None) |
|
self.attn_drop_rate = kwargs.pop("attn_drop_rate", None) |
|
self.norm_layer = kwargs.pop("norm_layer", None) |
|
self.init_values = kwargs.pop("init_values", None) |
|
self.tubelet_size = kwargs.pop("tubelet_size", None) |
|
self.as_feature_extractor = kwargs.pop("as_feature_extractor", True) |
|
|
|
super().__init__(**kwargs) |
|
|