from transformers import PretrainedConfig


class ActEstimatorConfig(PretrainedConfig):
    """Hyperparameter container for the ACT-Estimator model.

    The constructor records each named argument on the instance under the
    same name and passes every remaining keyword argument through to
    ``PretrainedConfig.__init__``.

    Args:
        input_shape: Shape of one model input. Defaults to
            ``(3, 44, 224, 224)``.
            NOTE(review): looks like (channels, frames, height, width) --
            confirm against the model code.
        num_classes: Number of output classes. Defaults to 9.
        max_seq_len: Maximum sequence length. Defaults to 44, which equals
            ``input_shape[1]`` in the defaults; nothing here enforces that
            the two stay in sync.
        timestamp_dim: Dimensionality of the timestamp input. Defaults to 1.
        d_model: Model width. Defaults to 512.
        num_heads: Number of attention heads. Defaults to 8.
        dropout: Dropout rate. Defaults to 0.1.
        feature_map_size: Defaults to 4.
            NOTE(review): presumably the spatial size of a backbone feature
            map -- confirm against the model code.
        **kwargs: Forwarded unchanged to ``PretrainedConfig.__init__``.
    """

    # Class-level identifier string for this configuration type.
    model_type = "ACT-Estimator"

    def __init__(
        self,
        input_shape=(3, 44, 224, 224),
        num_classes=9,
        max_seq_len=44,
        timestamp_dim=1,
        d_model=512,
        num_heads=8,
        dropout=0.1,
        feature_map_size=4,
        **kwargs,
    ):
        # Input / output geometry.
        self.input_shape = input_shape
        self.num_classes = num_classes
        self.max_seq_len = max_seq_len
        self.timestamp_dim = timestamp_dim

        # Network hyperparameters.
        self.d_model = d_model
        self.num_heads = num_heads
        self.dropout = dropout
        self.feature_map_size = feature_map_size

        # The base initializer runs last, after this class's own fields are
        # set, and receives only the keyword arguments not consumed above.
        super().__init__(**kwargs)