Spaces:
Paused
Paused
import torch | |
from transformers import PretrainedConfig, BitsAndBytesConfig | |
import math | |
from typing import Optional | |
class VisionProjectorConfig(PretrainedConfig): | |
def __init__( | |
self, | |
input_dim=768, | |
hidden_dim=256, | |
num_tokens=1, | |
output_dim=2560, | |
**kwargs | |
): | |
#super.__init__(**kwargs) | |
self.input_dim = input_dim | |
self.hidden_dim = hidden_dim | |
self.output_dim = output_dim | |
self.num_tokens = num_tokens | |
self.kwargs = kwargs | |
app_config = dict( | |
max_seqlen=512, | |
max_caption_len=100, | |
data_dir='../data', | |
output_dir="./results", | |
vision_model=True, | |
vision_projector_file='models/vision_projector/vp_ckpt_0.pth', | |
phi_adapter_dir='models/phi_adapter' | |
) |