Spaces:
Runtime error
Runtime error
folder
Browse files
configs/clm_models/agent_7b_sft.yaml
CHANGED
@@ -15,4 +15,5 @@ output_resampler:
|
|
15 |
|
16 |
lm_loss_scale: 1.0
|
17 |
rec_loss_scale: 1.0
|
18 |
-
pretrained_model_path: TencentARC/SEED-Story
|
|
|
|
15 |
|
16 |
lm_loss_scale: 1.0
|
17 |
rec_loss_scale: 1.0
|
18 |
+
pretrained_model_path: TencentARC/SEED-Story
|
19 |
+
subfolder: seed_story/george_sft
|
src/models_clm/models.py
CHANGED
@@ -221,23 +221,22 @@ class ContinuousLVLM(nn.Module):
|
|
221 |
'past_key_values': output_past_key_values
|
222 |
}
|
223 |
|
224 |
-
|
225 |
@classmethod
|
226 |
-
def from_pretrained(cls, llm, input_resampler, output_resampler, pretrained_model_path=None, **kwargs):
|
227 |
model = cls(llm=llm, input_resampler=input_resampler, output_resampler=output_resampler, **kwargs)
|
228 |
|
229 |
if pretrained_model_path is not None:
|
230 |
-
#
|
231 |
if 'TencentARC/SEED-Story' in pretrained_model_path:
|
232 |
-
#
|
233 |
-
ckpt = AutoModel.from_pretrained(pretrained_model_path, subfolder=
|
234 |
missing, unexpected = model.load_state_dict(ckpt.state_dict(), strict=False)
|
235 |
-
print('
|
236 |
else:
|
237 |
# For local path loading
|
238 |
ckpt = torch.load(pretrained_model_path, map_location='cpu')
|
239 |
missing, unexpected = model.load_state_dict(ckpt, strict=False)
|
240 |
-
print('
|
241 |
|
242 |
return model
|
243 |
|
|
|
221 |
'past_key_values': output_past_key_values
|
222 |
}
|
223 |
|
|
|
224 |
@classmethod
|
225 |
+
def from_pretrained(cls, llm, input_resampler, output_resampler, pretrained_model_path=None, subfolder=None, **kwargs):
|
226 |
model = cls(llm=llm, input_resampler=input_resampler, output_resampler=output_resampler, **kwargs)
|
227 |
|
228 |
if pretrained_model_path is not None:
|
229 |
+
# Load model from Hugging Face Hub with subfolder specification
|
230 |
if 'TencentARC/SEED-Story' in pretrained_model_path:
|
231 |
+
# Use `subfolder` to specify the location within the repository
|
232 |
+
ckpt = AutoModel.from_pretrained(pretrained_model_path, subfolder=subfolder)
|
233 |
missing, unexpected = model.load_state_dict(ckpt.state_dict(), strict=False)
|
234 |
+
print('Detokenizer model, missing keys: ', len(missing), 'unexpected keys:', len(unexpected))
|
235 |
else:
|
236 |
# For local path loading
|
237 |
ckpt = torch.load(pretrained_model_path, map_location='cpu')
|
238 |
missing, unexpected = model.load_state_dict(ckpt, strict=False)
|
239 |
+
print('Detokenizer model, missing keys: ', len(missing), 'unexpected keys:', len(unexpected))
|
240 |
|
241 |
return model
|
242 |
|