Spaces:
Runtime error
Runtime error
folder
Browse files
configs/clm_models/agent_7b_sft.yaml
CHANGED
|
@@ -15,4 +15,5 @@ output_resampler:
|
|
| 15 |
|
| 16 |
lm_loss_scale: 1.0
|
| 17 |
rec_loss_scale: 1.0
|
| 18 |
-
pretrained_model_path: TencentARC/SEED-Story
|
|
|
|
|
|
| 15 |
|
| 16 |
lm_loss_scale: 1.0
|
| 17 |
rec_loss_scale: 1.0
|
| 18 |
+
pretrained_model_path: TencentARC/SEED-Story
|
| 19 |
+
subfolder: seed_story/george_sft
|
src/models_clm/models.py
CHANGED
|
@@ -221,23 +221,22 @@ class ContinuousLVLM(nn.Module):
|
|
| 221 |
'past_key_values': output_past_key_values
|
| 222 |
}
|
| 223 |
|
| 224 |
-
|
| 225 |
@classmethod
|
| 226 |
-
def from_pretrained(cls, llm, input_resampler, output_resampler, pretrained_model_path=None, **kwargs):
|
| 227 |
model = cls(llm=llm, input_resampler=input_resampler, output_resampler=output_resampler, **kwargs)
|
| 228 |
|
| 229 |
if pretrained_model_path is not None:
|
| 230 |
-
#
|
| 231 |
if 'TencentARC/SEED-Story' in pretrained_model_path:
|
| 232 |
-
#
|
| 233 |
-
ckpt = AutoModel.from_pretrained(pretrained_model_path, subfolder=
|
| 234 |
missing, unexpected = model.load_state_dict(ckpt.state_dict(), strict=False)
|
| 235 |
-
print('
|
| 236 |
else:
|
| 237 |
# For local path loading
|
| 238 |
ckpt = torch.load(pretrained_model_path, map_location='cpu')
|
| 239 |
missing, unexpected = model.load_state_dict(ckpt, strict=False)
|
| 240 |
-
print('
|
| 241 |
|
| 242 |
return model
|
| 243 |
|
|
|
|
| 221 |
'past_key_values': output_past_key_values
|
| 222 |
}
|
| 223 |
|
|
|
|
| 224 |
@classmethod
def from_pretrained(cls, llm, input_resampler, output_resampler, pretrained_model_path=None, subfolder=None, **kwargs):
    """Build the model and optionally initialise it from pretrained weights.

    Args:
        llm: Passed through to the class constructor as ``llm``.
        input_resampler: Passed through to the constructor as ``input_resampler``.
        output_resampler: Passed through to the constructor as ``output_resampler``.
        pretrained_model_path: Where to read weights from. ``None`` skips
            weight loading entirely. A value containing
            ``'TencentARC/SEED-Story'`` is loaded through
            ``AutoModel.from_pretrained``; anything else is handed to
            ``torch.load`` as a checkpoint file path.
        subfolder: Optional location inside the Hub repository. Only used
            for the ``AutoModel`` branch, and only forwarded when it is not
            ``None`` so the library's own default applies otherwise.
        **kwargs: Extra keyword arguments forwarded to the constructor.

    Returns:
        The constructed model, with weights loaded non-strictly when
        ``pretrained_model_path`` was given.
    """
    model = cls(llm=llm, input_resampler=input_resampler, output_resampler=output_resampler, **kwargs)

    # Nothing to load: hand back the freshly constructed model.
    if pretrained_model_path is None:
        return model

    if 'TencentARC/SEED-Story' in pretrained_model_path:
        # Forward `subfolder` only when the caller supplied one, so a missing
        # value falls back to AutoModel's default instead of an explicit None.
        hub_kwargs = {} if subfolder is None else {'subfolder': subfolder}
        state_dict = AutoModel.from_pretrained(pretrained_model_path, **hub_kwargs).state_dict()
    else:
        # For local path loading.
        # NOTE(security): torch.load unpickles the file; only point this at
        # checkpoints from a trusted source (consider weights_only=True if the
        # installed torch version supports it).
        state_dict = torch.load(pretrained_model_path, map_location='cpu')

    # strict=False: key mismatches are reported below rather than raised.
    missing, unexpected = model.load_state_dict(state_dict, strict=False)
    # NOTE(review): the message says "Detokenizer model" although this loader
    # belongs to ContinuousLVLM -- confirm whether the label is intentional.
    print('Detokenizer model, missing keys: ', len(missing), 'unexpected keys:', len(unexpected))

    return model
|
| 242 |
|