denizyuret-shallowai committed
Commit 0e6dbed · 1 Parent(s): 6fea841

Upload model

config.json ADDED
@@ -0,0 +1,21 @@
+ {
+   "architectures": [
+     "CustomModel5"
+   ],
+   "auto_map": {
+     "AutoConfig": "configuration_custom5.CustomConfig5",
+     "AutoModelForCausalLM": "modeling_custom5.CustomModel5"
+   },
+   "coeffs": [
+     1.0,
+     -1.0
+   ],
+   "model_type": "custom5",
+   "models": [
+     "EleutherAI/pythia-160m",
+     "EleutherAI/pythia-70m"
+   ],
+   "torch_dtype": "float16",
+   "transformers_version": "4.34.0",
+   "vocab_size": 50304
+ }
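
For reference, a minimal sketch of loading this checkpoint through the auto_map entries above. The repo id below is a placeholder for this model's actual Hub path, and trust_remote_code is required so the Auto classes pick up the custom code files shipped with the commit.

from transformers import AutoModelForCausalLM, AutoTokenizer

repo_id = "denizyuret-shallowai/<this-repo>"  # hypothetical id, replace with the real Hub path

# auto_map routes AutoModelForCausalLM to modeling_custom5.CustomModel5,
# which only runs if remote code execution is explicitly allowed.
model = AutoModelForCausalLM.from_pretrained(repo_id, trust_remote_code=True)

# The member models are Pythia checkpoints, which share the GPT-NeoX tokenizer.
tokenizer = AutoTokenizer.from_pretrained("EleutherAI/pythia-160m")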
configuration_custom5.py ADDED
@@ -0,0 +1,17 @@
+ from transformers import PretrainedConfig, AutoConfig
+
+ class CustomConfig5(PretrainedConfig):
+     model_type = "custom5"
+
+     def __init__(
+         self,
+         models=None,
+         coeffs=None,
+         **kwargs,
+     ):
+         super().__init__(**kwargs)
+         self.models = models
+         self.coeffs = coeffs
+         if models:
+             configs = [ AutoConfig.from_pretrained(model) for model in models ]
+             self.vocab_size = configs[0].vocab_size
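
A minimal sketch of constructing this config by hand, assuming configuration_custom5.py is importable from the working directory; the values mirror config.json above. Passing models triggers AutoConfig.from_pretrained for each member, so their configs are fetched just to read vocab_size.

from configuration_custom5 import CustomConfig5

cfg = CustomConfig5(
    models=["EleutherAI/pythia-160m", "EleutherAI/pythia-70m"],
    coeffs=[1.0, -1.0],
)
# vocab_size is copied from the first member model's config, hence 50304 in config.json.
print(cfg.model_type, cfg.vocab_size)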
modeling_custom5.py ADDED
@@ -0,0 +1,48 @@
+ # https://huggingface.co/docs/transformers/custom_models
+
+ from transformers import PreTrainedModel, AutoModelForCausalLM, AutoTokenizer, AutoModel, AutoConfig
+ from transformers.modeling_outputs import CausalLMOutputWithPast
+ from torch.nn import CrossEntropyLoss
+ from torch.nn.functional import log_softmax
+ from torch.nn.modules.container import ModuleList
+ from .configuration_custom5 import CustomConfig5
+
+ class CustomModel5(PreTrainedModel):
+     config_class = CustomConfig5
+
+     def __init__(self, config):
+         super().__init__(config)
+         self.model = ModuleList([AutoModelForCausalLM.from_pretrained(m) for m in config.models])
+
+     def forward(self, *args, labels=None, **kwargs):
+         loss = None
+         logits = None
+         for model, coeff in zip(self.model, self.config.coeffs):
+             logp = log_softmax(model.forward(*args, **kwargs).logits, dim=-1)
+             logits = coeff * logp if logits is None else logits + coeff * logp
+         # The rest copied from modeling_llama.py:
+         if labels is not None:
+             # Shift so that tokens < n predict n
+             shift_logits = logits[..., :-1, :].contiguous()
+             shift_labels = labels[..., 1:].contiguous()
+             # Flatten the tokens
+             loss_fct = CrossEntropyLoss()
+             shift_logits = shift_logits.view(-1, self.config.vocab_size)
+             shift_labels = shift_labels.view(-1)
+             # Enable model parallelism
+             shift_labels = shift_labels.to(shift_logits.device)
+             loss = loss_fct(shift_logits, shift_labels)
+
+         return CausalLMOutputWithPast(loss=loss, logits=logits)
+
+ ## Which one do we use?
+ ## You have to tell the library you want to copy the code files of those objects when using the save_pretrained method and properly register them with a given Auto class (especially for models), just run:
+ # CustomConfig5.register_for_auto_class()
+ # CustomModel5.register_for_auto_class('AutoModelForCausalLM')
+ # CustomModel5.register_for_auto_class('AutoModel')
+
+ ## If you are writing a library that extends 🤗 Transformers, you may want to extend the auto classes to include your own model. This is different from pushing the code to the Hub in the sense that users will need to import your library to get the custom models (contrarily to automatically downloading the model code from the Hub).
+ ## As long as your config has a model_type attribute that is different from existing model types, and that your model classes have the right config_class attributes, you can just add them to the auto classes like this:
+ # AutoConfig.register("custom5", CustomConfig5)
+ # AutoModel.register(CustomConfig5, CustomModel5)
+ # AutoModelForCausalLM.register(CustomConfig5, CustomModel5)
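
With coeffs = [1.0, -1.0], forward combines the two members as a per-token difference of log-probabilities: log_softmax of the pythia-160m logits minus log_softmax of the pythia-70m logits. A minimal sketch of that computation written directly against the member models (the prompt below is only illustrative):

import torch
from torch.nn.functional import log_softmax
from transformers import AutoModelForCausalLM, AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("EleutherAI/pythia-160m")
big = AutoModelForCausalLM.from_pretrained("EleutherAI/pythia-160m").eval()
small = AutoModelForCausalLM.from_pretrained("EleutherAI/pythia-70m").eval()

ids = tokenizer("Ankara is the capital of", return_tensors="pt").input_ids
with torch.no_grad():
    # coeffs [1.0, -1.0]: combined score = log p_160m - log p_70m, token by token
    combined = 1.0 * log_softmax(big(ids).logits, dim=-1) \
             - 1.0 * log_softmax(small(ids).logits, dim=-1)

# Greedy next token under the combined score
next_id = combined[0, -1].argmax().item()
print(tokenizer.decode(next_id))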
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:d39c55bd4bf0be5a6d21ae200275a23b07f3fbd4c803959ce3341a5210a2aea1
+ size 465582677