samkeet
/

GPT_124M

samkeet committed on Jan 30

Commit

1d7f089

verified ·

1 Parent(s): 5c2d7dc

Upload model

Files changed (2) hide show

config.json CHANGED Viewed

@@ -7,21 +7,6 @@
     "AutoModelForCausalLM": "modeling_gpt.GPTModelForTextGeneration"
   },
   "block_size": 1024,
-  "custom_pipelines": {
-    "text-generation": {
-      "default": {
-        "model": {
-          "pt": "samkeet/GPT_124M"
-        }
-      },
-      "impl": "pipeline_gpt.GPT124MTextGenerationPipeline",
-      "pt": [
-        "AutoModelForCausalLM"
-      ],
-      "tf": [],
-      "type": "text"
-    }
-  },
   "model_type": "custom_gpt",
   "n_embd": 768,
   "n_head": 12,

     "AutoModelForCausalLM": "modeling_gpt.GPTModelForTextGeneration"
   },
   "block_size": 1024,
   "model_type": "custom_gpt",
   "n_embd": 768,
   "n_head": 12,

modeling_gpt.py CHANGED Viewed

@@ -1,7 +1,6 @@
 # Importing libraries
 import torch
 import torch.nn as nn
-from typing import Generator
 import torch.nn.functional as F
 from transformers import PreTrainedModel
 from .configuration_gpt import GPTConfig
@@ -250,7 +249,7 @@ class GPTModelForTextGeneration(PreTrainedModel):
         # Autoregressive token generation loop
         while tokens.size(1) < max_length:
             logits = self.forward(tokens)["logits"][:, -1, :]
-            logits = logits / temperature
             if do_sample:
                 top_k = min(top_k, logits.size(-1))  # Safety check

 # Importing libraries
 import torch
 import torch.nn as nn
 import torch.nn.functional as F
 from transformers import PreTrainedModel
 from .configuration_gpt import GPTConfig
         # Autoregressive token generation loop
         while tokens.size(1) < max_length:
             logits = self.forward(tokens)["logits"][:, -1, :]
+            logits = logits / max(0.01, temperature)
             if do_sample:
                 top_k = min(top_k, logits.size(-1))  # Safety check