denizyuret-shallowai
/

foo3

Text Generation

text-generation-inference

Inference Endpoints

Model card Files Files and versions Community

denizyuret-shallowai committed on Oct 21, 2023

Commit

cb95e0b

•

1 Parent(s): 9a64e09

Upload model

Files changed (3) hide show

config.json +1 -1
modeling_custom.py +1 -1
pytorch_model.bin +2 -2

config.json CHANGED Viewed

@@ -24,7 +24,7 @@
   "rotary_emb_base": 10000,
   "rotary_pct": 0.25,
   "tie_word_embeddings": false,
-  "torch_dtype": "float32",
   "transformers_version": "4.31.0",
   "use_cache": true,
   "use_parallel_residual": true,

   "rotary_emb_base": 10000,
   "rotary_pct": 0.25,
   "tie_word_embeddings": false,
+  "torch_dtype": "float16",
   "transformers_version": "4.31.0",
   "use_cache": true,
   "use_parallel_residual": true,

modeling_custom.py CHANGED Viewed

@@ -18,7 +18,7 @@ class CustomModel(GPTNeoXForCausalLM):
     @classmethod
     def copy_from_neox(cls, *args, **kwargs):
         m0 = GPTNeoXForCausalLM.from_pretrained(*args, **kwargs)
-        m1 = cls(m0.config)
         m1.load_state_dict(m0.state_dict())
         return m1

     @classmethod
     def copy_from_neox(cls, *args, **kwargs):
         m0 = GPTNeoXForCausalLM.from_pretrained(*args, **kwargs)
+        m1 = cls(m0.config).to(dtype=m0.dtype, device=m0.device)
         m1.load_state_dict(m0.state_dict())
         return m1

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3e4128420302e58c85fc79e4553c320c270cab3169bc72310bdf2b5b75032a6d
-size 281732711

 version https://git-lfs.github.com/spec/v1
+oid sha256:781eaeb60eaee1da015e90d41470942b4597682f8ead7b94aa29676139808cd7
+size 140879463