bananaml · bishwenduk029 · Oct 23, 2022
diff --git a/download.py b/download.py
@@ -1,13 +1,22 @@
 # In this file, we define download_model
 # It runs during container build time to get model weights built into the container
 
-# In this example: A Huggingface BERT model
+# In this example: A Huggingface GPT-NeoX model
 
-from transformers import pipeline
+from transformers import GPTNeoXForCausalLM, GPTNeoXTokenizerFast
+import torch
 
 def download_model():
     # do a dry run of loading the huggingface model, which will download weights
-    pipeline('fill-mask', model='bert-base-uncased')
+    checkpoint = "EleutherAI/gpt-neox-20b"
+    # Half-precision load options (float16 revision and dtype), forwarded to from_pretrained below.
+    fp16_kwargs = dict(revision="float16", torch_dtype=torch.float16, low_cpu_mem_usage=True)
+    print("downloading model...")
+    GPTNeoXForCausalLM.from_pretrained(checkpoint, **fp16_kwargs)
+    print("done")
+    print("downloading tokenizer...")
+    GPTNeoXTokenizerFast.from_pretrained(checkpoint)
+    print("done")
 
 if __name__ == "__main__":
     download_model()