
Commit 03e5909

updates for 70b and gpu process monitor
1 parent 77774d2

3 files changed: +456 −2 lines changed


dist_run.py

Lines changed: 1 addition & 0 deletions
@@ -58,6 +58,7 @@
 NAME_TO_DISTRIBUTION_AND_DTYPE = {
     "llama2-7b-chat": ("meta-llama/Llama-2-7b-chat-hf", torch.float16),
     "llama3": ("meta-llama/Meta-Llama-3-8B-Instruct", torch.bfloat16),
+    "llama3-70b": ("meta-llama/Meta-Llama-3-70B-Instruct", torch.bfloat16),
 }
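For context, a minimal sketch of how the new "llama3-70b" alias might be resolved against this table; resolve_model is a hypothetical helper for illustration, not code from dist_run.py.

import torch

# Abridged mirror of the mapping touched above; the full table lives in dist_run.py.
NAME_TO_DISTRIBUTION_AND_DTYPE = {
    "llama3": ("meta-llama/Meta-Llama-3-8B-Instruct", torch.bfloat16),
    "llama3-70b": ("meta-llama/Meta-Llama-3-70B-Instruct", torch.bfloat16),
}

def resolve_model(name: str) -> tuple[str, torch.dtype]:
    # Look up the Hugging Face repo id and dtype for a model alias.
    try:
        return NAME_TO_DISTRIBUTION_AND_DTYPE[name]
    except KeyError:
        raise ValueError(f"unknown model name: {name!r}") from None

distribution, dtype = resolve_model("llama3-70b")
print(distribution, dtype)  # meta-llama/Meta-Llama-3-70B-Instruct torch.bfloat16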

Lines changed: 2 additions & 2 deletions
@@ -1,5 +1,5 @@
 from transformers import AutoModelForCausalLM, AutoTokenizer
 
-tokenizer = AutoTokenizer.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct")
-model = AutoModelForCausalLM.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct")
+# tokenizer = AutoTokenizer.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct")
+model = AutoModelForCausalLM.from_pretrained("meta-llama/Meta-Llama-3-70B-Instruct")
 print("Model weights and tokenizer downloaded")
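As a side note, if the goal of this script is only to pre-fetch the 70B checkpoint, one possible alternative (an assumption about intent, not what this commit does) is to download the files without instantiating the model, e.g. via huggingface_hub:

from huggingface_hub import snapshot_download

# Downloads the repo's files to the local Hugging Face cache without loading
# the 70B weights into memory; assumes access to the gated repo has been
# granted and an HF token is configured.
local_dir = snapshot_download("meta-llama/Meta-Llama-3-70B-Instruct")
print("Model weights and tokenizer downloaded to", local_dir)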
