Commit b505367
flash attn, default temp, in last commit worked well. set temp 0.7, try to induce more code-switching
ctarnold committed Mar 22, 2024
1 parent b64385e commit b505367
Showing 2 changed files with 10 additions and 4 deletions.
2 changes: 1 addition & 1 deletion jobZero.slurm
@@ -3,7 +3,7 @@
 #SBATCH --nodes=1                # node count
 #SBATCH --ntasks=1               # total number of tasks across all nodes
 #SBATCH --cpus-per-task=1        # cpu-cores per task (>1 if multi-threaded tasks)
-#SBATCH --mem-per-cpu=190G       # memory per cpu-core (4G is default)
+#SBATCH --mem-per-cpu=64G        # memory per cpu-core (4G is default)
 #SBATCH --gres=gpu:1             # of gpus per node
 #SBATCH --time=00:30:00          # total run time limit (HH:MM:SS)
 #SBATCH --mail-type=begin        # send email when job begins
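A note on the jobZero.slurm change: dropping --mem-per-cpu from 190G to 64G is consistent with how device_map="auto" loads sharded checkpoints, since weights are dispatched to the GPU shard by shard rather than fully materialized in host RAM first. A rough back-of-the-envelope sketch, assuming the commonly cited ~46.7B total parameters for Mixtral-8x7B (an assumption, not stated in this repo):

# Hypothetical estimate of the fp16 footprint behind the --mem-per-cpu change.
params = 46.7e9            # assumed total parameter count for Mixtral-8x7B
bytes_per_param = 2        # torch.float16
print(f"full fp16 footprint: ~{params * bytes_per_param / 1e9:.0f} GB")  # ~93 GB

# With device_map="auto", shards are placed on their target devices as they
# load, so peak host RAM stays well below the full footprint; 64G per core
# (with --cpus-per-task=1) was evidently enough, where 190G was over-provisioned.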
12 changes: 9 additions & 3 deletions mistralPromptingZeroShot.py
@@ -2,10 +2,13 @@
 from transformers import AutoModelForCausalLM, AutoTokenizer

 model_id = "/scratch/gpfs/ca2992/Mixtral-8x7B-v0.1"
-model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float16, attn_implementation="flash_attention_2", device_map="auto")
+model = AutoModelForCausalLM.from_pretrained(model_id,
+                                             torch_dtype=torch.float16,
+                                             attn_implementation="flash_attention_2",
+                                             device_map="auto")
 tokenizer = AutoTokenizer.from_pretrained(model_id)

-prefix = "Answer this prompt as a bilingual English/Spanish Miami speaker. "
+prefix = "Answer this prompt as a bilingual English/Spanish Miami speaker who code-switches:"
 prompt = "Escribeme un cuento que tiene palabras mezcladas between English and Spanish."

 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
@@ -15,7 +18,10 @@

 model_inputs = tokenizer([prefix + prompt], return_tensors="pt").to(device)

-generated_ids = model.generate(**model_inputs, max_new_tokens=512, do_sample=True)
+generated_ids = model.generate(**model_inputs,
+                               max_new_tokens=200,
+                               temperature=0.7,
+                               do_sample=True)


 with open("outputZero.txt", "a") as f:
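On the model-loading change: the commit message notes that flash attention worked well in the last run. In transformers, attn_implementation="flash_attention_2" requires the separate flash-attn package and fp16/bf16 weights. A minimal sketch of a guarded load; the fallback to the built-in "sdpa" implementation is an assumption about desired behavior, not something this commit does:

import torch
from transformers import AutoModelForCausalLM

model_id = "/scratch/gpfs/ca2992/Mixtral-8x7B-v0.1"

# Use FlashAttention-2 when the flash-attn package is importable; otherwise
# fall back to PyTorch's built-in scaled-dot-product-attention kernels.
try:
    import flash_attn  # noqa: F401  (imported only to probe availability)
    attn_impl = "flash_attention_2"
except ImportError:
    attn_impl = "sdpa"

model = AutoModelForCausalLM.from_pretrained(
    model_id,
    torch_dtype=torch.float16,
    attn_implementation=attn_impl,
    device_map="auto",
)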
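On the generation change: setting do_sample=True with temperature=0.7 rescales the logits before sampling. Dividing logits by a temperature below 1 sharpens the distribution toward the most likely tokens; above 1 flattens it toward uniform. A self-contained illustration with toy logits (not values from the model):

import torch

logits = torch.tensor([2.0, 1.0, 0.0])  # toy next-token scores

for temp in (1.0, 0.7):
    probs = torch.softmax(logits / temp, dim=-1)
    print(temp, [round(p, 3) for p in probs.tolist()])

# 1.0 [0.665, 0.245, 0.09]
# 0.7 [0.771, 0.185, 0.044]  <- lower temperature concentrates probability mass

The reduction of max_new_tokens from 512 to 200 only caps the length of the continuation; it does not affect how tokens are sampled.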
