
Test Llama, rebalancing, throughput eval, and all CLI scripts #452

Merged — 32 commits, Aug 8, 2023

Commits (32):
All 32 commits authored by borzunov on Aug 8, 2023:

69abacc — Show argparse defaults, fix docstring
ca2850e — Test petals.cli.run_dht
816401e — Increase mean_block_selection_delay
7330653 — Test rebalancing
a00e79d — Add help to benchmark argparse
5b3d4c4 — Use less RAM
2b765b9 — Don't set default model in benchmarks
fae58d9 — Fix sleep time
856f53f — Test --throughput eval
05dc383 — Fix flapping test
18e5b00 — Use AutoDistributed{Config,Model} in tests
168e478 — Add Maykeye/TinyLLama-v0 to tests
5760b15 — Test using includes only
015238a — Adjust --num_blocks and --block_indices for 8-layer TinyLlama-v0
17cae64 — Refactor matrix
b7b7464 — Fix commands
c907990 — Skip TP tests for llama
0040539 — Fix test_greedy_generation() for llama
a5a95c4 — Fix commands
c3e7638 — Fix test_server_info()
b622a14 — Fix server layout
8a379aa — Try reducing RAM usage
ecd7d3f — Check if benchmarks work
6ffbc28 — Watch free RAM (common issue in CI)
033a3ca — Reduce RAM further
f06cebd — Tune constants to save RAM
47d2d53 — Speed benchmark tests
d8e08e6 — Fix flapping test
315c5c6 — Try --no_relay
5cbb33b — Increase swap space
54cd213 — Fix flapping test
1e34dfd — Fix flapping test
Fix test_greedy_generation() for llama
borzunov committed Aug 8, 2023
commit 0040539202ce2f3a41301ea5983341ae8100e511
3 changes: 3 additions & 0 deletions tests/test_full_model.py
@@ -100,9 +100,12 @@ def test_greedy_generation(tokenizer, max_new_tokens=4):
    hf_outputs = HfGenerationMixin.greedy_search(model, input_ids=inputs, max_length=inputs.size(1) + max_new_tokens)
    assert torch.allclose(remote_outputs, hf_outputs), "Greedy search results are not identical to HF"

    if tokenizer.pad_token_id is None:
        tokenizer.pad_token_id = tokenizer.eos_token_id
    inputs_batch = tokenizer(["A cat sat on a mat", "A dog sat on a mat"], return_tensors="pt", padding=True)[
        "input_ids"
    ]

    remote_outputs_batch = model.generate(
        inputs_batch,
        max_new_tokens=max_new_tokens,
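The added lines handle a quirk of Llama-family tokenizers: they often ship without a pad token, so batched encoding with padding=True fails unless one is set, and the common fix is to fall back to the EOS token. A minimal sketch of that pattern in isolation (StubTokenizer and ensure_pad_token are hypothetical stand-ins for illustration, not Petals or transformers APIs):

```python
class StubTokenizer:
    """Hypothetical stand-in mimicking a Llama-style tokenizer with no pad token."""

    def __init__(self):
        self.eos_token_id = 2   # typical EOS id for Llama tokenizers
        self.pad_token_id = None  # often unset, which breaks padded batching


def ensure_pad_token(tokenizer):
    # Padded batch generation needs a pad token id; reuse EOS when none is set,
    # mirroring the fallback added in test_greedy_generation().
    if tokenizer.pad_token_id is None:
        tokenizer.pad_token_id = tokenizer.eos_token_id
    return tokenizer


tok = ensure_pad_token(StubTokenizer())
print(tok.pad_token_id)  # falls back to the EOS id, 2
```

Reusing EOS as the pad token is safe for greedy decoding tests because padded positions are masked out of attention, so the choice of filler id does not affect the generated tokens.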
Loading