Use text config's vocab size in testing models (#30568)
use text config's vocab size
zucchini-nlp authored and Ita Zaporozhets committed May 14, 2024
1 parent a4e43b2 commit e2e4dad
Showing 4 changed files with 42 additions and 509 deletions.
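The deleted methods below were per-model copies of the shared ModelTesterMixin tests with `config.vocab_size` substituted by `config.text_config.vocab_size` (see the "Copied from" comments). Removing them implies the shared tests now resolve the vocab size from the nested text config themselves. A minimal sketch of such a lookup, assuming a hypothetical `get_vocab_size` helper and stand-in config classes; none of these names are taken from the commit:

def get_vocab_size(config):
    """Return the vocab size, preferring a nested text config when present."""
    text_config = getattr(config, "text_config", None)
    if text_config is not None:
        return text_config.vocab_size
    return config.vocab_size


# Stand-in configs, only to make the sketch self-contained and runnable.
class _TextConfig:
    vocab_size = 99


class _CompositeConfig:
    text_config = _TextConfig()


class _PlainConfig:
    vocab_size = 32


assert get_vocab_size(_CompositeConfig()) == 99  # composite (vision-language) config
assert get_vocab_size(_PlainConfig()) == 32      # ordinary text-only config

With a fallback of this kind in the shared tests, a multimodal model such as Llava no longer needs its own copies of test_resize_tokens_embeddings, test_resize_embeddings_untied, and test_tie_model_weights.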
166 changes: 0 additions & 166 deletions tests/models/llava/test_modeling_llava.py
@@ -14,7 +14,6 @@
# limitations under the License.
"""Testing suite for the PyTorch Llava model."""

import copy
import gc
import unittest

@@ -192,171 +191,6 @@ def test_training_gradient_checkpointing_use_reentrant(self):
def test_training_gradient_checkpointing_use_reentrant_false(self):
pass

# Copied from tests.test_modeling_common.ModelTesterMixin.test_resize_tokens_embeddings with config.vocab_size->config.text_config.vocab_size
def test_resize_tokens_embeddings(self):
(
original_config,
inputs_dict,
) = self.model_tester.prepare_config_and_inputs_for_common()
if not self.test_resize_embeddings:
return

for model_class in self.all_model_classes:
config = copy.deepcopy(original_config)
model = model_class(config)
model.to(torch_device)

if self.model_tester.is_training is False:
model.eval()

model_vocab_size = config.text_config.vocab_size
# Retrieve the embeddings and clone them
model_embed = model.resize_token_embeddings(model_vocab_size)
cloned_embeddings = model_embed.weight.clone()

# Check that resizing the token embeddings with a larger vocab size increases the model's vocab size
model_embed = model.resize_token_embeddings(model_vocab_size + 10)
self.assertEqual(model.config.text_config.vocab_size, model_vocab_size + 10)
# Check that it actually resizes the embeddings matrix
self.assertEqual(model_embed.weight.shape[0], cloned_embeddings.shape[0] + 10)
# Check that the model can still do a forward pass successfully (every parameter should be resized)
model(**self._prepare_for_class(inputs_dict, model_class))

# Check that resizing the token embeddings with a smaller vocab size decreases the model's vocab size
model_embed = model.resize_token_embeddings(model_vocab_size - 15)
self.assertEqual(model.config.text_config.vocab_size, model_vocab_size - 15)
# Check that it actually resizes the embeddings matrix
self.assertEqual(model_embed.weight.shape[0], cloned_embeddings.shape[0] - 15)

# Check that the model can still do a forward pass successfully (every parameter should be resized)
# Input ids should be clamped to the maximum size of the vocabulary
inputs_dict["input_ids"].clamp_(max=model_vocab_size - 15 - 1)

# make sure that decoder_input_ids are resized as well
if "decoder_input_ids" in inputs_dict:
inputs_dict["decoder_input_ids"].clamp_(max=model_vocab_size - 15 - 1)
model(**self._prepare_for_class(inputs_dict, model_class))

# Check that adding and removing tokens has not modified the first part of the embedding matrix.
models_equal = True
for p1, p2 in zip(cloned_embeddings, model_embed.weight):
if p1.data.ne(p2.data).sum() > 0:
models_equal = False

self.assertTrue(models_equal)

config = copy.deepcopy(original_config)
model = model_class(config)
model.to(torch_device)

model_vocab_size = config.text_config.vocab_size
model.resize_token_embeddings(model_vocab_size + 10, pad_to_multiple_of=1)
self.assertTrue(model.config.text_config.vocab_size + 10, model_vocab_size)

model_embed = model.resize_token_embeddings(model_vocab_size, pad_to_multiple_of=64)
self.assertTrue(model_embed.weight.shape[0] // 64, 0)

self.assertTrue(model_embed.weight.shape[0], model.config.text_config.vocab_size)
self.assertTrue(model.config.text_config.vocab_size, model.vocab_size)

model_embed = model.resize_token_embeddings(model_vocab_size + 13, pad_to_multiple_of=64)
self.assertTrue(model_embed.weight.shape[0] // 64, 0)

# Check that resizing a model to a multiple of pad_to_multiple leads to a model of exactly that size
target_dimension = 128
model_embed = model.resize_token_embeddings(target_dimension, pad_to_multiple_of=64)
self.assertTrue(model_embed.weight.shape[0], target_dimension)

with self.assertRaisesRegex(
ValueError,
"Asking to pad the embedding matrix to a multiple of `1.3`, which is not and integer. Please make sure to pass an integer",
):
model.resize_token_embeddings(model_vocab_size, pad_to_multiple_of=1.3)

# Copied from tests.test_modeling_common.ModelTesterMixin.test_resize_embeddings_untied with config.vocab_size->config.text_config.vocab_size
def test_resize_embeddings_untied(self):
(
original_config,
inputs_dict,
) = self.model_tester.prepare_config_and_inputs_for_common()
if not self.test_resize_embeddings:
return

original_config.tie_word_embeddings = False

# if model cannot untie embeddings -> leave test
if original_config.tie_word_embeddings:
return

for model_class in self.all_model_classes:
config = copy.deepcopy(original_config)
model = model_class(config).to(torch_device)

# if no output embeddings -> leave test
if model.get_output_embeddings() is None:
continue

# Check that resizing the token embeddings with a larger vocab size increases the model's vocab size
model_vocab_size = config.text_config.vocab_size
model.resize_token_embeddings(model_vocab_size + 10)
self.assertEqual(model.config.text_config.vocab_size, model_vocab_size + 10)
output_embeds = model.get_output_embeddings()
self.assertEqual(output_embeds.weight.shape[0], model_vocab_size + 10)
# Check bias if present
if output_embeds.bias is not None:
self.assertEqual(output_embeds.bias.shape[0], model_vocab_size + 10)
# Check that the model can still do a forward pass successfully (every parameter should be resized)
model(**self._prepare_for_class(inputs_dict, model_class))

# Check that resizing the token embeddings with a smaller vocab size decreases the model's vocab size
model.resize_token_embeddings(model_vocab_size - 15)
self.assertEqual(model.config.text_config.vocab_size, model_vocab_size - 15)
# Check that it actually resizes the embeddings matrix
output_embeds = model.get_output_embeddings()
self.assertEqual(output_embeds.weight.shape[0], model_vocab_size - 15)
# Check bias if present
if output_embeds.bias is not None:
self.assertEqual(output_embeds.bias.shape[0], model_vocab_size - 15)
# Check that the model can still do a forward pass successfully (every parameter should be resized)
# Input ids should be clamped to the maximum size of the vocabulary
inputs_dict["input_ids"].clamp_(max=model_vocab_size - 15 - 1)
if "decoder_input_ids" in inputs_dict:
inputs_dict["decoder_input_ids"].clamp_(max=model_vocab_size - 15 - 1)
# Check that the model can still do a forward pass successfully (every parameter should be resized)
model(**self._prepare_for_class(inputs_dict, model_class))

# Copied from tests.test_modeling_common.ModelTesterMixin.test_tie_model_weights with config.vocab_size->config.text_config.vocab_size
def test_tie_model_weights(self):
if not self.test_torchscript:
return

config, inputs_dict = self.model_tester.prepare_config_and_inputs_for_common()

def check_same_values(layer_1, layer_2):
equal = True
for p1, p2 in zip(layer_1.weight, layer_2.weight):
if p1.data.ne(p2.data).sum() > 0:
equal = False
return equal

for model_class in self.all_model_classes:
config.torchscript = True
model_not_tied = model_class(config)
if model_not_tied.get_output_embeddings() is None:
continue

config_tied = copy.deepcopy(config)
config_tied.torchscript = False
model_tied = model_class(config_tied)
params_tied = list(model_tied.parameters())
# Check that the embedding layer and decoding layer are the same in size and in value
# self.assertTrue(check_same_values(embeddings, decoding))

# Check that after resize they remain tied.
model_tied.resize_token_embeddings(config.text_config.vocab_size + 10)
params_tied_2 = list(model_tied.parameters())
self.assertEqual(len(params_tied_2), len(params_tied))


@require_torch
class LlavaForConditionalGenerationIntegrationTest(unittest.TestCase):
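The behavior these overrides exercised, resizing the token embeddings and expecting the nested text config's vocab size to track the new embedding matrix, can be sketched as follows. The tiny config values are illustrative and not taken from the commit:

from transformers import CLIPVisionConfig, LlamaConfig, LlavaConfig, LlavaForConditionalGeneration

# Tiny illustrative configs so the model builds quickly; the values are arbitrary.
text_config = LlamaConfig(
    vocab_size=99, hidden_size=32, intermediate_size=64,
    num_hidden_layers=2, num_attention_heads=4, num_key_value_heads=4,
)
vision_config = CLIPVisionConfig(
    hidden_size=32, intermediate_size=64, num_hidden_layers=2,
    num_attention_heads=4, image_size=30, patch_size=6,
)
config = LlavaConfig(vision_config=vision_config, text_config=text_config)
model = LlavaForConditionalGeneration(config)

old_size = config.text_config.vocab_size
embeddings = model.resize_token_embeddings(old_size + 10)

# Resizing should grow the embedding matrix and keep text_config.vocab_size in sync.
assert embeddings.weight.shape[0] == old_size + 10
assert model.config.text_config.vocab_size == old_size + 10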
166 changes: 0 additions & 166 deletions tests/models/llava_next/test_modeling_llava_next.py
@@ -14,7 +14,6 @@
# limitations under the License.
""" Testing suite for the PyTorch Llava-NeXT model. """

import copy
import gc
import unittest

@@ -215,171 +214,6 @@ def test_feed_forward_chunking(self):
def test_cpu_offload(self):
pass

# Copied from tests.test_modeling_common.ModelTesterMixin.test_resize_tokens_embeddings with config.vocab_size->config.text_config.vocab_size
def test_resize_tokens_embeddings(self):
(
original_config,
inputs_dict,
) = self.model_tester.prepare_config_and_inputs_for_common()
if not self.test_resize_embeddings:
return

for model_class in self.all_model_classes:
config = copy.deepcopy(original_config)
model = model_class(config)
model.to(torch_device)

if self.model_tester.is_training is False:
model.eval()

model_vocab_size = config.text_config.vocab_size
# Retrieve the embeddings and clone them
model_embed = model.resize_token_embeddings(model_vocab_size)
cloned_embeddings = model_embed.weight.clone()

# Check that resizing the token embeddings with a larger vocab size increases the model's vocab size
model_embed = model.resize_token_embeddings(model_vocab_size + 10)
self.assertEqual(model.config.text_config.vocab_size, model_vocab_size + 10)
# Check that it actually resizes the embeddings matrix
self.assertEqual(model_embed.weight.shape[0], cloned_embeddings.shape[0] + 10)
# Check that the model can still do a forward pass successfully (every parameter should be resized)
model(**self._prepare_for_class(inputs_dict, model_class))

# Check that resizing the token embeddings with a smaller vocab size decreases the model's vocab size
model_embed = model.resize_token_embeddings(model_vocab_size - 15)
self.assertEqual(model.config.text_config.vocab_size, model_vocab_size - 15)
# Check that it actually resizes the embeddings matrix
self.assertEqual(model_embed.weight.shape[0], cloned_embeddings.shape[0] - 15)

# Check that the model can still do a forward pass successfully (every parameter should be resized)
# Input ids should be clamped to the maximum size of the vocabulary
inputs_dict["input_ids"].clamp_(max=model_vocab_size - 15 - 1)

# make sure that decoder_input_ids are resized as well
if "decoder_input_ids" in inputs_dict:
inputs_dict["decoder_input_ids"].clamp_(max=model_vocab_size - 15 - 1)
model(**self._prepare_for_class(inputs_dict, model_class))

# Check that adding and removing tokens has not modified the first part of the embedding matrix.
models_equal = True
for p1, p2 in zip(cloned_embeddings, model_embed.weight):
if p1.data.ne(p2.data).sum() > 0:
models_equal = False

self.assertTrue(models_equal)

config = copy.deepcopy(original_config)
model = model_class(config)
model.to(torch_device)

model_vocab_size = config.text_config.vocab_size
model.resize_token_embeddings(model_vocab_size + 10, pad_to_multiple_of=1)
self.assertTrue(model.config.text_config.vocab_size + 10, model_vocab_size)

model_embed = model.resize_token_embeddings(model_vocab_size, pad_to_multiple_of=64)
self.assertTrue(model_embed.weight.shape[0] // 64, 0)

self.assertTrue(model_embed.weight.shape[0], model.config.text_config.vocab_size)
self.assertTrue(model.config.text_config.vocab_size, model.vocab_size)

model_embed = model.resize_token_embeddings(model_vocab_size + 13, pad_to_multiple_of=64)
self.assertTrue(model_embed.weight.shape[0] // 64, 0)

# Check that resizing a model to a multiple of pad_to_multiple leads to a model of exactly that size
target_dimension = 128
model_embed = model.resize_token_embeddings(target_dimension, pad_to_multiple_of=64)
self.assertTrue(model_embed.weight.shape[0], target_dimension)

with self.assertRaisesRegex(
ValueError,
"Asking to pad the embedding matrix to a multiple of `1.3`, which is not and integer. Please make sure to pass an integer",
):
model.resize_token_embeddings(model_vocab_size, pad_to_multiple_of=1.3)

# Copied from tests.test_modeling_common.ModelTesterMixin.test_resize_embeddings_untied with config.vocab_size->config.text_config.vocab_size
def test_resize_embeddings_untied(self):
(
original_config,
inputs_dict,
) = self.model_tester.prepare_config_and_inputs_for_common()
if not self.test_resize_embeddings:
return

original_config.tie_word_embeddings = False

# if model cannot untie embeddings -> leave test
if original_config.tie_word_embeddings:
return

for model_class in self.all_model_classes:
config = copy.deepcopy(original_config)
model = model_class(config).to(torch_device)

# if no output embeddings -> leave test
if model.get_output_embeddings() is None:
continue

# Check that resizing the token embeddings with a larger vocab size increases the model's vocab size
model_vocab_size = config.text_config.vocab_size
model.resize_token_embeddings(model_vocab_size + 10)
self.assertEqual(model.config.text_config.vocab_size, model_vocab_size + 10)
output_embeds = model.get_output_embeddings()
self.assertEqual(output_embeds.weight.shape[0], model_vocab_size + 10)
# Check bias if present
if output_embeds.bias is not None:
self.assertEqual(output_embeds.bias.shape[0], model_vocab_size + 10)
# Check that the model can still do a forward pass successfully (every parameter should be resized)
model(**self._prepare_for_class(inputs_dict, model_class))

# Check that resizing the token embeddings with a smaller vocab size decreases the model's vocab size
model.resize_token_embeddings(model_vocab_size - 15)
self.assertEqual(model.config.text_config.vocab_size, model_vocab_size - 15)
# Check that it actually resizes the embeddings matrix
output_embeds = model.get_output_embeddings()
self.assertEqual(output_embeds.weight.shape[0], model_vocab_size - 15)
# Check bias if present
if output_embeds.bias is not None:
self.assertEqual(output_embeds.bias.shape[0], model_vocab_size - 15)
# Check that the model can still do a forward pass successfully (every parameter should be resized)
# Input ids should be clamped to the maximum size of the vocabulary
inputs_dict["input_ids"].clamp_(max=model_vocab_size - 15 - 1)
if "decoder_input_ids" in inputs_dict:
inputs_dict["decoder_input_ids"].clamp_(max=model_vocab_size - 15 - 1)
# Check that the model can still do a forward pass successfully (every parameter should be resized)
model(**self._prepare_for_class(inputs_dict, model_class))

# Copied from tests.test_modeling_common.ModelTesterMixin.test_tie_model_weights with config.vocab_size->config.text_config.vocab_size
def test_tie_model_weights(self):
if not self.test_torchscript:
return

config, inputs_dict = self.model_tester.prepare_config_and_inputs_for_common()

def check_same_values(layer_1, layer_2):
equal = True
for p1, p2 in zip(layer_1.weight, layer_2.weight):
if p1.data.ne(p2.data).sum() > 0:
equal = False
return equal

for model_class in self.all_model_classes:
config.torchscript = True
model_not_tied = model_class(config)
if model_not_tied.get_output_embeddings() is None:
continue

config_tied = copy.deepcopy(config)
config_tied.torchscript = False
model_tied = model_class(config_tied)
params_tied = list(model_tied.parameters())
# Check that the embedding layer and decoding layer are the same in size and in value
# self.assertTrue(check_same_values(embeddings, decoding))

# Check that after resize they remain tied.
model_tied.resize_token_embeddings(config.text_config.vocab_size + 10)
params_tied_2 = list(model_tied.parameters())
self.assertEqual(len(params_tied_2), len(params_tied))


@require_torch
class LlavaNextForConditionalGenerationIntegrationTest(unittest.TestCase):
