# Decoder-only models
# Schema per entry (presumably consumed to hook attention internals — confirm against loader):
#   self_attention_module: attribute name of the self-attention submodule on each layer
#   value_vector: name of the value tensor variable inside that attention module
BioGptForCausalLM:
  self_attention_module: "self_attn"
  value_vector: "value_states"
BloomForCausalLM:
  self_attention_module: "self_attention"
  value_vector: "value_layer"
CodeGenForCausalLM:
  self_attention_module: "attn"
  value_vector: "value"
FalconForCausalLM:
  self_attention_module: "self_attention"
  value_vector: "value_layer"
GemmaForCausalLM:
  self_attention_module: "self_attn"
  value_vector: "value_states"
GPTBigCodeForCausalLM:
  self_attention_module: "attn"
  value_vector: "value"
GPTJForCausalLM:
  self_attention_module: "attn"
  value_vector: "value"
GPT2LMHeadModel:
  self_attention_module: "attn"
  value_vector: "value"
GPTNeoForCausalLM:
  self_attention_module: "attn"
  value_vector: "value"
GPTNeoXForCausalLM:
  # NOTE(review): this entry's self_attention_module / value_vector lines fall inside the
  # hidden diff hunk boundary (@@ -14,40 +32,80 @@) and are not visible here — restore them
  # from the full file rather than guessing.
LlamaForCausalLM:
  self_attention_module: "self_attn"
  value_vector: "value_states"
MistralForCausalLM:
  self_attention_module: "self_attn"
  value_vector: "value_states"
MixtralForCausalLM:
  self_attention_module: "self_attn"
  value_vector: "value_states"
MptForCausalLM:
  self_attention_module: "attn"
  value_vector: "value_states"
OpenAIGPTLMHeadModel:
  self_attention_module: "attn"
  value_vector: "value"
OPTForCausalLM:
  self_attention_module: "self_attn"
  value_vector: "value_states"
PhiForCausalLM:
  self_attention_module: "self_attn"
  value_vector: "value_states"
Qwen2ForCausalLM:
  self_attention_module: "self_attn"
  value_vector: "value_states"
StableLmForCausalLM:
  self_attention_module: "self_attn"
  value_vector: "value_states"
XGLMForCausalLM:
  self_attention_module: "self_attn"
  value_vector: "value_states"

# Encoder-decoder models
# Same schema as the decoder-only section, plus:
#   cross_attention_module: attribute name of the encoder-decoder (cross) attention submodule
BartForConditionalGeneration:
  self_attention_module: "self_attn"
  cross_attention_module: "encoder_attn"
  value_vector: "value_states"
MarianMTModel:
  self_attention_module: "self_attn"
  cross_attention_module: "encoder_attn"
  value_vector: "value_states"
FSMTForConditionalGeneration:
  self_attention_module: "self_attn"
  cross_attention_module: "encoder_attn"
  value_vector: "v"
M2M100ForConditionalGeneration:
  self_attention_module: "self_attn"
  cross_attention_module: "encoder_attn"
  value_vector: "value_states"
MBartForConditionalGeneration:
  self_attention_module: "self_attn"
  cross_attention_module: "encoder_attn"
  value_vector: "value_states"
MT5ForConditionalGeneration:
  self_attention_module: "SelfAttention"
  cross_attention_module: "EncDecAttention"
  value_vector: "value_states"
NllbMoeForConditionalGeneration:
  self_attention_module: "self_attn"
  cross_attention_module: "cross_attention"
  value_vector: "value_states"
PegasusForConditionalGeneration:
  self_attention_module: "self_attn"
  cross_attention_module: "encoder_attn"
  value_vector: "value_states"
SeamlessM4TForTextToText:
  self_attention_module: "self_attn"
  cross_attention_module: "cross_attention"
  value_vector: "value"
SeamlessM4Tv2ForTextToText:
  self_attention_module: "self_attn"
  cross_attention_module: "cross_attention"
  value_vector: "value"
T5ForConditionalGeneration:
  self_attention_module: "SelfAttention"
  cross_attention_module: "EncDecAttention"
  value_vector: "value_states"
UMT5ForConditionalGeneration:
  self_attention_module: "SelfAttention"
  cross_attention_module: "EncDecAttention"
  value_vector: "value_states"