Spaces:

MrVicente
/

RA-BART

Runtime error

App Files Files Community

MrVicente committed on Sep 14, 2022

Commit

4ae80b2

•

1 Parent(s): d74add2

added attention visualization and qa model

Browse files

Files changed (3) hide show

app.py +31 -8
attention_viz.py +227 -0
custom_bart/bart_attention.py +1 -1

app.py CHANGED Viewed

@@ -2,7 +2,8 @@ import gradio as gr
 import matplotlib.pyplot as plt
 from inference import RelationsInference
-from utils import KGType,Model_Type
 #prep
 import nltk
@@ -16,28 +17,50 @@ examples = [["What's the meaning of life?", "eli5", "constraint"],
             ["boat, water, bird", "commongen", "constraint"],
             ["What flows under a bridge?", "commonsense_qa", "constraint"]]
-bart = RelationsInference(
     model_path='MrVicente/commonsense_bart_commongen',
     kg_type=KGType.CONCEPTNET,
     model_type=Model_Type.RELATIONS,
     max_length=32
 )
 #############################
 #   Helper
 #############################
 def infer_bart(context, task_type, decoding_type_str):
-    response, encoder_attentions, model_input = bart.generate_based_on_context(context, use_kg=False)
     return response[0]
-def plot_attention(layer, head):
     fig = plt.figure()
-    plt.plot([1, 2, 3], [2, 4, 6])
-    plt.title("Things")
-    plt.ylabel("Cases")
-    plt.xlabel("Days since Day 0")
     return fig

 import matplotlib.pyplot as plt
 from inference import RelationsInference
+from attention_viz import AttentionVisualizer
+from utils import KGType, Model_Type, Data_Type
 #prep
 import nltk
             ["boat, water, bird", "commongen", "constraint"],
             ["What flows under a bridge?", "commonsense_qa", "constraint"]]
 # Model used for the CommonGen task (see infer_bart / plot_attention below).
 # max_length=32 is passed straight to RelationsInference; presumably the
 # generation length cap -- TODO confirm against inference.py.
+commongen_bart = RelationsInference(
     model_path='MrVicente/commonsense_bart_commongen',
     kg_type=KGType.CONCEPTNET,
     model_type=Model_Type.RELATIONS,
     max_length=32
 )
 # Model used for the ELI5 task; same knowledge-graph and model-type settings
 # as above, but built with max_length=128.
+qa_bart = RelationsInference(
+    model_path='MrVicente/commonsense_bart_absqa',
+    kg_type=KGType.CONCEPTNET,
+    model_type=Model_Type.RELATIONS,
+    max_length=128
+)
 # Shared plotting helper, constructed with device='cpu'.
+att_viz = AttentionVisualizer(device='cpu')
 #############################
 #   Helper
 #############################
 def infer_bart(context, task_type, decoding_type_str):
+    if Data_Type(task_type) == Data_Type.COMMONGEN:
+        if decoding_type_str =='default':
+            response, _, _ = commongen_bart.generate_based_on_context(context, use_kg=False)
+        else:
+            response, _, _ = commongen_bart.generate_contrained_based_on_context([context], use_kg=True)
+    elif Data_Type(task_type) == Data_Type.ELI5:
+        response, _, _ = qa_bart.generate_based_on_context(context, use_kg=False)
+    else:
+        raise NotImplementedError()
     return response[0]
+def plot_attention(context, task_type, layer, head):
     fig = plt.figure()
+    if Data_Type(task_type) == Data_Type.COMMONGEN:
+        model = commongen_bart
+    elif Data_Type(task_type) == Data_Type.ELI5:
+        model = qa_bart
+    else:
+        raise NotImplementedError()
+    response, examples, relations = model.prepare_context_for_visualization(context)
+    att_viz.plot_attn_lines_concepts_ids('Input text importance visualized',
+                                 examples,
+                                 layer, head,
+                                 relations)
     return fig

attention_viz.py ADDED Viewed

	@@ -0,0 +1,227 @@

+#############################
+#   Imports
+#############################
+# Python modules
+# Remote modules
+import matplotlib.pyplot as plt
+import numpy as np
+import torch
+# Local modules
+#############################
+#   Constants
+#############################
+class AttentionVisualizer:
+    def __init__(self, device):
+        self.device = device
+    def visualize_token2token_scores(self, all_tokens,
+                                     scores_mat,
+                                     useful_indeces,
+                                     x_label_name='Head',
+                                     apply_normalization=True):
+        fig = plt.figure(figsize=(20, 20))
+        all_tokens = np.array(all_tokens)[useful_indeces]
+        for idx, scores in enumerate(scores_mat):
+            if apply_normalization:
+                scores = torch.from_numpy(scores)
+                shape = scores.shape
+                scores = scores.reshape((shape[0],shape[1], 1))
+                scores = torch.linalg.norm(scores, dim=2)
+            scores_np = np.array(scores)
+            scores_np = scores_np[useful_indeces, :]
+            scores_np = scores_np[:, useful_indeces]
+            ax = fig.add_subplot(4, 4, idx + 1)
+            # append the attention weights
+            im = ax.imshow(scores_np, cmap='viridis')
+            fontdict = {'fontsize': 10}
+            ax.set_xticks(range(len(all_tokens)))
+            ax.set_yticks(range(len(all_tokens)))
+            ax.set_xticklabels(all_tokens, fontdict=fontdict, rotation=90)
+            ax.set_yticklabels(all_tokens, fontdict=fontdict)
+            ax.set_xlabel('{} {}'.format(x_label_name, idx + 1))
+            fig.colorbar(im, fraction=0.046, pad=0.04)
+        plt.tight_layout()
+        plt.show()
+    def visualize_matrix(self,
+                         scores_mat,
+                         label_name='heads_layers'):
+        _fig = plt.figure(figsize=(20, 20))
+        scores_np = np.array(scores_mat)
+        fig, ax = plt.subplots()
+        im = ax.imshow(scores_np, cmap='viridis')
+        fontdict = {'fontsize': 10}
+        ax.set_xticks(range(len(scores_mat[0])))
+        ax.set_yticks(range(len(scores_mat)))
+        x_labels = [f'head-{i}' for i in range(1, len(scores_mat[0])+1)]
+        y_labels = [f'layer-{i}' for i in range(1, len(scores_mat) + 1)]
+        ax.set_xticklabels(x_labels, fontdict=fontdict, rotation=90)
+        ax.set_yticklabels(y_labels, fontdict=fontdict)
+        ax.set_xlabel('{}'.format(label_name))
+        fig.colorbar(im, fraction=0.046, pad=0.04)
+        plt.tight_layout()
+        #plt.show()
+        plt.savefig(f'figs/{label_name}.png', dpi=fig.dpi)
+    def visualize_token2head_scores(self, all_tokens, scores_mat):
+        fig = plt.figure(figsize=(30, 50))
+        for idx, scores in enumerate(scores_mat):
+            scores_np = np.array(scores)
+            ax = fig.add_subplot(6, 3, idx + 1)
+            # append the attention weights
+            im = ax.matshow(scores_np, cmap='viridis')
+            fontdict = {'fontsize': 20}
+            ax.set_xticks(range(len(all_tokens)))
+            ax.set_yticks(range(len(scores)))
+            ax.set_xticklabels(all_tokens, fontdict=fontdict, rotation=90)
+            ax.set_yticklabels(range(len(scores[0])), fontdict=fontdict)
+            ax.set_xlabel('Layer {}'.format(idx + 1))
+            fig.colorbar(im, fraction=0.046, pad=0.04)
+        plt.tight_layout()
+        plt.show()
+    def plot_attn_lines(self, data, heads):
+        """Plots attention maps for the given example and attention heads."""
+        width = 3
+        example_sep = 3
+        word_height = 1
+        pad = 0.1
+        for ei, (layer, head) in enumerate(heads):
+            yoffset = 1
+            xoffset = ei * width * example_sep
+            attn = data["attns"][layer][head]
+            attn = np.array(attn)
+            attn /= attn.sum(axis=-1, keepdims=True)
+            words = data["tokens"]
+            words[0] = "..."
+            n_words = len(words)
+            for position, word in enumerate(words):
+                plt.text(xoffset + 0, yoffset - position * word_height, word,
+                         ha="right", va="center")
+                plt.text(xoffset + width, yoffset - position * word_height, word,
+                         ha="left", va="center")
+            for i in range(1, n_words):
+                for j in range(1, n_words):
+                    plt.plot([xoffset + pad, xoffset + width - pad],
+                             [yoffset - word_height * i, yoffset - word_height * j],
+                             color="blue", linewidth=1, alpha=attn[i, j])
+    def plot_attn_lines_concepts(self, title, examples, layer, head, color_words,
+                  color_from=True, width=3, example_sep=3,
+                  word_height=1, pad=0.1, hide_sep=False):
+        # examples -> {'words': tokens, 'attentions': [layer][head]}
+        plt.figure(figsize=(4, 4))
+        for i, example in enumerate(examples):
+            yoffset = 0
+            if i == 0:
+                yoffset += (len(examples[0]["words"]) -
+                            len(examples[1]["words"])) * word_height / 2
+            xoffset = i * width * example_sep
+            attn = example["attentions"][layer][head]
+            if hide_sep:
+                attn = np.array(attn)
+                attn[:, 0] = 0
+                attn[:, -1] = 0
+                attn /= attn.sum(axis=-1, keepdims=True)
+            words = example["words"]
+            n_words = len(words)
+            for position, word in enumerate(words):
+                for x, from_word in [(xoffset, True), (xoffset + width, False)]:
+                    color = "k"
+                    if from_word == color_from and word in color_words:
+                        color = "#cc0000"
+                    plt.text(x, yoffset - (position * word_height), word,
+                             ha="right" if from_word else "left", va="center",
+                             color=color)
+            for i in range(n_words):
+                for j in range(n_words):
+                    color = "b"
+                    if words[i if color_from else j] in color_words:
+                        color = "r"
+                    print(attn[i, j])
+                    plt.plot([xoffset + pad, xoffset + width - pad],
+                             [yoffset - word_height * i, yoffset - word_height * j],
+                             color=color, linewidth=1, alpha=attn[i, j])
+        plt.axis("off")
+        plt.title(title)
+        plt.show()
+    def plot_attn_lines_concepts_ids(title, examples, layer, head,
+                                     relations_total, width=3, example_sep=3,
+                                     word_height=1, pad=0.1, hide_sep=False):
+        # examples -> {'words': tokens, 'attentions': [layer][head]}
+        plt.clf()
+        plt.figure(figsize=(10, 5))
+        # print('relations_total:', relations_total)
+        # print(examples[0])
+        for idx, example in enumerate(examples):
+            yoffset = 0
+            if idx == 0:
+                yoffset += (len(examples[0]["words"]) -
+                            len(examples[0]["words"])) * word_height / 2
+            xoffset = idx * width * example_sep
+            attn = example["attentions"][layer][head]
+            if hide_sep:
+                attn = np.array(attn)
+                attn[:, 0] = 0
+                attn[:, -1] = 0
+                attn /= attn.sum(axis=-1, keepdims=True)
+            words = example["words"]
+            n_words = len(words)
+            example_rel = relations_total[idx]
+            for position, word in enumerate(words):
+                for x, from_word in [(xoffset, True), (xoffset + width, False)]:
+                    color = "k"
+                    for y_idx, y in enumerate(words):
+                        if from_word and example_rel[position, y_idx] > 0:
+                            # print('outgoing', position, y_idx)
+                            color = "r"
+                        if not from_word and example_rel[y_idx, position] > 0:
+                            # print('coming', position, y_idx)
+                            color = "g"
+                    # if from_word == color_from and word in color_words:
+                    #    color = "#cc0000"
+                    plt.text(x, yoffset - (position * word_height), word,
+                             ha="right" if from_word else "left", va="center",
+                             color=color)
+            for i in range(n_words):
+                for j in range(n_words):
+                    color = "k"
+                    # print(i,j, example_rel[i,j])
+                    if example_rel[i, j].item() > 0 and i <= j:
+                        color = "r"
+                    if example_rel[i, j].item() > 0 and i >= j:
+                        color = "g"
+                    plt.plot([xoffset + pad, xoffset + width - pad],
+                             [yoffset - word_height * i, yoffset - word_height * j],
+                             color=color, linewidth=1, alpha=attn[i, j])
+                    # color=color, linewidth=1, alpha=min(attn[i, j]*10,1))
+        plt.axis("off")
+        plt.title(title)
+        plt.show()

custom_bart/bart_attention.py CHANGED Viewed

@@ -94,7 +94,7 @@ class BartCustomAttention(nn.Module):
             # TODO
             print('oh no')
             relation_inputs = torch.zeros((bsz, tgt_len, tgt_len)).to('cuda').long()
-        print(relation_inputs.shape, ' | ', (bsz, tgt_len, tgt_len))
         assert relation_inputs.shape == (bsz, tgt_len, tgt_len)
         # (batch_size, seq_length, seq_length, self.num_relation_kinds, self.inner_dim // num_relation_kinds)

             # TODO
             print('oh no')
             relation_inputs = torch.zeros((bsz, tgt_len, tgt_len)).to('cuda').long()
+        #print(relation_inputs.shape, ' | ', (bsz, tgt_len, tgt_len))
         assert relation_inputs.shape == (bsz, tgt_len, tgt_len)
         # (batch_size, seq_length, seq_length, self.num_relation_kinds, self.inner_dim // num_relation_kinds)