Commit

Cleaned up old comments
mkranzlein committed Dec 6, 2023
1 parent 1436161 commit b45eab7
Showing 1 changed file with 6 additions and 68 deletions.
74 changes: 6 additions & 68 deletions src/hipool/models.py
@@ -7,7 +7,6 @@
 """
 
 import networkx as nx
-import transformers
 import torch
 from jaxtyping import Float, Integer, jaxtyped
 from torch import nn, Tensor
@@ -38,8 +37,12 @@ def __init__(self, chunk_len, device, linear_dim=64, hidden_dim=32, output_dim=3
 hidden_dim=32, output_dim=self.output_dim).to(device)
 
 def forward(self, chunk_bert_embeddings: dict):
-# Pooled bert output for each chunk goes through a linear layer and then
-# through HiPool
+"""Forward pass through HiPool.
+Pooled BERT output for each chunk goes through a linear layer and then
+through HiPool graph convolutional network.
+"""
 linear_layer_output: Float[Tensor, "k lin_dim"] = self.linear(chunk_bert_embeddings)
 
 num_nodes = linear_layer_output.shape[0]  # TODO: might need different index
@@ -82,68 +85,3 @@ def forward(self, ids: Integer[Tensor, "_ c"],
 else:
 output = self.linear(x)
 return output
-
-# Don't want to repeat tokenization of sentences; get sentence IDs and
-# figure out padding; take a look at BertForTokenClassification
-
-# def get_hipool_embedding(chunks):
-# hipool_embedding = None
-
-# Chunking approaches: equal number of sentences, equal number of tokens,
-# unequal number of sentences that approximates an equal number of tokens
-
-# Pad such that each sequence has the same number of chunks
-# Padding chunks c-dim vectors, where all the input ids are 0, which is
-# BERT's padding token
-# padded_ids: Integer[Tensor, "k b c"] = pad_sequence(ids)
-# padded_ids: Integer[Tensor, "b k c"] = padded_ids.permute(1, 0, 2).to(self.device)
-# padded_masks: Integer[Tensor, "k b c"] = pad_sequence(mask)
-# padded_masks: Integer[Tensor, "b k c"] = padded_masks.permute(1, 0, 2).to(self.device)
-# padded_token_type_ids: Integer[Tensor, "k b c"] = pad_sequence(token_type_ids)
-# padded_token_type_ids: Integer[Tensor, "b k c"] = padded_token_type_ids.permute(1, 0, 2).to(self.device)
-# batch_chunk_embeddings = []
-# batch_token_embeddings = []
-# for ids, mask, token_type_ids in zip(padded_ids, padded_masks, padded_token_type_ids):
-# results = self.bert(ids, attention_mask=mask, token_type_ids=token_type_ids)
-# # One 768-dim embedding for each chunk
-# pooler_output: Float[Tensor, "k 768"] = results["pooler_output"]
-# last_hidden_state: Float[Tensor, "k c 768"] = results["last_hidden_state"]
-# batch_token_embeddings.append(last_hidden_state)
-# batch_chunk_embeddings.append(pooler_output)
-
-# batch_chunk_embeddings: Float[Tensor, "b k 768"] = torch.stack(batch_chunk_embeddings, 0)
-
-# linear_layer_output: Float[Tensor, "b k lin_dim"] = self.linear(batch_chunk_embeddings)
-
-# num_nodes = linear_layer_output.shape[1]
-# graph = nx.path_graph(num_nodes)
-# adjacency_matrix = nx.adjacency_matrix(graph).todense()
-# adjacency_matrix = torch.from_numpy(adjacency_matrix).to(self.device).float()
-
-# # Pass each sequence through HiPool GCN individually then stack
-# gcn_output_batch = []
-# for node in linear_layer_output:
-# gcn_output = self.gcn(node, adjacency_matrix)
-# gcn_output_batch.append(gcn_output)
-# gcn_output_batch: Float[Tensor, "b gcn"] = torch.stack(gcn_output_batch)
-
-# batch_token_embeddings: Float[Tensor, "b k c 768"] = torch.stack(batch_token_embeddings, 0)
-
-# batch_model_output = []
-# for sequence_token_embedding, sequence_gcn_output in zip(batch_token_embeddings, gcn_output_batch):
-# sequence_outputs = []
-# sequence_gcn_output = sequence_gcn_output.unsqueeze(0)
-# repeated_sequence_gcn_output: Float[Tensor, "c gcn"] = sequence_gcn_output.repeat(self.chunk_len, 1)
-# for chunk_token_embedding in sequence_token_embedding:
-# # combined_embedding: Float[Tensor, "c 768+gcn"] = torch.cat((chunk_token_embedding,
-# # repeated_sequence_gcn_output), dim=1)
-# combined_embedding: Float[Tensor, "c 768"] = chunk_token_embedding
-# l2_output: Float[Tensor, "c num_labels"] = self.linear2(combined_embedding)
-# # l2_output = nn.functional.sigmoid(l2_output)
-# sequence_outputs.append(l2_output)
-# sequence_outputs: Float[Tensor, "k c num_labels"] = torch.stack(sequence_outputs)
-# batch_model_output.append(sequence_outputs)
-# batch_model_output = torch.stack(batch_model_output)
-# return batch_model_output
-
-# return hipool_embedding
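For context on the new docstring: pooled BERT chunk embeddings are projected through a linear layer, adjacent chunks are linked in a path graph, and the result goes through the HiPool GCN. Below is a minimal sketch of that flow, mirroring the surviving code and the removed comments; the standalone `hipool_forward` helper and the `gcn(features, adjacency)` call signature are assumptions, not the repository's exact API.

```python
# Minimal sketch of the flow described by the new docstring
# (assumed signatures, not the repository's exact code).
import networkx as nx
import torch
from torch import Tensor


def hipool_forward(chunk_bert_embeddings: Tensor, linear, gcn, device) -> Tensor:
    """chunk_bert_embeddings: (k, 768) pooled BERT output, one row per chunk."""
    # Project each 768-dim chunk embedding down to the GCN input dimension.
    linear_layer_output = linear(chunk_bert_embeddings)  # (k, lin_dim)

    # Connect adjacent chunks with a path graph and build its adjacency matrix.
    num_nodes = linear_layer_output.shape[0]
    graph = nx.path_graph(num_nodes)
    adjacency = torch.from_numpy(nx.adjacency_matrix(graph).todense()).float().to(device)

    # Hierarchical graph convolution over the chunk graph.
    return gcn(linear_layer_output, adjacency)
```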

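The removed comments also described batching by padding every document to the same number of chunks, with all-zero input IDs (BERT's padding token) filling the extra chunks. A small sketch of that idea; `pad_chunk_ids` is a hypothetical helper, not part of the repository.

```python
# Sketch of the chunk-padding idea from the removed comments; pad_chunk_ids is a
# hypothetical helper. Padding value 0 matches BERT's [PAD] token id.
import torch
from torch.nn.utils.rnn import pad_sequence


def pad_chunk_ids(ids_per_doc: list) -> torch.Tensor:
    """Each element: (num_chunks_i, chunk_len). Returns (batch, max_chunks, chunk_len)."""
    padded = pad_sequence(ids_per_doc)  # (max_chunks, batch, chunk_len), zero-padded
    return padded.permute(1, 0, 2)      # (batch, max_chunks, chunk_len)


# Example: two documents with 3 chunks and 1 chunk, each chunk 4 tokens long.
docs = [torch.randint(1, 100, (3, 4)), torch.randint(1, 100, (1, 4))]
print(pad_chunk_ids(docs).shape)  # torch.Size([2, 3, 4]); the padded chunks are all zeros
```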