Yale-LILY · niansong1996 · Nov 30, 2021 · Nov 29, 2021
diff --git a/summertime/model/__init__.py b/summertime/model/__init__.py
@@ -3,6 +3,7 @@
     MBartModel,
     LexRankModel,
     LongformerModel,
+    T5Model,
     PegasusModel,
     TextRankModel,
 )
@@ -16,6 +17,7 @@
     MBartModel,
     LexRankModel,
     LongformerModel,
+    T5Model,
     PegasusModel,
     TextRankModel,
     MultiDocJointModel,

diff --git a/summertime/model/defaults.py b/summertime/model/defaults.py
@@ -6,5 +6,5 @@ def __init__(self, device="cpu"):
         super(summarizer, self).__init__(device)
 
     def show_capability(self):
-        print("Pegasus is the default singe-document summarization model.")
+        print("Pegasus is the default single-document summarization model.")
         super(summarizer, self).show_capability()
diff --git a/summertime/model/single_doc/__init__.py b/summertime/model/single_doc/__init__.py
@@ -3,5 +3,6 @@
 from .lexrank_model import LexRankModel
 from .longformer_model import LongformerModel
 from .textrank_model import TextRankModel
+from .t5_model import T5Model
 
 from .multilingual import MBartModel
diff --git a/summertime/model/single_doc/t5_model.py b/summertime/model/single_doc/t5_model.py
@@ -0,0 +1,79 @@
+from transformers import T5Tokenizer, T5ForConditionalGeneration
+from .base_single_doc_model import SingleDocSummModel
+
+
+class T5Model(SingleDocSummModel):
+    """Abstractive single-document summarizer built on the pretrained ``t5-large`` checkpoint."""
+
+    # static variables
+    model_name = "T5"
+    is_extractive = False
+    is_neural = True
+
+    def __init__(self, device="cpu"):
+        """Load the ``t5-large`` tokenizer and model, placing the model on ``device``.
+
+        Args:
+            device: torch device string for the model, e.g. ``"cpu"`` or ``"cuda"``.
+        """
+        # NOTE(review): summarize() truncates to the tokenizer's own maximum length
+        # (no explicit max_length is passed); confirm that limit really is the 1024
+        # declared here -- T5 checkpoints are commonly configured for 512 tokens.
+        super(T5Model, self).__init__(
+            trained_domain="Web Crawl", max_input_length=1024, max_output_length=None
+        )
+
+        self.device = device
+        model_name = "t5-large"
+        self.tokenizer = T5Tokenizer.from_pretrained(model_name)
+        self.model = T5ForConditionalGeneration.from_pretrained(model_name).to(device)
+
+    def summarize(self, corpus, queries=None):
+        """Generate one summary per input document.
+
+        Args:
+            corpus: the document(s) to summarize; validated by
+                ``assert_summ_input_type`` (presumably a list of strings).
+            queries: forwarded to the input check only; not used for generation.
+
+        Returns:
+            A list of decoded summary strings, one per input document.
+        """
+        self.assert_summ_input_type(corpus, queries)
+
+        # T5 is a multi-task text-to-text model: the task is chosen by a textual
+        # prefix on the input. Without "summarize: " the model is not told to
+        # summarize at all.
+        task_prefix = "summarize: "
+        if isinstance(corpus, str):
+            prefixed = task_prefix + corpus
+        else:
+            prefixed = [task_prefix + document for document in corpus]
+
+        batch = self.tokenizer(
+            prefixed, truncation=True, padding="longest", return_tensors="pt"
+        ).to(self.device)
+        # NOTE(review): generation uses the library's default decoding settings;
+        # confirm the default output-length cap is long enough for summaries.
+        encoded_summaries = self.model.generate(**batch)
+        summaries = self.tokenizer.batch_decode(
+            encoded_summaries, skip_special_tokens=True
+        )
+
+        return summaries
+
+    @classmethod
+    def show_capability(cls) -> None:
+        """Print the generic model description followed by T5-specific details."""
+        basic_description = cls.generate_basic_description()
+        more_details = (
+            "Introduced in 2020, T5 is a large pretrained language model trained on web crawl using "
+            "transfer learning approaches and teacher forcing.\n "
+            "Strengths: \n - High accuracy \n "
+            "Weaknesses: \n - High memory usage \n "
+            "Initialization arguments: \n "
+            "- `device = 'cpu'` specifies the device the model is stored on and uses for computation. "
+            # torch has no "gpu" device type; Nvidia GPUs are addressed as "cuda".
+            "Use `device='cuda'` to run on an Nvidia GPU."
+        )
+        print(f"{basic_description} \n {'#'*20} \n {more_details}")