recommenders-team · simonzhaoms · Feb 28, 2022 · Dec 17, 2021 · Dec 17, 2021 · Jan 21, 2022
@@ -205,10 +205,13 @@ def set_index(self, df):
     def fit(self, df):
         """Main fit method for SAR.
 
+        .. note::
+
+            Please make sure that `df` has no duplicates.
+
         Args:
-            df (pandas.DataFrame): User item rating dataframe
+            df (pandas.DataFrame): User item rating dataframe (without duplicates).
         """
-
         # generate continuous indices if this hasn't been done
         if self.index2item is None:
             self.set_index(df)
@@ -226,12 +229,6 @@ def fit(self, df):
         if self.time_decay_flag:
             logger.info("Calculating time-decayed affinities")
             temp_df = self.compute_time_decay(df=temp_df, decay_column=self.col_rating)
-        else:
-            # without time decay use the latest user-item rating in the dataset as the affinity score
-            logger.info("De-duplicating the user-item counts")
-            temp_df = temp_df.drop_duplicates(
-                [self.col_user, self.col_item], keep="last"
-            )
 
         logger.info("Creating index columns")
         # add mapping of user and item ids to indices