diff --git a/src/scala/com/twitter/interaction_graph/scio/agg_negative/InteractionGraphNegativeJob.scala b/src/scala/com/twitter/interaction_graph/scio/agg_negative/InteractionGraphNegativeJob.scala index 2f173df77..ecf3c9177 100644 --- a/src/scala/com/twitter/interaction_graph/scio/agg_negative/InteractionGraphNegativeJob.scala +++ b/src/scala/com/twitter/interaction_graph/scio/agg_negative/InteractionGraphNegativeJob.scala @@ -78,6 +78,7 @@ object InteractionGraphNegativeJob extends ScioBeamJob[InteractionGraphNegativeO readSnapshot(FlockReportAsSpamEdgesScalaDataset, sc), FeatureName.NumReportAsSpams, endTs) + .filter(_.age < accountLevelShadowbanMaxTime) // we only keep unfollows in the past X days due to the huge size of this dataset, // and to prevent permanent "shadow-banning" in the event of accidental unfollows.