mirror of
https://github.com/twitter/the-algorithm.git
synced 2024-06-01 08:48:46 +02:00
39 lines
1.8 KiB
Scala
39 lines
1.8 KiB
Scala
package com.twitter.home_mixer.product.scored_tweets.filter
|
|
|
|
import com.twitter.home_mixer.model.HomeFeatures.InNetworkFeature
|
|
import com.twitter.home_mixer.model.HomeFeatures.IsRetweetFeature
|
|
import com.twitter.home_mixer.model.HomeFeatures.TweetUrlsFeature
|
|
import com.twitter.home_mixer.product.scored_tweets.param.ScoredTweetsParam.CompetitorURLSeqParam
|
|
import com.twitter.product_mixer.component_library.model.candidate.TweetCandidate
|
|
import com.twitter.product_mixer.core.functional_component.filter.Filter
|
|
import com.twitter.product_mixer.core.functional_component.filter.FilterResult
|
|
import com.twitter.product_mixer.core.model.common.CandidateWithFeatures
|
|
import com.twitter.product_mixer.core.model.common.identifier.FilterIdentifier
|
|
import com.twitter.product_mixer.core.pipeline.PipelineQuery
|
|
import com.twitter.stitch.Stitch
|
|
|
|
object OutOfNetworkCompetitorURLFilter extends Filter[PipelineQuery, TweetCandidate] {
|
|
|
|
override val identifier: FilterIdentifier = FilterIdentifier("OutOfNetworkCompetitorURL")
|
|
|
|
override def apply(
|
|
query: PipelineQuery,
|
|
candidates: Seq[CandidateWithFeatures[TweetCandidate]]
|
|
): Stitch[FilterResult[TweetCandidate]] = {
|
|
val competitorUrls = query.params(CompetitorURLSeqParam).toSet
|
|
val (removed, kept) = candidates.partition(hasOutOfNetworkUrlFromCompetitor(_, competitorUrls))
|
|
|
|
Stitch.value(FilterResult(kept = kept.map(_.candidate), removed = removed.map(_.candidate)))
|
|
}
|
|
|
|
def hasOutOfNetworkUrlFromCompetitor(
|
|
candidate: CandidateWithFeatures[TweetCandidate],
|
|
competitorUrls: Set[String]
|
|
): Boolean = {
|
|
!candidate.features.getOrElse(InNetworkFeature, true) &&
|
|
!candidate.features.getOrElse(IsRetweetFeature, false) &&
|
|
candidate.features
|
|
.getOrElse(TweetUrlsFeature, Seq.empty).toSet.intersect(competitorUrls).nonEmpty
|
|
}
|
|
}
|