mirror of
https://github.com/twitter/the-algorithm.git
synced 2024-06-01 08:48:46 +02:00
62 lines
2.7 KiB
Scala
62 lines
2.7 KiB
Scala
package com.twitter.home_mixer.product.scored_tweets.filter
|
|
|
|
import com.twitter.home_mixer.model.HomeFeatures._
|
|
import com.twitter.product_mixer.component_library.model.candidate.TweetCandidate
|
|
import com.twitter.product_mixer.core.feature.featuremap.FeatureMap
|
|
import com.twitter.product_mixer.core.functional_component.filter.Filter
|
|
import com.twitter.product_mixer.core.functional_component.filter.FilterResult
|
|
import com.twitter.product_mixer.core.model.common.CandidateWithFeatures
|
|
import com.twitter.product_mixer.core.model.common.identifier.FilterIdentifier
|
|
import com.twitter.product_mixer.core.pipeline.PipelineQuery
|
|
import com.twitter.stitch.Stitch
|
|
import com.twitter.timelineservice.suggests.{thriftscala => st}
|
|
|
|
object ScoredTweetsSocialContextFilter extends Filter[PipelineQuery, TweetCandidate] {
|
|
|
|
override val identifier: FilterIdentifier = FilterIdentifier("ScoredTweetsSocialContext")
|
|
|
|
// Tweets from candidate sources which don't need generic like/follow/topic proof
|
|
private val AllowedSources: Set[st.SuggestType] = Set(
|
|
st.SuggestType.RankedListTweet,
|
|
st.SuggestType.RecommendedTrendTweet,
|
|
st.SuggestType.MediaTweet
|
|
)
|
|
|
|
override def apply(
|
|
query: PipelineQuery,
|
|
candidates: Seq[CandidateWithFeatures[TweetCandidate]]
|
|
): Stitch[FilterResult[TweetCandidate]] = {
|
|
val validTweetIds = candidates
|
|
.filter { candidate =>
|
|
candidate.features.getOrElse(InNetworkFeature, true) ||
|
|
candidate.features.getOrElse(SuggestTypeFeature, None).exists(AllowedSources.contains) ||
|
|
candidate.features.getOrElse(InReplyToTweetIdFeature, None).isDefined ||
|
|
hasLikedBySocialContext(candidate.features) ||
|
|
hasFollowedBySocialContext(candidate.features) ||
|
|
hasTopicSocialContext(candidate.features)
|
|
}.map(_.candidate.id).toSet
|
|
|
|
val (kept, removed) =
|
|
candidates.map(_.candidate).partition(candidate => validTweetIds.contains(candidate.id))
|
|
|
|
Stitch.value(FilterResult(kept = kept, removed = removed))
|
|
}
|
|
|
|
private def hasLikedBySocialContext(candidateFeatures: FeatureMap): Boolean =
|
|
candidateFeatures
|
|
.getOrElse(SGSValidLikedByUserIdsFeature, Seq.empty)
|
|
.exists(
|
|
candidateFeatures
|
|
.getOrElse(PerspectiveFilteredLikedByUserIdsFeature, Seq.empty)
|
|
.toSet.contains
|
|
)
|
|
|
|
private def hasFollowedBySocialContext(candidateFeatures: FeatureMap): Boolean =
|
|
candidateFeatures.getOrElse(SGSValidFollowedByUserIdsFeature, Seq.empty).nonEmpty
|
|
|
|
private def hasTopicSocialContext(candidateFeatures: FeatureMap): Boolean = {
|
|
candidateFeatures.getOrElse(TopicIdSocialContextFeature, None).isDefined &&
|
|
candidateFeatures.getOrElse(TopicContextFunctionalityTypeFeature, None).isDefined
|
|
}
|
|
}
|