mirror of
https://github.com/twitter/the-algorithm.git
synced 2025-01-20 16:01:16 +01:00
Merge e1691d5f258b54548b542a36d35c4d1eff12b2e9 into fb54d8b54984f89f7dba90a18e7c3048421464c3
This commit is contained in:
commit
79da407152
@ -120,32 +120,28 @@ object UpdateKnownFor {
|
|||||||
clusterScoresToFinalScore: ClusterScoresForNode => Double,
|
clusterScoresToFinalScore: ClusterScoresForNode => Double,
|
||||||
minNeighborsInCluster: Int
|
minNeighborsInCluster: Int
|
||||||
): Option[(Int, Double)] = {
|
): Option[(Int, Double)] = {
|
||||||
val clusterToScores = statsOfClustersInNeighborhood.toList.flatMap {
|
statsOfClustersInNeighborhood
|
||||||
case (clusterId, statsInNeighborhood) =>
|
.toList
|
||||||
val clusterOverallStats = clusterOverallStatsMap(clusterId)
|
.flatMap {
|
||||||
if (statsInNeighborhood.nodeCount >= minNeighborsInCluster) {
|
case (clusterId, statsInNeighborhood) =>
|
||||||
Some(
|
val clusterOverallStats = clusterOverallStatsMap(clusterId)
|
||||||
(
|
statsInNeighborhood match {
|
||||||
clusterId,
|
case statsInNeighborhood if statsInNeighborhood.nodeCount < minNeighborsInCluster => None
|
||||||
clusterScoresToFinalScore(
|
case _ =>
|
||||||
getScoresForCluster(
|
val score = getScoresForCluster(
|
||||||
overallNeighborhoodStats,
|
overallNeighborhoodStats,
|
||||||
statsInNeighborhood,
|
statsInNeighborhood,
|
||||||
clusterOverallStats.nodeCount,
|
clusterOverallStats.nodeCount,
|
||||||
clusterOverallStats.sumOfMembershipWeights,
|
clusterOverallStats.sumOfMembershipWeights,
|
||||||
globalAvgEdgeWeight,
|
globalAvgEdgeWeight,
|
||||||
truePositiveWtFactor
|
truePositiveWtFactor
|
||||||
)
|
|
||||||
)
|
)
|
||||||
)
|
Some((clusterId, clusterScoresToFinalScore(score)))
|
||||||
)
|
}
|
||||||
} else {
|
} match {
|
||||||
None
|
case scores if scores.isEmpty => None
|
||||||
}
|
case _ => Some(clusterToScores.maxBy(_._2))
|
||||||
}
|
}
|
||||||
if (clusterToScores.nonEmpty) {
|
|
||||||
Some(clusterToScores.maxBy(_._2))
|
|
||||||
} else None
|
|
||||||
}
|
}
|
||||||
|
|
||||||
def updateGeneric(
|
def updateGeneric(
|
||||||
@ -170,35 +166,32 @@ object UpdateKnownFor {
|
|||||||
collectInformationPerNode(graph, inputUserToClusters, avgMembershipScore)
|
collectInformationPerNode(graph, inputUserToClusters, avgMembershipScore)
|
||||||
.mapValues {
|
.mapValues {
|
||||||
case NodeInformation(originalClusters, overallStats, statsOfClustersInNeighborhood) =>
|
case NodeInformation(originalClusters, overallStats, statsOfClustersInNeighborhood) =>
|
||||||
val newClusterWithScoreOpt = if (overallStats.nodeCount < minNeighborsInCluster) {
|
overallStats match {
|
||||||
nodesWithSmallDegree.inc()
|
case stats if (overallStats.nodeCount < minNeighborsInCluster) =>
|
||||||
None
|
nodesWithSmallDegree.inc()
|
||||||
} else {
|
None
|
||||||
pickBestCluster(
|
case _ =>
|
||||||
overallStats,
|
pickBestCluster(
|
||||||
statsOfClustersInNeighborhood,
|
overallStats,
|
||||||
clusterOverallStatsMap,
|
statsOfClustersInNeighborhood,
|
||||||
globalAvgWeight,
|
clusterOverallStatsMap,
|
||||||
truePositiveWtFactor,
|
globalAvgWeight,
|
||||||
clusterScoresToFinalScore,
|
truePositiveWtFactor,
|
||||||
minNeighborsInCluster
|
clusterScoresToFinalScore,
|
||||||
)
|
minNeighborsInCluster
|
||||||
}
|
)
|
||||||
newClusterWithScoreOpt match {
|
} match {
|
||||||
case Some((newClusterId, score)) =>
|
case Some((newClusterId, score)) =>
|
||||||
if (originalClusters.isEmpty) {
|
originalClusters match {
|
||||||
emptyToSomething.inc()
|
case cluster if cluster.isEmpty => emptyToSomething.inc()
|
||||||
} else if (originalClusters.contains(newClusterId)) {
|
case cluster if cluster.contains(newClusterId) => sameCluster.inc()
|
||||||
sameCluster.inc()
|
case _ => diffCluster.inc()
|
||||||
} else {
|
|
||||||
diffCluster.inc()
|
|
||||||
}
|
}
|
||||||
Array((newClusterId, score.toFloat))
|
Array((newClusterId, score.toFloat))
|
||||||
case None =>
|
case None =>
|
||||||
if (originalClusters.isEmpty) {
|
originalClusters match {
|
||||||
emptyToEmpty.inc()
|
case cluster if cluster.isEmpty => emptyToEmpty.inc()
|
||||||
} else {
|
case _ => somethingToEmpty.inc()
|
||||||
somethingToEmpty.inc()
|
|
||||||
}
|
}
|
||||||
Array.empty[(Int, Float)]
|
Array.empty[(Int, Float)]
|
||||||
}
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user