Merge e1691d5f258b54548b542a36d35c4d1eff12b2e9 into fb54d8b54984f89f7dba90a18e7c3048421464c3

This commit is contained in:
ImperiumTakp 2023-05-22 17:39:13 -05:00 committed by GitHub
commit 79da407152
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@ -120,32 +120,28 @@ object UpdateKnownFor {
clusterScoresToFinalScore: ClusterScoresForNode => Double, clusterScoresToFinalScore: ClusterScoresForNode => Double,
minNeighborsInCluster: Int minNeighborsInCluster: Int
): Option[(Int, Double)] = { ): Option[(Int, Double)] = {
val clusterToScores = statsOfClustersInNeighborhood.toList.flatMap { statsOfClustersInNeighborhood
case (clusterId, statsInNeighborhood) => .toList
val clusterOverallStats = clusterOverallStatsMap(clusterId) .flatMap {
if (statsInNeighborhood.nodeCount >= minNeighborsInCluster) { case (clusterId, statsInNeighborhood) =>
Some( val clusterOverallStats = clusterOverallStatsMap(clusterId)
( statsInNeighborhood match {
clusterId, case statsInNeighborhood if statsInNeighborhood.nodeCount < minNeighborsInCluster => None
clusterScoresToFinalScore( case _ =>
getScoresForCluster( val score = getScoresForCluster(
overallNeighborhoodStats, overallNeighborhoodStats,
statsInNeighborhood, statsInNeighborhood,
clusterOverallStats.nodeCount, clusterOverallStats.nodeCount,
clusterOverallStats.sumOfMembershipWeights, clusterOverallStats.sumOfMembershipWeights,
globalAvgEdgeWeight, globalAvgEdgeWeight,
truePositiveWtFactor truePositiveWtFactor
)
) )
) Some((clusterId, clusterScoresToFinalScore(score)))
) }
} else { } match {
None case scores if scores.isEmpty => None
} case _ => Some(clusterToScores.maxBy(_._2))
} }
if (clusterToScores.nonEmpty) {
Some(clusterToScores.maxBy(_._2))
} else None
} }
def updateGeneric( def updateGeneric(
@ -170,35 +166,32 @@ object UpdateKnownFor {
collectInformationPerNode(graph, inputUserToClusters, avgMembershipScore) collectInformationPerNode(graph, inputUserToClusters, avgMembershipScore)
.mapValues { .mapValues {
case NodeInformation(originalClusters, overallStats, statsOfClustersInNeighborhood) => case NodeInformation(originalClusters, overallStats, statsOfClustersInNeighborhood) =>
val newClusterWithScoreOpt = if (overallStats.nodeCount < minNeighborsInCluster) { overallStats match {
nodesWithSmallDegree.inc() case stats if (overallStats.nodeCount < minNeighborsInCluster) =>
None nodesWithSmallDegree.inc()
} else { None
pickBestCluster( case _ =>
overallStats, pickBestCluster(
statsOfClustersInNeighborhood, overallStats,
clusterOverallStatsMap, statsOfClustersInNeighborhood,
globalAvgWeight, clusterOverallStatsMap,
truePositiveWtFactor, globalAvgWeight,
clusterScoresToFinalScore, truePositiveWtFactor,
minNeighborsInCluster clusterScoresToFinalScore,
) minNeighborsInCluster
} )
newClusterWithScoreOpt match { } match {
case Some((newClusterId, score)) => case Some((newClusterId, score)) =>
if (originalClusters.isEmpty) { originalClusters match {
emptyToSomething.inc() case cluster if cluster.isEmpty => emptyToSomething.inc()
} else if (originalClusters.contains(newClusterId)) { case cluster if cluster.contains(newClusterId) => sameCluster.inc()
sameCluster.inc() case _ => diffCluster.inc()
} else {
diffCluster.inc()
} }
Array((newClusterId, score.toFloat)) Array((newClusterId, score.toFloat))
case None => case None =>
if (originalClusters.isEmpty) { originalClusters match {
emptyToEmpty.inc() case cluster if cluster.isEmpty => emptyToEmpty.inc()
} else { case _ => somethingToEmpty.inc()
somethingToEmpty.inc()
} }
Array.empty[(Int, Float)] Array.empty[(Int, Float)]
} }