This commit is contained in:
ImperiumTakp 2023-07-17 21:42:19 -05:00 committed by GitHub
commit b572e6b1ba
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
1 changed file with 11 additions and 11 deletions

View File

@@ -102,23 +102,23 @@ object KnownForSources {
TypedPipe
.from(TextLine(textFile))
.flatMap { str =>
if (!str.startsWith("#")) {
try {
str match {
case s"#$_" => None
case _ => try {
val tokens = str.trim.split("\\s+")
val res = Array.newBuilder[(Int, Float)]
val userId = tokens(0).toLong
for (i <- 1 until tokens.length) {
(1 until tokens.length).foldRight(Array.newBuilder[(Int, Float)])((i, r) => {
val Array(cIdStr, scoreStr) = tokens(i).split(":")
val clusterId = cIdStr.toInt
val score = scoreStr.toFloat
val newEntry = (clusterId, score)
res += newEntry
r += newEntry
}).result() match {
case (res) if res.nonEmpty => Some((userId, res.result()))
_ => None
}
val result = res.result
if (result.nonEmpty) {
Some((userId, res.result()))
} else None
} catch {
}
catch {
case ex: Throwable =>
log.warning(
s"Error while loading knownFor from $textFile for line <$str>: " +
@@ -126,7 +126,7 @@ object KnownForSources {
)
None
}
} else None
}
}
}