Compare commits

...

2 Commits

Author SHA1 Message Date
Shail Shah
d33f3821de
Merge 5ecf79363a into fb54d8b549 2023-05-22 17:38:13 -05:00
Shail Shah
5ecf79363a Simplify getDocIdSetIterator
* Rename tweetIDs to distinctTweetIDs
* Use Java Stream
2023-04-01 13:33:32 -07:00

View File

@ -3,6 +3,7 @@ package com.twitter.search.earlybird.index;
import java.io.IOException; import java.io.IOException;
import java.util.Arrays; import java.util.Arrays;
import java.util.Set; import java.util.Set;
import java.util.stream.Collectors;
import com.google.common.collect.Sets; import com.google.common.collect.Sets;
@ -20,11 +21,11 @@ import com.twitter.search.core.earlybird.index.EarlybirdIndexSegmentAtomicReader
import com.twitter.search.core.earlybird.index.EarlybirdIndexSegmentData; import com.twitter.search.core.earlybird.index.EarlybirdIndexSegmentData;
public class TweetIDQuery extends Query { public class TweetIDQuery extends Query {
private final Set<Long> tweetIDs = Sets.newHashSet(); private final Set<Long> distinctTweetIDs = Sets.newHashSet();
public TweetIDQuery(long... tweetIDs) { public TweetIDQuery(long... tweetIDs) {
for (long tweetID : tweetIDs) { for (long tweetID : tweetIDs) {
this.tweetIDs.add(tweetID); this.distinctTweetIDs.add(tweetID);
} }
} }
@ -37,32 +38,23 @@ public class TweetIDQuery extends Query {
((EarlybirdIndexSegmentAtomicReader) context.reader()).getSegmentData(); ((EarlybirdIndexSegmentAtomicReader) context.reader()).getSegmentData();
DocIDToTweetIDMapper docIdToTweetIdMapper = segmentData.getDocIDToTweetIDMapper(); DocIDToTweetIDMapper docIdToTweetIdMapper = segmentData.getDocIDToTweetIDMapper();
Set<Integer> set = Sets.newHashSet(); int[] distinctSortedDocIDs = distinctTweetIDs.stream()
for (long tweetID : tweetIDs) { .map(tweetID -> docIdToTweetIdMapper.getDocID(tweetID))
int docID = docIdToTweetIdMapper.getDocID(tweetID); .filter(docID -> docID != DocIDToTweetIDMapper.ID_NOT_FOUND)
if (docID != DocIDToTweetIDMapper.ID_NOT_FOUND) { .sorted()
set.add(docID); .mapToInt(Integer::intValue)
} .toArray();
}
if (set.isEmpty()) { return distinctSortedDocIDs.length == 0 ?
return DocIdSetIterator.empty(); DocIdSetIterator.empty() :
} new IntArrayDocIdSetIterator(distinctSortedDocIDs);
int[] docIDs = new int[set.size()];
int i = 0;
for (int docID : set) {
docIDs[i++] = docID;
}
Arrays.sort(docIDs);
return new IntArrayDocIdSetIterator(docIDs);
} }
}; };
} }
@Override @Override
public int hashCode() { public int hashCode() {
return tweetIDs.hashCode(); return distinctTweetIDs.hashCode();
} }
@Override @Override
@ -71,11 +63,11 @@ public class TweetIDQuery extends Query {
return false; return false;
} }
return tweetIDs.equals(TweetIDQuery.class.cast(obj).tweetIDs); return distinctTweetIDs.equals(TweetIDQuery.class.cast(obj).distinctTweetIDs);
} }
@Override @Override
public String toString(String field) { public String toString(String field) {
return "TWEET_ID_QUERY: " + tweetIDs; return "TWEET_ID_QUERY: " + distinctTweetIDs;
} }
} }