Skip to content

Commit 60499a5

Browse files
committed
Prototype bitmap frequency aggs
1 parent 74a66f9 commit 60499a5

8 files changed

+835
-16
lines changed

solr/core/src/java/org/apache/solr/search/ValueSourceParser.java

+7-1
Original file line numberDiff line numberDiff line change
@@ -57,14 +57,16 @@
5757
import org.apache.solr.search.facet.AggValueSource;
5858
import org.apache.solr.search.facet.AvgAgg;
5959
import org.apache.solr.search.facet.BitmapCollectorAgg;
60+
import org.apache.solr.search.facet.BitmapFrequencyAgg;
6061
import org.apache.solr.search.facet.CountAgg;
62+
import org.apache.solr.search.facet.FrequencyOfFrequenciesAgg;
6163
import org.apache.solr.search.facet.HLLAgg;
6264
import org.apache.solr.search.facet.MinMaxAgg;
6365
import org.apache.solr.search.facet.PercentileAgg;
66+
import org.apache.solr.search.facet.RelatednessAgg;
6467
import org.apache.solr.search.facet.StddevAgg;
6568
import org.apache.solr.search.facet.SumAgg;
6669
import org.apache.solr.search.facet.SumsqAgg;
67-
import org.apache.solr.search.facet.RelatednessAgg;
6870
import org.apache.solr.search.facet.TopDocsAgg;
6971
import org.apache.solr.search.facet.UniqueAgg;
7072
import org.apache.solr.search.facet.UniqueBlockAgg;
@@ -1059,6 +1061,10 @@ public ValueSource parse(FunctionQParser fp) throws SyntaxError {
10591061

10601062
addParser("agg_bitmapcollector", new BitmapCollectorAgg.Parser());
10611063

1064+
addParser("agg_bitmapfreq", new BitmapFrequencyAgg.Parser());
1065+
1066+
addParser("agg_bitmapfreqfreq", new FrequencyOfFrequenciesAgg.Parser());
1067+
10621068
addParser("childfield", new ChildFieldValueSourceParser());
10631069
}
10641070

solr/core/src/java/org/apache/solr/search/facet/BitmapCollectorAgg.java

+2-15
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,5 @@
11
package org.apache.solr.search.facet;
22

3-
import java.io.ByteArrayOutputStream;
4-
import java.io.DataOutputStream;
53
import java.io.IOException;
64
import java.nio.ByteBuffer;
75
import java.util.Arrays;
@@ -73,7 +71,7 @@ public Object getValue(int slotNum) {
7371
byte[] serialised;
7472
if (result[slotNum] != null) {
7573
result[slotNum].runOptimize();
76-
serialised = bitmapToBytes(result[slotNum]);
74+
serialised = BitmapUtil.bitmapToBytes(result[slotNum]);
7775
} else {
7876
serialised = new byte[0];
7977
}
@@ -116,20 +114,9 @@ public void finish(Context mcontext) {
116114
public Object getMergedResult() {
117115
combined.runOptimize();
118116
SimpleOrderedMap map = new SimpleOrderedMap();
119-
map.add(KEY, bitmapToBytes(combined));
117+
map.add(KEY, BitmapUtil.bitmapToBytes(combined));
120118
return map;
121119
}
122120
}
123121

124-
private static byte[] bitmapToBytes(MutableRoaringBitmap bitmap) {
125-
ByteArrayOutputStream bos = new ByteArrayOutputStream();
126-
DataOutputStream dos = new DataOutputStream(bos);
127-
try {
128-
bitmap.serialize(dos);
129-
dos.close();
130-
return bos.toByteArray();
131-
} catch (IOException ioe) {
132-
throw new RuntimeException("Failed to serialise RoaringBitmap to bytes", ioe);
133-
}
134-
}
135122
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,81 @@
1+
package org.apache.solr.search.facet;
2+
3+
import org.apache.lucene.queries.function.ValueSource;
4+
import org.apache.solr.common.util.SimpleOrderedMap;
5+
import org.apache.solr.search.FunctionQParser;
6+
import org.apache.solr.search.SyntaxError;
7+
import org.apache.solr.search.ValueSourceParser;
8+
9+
/**
10+
* Calculates the frequency of ordinal values using Roaring Bitmaps.
11+
*
12+
* The response is a map with the following fields:
13+
* - bitmaps: an array of bitmaps, where the frequency of a value x is given by the sum of {@code 2^i} for all values
14+
* of {@code i} where {@code bitmaps[i].contains(x)}
15+
* - overflow: a bitmap of ordinal values with {@code frequency >= 2^(bitmaps.length)}
16+
*
17+
* Lacking a coherent definition of magnitude other than the raw count, this aggregate cannot be used for sorting.
18+
*/
19+
public class BitmapFrequencyAgg extends SimpleAggValueSource {
20+
private final int size;
21+
22+
public BitmapFrequencyAgg(ValueSource vs, int size) {
23+
super("bitmapfreq", vs);
24+
25+
this.size = size;
26+
}
27+
28+
@Override
29+
public SlotAcc createSlotAcc(FacetContext fcontext, int numDocs, int numSlots) {
30+
return new BitmapFrequencySlotAcc(getArg(), fcontext, numSlots, size);
31+
}
32+
33+
@Override
34+
public FacetMerger createFacetMerger(Object prototype) {
35+
return new Merger(size);
36+
}
37+
38+
public static class Parser extends ValueSourceParser {
39+
@Override
40+
public ValueSource parse(FunctionQParser fp) throws SyntaxError {
41+
ValueSource valueSource = fp.parseValueSource();
42+
43+
int size = 16;
44+
if (fp.hasMoreArguments()) {
45+
size = fp.parseInt();
46+
}
47+
48+
return new BitmapFrequencyAgg(valueSource, size);
49+
}
50+
}
51+
52+
private static class Merger extends FacetMerger {
53+
private final int size;
54+
private BitmapFrequencyCounter result;
55+
56+
public Merger(int size) {
57+
this.size = size;
58+
this.result = new BitmapFrequencyCounter(size);
59+
}
60+
61+
@Override
62+
public void merge(Object facetResult, Context mcontext) {
63+
if (facetResult instanceof SimpleOrderedMap) {
64+
BitmapFrequencyCounter deserialized = new BitmapFrequencyCounter(size);
65+
deserialized.deserialize((SimpleOrderedMap<Object>) facetResult);
66+
67+
result = result.merge(deserialized);
68+
}
69+
}
70+
71+
@Override
72+
public void finish(Context mcontext) {
73+
// never called
74+
}
75+
76+
@Override
77+
public Object getMergedResult() {
78+
return result.serialize();
79+
}
80+
}
81+
}

0 commit comments

Comments
 (0)