-
Notifications
You must be signed in to change notification settings - Fork 31
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
FMWK-196 Index Cardinality #657
Changes from 1 commit
3750e4d
acc3c09
f97b47a
7d83440
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -20,11 +20,16 @@ | |
import org.slf4j.Logger; | ||
import org.slf4j.LoggerFactory; | ||
import org.springframework.data.aerospike.query.cache.IndexesCache; | ||
import org.springframework.data.aerospike.query.model.Index; | ||
import org.springframework.data.aerospike.query.model.IndexedField; | ||
import org.springframework.data.aerospike.repository.query.Query; | ||
import org.springframework.lang.Nullable; | ||
import org.springframework.util.StringUtils; | ||
|
||
import java.util.Comparator; | ||
import java.util.List; | ||
import java.util.Optional; | ||
|
||
import static org.springframework.data.aerospike.query.QualifierUtils.queryCriteriaIsNotNull; | ||
|
||
/** | ||
|
@@ -59,13 +64,44 @@ public Statement build(String namespace, String set, @Nullable Query query, Stri | |
} | ||
|
||
private void setStatementFilterFromQualifiers(Statement stmt, Qualifier qualifier) { | ||
/* | ||
* query with qualifier | ||
*/ | ||
if (qualifier == null) return; | ||
// No qualifier, no need to set statement filter | ||
if (qualifier == null) { | ||
return; | ||
} | ||
|
||
// Multiple qualifiers | ||
// No sense to use secondary index in case of OR as it requires to enlarge selection to more than 1 field | ||
if (qualifier.getOperation() == FilterOperation.AND) { | ||
// no sense to use secondary index in case of OR | ||
// as it requires to enlarge selection to more than 1 field | ||
setFilterFromMultipleQualifiers(stmt, qualifier); | ||
} else if (isIndexedBin(stmt, qualifier)) { // Single qualifier | ||
setFilterFromSingleQualifier(stmt, qualifier); | ||
} | ||
} | ||
|
||
private void setFilterFromMultipleQualifiers(Statement stmt, Qualifier qualifier) { | ||
int minBinValuesRatio = Integer.MAX_VALUE; | ||
Qualifier minBinValuesRatioQualifier = null; | ||
|
||
for (Qualifier innerQualifier : qualifier.getQualifiers()) { | ||
if (innerQualifier != null && isIndexedBin(stmt, innerQualifier)) { | ||
int currBinValuesRatio = getMinBinValuesRatioForQualifier(stmt, innerQualifier); | ||
// Compare the cardinality of each qualifier and select the qualifier that has the index with | ||
// the lowest bin values ratio | ||
if (currBinValuesRatio < minBinValuesRatio && currBinValuesRatio != 0) { | ||
minBinValuesRatio = currBinValuesRatio; | ||
minBinValuesRatioQualifier = innerQualifier; | ||
} | ||
} | ||
} | ||
|
||
// If index with min bin values ratio found, set filter with the matching qualifier | ||
if (minBinValuesRatioQualifier != null) { | ||
Filter filter = minBinValuesRatioQualifier.setQueryAsFilter(); | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. The |
||
if (filter != null) { | ||
stmt.setFilter(filter); | ||
minBinValuesRatioQualifier.setQueryAsFilter(true); | ||
} | ||
} else { // No index with bin values ratio found, do not consider cardinality when setting a filter | ||
for (Qualifier innerQualifier : qualifier.getQualifiers()) { | ||
if (innerQualifier != null && isIndexedBin(stmt, innerQualifier)) { | ||
Filter filter = innerQualifier.setQueryAsFilter(); | ||
|
@@ -76,13 +112,15 @@ private void setStatementFilterFromQualifiers(Statement stmt, Qualifier qualifie | |
} | ||
} | ||
} | ||
} else if (isIndexedBin(stmt, qualifier)) { | ||
Filter filter = qualifier.setQueryAsFilter(); | ||
if (filter != null) { | ||
stmt.setFilter(filter); | ||
// the filter from the first processed qualifier becomes statement's sIndex filter | ||
qualifier.setQueryAsFilter(true); | ||
} | ||
} | ||
} | ||
|
||
private void setFilterFromSingleQualifier(Statement stmt, Qualifier qualifier) { | ||
Filter filter = qualifier.setQueryAsFilter(); | ||
if (filter != null) { | ||
stmt.setFilter(filter); | ||
// the filter from the first processed qualifier becomes statement's sIndex filter | ||
qualifier.setQueryAsFilter(true); | ||
} | ||
} | ||
|
||
|
@@ -101,4 +139,20 @@ private boolean isIndexedBin(Statement stmt, Qualifier qualifier) { | |
} | ||
return hasIndex; | ||
} | ||
|
||
private int getMinBinValuesRatioForQualifier(Statement stmt, Qualifier qualifier) { | ||
// Get all indexes that uses this field | ||
List<Index> indexList = indexesCache.getAllIndexesForField( | ||
new IndexedField(stmt.getNamespace(), stmt.getSetName(), qualifier.getField())); | ||
|
||
// Return the lowest bin values ratio of the indexes in indexList | ||
Optional<Index> minBinValuesRatio = indexList.stream() | ||
.filter(index -> index.getBinValuesRatio() != 0) | ||
.min(Comparator.comparing(Index::getBinValuesRatio)); | ||
|
||
if (minBinValuesRatio.isPresent()) { | ||
return minBinValuesRatio.get().getBinValuesRatio(); | ||
} | ||
return 0; | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Refactor to: `return minBinValuesRatio.map(Index::getBinValuesRatio).orElse(0);` |
||
} | ||
} |
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -15,12 +15,19 @@ | |
*/ | ||
package org.springframework.data.aerospike.query.cache; | ||
|
||
import com.aerospike.client.IAerospikeClient; | ||
import com.aerospike.client.Info; | ||
import org.slf4j.Logger; | ||
import org.slf4j.LoggerFactory; | ||
import org.springframework.data.aerospike.query.model.Index; | ||
import org.springframework.data.aerospike.query.model.IndexKey; | ||
import org.springframework.data.aerospike.query.model.IndexesInfo; | ||
import org.springframework.data.aerospike.utility.ServerVersionUtils; | ||
|
||
import java.util.Arrays; | ||
import java.util.Collections; | ||
import java.util.Map; | ||
import java.util.stream.Collectors; | ||
|
||
import static java.util.stream.Collectors.collectingAndThen; | ||
import static java.util.stream.Collectors.toMap; | ||
|
@@ -37,6 +44,8 @@ public class InternalIndexOperations { | |
|
||
private final IndexInfoParser indexInfoParser; | ||
|
||
private final Logger log = LoggerFactory.getLogger(InternalIndexOperations.class); | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Use the |
||
|
||
public InternalIndexOperations(IndexInfoParser indexInfoParser) { | ||
this.indexInfoParser = indexInfoParser; | ||
} | ||
|
@@ -60,4 +69,35 @@ public IndexesInfo parseIndexesInfo(String infoResponse) { | |
public String buildGetIndexesCommand() { | ||
return SINDEX_WITH_BASE64; | ||
} | ||
|
||
public void enrichIndexesWithCardinality(IAerospikeClient client, Map<IndexKey, Index> indexes) { | ||
log.debug("Enriching secondary indexes with cardinality"); | ||
// TODO: can improve by fetching index stats with 1 request instead of per index | ||
indexes.values().forEach( | ||
index -> index.setBinValuesRatio(getIndexBinValuesRatio(client, index.getNamespace(), index.getName())) | ||
); | ||
} | ||
|
||
public Integer getIndexBinValuesRatio(IAerospikeClient client, String namespace, String indexName) { | ||
if (ServerVersionUtils.isSIndexCardinalitySupported(client)) { | ||
|
||
try { | ||
String indexStatData = Info.request(null, client.getCluster().getRandomNode(), | ||
String.format("sindex-stat:ns=%s;indexname=%s", namespace, indexName)); | ||
|
||
return Integer.valueOf( | ||
Arrays.stream(indexStatData.split(";")) | ||
.map(String::trim) | ||
.toList().stream() | ||
.map(stat -> Arrays.stream(stat.split("=")) | ||
.map(String::trim) | ||
.collect(Collectors.toList())) | ||
.collect(Collectors.toMap(t -> t.get(0), t -> t.get(1))) | ||
.get("entries_per_bval")); | ||
} catch (Exception e) { | ||
log.warn("Failed to fetch secondary index %s cardinality".formatted(indexName), e); | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Use `log.warn("Failed to fetch secondary index {} cardinality", indexName, e);` instead. |
||
} | ||
} | ||
return 0; | ||
} | ||
} |
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -19,30 +19,35 @@ | |
import com.aerospike.client.cdt.CTX; | ||
import com.aerospike.client.query.IndexCollectionType; | ||
import com.aerospike.client.query.IndexType; | ||
import lombok.AllArgsConstructor; | ||
import lombok.Builder; | ||
import lombok.EqualsAndHashCode; | ||
import lombok.Getter; | ||
import lombok.RequiredArgsConstructor; | ||
import lombok.Value; | ||
import lombok.Setter; | ||
|
||
/** | ||
* This class represents a Secondary Index created in the cluster. | ||
* | ||
* @author Peter Milne | ||
* @author Anastasiia Smirnova | ||
*/ | ||
@Value | ||
@Builder | ||
@RequiredArgsConstructor | ||
@AllArgsConstructor | ||
@EqualsAndHashCode | ||
@Getter | ||
public class Index { | ||
|
||
String name; | ||
String namespace; | ||
String set; | ||
String bin; | ||
IndexType indexType; | ||
IndexCollectionType indexCollectionType; | ||
CTX[] ctx; | ||
private final String name; | ||
private final String namespace; | ||
private final String set; | ||
private final String bin; | ||
private final IndexType indexType; | ||
private final IndexCollectionType indexCollectionType; | ||
private final CTX[] ctx; | ||
@Setter | ||
private Integer binValuesRatio; | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Can be |
||
|
||
public Index(String name, String namespace, String set, String bin, IndexType indexType, | ||
IndexCollectionType indexCollectionType) { | ||
|
@@ -53,5 +58,6 @@ public Index(String name, String namespace, String set, String bin, IndexType in | |
this.indexType = indexType; | ||
this.indexCollectionType = indexCollectionType; | ||
this.ctx = null; | ||
this.binValuesRatio = 0; | ||
} | ||
} |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
I would move `currBinValuesRatio != 0` to be first in this statement.