Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add logging of query IDs via QueryLogIterator class #2451

Open
wants to merge 44 commits into
base: integration
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
44 commits
Select commit Hold shift + click to select a range
aab6f6b
Add TServer logging of query IDs
SethSmucker Mar 21, 2024
7a967cf
Removed star imports
SethSmucker Jun 6, 2024
e80161d
tserverLoggingActivce added to ShardQueryConfiguraitonTest
SethSmucker Jun 6, 2024
27285cc
tserverLoggingActivce added to ShardQueryConfiguraitonTest
SethSmucker Jun 6, 2024
031adf8
Fix CountQueryTest issues (#1)
lbschanno Jun 6, 2024
879f0b2
Fix NPE issues (#2)
lbschanno Jun 6, 2024
4dfab3d
Add TserverLoggingTest and make configuration changes (#3)
lbschanno Jun 7, 2024
8347fa3
Added javadocs
SethSmucker Jun 7, 2024
75bcf9e
Added class comment
SethSmucker Jun 7, 2024
aa123f7
Formatting
SethSmucker Jun 7, 2024
c5c75a9
Merge branch 'integration' into log-iterator
SethSmucker Jun 7, 2024
e5e1883
Add TServer logging of query IDs and Tests
SethSmucker Mar 21, 2024
9550f60
Merged with upstream/log-iterator
SethSmucker Jun 20, 2024
09cb6e1
Suggested formatting tweaks
SethSmucker Jun 25, 2024
4575f22
Suggested formatting tweaks
SethSmucker Jun 25, 2024
c44ce02
Merge branch 'integration' into log-iterator
lbschanno Jun 25, 2024
e48807b
Commit test
SethSmucker Jun 28, 2024
43f8f32
Fixed SQL bug
SethSmucker Jun 28, 2024
3aed0d6
Merge branch 'integration' into log-iterator
SethSmucker Jun 28, 2024
2a7f891
Merge branch 'integration' into log-iterator
SethSmucker Jul 1, 2024
4838e69
Merge branch 'integration' into log-iterator
lbschanno Jul 1, 2024
49600e5
Merge branch 'integration' into log-iterator
SethSmucker Jul 2, 2024
93d38c8
Merge branch 'integration' into log-iterator
SethSmucker Jul 5, 2024
9d6f82e
Merge branch 'integration' into log-iterator
SethSmucker Jul 30, 2024
4751377
Merge branch 'integration' into log-iterator
SethSmucker Aug 1, 2024
5311519
Merge branch 'integration' into log-iterator
SethSmucker Aug 15, 2024
f6fccf5
Merge branch 'integration' into log-iterator
SethSmucker Aug 16, 2024
abf28e9
Merge branch 'integration' into log-iterator
SethSmucker Sep 5, 2024
647ab9c
switch to debug
SethSmucker Sep 5, 2024
67eb398
Merge branch 'integration' into log-iterator
SethSmucker Sep 9, 2024
58af31e
Merge branch 'integration' into log-iterator
ivakegg Nov 4, 2024
aaa120f
Merge branch 'integration' into log-iterator
ivakegg Nov 6, 2024
1db40f0
Wrap iterator logic with thread name changing logic
SethSmucker Jan 16, 2025
47d0791
Remove overkill logging
SethSmucker Jan 16, 2025
2fd9f76
Merge integration
SethSmucker Jan 16, 2025
9241a06
Merge
SethSmucker Jan 22, 2025
d46a109
Merge
SethSmucker Jan 22, 2025
b43e2a5
Merge
SethSmucker Jan 22, 2025
cbc571d
Merge branch 'integration' into log-iterator
SethSmucker Jan 23, 2025
0ff338c
Rollback DefaultQueryPlanner
SethSmucker Jan 23, 2025
78ad1af
GitHub Actions: Fix Formatting
Jan 23, 2025
998059e
Manually fix DefaultQueryPlanner
SethSmucker Jan 23, 2025
a7241bd
Merge
SethSmucker Jan 23, 2025
57e5ab8
GitHub Actions: Fix Formatting
Jan 23, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -529,6 +529,11 @@ public class ShardQueryConfiguration extends GenericQueryConfiguration implement
*/
private double fieldIndexHoleMinThreshold = 1.0d;

/**
* Controls whether query IDs are logged on the tserver level via {@link datawave.query.iterator.QueryLogIterator}.
*/
private boolean tserverLoggingActive = true;

/**
* The set of date types that, if the query's end date is the current date, will NOT result in any date range adjustments or the addition of a
* SHARDS_AND_DAYS hint.
Expand Down Expand Up @@ -784,6 +789,7 @@ public void copyFrom(ShardQueryConfiguration other) {
this.setUseQueryTreeScanHintRules(other.isUseQueryTreeScanHintRules());
this.setQueryTreeScanHintRules(other.getQueryTreeScanHintRules());
this.setFieldIndexHoleMinThreshold(other.getFieldIndexHoleMinThreshold());
this.setTserverLoggingActive(other.isTserverLoggingActive());
this.setNoExpansionIfCurrentDateTypes(
other.getNoExpansionIfCurrentDateTypes() == null ? null : Sets.newHashSet(other.getNoExpansionIfCurrentDateTypes()));
this.setShardsAndDaysHintAllowed(other.isShardsAndDaysHintAllowed());
Expand Down Expand Up @@ -2845,6 +2851,14 @@ public void setSortQueryPostIndexWithTermCounts(boolean sortQueryPostIndexWithTe
this.sortQueryPostIndexWithTermCounts = sortQueryPostIndexWithTermCounts;
}

public boolean isTserverLoggingActive() {
return this.tserverLoggingActive;
}

public void setTserverLoggingActive(boolean tserverLoggingActive) {
this.tserverLoggingActive = tserverLoggingActive;
}

public int getCardinalityThreshold() {
return cardinalityThreshold;
}
Expand Down Expand Up @@ -3061,14 +3075,14 @@ public boolean equals(Object o) {
getDocAggregationThresholdMs() == that.getDocAggregationThresholdMs() &&
getTfAggregationThresholdMs() == that.getTfAggregationThresholdMs() &&
getPruneQueryOptions() == that.getPruneQueryOptions() &&
isSortQueryPreIndexWithImpliedCounts() == that.isSortQueryPreIndexWithImpliedCounts() &&
isSortQueryPreIndexWithFieldCounts() == that.isSortQueryPreIndexWithFieldCounts() &&
isSortQueryPostIndexWithTermCounts() == that.isSortQueryPostIndexWithTermCounts() &&
isSortQueryPostIndexWithFieldCounts() == that.isSortQueryPostIndexWithFieldCounts() &&
isSortQueryPreIndexWithImpliedCounts() == isSortQueryPreIndexWithImpliedCounts() &&
isSortQueryPreIndexWithFieldCounts() == isSortQueryPreIndexWithFieldCounts() &&
isSortQueryPostIndexWithTermCounts() == isSortQueryPostIndexWithTermCounts() &&
isSortQueryPostIndexWithFieldCounts() == isSortQueryPostIndexWithFieldCounts() &&
isTserverLoggingActive() == that.isTserverLoggingActive() &&
getCardinalityThreshold() == that.getCardinalityThreshold() &&
Objects.equals(getNoExpansionIfCurrentDateTypes(), that.getNoExpansionIfCurrentDateTypes()) &&
isShardsAndDaysHintAllowed() == that.isShardsAndDaysHintAllowed();

// @formatter:on
}

Expand Down Expand Up @@ -3275,6 +3289,7 @@ public int hashCode() {
isSortQueryPreIndexWithFieldCounts(),
isSortQueryPostIndexWithTermCounts(),
isSortQueryPostIndexWithFieldCounts(),
isTserverLoggingActive(),
getCardinalityThreshold(),
getNoExpansionIfCurrentDateTypes(),
isShardsAndDaysHintAllowed()
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,250 @@
package datawave.query.iterator;

import static datawave.query.iterator.QueryOptions.QUERY_ID;

import java.io.IOException;
import java.lang.reflect.InvocationTargetException;
import java.lang.reflect.Method;
import java.util.Collection;
import java.util.HashMap;
import java.util.Map;
import java.util.function.Function;

import org.apache.accumulo.core.data.ByteSequence;
import org.apache.accumulo.core.data.Key;
import org.apache.accumulo.core.data.Range;
import org.apache.accumulo.core.data.Value;
import org.apache.accumulo.core.iterators.IteratorEnvironment;
import org.apache.accumulo.core.iterators.OptionDescriber;
import org.apache.accumulo.core.iterators.SortedKeyValueIterator;
import org.apache.log4j.Logger;
import org.apache.log4j.MDC;

/**
* An iterator used to log the start and end of each method run by the {@link SortedKeyValueIterator} above it in the iterator stack. Logs the QueryID
* associated with each method. Logs are written on the TServer where the iterator is running
*/
public class QueryLogIterator implements SortedKeyValueIterator<Key,Value>, OptionDescriber {

private static final Logger log = Logger.getLogger(QueryLogIterator.class);
private static final String CLASS_NAME = QueryLogIterator.class.getSimpleName();

private String queryID;
private SortedKeyValueIterator<Key,Value> source;
private IteratorEnvironment env;

/**
* Default constructor
*/
public QueryLogIterator() {
// no-arg constructor
}

/**
* Class copy constructor
*/
public QueryLogIterator(QueryLogIterator other, IteratorEnvironment env) {
this.source = other.source.deepCopy(env);
this.env = other.env;
this.queryID = other.queryID;
}

/**
* Wraps the init() method of the iterator above it, logging the start/end of the method along with its query id.
*/
@Override
public void init(SortedKeyValueIterator<Key,Value> source, Map<String,String> options, IteratorEnvironment env) throws IOException {

String oldName = Thread.currentThread().getName();
Thread.currentThread().setName(oldName + " -> " + this.queryID);
MDC.put("queryID", queryID);
try {
try {
this.queryID = options.get(QUERY_ID);
this.source = source;
this.env = env;
} catch (Exception e) {
throw new RuntimeException(e);
}
} finally {
Thread.currentThread().setName(oldName);
MDC.remove("queryID");
}
}

/**
* Logs the query id and {@link SortedKeyValueIterator} method name before the method is run.
*/
private void logStartOf(String methodName) {
if (log.isDebugEnabled()) {
log.debug(CLASS_NAME + " " + methodName + " Started QueryID: " + this.queryID);
}
}

/**
* Logs the query id and {@link SortedKeyValueIterator} method name after the method is run.
*/
private void logEndOf(String methodName) {
if (log.isDebugEnabled()) {
log.debug(CLASS_NAME + " " + methodName + " Ended QueryID: " + this.queryID);
}
}

/**
* Wraps the hasTop() method of the iterator above it, logging the start and end of the method along with its query id.
*/
@Override
public boolean hasTop() {
String oldName = Thread.currentThread().getName();
Thread.currentThread().setName(oldName + " -> " + this.queryID);
MDC.put("queryID", queryID);
try {
boolean result;

try {
result = source.hasTop();
} catch (Exception e) {
throw new RuntimeException(e);
}
return result;
} finally {
Thread.currentThread().setName(oldName);
MDC.remove("queryID");
}

}

/**
* Wraps the next() method of the iterator above it, logging the start and end of the method along with its query id.
*/
@Override
public void next() throws IOException {
String oldName = Thread.currentThread().getName();
Thread.currentThread().setName(oldName + " -> " + this.queryID);
MDC.put("queryID", queryID);
try {
try {
source.next();
} catch (Exception e) {
throw new RuntimeException(e);
}
} finally {
Thread.currentThread().setName(oldName);
MDC.remove("queryID");
}

}

/**
* Wraps the getTopKey() method of the iterator above it, logging the start and end of the method along with its query id.
*/
@Override
public Key getTopKey() {
String oldName = Thread.currentThread().getName();
Thread.currentThread().setName(oldName + " -> " + this.queryID);
MDC.put("queryID", queryID);
try {
Key k;
try {
k = source.getTopKey();
} catch (Exception e) {
throw new RuntimeException(e);
}
return k;
} finally {
Thread.currentThread().setName(oldName);
MDC.remove("queryID");
}

}

/**
* Wraps the getTopValue() method of the iterator above it, logging the start and end of the method along with its query id.
*/
@Override
public Value getTopValue() {
String oldName = Thread.currentThread().getName();
Thread.currentThread().setName(oldName + " -> " + this.queryID);
MDC.put("queryID", queryID);
try {
Value v;
try {
v = source.getTopValue();
} catch (Exception e) {
throw new RuntimeException(e);
}
return v;
} finally {
Thread.currentThread().setName(oldName);
MDC.remove("queryID");
}

}

/**
* Wraps the deepCopy() method of the iterator above it, logging the start and end of the method along with its query id.
*/
@Override
public SortedKeyValueIterator<Key,Value> deepCopy(IteratorEnvironment iteratorEnvironment) {
String oldName = Thread.currentThread().getName();
Thread.currentThread().setName(oldName + " -> " + this.queryID);
MDC.put("queryID", queryID);
try {
QueryLogIterator copy;

try {
copy = new QueryLogIterator(this, this.env);
} catch (Exception e) {
throw new RuntimeException(e);
}
return copy;
} finally {
Thread.currentThread().setName(oldName);
MDC.remove("queryID");
}

}

/**
* Wraps the seek() method of the iterator above it, logging the start and end of the method along with its query id.
*/
@Override
public void seek(Range range, Collection<ByteSequence> collection, boolean b) throws IOException {
String oldName = Thread.currentThread().getName();
Thread.currentThread().setName(oldName + " -> " + this.queryID);
MDC.put("queryID", queryID);
try {
try {
logStartOf("seek()");
this.source.seek(range, collection, b);
} finally {
logEndOf("seek()");
}
} finally {
Thread.currentThread().setName(oldName);
MDC.remove("queryID");
}

}

/**
* Returns a {@link org.apache.accumulo.core.iterators.OptionDescriber.IteratorOptions} object containing a description of the iterator and an option for
* the QueryID.
*/
@Override
public IteratorOptions describeOptions() {
Map<String,String> options = new HashMap<>();
options.put(QUERY_ID, "The QueryID to be logged as methods are invoked");

return new IteratorOptions(getClass().getSimpleName(), "An iterator used to log the QueryID", options, null);
}

/**
* Returns true if the options provided contains the QueryID.
*/
@Override
public boolean validateOptions(Map<String,String> options) {
return options.containsKey(QUERY_ID);
}

}
Loading