Skip to content

Commit

Permalink
Merge branch 'integration' into log-iterator
Browse files Browse the repository at this point in the history
  • Loading branch information
SethSmucker committed Jun 28, 2024
2 parents 43f8f32 + 6e516bf commit 3aed0d6
Show file tree
Hide file tree
Showing 28 changed files with 609 additions and 802 deletions.
2 changes: 1 addition & 1 deletion core/in-memory-accumulo
Original file line number Diff line number Diff line change
Expand Up @@ -95,35 +95,6 @@ public QueryData(QueryData other) {
this.finished = other.finished;
}

@Deprecated(since = "6.5.0", forRemoval = true)
public QueryData(String tableName, String query, Collection<Range> ranges, List<IteratorSetting> settings) {
setTableName(tableName);
setQuery(query);
setRanges(ranges);
setSettings(settings);
}

/**
* Weak copy constructor that updates the ranges
*
* @param other
* another QueryData
* @param ranges
* a collection of updated ranges
* @deprecated
*/
@Deprecated(since = "6.5.0", forRemoval = true)
public QueryData(QueryData other, Collection<Range> ranges) {
this(other);
setRanges(ranges);
}

@Deprecated(since = "6.5.0", forRemoval = true)
public QueryData(String tableName, String queryString, List<Range> ranges, List<IteratorSetting> settings, Collection<String> columnFamilies) {
this(tableName, queryString, ranges, settings);
this.columnFamilies.addAll(columnFamilies);
}

// builder style methods

public QueryData withTableName(String tableName) {
Expand Down
2 changes: 1 addition & 1 deletion core/utils/type-utils
Submodule type-utils updated 79 files
+12 −1 pom.xml
+4 −5 src/main/java/datawave/data/normalizer/NumberNormalizer.java
+38 −0 src/main/java/datawave/data/normalizer/regex/AlternationNode.java
+32 −0 src/main/java/datawave/data/normalizer/regex/AnyCharNode.java
+48 −0 src/main/java/datawave/data/normalizer/regex/CharClassNode.java
+59 −0 src/main/java/datawave/data/normalizer/regex/CharRangeNode.java
+34 −0 src/main/java/datawave/data/normalizer/regex/DigitCharClassNode.java
+32 −0 src/main/java/datawave/data/normalizer/regex/EmptyNode.java
+37 −0 src/main/java/datawave/data/normalizer/regex/EncodedNumberNode.java
+41 −0 src/main/java/datawave/data/normalizer/regex/EncodedPatternNode.java
+32 −0 src/main/java/datawave/data/normalizer/regex/EndAnchorNode.java
+46 −0 src/main/java/datawave/data/normalizer/regex/EscapedSingleCharNode.java
+41 −0 src/main/java/datawave/data/normalizer/regex/ExpressionNode.java
+41 −0 src/main/java/datawave/data/normalizer/regex/GroupNode.java
+48 −0 src/main/java/datawave/data/normalizer/regex/IntegerNode.java
+67 −0 src/main/java/datawave/data/normalizer/regex/IntegerRangeNode.java
+333 −0 src/main/java/datawave/data/normalizer/regex/Node.java
+192 −0 src/main/java/datawave/data/normalizer/regex/NodeListIterator.java
+25 −0 src/main/java/datawave/data/normalizer/regex/NodeType.java
+457 −0 src/main/java/datawave/data/normalizer/regex/NumericRegexEncoder.java
+32 −0 src/main/java/datawave/data/normalizer/regex/OneOrMoreNode.java
+32 −0 src/main/java/datawave/data/normalizer/regex/QuestionMarkNode.java
+65 −0 src/main/java/datawave/data/normalizer/regex/RegexConstants.java
+305 −0 src/main/java/datawave/data/normalizer/regex/RegexParser.java
+246 −0 src/main/java/datawave/data/normalizer/regex/RegexReader.java
+604 −0 src/main/java/datawave/data/normalizer/regex/RegexUtils.java
+36 −0 src/main/java/datawave/data/normalizer/regex/RepetitionNode.java
+46 −0 src/main/java/datawave/data/normalizer/regex/SingleCharNode.java
+34 −0 src/main/java/datawave/data/normalizer/regex/StartAnchorNode.java
+32 −0 src/main/java/datawave/data/normalizer/regex/ZeroOrMoreNode.java
+57 −0 src/main/java/datawave/data/normalizer/regex/visitor/AlternationDeduper.java
+29 −0 src/main/java/datawave/data/normalizer/regex/visitor/AnchorTrimmer.java
+148 −0 src/main/java/datawave/data/normalizer/regex/visitor/BaseVisitor.java
+210 −0 src/main/java/datawave/data/normalizer/regex/visitor/BinFinder.java
+161 −0 src/main/java/datawave/data/normalizer/regex/visitor/CopyVisitor.java
+561 −0 src/main/java/datawave/data/normalizer/regex/visitor/DecimalPointPlacer.java
+58 −0 src/main/java/datawave/data/normalizer/regex/visitor/DecimalPointValidator.java
+79 −0 src/main/java/datawave/data/normalizer/regex/visitor/EmptyLeafTrimmer.java
+169 −0 src/main/java/datawave/data/normalizer/regex/visitor/EqualityVisitor.java
+154 −0 src/main/java/datawave/data/normalizer/regex/visitor/ExponentialBinAdder.java
+143 −0 src/main/java/datawave/data/normalizer/regex/visitor/GTEOneBinFinder.java
+143 −0 src/main/java/datawave/data/normalizer/regex/visitor/LTOneBinFinder.java
+567 −0 src/main/java/datawave/data/normalizer/regex/visitor/NegativeNumberPatternInverter.java
+64 −0 src/main/java/datawave/data/normalizer/regex/visitor/NegativeVariantExpander.java
+68 −0 src/main/java/datawave/data/normalizer/regex/visitor/NonEncodedNumbersChecker.java
+61 −0 src/main/java/datawave/data/normalizer/regex/visitor/NumericCharClassValidator.java
+167 −0 src/main/java/datawave/data/normalizer/regex/visitor/OptionalVariantExpander.java
+223 −0 src/main/java/datawave/data/normalizer/regex/visitor/PrintVisitor.java
+90 −0 src/main/java/datawave/data/normalizer/regex/visitor/SimpleNumberEncoder.java
+192 −0 src/main/java/datawave/data/normalizer/regex/visitor/StringVisitor.java
+98 −0 src/main/java/datawave/data/normalizer/regex/visitor/SubExpressionVisitor.java
+65 −0 src/main/java/datawave/data/normalizer/regex/visitor/Visitor.java
+97 −0 src/main/java/datawave/data/normalizer/regex/visitor/ZeroLengthRepetitionTrimmer.java
+664 −0 src/main/java/datawave/data/normalizer/regex/visitor/ZeroTrimmer.java
+157 −0 src/main/java/datawave/data/normalizer/regex/visitor/ZeroValueNormalizer.java
+102 −146 src/main/java/datawave/data/type/util/NumericalEncoder.java
+260 −0 src/test/java/datawave/data/normalizer/NumberNormalizerTest.java
+337 −0 src/test/java/datawave/data/normalizer/regex/NodeAssert.java
+607 −0 src/test/java/datawave/data/normalizer/regex/NumericRegexEncoderTest.java
+306 −0 src/test/java/datawave/data/normalizer/regex/RegexParserTest.java
+191 −0 src/test/java/datawave/data/normalizer/regex/RegexUtilsTest.java
+42 −0 src/test/java/datawave/data/normalizer/regex/visitor/AlternationDeduperTest.java
+52 −0 src/test/java/datawave/data/normalizer/regex/visitor/AnchorTrimmerTest.java
+426 −0 src/test/java/datawave/data/normalizer/regex/visitor/DecimalPointPlacerTest.java
+64 −0 src/test/java/datawave/data/normalizer/regex/visitor/DecimalPointValidatorTest.java
+74 −0 src/test/java/datawave/data/normalizer/regex/visitor/EmptyLeafTrimmerTest.java
+445 −0 src/test/java/datawave/data/normalizer/regex/visitor/ExponentialBinAdderTest.java
+125 −0 src/test/java/datawave/data/normalizer/regex/visitor/NegativeNumberPatternInverterTest.java
+66 −0 src/test/java/datawave/data/normalizer/regex/visitor/NegativeVariantExpanderTest.java
+48 −0 src/test/java/datawave/data/normalizer/regex/visitor/NonEncodedNumbersCheckerTest.java
+84 −0 src/test/java/datawave/data/normalizer/regex/visitor/NumericCharClassValidatorTest.java
+83 −0 src/test/java/datawave/data/normalizer/regex/visitor/OptionalVariantExpanderTest.java
+78 −0 src/test/java/datawave/data/normalizer/regex/visitor/SimpleNumberEncoderTest.java
+44 −0 src/test/java/datawave/data/normalizer/regex/visitor/StringVisitorTest.java
+64 −0 src/test/java/datawave/data/normalizer/regex/visitor/ZeroLengthRepetitionTrimmerTest.java
+323 −0 src/test/java/datawave/data/normalizer/regex/visitor/ZeroTrimmerTest.java
+85 −0 src/test/java/datawave/data/normalizer/regex/visitor/ZeroValueNormalizerTest.java
+0 −74 src/test/java/datawave/data/normalizer/testNumberNormalizer.java
+0 −1 src/test/java/datawave/data/type/util/NumericalEncoderTest.java
38 changes: 19 additions & 19 deletions docker/docker-compose.yml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ services:
- quickstart
# To run the wildfly webservice, change `--accumulo` to `--web`
command: ["datawave-bootstrap.sh", "--accumulo"]
image: datawave/quickstart-compose:7.0.1-SNAPSHOT
image: datawave/quickstart-compose
environment:
- DW_CONTAINER_HOST=quickstart
- DW_DATAWAVE_WEB_JAVA_OPTS=-agentlib:jdwp=transport=dt_socket,server=y,suspend=n,address=*:8787 -Duser.timezone=GMT -Dfile.encoding=UTF-8 -Djava.net.preferIPv4Stack=true
Expand Down Expand Up @@ -47,7 +47,7 @@ services:
test: ["CMD-SHELL", "! accumuloStatus | grep DW-WARN > /dev/null"]

consul:
image: consul:1.15.4
image: docker.io/hashicorp/consul:1.15.4
hostname: localhost
environment:
- 'CONSUL_LOCAL_CONFIG={"log_level": "trace", "datacenter": "demo_dc", "disable_update_check": true, "enable_agent_tls_for_checks": true, "addresses": {"https": "0.0.0.0"}, "ports": {"https": 8501, "grpc_tls": 8503}, "tls": {"defaults": {"key_file": "/etc/pki/testServer.key", "cert_file": "/etc/pki/testServer.crt", "ca_file": "/etc/pki/testCA.pem", "verify_outgoing": true}, "internal_rpc": {"verify_server_hostname": false}}}'
Expand All @@ -65,7 +65,7 @@ services:
- demo

rabbitmq:
image: rabbitmq:3.12.4-alpine
image: docker.io/rabbitmq:3.12.4
volumes:
- ${RABBITMQ_CONFIG_DIR:-./rabbitmq-config}:/etc/rabbitmq
- ./logs:/logs
Expand All @@ -82,7 +82,7 @@ services:

# When auto.create.topics.enable is true, this causes deleted topics to be recreated at random. So, leave it disabled.
kafka:
image: bitnami/kafka:3.2.3
image: docker.io/bitnami/kafka:3.2
ports:
- "9094:9094"
networks:
Expand All @@ -104,7 +104,7 @@ services:
profiles:
- management
- full
image: obsidiandynamics/kafdrop
image: docker.io/obsidiandynamics/kafdrop
ports:
- "8999:9000"
networks:
Expand All @@ -122,7 +122,7 @@ services:

configuration:
entrypoint: [ "java","-agentlib:jdwp=transport=dt_socket,server=y,suspend=n,address=*:5009","-jar","app.jar" ]
image: datawave/config-service:4.0.1-SNAPSHOT
image: datawave/config-service
command:
- --spring.output.ansi.enabled=ALWAYS
- --spring.profiles.active=consul,native,open_actuator
Expand All @@ -146,7 +146,7 @@ services:
condition: service_started

cache:
image: datawave/hazelcast-service:4.0.1-SNAPSHOT
image: datawave/hazelcast-service
scale: 1
command:
- --spring.profiles.active=consul,compose,remoteauth
Expand Down Expand Up @@ -174,7 +174,7 @@ services:

authorization:
entrypoint: [ "java","-agentlib:jdwp=transport=dt_socket,server=y,suspend=n,address=*:5008","-jar","app.jar" ]
image: datawave/authorization-service:4.0.1-SNAPSHOT
image: datawave/authorization-service
command:
- --spring.output.ansi.enabled=ALWAYS
- --spring.profiles.active=consul,mock,compose,federation
Expand Down Expand Up @@ -203,7 +203,7 @@ services:
profiles:
- accumulo
- full
image: datawave/accumulo-service:4.0.1-SNAPSHOT
image: datawave/accumulo-service
command:
- --spring.output.ansi.enabled=ALWAYS
- --spring.profiles.active=consul,compose,remoteauth
Expand Down Expand Up @@ -236,7 +236,7 @@ services:
condition: service_healthy

audit:
image: datawave/audit-service:4.0.1-SNAPSHOT
image: datawave/audit-service
command:
- --spring.output.ansi.enabled=ALWAYS
- --spring.profiles.active=consul,compose,remoteauth
Expand Down Expand Up @@ -270,7 +270,7 @@ services:

metrics:
entrypoint: ["java","-agentlib:jdwp=transport=dt_socket,server=y,suspend=n,address=*:5007","-jar","app.jar"]
image: datawave/query-metric-service:4.0.2-SNAPSHOT
image: datawave/query-metric-service
command:
- --spring.output.ansi.enabled=ALWAYS
- --spring.profiles.active=consul,compose,remoteauth
Expand Down Expand Up @@ -307,7 +307,7 @@ services:
profiles:
- dictionary
- full
image: datawave/dictionary-service:4.0.1-SNAPSHOT
image: datawave/dictionary-service
command:
- --spring.output.ansi.enabled=ALWAYS
- --spring.profiles.active=consul,compose,remoteauth
Expand Down Expand Up @@ -339,7 +339,7 @@ services:
mysql:
profiles:
- cachedresults
image: mysql:8.0.32
image: docker.io/mysql:8.0.32
environment:
- MYSQL_RANDOM_ROOT_PASSWORD=true
- MYSQL_DATABASE=cachedresults
Expand All @@ -355,7 +355,7 @@ services:
# If you want to test cached results, set the CACHED_RESULTS environment variable to 'true'
query:
entrypoint: ["java","-agentlib:jdwp=transport=dt_socket,server=y,suspend=n,address=*:5005","-jar","app.jar"]
image: datawave/query-service:1.0.1-SNAPSHOT
image: datawave/query-service
command:
- --spring.output.ansi.enabled=ALWAYS
- --spring.profiles.active=consul,compose,remoteauth,querymessaging,metricssource,query,mrquery,cachedresults,federation
Expand Down Expand Up @@ -399,7 +399,7 @@ services:
profiles:
- full
entrypoint: ["java","-agentlib:jdwp=transport=dt_socket,server=y,suspend=n,address=*:5005","-jar","app.jar"]
image: datawave/mapreduce-query-service:1.0.1-SNAPSHOT
image: datawave/mapreduce-query-service
command:
- --spring.output.ansi.enabled=ALWAYS
- --spring.profiles.active=consul,compose,remoteauth,query,mrquery,federation
Expand Down Expand Up @@ -437,7 +437,7 @@ services:

executor-pool1:
entrypoint: ["java","-agentlib:jdwp=transport=dt_socket,server=y,suspend=n,address=*:5006","-jar","app.jar"]
image: datawave/query-executor-service:1.0.1-SNAPSHOT
image: datawave/query-executor-service
command:
- --spring.application.name=executor-pool1
- --spring.cloud.config.name=executor
Expand Down Expand Up @@ -486,7 +486,7 @@ services:
profiles:
- pool2
- full
image: datawave/query-executor-service:1.0.1-SNAPSHOT
image: datawave/query-executor-service
command:
- --spring.application.name=executor-pool2
- --spring.cloud.config.name=executor
Expand Down Expand Up @@ -533,7 +533,7 @@ services:
profiles:
- modification
- full
image: datawave/modification-service:1.0.1-SNAPSHOT
image: datawave/modification-service
command:
- --spring.output.ansi.enabled=ALWAYS
- --spring.profiles.active=consul,compose,remoteauth,query
Expand Down Expand Up @@ -584,7 +584,7 @@ services:
profiles:
- management
- full
image: hazelcast/management-center:5.1.2
image: docker.io/hazelcast/management-center:5.1.2
environment:
- |-
JAVA_OPTS=
Expand Down
2 changes: 1 addition & 1 deletion pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -74,7 +74,7 @@
<version.hamcrest>1.3</version.hamcrest>
<version.httpcomponents-httpclient>4.5.13</version.httpcomponents-httpclient>
<version.httpcomponents-httpcore>4.4.8</version.httpcomponents-httpcore>
<version.in-memory-accumulo>4.0.0</version.in-memory-accumulo>
<version.in-memory-accumulo>4.0.1</version.in-memory-accumulo>
<version.infinispan>9.4.21.Final</version.infinispan>
<version.jackson>2.10.0.pr1</version.jackson>
<version.jackson-mapper-asl>1.9.13</version.jackson-mapper-asl>
Expand Down
2 changes: 0 additions & 2 deletions properties/default.properties
Original file line number Diff line number Diff line change
Expand Up @@ -425,8 +425,6 @@ hierarchy.field.options=

# BaseEventQuery (beq) thresholds
beq.baseIteratorPriority=100
beq.eventPerDayThreshold=40000
beq.shardsPerDayThreshold=20
# max number of terms BEFORE all expansions (calculated based on how much the initial parser can handle before hitting a stack overflow: between 3500 and 3750)
beq.initialMaxTermThreshold=2000
# max number of terms AFTER all expansions (calculated based on how much the initial parser can handle before hitting a stack overflow: between 3500 and 3750)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -239,7 +239,7 @@ protected void printUsage() {
System.out.println(" [-collectDistributionStats]");
System.out.println(" [-ingestMetricsDisabled]");
System.out.println(" [-ingestMetricsLabel label]");
System.out.println(" [-compressionType lzo|gz]");
System.out.println(" [-compressionType lzo|gz|zstd]");
System.out.println(" [-compressionTableDisallowList table,table,...");
System.out.println(" [-maxRFileUndeduppedEntries maxEntries]");
System.out.println(" [-maxRFileUncompressedSize maxSize]");
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -241,10 +241,12 @@ public String getQueryIteratorClass() {
return queryIteratorClass;
}

/**
 * Returns the current value of the {@code maxShardsPerDayThreshold} field.
 *
 * @return the stored max-shards-per-day threshold
 * @deprecated since 7.1.0 and flagged for removal. NOTE(review): no replacement is visible here; confirm before pointing callers elsewhere.
 */
@Deprecated(since = "7.1.0", forRemoval = true)
public int getMaxShardsPerDayThreshold() {
return maxShardsPerDayThreshold;
}

/**
 * Stores the given value in the {@code maxShardsPerDayThreshold} field.
 *
 * @param maxShardsPerDayThreshold
 *            the new threshold value; stored as-is with no validation
 * @deprecated since 7.1.0 and flagged for removal. NOTE(review): no replacement is visible here; confirm before pointing callers elsewhere.
 */
@Deprecated(since = "7.1.0", forRemoval = true)
public void setMaxShardsPerDayThreshold(int maxShardsPerDayThreshold) {
this.maxShardsPerDayThreshold = maxShardsPerDayThreshold;
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -1297,18 +1297,22 @@ public void setUnevaluatedFields(Collection<String> unevaluatedFields) {
}
}

/**
 * Returns the current value of the {@code eventPerDayThreshold} field.
 *
 * @return the stored event-per-day threshold
 * @deprecated since 7.1.0 and flagged for removal. NOTE(review): no replacement is visible here; confirm before pointing callers elsewhere.
 */
@Deprecated(since = "7.1.0", forRemoval = true)
public int getEventPerDayThreshold() {
return eventPerDayThreshold;
}

/**
 * Stores the given value in the {@code eventPerDayThreshold} field.
 *
 * @param eventPerDayThreshold
 *            the new threshold value; stored as-is with no validation
 * @deprecated since 7.1.0 and flagged for removal. NOTE(review): no replacement is visible here; confirm before pointing callers elsewhere.
 */
@Deprecated(since = "7.1.0", forRemoval = true)
public void setEventPerDayThreshold(int eventPerDayThreshold) {
this.eventPerDayThreshold = eventPerDayThreshold;
}

/**
 * Returns the current value of the {@code shardsPerDayThreshold} field.
 *
 * @return the stored shards-per-day threshold
 * @deprecated since 7.1.0 and flagged for removal. NOTE(review): no replacement is visible here; confirm before pointing callers elsewhere.
 */
@Deprecated(since = "7.1.0", forRemoval = true)
public int getShardsPerDayThreshold() {
return shardsPerDayThreshold;
}

/**
 * Stores the given value in the {@code shardsPerDayThreshold} field.
 *
 * @param shardsPerDayThreshold
 *            the new threshold value; stored as-is with no validation
 * @deprecated since 7.1.0 and flagged for removal. NOTE(review): no replacement is visible here; confirm before pointing callers elsewhere.
 */
@Deprecated(since = "7.1.0", forRemoval = true)
public void setShardsPerDayThreshold(int shardsPerDayThreshold) {
this.shardsPerDayThreshold = shardsPerDayThreshold;
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -570,8 +570,7 @@ public ScannerStream visit(ASTEQNode node, Object data) {

if (limitScanners) {
// Setup the CreateUidsIterator
scannerSession = scanners.newRangeScanner(config.getIndexTableName(), config.getAuthorizations(), config.getQuery(),
config.getShardsPerDayThreshold());
scannerSession = scanners.newRangeScanner(config.getIndexTableName(), config.getAuthorizations(), config.getQuery());

uidSetting = new IteratorSetting(stackStart++, createUidsIteratorClass);
uidSetting.addOption(CreateUidsIterator.COLLAPSE_UIDS, Boolean.toString(collapseUids));
Expand All @@ -581,8 +580,7 @@ public ScannerStream visit(ASTEQNode node, Object data) {

} else {
// Setup so this is a pass-through
scannerSession = scanners.newRangeScanner(config.getIndexTableName(), config.getAuthorizations(), config.getQuery(),
config.getShardsPerDayThreshold());
scannerSession = scanners.newRangeScanner(config.getIndexTableName(), config.getAuthorizations(), config.getQuery());

uidSetting = new IteratorSetting(stackStart++, createUidsIteratorClass);
uidSetting.addOption(CreateUidsIterator.COLLAPSE_UIDS, Boolean.toString(false));
Expand Down
Loading

0 comments on commit 3aed0d6

Please sign in to comment.