Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
34 commits
Select commit Hold shift + click to select a range
11e5dad
[ML] Log categorization multi-bucket agg
benwtrent Apr 2, 2021
f384c16
addressing PR comments
benwtrent Sep 14, 2021
3d7c10e
Merge remote-tracking branch 'upstream/master' into experiment/catego…
benwtrent Sep 14, 2021
397c18e
fixing docs
benwtrent Sep 14, 2021
0999c36
fixing docs
benwtrent Sep 14, 2021
580eb3b
setting maximum values for aggregation
benwtrent Sep 14, 2021
1b70178
adding analyzer etc.
benwtrent Sep 14, 2021
0fe0778
fixing docs
benwtrent Sep 14, 2021
e358ea6
Merge remote-tracking branch 'upstream/master' into experiment/catego…
benwtrent Sep 14, 2021
b4eb65b
fixing result consistency and docs
benwtrent Sep 14, 2021
d81faca
more doc fixes
benwtrent Sep 14, 2021
c67812d
Apply suggestions from code review
benwtrent Sep 15, 2021
1a357dd
Merge branch 'master' into experiment/categorization-aggregation
elasticmachine Sep 20, 2021
a01595f
moving to using token IDs and hashes
benwtrent Sep 22, 2021
bd12b5b
Merge remote-tracking branch 'upstream/master' into experiment/catego…
benwtrent Sep 22, 2021
9ba60fb
moving to bytes ref hash and fixing two bugs
benwtrent Sep 22, 2021
fc1656a
fixing tokenization bug and addressing PR comments
benwtrent Sep 23, 2021
5deb203
updating docs, restricting to 2billion unique tokens
benwtrent Sep 23, 2021
f942f5e
Merge remote-tracking branch 'upstream/master' into experiment/catego…
benwtrent Sep 23, 2021
5aadd74
Merge remote-tracking branch 'upstream/master' into experiment/catego…
benwtrent Sep 23, 2021
1cf93eb
renaming parameters and updating docs
benwtrent Sep 23, 2021
6f940e3
fixing accidental code change
benwtrent Sep 27, 2021
191e9ad
Addressing PR comments
benwtrent Sep 27, 2021
98dc45b
Merge remote-tracking branch 'upstream/master' into experiment/catego…
benwtrent Sep 27, 2021
d49879f
Merge remote-tracking branch 'upstream/master' into experiment/catego…
benwtrent Sep 28, 2021
3210d54
fixing benchmark spotless
benwtrent Sep 28, 2021
41bffb9
Merge branch 'master' into experiment/categorization-aggregation
elasticmachine Sep 28, 2021
b1d2ad0
Merge remote-tracking branch 'upstream/master' into experiment/catego…
benwtrent Sep 29, 2021
6cf0c29
addressing PR comments
benwtrent Sep 29, 2021
80f9f20
Merge branch 'master' into experiment/categorization-aggregation
elasticmachine Sep 30, 2021
9aba6ae
Addressing PR comments and fixing bug
benwtrent Sep 30, 2021
d0b7649
Merge remote-tracking branch 'upstream/master' into experiment/catego…
benwtrent Sep 30, 2021
e483cde
Merge branch 'experiment/categorization-aggregation' of github.com:be…
benwtrent Sep 30, 2021
d82af0a
Merge branch 'master' into experiment/categorization-aggregation
elasticmachine Oct 4, 2021
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,7 @@
import org.elasticsearch.core.Releasables;
import org.elasticsearch.index.Index;
import org.elasticsearch.index.IndexSettings;
import org.elasticsearch.index.analysis.NameOrDefinition;
import org.elasticsearch.index.analysis.NamedAnalyzer;
import org.elasticsearch.index.cache.bitset.BitsetFilterCache;
import org.elasticsearch.index.fielddata.IndexFieldData;
Expand Down Expand Up @@ -197,6 +198,22 @@ public long nowInMillis() {
return 0;
}

/**
 * Analyzer lookup stub: no analyzer is resolved here.
 *
 * @param analyzer name of the requested analyzer; ignored by this implementation
 * @return always {@code null}
 */
// NOTE(review): presumably nothing exercising this context needs a named analyzer — confirm before relying on it.
@Override
public Analyzer getNamedAnalyzer(String analyzer) {
    return null;
}

/**
 * Custom-analyzer construction stub: none of the arguments are inspected and no analyzer is built.
 *
 * @param indexSettings index settings for the analyzer; ignored
 * @param normalizer    flag passed by the caller; ignored
 * @param tokenizer     tokenizer name or inline definition; ignored
 * @param charFilters   char filter names or inline definitions; ignored
 * @param tokenFilters  token filter names or inline definitions; ignored
 * @return always {@code null}
 */
// NOTE(review): presumably nothing exercising this context builds custom analyzers — confirm before relying on it.
@Override
public Analyzer buildCustomAnalyzer(
    IndexSettings indexSettings,
    boolean normalizer,
    NameOrDefinition tokenizer,
    List<NameOrDefinition> charFilters,
    List<NameOrDefinition> tokenFilters
) {
    return null;
}

@Override
protected IndexFieldData<?> buildFieldData(MappedFieldType ft) {
IndexFieldDataCache indexFieldDataCache = indicesFieldDataCache.buildIndexFieldDataCache(new IndexFieldDataCache.Listener() {
Expand Down
33 changes: 33 additions & 0 deletions docs/build.gradle
Original file line number Diff line number Diff line change
Expand Up @@ -1071,6 +1071,39 @@ buildRestTests.setups['farequote_datafeed'] = buildRestTests.setups['farequote_j
"indexes":"farequote"
}
'''
// Docs-test setup 'categorize_text': creates the single-shard, zero-replica `log-messages`
// index (date field `time`, text field `message`) and bulk-indexes six sample log lines
// with `refresh: true`.
// The string body is YAML, so the indentation below is significant: each `do` step must
// nest its API call, and the bulk `body: |` block scalar must contain the indented
// action/document line pairs.
buildRestTests.setups['categorize_text'] = '''
  - do:
      indices.create:
        index: log-messages
        body:
          settings:
            number_of_shards: 1
            number_of_replicas: 0
          mappings:
            properties:
              time:
                type: date
              message:
                type: text

  - do:
      bulk:
        index: log-messages
        refresh: true
        body: |
          {"index": {"_id":"1"}}
          {"time":"2016-02-07T00:01:00+0000", "message": "2016-02-07T00:00:00+0000 Node 3 shutting down"}
          {"index": {"_id":"2"}}
          {"time":"2016-02-07T00:02:00+0000", "message": "2016-02-07T00:00:00+0000 Node 5 starting up"}
          {"index": {"_id":"3"}}
          {"time":"2016-02-07T00:03:00+0000", "message": "2016-02-07T00:00:00+0000 Node 4 shutting down"}
          {"index": {"_id":"4"}}
          {"time":"2016-02-08T00:01:00+0000", "message": "2016-02-08T00:00:00+0000 Node 5 shutting down"}
          {"index": {"_id":"5"}}
          {"time":"2016-02-08T00:02:00+0000", "message": "2016-02-08T00:00:00+0000 User foo_325 logging on"}
          {"index": {"_id":"6"}}
          {"time":"2016-02-08T00:04:00+0000", "message": "2016-02-08T00:00:00+0000 User foo_864 logged off"}
'''
buildRestTests.setups['server_metrics_index'] = '''
- do:
indices.create:
Expand Down
2 changes: 2 additions & 0 deletions docs/reference/aggregations/bucket.asciidoc
Original file line number Diff line number Diff line change
Expand Up @@ -20,6 +20,8 @@ include::bucket/adjacency-matrix-aggregation.asciidoc[]

include::bucket/autodatehistogram-aggregation.asciidoc[]

include::bucket/categorize-text-aggregation.asciidoc[]

include::bucket/children-aggregation.asciidoc[]

include::bucket/composite-aggregation.asciidoc[]
Expand Down
Loading