Skip to content

Commit 3e30d8c

Browse files
committed
Indexing performance improvements
1 parent d799f87 commit 3e30d8c

File tree

4 files changed

+7
-8
lines changed

4 files changed

+7
-8
lines changed

projects/person-search-index-from-delius/container/pipelines/contact/index/index-template-semantic.yml

Lines changed: 2 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1236,8 +1236,8 @@ template:
12361236
endTime:
12371237
type: date
12381238
format: hour_minute_second
1239-
text:
1240-
type: text
1239+
textChunks:
1240+
type: keyword
12411241
textEmbedding:
12421242
type: nested
12431243
properties:
@@ -1249,17 +1249,14 @@ template:
12491249
name: hnsw
12501250
engine: lucene
12511251
notes:
1252-
copy_to: text
12531252
type: text
12541253
analyzer: probation_text_analyzer
12551254
boost: 5
12561255
description:
1257-
copy_to: text
12581256
type: text
12591257
analyzer: probation_text_analyzer
12601258
boost: 4
12611259
outcome:
1262-
copy_to: text
12631260
type: text
12641261
analyzer: probation_text_analyzer
12651262
store: true
@@ -1268,7 +1265,6 @@ template:
12681265
keyword:
12691266
type: keyword
12701267
type:
1271-
copy_to: text
12721268
type: text
12731269
analyzer: probation_text_analyzer
12741270
store: true

projects/person-search-index-from-delius/container/pipelines/contact/index/ingest-pipeline.tpl.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@
1616
"algorithm": {
1717
"fixed_token_length": {
1818
"token_limit": 32,
19+
"max_chunk_limit": -1,
1920
"overlap_rate": 0.125,
2021
"tokenizer": "standard"
2122
}

projects/person-search-index-from-delius/container/pipelines/contact/logstash-incremental.conf

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -49,6 +49,7 @@ filter {
4949
jdbc_password => "${JDBC_PASSWORD}"
5050
jdbc_validate_connection => true
5151
jdbc_validation_timeout => 120
52+
sequel_opts => { max_connections => 100 }
5253
statement => "
5354
select contact_id
5455
from contact join offender on offender.offender_id = contact.offender_id
@@ -89,6 +90,7 @@ filter {
8990
jdbc_password => "${JDBC_PASSWORD}"
9091
jdbc_validate_connection => true
9192
jdbc_validation_timeout => 120
93+
sequel_opts => { max_connections => 100 }
9294
statement => "${INCREMENTAL_STATEMENT_SQL}"
9395
use_prepared_statements => true
9496
prepared_statement_name => "search_indexer_contact_incremental"

projects/person-search-index-from-delius/deploy/values.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -29,8 +29,8 @@ generic-service:
2929
CONTACT_INDEX_PREFIX: contact-search
3030
PERSON_INDEX_PREFIX: person-search
3131
PIPELINES_ENABLED: person-incremental,contact-incremental
32-
PIPELINE_WORKERS: 10
33-
PIPELINE_BATCH_SIZE: 1
32+
PIPELINE_WORKERS: 50
33+
PIPELINE_BATCH_SIZE: 5
3434
JDK_JAVA_OPTIONS: ''
3535
LS_JAVA_OPTS: -Xms3g -Xmx3g # = 75% of pod memory limit (see above)
3636

0 commit comments

Comments
 (0)