Skip to content

Commit

Permalink
fix: sort on all languages for anbefaltTerm, case-insensitive
Browse files Browse the repository at this point in the history
  • Loading branch information
jeffreiffers committed Oct 16, 2024
1 parent 8f4f10f commit e0f7300
Show file tree
Hide file tree
Showing 9 changed files with 218 additions and 33 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -21,12 +21,18 @@ class ElasticUpdater(
fun reindexElastic() = runBlocking {
launch {
try {
logger.info("deleting all current concepts")

Check warning on line 24 in src/main/kotlin/no/fdk/concept_catalog/elastic/ElasticUpdater.kt

View check run for this annotation

Codecov / codecov/patch

src/main/kotlin/no/fdk/concept_catalog/elastic/ElasticUpdater.kt#L24

Added line #L24 was not covered by tests
currentConceptRepository.deleteAll()
} catch (_: Exception) { }

conceptRepository.findAll<BegrepDBO>()
.forEach {
if (it.shouldBeCurrent(currentConceptRepository.findByIdOrNull(it.originaltBegrep))) currentConceptRepository.save(CurrentConcept(it))
if (it.shouldBeCurrent(currentConceptRepository.findByIdOrNull(it.originaltBegrep))) {
logger.info("reindexing ${it.id}, ${it.ansvarligVirksomhet.id}")
currentConceptRepository.save(CurrentConcept(it))

Check warning on line 32 in src/main/kotlin/no/fdk/concept_catalog/elastic/ElasticUpdater.kt

View check run for this annotation

Codecov / codecov/patch

src/main/kotlin/no/fdk/concept_catalog/elastic/ElasticUpdater.kt#L31-L32

Added lines #L31 - L32 were not covered by tests
} else {
logger.info("skipping not current ${it.id}, ${it.ansvarligVirksomhet.id}")

Check warning on line 34 in src/main/kotlin/no/fdk/concept_catalog/elastic/ElasticUpdater.kt

View check run for this annotation

Codecov / codecov/patch

src/main/kotlin/no/fdk/concept_catalog/elastic/ElasticUpdater.kt#L34

Added line #L34 was not covered by tests
}
}

logger.info("finished reindexing elastic")
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -6,10 +6,14 @@ import org.springframework.data.annotation.Id
import org.springframework.data.elasticsearch.annotations.Document
import org.springframework.data.elasticsearch.annotations.Field
import org.springframework.data.elasticsearch.annotations.FieldType
import org.springframework.data.elasticsearch.annotations.Mapping
import org.springframework.data.elasticsearch.annotations.Setting
import java.time.Instant
import java.time.LocalDate

@Document(indexName = "concepts-current")
@Setting(settingPath = "/elasticsearch/current-concept-settings.json")
@Mapping(mappingPath = "/elasticsearch/current-concept-mappings.json")
@JsonInclude(JsonInclude.Include.NON_NULL)
data class CurrentConcept(
val idOfThisVersion: String,
Expand Down
12 changes: 6 additions & 6 deletions src/main/kotlin/no/fdk/concept_catalog/model/SortField.kt
Original file line number Diff line number Diff line change
@@ -1,13 +1,13 @@
package no.fdk.concept_catalog.model

enum class SortFieldEnum(val label: String) {
SIST_ENDRET("sistEndret"),
ANBEFALT_TERM_NB("anbefaltTerm.nb"),
enum class SortFieldEnum {
SIST_ENDRET,
ANBEFALT_TERM,
}

enum class SortDirection(val label: String) {
ASC("ASC"),
DESC("DESC"),
enum class SortDirection {
ASC,
DESC,
}

class SortField(
Expand Down
120 changes: 98 additions & 22 deletions src/main/kotlin/no/fdk/concept_catalog/service/ConceptSearchService.kt
Original file line number Diff line number Diff line change
@@ -1,9 +1,11 @@
package no.fdk.concept_catalog.service

import co.elastic.clients.elasticsearch._types.ScriptSortType
import co.elastic.clients.elasticsearch._types.SortOrder
import co.elastic.clients.elasticsearch._types.query_dsl.Operator
import co.elastic.clients.elasticsearch._types.query_dsl.TextQueryType
import no.fdk.concept_catalog.model.*
import org.slf4j.LoggerFactory
import org.springframework.data.domain.Pageable
import org.springframework.data.elasticsearch.client.elc.NativeQuery
import org.springframework.data.elasticsearch.client.elc.NativeQueryBuilder
Expand All @@ -18,19 +20,28 @@ class ConceptSearchService(
private val elasticsearchOperations: ElasticsearchOperations
) {

private val logger = LoggerFactory.getLogger(ConceptSearchService::class.java)

fun suggestConcepts(orgNumber: String, published: Boolean?, query: String): SearchHits<CurrentConcept> =
elasticsearchOperations.search(
suggestionQuery(orgNumber, published, query),
CurrentConcept::class.java,
IndexCoordinates.of("concepts-current")
)

fun searchCurrentConcepts(orgNumber: String, search: SearchOperation): SearchHits<CurrentConcept> =
elasticsearchOperations.search(
search.toElasticQuery(orgNumber),
CurrentConcept::class.java,
IndexCoordinates.of("concepts-current")
)
fun searchCurrentConcepts(orgNumber: String, search: SearchOperation): SearchHits<CurrentConcept> {
try {
val query = search.toElasticQuery(orgNumber)
return elasticsearchOperations.search(
query,
CurrentConcept::class.java,
IndexCoordinates.of("concepts-current")
)
} catch (e: Exception) {
logger.error("Failed to search for concepts", e)
throw RuntimeException("Failed to search for concepts", e)

Check warning on line 42 in src/main/kotlin/no/fdk/concept_catalog/service/ConceptSearchService.kt

View check run for this annotation

Codecov / codecov/patch

src/main/kotlin/no/fdk/concept_catalog/service/ConceptSearchService.kt#L40-L42

Added lines #L40 - L42 were not covered by tests
}
}

private fun suggestionQuery(orgNumber: String, published: Boolean?, query: String): Query {
val builder = NativeQuery.builder()
Expand All @@ -40,14 +51,89 @@ class ConceptSearchService(
}
}
builder.withQuery { queryBuilder ->
queryBuilder.matchPhrasePrefix { matchBuilder ->
matchBuilder.query(query)
.field("anbefaltTerm.navn.nb")
queryBuilder.bool { boolBuilder ->
boolBuilder.should { shouldBuilder1 ->
shouldBuilder1.matchPhrasePrefix { matchBuilder ->
matchBuilder.query(query)
.field("anbefaltTerm.navn.nb")
}
}
boolBuilder.should { shouldBuilder2 ->
shouldBuilder2.bool { nnFieldCheck ->
nnFieldCheck.mustNot { mustNotBuilder ->
mustNotBuilder.exists { existsBuilder ->
existsBuilder.field("anbefaltTerm.navn.nb")
}
mustNotBuilder.term { termBuilder ->
termBuilder
.field("anbefaltTerm.navn.nb")
.value("")
}
}
nnFieldCheck.should { shouldBuilder ->
shouldBuilder.matchPhrasePrefix { matchBuilder ->
matchBuilder.query(query)
.field("anbefaltTerm.navn.nn")
}
}
}
}
boolBuilder.should { shouldBuilder3 ->
shouldBuilder3.bool { enFieldCheck ->
enFieldCheck.mustNot { mustNotBuilder1 ->
mustNotBuilder1.exists { existsBuilder1 ->
existsBuilder1.field("anbefaltTerm.navn.nb")
}
mustNotBuilder1.term { termBuilder ->
termBuilder
.field("anbefaltTerm.navn.nb")
.value("")
}
}
enFieldCheck.mustNot { mustNotBuilder2 ->
mustNotBuilder2.exists { existsBuilder2 ->
existsBuilder2.field("anbefaltTerm.navn.nn")
}
mustNotBuilder2.term { termBuilder ->
termBuilder
.field("anbefaltTerm.navn.nn")
.value("")
}
}
enFieldCheck.should { shouldBuilder ->
shouldBuilder.matchPhrasePrefix { matchBuilder ->
matchBuilder.query(query)
.field("anbefaltTerm.navn.en")
}
}
}
}
}
}
builder.withSort { sortBuilder ->
sortBuilder.field { fieldBuilder ->
fieldBuilder.field("anbefaltTerm_sort").order(SortOrder.Desc)
}
}
return builder.build()
}

private fun SortField.buildSort(builder: NativeQueryBuilder) {
if (field == SortFieldEnum.ANBEFALT_TERM) {
builder.withSort { sortBuilder ->
sortBuilder.field { fieldBuilder ->
fieldBuilder.field("anbefaltTerm_sort").order(sortDirection())
}
}
} else {
builder.withSort { sortBuilder ->
sortBuilder.field { fieldBuilder ->
fieldBuilder.field("endringslogelement.endringstidspunkt").order(sortDirection())
}
}
}
}

private fun SearchOperation.toElasticQuery(orgNumber: String): Query {
val builder = NativeQuery.builder()
builder.withFilter { queryBuilder ->
Expand All @@ -59,13 +145,7 @@ class ConceptSearchService(
)
}
}
if (sort != null) {
builder.withSort { sortBuilder ->
sortBuilder.field { fieldBuilder ->
fieldBuilder.field(sort.sortField()).order(sort.sortDirection())
}
}
}
sort?.buildSort(builder)
if (!query.isNullOrBlank()) builder.addFieldsQuery(fields, query)
builder.withPageable(Pageable.ofSize(pagination.getSize()).withPage(pagination.getPage()))

Expand Down Expand Up @@ -105,12 +185,6 @@ class ConceptSearchService(
else -> SortOrder.Desc
}

private fun SortField.sortField(): String =
when (field) {
SortFieldEnum.ANBEFALT_TERM_NB -> "anbefaltTerm.navn.nb.keyword"
else -> "endringslogelement.endringstidspunkt"
}

private fun QueryFields.exactPaths(): List<String> =
listOf(
if (anbefaltTerm) languagePaths("anbefaltTerm.navn", 30)
Expand Down Expand Up @@ -153,3 +227,5 @@ class ConceptSearchService(
"$basePath.en${if (boost != null) "^$boost" else ""}")

}


Original file line number Diff line number Diff line change
Expand Up @@ -266,7 +266,6 @@ class ConceptService(

fun searchConcepts(orgNumber: String, search: SearchOperation): Paginated {
val hits = conceptSearchService.searchCurrentConcepts(orgNumber, search)

return hits.map { it.content }
.map { it.toDBO() }
.map { it.withHighestVersionDTO() }
Expand Down
68 changes: 68 additions & 0 deletions src/main/resources/elasticsearch/current-concept-mappings.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,68 @@
{
"runtime": {
"anbefaltTerm_sort": {
"type": "keyword",
"script": {
"source": "if (doc.containsKey('anbefaltTerm.navn.nb.keyword_lower') && doc['anbefaltTerm.navn.nb.keyword_lower'].size() > 0 && doc['anbefaltTerm.navn.nb.keyword_lower'].value != null && !doc['anbefaltTerm.navn.nb.keyword_lower'].value.isEmpty()) {emit(doc['anbefaltTerm.navn.nb.keyword_lower'].value);} else if (doc.containsKey('anbefaltTerm.navn.nn.keyword_lower') && doc['anbefaltTerm.navn.nn.keyword_lower'].size() > 0 && doc['anbefaltTerm.navn.nn.keyword_lower'].value != null && !doc['anbefaltTerm.navn.nn.keyword_lower'].value.isEmpty()) {emit(doc['anbefaltTerm.navn.nn.keyword_lower'].value);} else if (doc.containsKey('anbefaltTerm.navn.en.keyword_lower') && doc['anbefaltTerm.navn.en.keyword_lower'].size() > 0 && doc['anbefaltTerm.navn.en.keyword_lower'].value != null && !doc['anbefaltTerm.navn.en.keyword_lower'].value.isEmpty()) {emit(doc['anbefaltTerm.navn.en.keyword_lower'].value);} else {emit(null);}"
}
}
},
"properties": {
"anbefaltTerm": {
"properties": {
"navn": {
"properties": {
"en": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256,
"doc_values": true
},
"keyword_lower": {
"type": "keyword",
"ignore_above": 256,
"normalizer": "lowercase_normalizer",
"doc_values": true
}
}
},
"nb": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256,
"doc_values": true
},
"keyword_lower": {
"type": "keyword",
"ignore_above": 256,
"normalizer": "lowercase_normalizer",
"doc_values": true
}
}
},
"nn": {
"type": "text",
"fields": {
"keyword": {
"type": "keyword",
"ignore_above": 256,
"doc_values": true
},
"keyword_lower": {
"type": "keyword",
"ignore_above": 256,
"normalizer": "lowercase_normalizer",
"doc_values": true
}
}
}
}
}
}
}
}
}
11 changes: 11 additions & 0 deletions src/main/resources/elasticsearch/current-concept-settings.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
{
"analysis": {
"normalizer": {
"lowercase_normalizer": {
"type": "custom",
"char_filter": [],
"filter": ["lowercase"]
}
}
}
}
25 changes: 23 additions & 2 deletions src/test/kotlin/no/fdk/concept_catalog/contract/SearchConcepts.kt
Original file line number Diff line number Diff line change
Expand Up @@ -572,11 +572,30 @@ class SearchConcepts : ApiTestContext() {
assertEquals(listOf(BEGREP_2, BEGREP_0, BEGREP_1), result.hits)
}

@Test
fun `Query returns sorted results ordered by anbefaltTerm ascending`() {
val searchOp = SearchOperation(
query = "",
sort = SortField(field = SortFieldEnum.ANBEFALT_TERM, direction = SortDirection.ASC)
)
val rsp = authorizedRequest(
"/begreper/search?orgNummer=123456789",
port, mapper.writeValueAsString(searchOp), JwtToken(Access.ORG_WRITE).toString(),
HttpMethod.POST
)
assertEquals(HttpStatus.OK.value(), rsp["status"])

val result: Paginated = mapper.readValue(rsp["body"] as String)
assertEquals(BEGREP_0.id, result.hits[0].id)
assertEquals(BEGREP_1.id, result.hits[1].id)
assertEquals(BEGREP_2.id, result.hits[2].id)
}

@Test
fun `Query returns sorted results ordered by anbefaltTerm descending`() {
val searchOp = SearchOperation(
query = "",
sort = SortField(field = SortFieldEnum.ANBEFALT_TERM_NB, direction = SortDirection.DESC)
sort = SortField(field = SortFieldEnum.ANBEFALT_TERM, direction = SortDirection.DESC)
)
val rsp = authorizedRequest(
"/begreper/search?orgNummer=123456789",
Expand All @@ -586,7 +605,9 @@ class SearchConcepts : ApiTestContext() {
assertEquals(HttpStatus.OK.value(), rsp["status"])

val result: Paginated = mapper.readValue(rsp["body"] as String)
assertEquals(listOf(BEGREP_0, BEGREP_2, BEGREP_1), result.hits)
assertEquals(BEGREP_2.id, result.hits[0].id)
assertEquals(BEGREP_1.id, result.hits[1].id)
assertEquals(BEGREP_0.id, result.hits[2].id)
}

@Test
Expand Down
2 changes: 1 addition & 1 deletion src/test/kotlin/no/fdk/concept_catalog/utils/TestData.kt
Original file line number Diff line number Diff line change
Expand Up @@ -160,7 +160,7 @@ val BEGREP_2 = Begrep(
gjeldendeRevisjon = null,
status = Status.HOERING,
statusURI = "http://publications.europa.eu/resource/authority/concept-status/CANDIDATE",
anbefaltTerm = Term(navn = mapOf(Pair("nb", "Begrep 2"))),
anbefaltTerm = Term(navn = mapOf(Pair("nb", ""), Pair("nn", "begrep 2"))),
tillattTerm = mapOf(Pair("nb", listOf("Lorem ipsum"))),
ansvarligVirksomhet = Virksomhet(
id = "123456789"
Expand Down

0 comments on commit e0f7300

Please sign in to comment.