/*
 * search-doc-service
 * Copyright (C) 2020 Memoriav
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see <https://www.gnu.org/licenses/>.
 */

package org.memobase

import ch.memobase.reporting.Report
import ch.memobase.reporting.ReportStatus
import ch.memobase.settings.SettingsLoader
import com.fasterxml.jackson.databind.ObjectMapper
import com.fasterxml.jackson.module.kotlin.registerKotlinModule
import java.io.StringWriter
import org.apache.kafka.streams.StreamsBuilder
import org.apache.kafka.streams.Topology
import org.apache.kafka.streams.kstream.KStream
import org.apache.kafka.streams.kstream.Predicate
import org.apache.logging.log4j.LogManager
import org.memobase.helpers.ElasticSearchWrapper
import org.memobase.helpers.JSON
import org.memobase.helpers.KEYS.SettingsProps
import org.memobase.helpers.TranslationMappers
import org.memobase.model.DocumentsSearchDoc
import org.memobase.model.InstitutionSearchDoc
import org.memobase.model.RecordSetSearchDoc
import org.memobase.model.Schema

/**
 * Assembles the Kafka Streams [Topology] of the search doc service.
 *
 * Messages read from `settings.inputTopic` are parsed and unpacked with [JSON], then routed by
 * the tag they contain (record, institution or record set). Each routed message is handed to the
 * matching search doc builder; the resulting document is written to `settings.outputTopic` and a
 * [Report] describing the outcome is written to `settings.processReportTopic`. Messages carrying
 * none of the known tags only produce a fatal report.
 *
 * @param settings source of the topic names and application properties.
 * @param translationMappers passed on to the document and institution search doc builders.
 * @param elasticSearchWrapper passed on to the institution and record set search doc builders.
 */
class KafkaTopology(
    private val settings: SettingsLoader,
    translationMappers: TranslationMappers,
    elasticSearchWrapper: ElasticSearchWrapper
) {
    private val log = LogManager.getLogger("SearchDocService")

    private val appSettings = settings.appSettings
    private val mediaUrl = appSettings.getProperty(SettingsProps.mediaUrl)
    private val reportTopic = settings.processReportTopic

    private val documentSearchDocBuilder = DocumentsSearchDocBuilder(translationMappers, mediaUrl)
    private val institutionSearchDoc = InstitutionSearchDocBuilder(translationMappers, elasticSearchWrapper)

    private val recordSetSearchDocBuilder =
        RecordSetSearchDocBuilder(elasticSearchWrapper)

    private val jsonWriter = ObjectMapper().registerKotlinModule().writer()

    /**
     * Wires the complete stream graph and returns the built topology.
     *
     * @return the topology produced by the underlying [StreamsBuilder].
     */
    fun build(): Topology {
        val builder = StreamsBuilder()
        val stream = builder.stream<String, String>(settings.inputTopic)
        // Branch order matters: a message goes to the first predicate it satisfies, and the
        // final catch-all predicate collects everything without a known tag.
        val branchedStream = stream
            .mapValues { value -> JSON.parse(value) }
            .filter { _, value -> value.isNotEmpty() }
            .mapValues { value -> JSON.unpack(value) }
            .branch(
                Predicate { _, value -> value.containsKey(JSON.recordTag) },
                Predicate { _, value -> value.containsKey(JSON.institutionTag) },
                Predicate { _, value -> value.containsKey(JSON.recordSetTag) },
                Predicate { _, _ -> true }
            )

        val recordStream = branchedStream[0]
            .mapValues { readOnlyKey, value ->
                transformOrDefault(readOnlyKey, DocumentsSearchDoc.DEFAULT) {
                    documentSearchDocBuilder.transform(readOnlyKey, value)
                }
            }
        outputStreams(recordStream)

        val institutionStream = branchedStream[1]
            .mapValues { readOnlyKey, value ->
                transformOrDefault(readOnlyKey, InstitutionSearchDoc.DEFAULT) {
                    institutionSearchDoc.transform(readOnlyKey, value)
                }
            }
        outputStreams(institutionStream)

        val recordSetStream = branchedStream[2]
            .mapValues { readOnlyKey, value ->
                transformOrDefault(readOnlyKey, RecordSetSearchDoc.DEFAULT) {
                    recordSetSearchDocBuilder.transform(readOnlyKey, value)
                }
            }
        outputStreams(recordSetStream)

        // Untagged messages: report only. The report is serialized with toJson() so that the
        // report topic receives the same JSON string payload that outputStreams() writes to it.
        branchedStream[3]
            .mapValues { readOnlyKey, value ->
                Report(
                    readOnlyKey,
                    ReportStatus.fatal,
                    "No record, memobase institution or record set present in input data: $value.",
                    Service.name
                ).toJson()
            }
            .to(reportTopic)

        return builder.build()
    }

    /**
     * Runs [transform] and pairs its result with a success report; when the transformation
     * rejects the input with an [InvalidInputException], pairs [fallback] with a warning report
     * carrying the exception message instead.
     *
     * @param key message key, used as the report id.
     * @param fallback document emitted when the transformation fails.
     * @param transform the builder call producing the search document.
     * @return the document (or fallback) together with the report describing the outcome.
     */
    private fun transformOrDefault(
        key: String,
        fallback: Schema,
        transform: () -> Schema
    ): Pair<Schema, Report> =
        try {
            Pair(
                transform(),
                Report(key, ReportStatus.success, "Transformed message into search doc.", Service.name)
            )
        } catch (ex: InvalidInputException) {
            Pair(
                fallback,
                Report(key, ReportStatus.warning, ex.localizedMessage, Service.name)
            )
        }

    /**
     * Attaches the two sinks shared by all document branches: the JSON report goes to the
     * report topic and the JSON-serialized search document goes to `settings.outputTopic`.
     *
     * @param stream stream of (search document, report) pairs.
     */
    private fun outputStreams(stream: KStream<String, Pair<Schema, Report>>) {
        stream
            .mapValues { value -> value.second.toJson() }
            .to(reportTopic)

        // NOTE(review): the pairs created in this class only carry success or warning reports,
        // so this filter never drops anything and the DEFAULT documents of failed
        // transformations are forwarded as well - confirm that this is intended.
        stream
            .filterNot { _, value -> value.second.status == ReportStatus.fatal }
            .mapValues { value -> value.first }
            .mapValues { value ->
                val out = StringWriter()
                jsonWriter.writeValue(out, value)
                out.toString()
            }
            .to(settings.outputTopic)
    }
}