KafkaTopology.kt 6.16 KB
Newer Older
Jonas Waeber's avatar
Jonas Waeber committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
/*
 * Table Data Import Service
 * Copyright (C) 2020 Memoriav
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see <https://www.gnu.org/licenses/>.
 */

package org.memobase

21
22
23
import ch.memobase.reporting.Report
import ch.memobase.reporting.ReportStatus
import ch.memobase.settings.SettingsLoader
Jonas Waeber's avatar
Jonas Waeber committed
24
25
import com.fasterxml.jackson.databind.ObjectMapper
import com.fasterxml.jackson.module.kotlin.registerKotlinModule
26
import java.io.StringWriter
Jonas Waeber's avatar
Jonas Waeber committed
27
28
import org.apache.kafka.streams.StreamsBuilder
import org.apache.kafka.streams.Topology
29
30
import org.apache.kafka.streams.kstream.KStream
import org.apache.kafka.streams.kstream.Predicate
Jonas Waeber's avatar
Jonas Waeber committed
31
import org.apache.logging.log4j.LogManager
32
import org.memobase.helpers.ElasticSearchWrapper
Jonas Waeber's avatar
Jonas Waeber committed
33
import org.memobase.helpers.JSON
34
import org.memobase.helpers.KEYS
35
import org.memobase.model.DocumentsSearchDoc
36
37
import org.memobase.model.InstitutionSearchDoc
import org.memobase.model.RecordSetSearchDoc
38
import org.memobase.model.Schema
Jonas Waeber's avatar
Jonas Waeber committed
39
40

/**
 * Builds the Kafka Streams topology of this service.
 *
 * Each incoming message is parsed, unpacked and routed to one of four branches depending on
 * which top-level key it contains (record, institution, record set, or none of them). The first
 * three branches are transformed into search documents; for every message a [Report] is written
 * to the report topic, and search documents are written to the output topic.
 *
 * @param settings provides the topic names and the application properties used by the builders.
 */
class KafkaTopology(private val settings: SettingsLoader) {
    private val log = LogManager.getLogger("SearchDocService")

    private val appSettings = settings.appSettings
    private val reportTopic = settings.processReportTopic

    private val searchDocTransform = DocumentsSearchDocBuilder(appSettings.getProperty(KEYS.SettingsProps.mediaUrl))
    private val institutionSearchDoc =
        InstitutionSearchDocBuilder(appSettings.getProperty(KEYS.SettingsProps.institutionTypeLabelsPath), appSettings)

    private val elasticSearchWrapper = ElasticSearchWrapper(settings.appSettings)
    private val recordSetSearchDocBuilder =
        RecordSetSearchDocBuilder(elasticSearchWrapper)

    private val jsonWriter = ObjectMapper().registerKotlinModule().writer()

    /**
     * Assembles the complete topology reading from the configured input topic.
     *
     * @return the topology, ready to be handed to a Kafka Streams instance.
     */
    fun build(): Topology {
        val builder = StreamsBuilder()
        val stream = builder.stream<String, String>(settings.inputTopic)

        // Branch order matters: a message goes to the FIRST predicate that matches, and the
        // catch-all predicate at the end collects everything that matched none of the others.
        val branchedStream = stream
            .mapValues { value -> JSON.parse(value) }
            .filter { _, value -> value.isNotEmpty() }
            .mapValues { value -> JSON.unpack(value) }
            .branch(
                Predicate { _, value -> value.containsKey(JSON.record) },
                Predicate { _, value -> value.containsKey(JSON.institution) },
                Predicate { _, value -> value.containsKey(JSON.recordSet) },
                Predicate { _, _ -> true }
            )

        val recordStream = branchedStream[0]
            .mapValues { readOnlyKey, value ->
                transformWithReport(readOnlyKey, DocumentsSearchDoc.DEFAULT) {
                    searchDocTransform.transform(value)
                }
            }
        outputStreams(recordStream)

        val institutionStream = branchedStream[1]
            .mapValues { readOnlyKey, value ->
                transformWithReport(readOnlyKey, InstitutionSearchDoc.DEFAULT) {
                    institutionSearchDoc.transform(readOnlyKey, value)
                }
            }
        outputStreams(institutionStream)

        val recordSetStream = branchedStream[2]
            .mapValues { readOnlyKey, value ->
                transformWithReport(readOnlyKey, RecordSetSearchDoc.DEFAULT) {
                    recordSetSearchDocBuilder.transform(readOnlyKey, value)
                }
            }
        outputStreams(recordSetStream)

        // Messages that matched none of the known types only produce a fatal report.
        // The report is serialised with toJson(), exactly like the reports emitted by
        // outputStreams(), so that every value written to the report topic has the same form.
        branchedStream[3]
            .mapValues { readOnlyKey, value ->
                Report(
                    readOnlyKey,
                    ReportStatus.fatal,
                    "No record, memobase institution or record set present in input data: $value.",
                    Service.name
                ).toJson()
            }
            .to(reportTopic)

        return builder.build()
    }

    /**
     * Runs [transform] and pairs its result with a success report for [key].
     *
     * If [transform] throws an [InvalidInputException], the [fallback] document is returned
     * instead, paired with a warning report that carries the exception's localized message.
     * Any other exception propagates to the caller.
     *
     * @param key the message key, used as the report identifier.
     * @param fallback the document to emit when the input is invalid.
     * @param transform produces the search document for the current message.
     * @return the search document (or [fallback]) together with its report.
     */
    private fun transformWithReport(
        key: String,
        fallback: Schema,
        transform: () -> Schema
    ): Pair<Schema, Report> =
        try {
            Pair(
                transform(),
                Report(key, ReportStatus.success, "Transformed message into search doc.", Service.name)
            )
        } catch (ex: InvalidInputException) {
            Pair(fallback, Report(key, ReportStatus.warning, ex.localizedMessage, Service.name))
        }

    /**
     * Wires the two sinks of a transformed stream: the report of every message goes to the
     * report topic, and the search document of every message whose report is not fatal is
     * serialised to JSON and sent to the output topic.
     *
     * @param stream pairs of search document and the report describing its transformation.
     */
    private fun outputStreams(stream: KStream<String, Pair<Schema, Report>>) {
        stream
            .mapValues { value -> value.second.toJson() }
            .to(reportTopic)

        stream
            .filterNot { _, value -> value.second.status == ReportStatus.fatal }
            .mapValues { value -> value.first }
            .mapValues { value ->
                val out = StringWriter()
                jsonWriter.writeValue(out, value)
                out.toString()
            }
            .to(settings.outputTopic)
    }
}