/*
 * Table Data Import Service
 * Copyright (C) 2020 Memoriav
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see <https://www.gnu.org/licenses/>.
 */

package org.memobase

import com.fasterxml.jackson.databind.ObjectMapper
import com.fasterxml.jackson.module.kotlin.registerKotlinModule
import org.apache.kafka.streams.StreamsBuilder
import org.apache.kafka.streams.Topology
import org.apache.kafka.streams.kstream.KStream
import org.apache.kafka.streams.kstream.Predicate
import org.apache.logging.log4j.LogManager
import org.memobase.helpers.Default
import org.memobase.helpers.JSON
import org.memobase.helpers.KEYS
import org.memobase.helpers.ReportStatus
import org.memobase.model.DocumentsSearchDoc
import org.memobase.model.Report
import org.memobase.model.Schema
import org.memobase.settings.SettingsLoader
import java.io.StringWriter

/**
 * Assembles the Kafka Streams [Topology] that turns incoming JSON messages into search documents.
 *
 * Messages are read from `settings.inputTopic`, parsed, and routed by the top-level key they
 * contain (record, institution, record set, or none of these). For every handled message a
 * [Report] is written to `settings.processReportTopic`; successfully transformed search documents
 * are written to `settings.outputTopic` as JSON.
 *
 * @param settings provides the topic names and the application properties used by the builders.
 */
class KafkaTopology(private val settings: SettingsLoader) {
    private val log = LogManager.getLogger("SearchDocService")

    private val appSettings = settings.appSettings
    private val reportTopic = settings.processReportTopic

    private val searchDocTransform = DocumentsSearchDocBuilder(appSettings.getProperty(KEYS.SettingsProps.mediaUrl))
    private val institutionSearchDoc =
        InstitutionSearchDocBuilder(appSettings.getProperty(KEYS.SettingsProps.institutionTypeLabelsPath), appSettings)

    private val jsonWriter = ObjectMapper().registerKotlinModule().writer()

    /**
     * Wires the stream processing steps together and returns the finished topology.
     *
     * @return the topology reading from the input topic and writing to the output and report topics.
     */
    fun build(): Topology {
        val builder = StreamsBuilder()
        val stream = builder.stream<String, String>(settings.inputTopic)
        val branchedStream = stream
            .mapValues { value -> JSON.parse(value) }
            // Messages whose parse result is empty are dropped without a report.
            .filter { _, value -> value.isNotEmpty() }
            .mapValues { value -> JSON.unpack(value) }
            // Branch order matters: the first matching predicate wins, the last one catches the rest.
            .branch(
                Predicate { _, value -> value.containsKey(JSON.record) },
                Predicate { _, value -> value.containsKey(JSON.institution) },
                Predicate { _, value -> value.containsKey(JSON.recordSet) },
                Predicate { _, _ -> true }
            )

        // Records: a failed transformation yields the default document plus a FAILURE report.
        val recordStream = branchedStream[0]
            .mapValues { readOnlyKey, value ->
                try {
                    Pair(
                        searchDocTransform.transform(value),
                        Report(readOnlyKey, "SUCCESS", "Transformed message into search doc.")
                    )
                } catch (ex: InvalidInputException) {
                    Pair(DocumentsSearchDoc.DEFAULT, Report(readOnlyKey, "FAILURE", ex.localizedMessage))
                }
            }

        outputStreams(recordStream)

        // Institutions: same pattern as records, using the institution builder and its default document.
        val institutionStream = branchedStream[1]
            .mapValues { readOnlyKey, value ->
                try {
                    Pair(
                        institutionSearchDoc.transform(readOnlyKey, value),
                        Report(readOnlyKey, "SUCCESS", "Transformed message into search doc.")
                    )
                } catch (ex: InvalidInputException) {
                    Pair(Default.institutionSearchDoc, Report(readOnlyKey, "FAILURE", ex.localizedMessage))
                }
            }
        outputStreams(institutionStream)

        // NOTE(review): branchedStream[2] (messages containing JSON.recordSet) is not consumed here,
        // so those messages produce neither a search doc nor a report - confirm this is intended.

        // Everything that matched none of the known keys is reported as fatal.
        branchedStream[3]
            .mapValues { readOnlyKey, value ->
                // Serialise the report the same way outputStreams does; no explicit serde is passed
                // to `to(...)`, so the report topic receives the JSON form rather than a Report object.
                Report(
                    readOnlyKey,
                    ReportStatus.fatal,
                    "No record, memobase institution or record set present in input data: $value."
                ).toJson()
            }
            .to(reportTopic)

        return builder.build()
    }

    /**
     * Attaches the two sinks shared by all transformed streams.
     *
     * The report of every message is written to the report topic. The search document is written
     * to the output topic only when the report status is not `"FAILURE"`.
     *
     * @param stream pairs of the transformed search document and the report describing the outcome.
     */
    private fun outputStreams(stream: KStream<String, Pair<Schema, Report>>) {
        stream
            .mapValues { value -> value.second.toJson() }
            .to(reportTopic)

        stream
            .filterNot { _, value -> value.second.status == "FAILURE" }
            .mapValues { value -> value.first }
            .mapValues { value ->
                val out = StringWriter()
                jsonWriter.writeValue(out, value)
                out.toString()
            }
            .to(settings.outputTopic)
    }
}