/*
 * Table Data Import Service
 * Copyright (C) 2020 Memoriav
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see <https://www.gnu.org/licenses/>.
 */

package org.memobase

import com.fasterxml.jackson.databind.ObjectMapper
import com.fasterxml.jackson.module.kotlin.registerKotlinModule
import org.apache.kafka.streams.StreamsBuilder
import org.apache.kafka.streams.Topology
import org.apache.kafka.streams.kstream.KStream
import org.apache.kafka.streams.kstream.Predicate
import org.apache.logging.log4j.LogManager
import org.memobase.helpers.Default
import org.memobase.helpers.JSON
import org.memobase.helpers.KEYS
import org.memobase.helpers.ReportStatus
import org.memobase.model.DocumentsSearchDoc
import org.memobase.model.Report
import org.memobase.model.Schema
import org.memobase.settings.SettingsLoader
import java.io.StringWriter

/**
 * Assembles the Kafka Streams topology that converts incoming JSON messages into search documents.
 *
 * Each message read from `settings.inputTopic` is parsed, unpacked and routed by the key it
 * contains (`JSON.record`, `JSON.institution`, `JSON.recordSet`, or none of them). For the record
 * and institution branches a search document is written to `settings.outputTopic` on success, and
 * a JSON-serialized [Report] is always written to `settings.processReportTopic`.
 *
 * @param settings provides the topic names and the application properties used by the builders.
 */
class KafkaTopology(private val settings: SettingsLoader) {
    private val log = LogManager.getLogger("SearchDocService")

    private val reportTopic = settings.processReportTopic

    private val searchDocTransform =
        DocumentsSearchDocBuilder(settings.appSettings.getProperty(KEYS.SettingsProps.mediaUrl))
    private val institutionSearchDoc =
        InstitutionSearchDocBuilder(settings.appSettings.getProperty(KEYS.SettingsProps.institutionTypeLabelsPath))

    private val jsonWriter = ObjectMapper().registerKotlinModule().writer()

    /**
     * Builds the processing topology.
     *
     * @return the topology, ready to be handed to a Kafka Streams instance.
     */
    fun build(): Topology {
        val builder = StreamsBuilder()
        val stream = builder.stream<String, String>(settings.inputTopic)
        val branchedStream = stream
            .mapValues { value -> JSON.parse(value) }
            // Messages whose parsed value is empty are dropped without a report.
            .filter { _, value -> value.isNotEmpty() }
            .mapValues { value -> JSON.unpack(value) }
            // Branch order matters: a message goes to the first predicate it matches.
            // Index 0 = record, 1 = institution, 2 = record set, 3 = everything else.
            .branch(
                Predicate { _, value -> value.containsKey(JSON.record) },
                Predicate { _, value -> value.containsKey(JSON.institution) },
                Predicate { _, value -> value.containsKey(JSON.recordSet) },
                Predicate { _, _ -> true }
            )

        val recordStream = branchedStream[0]
            .mapValues { readOnlyKey, value ->
                try {
                    Pair(
                        searchDocTransform.transform(value),
                        Report(readOnlyKey, SUCCESS, "Transformed message into search doc.")
                    )
                } catch (ex: InvalidInputException) {
                    // The placeholder document is never published: outputStreams filters failures.
                    Pair(DocumentsSearchDoc.DEFAULT, Report(readOnlyKey, FAILURE, ex.localizedMessage))
                }
            }
        outputStreams(recordStream)

        val institutionStream = branchedStream[1]
            .mapValues { readOnlyKey, value ->
                try {
                    Pair(
                        institutionSearchDoc.transform(readOnlyKey, value),
                        Report(readOnlyKey, SUCCESS, "Transformed message into search doc.")
                    )
                } catch (ex: InvalidInputException) {
                    // The placeholder document is never published: outputStreams filters failures.
                    Pair(Default.institutionSearchDoc, Report(readOnlyKey, FAILURE, ex.localizedMessage))
                }
            }
        outputStreams(institutionStream)

        // NOTE(review): branchedStream[2] (record sets) is never consumed, so those messages are
        // dropped without producing a document or a report. Confirm this is intended.

        branchedStream[3]
            .mapValues { readOnlyKey, value ->
                // Serialize to JSON like every other report sent to the report topic; sending the
                // raw Report object would not match the String values written by outputStreams.
                Report(
                    readOnlyKey,
                    ReportStatus.fatal,
                    "No record, memobase institution or record set present in input data: $value."
                ).toJson()
            }
            .to(reportTopic)

        return builder.build()
    }

    /**
     * Publishes the results of a transformation branch.
     *
     * The report of every message is written as JSON to the report topic. The search document is
     * serialized to JSON and written to `settings.outputTopic` only when the report status is not
     * a failure.
     *
     * @param stream pairs of (search document, report) keyed by the message key.
     */
    private fun outputStreams(stream: KStream<String, Pair<Schema, Report>>) {
        stream
            .mapValues { value -> value.second.toJson() }
            .to(reportTopic)

        stream
            .filterNot { _, value -> value.second.status == FAILURE }
            .mapValues { value -> jsonWriter.writeValueAsString(value.first) }
            .to(settings.outputTopic)
    }

    private companion object {
        // Status strings shared by report creation in build() and the filter in outputStreams().
        const val SUCCESS = "SUCCESS"
        const val FAILURE = "FAILURE"
    }
}