/*
 * sftp-reader
 * Copyright (C) 2019  Memobase
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see <https://www.gnu.org/licenses/>.
 */
package org.memobase
Jonas Waeber's avatar
Jonas Waeber committed
19

Jonas Waeber's avatar
Jonas Waeber committed
20
21
import com.beust.klaxon.Klaxon
import java.io.FileInputStream
import java.time.Duration
import java.util.Properties
import java.util.concurrent.ExecutionException
import java.util.concurrent.TimeUnit
import java.util.concurrent.TimeoutException
import java.util.stream.Stream
import org.apache.kafka.clients.admin.AdminClient
import org.apache.kafka.clients.admin.AdminClientConfig
import org.apache.kafka.clients.consumer.ConsumerConfig
import org.apache.kafka.clients.consumer.ConsumerRecords
import org.apache.kafka.clients.consumer.KafkaConsumer
import org.apache.kafka.common.TopicPartition
import org.apache.kafka.common.serialization.StringDeserializer
import org.apache.logging.log4j.LogManager
import org.assertj.core.api.Assertions.assertThat
import org.junit.jupiter.api.AfterAll
import org.junit.jupiter.api.TestInstance
import org.junit.jupiter.api.extension.ExtendWith
import org.junit.jupiter.params.ParameterizedTest
import org.junit.jupiter.params.provider.MethodSource
import org.memobase.extensions.EmbeddedKafkaExtension
import org.memobase.extensions.EmbeddedSftpServer
Jonas Waeber's avatar
Jonas Waeber committed
39

Jonas Waeber's avatar
Jonas Waeber committed
40
/**
 * Integration tests that run [Service] against an embedded SFTP server and the Kafka broker
 * provided by [EmbeddedKafkaExtension].
 *
 * Each parameterized case runs the service with one configuration file and then expects
 * exactly one record on each of three topics: the output topic, the per-file reporting topic
 * (output topic name + "-reporting") and the process report topic.
 */
@ExtendWith(EmbeddedKafkaExtension::class)
@TestInstance(TestInstance.Lifecycle.PER_CLASS)
class Tests {
    private val log = LogManager.getLogger("LocalTestsLogger")

    private val sftpServer = EmbeddedSftpServer(22000, "user", "password")

    private val adminClient =
            AdminClient.create(mapOf(AdminClientConfig.BOOTSTRAP_SERVERS_CONFIG to BOOTSTRAP_SERVERS))

    init {
        sftpServer.createDirectories(
                "/memobase/test_institution_1/test_record_set_1/",
                "/memobase/test_institution_2/test_record_set_2/"
        )
        // NOTE(review): only the directories of institutions 1 and 2 are created explicitly;
        // presumably putFile creates missing parent directories for 3 and 4 - confirm.
        listOf(
                "/memobase/test_institution_1/test_record_set_1/brandt.csv" to
                        "src/test/resources/data/brandt.csv",
                "/memobase/test_institution_2/test_record_set_2/bauGAZH_metadaten.csv" to
                        "src/test/resources/data/bauGAZH_metadaten.csv",
                "/memobase/test_institution_3/test_record_set_3/invalid.csv" to
                        "src/test/resources/data/invalid.csv",
                "/memobase/test_institution_4/test_record_set_4/file.txt" to
                        "src/test/resources/data/file.txt"
        ).forEach { (remotePath, localPath) ->
            // Close the local fixture stream once it has been handed to the SFTP server.
            FileInputStream(localPath).use { stream -> sftpServer.putFile(remotePath, stream) }
        }
    }

    // A single consumer is shared by all cases; it is re-assigned to one topic partition at a time.
    private val consumer = KafkaConsumer<String, String>(
            Properties().apply {
                setProperty(ConsumerConfig.BOOTSTRAP_SERVERS_CONFIG, BOOTSTRAP_SERVERS)
                setProperty(ConsumerConfig.CLIENT_ID_CONFIG, "test-group-1")
                setProperty(ConsumerConfig.GROUP_ID_CONFIG, "test-group-1")
                setProperty(ConsumerConfig.KEY_DESERIALIZER_CLASS_CONFIG, StringDeserializer::class.java.name)
                setProperty(ConsumerConfig.VALUE_DESERIALIZER_CLASS_CONFIG, StringDeserializer::class.java.name)
                setProperty(ConsumerConfig.AUTO_OFFSET_RESET_CONFIG, "earliest")
            }
    )

    /**
     * Releases the Kafka clients created for this test class.
     */
    @AfterAll
    fun closeClients() {
        consumer.close(CLEANUP_TIMEOUT)
        adminClient.close()
    }

    /**
     * Runs the service with the configuration of [params] and verifies the single record
     * written to the output, reporting and process report topics.
     *
     * The topics are deleted afterwards, also when an assertion fails, so that a failing
     * case does not leave its records behind.
     */
    @ParameterizedTest
    @MethodSource("directoryReaderTests")
    fun `read valid csv from sftp`(params: TestParams) {
        val service = Service(params.configFile)
        service.run()

        val topic = service.settings.outputTopic
        val reportingTopic = service.settings.outputTopic + "-reporting"
        val processReportingTopic = service.settings.processReportTopic

        try {
            val result = pollTopic(topic)
            val resultReport = pollTopic(reportingTopic)
            val processReportResult = pollTopic(processReportingTopic)

            assertThat(result.records(topic))
                    .describedAs("Record Results")
                    .hasSize(1)
                    .first()
                    .hasFieldOrPropertyWithValue("key", params.expectedKey)
                    .hasFieldOrPropertyWithValue("value", params.expectedValue)

            assertThat(resultReport.records(reportingTopic))
                    .describedAs("Report Results")
                    .hasSize(1)
                    .first()
                    .hasFieldOrPropertyWithValue("key", params.expectedKey)
                    .hasFieldOrPropertyWithValue("value", params.expectedReportValue)

            assertThat(processReportResult.records(processReportingTopic))
                    .describedAs("Report Process Results")
                    .hasSize(1)
                    .first()
                    .hasFieldOrPropertyWithValue("key", params.expectedProcessReport.id)
                    .hasFieldOrPropertyWithValue("value", Klaxon().toJsonString(params.expectedProcessReport))
        } finally {
            // cleanup inside of class because there is no way to access topics outside of this function.
            deleteTopics(listOf(topic, reportingTopic, processReportingTopic))
        }
    }

    /**
     * Assigns the shared consumer to partition 0 of [topic] and polls until a non-empty batch
     * arrives.
     *
     * @return the first non-empty batch of records.
     * @throws AssertionError if no record arrives within [POLL_TIMEOUT], so a service that
     * produces nothing fails the test instead of blocking it forever.
     */
    private fun pollTopic(topic: String): ConsumerRecords<String, String> {
        consumer.assign(listOf(TopicPartition(topic, 0)))
        val start = System.nanoTime()
        var records = consumer.poll(POLL_INTERVAL)
        // Compare elapsed time rather than absolute values; nanoTime has an arbitrary origin.
        while (records.isEmpty && System.nanoTime() - start < POLL_TIMEOUT.toNanos()) {
            records = consumer.poll(POLL_INTERVAL)
        }
        if (records.isEmpty) {
            throw AssertionError("No records received on topic '$topic' within $POLL_TIMEOUT.")
        }
        return records
    }

    /**
     * Deletes [topics] and waits for the request to complete.
     *
     * Failures are logged instead of rethrown: this runs in a `finally` block and must not
     * replace the assertion failure of the test itself.
     */
    private fun deleteTopics(topics: List<String>) {
        try {
            adminClient.deleteTopics(topics).all().get(CLEANUP_TIMEOUT.toMillis(), TimeUnit.MILLISECONDS)
        } catch (ex: InterruptedException) {
            Thread.currentThread().interrupt()
            log.warn("Interrupted while deleting topics {}.", topics)
        } catch (ex: ExecutionException) {
            log.warn("Could not delete topics {}.", topics, ex)
        } catch (ex: TimeoutException) {
            log.warn("Timed out while deleting topics {}.", topics, ex)
        }
    }

    /**
     * Argument source for the parameterized test above: one case per configuration file,
     * two with valid CSV files and two that are expected to be reported as failures.
     */
    private fun directoryReaderTests() = Stream.of(
            TestParams(
                    "test1.yml",
                    expectedKey = "brandt.csv",
                    expectedValue = "{\"format\" : \"CSV\", \"path\" : \"/memobase/test_institution_1/test_record_set_1/brandt.csv\"}",
                    expectedReportValue = Klaxon().toJsonString(Report(
                            id = "brandt.csv",
                            status = "SUCCESS",
                            message = "Validated file at path /memobase/test_institution_1/test_record_set_1/brandt.csv with format CSV.")),
                    expectedProcessReport = Report(
                            id = "jobXYZ",
                            status = "SUCCESS",
                            message = "Successfully validated 1 files."
                    )
            ),
            TestParams(
                    "test2.yml",
                    expectedKey = "bauGAZH_metadaten.csv",
                    expectedValue = "{\"format\" : \"CSV\", \"path\" : \"/memobase/test_institution_2/test_record_set_2/bauGAZH_metadaten.csv\"}",
                    expectedReportValue = Klaxon().toJsonString(Report(
                            id = "bauGAZH_metadaten.csv",
                            status = "SUCCESS",
                            message = "Validated file at path /memobase/test_institution_2/test_record_set_2/bauGAZH_metadaten.csv with format CSV.")),
                    expectedProcessReport = Report(
                            id = "jobXYZ",
                            status = "SUCCESS",
                            message = "Successfully validated 1 files."
                    )
            ),
            TestParams(
                    "test3.yml",
                    expectedKey = "invalid.csv",
                    expectedValue = "{\"format\" : \"ERROR\", \"path\" : \"/memobase/test_institution_3/test_record_set_3/invalid.csv\"}",
                    expectedReportValue = Klaxon().toJsonString(Report(
                            id = "invalid.csv",
                            status = "FAILURE",
                            message = "CSV ERROR: Fields num seems to be 5 on each row, but on 2th csv row, fields num is 7.")),
                    expectedProcessReport = Report(
                            id = "jobXYZ",
                            status = "FAILURE",
                            message = "Failed to validate 1 of 1 files."
                    )
            ),
            TestParams(
                    "test4.yml",
                    expectedKey = "file.txt",
                    expectedValue = "{\"format\" : \"ERROR\", \"path\" : \"/memobase/test_institution_4/test_record_set_4/file.txt\"}",
                    expectedReportValue = Klaxon().toJsonString(Report(
                            id = "file.txt",
                            status = "FAILURE",
                            message = "File Extension Error: Not a valid file extension: file.txt.")),
                    expectedProcessReport = Report(
                            id = "jobXYZ",
                            status = "FAILURE",
                            message = "Failed to validate 1 of 1 files."
                    )
            )
    )

    private companion object {
        /** Address of the Kafka broker used by both the admin client and the consumer. */
        const val BOOTSTRAP_SERVERS = "localhost:12345"

        /** Maximum time a single `poll` call blocks while waiting for records. */
        val POLL_INTERVAL: Duration = Duration.ofMillis(100)

        /** Maximum total time to wait for the first record on a topic. */
        val POLL_TIMEOUT: Duration = Duration.ofSeconds(30)

        /** Maximum time to wait for topic deletion and for closing the consumer. */
        val CLEANUP_TIMEOUT: Duration = Duration.ofSeconds(10)
    }
}