/*
 * sftp-reader
 * Copyright (C) 2019  Memobase
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see <https://www.gnu.org/licenses/>.
 */
18
package org.memobase
Jonas Waeber's avatar
Jonas Waeber committed
19

Jonas Waeber's avatar
Jonas Waeber committed
20 21
import com.beust.klaxon.Klaxon
import java.io.FileInputStream
Jonas Waeber's avatar
Jonas Waeber committed
22 23 24
import java.time.Duration
import java.util.Properties
import java.util.stream.Stream
Jonas Waeber's avatar
Jonas Waeber committed
25 26
import org.apache.kafka.clients.admin.AdminClient
import org.apache.kafka.clients.admin.AdminClientConfig
Jonas Waeber's avatar
Jonas Waeber committed
27 28 29 30
import org.apache.kafka.clients.consumer.ConsumerConfig
import org.apache.kafka.clients.consumer.KafkaConsumer
import org.apache.kafka.common.TopicPartition
import org.apache.kafka.common.serialization.StringDeserializer
Jonas Waeber's avatar
Jonas Waeber committed
31
import org.apache.logging.log4j.LogManager
Jonas Waeber's avatar
Jonas Waeber committed
32
import org.assertj.core.api.Assertions.assertThat
Jonas Waeber's avatar
Jonas Waeber committed
33
import org.junit.jupiter.api.TestInstance
34
import org.junit.jupiter.api.extension.ExtendWith
Jonas Waeber's avatar
Jonas Waeber committed
35 36 37 38
import org.junit.jupiter.params.ParameterizedTest
import org.junit.jupiter.params.provider.MethodSource
import org.memobase.extensions.EmbeddedKafkaExtension
import org.memobase.extensions.EmbeddedSftpServer
Jonas Waeber's avatar
Jonas Waeber committed
39

Jonas Waeber's avatar
Jonas Waeber committed
40
/**
 * Integration tests for [Service]: files are placed on an embedded SFTP server, the service is
 * run against a per-case configuration file, and the messages it writes to its Kafka output,
 * reporting and process-report topics are compared with the expected values.
 *
 * A single instance is shared by all parameterized invocations (`PER_CLASS` lifecycle), so the
 * SFTP fixture and the Kafka clients below are created once.
 */
@ExtendWith(EmbeddedKafkaExtension::class)
@TestInstance(TestInstance.Lifecycle.PER_CLASS)
class Tests {
    private val log = LogManager.getLogger("LocalTestsLogger")

    // Broker address shared by the admin client and the consumer.
    // NOTE(review): presumably the address EmbeddedKafkaExtension binds to - confirm.
    private val bootstrapServers = "localhost:12345"

    // Upper bound for waiting on a topic; without it a missing message would hang the build.
    private val pollTimeout: Duration = Duration.ofSeconds(30)

    private val sftpServer = EmbeddedSftpServer(22000, "user", "password")

    private val adminClient =
        AdminClient.create(mapOf(AdminClientConfig.BOOTSTRAP_SERVERS_CONFIG to bootstrapServers))

    init {
        sftpServer.createDirectories(
            "/memobase/test_institution_1/test_record_set_1/",
            "/memobase/test_institution_2/test_record_set_2/"
        )
        // NOTE(review): the directories for institutions 3 and 4 are not created explicitly;
        // presumably putFile creates missing parent directories - verify.
        upload(
            "/memobase/test_institution_1/test_record_set_1/brandt.csv",
            "src/test/resources/data/brandt.csv"
        )
        upload(
            "/memobase/test_institution_2/test_record_set_2/bauGAZH_metadaten.csv",
            "src/test/resources/data/bauGAZH_metadaten.csv"
        )
        upload(
            "/memobase/test_institution_3/test_record_set_3/invalid.csv",
            "src/test/resources/data/invalid.csv"
        )
        upload(
            "/memobase/test_institution_4/test_record_set_4/file.txt",
            "src/test/resources/data/file.txt"
        )
    }

    private val consumer: KafkaConsumer<String, String> = KafkaConsumer(
        Properties().apply {
            setProperty(ConsumerConfig.BOOTSTRAP_SERVERS_CONFIG, bootstrapServers)
            setProperty(ConsumerConfig.CLIENT_ID_CONFIG, "test-group-1")
            setProperty(ConsumerConfig.GROUP_ID_CONFIG, "test-group-1")
            setProperty(ConsumerConfig.KEY_DESERIALIZER_CLASS_CONFIG, StringDeserializer::class.java.name)
            setProperty(ConsumerConfig.VALUE_DESERIALIZER_CLASS_CONFIG, StringDeserializer::class.java.name)
            setProperty(ConsumerConfig.AUTO_OFFSET_RESET_CONFIG, "earliest")
        }
    )

    /**
     * Copies the local file at [localPath] to [remotePath] on the embedded SFTP server and closes
     * the local stream afterwards.
     *
     * Assumes `putFile` has finished reading the stream when it returns - TODO confirm.
     */
    private fun upload(remotePath: String, localPath: String) {
        FileInputStream(localPath).use { stream -> sftpServer.putFile(remotePath, stream) }
    }

    /**
     * Assigns the shared consumer to partition 0 of [topic] and polls until a non-empty batch
     * arrives.
     *
     * The return type is written fully qualified so that no additional import is required.
     *
     * @param topic name of the topic to read from.
     * @return the first non-empty batch of records.
     * @throws AssertionError if nothing arrives within [pollTimeout].
     */
    private fun awaitRecords(topic: String): org.apache.kafka.clients.consumer.ConsumerRecords<String, String> {
        consumer.assign(listOf(TopicPartition(topic, 0)))
        val startedAt = System.nanoTime()
        while (true) {
            val batch = consumer.poll(Duration.ofMillis(10))
            if (batch.count() > 0) {
                return batch
            }
            if (System.nanoTime() - startedAt >= pollTimeout.toNanos()) {
                throw AssertionError("No records received on topic '$topic' within $pollTimeout.")
            }
        }
    }

    /**
     * Runs the service with the configuration named in [params] and checks that exactly one
     * message with the expected key and value is present on each of the three topics.
     */
    @ParameterizedTest
    @MethodSource("directoryReaderTests")
    fun `read valid csv from sftp`(params: TestParams) {
        val service = Service(params.configFile)
        service.run()

        val topic = service.settings.outputTopic
        val reportingTopic = "$topic-reporting"
        val processReportingTopic = service.settings.processReportTopic

        try {
            val result = awaitRecords(topic)
            val resultReport = awaitRecords(reportingTopic)
            val processReportResult = awaitRecords(processReportingTopic)

            assertThat(result.records(topic))
                .describedAs("Record Results")
                .hasSize(1)
                .first()
                .hasFieldOrPropertyWithValue("key", params.expectedKey)
                .hasFieldOrPropertyWithValue("value", params.expectedValue)

            assertThat(resultReport.records(reportingTopic))
                .describedAs("Report Results")
                .hasSize(1)
                .first()
                .hasFieldOrPropertyWithValue("key", params.expectedKey)
                .hasFieldOrPropertyWithValue("value", params.expectedReportValue)

            assertThat(processReportResult.records(processReportingTopic))
                .describedAs("Report Process Results")
                .hasSize(1)
                .first()
                .hasFieldOrPropertyWithValue("key", params.expectedProcessReport.id)
                .hasFieldOrPropertyWithValue("value", Klaxon().toJsonString(params.expectedProcessReport))
        } finally {
            // Cleanup happens here because the topic names are only known inside this function.
            // It sits in `finally` so a failed assertion does not leave topics behind for the
            // following parameterized invocations.
            adminClient.deleteTopics(listOf(topic, reportingTopic, processReportingTopic))
        }
    }

    /**
     * Supplies the test cases for the parameterized test above: one per configuration file,
     * with the key, value and reports expected on the Kafka topics.
     */
    private fun directoryReaderTests() = Stream.of(
        TestParams(
            "test1.yml",
            expectedKey = "brandt.csv",
            expectedValue = "{\"format\" : \"CSV\", \"path\" : \"/memobase/test_institution_1/test_record_set_1/brandt.csv\"}",
            expectedReportValue = Klaxon().toJsonString(
                Report(
                    id = "brandt.csv",
                    status = "SUCCESS",
                    message = "Validated file at path /memobase/test_institution_1/test_record_set_1/brandt.csv with format CSV."
                )
            ),
            expectedProcessReport = Report(
                id = "jobXYZ",
                status = "SUCCESS",
                message = "Successfully validated 1 files."
            )
        ),
        TestParams(
            "test2.yml",
            expectedKey = "bauGAZH_metadaten.csv",
            expectedValue = "{\"format\" : \"CSV\", \"path\" : \"/memobase/test_institution_2/test_record_set_2/bauGAZH_metadaten.csv\"}",
            expectedReportValue = Klaxon().toJsonString(
                Report(
                    id = "bauGAZH_metadaten.csv",
                    status = "SUCCESS",
                    message = "Validated file at path /memobase/test_institution_2/test_record_set_2/bauGAZH_metadaten.csv with format CSV."
                )
            ),
            expectedProcessReport = Report(
                id = "jobXYZ",
                status = "SUCCESS",
                message = "Successfully validated 1 files."
            )
        ),
        TestParams(
            "test3.yml",
            expectedKey = "invalid.csv",
            expectedValue = "{\"format\" : \"ERROR\", \"path\" : \"/memobase/test_institution_3/test_record_set_3/invalid.csv\"}",
            expectedReportValue = Klaxon().toJsonString(
                Report(
                    id = "invalid.csv",
                    status = "FAILURE",
                    message = "CSV ERROR: Fields num seems to be 5 on each row, but on 2th csv row, fields num is 7."
                )
            ),
            expectedProcessReport = Report(
                id = "jobXYZ",
                status = "FAILURE",
                message = "Failed to validate 1 of 1 files."
            )
        ),
        TestParams(
            "test4.yml",
            expectedKey = "file.txt",
            expectedValue = "{\"format\" : \"ERROR\", \"path\" : \"/memobase/test_institution_4/test_record_set_4/file.txt\"}",
            expectedReportValue = Klaxon().toJsonString(
                Report(
                    id = "file.txt",
                    status = "FAILURE",
                    message = "File Extension Error: Not a valid file extension: file.txt."
                )
            ),
            expectedProcessReport = Report(
                id = "jobXYZ",
                status = "FAILURE",
                message = "Failed to validate 1 of 1 files."
            )
        )
    )
}