XMLTransformer.kt 2.93 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
/*
 * xml-data-transform
 * Copyright (C) 2020 Memoriav
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see <https://www.gnu.org/licenses/>.
 */
package org.memobase

Jonas Waeber's avatar
Jonas Waeber committed
20
import net.schmizz.sshj.sftp.RemoteFile
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
import net.sf.saxon.s9api.Processor
import net.sf.saxon.s9api.SAXDestination
import net.sf.saxon.s9api.StaticError
import net.sf.saxon.s9api.XsltExecutable
import org.apache.kafka.streams.KeyValue
import org.apache.logging.log4j.LogManager
import java.io.File
import java.io.FileInputStream
import java.io.InputStream
import java.util.Properties
import javax.xml.transform.stream.StreamSource

/**
 * Applies a pre-compiled XSLT stylesheet to remote XML files and collects the
 * transformation output in a [SAXContentHandler].
 *
 * The following keys are read from [appSettings]:
 * - `xsltFilePath`: file system path of the stylesheet, compiled once at construction time.
 * - `identifierFieldName`: passed on to every [SAXContentHandler] that is created.
 * - `recordTag`: passed on to every [SAXContentHandler] that is created.
 *
 * NOTE(review): one transformer instance is reused for every [applyXSLT] call —
 * confirm that callers never invoke it concurrently.
 *
 * @param appSettings application settings holding the keys listed above.
 * @throws IllegalArgumentException if `xsltFilePath` is not set.
 * @throws Exception if the stylesheet compiler reported static errors.
 */
class XMLTransformer(appSettings: Properties) {
    private val log = LogManager.getLogger("XMLTransformer")

    // Fail early with a readable message instead of a bare NullPointerException from File(null).
    private val xsltFilePath: String = requireNotNull(appSettings.getProperty("xsltFilePath")) {
        "Missing required setting 'xsltFilePath'."
    }
    private val identifierFieldName = appSettings.getProperty("identifierFieldName")
    private val recordTag = appSettings.getProperty("recordTag")

    init {
        // Only reported, not enforced: construction continues with the placeholder value.
        if (identifierFieldName == "placeholderValue") {
            log.error("Requires a value for identifier field name, but found default value.")
        }
    }

    // `false`: no licensed Saxon edition is requested.
    private val processor = Processor(false)
    private val xslt = compileXslt()
    private val transformer = xslt.load()

    /**
     * Compiles the stylesheet found at the configured `xsltFilePath`.
     *
     * @return the compiled stylesheet.
     * @throws Exception if the compiler added entries to its error list; the
     * message is the joined list of those entries.
     */
    private fun compileXslt(): XsltExecutable {
        val errorList = mutableListOf<StaticError>()
        val xsltCompiler = processor.newXsltCompiler()
        xsltCompiler.setErrorList(errorList)
        // The stream is opened here, so it is closed here as soon as compilation is done.
        val executable = FileInputStream(File(xsltFilePath)).use { stylesheet ->
            xsltCompiler.compile(StreamSource(stylesheet))
        }
        if (errorList.isNotEmpty()) {
            throw Exception(errorList.joinToString())
        }
        return executable
    }

    /**
     * Transforms the content of [data] with the compiled stylesheet.
     *
     * Both the stream read from [data] and [data] itself are closed before this
     * function returns or throws.
     *
     * @param key key of the incoming record; handed to the [SAXContentHandler]
     * and used in the error message.
     * @param data remote file whose content is the transformation source.
     * @return the identifier collected by the content handler, paired with the handler.
     * @throws Exception if the content handler's identifier is empty after the transformation.
     */
    fun applyXSLT(key: String, data: RemoteFile): KeyValue<String, SAXContentHandler> {
        val contentHandler = SAXContentHandler(key, identifierFieldName, recordTag)
        data.use { file ->
            file.RemoteFileInputStream().use { input ->
                transformer.setSource(StreamSource(input))
                transformer.destination = SAXDestination(contentHandler)
                transformer.transform()
            }
        }
        if (contentHandler.identifier.isEmpty()) {
            throw Exception("No valid identifier found in record $key in field $identifierFieldName.")
        }
        return KeyValue(contentHandler.identifier, contentHandler)
    }
}