Compare commits
No commits in common. "ed5f272c07ec33ed2fc7b2e473fab983fe42bc28" and "52bf9daa7d2296ed0ffc9fef7f2cd2b80a4fdcba" have entirely different histories.
ed5f272c07
...
52bf9daa7d
|
@ -16,9 +16,6 @@ val kotlinCoroutinesVersion: String by project
|
||||||
|
|
||||||
val mustangVersion: String by project
|
val mustangVersion: String by project
|
||||||
|
|
||||||
val textInfoExtractor: String by project
|
|
||||||
val pdfboxTextExtractor: String by project
|
|
||||||
|
|
||||||
val angusMailVersion: String by project
|
val angusMailVersion: String by project
|
||||||
|
|
||||||
val klfVersion: String by project
|
val klfVersion: String by project
|
||||||
|
@ -33,10 +30,6 @@ dependencies {
|
||||||
implementation("org.mustangproject:library:$mustangVersion")
|
implementation("org.mustangproject:library:$mustangVersion")
|
||||||
implementation("org.mustangproject:validator:$mustangVersion")
|
implementation("org.mustangproject:validator:$mustangVersion")
|
||||||
|
|
||||||
// pdf invoice data extraction
|
|
||||||
api("net.dankito.text.extraction:text-info-extractor:$textInfoExtractor")
|
|
||||||
api("net.dankito.text.extraction:pdfbox-text-extractor:$pdfboxTextExtractor")
|
|
||||||
|
|
||||||
implementation("org.eclipse.angus:angus-mail:$angusMailVersion")
|
implementation("org.eclipse.angus:angus-mail:$angusMailVersion")
|
||||||
|
|
||||||
implementation("net.codinux.log:klf:$klfVersion")
|
implementation("net.codinux.log:klf:$klfVersion")
|
||||||
|
|
|
@ -9,17 +9,11 @@ import kotlinx.coroutines.*
|
||||||
import net.codinux.invoicing.email.model.*
|
import net.codinux.invoicing.email.model.*
|
||||||
import net.codinux.invoicing.filesystem.FileUtil
|
import net.codinux.invoicing.filesystem.FileUtil
|
||||||
import net.codinux.invoicing.model.Invoice
|
import net.codinux.invoicing.model.Invoice
|
||||||
import net.codinux.invoicing.pdf.PdfInvoiceData
|
|
||||||
import net.codinux.invoicing.pdf.PdfInvoiceDataExtractor
|
|
||||||
import net.codinux.invoicing.reader.EInvoiceReader
|
import net.codinux.invoicing.reader.EInvoiceReader
|
||||||
import net.codinux.invoicing.util.ExceptionHelper
|
|
||||||
import net.codinux.log.logger
|
import net.codinux.log.logger
|
||||||
import org.eclipse.angus.mail.imap.IMAPFolder
|
import org.eclipse.angus.mail.imap.IMAPFolder
|
||||||
import org.eclipse.angus.mail.imap.IMAPMessage
|
import org.eclipse.angus.mail.imap.IMAPMessage
|
||||||
import org.eclipse.angus.mail.util.MailConnectException
|
|
||||||
import java.io.File
|
import java.io.File
|
||||||
import java.net.ConnectException
|
|
||||||
import java.net.UnknownHostException
|
|
||||||
import java.time.Instant
|
import java.time.Instant
|
||||||
import java.util.*
|
import java.util.*
|
||||||
import java.util.concurrent.Executors
|
import java.util.concurrent.Executors
|
||||||
|
@ -27,9 +21,7 @@ import kotlin.math.max
|
||||||
|
|
||||||
open class EmailsFetcher(
|
open class EmailsFetcher(
|
||||||
protected open val eInvoiceReader: EInvoiceReader = EInvoiceReader(),
|
protected open val eInvoiceReader: EInvoiceReader = EInvoiceReader(),
|
||||||
protected open val pdfInvoiceDataExtractor: PdfInvoiceDataExtractor = PdfInvoiceDataExtractor(),
|
protected open val coroutineDispatcher: CoroutineDispatcher = Executors.newFixedThreadPool(max(24, Runtime.getRuntime().availableProcessors() * 4)).asCoroutineDispatcher()
|
||||||
protected open val coroutineDispatcher: CoroutineDispatcher = Executors.newFixedThreadPool(max(24, Runtime.getRuntime().availableProcessors() * 4)).asCoroutineDispatcher(),
|
|
||||||
protected open val exceptionHelper: ExceptionHelper = ExceptionHelper()
|
|
||||||
) {
|
) {
|
||||||
|
|
||||||
protected data class MessagePart(
|
protected data class MessagePart(
|
||||||
|
@ -48,64 +40,34 @@ open class EmailsFetcher(
|
||||||
protected val log by logger()
|
protected val log by logger()
|
||||||
|
|
||||||
|
|
||||||
open fun checkCredentials(account: EmailAccount): CheckCredentialsResult {
|
|
||||||
try {
|
|
||||||
val status = connect(account, FetchEmailsOptions(showDebugOutputOnConsole = true))
|
|
||||||
|
|
||||||
close(status)
|
|
||||||
|
|
||||||
return CheckCredentialsResult.Ok
|
|
||||||
} catch (e: Throwable) {
|
|
||||||
log.info(e) { "Could not connect to account '$account'" }
|
|
||||||
return mapConnectResultError(e)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
protected open fun mapConnectResultError(exception: Throwable): CheckCredentialsResult {
|
|
||||||
if (exception is AuthenticationFailedException) {
|
|
||||||
return CheckCredentialsResult.WrongUsername
|
|
||||||
} else if (exception is MailConnectException) {
|
|
||||||
val innerInnerException = exceptionHelper.getInnerException(exception, 1)
|
|
||||||
|
|
||||||
if (innerInnerException is UnknownHostException) {
|
|
||||||
return CheckCredentialsResult.InvalidImapServerAddress
|
|
||||||
} else if (innerInnerException is ConnectException) {
|
|
||||||
return CheckCredentialsResult.InvalidImapServerPort
|
|
||||||
}
|
|
||||||
} else if (exception is MessagingException) { // MessagingException is derived from MailConnectException, so place after MailConnectException
|
|
||||||
return CheckCredentialsResult.WrongPassword
|
|
||||||
}
|
|
||||||
|
|
||||||
return CheckCredentialsResult.UnknownError // fallback for cases i am not aware of
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
open fun listenForNewEmails(account: EmailAccount, options: ListenForNewMailsOptions) = runBlocking {
|
open fun listenForNewEmails(account: EmailAccount, options: ListenForNewMailsOptions) = runBlocking {
|
||||||
try {
|
try {
|
||||||
val status = connect(account, options)
|
connect(account, options) { store ->
|
||||||
|
val folder = store.getFolder(options.emailFolderName) as IMAPFolder
|
||||||
|
folder.open(Folder.READ_ONLY)
|
||||||
|
|
||||||
status.folder.addMessageCountListener(object : MessageCountAdapter() {
|
val status = FetchEmailsStatus(account, folder, options)
|
||||||
override fun messagesAdded(event: MessageCountEvent) {
|
|
||||||
event.messages.forEach { message ->
|
folder.addMessageCountListener(object : MessageCountAdapter() {
|
||||||
getEmail(message, status)
|
override fun messagesAdded(event: MessageCountEvent) {
|
||||||
|
event.messages.forEach { message ->
|
||||||
|
getEmail(message, status)
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
})
|
||||||
|
|
||||||
|
launch(coroutineDispatcher) {
|
||||||
|
keepConnectionOpen(status, folder, options)
|
||||||
}
|
}
|
||||||
})
|
|
||||||
|
|
||||||
launch(coroutineDispatcher) {
|
|
||||||
keepConnectionOpen(status, options)
|
|
||||||
}
|
}
|
||||||
|
|
||||||
close(status)
|
|
||||||
} catch (e: Throwable) {
|
} catch (e: Throwable) {
|
||||||
log.error(e) { "Listening to new emails of '${account.username}' failed" }
|
log.error(e) { "Listening to new emails of '${account.username}' failed" }
|
||||||
options.onError?.invoke(FetchEmailError(FetchEmailErrorType.ListenForNewEmails, null, e))
|
options.onError?.invoke(FetchEmailError(FetchEmailErrorType.ListenForNewEmails, null, e))
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
protected open suspend fun keepConnectionOpen(status: FetchEmailsStatus, options: ListenForNewMailsOptions) {
|
protected open suspend fun keepConnectionOpen(status: FetchEmailsStatus, folder: IMAPFolder, options: ListenForNewMailsOptions) {
|
||||||
val account = status.account
|
val account = status.account
|
||||||
val folder = status.folder
|
|
||||||
log.info { "Listening to new emails of $account" }
|
log.info { "Listening to new emails of $account" }
|
||||||
|
|
||||||
// Use IMAP IDLE to keep the connection alive
|
// Use IMAP IDLE to keep the connection alive
|
||||||
|
@ -126,13 +88,18 @@ open class EmailsFetcher(
|
||||||
|
|
||||||
open fun fetchAllEmails(account: EmailAccount, options: FetchEmailsOptions = FetchEmailsOptions()): FetchEmailsResult {
|
open fun fetchAllEmails(account: EmailAccount, options: FetchEmailsOptions = FetchEmailsOptions()): FetchEmailsResult {
|
||||||
try {
|
try {
|
||||||
val status = connect(account, options)
|
return connect(account, options) { store ->
|
||||||
|
val folder = store.getFolder(options.emailFolderName) as IMAPFolder
|
||||||
|
folder.open(Folder.READ_ONLY)
|
||||||
|
|
||||||
val emails = fetchAllEmailsInFolder(status)
|
val status = FetchEmailsStatus(account, folder, options)
|
||||||
|
|
||||||
close(status)
|
val emails = fetchAllEmailsInFolder(status).also {
|
||||||
|
folder.close(false)
|
||||||
|
}
|
||||||
|
|
||||||
return FetchEmailsResult(emails, null, status.messageSpecificErrors)
|
FetchEmailsResult(emails, null, status.messageSpecificErrors)
|
||||||
|
}
|
||||||
} catch (e: Throwable) {
|
} catch (e: Throwable) {
|
||||||
log.error(e) { "Could not fetch emails of account $account" }
|
log.error(e) { "Could not fetch emails of account $account" }
|
||||||
|
|
||||||
|
@ -241,14 +208,12 @@ open class EmailsFetcher(
|
||||||
|
|
||||||
val (invoice, invoiceFile) = tryToReadEInvoice(part, extension, messagePart.mediaType, status)
|
val (invoice, invoiceFile) = tryToReadEInvoice(part, extension, messagePart.mediaType, status)
|
||||||
|
|
||||||
val pdfInvoiceData: PdfInvoiceData? = tryToReadInvoiceDataFromPdf(extension, messagePart.mediaType, invoiceFile)
|
|
||||||
|
|
||||||
if (invoice != null || Part.ATTACHMENT.equals(part.disposition, ignoreCase = true)) {
|
if (invoice != null || Part.ATTACHMENT.equals(part.disposition, ignoreCase = true)) {
|
||||||
val file = invoiceFile ?:
|
val file = invoiceFile ?:
|
||||||
if (extension !in status.options.downloadAttachmentsWithExtensions) null
|
if (extension !in status.options.downloadAttachmentsWithExtensions) null
|
||||||
else downloadAttachment(part, status)
|
else downloadAttachment(part, status)
|
||||||
|
|
||||||
return EmailAttachment(part.fileName, extension, part.size.takeIf { it > 0 }, mapDisposition(part), messagePart.mediaType, part.contentType, invoice, pdfInvoiceData, file)
|
return EmailAttachment(part.fileName, extension, part.size.takeIf { it > 0 }, mapDisposition(part), messagePart.mediaType, part.contentType, invoice, file)
|
||||||
}
|
}
|
||||||
} catch (e: Throwable) {
|
} catch (e: Throwable) {
|
||||||
log.error(e) { "Could not check attachment '${messagePart.part.fileName}' (${messagePart.mediaType}) for eInvoice" }
|
log.error(e) { "Could not check attachment '${messagePart.part.fileName}' (${messagePart.mediaType}) for eInvoice" }
|
||||||
|
@ -285,14 +250,6 @@ open class EmailsFetcher(
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
private fun tryToReadInvoiceDataFromPdf(extension: String, mediaType: String, invoiceFile: File?): PdfInvoiceData? =
|
|
||||||
// if it's a PDF than () already downloaded invoiceFile, so it must be non null then
|
|
||||||
if (invoiceFile != null && (extension == "pdf" || mediaType == "application/pdf" || mediaType == "application/octet-stream")) {
|
|
||||||
pdfInvoiceDataExtractor.tryToExtractInvoiceData(invoiceFile).data // TODO: pass result.error to status.onError()
|
|
||||||
} else {
|
|
||||||
null
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
protected open fun getAllMessageParts(part: Part): List<MessagePart> {
|
protected open fun getAllMessageParts(part: Part): List<MessagePart> {
|
||||||
return if (part.isMimeType("multipart/*")) {
|
return if (part.isMimeType("multipart/*")) {
|
||||||
|
@ -369,22 +326,18 @@ open class EmailsFetcher(
|
||||||
date.toInstant()
|
date.toInstant()
|
||||||
|
|
||||||
|
|
||||||
protected open fun connect(account: EmailAccount, options: FetchEmailsOptions): FetchEmailsStatus {
|
protected open fun <T> connect(account: EmailAccount, options: FetchEmailsOptions, connected: (Store) -> T): T {
|
||||||
val properties = mapAccountToJavaMailProperties(account, options)
|
val properties = mapAccountToJavaMailProperties(account, options)
|
||||||
|
|
||||||
val session = Session.getInstance(properties)
|
val session = Session.getInstance(properties)
|
||||||
session.debug = options.showDebugOutputOnConsole
|
session.getStore("imap").use { store ->
|
||||||
|
store.connect(account.serverAddress, account.username, account.password)
|
||||||
|
|
||||||
val store = session.getStore("imap")
|
return connected(store)
|
||||||
store.connect(account.serverAddress, account.username, account.password)
|
}
|
||||||
|
|
||||||
val folder = store.getFolder(options.emailFolderName) as IMAPFolder
|
|
||||||
folder.open(Folder.READ_ONLY)
|
|
||||||
|
|
||||||
return FetchEmailsStatus(account, store, folder, options)
|
|
||||||
}
|
}
|
||||||
|
|
||||||
protected open fun mapAccountToJavaMailProperties(account: EmailAccount, options: FetchEmailsOptions = FetchEmailsOptions()) = Properties().apply {
|
protected open fun mapAccountToJavaMailProperties(account: EmailAccount, options: FetchEmailsOptions) = Properties().apply {
|
||||||
// the documentation of all properties can be found here: https://javaee.github.io/javamail/docs/api/com/sun/mail/imap/package-summary.html
|
// the documentation of all properties can be found here: https://javaee.github.io/javamail/docs/api/com/sun/mail/imap/package-summary.html
|
||||||
put("mail.store.protocol", "imap")
|
put("mail.store.protocol", "imap")
|
||||||
|
|
||||||
|
@ -401,14 +354,4 @@ open class EmailsFetcher(
|
||||||
put("mail.imap.partialfetch", "false") // Controls whether the IMAP partial-fetch capability should be used. Defaults to true.
|
put("mail.imap.partialfetch", "false") // Controls whether the IMAP partial-fetch capability should be used. Defaults to true.
|
||||||
}
|
}
|
||||||
|
|
||||||
protected open fun close(status: FetchEmailsStatus) {
|
|
||||||
try {
|
|
||||||
status.folder.close(false)
|
|
||||||
|
|
||||||
status.store.close()
|
|
||||||
} catch (e: Exception) {
|
|
||||||
log.error(e) { "Could not close folder or store" }
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
}
|
}
|
|
@ -1,4 +1,4 @@
|
||||||
package net.codinux.invoicing.email.model
|
package net.codinux.invoicing.email
|
||||||
|
|
||||||
data class FetchEmailError(
|
data class FetchEmailError(
|
||||||
val type: FetchEmailErrorType,
|
val type: FetchEmailErrorType,
|
|
@ -0,0 +1,13 @@
|
||||||
|
package net.codinux.invoicing.email
|
||||||
|
|
||||||
|
enum class FetchEmailErrorType {
|
||||||
|
GetEmail,
|
||||||
|
|
||||||
|
GetMesssageBody,
|
||||||
|
|
||||||
|
GetAttachment,
|
||||||
|
|
||||||
|
ExtractInvoice,
|
||||||
|
|
||||||
|
ListenForNewEmails
|
||||||
|
}
|
|
@ -1,7 +1,6 @@
|
||||||
package net.codinux.invoicing.email
|
package net.codinux.invoicing.email
|
||||||
|
|
||||||
import net.codinux.invoicing.email.model.Email
|
import net.codinux.invoicing.email.model.Email
|
||||||
import net.codinux.invoicing.email.model.FetchEmailError
|
|
||||||
import java.io.File
|
import java.io.File
|
||||||
import java.time.Instant
|
import java.time.Instant
|
||||||
import java.time.LocalDate
|
import java.time.LocalDate
|
||||||
|
@ -30,8 +29,6 @@ open class FetchEmailsOptions(
|
||||||
val emailFolderName: String = "INBOX",
|
val emailFolderName: String = "INBOX",
|
||||||
val connectTimeoutSeconds: Int = 5,
|
val connectTimeoutSeconds: Int = 5,
|
||||||
|
|
||||||
val showDebugOutputOnConsole: Boolean = false,
|
|
||||||
|
|
||||||
val onError: ((FetchEmailError) -> Unit)? = null,
|
val onError: ((FetchEmailError) -> Unit)? = null,
|
||||||
val onEmailReceived: ((Email) -> Unit)? = null
|
val onEmailReceived: ((Email) -> Unit)? = null
|
||||||
) {
|
) {
|
||||||
|
|
|
@ -1,4 +1,6 @@
|
||||||
package net.codinux.invoicing.email.model
|
package net.codinux.invoicing.email
|
||||||
|
|
||||||
|
import net.codinux.invoicing.email.model.Email
|
||||||
|
|
||||||
data class FetchEmailsResult(
|
data class FetchEmailsResult(
|
||||||
val emails: List<Email>,
|
val emails: List<Email>,
|
|
@ -3,17 +3,13 @@ package net.codinux.invoicing.email
|
||||||
import jakarta.mail.BodyPart
|
import jakarta.mail.BodyPart
|
||||||
import jakarta.mail.Message
|
import jakarta.mail.Message
|
||||||
import jakarta.mail.Part
|
import jakarta.mail.Part
|
||||||
import jakarta.mail.Store
|
|
||||||
import net.codinux.invoicing.email.model.EmailAccount
|
import net.codinux.invoicing.email.model.EmailAccount
|
||||||
import net.codinux.invoicing.email.model.FetchEmailError
|
|
||||||
import net.codinux.invoicing.email.model.FetchEmailErrorType
|
|
||||||
import net.codinux.invoicing.filesystem.FileUtil
|
import net.codinux.invoicing.filesystem.FileUtil
|
||||||
import org.eclipse.angus.mail.imap.IMAPFolder
|
import org.eclipse.angus.mail.imap.IMAPFolder
|
||||||
import java.io.File
|
import java.io.File
|
||||||
|
|
||||||
data class FetchEmailsStatus(
|
data class FetchEmailsStatus(
|
||||||
val account: EmailAccount,
|
val account: EmailAccount,
|
||||||
val store: Store,
|
|
||||||
val folder: IMAPFolder,
|
val folder: IMAPFolder,
|
||||||
val options: FetchEmailsOptions,
|
val options: FetchEmailsOptions,
|
||||||
val messageSpecificErrors: MutableList<FetchEmailError> = mutableListOf()
|
val messageSpecificErrors: MutableList<FetchEmailError> = mutableListOf()
|
||||||
|
|
|
@ -1,7 +1,6 @@
|
||||||
package net.codinux.invoicing.email
|
package net.codinux.invoicing.email
|
||||||
|
|
||||||
import net.codinux.invoicing.email.model.Email
|
import net.codinux.invoicing.email.model.Email
|
||||||
import net.codinux.invoicing.email.model.FetchEmailError
|
|
||||||
import java.io.File
|
import java.io.File
|
||||||
import java.util.concurrent.atomic.AtomicBoolean
|
import java.util.concurrent.atomic.AtomicBoolean
|
||||||
|
|
||||||
|
@ -17,13 +16,11 @@ open class ListenForNewMailsOptions(
|
||||||
emailFolderName: String = "INBOX",
|
emailFolderName: String = "INBOX",
|
||||||
connectTimeoutSeconds: Int = 5,
|
connectTimeoutSeconds: Int = 5,
|
||||||
|
|
||||||
showDebugOutputOnConsole: Boolean = false,
|
|
||||||
|
|
||||||
onError: ((FetchEmailError) -> Unit)? = null,
|
onError: ((FetchEmailError) -> Unit)? = null,
|
||||||
onEmailReceived: (Email) -> Unit
|
onEmailReceived: (Email) -> Unit
|
||||||
) : FetchEmailsOptions(
|
) : FetchEmailsOptions(
|
||||||
null,
|
null,
|
||||||
downloadMessageBody, downloadOnlyPlainTextOrHtmlMessageBody, null,
|
downloadMessageBody, downloadOnlyPlainTextOrHtmlMessageBody, null,
|
||||||
downloadAttachmentsWithExtensions, attachmentsDownloadDirectory,
|
downloadAttachmentsWithExtensions, attachmentsDownloadDirectory,
|
||||||
emailFolderName, connectTimeoutSeconds, showDebugOutputOnConsole, onError, onEmailReceived
|
emailFolderName, connectTimeoutSeconds, onError, onEmailReceived
|
||||||
)
|
)
|
|
@ -1,18 +0,0 @@
|
||||||
package net.codinux.invoicing.email.model
|
|
||||||
|
|
||||||
|
|
||||||
enum class CheckCredentialsResult {
|
|
||||||
|
|
||||||
Ok,
|
|
||||||
|
|
||||||
WrongUsername,
|
|
||||||
|
|
||||||
WrongPassword,
|
|
||||||
|
|
||||||
InvalidImapServerAddress,
|
|
||||||
|
|
||||||
InvalidImapServerPort,
|
|
||||||
|
|
||||||
UnknownError
|
|
||||||
|
|
||||||
}
|
|
|
@ -36,11 +36,9 @@ class Email(
|
||||||
|
|
||||||
val hasAttachments: Boolean by lazy { attachments.isNotEmpty() }
|
val hasAttachments: Boolean by lazy { attachments.isNotEmpty() }
|
||||||
|
|
||||||
val hasPdfAttachment: Boolean by lazy { attachments.any { it.isPdfFile } }
|
|
||||||
|
|
||||||
val hasEInvoiceAttachment: Boolean by lazy { attachments.any { it.containsEInvoice } }
|
val hasEInvoiceAttachment: Boolean by lazy { attachments.any { it.containsEInvoice } }
|
||||||
|
|
||||||
val hasAttachmentsWithExtractedInvoiceData: Boolean by lazy { attachments.any { it.couldExtractPdfInvoiceData } }
|
val hasPdfAttachment: Boolean by lazy { attachments.any { it.isPdfFile } }
|
||||||
|
|
||||||
|
|
||||||
override fun toString() = "${date.atZone(ZoneId.systemDefault()).toLocalDate()} $sender: $subject, ${attachments.size} attachment(s)"
|
override fun toString() = "${date.atZone(ZoneId.systemDefault()).toLocalDate()} $sender: $subject, ${attachments.size} attachment(s)"
|
||||||
|
|
|
@ -1,7 +1,6 @@
|
||||||
package net.codinux.invoicing.email.model
|
package net.codinux.invoicing.email.model
|
||||||
|
|
||||||
import net.codinux.invoicing.model.Invoice
|
import net.codinux.invoicing.model.Invoice
|
||||||
import net.codinux.invoicing.pdf.PdfInvoiceData
|
|
||||||
import java.io.File
|
import java.io.File
|
||||||
|
|
||||||
class EmailAttachment(
|
class EmailAttachment(
|
||||||
|
@ -17,14 +16,11 @@ class EmailAttachment(
|
||||||
val mediaType: String?,
|
val mediaType: String?,
|
||||||
val contentType: String?,
|
val contentType: String?,
|
||||||
val invoice: Invoice? = null,
|
val invoice: Invoice? = null,
|
||||||
val pdfInvoiceData: PdfInvoiceData? = null,
|
|
||||||
val file: File? = null
|
val file: File? = null
|
||||||
) {
|
) {
|
||||||
val isPdfFile: Boolean by lazy { extension == "pdf" || mediaType == "application/pdf" }
|
|
||||||
|
|
||||||
val containsEInvoice: Boolean by lazy { invoice != null }
|
val containsEInvoice: Boolean by lazy { invoice != null }
|
||||||
|
|
||||||
val couldExtractPdfInvoiceData: Boolean by lazy { pdfInvoiceData != null }
|
val isPdfFile: Boolean by lazy { extension == "pdf" || mediaType == "application/pdf" }
|
||||||
|
|
||||||
override fun toString() = "$filename: $invoice"
|
override fun toString() = "$filename: $invoice"
|
||||||
}
|
}
|
|
@ -1,13 +0,0 @@
|
||||||
package net.codinux.invoicing.email.model
|
|
||||||
|
|
||||||
enum class FetchEmailErrorType {
|
|
||||||
GetEmail,
|
|
||||||
|
|
||||||
GetMesssageBody,
|
|
||||||
|
|
||||||
GetAttachment,
|
|
||||||
|
|
||||||
ExtractInvoice, // TODO: due to orNull() these errors aren't caught anymore
|
|
||||||
|
|
||||||
ListenForNewEmails
|
|
||||||
}
|
|
|
@ -1,11 +0,0 @@
|
||||||
package net.codinux.invoicing.pdf
|
|
||||||
|
|
||||||
import java.math.BigDecimal
|
|
||||||
|
|
||||||
class AmountOfMoney(
|
|
||||||
val amount: BigDecimal,
|
|
||||||
val currency: String,
|
|
||||||
val amountWithCurrency: String = "$amount $currency"
|
|
||||||
) {
|
|
||||||
override fun toString() = amountWithCurrency
|
|
||||||
}
|
|
|
@ -1,17 +0,0 @@
|
||||||
package net.codinux.invoicing.pdf
|
|
||||||
|
|
||||||
import net.dankito.text.extraction.ITextExtractor
|
|
||||||
import net.dankito.text.extraction.pdf.PdfBoxPdfTextExtractor
|
|
||||||
import java.io.File
|
|
||||||
|
|
||||||
open class PdfBoxPdfTextExtractor(
|
|
||||||
protected open val textExtractor: ITextExtractor = PdfBoxPdfTextExtractor()
|
|
||||||
) : PdfTextExtractor {
|
|
||||||
|
|
||||||
override fun extractTextFromPdf(pdfFile: File): PdfTextExtractorResult {
|
|
||||||
val result = textExtractor.extractText(pdfFile)
|
|
||||||
|
|
||||||
return PdfTextExtractorResult(result.text, result.error?.exception)
|
|
||||||
}
|
|
||||||
|
|
||||||
}
|
|
|
@ -1,33 +0,0 @@
|
||||||
package net.codinux.invoicing.pdf
|
|
||||||
|
|
||||||
import java.math.BigDecimal
|
|
||||||
import java.time.LocalDate
|
|
||||||
|
|
||||||
/**
|
|
||||||
* PDFs contain only unstructured data, so it's way harder to get invoice data from PDFs then from structured XML eInvoice files.
|
|
||||||
*
|
|
||||||
* So we can only guess which is the total amount, which the net and vat amount, which the invoice date, ...
|
|
||||||
*
|
|
||||||
* Therefor this class' properties all contain 'possible' in their name to reflect this circumstance.
|
|
||||||
*/
|
|
||||||
class PdfInvoiceData(
|
|
||||||
val potentialTotalAmount: AmountOfMoney,
|
|
||||||
val potentialNetAmount: AmountOfMoney? = null,
|
|
||||||
val potentialValueAddedTax: AmountOfMoney? = null,
|
|
||||||
val potentialValueAddedTaxRate: BigDecimal? = null,
|
|
||||||
|
|
||||||
val potentialIban: String? = null,
|
|
||||||
val potentialBic: String? = null,
|
|
||||||
|
|
||||||
val foundAmounts: List<AmountOfMoney> = emptyList(),
|
|
||||||
val foundPercentages: List<AmountOfMoney> = emptyList(),
|
|
||||||
|
|
||||||
val foundDates: List<LocalDate> = emptyList(),
|
|
||||||
|
|
||||||
val foundPotentialIbans: List<String> = emptyList(),
|
|
||||||
val foundPotentialBics: List<String> = emptyList(),
|
|
||||||
|
|
||||||
val pdfText: String
|
|
||||||
) {
|
|
||||||
override fun toString() = "$potentialTotalAmount"
|
|
||||||
}
|
|
|
@ -1,10 +0,0 @@
|
||||||
package net.codinux.invoicing.pdf
|
|
||||||
|
|
||||||
class PdfInvoiceDataExtractionResult(
|
|
||||||
val error: Throwable?,
|
|
||||||
val data: PdfInvoiceData?
|
|
||||||
) {
|
|
||||||
override fun toString() =
|
|
||||||
if (data != null) "Success: $data"
|
|
||||||
else "Error: $error"
|
|
||||||
}
|
|
|
@ -1,58 +0,0 @@
|
||||||
package net.codinux.invoicing.pdf
|
|
||||||
|
|
||||||
import net.dankito.text.extraction.info.invoice.InvoiceDataExtractor
|
|
||||||
import net.dankito.text.extraction.info.model.InvoiceData
|
|
||||||
import java.io.File
|
|
||||||
import java.time.LocalDate
|
|
||||||
|
|
||||||
/**
|
|
||||||
* PDFs contain only unstructured data, so it's way harder to get invoice data from PDFs then from structured XML eInvoice files.
|
|
||||||
*
|
|
||||||
* But for validation purposes or PDFs without attached eInvoice XML we also try to extract unstructured invoice data from PDFs.
|
|
||||||
*/
|
|
||||||
open class PdfInvoiceDataExtractor(
|
|
||||||
protected open val textExtractor: PdfTextExtractor = PdfBoxPdfTextExtractor(),
|
|
||||||
protected open val invoiceDataExtractor: InvoiceDataExtractor = InvoiceDataExtractor()
|
|
||||||
) {
|
|
||||||
|
|
||||||
open fun tryToExtractInvoiceData(file: File): PdfInvoiceDataExtractionResult {
|
|
||||||
val textExtractionResult = extractTextFromPdf(file)
|
|
||||||
if (textExtractionResult.error != null || textExtractionResult.text == null) {
|
|
||||||
return PdfInvoiceDataExtractionResult(textExtractionResult.error, null)
|
|
||||||
}
|
|
||||||
|
|
||||||
val pdfText = textExtractionResult.text
|
|
||||||
val result = invoiceDataExtractor.extractInvoiceData(pdfText)
|
|
||||||
|
|
||||||
return if (result.error != null) {
|
|
||||||
PdfInvoiceDataExtractionResult(result.error, null)
|
|
||||||
} else if (result.potentialTotalAmount == null) {
|
|
||||||
PdfInvoiceDataExtractionResult(IllegalStateException("Could not find total amount of invoice in PDF $file"), null)
|
|
||||||
} else {
|
|
||||||
PdfInvoiceDataExtractionResult(null, mapInvoiceData(result, pdfText))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
protected open fun extractTextFromPdf(file: File): PdfTextExtractorResult =
|
|
||||||
textExtractor.extractTextFromPdf(file)
|
|
||||||
|
|
||||||
|
|
||||||
protected open fun mapInvoiceData(result: InvoiceData, pdfText: String) = PdfInvoiceData(
|
|
||||||
mapAmount(result.potentialTotalAmount)!!, mapAmount(result.potentialNetAmount),
|
|
||||||
mapAmount(result.potentialValueAddedTax), result.potentialValueAddedTaxRate?.amount,
|
|
||||||
|
|
||||||
result.potentialIban, result.potentialBic,
|
|
||||||
|
|
||||||
result.allAmounts.mapNotNull { mapAmount(it) }, result.percentages.mapNotNull { mapAmount(it) },
|
|
||||||
|
|
||||||
result.dates.map { LocalDate.of(it.year, it.month, it.day) },
|
|
||||||
|
|
||||||
result.ibans.map { it.hit }, result.bics.map { it.hit },
|
|
||||||
|
|
||||||
pdfText
|
|
||||||
)
|
|
||||||
|
|
||||||
protected open fun mapAmount(amount: net.dankito.text.extraction.info.model.AmountOfMoney?) =
|
|
||||||
amount?.let { AmountOfMoney(it.amount, it.currency, it.amountWithCurrency) }
|
|
||||||
|
|
||||||
}
|
|
|
@ -1,9 +0,0 @@
|
||||||
package net.codinux.invoicing.pdf
|
|
||||||
|
|
||||||
import java.io.File
|
|
||||||
|
|
||||||
interface PdfTextExtractor {
|
|
||||||
|
|
||||||
fun extractTextFromPdf(pdfFile: File): PdfTextExtractorResult
|
|
||||||
|
|
||||||
}
|
|
|
@ -1,10 +0,0 @@
|
||||||
package net.codinux.invoicing.pdf
|
|
||||||
|
|
||||||
data class PdfTextExtractorResult(
|
|
||||||
val text: String?,
|
|
||||||
val error: Throwable?
|
|
||||||
) {
|
|
||||||
override fun toString() =
|
|
||||||
if (text != null) "Success: $text"
|
|
||||||
else "Error: $error"
|
|
||||||
}
|
|
|
@ -1,17 +0,0 @@
|
||||||
package net.codinux.invoicing.util
|
|
||||||
|
|
||||||
open class ExceptionHelper {
|
|
||||||
|
|
||||||
open fun getInnerException(exception: Exception, maxDepth: Int = 3): Exception {
|
|
||||||
var innerException = exception
|
|
||||||
var depth = 0
|
|
||||||
|
|
||||||
while(innerException.cause is Exception && depth < maxDepth) {
|
|
||||||
innerException = innerException.cause as Exception
|
|
||||||
depth++
|
|
||||||
}
|
|
||||||
|
|
||||||
return innerException
|
|
||||||
}
|
|
||||||
|
|
||||||
}
|
|
|
@ -14,13 +14,8 @@ kotlinCoroutinesVersion=1.9.0
|
||||||
quarkusVersion=3.16.3
|
quarkusVersion=3.16.3
|
||||||
|
|
||||||
|
|
||||||
# Mustang 2.14 pulls PDFBox 3.x on the classpath, which is incompatible with PDFBox 2.x used by pdfbox-text-extractor
|
|
||||||
# but Mustang version 2.13 and 2.12 is missing its dependencies in pom.xml
|
|
||||||
mustangVersion=2.14.2
|
mustangVersion=2.14.2
|
||||||
|
|
||||||
textInfoExtractor=1.0.3
|
|
||||||
pdfboxTextExtractor=0.6.1
|
|
||||||
|
|
||||||
angusMailVersion=2.0.3
|
angusMailVersion=2.0.3
|
||||||
|
|
||||||
klfVersion=1.6.2
|
klfVersion=1.6.2
|
||||||
|
|
Loading…
Reference in New Issue