feat(metadata-extractor): allow de-AMP plugin to change our target URL

This commit is contained in:
Harsh Shandilya 2022-10-05 12:23:04 +05:30
parent 8060c347cc
commit 8eee42ae0f
No known key found for this signature in database

View file

@@ -1,6 +1,7 @@
 package dev.msfjarvis.claw.metadata
 import com.chimbori.crux.Crux
+import com.chimbori.crux.api.Fields.CANONICAL_URL
 import com.chimbori.crux.api.Fields.DURATION_MS
 import com.chimbori.crux.api.Fields.FAVICON_URL
 import dev.msfjarvis.claw.model.LinkMetadata
@@ -30,8 +31,9 @@ constructor(
 val extractedMetadata = crux.extractFrom(parsedUrl, Jsoup.parse(htmlContent, url))
 val faviconUrl = extractedMetadata.urls[FAVICON_URL].toString()
 val readingTime = extractedMetadata[DURATION_MS]
+val overriddenUrl = extractedMetadata[CANONICAL_URL] ?: url
 LinkMetadata(
-url = url,
+url = overriddenUrl,
 faviconUrl = faviconUrl,
 readingTime = readingTime,
 )