mirror of
https://github.com/msfjarvis/compose-lobsters
synced 2025-08-16 12:47:02 +05:30
feat(metadata-extractor): allow de-AMP plugin to change our target URL
This commit is contained in:
parent
8060c347cc
commit
8eee42ae0f
1 changed file with 3 additions and 1 deletion
|
@@ -1,6 +1,7 @@
|
||||||
package dev.msfjarvis.claw.metadata
|
package dev.msfjarvis.claw.metadata
|
||||||
|
|
||||||
import com.chimbori.crux.Crux
|
import com.chimbori.crux.Crux
|
||||||
|
import com.chimbori.crux.api.Fields.CANONICAL_URL
|
||||||
import com.chimbori.crux.api.Fields.DURATION_MS
|
import com.chimbori.crux.api.Fields.DURATION_MS
|
||||||
import com.chimbori.crux.api.Fields.FAVICON_URL
|
import com.chimbori.crux.api.Fields.FAVICON_URL
|
||||||
import dev.msfjarvis.claw.model.LinkMetadata
|
import dev.msfjarvis.claw.model.LinkMetadata
|
||||||
|
@@ -30,8 +31,9 @@ constructor(
|
||||||
val extractedMetadata = crux.extractFrom(parsedUrl, Jsoup.parse(htmlContent, url))
|
val extractedMetadata = crux.extractFrom(parsedUrl, Jsoup.parse(htmlContent, url))
|
||||||
val faviconUrl = extractedMetadata.urls[FAVICON_URL].toString()
|
val faviconUrl = extractedMetadata.urls[FAVICON_URL].toString()
|
||||||
val readingTime = extractedMetadata[DURATION_MS]
|
val readingTime = extractedMetadata[DURATION_MS]
|
||||||
|
val overriddenUrl = extractedMetadata[CANONICAL_URL] ?: url
|
||||||
LinkMetadata(
|
LinkMetadata(
|
||||||
url = url,
|
url = overriddenUrl,
|
||||||
faviconUrl = faviconUrl,
|
faviconUrl = faviconUrl,
|
||||||
readingTime = readingTime,
|
readingTime = readingTime,
|
||||||
)
|
)
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue