Add HTML parsing to element loader
[Sone.git] / src / test / kotlin / net / pterodactylus / sone / core / DefaultElementLoaderTest.kt
index 03b42c3..ed66dd9 100644 (file)
@@ -8,6 +8,7 @@ import net.pterodactylus.sone.test.capture
 import net.pterodactylus.sone.test.mock
 import org.hamcrest.MatcherAssert.assertThat
 import org.hamcrest.Matchers.`is`
+import org.hamcrest.Matchers.equalTo
 import org.junit.Test
 import org.mockito.ArgumentMatchers.any
 import org.mockito.ArgumentMatchers.eq
@@ -27,6 +28,7 @@ class DefaultElementLoaderTest {
                private val freenetURI = FreenetURI(IMAGE_ID)
                private const val decomposedKey = "CHK@DCiVgTWW9nnWHJc9EVwtFJ6jAfBSVyy~rgiPvhUKbS4,mNY85V0x7dYcv7SnEYo1PCC6y2wNWMDNt-y9UWQx9fI,AAMC--8/fru%CC%88hstu%CC%88ck.jpg"
                private const val normalizedKey = "CHK@DCiVgTWW9nnWHJc9EVwtFJ6jAfBSVyy~rgiPvhUKbS4,mNY85V0x7dYcv7SnEYo1PCC6y2wNWMDNt-y9UWQx9fI,AAMC--8/frühstück.jpg"
+               private const val textKey = "KSK@gpl.html"
                private val sizeOkay = 2097152L
                private val sizeNotOkay = sizeOkay + 1
        }
@@ -99,6 +101,62 @@ class DefaultElementLoaderTest {
        }
 
        @Test
+       fun `element loader can extract description from description header`() {
+           elementLoader.loadElement(textKey)
+               verify(freenetInterface).startFetch(eq(FreenetURI(textKey)), callback.capture())
+               callback.value.loaded(FreenetURI(textKey), "text/html; charset=UTF-8", read("element-loader.html"))
+               val linkedElement = elementLoader.loadElement(textKey)
+               assertThat(linkedElement, equalTo(LinkedElement(textKey, properties = mapOf(
+                               "size" to 266,
+                               "sizeHuman" to "266 B",
+                               "title" to "Some Nice Page Title",
+                               "description" to "This is an example of a very nice freesite."
+               ))))
+       }
+
+       @Test
+       fun `element loader can extract description from first non-heading paragraph`() {
+           elementLoader.loadElement(textKey)
+               verify(freenetInterface).startFetch(eq(FreenetURI(textKey)), callback.capture())
+               callback.value.loaded(FreenetURI(textKey), "text/html; charset=UTF-8", read("element-loader2.html"))
+               val linkedElement = elementLoader.loadElement(textKey)
+               assertThat(linkedElement, equalTo(LinkedElement(textKey, properties = mapOf(
+                               "size" to 185,
+                               "sizeHuman" to "185 B",
+                               "title" to "Some Nice Page Title",
+                               "description" to "This is the first paragraph of the very nice freesite."
+               ))))
+       }
+
+       @Test
+       fun `element loader can not extract description if html is more complicated`() {
+           elementLoader.loadElement(textKey)
+               verify(freenetInterface).startFetch(eq(FreenetURI(textKey)), callback.capture())
+               callback.value.loaded(FreenetURI(textKey), "text/html; charset=UTF-8", read("element-loader3.html"))
+               val linkedElement = elementLoader.loadElement(textKey)
+               assertThat(linkedElement, equalTo(LinkedElement(textKey, properties = mapOf(
+                               "size" to 204,
+                               "sizeHuman" to "204 B",
+                               "title" to "Some Nice Page Title",
+                               "description" to null
+               ))))
+       }
+
+       @Test
+       fun `element loader can not extract title if it is missing`() {
+           elementLoader.loadElement(textKey)
+               verify(freenetInterface).startFetch(eq(FreenetURI(textKey)), callback.capture())
+               callback.value.loaded(FreenetURI(textKey), "text/html; charset=UTF-8", read("element-loader4.html"))
+               val linkedElement = elementLoader.loadElement(textKey)
+               assertThat(linkedElement, equalTo(LinkedElement(textKey, properties = mapOf(
+                               "size" to 229,
+                               "sizeHuman" to "229 B",
+                               "title" to null,
+                               "description" to "This is an example of a very nice freesite."
+               ))))
+       }
+
+       @Test
        fun `image is not loaded again after it failed`() {
                elementLoader.loadElement(IMAGE_ID)
                verify(freenetInterface).startFetch(eq(freenetURI), callback.capture())