Add HTML filter and state.
authorDavid ‘Bombe’ Roden <bombe@pterodactylus.net>
Wed, 2 Jan 2013 17:56:21 +0000 (18:56 +0100)
committerDavid ‘Bombe’ Roden <bombe@pterodactylus.net>
Wed, 2 Jan 2013 20:15:04 +0000 (21:15 +0100)
pom.xml
src/main/java/net/pterodactylus/reactor/filters/HtmlFilter.java [new file with mode: 0644]
src/main/java/net/pterodactylus/reactor/states/HtmlState.java [new file with mode: 0644]

diff --git a/pom.xml b/pom.xml
index 3d6265c..d16a214 100644 (file)
--- a/pom.xml
+++ b/pom.xml
                        <artifactId>httpclient</artifactId>
                        <version>4.2.2</version>
                </dependency>
+               <dependency>
+                       <groupId>org.jsoup</groupId>
+                       <artifactId>jsoup</artifactId>
+                       <version>1.7.1</version>
+               </dependency>
        </dependencies>
 </project>
diff --git a/src/main/java/net/pterodactylus/reactor/filters/HtmlFilter.java b/src/main/java/net/pterodactylus/reactor/filters/HtmlFilter.java
new file mode 100644 (file)
index 0000000..83b961d
--- /dev/null
@@ -0,0 +1,50 @@
+/*
+ * Reactor - HtmlFilter.java - Copyright © 2013 David Roden
+ *
+ * This program is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+package net.pterodactylus.reactor.filters;
+
+import static com.google.common.base.Preconditions.checkState;
+import net.pterodactylus.reactor.Filter;
+import net.pterodactylus.reactor.State;
+import net.pterodactylus.reactor.states.FailedState;
+import net.pterodactylus.reactor.states.HtmlState;
+import net.pterodactylus.reactor.states.HttpState;
+
+import org.jsoup.Jsoup;
+import org.jsoup.nodes.Document;
+
+/**
+ * {@link Filter} that converts a {@link HttpState} into an {@link HtmlState}.
+ *
+ * @author <a href="mailto:bombe@pterodactylus.net">David ‘Bombe’ Roden</a>
+ */
+public class HtmlFilter implements Filter {
+
+       /**
+        * {@inheritDoc}
+        */
+       @Override
+       public State filter(State state) {
+               if (!state.success()) {
+                       return FailedState.from(state);
+               }
+               checkState(state instanceof HttpState, "state is not a HttpState but a %s", state.getClass().getName());
+               Document document = Jsoup.parse(((HttpState) state).content(), ((HttpState) state).uri());
+               return new HtmlState(((HttpState) state).uri(), document);
+       }
+
+}
diff --git a/src/main/java/net/pterodactylus/reactor/states/HtmlState.java b/src/main/java/net/pterodactylus/reactor/states/HtmlState.java
new file mode 100644 (file)
index 0000000..ce89a98
--- /dev/null
@@ -0,0 +1,84 @@
+/*
+ * Reactor - HtmlState.java - Copyright © 2013 David Roden
+ *
+ * This program is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+package net.pterodactylus.reactor.states;
+
+import net.pterodactylus.reactor.State;
+
+import org.jsoup.nodes.Document;
+
+/**
+ * {@link State} implementation that contains a parsed HTML {@link Document}.
+ *
+ * @author <a href="mailto:bombe@pterodactylus.net">David ‘Bombe’ Roden</a>
+ */
+public class HtmlState extends AbstractState {
+
+       /** The URI of the parsed document. */
+       private final String uri;
+
+       /** The parsed document. */
+       private final Document document;
+
+       /**
+        * Creates a new HTML state.
+        *
+        * @param uri
+        *            The URI of the parsed document
+        * @param document
+        *            The parsed documnet
+        */
+       public HtmlState(String uri, Document document) {
+               this.uri = uri;
+               this.document = document;
+       }
+
+       //
+       // ACCESSORS
+       //
+
+       /**
+        * Returns the URI of the parsed document.
+        *
+        * @return The URI of the parsed document
+        */
+       public String uri() {
+               return uri;
+       }
+
+       /**
+        * Returns the parsed document.
+        *
+        * @return The parsed document
+        */
+       public Document document() {
+               return document;
+       }
+
+       //
+       // OBJECT METHODS
+       //
+
+       /**
+        * {@inheritDoc}
+        */
+       @Override
+       public String toString() {
+               return String.format("%s[document=(%s chars)]", getClass().getSimpleName(), document().toString().length());
+       }
+
+}