From 9bb2923cab6693bd736c1bd7d297e94e9d81d150 Mon Sep 17 00:00:00 2001
From: =?utf8?q?David=20=E2=80=98Bombe=E2=80=99=20Roden?=
Date: Wed, 2 Jan 2013 19:02:37 +0100
Subject: [PATCH] Add filter to extract a torrent state from an HTML state.

---
 .../reactor/filters/KickAssTorrentsFilter.java     | 162 +++++++++++++++++++++
 1 file changed, 162 insertions(+)
 create mode 100644 src/main/java/net/pterodactylus/reactor/filters/KickAssTorrentsFilter.java

diff --git a/src/main/java/net/pterodactylus/reactor/filters/KickAssTorrentsFilter.java b/src/main/java/net/pterodactylus/reactor/filters/KickAssTorrentsFilter.java
new file mode 100644
index 0000000..02a356a
--- /dev/null
+++ b/src/main/java/net/pterodactylus/reactor/filters/KickAssTorrentsFilter.java
@@ -0,0 +1,162 @@
+/*
+ * Reactor - KickAssTorrentsFilter.java - Copyright © 2013 David Roden
+ *
+ * This program is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program. If not, see <http://www.gnu.org/licenses/>.
+ */
+
+package net.pterodactylus.reactor.filters;
+
+import static com.google.common.base.Preconditions.checkState;
+
+import java.net.URI;
+import java.net.URISyntaxException;
+
+import net.pterodactylus.reactor.Filter;
+import net.pterodactylus.reactor.State;
+import net.pterodactylus.reactor.queries.HttpQuery;
+import net.pterodactylus.reactor.states.FailedState;
+import net.pterodactylus.reactor.states.HtmlState;
+import net.pterodactylus.reactor.states.TorrentState;
+import net.pterodactylus.reactor.states.TorrentState.TorrentFile;
+
+import org.jsoup.nodes.Document;
+import org.jsoup.nodes.Element;
+import org.jsoup.select.Elements;
+
+/**
+ * {@link Filter} implementation that parses a {@link TorrentState} from an
+ * {@link HtmlState} which was generated by a {@link HttpQuery} to
+ * {@code kickasstorrents.ph}.
+ *
+ * @author David ‘Bombe’ Roden
+ */
+public class KickAssTorrentsFilter implements Filter {
+
+    /**
+     * Parses the torrent files from the result table of the given state.
+     * <p>
+     * A state that was not successful is turned into a {@link FailedState}, as
+     * is a document that does not contain a {@code table.data} element. Rows
+     * whose download link can not be resolved against the URI of the state are
+     * skipped; if that URI itself can not be parsed, no torrent file is added.
+     *
+     * @param state
+     *            The state to filter; if it is successful it has to be an
+     *            {@link HtmlState}
+     * @return A {@link TorrentState} with the torrent files that were found,
+     *         or a {@link FailedState}
+     * @throws IllegalStateException
+     *             if the state is successful but not an {@link HtmlState}
+     */
+    @Override
+    public State filter(State state) {
+        if (!state.success()) {
+            return FailedState.from(state);
+        }
+        checkState(state instanceof HtmlState, "state is not an HtmlState but a %s", state.getClass().getName());
+        HtmlState htmlState = (HtmlState) state;
+
+        /* get result table. */
+        Document document = htmlState.document();
+        Elements mainTable = document.select("table.data");
+        if (mainTable.isEmpty()) {
+            /* no main table? */
+            return new FailedState();
+        }
+
+        TorrentState torrentState = new TorrentState();
+        /* :gt(0) leaves out the row at index 0, presumably the table header. */
+        Elements dataRows = mainTable.select("tr:gt(0)");
+        if (dataRows.isEmpty()) {
+            /* nothing to resolve, so the URI of the state is not needed. */
+            return torrentState;
+        }
+
+        /* the base URI is the same for every row, parse it only once. */
+        URI baseUri;
+        try {
+            baseUri = new URI(htmlState.uri());
+        } catch (URISyntaxException use1) {
+            /* without a base URI no link can be resolved, return the empty state. */
+            return torrentState;
+        }
+
+        /* iterate over all rows. */
+        for (Element dataRow : dataRows) {
+            String name = extractName(dataRow);
+            String size = extractSize(dataRow);
+            String magnetUri = extractMagnetUri(dataRow);
+            String downloadLink = extractDownloadUri(dataRow);
+            String downloadUri;
+            try {
+                downloadUri = baseUri.resolve(downloadLink).toString();
+            } catch (IllegalArgumentException iae1) {
+                /* resolve(String) rejects malformed links unchecked; skip this row only. */
+                continue;
+            }
+            torrentState.addTorrentFile(new TorrentFile(name, size, magnetUri, downloadUri));
+        }
+
+        return torrentState;
+    }
+
+    //
+    // STATIC METHODS
+    //
+
+    /**
+     * Extracts the name from the given row.
+     *
+     * @param dataRow
+     *            The row to extract the name from
+     * @return The extracted name
+     */
+    private static String extractName(Element dataRow) {
+        return dataRow.select("div.torrentname a.normalgrey").text();
+    }
+
+    /**
+     * Extracts the size from the given row.
+     *
+     * @param dataRow
+     *            The row to extract the size from
+     * @return The extracted size
+     */
+    private static String extractSize(Element dataRow) {
+        return dataRow.select("td:eq(1)").text();
+    }
+
+    /**
+     * Extracts the magnet URI from the given row.
+     *
+     * @param dataRow
+     *            The row to extract the magnet URI from
+     * @return The extracted magnet URI
+     */
+    private static String extractMagnetUri(Element dataRow) {
+        return dataRow.select("a.imagnet").attr("href");
+    }
+
+    /**
+     * Extracts the download URI from the given row.
+     *
+     * @param dataRow
+     *            The row to extract the download URI from
+     * @return The extracted download URI
+     */
+    private static String extractDownloadUri(Element dataRow) {
+        return dataRow.select("a.idownload:not(.partner1Button)").attr("href");
+    }
+
+}
-- 
2.7.4