From 5369a54caaff2b484f7c3c690d1a83893a9e10e1 Mon Sep 17 00:00:00 2001
From: cyian-1756
Date: Mon, 30 Apr 2018 13:22:51 -0400
Subject: [PATCH] Added ripper and unit test for dynasty-scans.com

---
Note: the blob ids on the index lines below are carried over unchanged and
do not correspond to the revised file contents.

 .../ripper/rippers/DynastyscansRipper.java    | 132 ++++++++++++++++++
 .../rippers/DynastyscansRipperTest.java       |  20 +++
 2 files changed, 152 insertions(+)
 create mode 100644 src/main/java/com/rarchives/ripme/ripper/rippers/DynastyscansRipper.java
 create mode 100644 src/test/java/com/rarchives/ripme/tst/ripper/rippers/DynastyscansRipperTest.java

diff --git a/src/main/java/com/rarchives/ripme/ripper/rippers/DynastyscansRipper.java b/src/main/java/com/rarchives/ripme/ripper/rippers/DynastyscansRipper.java
new file mode 100644
index 00000000..37d3ad93
--- /dev/null
+++ b/src/main/java/com/rarchives/ripme/ripper/rippers/DynastyscansRipper.java
@@ -0,0 +1,132 @@
+package com.rarchives.ripme.ripper.rippers;
+
+import java.io.IOException;
+import java.net.MalformedURLException;
+import java.net.URL;
+import java.util.ArrayList;
+import java.util.List;
+import java.util.regex.Matcher;
+import java.util.regex.Pattern;
+
+import org.json.JSONArray;
+import org.json.JSONTokener;
+import org.jsoup.nodes.Document;
+import org.jsoup.nodes.Element;
+
+import com.rarchives.ripme.ripper.AbstractHTMLRipper;
+import com.rarchives.ripme.utils.Http;
+
+/**
+ * Ripper for chapter pages on dynasty-scans.com.
+ *
+ * Image paths are read from the JSON array assigned to {@code var pages}
+ * in one of the page's inline script elements.
+ */
+public class DynastyscansRipper extends AbstractHTMLRipper {
+
+    /** Prepended to the site-relative paths taken from links and from the pages array. */
+    private static final String BASE_URL = "https://dynasty-scans.com";
+
+    /** Chapter URL; group 1 is the chapter ID with any trailing slash left out. */
+    private static final Pattern CHAPTER_URL =
+            Pattern.compile("https?://dynasty-scans\\.com/chapters/(\\S+?)/?$");
+
+    /** Text that identifies the inline script holding the page list. */
+    private static final String PAGES_MARKER = "var pages";
+
+    public DynastyscansRipper(URL url) throws IOException {
+        super(url);
+    }
+
+    @Override
+    public String getHost() {
+        return "dynasty-scans";
+    }
+
+    @Override
+    public String getDomain() {
+        return "dynasty-scans.com";
+    }
+
+    /**
+     * Extracts the chapter ID from a chapter URL.
+     *
+     * @param url URL of the form dynasty-scans.com/chapters/ID
+     * @return the ID, without a trailing slash
+     * @throws MalformedURLException if the URL does not have that form
+     */
+    @Override
+    public String getGID(URL url) throws MalformedURLException {
+        Matcher m = CHAPTER_URL.matcher(url.toExternalForm());
+        if (m.matches()) {
+            return m.group(1);
+        }
+        throw new MalformedURLException("Expected dynasty-scans URL format: " +
+                "dynasty-scans.com/chapters/ID - got " + url + " instead");
+    }
+
+    @Override
+    public Document getFirstPage() throws IOException {
+        // "url" is an instance field of the superclass
+        return Http.url(url).get();
+    }
+
+    /**
+     * Follows the {@code next_link} anchor of the given page.
+     *
+     * @throws IOException if the anchor is missing or its href is "#"
+     */
+    @Override
+    public Document getNextPage(Document doc) throws IOException {
+        Element elem = doc.select("a[id=next_link]").first();
+        if (elem == null || elem.attr("href").equals("#")) {
+            throw new IOException("No more pages");
+        }
+        return Http.url(BASE_URL + elem.attr("href")).get();
+    }
+
+    /**
+     * Builds absolute image URLs from the page list embedded in the document.
+     *
+     * @return one URL per entry of the pages array, or an empty list when the
+     *         document contains no pages array
+     */
+    @Override
+    public List<String> getURLsFromPage(Document doc) {
+        List<String> result = new ArrayList<>();
+        JSONArray imageArray = findPagesArray(doc);
+        if (imageArray == null) {
+            return result;
+        }
+        for (int i = 0; i < imageArray.length(); i++) {
+            result.add(BASE_URL + imageArray.getJSONObject(i).getString("image"));
+        }
+        return result;
+    }
+
+    /**
+     * Parses the array literal that follows {@code var pages} in the first script containing it.
+     *
+     * Parsing starts at the array's opening bracket, so whatever precedes the
+     * assignment in the script never reaches the parser, and the JSON text itself
+     * is handed over unmodified (no blanket string replacement that could alter
+     * values inside it).
+     *
+     * @return the parsed array, or {@code null} if no script declares one
+     */
+    private static JSONArray findPagesArray(Document doc) {
+        for (Element script : doc.select("script")) {
+            String data = script.data();
+            int marker = data.indexOf(PAGES_MARKER);
+            int arrayStart = marker < 0 ? -1 : data.indexOf('[', marker);
+            if (arrayStart >= 0) {
+                return new JSONArray(new JSONTokener(data.substring(arrayStart)));
+            }
+        }
+        return null;
+    }
+
+    @Override
+    public void downloadURL(URL url, int index) {
+        addURLToDownload(url, getPrefix(index));
+    }
+}
diff --git a/src/test/java/com/rarchives/ripme/tst/ripper/rippers/DynastyscansRipperTest.java b/src/test/java/com/rarchives/ripme/tst/ripper/rippers/DynastyscansRipperTest.java
new file mode 100644
index 00000000..8eb8d88f
--- /dev/null
+++ b/src/test/java/com/rarchives/ripme/tst/ripper/rippers/DynastyscansRipperTest.java
@@ -0,0 +1,20 @@
+package com.rarchives.ripme.tst.ripper.rippers;
+
+import java.io.IOException;
+import java.net.URL;
+
+import com.rarchives.ripme.ripper.rippers.DynastyscansRipper;
+
+public class DynastyscansRipperTest extends RippersTest {
+    public void testRip() throws IOException {
+        DynastyscansRipper ripper = new DynastyscansRipper(new URL("https://dynasty-scans.com/chapters/under_one_roof_ch01"));
+        testRipper(ripper);
+    }
+
+    public void testGetGID() throws IOException {
+        DynastyscansRipper ripper = new DynastyscansRipper(new URL("https://dynasty-scans.com/chapters/under_one_roof_ch01"));
+        assertEquals("under_one_roof_ch01", ripper.getGID(new URL("https://dynasty-scans.com/chapters/under_one_roof_ch01")));
+        // A trailing slash must not become part of the ID.
+        assertEquals("under_one_roof_ch01", ripper.getGID(new URL("https://dynasty-scans.com/chapters/under_one_roof_ch01/")));
+    }
+}