From 3ebb7d1874e61f6f06c9e670b9106f07e8f265ac Mon Sep 17 00:00:00 2001
From: cyian-1756
Date: Sun, 17 Jun 2018 15:55:57 -0400
Subject: [PATCH 1/3] Started work on Picstatio ripper

---
Review notes (ignored by git am):
 - getNextPage: jsoup's select() never returns null, so the old null check
   could not detect the last page; the next-page href is tested instead.
 - getGID: dots in the pattern are escaped, the ID character class accepts
   0-9 (it was 1-9), and the error message no longer shows a double slash.
 - getURLsFromPage: each wallpaper is resolved once instead of twice, failed
   or empty lookups are skipped, and short hrefs no longer index past the
   end of the split array.
 - getFullSizedImageFromURL: failures go through LOGGER, not printStackTrace.
 - Both files now end with a newline.
 - Blob ids on the "index" lines are carried over from the first revision of
   this series and do not describe the revised content.

 .../ripme/ripper/rippers/PicstatioRipper.java | 107 +++++++++++++++++++
 1 file changed, 107 insertions(+)
 create mode 100644 src/main/java/com/rarchives/ripme/ripper/rippers/PicstatioRipper.java

diff --git a/src/main/java/com/rarchives/ripme/ripper/rippers/PicstatioRipper.java b/src/main/java/com/rarchives/ripme/ripper/rippers/PicstatioRipper.java
new file mode 100644
index 00000000..29c71a08
--- /dev/null
+++ b/src/main/java/com/rarchives/ripme/ripper/rippers/PicstatioRipper.java
@@ -0,0 +1,107 @@
+package com.rarchives.ripme.ripper.rippers;
+
+import java.io.IOException;
+import java.net.MalformedURLException;
+import java.net.URL;
+import java.util.ArrayList;
+import java.util.List;
+import java.util.regex.Matcher;
+import java.util.regex.Pattern;
+
+import org.jsoup.nodes.Document;
+import org.jsoup.nodes.Element;
+
+import com.rarchives.ripme.ripper.AbstractHTMLRipper;
+import com.rarchives.ripme.utils.Http;
+
+/**
+ * Rips the wallpapers listed on a picstatio.com page.
+ */
+public class PicstatioRipper extends AbstractHTMLRipper {
+
+    private static final String BASE_URL = "https://www.picstatio.com";
+
+    public PicstatioRipper(URL url) throws IOException {
+        super(url);
+    }
+
+    /**
+     * Loads a wallpaper's download page and reads the link to the full sized image from it.
+     *
+     * @param fileName name of the wallpaper as used in its picstatio URL
+     * @return href of the download link (empty if the page has no such link),
+     *         or null if the download page could not be fetched
+     */
+    private String getFullSizedImageFromURL(String fileName) {
+        String downloadPage = BASE_URL + "/wallpaper/" + fileName + "/download";
+        try {
+            return Http.url(downloadPage).get().select("p.text-center > a").attr("href");
+        } catch (IOException e) {
+            // Best effort: the caller skips wallpapers that could not be resolved
+            LOGGER.error("Unable to load " + downloadPage, e);
+            return null;
+        }
+    }
+
+    @Override
+    public String getHost() {
+        return "picstatio";
+    }
+
+    @Override
+    public String getDomain() {
+        return "picstatio.com";
+    }
+
+    @Override
+    public String getGID(URL url) throws MalformedURLException {
+        // Dots are escaped to match literally and the ID may contain any digit, 0 included
+        Pattern p = Pattern.compile("https?://www\\.picstatio\\.com/([a-zA-Z0-9_-]*)/?$");
+        Matcher m = p.matcher(url.toExternalForm());
+        if (m.matches()) {
+            return m.group(1);
+        }
+        throw new MalformedURLException("Expected picstatio URL format: " +
+                "www.picstatio.com/ID - got " + url + " instead");
+    }
+
+    @Override
+    public Document getFirstPage() throws IOException {
+        // "url" is an instance field of the superclass
+        return Http.url(url).get();
+    }
+
+    @Override
+    public Document getNextPage(Document doc) throws IOException {
+        // select() never returns null, so the last page is detected by the missing href instead
+        String nextHref = doc.select("a.next_page").attr("href");
+        if (nextHref.isEmpty()) {
+            throw new IOException("No more pages");
+        }
+        return Http.url(BASE_URL + nextHref).get();
+    }
+
+    @Override
+    public List<String> getURLsFromPage(Document doc) {
+        List<String> result = new ArrayList<>();
+        for (Element e : doc.select("img.img")) {
+            // The wallpaper name is the third "/"-separated piece of the parent element's href
+            String[] hrefParts = e.parent().attr("href").split("/");
+            if (hrefParts.length < 3) {
+                continue;
+            }
+            // Resolve each wallpaper once; every lookup is a separate HTTP request
+            String fullSizedImage = getFullSizedImageFromURL(hrefParts[2]);
+            if (fullSizedImage != null && !fullSizedImage.isEmpty()) {
+                LOGGER.info(fullSizedImage);
+                result.add(fullSizedImage);
+            }
+        }
+        return result;
+    }
+
+    @Override
+    public void downloadURL(URL url, int index) {
+        addURLToDownload(url, getPrefix(index));
+    }
+}

From f34b1273f5a38fa494c1bd9b9ec6119a80aa676a Mon Sep 17 00:00:00 2001
From: cyian-1756
Date: Mon, 18 Jun 2018 11:29:10 -0400
Subject: [PATCH 2/3] Got PicstatioRipper working

---
 .../com/rarchives/ripme/ripper/rippers/PicstatioRipper.java    | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/main/java/com/rarchives/ripme/ripper/rippers/PicstatioRipper.java b/src/main/java/com/rarchives/ripme/ripper/rippers/PicstatioRipper.java
index 29c71a08..1bd103b5 100644
--- a/src/main/java/com/rarchives/ripme/ripper/rippers/PicstatioRipper.java
+++ b/src/main/java/com/rarchives/ripme/ripper/rippers/PicstatioRipper.java
@@ -35,7 +35,8 @@ public class PicstatioRipper extends AbstractHTMLRipper {
     private String getFullSizedImageFromURL(String fileName) {
         String downloadPage = BASE_URL + "/wallpaper/" + fileName + "/download";
         try {
-            return Http.url(downloadPage).get().select("p.text-center > a").attr("href");
+            LOGGER.info(downloadPage);
+            return Http.url(downloadPage).get().select("p.text-center > span > a").attr("href");
         } catch (IOException e) {
             // Best effort: the caller skips wallpapers that could not be resolved
             LOGGER.error("Unable to load " + downloadPage, e);

From 7102bdec6f478c21521c84ddf6bacbf5fd265c13 Mon Sep 17 00:00:00 2001
From: cyian-1756
Date: Mon, 18 Jun 2018 11:37:24 -0400
Subject: [PATCH 3/3] Added PicstatioRipper unit test

---
 .../ripper/rippers/PicstatioRipperTest.java   | 21 +++++++++++++++++++
 1 file changed, 21 insertions(+)
 create mode 100644 src/test/java/com/rarchives/ripme/tst/ripper/rippers/PicstatioRipperTest.java

diff --git a/src/test/java/com/rarchives/ripme/tst/ripper/rippers/PicstatioRipperTest.java b/src/test/java/com/rarchives/ripme/tst/ripper/rippers/PicstatioRipperTest.java
new file mode 100644
index 00000000..606cd569
--- /dev/null
+++ b/src/test/java/com/rarchives/ripme/tst/ripper/rippers/PicstatioRipperTest.java
@@ -0,0 +1,21 @@
+package com.rarchives.ripme.tst.ripper.rippers;
+
+import java.io.IOException;
+import java.net.URL;
+
+import com.rarchives.ripme.ripper.rippers.PicstatioRipper;
+
+public class PicstatioRipperTest extends RippersTest {
+
+    public void testRip() throws IOException {
+        PicstatioRipper ripper = new PicstatioRipper(new URL("https://www.picstatio.com/aerial-view-wallpapers"));
+        testRipper(ripper);
+    }
+
+    public void testGID() throws IOException {
+        PicstatioRipper ripper = new PicstatioRipper(new URL("https://www.picstatio.com/aerial-view-wallpapers"));
+        assertEquals("aerial-view-wallpapers", ripper.getGID(new URL("https://www.picstatio.com/aerial-view-wallpapers")));
+        // IDs may contain any digit, including 0
+        assertEquals("1080p-wallpapers", ripper.getGID(new URL("https://www.picstatio.com/1080p-wallpapers")));
+    }
+}