ImgScroll/src/main/java/com/rarchives/ripme/ripper/rippers/VineboxRipper.java

80 lines
2.3 KiB
Java
Raw Normal View History

2014-03-08 11:38:52 +01:00
package com.rarchives.ripme.ripper.rippers;
import java.io.IOException;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import org.apache.log4j.Logger;
import org.jsoup.HttpStatusException;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import com.rarchives.ripme.ripper.AbstractRipper;
public class VineboxRipper extends AbstractRipper {
private static final String DOMAIN = "vinebox.co",
HOST = "vinebox";
private static final Logger logger = Logger.getLogger(VineboxRipper.class);
public VineboxRipper(URL url) throws IOException {
super(url);
}
@Override
public boolean canRip(URL url) {
return url.getHost().endsWith(DOMAIN);
}
@Override
public URL sanitizeURL(URL url) throws MalformedURLException {
2014-03-08 20:23:21 +01:00
return new URL("http://vinebox.co/u/" + getGID(url));
2014-03-08 11:38:52 +01:00
}
@Override
public void rip() throws IOException {
int page = 0;
Document doc;
while (true) {
page++;
String urlPaged = this.url.toExternalForm() + "?page=" + page;
logger.info(" Retrieving " + urlPaged);
2014-03-08 11:38:52 +01:00
try {
doc = Jsoup.connect(urlPaged).get();
} catch (HttpStatusException e) {
logger.debug("Hit end of pages at page " + page, e);
break;
}
for (Element element : doc.select("video")) {
addURLToDownload(new URL(element.attr("src")));
}
try {
Thread.sleep(1000);
} catch (InterruptedException e) {
logger.error("[!] Interrupted while waiting to load next page", e);
break;
}
}
waitForThreads();
}
@Override
public String getHost() {
return HOST;
}
@Override
public String getGID(URL url) throws MalformedURLException {
Pattern p = Pattern.compile("^https?://(www\\.)?vinebox\\.co/u/([a-zA-Z0-9]{1,}).*$");
Matcher m = p.matcher(url.toExternalForm());
if (!m.matches()) {
throw new MalformedURLException("Expected format: http://vinebox.co/u/USERNAME");
}
return m.group(m.groupCount());
}
}