ImgScroll/src/main/java/com/rarchives/ripme/ripper/rippers/EHentaiRipper.java

package com.rarchives.ripme.ripper.rippers;

import java.io.File;
import java.io.IOException;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;

import com.rarchives.ripme.ripper.AbstractHTMLRipper;
import com.rarchives.ripme.ripper.DownloadThreadPool;
import com.rarchives.ripme.ui.RipStatusMessage.STATUS;
import com.rarchives.ripme.utils.Http;
import com.rarchives.ripme.utils.Utils;

/**
 * Ripper for e-hentai.org galleries.
 *
 * Gallery index pages are walked one at a time via {@link #getNextPage(Document)};
 * every thumbnail link found on an index page points at an HTML "image" page,
 * which is resolved to a direct image URL on a dedicated thread pool
 * (see {@link EHentaiImageThread}). All page loads go through
 * {@link #getPageWithRetries(URL)}, which backs off when the site answers
 * with its rate-limit notice.
 */
public class EHentaiRipper extends AbstractHTMLRipper {
    // All sleep times are in milliseconds
    private static final int PAGE_SLEEP_TIME     = 3000;
    private static final int IMAGE_SLEEP_TIME    = 1500;
    private static final int IP_BLOCK_SLEEP_TIME = 60  * 1000;

    // Text whose presence in a response is treated as "we are being rate limited"
    private static final String RATE_LIMIT_MARKER = "IP address will be automatically banned";

    // Gallery URL: group 1 is the numeric gallery id, group 2 the hex token
    private static final Pattern GALLERY_URL_PATTERN =
            Pattern.compile("^https?://e-hentai\\.org/g/([0-9]+)/([a-fA-F0-9]+)/$");

    // Direct image URL served through image.php: group 1 is the "n" (file name) parameter
    private static final Pattern IMAGE_PHP_PATTERN =
            Pattern.compile("^https?://.*/ehg/image\\.php.*&n=([^&]+).*$");

    // URL of the most recently loaded index page; used to detect the last page
    private String lastURL = null;

    // Thread pool for finding direct image links from "image" pages (html)
    private final DownloadThreadPool ehentaiThreadPool = new DownloadThreadPool("ehentai");

    /**
     * @return The pool on which the "image" page lookups are scheduled.
     */
    @Override
    public DownloadThreadPool getThreadPool() {
        return ehentaiThreadPool;
    }

    // Current HTML document (first gallery page, cached so it is only fetched once)
    private Document albumDoc = null;

    // Cookies sent with every request. Populated once here and only read afterwards.
    // NOTE(review): presumably these suppress the site's warning/tip interstitials - confirm.
    private static final Map<String,String> cookies = new HashMap<>();
    static {
        cookies.put("nw", "1");
        cookies.put("tip", "1");
    }

    public EHentaiRipper(URL url) throws IOException {
        super(url);
    }

    @Override
    public String getHost() {
        return "e-hentai";
    }

    @Override
    public String getDomain() {
        return "e-hentai.org";
    }

    /**
     * Builds the album title from the gallery's {@code #gn} element.
     * Falls back to the superclass' naming when the page cannot be loaded
     * or does not contain that element.
     *
     * @param url Gallery URL
     * @return {@code getHost() + "_" + <title text>}, or the superclass' title on failure
     * @throws MalformedURLException If the fallback naming rejects the URL
     */
    @Override
    public String getAlbumTitle(URL url) throws MalformedURLException {
        try {
            // Attempt to use album title as GID
            if (albumDoc == null) {
                albumDoc = getPageWithRetries(url);
            }
            // first() yields null when nothing matched; check instead of relying on an NPE
            Element title = albumDoc.select("#gn").first();
            if (title != null) {
                return getHost() + "_" + title.text();
            }
            logger.warn("No title element (#gn) found at " + url);
        } catch (Exception e) {
            // Deliberately broad: the title is best-effort, so any failure
            // falls back to the default album naming convention
            logger.warn("Failed to get album title from " + url, e);
        }
        return super.getAlbumTitle(url);
    }

    /**
     * Derives the gallery id from a gallery URL.
     *
     * @param url Gallery URL of the form {@code http(s)://e-hentai.org/g/<digits>/<hex>/}
     * @return {@code "<digits>-<hex>"}
     * @throws MalformedURLException If the URL does not have the expected gallery format
     */
    @Override
    public String getGID(URL url) throws MalformedURLException {
        Matcher m = GALLERY_URL_PATTERN.matcher(url.toExternalForm());
        if (m.matches()) {
            return m.group(1) + "-" + m.group(2);
        }

        throw new MalformedURLException(
                "Expected e-hentai.org gallery format: "
                        + "http://e-hentai.org/g/####/####/"
                        + " Got: " + url);
    }

    /**
     * Attempts to get page, checks for IP ban, waits.
     * The page is requested with the gallery URL as referrer and the shared cookies.
     * When the response contains the rate-limit notice, the call sleeps for
     * {@code IP_BLOCK_SLEEP_TIME} and tries again, up to 3 retries.
     *
     * @param url Page to load
     * @return Page document
     * @throws IOException If page loading errors, if retries are exhausted,
     *                     or if the thread is interrupted while waiting
     */
    private Document getPageWithRetries(URL url) throws IOException {
        int retries = 3;
        while (true) {
            sendUpdate(STATUS.LOADING_RESOURCE, url.toExternalForm());
            logger.info("Retrieving " + url);
            Document doc = Http.url(url)
                               .referrer(this.url)
                               .cookies(cookies)
                               .get();
            if (!doc.toString().contains(RATE_LIMIT_MARKER)) {
                return doc;
            }
            if (retries == 0) {
                throw new IOException("Hit rate limit and maximum number of retries, giving up");
            }
            logger.warn("Hit rate limit while loading " + url + ", sleeping for " + IP_BLOCK_SLEEP_TIME + "ms, " + retries + " retries remaining");
            retries--;
            try {
                Thread.sleep(IP_BLOCK_SLEEP_TIME);
            } catch (InterruptedException e) {
                // Restore the interrupt flag so code further up the stack can react to it,
                // and keep the original exception as the cause
                Thread.currentThread().interrupt();
                throw new IOException("Interrupted while waiting for rate limit to subside", e);
            }
        }
    }

    /**
     * Loads (or reuses the cached) first gallery page and records its URL
     * as the last visited page.
     *
     * @return First page of the gallery
     * @throws IOException If the page cannot be loaded
     */
    @Override
    public Document getFirstPage() throws IOException {
        if (albumDoc == null) {
            albumDoc = getPageWithRetries(this.url);
        }
        this.lastURL = this.url.toExternalForm();
        return albumDoc;
    }

    /**
     * Loads the page referenced by the last link in the {@code .ptt} navigation bar.
     *
     * @param doc Page currently being processed
     * @return The next page
     * @throws IOException If ripping was stopped, no navigation links exist,
     *                     the last link points at the page just visited
     *                     (i.e. there is no further page), or loading fails
     */
    @Override
    public Document getNextPage(Document doc) throws IOException {
        // Check if we've stopped
        if (isStopped()) {
            throw new IOException("Ripping interrupted");
        }
        // Find next page
        Elements hrefs = doc.select(".ptt a");
        if (hrefs.isEmpty()) {
            logger.info("doc: " + doc.html());
            throw new IOException("No navigation links found");
        }
        // Ensure next page is different from the current page
        String nextURL = hrefs.last().attr("href");
        if (nextURL.equals(this.lastURL)) {
            logger.info("lastURL = nextURL : " + nextURL);
            throw new IOException("Reached last page of results");
        }
        // Sleep before loading next page
        sleep(PAGE_SLEEP_TIME);
        // Load next page
        Document nextPage = getPageWithRetries(new URL(nextURL));
        this.lastURL = nextURL;
        return nextPage;
    }

    /**
     * Collects the links to the HTML "image" pages from a gallery index page.
     *
     * @param page Gallery index page
     * @return The {@code href} of every anchor matched by {@code #gdt > .gdtm a}, in document order
     */
    @Override
    public List<String> getURLsFromPage(Document page) {
        List<String> imageURLs = new ArrayList<>();
        // Iterate over images on page
        for (Element thumb : page.select("#gdt > .gdtm a")) {
            imageURLs.add(thumb.attr("href"));
        }
        return imageURLs;
    }

    /**
     * Queues the lookup of one "image" page on the thread pool, then pauses
     * for {@code IMAGE_SLEEP_TIME} before returning.
     *
     * @param url   URL of the HTML "image" page
     * @param index Position of the image, used for the optional file name prefix
     */
    @Override
    public void downloadURL(URL url, int index) {
        EHentaiImageThread t = new EHentaiImageThread(url, index, this.workingDir);
        ehentaiThreadPool.addThread(t);
        try {
            Thread.sleep(IMAGE_SLEEP_TIME);
        }
        catch (InterruptedException e) {
            logger.warn("Interrupted while waiting to load next image", e);
            // Keep the interrupt visible to the caller instead of silently clearing it
            Thread.currentThread().interrupt();
        }
    }

    /**
     * Makes a file name taken from a remote URL safe to append to the working directory:
     * path separators are replaced so the name cannot point outside that directory,
     * and the special names "." and ".." are neutralised.
     *
     * @param name Raw file name from the image URL
     * @return Name without path separators
     */
    private static String sanitizeFileName(String name) {
        String cleaned = name.replace('/', '_').replace('\\', '_');
        if (cleaned.equals(".") || cleaned.equals("..")) {
            cleaned = cleaned.replace('.', '_');
        }
        return cleaned;
    }

    /**
     * Helper class to find and download images found on "image" pages
     *
     * Handles case when site has IP-banned the user.
     */
    private class EHentaiImageThread extends Thread {
        private final URL url;
        private final int index;
        private final File workingDir;

        EHentaiImageThread(URL url, int index, File workingDir) {
            super();
            this.url = url;
            this.index = index;
            this.workingDir = workingDir;
        }

        @Override
        public void run() {
            fetchImage();
        }

        /**
         * Loads the "image" page, locates the image element and hands its
         * source URL to the downloader. Failures are logged, never thrown.
         */
        private void fetchImage() {
            try {
                Document doc = getPageWithRetries(this.url);

                // Find image
                Elements images = doc.select(".sni > a > img");
                if (images.isEmpty()) {
                    // Attempt to find image elsewise (Issue #41)
                    images = doc.select("img#img");
                    if (images.isEmpty()) {
                        logger.warn("Image not found at " + this.url);
                        return;
                    }
                }
                Element image = images.first();
                String imgsrc = image.attr("src");
                if (imgsrc.isEmpty()) {
                    logger.warn("Image element without src at " + this.url);
                    return;
                }
                logger.info("Found URL " + imgsrc + " via " + image);

                // Optional "001_"-style ordering prefix, shared by both naming strategies
                String prefix = "";
                if (Utils.getConfigBoolean("download.save_order", true)) {
                    prefix = String.format("%03d_", index);
                }

                Matcher m = IMAGE_PHP_PATTERN.matcher(imgsrc);
                if (m.matches()) {
                    // Manually discover filename from URL. The value comes from a
                    // remote page, so strip anything that could leave workingDir.
                    File saveAs = new File(this.workingDir, prefix + sanitizeFileName(m.group(1)));
                    addURLToDownload(new URL(imgsrc), saveAs);
                }
                else {
                    // Provide prefix and let the AbstractRipper "guess" the filename
                    addURLToDownload(new URL(imgsrc), prefix);
                }
            } catch (IOException e) {
                logger.error("[!] Exception while loading/parsing " + this.url, e);
            }
        }
    }
}
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`package com.rarchives.ripme.ripper.rippers;`

Fix ehentai "image.php" filenames. Closes #37 2014-05-14 07:40:47 +02:00			`import java.io.File;`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`import java.io.IOException;`
			`import java.net.MalformedURLException;`
			`import java.net.URL;`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`import java.util.ArrayList;`
Unifying external page requests to a single method 2014-06-20 13:09:36 +02:00			`import java.util.HashMap;`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`import java.util.List;`
Unifying external page requests to a single method 2014-06-20 13:09:36 +02:00			`import java.util.Map;`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`import java.util.regex.Matcher;`
			`import java.util.regex.Pattern;`

			`import org.jsoup.nodes.Document;`
			`import org.jsoup.nodes.Element;`
			`import org.jsoup.select.Elements;`

Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`import com.rarchives.ripme.ripper.AbstractHTMLRipper;`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`import com.rarchives.ripme.ripper.DownloadThreadPool;`
			`import com.rarchives.ripme.ui.RipStatusMessage.STATUS;`
Using new wrapper for HTTP requests, started abstract classes to simplify rippers 2014-06-22 02:08:42 +02:00			`import com.rarchives.ripme.utils.Http;`
1.0.46 - Auto-indexing images is now a config option Files saved with auto-indexing are numbered 001_, 002_, etc This can now be toggled off via a config switch. Should close #44 2014-05-26 09:31:58 +02:00			`import com.rarchives.ripme.utils.Utils;`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`public class EHentaiRipper extends AbstractHTMLRipper {`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`// All sleep times are in milliseconds`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`private static final int PAGE_SLEEP_TIME = 3000;`
			`private static final int IMAGE_SLEEP_TIME = 1500;`
			`private static final int IP_BLOCK_SLEEP_TIME = 60 * 1000;`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`private String lastURL = null;`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`// Thread pool for finding direct image links from "image" pages (html)`
			`private DownloadThreadPool ehentaiThreadPool = new DownloadThreadPool("ehentai");`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`@Override`
			`public DownloadThreadPool getThreadPool() {`
			`return ehentaiThreadPool;`
			`}`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00
			`// Current HTML document`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`private Document albumDoc = null;`
removed the unused g subdomain from the ehentai ripper (#453) 2017-02-22 07:24:52 +01:00
Update to Java 8 * Changed the Maven target to 1.8 * Performed a preliminary cleanup using IntelliJ's Code Analysis (Only Java 7/8 updates and a few other entries in the Error and Warnings categories) * Updated the readme to change the required Java version 2017-10-24 16:33:28 +02:00			`private static final Map<String,String> cookies = new HashMap<>();`
Unifying external page requests to a single method 2014-06-20 13:09:36 +02:00			`static {`
			`cookies.put("nw", "1");`
			`cookies.put("tip", "1");`
			`}`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00
			`public EHentaiRipper(URL url) throws IOException {`
			`super(url);`
			`}`

			`@Override`
			`public String getHost() {`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`return "e-hentai";`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`}`
removed the unused g subdomain from the ehentai ripper (#453) 2017-02-22 07:24:52 +01:00
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`@Override`
			`public String getDomain() {`
removed the unused g subdomain from the ehentai ripper (#453) 2017-02-22 07:24:52 +01:00			`return "e-hentai.org";`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`}`

			`public String getAlbumTitle(URL url) throws MalformedURLException {`
			`try {`
			`// Attempt to use album title as GID`
			`if (albumDoc == null) {`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`albumDoc = getPageWithRetries(url);`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`}`
			`Elements elems = albumDoc.select("#gn");`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`return getHost() + "_" + elems.first().text();`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`} catch (Exception e) {`
			`// Fall back to default album naming convention`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`logger.warn("Failed to get album title from " + url, e);`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`}`
			`return super.getAlbumTitle(url);`
			`}`

			`@Override`
			`public String getGID(URL url) throws MalformedURLException {`
			`Pattern p;`
			`Matcher m;`

removed the unused g subdomain from the ehentai ripper (#453) 2017-02-22 07:24:52 +01:00			`p = Pattern.compile("^https?://e-hentai\\.org/g/([0-9]+)/([a-fA-F0-9]+)/$");`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`m = p.matcher(url.toExternalForm());`
			`if (m.matches()) {`
Fixing ehentai regex for #41 2014-05-14 07:56:02 +02:00			`return m.group(1) + "-" + m.group(2);`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`}`

			`throw new MalformedURLException(`
removed the unused g subdomain from the ehentai ripper (#453) 2017-02-22 07:24:52 +01:00			`"Expected e-hentai.org gallery format: "`
			`+ "http://e-hentai.org/g/####/####/"`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`+ " Got: " + url);`
			`}`
removed the unused g subdomain from the ehentai ripper (#453) 2017-02-22 07:24:52 +01:00
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`/**`
			`* Attempts to get page, checks for IP ban, waits.`
			`* @param url`
			`* @return Page document`
			`* @throws IOException If page loading errors, or if retries are exhausted`
			`*/`
			`private Document getPageWithRetries(URL url) throws IOException {`
			`Document doc;`
			`int retries = 3;`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`while (true) {`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`sendUpdate(STATUS.LOADING_RESOURCE, url.toExternalForm());`
			`logger.info("Retrieving " + url);`
			`doc = Http.url(url)`
			`.referrer(this.url)`
			`.cookies(cookies)`
			`.get();`
			`if (doc.toString().contains("IP address will be automatically banned")) {`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`if (retries == 0) {`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`throw new IOException("Hit rate limit and maximum number of retries, giving up");`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`}`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`logger.warn("Hit rate limit while loading " + url + ", sleeping for " + IP_BLOCK_SLEEP_TIME + "ms, " + retries + " retries remaining");`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`retries--;`
			`try {`
			`Thread.sleep(IP_BLOCK_SLEEP_TIME);`
			`} catch (InterruptedException e) {`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`throw new IOException("Interrupted while waiting for rate limit to subside");`
1.0.55 - Ehentai ripper bypasses content warning Closes #57 2014-06-07 10:05:30 +02:00			`}`
1.0.47 - E-hentai: URL validation, logs more info For troubleshooting #41 2014-05-26 11:13:56 +02:00			`}`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`else {`
			`return doc;`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`}`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`}`
			`}`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`@Override`
			`public Document getFirstPage() throws IOException {`
			`if (albumDoc == null) {`
			`albumDoc = getPageWithRetries(this.url);`
			`}`
			`this.lastURL = this.url.toExternalForm();`
			`return albumDoc;`
			`}`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`@Override`
			`public Document getNextPage(Document doc) throws IOException {`
			`// Check if we've stopped`
			`if (isStopped()) {`
			`throw new IOException("Ripping interrupted");`
			`}`
			`// Find next page`
			`Elements hrefs = doc.select(".ptt a");`
			`if (hrefs.size() == 0) {`
			`logger.info("doc: " + doc.html());`
			`throw new IOException("No navigation links found");`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`}`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`// Ensure next page is different from the current page`
			`String nextURL = hrefs.last().attr("href");`
			`if (nextURL.equals(this.lastURL)) {`
			`logger.info("lastURL = nextURL : " + nextURL);`
			`throw new IOException("Reached last page of results");`
			`}`
			`// Sleep before loading next page`
			`sleep(PAGE_SLEEP_TIME);`
			`// Load next page`
			`Document nextPage = getPageWithRetries(new URL(nextURL));`
			`this.lastURL = nextURL;`
			`return nextPage;`
			`}`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`@Override`
			`public List<String> getURLsFromPage(Document page) {`
Update to Java 8 * Changed the Maven target to 1.8 * Performed a preliminary cleanup using IntelliJ's Code Analysis (Only Java 7/8 updates and a few other entries in the Error and Warnings categories) * Updated the readme to change the required Java version 2017-10-24 16:33:28 +02:00			`List<String> imageURLs = new ArrayList<>();`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`Elements thumbs = page.select("#gdt > .gdtm a");`
			`// Iterate over images on page`
			`for (Element thumb : thumbs) {`
			`imageURLs.add(thumb.attr("href"));`
			`}`
			`return imageURLs;`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`}`

Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`@Override`
			`public void downloadURL(URL url, int index) {`
			`EHentaiImageThread t = new EHentaiImageThread(url, index, this.workingDir);`
			`ehentaiThreadPool.addThread(t);`
			`try {`
			`Thread.sleep(IMAGE_SLEEP_TIME);`
			`}`
			`catch (InterruptedException e) {`
			`logger.warn("Interrupted while waiting to load next image", e);`
			`}`
implemented ripper for EHentai galleries 2014-05-08 20:31:29 +02:00			`}`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00
			`/**`
			`* Helper class to find and download images found on "image" pages`
removed the unused g subdomain from the ehentai ripper (#453) 2017-02-22 07:24:52 +01:00			`*`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`* Handles case when site has IP-banned the user.`
			`*/`
			`private class EHentaiImageThread extends Thread {`
			`private URL url;`
			`private int index;`
			`private File workingDir;`

Update to Java 8 * Changed the Maven target to 1.8 * Performed a preliminary cleanup using IntelliJ's Code Analysis (Only Java 7/8 updates and a few other entries in the Error and Warnings categories) * Updated the readme to change the required Java version 2017-10-24 16:33:28 +02:00			`EHentaiImageThread(URL url, int index, File workingDir) {`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`super();`
			`this.url = url;`
			`this.index = index;`
			`this.workingDir = workingDir;`
			`}`

			`@Override`
			`public void run() {`
			`fetchImage();`
			`}`
removed the unused g subdomain from the ehentai ripper (#453) 2017-02-22 07:24:52 +01:00
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00			`private void fetchImage() {`
			`try {`
Moving from MultiPage ripper to HTML ripper, added JSON ripper 2014-06-23 04:12:29 +02:00			`Document doc = getPageWithRetries(this.url);`
1.0.49 - Ehentai ripper revamped For #41: * Multi-threading * Longer wait periods * Rate-limit checks & retries * New method for retrieving image from page 2014-06-01 08:53:35 +02:00
			`// Find image`
			`Elements images = doc.select(".sni > a > img");`
			`if (images.size() == 0) {`
			`// Attempt to find image elsewise (Issue #41)`
			`images = doc.select("img#img");`
			`if (images.size() == 0) {`
			`logger.warn("Image not found at " + this.url);`
			`return;`
			`}`
			`}`
			`Element image = images.first();`
			`String imgsrc = image.attr("src");`
			`logger.info("Found URL " + imgsrc + " via " + images.get(0));`
			`Pattern p = Pattern.compile("^http://.*/ehg/image.php.*&n=([^&]+).*$");`
			`Matcher m = p.matcher(imgsrc);`
			`if (m.matches()) {`
			`// Manually discover filename from URL`
			`String savePath = this.workingDir + File.separator;`
			`if (Utils.getConfigBoolean("download.save_order", true)) {`
			`savePath += String.format("%03d_", index);`
			`}`
			`savePath += m.group(1);`
			`addURLToDownload(new URL(imgsrc), new File(savePath));`
			`}`
			`else {`
			`// Provide prefix and let the AbstractRipper "guess" the filename`
			`String prefix = "";`
			`if (Utils.getConfigBoolean("download.save_order", true)) {`
			`prefix = String.format("%03d_", index);`
			`}`
			`addURLToDownload(new URL(imgsrc), prefix);`
			`}`
			`} catch (IOException e) {`
			`logger.error("[!] Exception while loading/parsing " + this.url, e);`
			`}`
			`}`
			`}`
removed the unused g subdomain from the ehentai ripper (#453) 2017-02-22 07:24:52 +01:00			`}`