From e9bee91aba119d2a5fffe50f02ace9dab3d8e6dc Mon Sep 17 00:00:00 2001 From: 4pr0n Date: Sun, 1 Jun 2014 01:26:35 -0700 Subject: [PATCH] 1.0.50 - Smutty.com ripper --- pom.xml | 2 +- .../ripper/rippers/ImagestashRipper.java | 1 - .../ripme/ripper/rippers/SmuttyRipper.java | 113 ++++++++++++++++++ .../com/rarchives/ripme/ui/UpdateUtils.java | 2 +- 4 files changed, 115 insertions(+), 3 deletions(-) create mode 100644 src/main/java/com/rarchives/ripme/ripper/rippers/SmuttyRipper.java diff --git a/pom.xml b/pom.xml index 75bfff8ce..b57558a6c 100644 --- a/pom.xml +++ b/pom.xml @@ -4,7 +4,7 @@ com.rarchives.ripme ripme jar - 1.0.49 + 1.0.50 ripme http://rip.rarchives.com diff --git a/src/main/java/com/rarchives/ripme/ripper/rippers/ImagestashRipper.java b/src/main/java/com/rarchives/ripme/ripper/rippers/ImagestashRipper.java index f666ce21a..321779692 100644 --- a/src/main/java/com/rarchives/ripme/ripper/rippers/ImagestashRipper.java +++ b/src/main/java/com/rarchives/ripme/ripper/rippers/ImagestashRipper.java @@ -27,7 +27,6 @@ public ImagestashRipper(URL url) throws IOException { } public boolean canRip(URL url) { - System.err.println(url.getHost() +"/"+DOMAIN); return url.getHost().equals(DOMAIN); } diff --git a/src/main/java/com/rarchives/ripme/ripper/rippers/SmuttyRipper.java b/src/main/java/com/rarchives/ripme/ripper/rippers/SmuttyRipper.java new file mode 100644 index 000000000..2edfd0392 --- /dev/null +++ b/src/main/java/com/rarchives/ripme/ripper/rippers/SmuttyRipper.java @@ -0,0 +1,113 @@ +package com.rarchives.ripme.ripper.rippers; + +import java.io.IOException; +import java.net.MalformedURLException; +import java.net.URL; +import java.util.regex.Matcher; +import java.util.regex.Pattern; + +import org.apache.log4j.Logger; +import org.jsoup.Jsoup; +import org.jsoup.nodes.Document; +import org.jsoup.nodes.Element; + +import com.rarchives.ripme.ripper.AlbumRipper; +import com.rarchives.ripme.ui.RipStatusMessage.STATUS; + +public class SmuttyRipper extends AlbumRipper { + + private static final String DOMAIN = "smutty.com", + HOST = "smutty"; + private static final Logger logger = Logger.getLogger(SmuttyRipper.class); + + public SmuttyRipper(URL url) throws IOException { + super(url); + } + + @Override + public boolean canRip(URL url) { + return (url.getHost().endsWith(DOMAIN)); + } + + @Override + public URL sanitizeURL(URL url) throws MalformedURLException { + return url; + } + + @Override + public void rip() throws IOException { + int page = 0; + String url, tag = getGID(this.url); + boolean hasNextPage = true; + while (hasNextPage) { + page++; + url = "http://smutty.com/h/" + tag + "/?q=%23" + tag + "&page=" + page + "&sort=date&lazy=1"; + this.sendUpdate(STATUS.LOADING_RESOURCE, url); + logger.info(" Retrieving " + url); + Document doc; + try { + doc = Jsoup.connect(url) + .userAgent(USER_AGENT) + .ignoreContentType(true) + .get(); + } catch (IOException e) { + if (e.toString().contains("Status=404")) { + logger.info("No more pages to load"); + } else { + logger.warn("Exception while loading " + url, e); + } + break; + } + for (Element image : doc.select("a.l > img")) { + String imageUrl = image.attr("src"); + + // Construct direct link to image based on thumbnail + StringBuilder sb = new StringBuilder(); + String[] fields = imageUrl.split("/"); + for (int i = 0; i < fields.length; i++) { + if (i == fields.length - 2 && fields[i].equals("m")) { + fields[i] = "b"; + } + sb.append(fields[i]); + if (i < fields.length - 1) { + sb.append("/"); + } + } + imageUrl = sb.toString(); + addURLToDownload(new URL(imageUrl)); + } + if (doc.select("#next").size() == 0) { + break; // No more pages + } + // Wait before loading next page + try { + Thread.sleep(1000); + } catch (InterruptedException e) { + logger.error("[!] Interrupted while waiting to load next album:", e); + break; + } + } + waitForThreads(); + } + + @Override + public String getHost() { + return HOST; + } + + @Override + public String getGID(URL url) throws MalformedURLException { + Pattern p = Pattern.compile("^https?://smutty\\.com/h/([a-zA-Z0-9\\-_]+).*$"); + Matcher m = p.matcher(url.toExternalForm()); + if (m.matches()) { + return m.group(1); + } + p = Pattern.compile("^https?://[wm.]*smutty\\.com/search/\\?q=([a-zA-Z0-9\\-_%]+).*$"); + m = p.matcher(url.toExternalForm()); + if (m.matches()) { + return m.group(1).replace("%23", ""); + } + throw new MalformedURLException("Expected tag in URL (smutty.com/h/tag and not " + url); + } + +} diff --git a/src/main/java/com/rarchives/ripme/ui/UpdateUtils.java b/src/main/java/com/rarchives/ripme/ui/UpdateUtils.java index 93c6d54f1..00d551da6 100644 --- a/src/main/java/com/rarchives/ripme/ui/UpdateUtils.java +++ b/src/main/java/com/rarchives/ripme/ui/UpdateUtils.java @@ -21,7 +21,7 @@ public class UpdateUtils { private static final Logger logger = Logger.getLogger(UpdateUtils.class); - private static final String DEFAULT_VERSION = "1.0.49"; + private static final String DEFAULT_VERSION = "1.0.50"; private static final String updateJsonURL = "http://rarchives.com/ripme.json"; private static final String updateJarURL = "http://rarchives.com/ripme.jar"; private static final String mainFileName = "ripme.jar";