From 1d0c7698e25139f8968b7e8ac66d38a753c07d76 Mon Sep 17 00:00:00 2001
From: MetaPrime
Date: Mon, 13 Jan 2025 14:01:49 -0800
Subject: [PATCH] Implement FapwizRipper

---
 .../ripme/ripper/rippers/FapwizRipper.java    | 137 ++++++++++++++++++
 .../tst/ripper/rippers/FapwizRipperTest.java  |  43 ++++++
 2 files changed, 180 insertions(+)
 create mode 100644 src/main/java/com/rarchives/ripme/ripper/rippers/FapwizRipper.java
 create mode 100644 src/test/java/com/rarchives/ripme/tst/ripper/rippers/FapwizRipperTest.java

diff --git a/src/main/java/com/rarchives/ripme/ripper/rippers/FapwizRipper.java b/src/main/java/com/rarchives/ripme/ripper/rippers/FapwizRipper.java
new file mode 100644
index 000000000..ad2013830
--- /dev/null
+++ b/src/main/java/com/rarchives/ripme/ripper/rippers/FapwizRipper.java
@@ -0,0 +1,137 @@
+package com.rarchives.ripme.ripper.rippers;
+
+import java.io.IOException;
+import java.net.MalformedURLException;
+import java.net.URL;
+import java.util.ArrayList;
+import java.util.List;
+import java.util.regex.Matcher;
+import java.util.regex.Pattern;
+
+import org.jsoup.nodes.Document;
+import org.apache.logging.log4j.LogManager;
+import org.apache.logging.log4j.Logger;
+import org.jsoup.nodes.Element;
+import org.jsoup.select.Elements;
+
+import com.rarchives.ripme.ripper.AbstractHTMLRipper;
+
+/**
+ * Ripper for fapwiz.com category listings, user listings and single posts.
+ *
+ * <p>Listing pages only expose thumbnails, so the video URL is derived from the
+ * thumbnail URL; post pages expose the video through a {@code <video><source>} tag.
+ */
+public class FapwizRipper extends AbstractHTMLRipper {
+
+    private static final Logger logger = LogManager.getLogger(FapwizRipper.class);
+
+    /** Scheme and host; the dot is escaped so it only matches a literal '.'. */
+    private static final String BASE = "https?://fapwiz\\.com/";
+
+    /** One path segment (category, user or post slug); digits include 0. */
+    private static final String SEGMENT = "([a-zA-Z0-9_-]+)";
+
+    private static final Pattern CATEGORY_PATTERN =
+            Pattern.compile(BASE + "category/" + SEGMENT + "/?$");
+
+    private static final Pattern USER_PATTERN =
+            Pattern.compile(BASE + SEGMENT + "/?$");
+
+    private static final Pattern POST_PATTERN =
+            Pattern.compile(BASE + SEGMENT + "/" + SEGMENT + "/?$");
+
+    private static final String THUMBNAIL_SUFFIX = "-thumbnail.jpg";
+    private static final String VIDEO_SUFFIX = ".mp4";
+
+    public FapwizRipper(URL url) throws IOException {
+        super(url);
+    }
+
+    @Override
+    public String getHost() {
+        return "fapwiz";
+    }
+
+    @Override
+    public String getDomain() {
+        return "fapwiz.com";
+    }
+
+    /**
+     * Builds the album id from the URL.
+     *
+     * @return {@code category_NAME}, {@code user_NAME} or {@code USER_POST}
+     * @throws MalformedURLException if the URL matches none of the supported layouts
+     */
+    @Override
+    public String getGID(URL url) throws MalformedURLException {
+        String externalForm = url.toExternalForm();
+        Matcher m;
+
+        m = CATEGORY_PATTERN.matcher(externalForm);
+        if (m.matches()) {
+            return "category_" + m.group(1);
+        }
+
+        m = USER_PATTERN.matcher(externalForm);
+        if (m.matches()) {
+            return "user_" + m.group(1);
+        }
+
+        m = POST_PATTERN.matcher(externalForm);
+        if (m.matches()) {
+            return m.group(1) + "_" + m.group(2);
+        }
+
+        throw new MalformedURLException("Expected fapwiz URL format: "
+                + "fapwiz.com/NAME - got " + url + " instead");
+    }
+
+    /**
+     * Collects the media URLs found on the page that was loaded for this ripper's URL.
+     *
+     * @param doc the parsed page
+     * @return the media URLs in document order; empty if nothing was found
+     */
+    @Override
+    public List<String> getURLsFromPage(Document doc) {
+        List<String> result = new ArrayList<>();
+        String pageUrl = url.toExternalForm();
+
+        // A category URL also satisfies POST_PATTERN ("category" reads as a user name),
+        // so the branches must be mutually exclusive with the listing check first.
+        if (CATEGORY_PATTERN.matcher(pageUrl).matches()
+                || USER_PATTERN.matcher(pageUrl).matches()) {
+            // Selector was written against user pages; category pages are assumed
+            // to share the same markup - TODO confirm.
+            Elements thumbnails = doc.select(".post-items-holder img");
+            for (Element thumbnail : thumbnails) {
+                // Replace -thumbnail.jpg with .mp4
+                addIfPresent(result,
+                        thumbnail.attr("src").replace(THUMBNAIL_SUFFIX, VIDEO_SUFFIX));
+            }
+        } else if (POST_PATTERN.matcher(pageUrl).matches()) {
+            for (Element source : doc.select("video source")) {
+                addIfPresent(result, source.attr("src"));
+            }
+        }
+
+        return result;
+    }
+
+    /** Adds {@code src} unless it is empty, which cannot be turned into a download URL. */
+    private void addIfPresent(List<String> urls, String src) {
+        if (src.isEmpty()) {
+            logger.debug("Skipping element without src on {}", url);
+            return;
+        }
+        urls.add(src);
+    }
+
+    @Override
+    public void downloadURL(URL url, int index) {
+        sleep(2000);
+        addURLToDownload(url, getPrefix(index));
+    }
+}
diff --git a/src/test/java/com/rarchives/ripme/tst/ripper/rippers/FapwizRipperTest.java b/src/test/java/com/rarchives/ripme/tst/ripper/rippers/FapwizRipperTest.java
new file mode 100644
index 000000000..7b417df75
--- /dev/null
+++ b/src/test/java/com/rarchives/ripme/tst/ripper/rippers/FapwizRipperTest.java
@@ -0,0 +1,43 @@
+package com.rarchives.ripme.tst.ripper.rippers;
+
+import java.io.IOException;
+import java.net.URI;
+import java.net.URISyntaxException;
+import java.net.URL;
+
+import com.rarchives.ripme.ripper.rippers.FapwizRipper;
+import org.junit.jupiter.api.Assertions;
+import org.junit.jupiter.api.Tag;
+import org.junit.jupiter.api.Test;
+
+public class FapwizRipperTest extends RippersTest {
+    @Test
+    @Tag("flaky")
+    public void testRip() throws IOException, URISyntaxException {
+        FapwizRipper ripper = new FapwizRipper(new URI("https://fapwiz.com/blowjob-bunny-puts-on-a-show/").toURL());
+        testRipper(ripper);
+    }
+
+    @Test
+    public void testGetGID() throws IOException, URISyntaxException {
+        // A single path segment is a user page, so the GID carries the "user_" prefix.
+        URL url = new URI("https://fapwiz.com/blowjob-bunny-puts-on-a-show/").toURL();
+        FapwizRipper ripper = new FapwizRipper(url);
+        Assertions.assertEquals("user_blowjob-bunny-puts-on-a-show", ripper.getGID(url));
+    }
+
+    @Test
+    public void testGetGIDCategory() throws IOException, URISyntaxException {
+        URL url = new URI("https://fapwiz.com/category/some-category/").toURL();
+        FapwizRipper ripper = new FapwizRipper(url);
+        Assertions.assertEquals("category_some-category", ripper.getGID(url));
+    }
+
+    @Test
+    public void testGetGIDPostWithZeroDigit() throws IOException, URISyntaxException {
+        // Slugs containing the digit 0 must be accepted.
+        URL url = new URI("https://fapwiz.com/user-10/post-2025/").toURL();
+        FapwizRipper ripper = new FapwizRipper(url);
+        Assertions.assertEquals("user-10_post-2025", ripper.getGID(url));
+    }
+}