1
0
mirror of https://github.com/RipMeApp/ripme.git synced 2025-08-15 10:24:04 +02:00

Add Ripper for nsfwalbum.com (#1691)

I've gone ahead and added a ripper for nsfwalbum.com.
They host their images on many different image hosting sites, so you must replace part of each image URL to get the full image instead of the thumbnail.
There may be more hosts that I did not find; they can easily be added later.
This commit is contained in:
Issung
2025-01-04 21:11:15 +11:00
committed by MetaPrime
parent ba76d3d8b8
commit c1e805d214

View File

@@ -0,0 +1,108 @@
package com.rarchives.ripme.ripper.rippers;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.regex.Pattern;
import java.io.IOException;
import java.net.MalformedURLException;
import java.net.URL;
import java.util.ArrayList;
import java.util.List;
import java.util.regex.Matcher;
import org.jsoup.*;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;
import com.rarchives.ripme.ripper.AbstractHTMLRipper;
import com.rarchives.ripme.utils.Http;
//https://github.com/ripmeapp/ripme/wiki/How-To-Create-A-Ripper-for-HTML-websites
/**
 * Ripper for albums hosted on nsfwalbum.com.
 *
 * <p>Album pages reference thumbnails served by several third-party image
 * hosts. Each thumbnail URL is rewritten into the corresponding full-size
 * image URL using the host-specific rules in
 * {@link #toFullResolutionUrl(String)}; thumbnails from hosts without a rule
 * are skipped.
 */
public class NsfwAlbumRipper extends AbstractHTMLRipper {
    private static final String HOST = "nsfwalbum";
    private static final String DOMAIN = "nsfwalbum.com";

    /**
     * Matches an album URL and captures the numeric album id in group 1.
     * Anchored at the start so that digits elsewhere in an unrelated URL are
     * never mistaken for an album id.
     */
    private static final Pattern ALBUM_URL_PATTERN = Pattern.compile(
            "^https?://(?:www\\.)?" + Pattern.quote(DOMAIN) + "/album/(\\d+)",
            Pattern.CASE_INSENSITIVE);

    /**
     * Creates a ripper for the given album URL.
     *
     * @param url the album URL to rip
     * @throws IOException if the superclass constructor fails
     */
    public NsfwAlbumRipper(URL url) throws IOException {
        super(url);
    }

    /** @return the short host name of the site handled by this ripper */
    @Override
    public String getHost() {
        return HOST;
    }

    /** @return the domain of the site handled by this ripper */
    @Override
    public String getDomain() {
        return DOMAIN;
    }

    /**
     * Extracts the numeric album id from an album URL.
     *
     * @param url the URL to inspect
     * @return the album id, i.e. the digits following {@code /album/}
     * @throws MalformedURLException if the URL is not of the form
     *         {@code https://nsfwalbum.com/album/<albumid>}
     */
    @Override
    public String getGID(URL url) throws MalformedURLException {
        Matcher matcher = ALBUM_URL_PATTERN.matcher(url.toExternalForm());
        if (matcher.find()) {
            return matcher.group(1);
        }
        throw new MalformedURLException(
                "Expected URL format https://nsfwalbum.com/album/albumid - got " + url + " instead.");
    }

    /**
     * Fetches the album page.
     *
     * @return the parsed document for this ripper's URL
     * @throws IOException if the page cannot be retrieved
     */
    @Override
    public Document getFirstPage() throws IOException {
        return Http.url(url).get();
    }

    /**
     * Collects full-resolution image URLs from an album page.
     *
     * @param doc the album page
     * @return the rewritten image URLs, in document order; thumbnails whose
     *         host is not recognised are omitted
     */
    @Override
    public List<String> getURLsFromPage(Document doc) {
        List<String> results = new ArrayList<>();
        Elements imgs = doc.select(".album img");
        System.out.println(imgs.size() + " elements (thumbnails) found.");
        for (Element img : imgs) {
            // The thumbnail address is read from "data-src"; attr() yields an
            // empty string when the attribute is absent, which matches no host.
            String fullResURL = toFullResolutionUrl(img.attr("data-src"));
            if (fullResURL != null) {
                results.add(fullResURL);
            }
        }
        return results;
    }

    /**
     * Rewrites a thumbnail URL into the full-size image URL for the hosts
     * this ripper knows about.
     *
     * @param thumbURL the thumbnail URL taken from the album page
     * @return the full-size image URL, or {@code null} if the host is not
     *         one of the recognised image hosts
     */
    private static String toFullResolutionUrl(String thumbURL) {
        if (thumbURL.contains("imgspice.com")) {
            return thumbURL.replace("_t.jpg", ".jpg");
        }
        if (thumbURL.contains("imagetwist.com")) {
            return thumbURL.replace("/th/", "/i/");
        }
        // NOTE(review): confirm "pixhost.com" is the host string that actually
        // appears in thumbnail URLs for this image host.
        if (thumbURL.contains("pixhost.com")) {
            // Both the sub-domain prefix and the path segment differ between
            // thumbnail and full-size URLs.
            return thumbURL.replace("https://t", "https://img")
                    .replace("/thumbs/", "/images/");
        }
        if (thumbURL.contains("imx.to")) {
            return thumbURL.replace("/t/", "/i/");
        }
        return null;
    }

    /**
     * Queues a single image for download.
     *
     * @param url the image URL
     * @param index the position of the image in the album (unused)
     */
    @Override
    public void downloadURL(URL url, int index) {
        addURLToDownload(url);
    }
}