2022-02-21 01:10:57 -06:00
|
|
|
import aiohttp
|
|
|
|
import tldextract
|
|
|
|
import lightbulb
|
|
|
|
import pysaucenao
|
|
|
|
|
|
|
|
import config as c
|
|
|
|
|
|
|
|
|
2022-02-21 14:53:53 -06:00
|
|
|
plugin = lightbulb.Plugin("scraper")
|
|
|
|
sauce = pysaucenao.SauceNao(api_key=c.config["saucenao"], priority=(29, 40, 41)) # e621 > Fur Affinity > Twitter
|
2022-02-21 01:10:57 -06:00
|
|
|
|
|
|
|
|
2022-03-03 23:59:46 -06:00
|
|
|
# Return list of matches
|
2022-02-21 01:10:57 -06:00
|
|
|
async def reverse(urls):
|
2022-02-21 13:43:53 -06:00
|
|
|
return [await _saucenao(url) or await _kheina(url) for url in urls]
|
2022-02-21 01:10:57 -06:00
|
|
|
|
2022-02-21 14:53:53 -06:00
|
|
|
|
2022-02-21 01:10:57 -06:00
|
|
|
async def _saucenao(url):
|
|
|
|
try:
|
|
|
|
results = await sauce.from_url(url)
|
|
|
|
except pysaucenao.FileSizeLimitException:
|
|
|
|
raise pysaucenao.FileSizeLimitException(url)
|
|
|
|
except pysaucenao.ImageSizeException:
|
|
|
|
raise pysaucenao.ImageSizeException(url)
|
|
|
|
except pysaucenao.InvalidImageException:
|
|
|
|
raise pysaucenao.InvalidImageException(url)
|
|
|
|
|
2022-02-21 14:53:53 -06:00
|
|
|
return (
|
|
|
|
{
|
|
|
|
"url": results[0].url,
|
2022-02-23 16:20:59 -06:00
|
|
|
"artist": results[0].title
|
|
|
|
if results[0].author_name == "Unknown"
|
|
|
|
else ", ".join(results[0].authors) or "Unknown",
|
2022-02-21 14:53:53 -06:00
|
|
|
"thumbnail": results[0].thumbnail,
|
|
|
|
"similarity": round(results[0].similarity),
|
|
|
|
"source": tldextract.extract(results[0].index).domain,
|
|
|
|
}
|
|
|
|
if results
|
|
|
|
else None
|
|
|
|
)
|
|
|
|
|
2022-02-21 01:10:57 -06:00
|
|
|
|
|
|
|
async def _kheina(url):
|
2022-02-21 14:53:53 -06:00
|
|
|
content = await _post("https://api.kheina.com/v1/search", {"url": url})
|
2022-02-21 13:43:53 -06:00
|
|
|
|
2022-02-21 14:53:53 -06:00
|
|
|
if content["results"][0]["similarity"] < 50:
|
2022-02-21 13:43:53 -06:00
|
|
|
return None
|
|
|
|
|
|
|
|
return {
|
2022-02-21 14:53:53 -06:00
|
|
|
"url": content["results"][0]["sources"][0]["source"],
|
|
|
|
"artist": content["results"][0]["sources"][0]["artist"] or "Unknown",
|
2022-02-23 17:47:12 -06:00
|
|
|
"thumbnail": f"https://cdn.kheina.com/file/kheinacom/{content['results'][0]['sources'][0]['sha1']}.jpg",
|
2022-02-21 14:53:53 -06:00
|
|
|
"similarity": round(content["results"][0]["similarity"]),
|
|
|
|
"source": tldextract.extract(content["results"][0]["sources"][0]["source"]).domain,
|
2022-02-21 13:43:53 -06:00
|
|
|
}
|
2022-02-21 01:10:57 -06:00
|
|
|
|
2022-02-21 14:53:53 -06:00
|
|
|
|
2022-02-21 13:43:53 -06:00
|
|
|
async def _post(url, data):
|
2022-02-21 01:10:57 -06:00
|
|
|
async with aiohttp.ClientSession() as session:
|
2022-02-22 13:11:35 -06:00
|
|
|
async with session.post(url, data=data) as response:
|
2022-02-21 01:10:57 -06:00
|
|
|
return await response.json() if response.status == 200 else None
|
|
|
|
|
|
|
|
|
|
|
|
def load(bot):
|
|
|
|
bot.add_plugin(plugin)
|
2022-02-21 14:53:53 -06:00
|
|
|
|
|
|
|
|
2022-02-21 01:10:57 -06:00
|
|
|
def unload(bot):
|
|
|
|
bot.remove_plugin(plugin)
|