import requests | |||||
from libs.scrapper.scrappersites import imgur, reddit, gfy, tumblr | from libs.scrapper.scrappersites import imgur, reddit, gfy, tumblr | ||||
# NOTE(review): these lines are a side-by-side diff rendering, not runnable
# Python. Each line carries one or two copies of a statement separated by "|"
# column markers, and the original indentation has been lost.
# The visible statements describe a `scrapper` class with a no-op constructor,
# a `linkget` method and a `retriveurl` method.
class scrapper(): | class scrapper(): | ||||
def __init__(self): | def __init__(self): | ||||
pass | pass | ||||
# NOTE(review): `get` has a header but no visible body and is followed directly
# by two other method headers; presumably one side of the diff renamed it to
# `retriveurl` -- confirm against the real file.
def get(self, url): | |||||
# linkget: requests https://reddit.com/r/<subreddit>.json with a custom
# User-agent header and returns the ["data"]["children"] entry of the decoded
# JSON body. The local name `reddit` shadows the imported `reddit` module
# inside this method only.
def linkget(self, subreddit): | |||||
html = requests.get("https://reddit.com/r/"+subreddit+".json", headers = {'User-agent': 'RoxBot Discord Bot'}) | |||||
reddit = html.json()["data"]["children"] | |||||
return reddit | |||||
# retriveurl: starts from an empty string and hands `url` to a site-specific
# helper chosen by substring match, then returns the helper's result.
def retriveurl(self, url): | |||||
url2 = "" | url2 = "" | ||||
# URLs containing "imgur" go to imgur.imgur().get(url).
if "imgur" in url: | if "imgur" in url: | ||||
url2 = imgur.imgur().get(url) | url2 = imgur.imgur().get(url) | ||||
# NOTE(review): the reddit assignment below has no visible condition; the
# branch header(s) between the imgur and tumblr cases appear to be missing
# from this view -- TODO confirm before relying on this ordering.
url2 = reddit.reddit().get(url) | url2 = reddit.reddit().get(url) | ||||
# URLs containing "media.tumblr" go to tumblr.tumblr().get(url).
elif "media.tumblr" in url: | elif "media.tumblr" in url: | ||||
url2 = tumblr.tumblr().get(url) | url2 = tumblr.tumblr().get(url) | ||||
# NOTE(review): the same return statement appears on two consecutive lines;
# presumably the old and new sides of one changed line -- confirm.
return url2 | |||||
return url2 |
class eroshare():
    """Placeholder class that currently defines only a no-op constructor."""

    def __init__(self):
        """Create an instance; there is no state to initialize."""
        pass
import requests | import requests | ||||
import os | |||||
import wget | |||||
from bs4 import BeautifulSoup | from bs4 import BeautifulSoup | ||||
# NOTE(review): these lines are a side-by-side diff rendering, not runnable
# Python; statements are duplicated across "|" column markers and indentation
# is lost. The method header and the leading `if` that this `elif` belongs to
# are not visible here.
class imgur(): | class imgur(): | ||||
# Branch taken when the second-to-last "/"-separated segment of `url` is "a"
# (presumably an imgur album link -- confirm).
elif url.split("/")[-2] == "a": | elif url.split("/")[-2] == "a": | ||||
# Download the page and parse it with BeautifulSoup's built-in html.parser.
page = requests.get(url) | page = requests.get(url) | ||||
soup = BeautifulSoup(page.content, 'html.parser') | soup = BeautifulSoup(page.content, 'html.parser') | ||||
# NOTE(review): the accumulator appears twice, once as `list` and once as
# `links`; presumably the two sides of a rename that stops shadowing the
# built-in `list` -- confirm which side is current.
list = [] | |||||
links = [] | |||||
# Collect each distinct <img> src that contains "imgur".
for img in soup.find_all("img"): | for img in soup.find_all("img"): | ||||
if "imgur" in img["src"]: | if "imgur" in img["src"]: | ||||
if not img["src"] in list: | |||||
list.append(img["src"]) | |||||
if len(list) > 1: | |||||
if not img["src"] in links: | |||||
links.append(img["src"]) | |||||
if len(links) > 1: | |||||
# More than one distinct image collected: return False; otherwise return the
# first collected src. NOTE(review): with indentation lost it is unclear
# whether this check runs inside or after the loop -- confirm.
return False | return False | ||||
else: | else: | ||||
return list[0] | |||||
return links[0] |
class tumblr():
    """Link handler whose ``get`` passes the given URL through untouched."""

    def get(self, url):
        """Return ``url`` exactly as it was received.

        Args:
            url: The link to resolve.

        Returns:
            The same ``url`` object, unmodified.
        """
        return url