proof of concept

This commit is contained in:
Bryan Bailey
2019-11-07 10:21:56 -05:00
commit fbcf6769ce
25 changed files with 258 additions and 0 deletions

0
app/panelrip/__init__.py Normal file
View File

47
app/panelrip/ripper.py Normal file
View File

@@ -0,0 +1,47 @@
import os
import urllib.request
from bs4 import BeautifulSoup
def get_soup_obj(url, headers):
req = urllib.request.Request(url, headers=headers)
raw = urllib.request.urlopen(req)
return BeautifulSoup(raw, 'html.parser')
def get_title(soup):
''' Grab the title element string from a Beautiful Soup object
removing the last 45 garbage characters'''
comic_title = soup.title.string.replace('Read All Comics Online For Free', '').replace('', '').replace('|', '')
return comic_title.strip()
def get_img_links(soup):
images = []
for link in soup.findAll('a'):
if not link.has_attr('href'):
img = link.img['src']
images.append(img)
return images
def download_img_links(links, soup, folder, title=None):
# test to see if the folder exists
if title is None:
print('No title specified\ncreating from reqest')
title = get_title(soup)
# if it doesn't, create it
if not os.path.exists(os.path.join(folder, title)):
os.makedirs(os.path.join(folder, title), mode=0o777)
print('Folder {} created...'.format(os.path.join(folder, title)))
# retrieve files from server
for link in links:
opener = urllib.request.build_opener()
opener.addheaders = [('User-agent', 'Mozilla/5.0')]
urllib.request.install_opener(opener)
print('Downloading file {} from {}'.format((link[-6:] if link[-11:-4] != '%2Bcopy' else (link[-13:-11] + link[-4:]) ), title))
urllib.request.urlretrieve(link, filename=os.path.join(folder + '/' + title, title + ' 0' + (link[-6:] if link[-11:-4] != '%2Bcopy' else (link[-13:-11] + link[-4:]) )))
print("Download Complete!")

15
app/panelrip/zipper.py Normal file
View File

@@ -0,0 +1,15 @@
import os
import shutil
import zipfile
basedir = os.path.dirname(__file__)
def create_comic_archive(title, folder):
print('Creating comic archive: {}.cbr'.format(title))
output = shutil.make_archive(title, 'zip', folder)
os.rename(output, os.path.join(folder, title +'.cbr'))
print('Performing folder cleanup...')
for img in os.listdir(folder):
if not img.endswith('.cbr'):
os.remove(os.path.join(folder, img))