#! /usr/bin/env python3.4
# Created by Cameron Gagnon
# Version: beta
# Contact: [email protected] or
#
# If you have any questions, comments or concerns,
# or improvements to this code,
# feel free to email me and we can go from there.
# I'd love to help anyone use this to make their
# desktop backgrounds always look awesome.
# If you're having trouble using this program,
# please reach out and I can try
# my best to help you out!
#
# This is under the GNU GPL V3 so use it
# and modify it however you want
#
# Inspiration for this program came from:
# http://goo.gl/729Qdg
# http://goo.gl/2MD8tZ
# Check 'em out and give 'em some love
#what to import
import praw
import sqlite3
import pprint
import argparse
import configparser
import json
import os
import subprocess
import re
import sys
import time
import urllib.request
import logging
import logging.handlers
from detools import wallpaper
from PIL import Image
from bs4 import BeautifulSoup
from socket import timeout
from urllib.error import HTTPError,URLError
from requests.exceptions import ConnectionError
from collections import OrderedDict
#sets up global var
USERAGENT = "Reddit wallpaper changer script:v1.0 /u/camerongagnon"
# MANY DEFAULT VALUES ARE DECLARED GLOBAL IN THE PARSE ARGUMENTS
# FUNCTION TO SET UP THE VALUES FOR THE RUN OF THE PROGRAM
# declared as global in functions so we can
# decrement MAXPOSTS when we encounter an img
# that does not meet the width/height requirements,
# since Cycle_wallpaper cycles through the list
# of images from 0 to MAXPOSTS
# make sure to have a file in the same directory with your username
# on the first line, and password on the second
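# For illustration only (the exact filename and location are whatever the
# rest of the program expects, not shown here), that credentials file would
# simply contain two lines:
#   your_reddit_username
#   your_reddit_password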
def main(argList = None):
image_list = []
try:
# preliminary functions
try:
if log:
pass
except NameError:
# likely occurs when log is not
# defined, so we must define it
Config_logging()
args = Parse_cmd_args(argList)
config = Config.config(args)
Database()
sql, cur = Database.connect_to_DB()
log.debug("made database connection")
r = Connected("https://www.reddit.com/.json")
# this is the main function that will download and parse
# the images
Main_photo_controller(r, image_list)
Cycle_wallpaper(image_list)
sql.close()
# this is printed for ease of use when viewing the debug file
log.debug("################################################"
"################################################\n")
Config.writeStatusBar("")
except KeyboardInterrupt:
log.info("CTRL + C entered from command line, exiting...")
Config.writeStatusBar("")
sql.close()
sys.exit(0)
except:
log.debug("Unknown error occured", exc_info = True)
####################################################################
### CLASS IMPLEMENTATIONS
####################################################################
class BaseImg():
def setAsWallpaper(self):
"""
Sets the image as the wallpaper. This is called toward the
end of the program, so image_name and save_location
should already be set.
"""
try:
# call wallpaper program to set the image as the
# wallpaper
print(Config.downloadLoc() + self.image_name)
wallpaper.set_wallpaper(self.save_location)
statusStr = "Wallpaper should be set to: %s " % (self.image_name)
Config.writeStatusBar(statusStr)
log.debug(statusStr)
# sets the last wallpaper to the config file
config = Config.file_found()
if config:
config.set('Last Wallpaper', 'Wallpaper', self.image_name)
with open('settings.conf', 'w') as configfile:
config.write(configfile)
except KeyboardInterrupt:
sys.exit(0)
except:
log.exception("Error setting wallpaper, it is likely the "
"file path is not 100% correct. Make sure "
"there is a foward slash at the end of the "
"path in the SETWALLPAPER variable.", exc_info=True)
sys.exit(1)
class Img(BaseImg):
"""
Creates an img instance for each post found when returning
content from reddit, encapsulates title, id, image name, etc.
into one container to operate on.
"""
def __init__(self, post):
self.setProperties(post)
def setProperties(self, post):
self.setTitle(post.title)
self.setPost(post.permalink)
self.setLink(post.url)
self.setID(post.id)
self.setNSFW(post.over_18)
def setImgName(self, image_name):
self.image_name = image_name
self.setSaveLoc()
def setTitle(self, title):
self.title = title
def setLink(self, link):
self.link = link
def setPost(self, post):
self.post = post
def setID(self, id):
self.id = id
def setNSFW(self, nsfw):
self.nsfw = nsfw
def setSaveLoc(self):
self.save_location = Config.downloadLoc() + str(self.image_name)
def formatImgName(self):
# finds last '/' in url
remove = self.link.rindex('/')
# returns only past the last '/'
self.image_name = self.link[remove + 1:]
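# For illustration: a link of 'https://i.imgur.com/abc123.jpg' (hypothetical)
# would yield image_name 'abc123.jpg'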
########################################################################
class SingleImg(Img):
"""
Downloads the image from the link manually entered by the user
"""
def __init__(self, link):
if link:
self.setLink(link)
flag = self.download(link)
if flag:
self.setAsWallpaper()
sql, cur = Database.connect_to_DB()
cur.execute('INSERT INTO oldposts (ImgName, ImgTitle,\
ImgLink, ImgPost) VALUES (?, ?, ?, ?)',
[self.image_name, self.title, self.link, self.link])
sql.commit()
def download(self, link):
""" Downloads the image to the save location """
try:
self.formatImgName()
self.setSaveLoc()
self.title = "User downloaded: " + self.image_name
except:
return False
# gets the pic download information
try:
picdl = urllib.request.Request(link, headers = {'User-Agent':USERAGENT})
except ValueError:
# probably an invalid url was passed in
return False
try:
picdl = urllib.request.urlopen(picdl, cafile = 'cacert.pem')
except urllib.error.HTTPError:
log.exception("Could not open the specified picture webpage!!\n",
exc_info = True)
Config.writeStatusBar("Error downloading %s" % link)
sys.exit(0)
log.info("Downloading: %s \n\t\t\t\t\t\t as: %s "\
"\n\t\t\t\t\t\t to: %s",
self.link, self.image_name, self.save_location)
Config.writeStatusBar("Downloading %s" % link)
try:
with open(self.save_location, "wb") as picfile:
picfile.write(picdl.read())
return True
except FileNotFoundError:
return False
#######################################################################
class DBImg(BaseImg):
"""
Creates an encapsulation of data about previously downloaded
images by looking it up in the database. This is called to create
the image list for the past pictures page in the GUI
"""
def __init__(self, image_name):
self.setLookUpInfo(image_name)
def setLookUpInfo(self, image_name):
sql, cur = Database.connect_to_DB()
try:
cur.execute('SELECT ImgTitle, ImgLink, ImgPost, Width, Height\
FROM oldposts WHERE ImgName=?',
[image_name])
result = cur.fetchone()
self.title = result[0]
self.link = result[1]
self.post = result[2]
self.width = result[3]
self.height = result[4]
self.image_name = image_name
self.save_location = Config.downloadLoc() + self.image_name
except (sqlite3.OperationalError, TypeError):
log.debug("Error occured in making a DBImg()")
def updateSaveLoc(self):
self.thumb_save_loc_C = Config.downloadLoc() + self.thumb_name_C
self.thumb_save_loc_P = Config.downloadLoc() + self.thumb_name_P
def strip_file_ext(self):
"""
Used to remove the .jpg or other ending from im.image_name
so that we can resave the thumbnail with .png
"""
index = self.image_name.rfind('.')
self.thumb_name = self.image_name[:index]
self.add_P()
self.add_C()
self.add_png()
def add_P(self):
self.thumb_name_P = self.thumb_name + "_P.png"
def add_C(self):
self.thumb_name_C = self.thumb_name + "_C.png"
def add_png(self):
"""
Appends the .png to the end of im.image_name to save the
thumbnail with .png
"""
self.thumb_name = self.thumb_name + ".png"
########################################################################
class PictureList():
"""
Returns information/list of images that have been downloaded
by the program for use in the GUI to display the past images
"""
def list_pics():
sql, cur = Database.connect_to_DB()
image_list = []
try:
cur.execute('SELECT * FROM oldposts')
except sqlite3.OperationalError:
# return an empty list so the caller has
# no objects to iterate over
log.debug("No images in database to select from currently")
return image_list
results = cur.fetchall()
for image in results:
pic = DBImg(image[1]) # image[1] is ImgName
image_list.append(pic)
return image_list
########################################################################
class AboutInfo():
_version = "1.0"
def version():
return AboutInfo._version
########################################################################
class Database():
def __init__(self):
"""
Creates the database if it does not exist already
"""
global cur
global sql
log.info("Accessing database for submission IDs")
sql, cur = Database.connect_to_DB()
# create image database
cur.execute('CREATE TABLE IF NOT EXISTS oldposts(ID TEXT,\
ImgName TEXT, ImgTitle TEXT, ImgLink TEXT,\
ImgPost TEXT, Width INT, Height INT)')
# commit dem changes yo
sql.commit()
# connects to the wallpaper.db which holds the image info
def connect_to_DB():
sql = sqlite3.connect('wallpaper.db')
cur = sql.cursor()
return sql, cur
#REQUIRES id of submission to insert
#MODIFIES database of id's already downloaded
#EFFECTS Inserts the submission id into the database after a
# successful download
def Insert_ImgDB(im):
log.debug("Data to insert\n\t\t\t\t\t\t id: %s"
"\n\t\t\t\t\t\t image_name: %s"
"\n\t\t\t\t\t\t title: %s"
"\n\t\t\t\t\t\t Post: %s"
"\n\t\t\t\t\t\t link: %s",
im.id, im.image_name, im.title, im.post, im.link)
cur.execute('INSERT INTO oldposts (ID, ImgName, ImgTitle,\
ImgPost, ImgLink) VALUES (?, ?, ?, ?, ?)',
[im.id, im.image_name, im.title, im.post, im.link])
sql.commit()
# REQUIRES: valid width/heights to be updated in DB
# MODIFIES: width and height of specified image
# EFFECTS: updates DB with width and height of image
def updateWH(im, width, height):
log.debug("Updating %s with width: %s and height: %s" %\
(im.image_name, width, height))
cur.execute('UPDATE oldposts SET Width=?, Height=? WHERE ImgName=?',
[width, height, im.image_name])
sql.commit()
# REQUIRES: valid name in oldposts
# MODIFIES: oldposts DB table
# EFFECTS: removes the image and its associated data from the
# database.
def del_img(image_name):
try:
sql, cur = Database.connect_to_DB()
log.debug("Deleting %s from database" % image_name)
cur.execute('DELETE FROM oldposts WHERE ImgName = ?', [image_name])
sql.commit()
except:
log.error("ERROR WHILE DELETING DB OBJECT", exc_info = True)
sys.exit(1)
###########################################################################
class Config():
"""
Values used to initiate the settings file.
"""
dir_ = os.path.expanduser("~") + "\\Pictures\\RedditPaper\\"
try:
# tries to create this directory, if it already exists
# then we're good to go
os.makedirs(dir_)
except FileExistsError:
pass
except:
# excepts any other error and creates an image folder
# in the directory where the program was downloaded to
dir_ = os.getcwd() + "\\Downloaded Images\\"
default_values = {'DWNLDLOC': dir_,
'MINWIDTH': 1024,
'MINHEIGHT': 768,
'SUBREDDITS': "futureporn+earthporn+"
"technologyporn+spaceporn+"
"imaginarystarscapes+lavaporn",
'CATEGORY': "hot",
'CYCLETIME' : 0.05,
'MAXPOSTS': 5,
'NSFW': False,
'WALLPAPER': '',
'STATUSBAR': ''
}
def config(args):
"""
Updates/creates the config file with the default/new values
determined by the dict that is passed in
"""
# split up the jumble of time to set the hr and min correctly
args['CYCLEHR'], args['CYCLEMIN']=Config.format_time(args['CYCLETIME'])
# convert NSFW from on/off to True/False
args['NSFW'] = Config.convert_NSFW(args['NSFW'])
config = configparser.ConfigParser()
config['Statusbar'] = OrderedDict([('Statusbar Text',
args['STATUSBAR'])])
config['Save Location'] = OrderedDict([('Directory',
args['DWNLDLOC'])])
config['Options'] = OrderedDict([('Minwidth', args['MINWIDTH']),
('Minheight', args['MINHEIGHT']),
('Subreddits', args['SUBREDDITS']),
('Category', args['CATEGORY']),
('Maxposts', args['MAXPOSTS'])])
config['Cycletime'] = OrderedDict([('Hours', args['CYCLEHR']),
('Minutes', args['CYCLEMIN'])])
config['Adult Content'] = OrderedDict([('NSFW', args['NSFW'])])
# this try/except is used because the cmdline args come through here
# and don't always contain the wallpaper argument, so it is not
# always provided
try:
config['Last Wallpaper'] = OrderedDict([('Wallpaper',
args['WALLPAPER'])])
except KeyError:
configParser = configparser.ConfigParser()
# this is cyclical because we must read the setting in order
# to reset it with the same value, as this file is rewritten
# on each call to this function. This is so we can pass one of
# two dictionaries to it without rewriting similar code.
# ^^CLArgs or DefaultValues
args['WALLPAPER'] = Config.lastImg()
config['Last Wallpaper'] = OrderedDict([('Wallpaper',
args['WALLPAPER'])])
with open('settings.conf', 'w') as configfile:
config.write(configfile)
log.debug("Set config file")
def convert_NSFW(nsfw):
log.debug("nsfw in convert is: %s " % nsfw)
if nsfw:
return True
return False
def format_time(time):
"""
Converts the minutes only time to hours and minutes for
use when updating the config file
"""
hr = float(time//60)
min_ = float(time % 60)
return hr, min_
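# For illustration: format_time(90) returns (1.0, 30.0), i.e. 1 hour 30 minutes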
def file_found():
"""
Returns the parsed config if settings.conf exists, otherwise returns False
"""
config = configparser.ConfigParser()
if config.read("settings.conf") == []:
log.debug("Settings.conf does not exist.")
return False
else:
return config
def read_config():
"""
Reads the values from the config file and also will call config if
a new file needs to be created. With the read in values, it passes
them to parse_cmd_args() to set as default values, since that is
the point of the config file.
"""
global URL
# create default config file if not created
config = Config.file_found()
# if the config file does not exist, create it
# and make sure config var is set to good parser
if not config:
log.debug("Creating configuration file")
Config.config(Config.default_values)
config = configparser.ConfigParser()
config.read('settings.conf')
# get values stored in settings.conf
args = {}
args['SUBREDDITS'] = config.get('Options', 'Subreddits',
fallback = "futureporn+wallpapers+lavaporn+"
"earthporn+imaginarystarscapes+spaceporn")
args['MINWIDTH'] = config.getint('Options', 'Minwidth', fallback = 1024)
args['MINHEIGHT'] = config.getint('Options', 'Minheight',
fallback = 768)
args['MAXPOSTS'] = config.getint('Options', 'Maxposts',
fallback = 5)
args['CYCLETIME'] = config.getfloat('Cycletime', 'Minutes',
fallback = 0.05)
# must convert minutes and hours to only minutes as that's how the
# cycle time works
hours = config.getfloat('Cycletime', 'Hours', fallback = 0)
args['CYCLETIME'] = hours * 60 + args['CYCLETIME']
args['CATEGORY'] = config.get('Options', 'Category', fallback = "hot")
args['NSFW'] = config.getboolean('Adult Content', 'NSFW',
fallback = False)
dir_ = os.getcwd() + "\\Downloaded Images\\"
args['DWNLDLOC'] = config.get('Save Location', 'Directory',
fallback = dir_)
URL = "https://www.reddit.com/r/" + args['SUBREDDITS'] + "/" + \
args['CATEGORY'] + "/"
return args
def minwidth():
"""
returns the value specified by the method name from the
settings.conf file. These methods are mostly used in the
GUI to insert the values stored in settings.conf into the
Entries on the GUI.
"""
config = Config.file_found()
if config:
minwidth = config.getint('Options', 'Minwidth')
return minwidth
# this is so we don't break anything if no value is set
# for this particular value in settings.conf
return ""
def minheight():
config = Config.file_found()
if config:
minheight = config.getint('Options', 'Minheight')
return minheight
return ""
def cycletime():
config = Config.file_found()
if config:
min_ = config.getfloat('Cycletime', 'Minutes')
hr = config.getfloat('Cycletime', 'Hours')
return hr, min_
return "", ""
def downloadLoc():
config = Config.file_found()
if config:
downloadLoc = config.get('Save Location', 'Directory')
return downloadLoc
return ""
def nsfw():
config = Config.file_found()
if config:
nsfw = config.getboolean('Adult Content', 'NSFW')
return nsfw
return False
def subreddits():
config = Config.file_found()
if config:
subreddits = config.get('Options', 'Subreddits')
subreddits = subreddits.replace("+", " ")
return subreddits
return ""
def category():
config = Config.file_found()
if config:
category = config.get('Options', 'Category')
firstLetter = category[0].upper()
category = firstLetter + category[1:]
log.debug("Category is: %s" % category)
return category
return "Hot"
def maxposts():
config = Config.file_found()
if config:
maxposts = config.getint('Options', 'Maxposts')
return maxposts
return ""
def lastImg():
config = Config.file_found()
if config:
lastImg = config.get('Last Wallpaper', 'Wallpaper')
return lastImg
return ""
def statusBar():
config = Config.file_found()
if config:
statusText = config.get('Statusbar', 'Statusbar Text')
return statusText
return ""
def writeStatusBar(statusText):
config = Config.file_found()
if config:
config['Statusbar'] = OrderedDict([('Statusbar Text',
statusText)])
with open('settings.conf', 'w+') as configfile:
config.write(configfile)
####################################################################
### FUNCTION IMPLEMENTATIONS
####################################################################
def Config_logging():
""" Configures the logging to external file """
global log
# set file logger
rootLog = logging.getLogger('')
rootLog.setLevel(logging.DEBUG)
# set format for output to file
formatFile = logging.Formatter(fmt='%(asctime)-s %(levelname)-6s: '\
'%(lineno)d : %(message)s',
datefmt='%m-%d %H:%M')
# add filehandler so once the filesize reaches 5MB a new file is
# created, up to 3 files
fileHandle = logging.handlers.RotatingFileHandler("CrashReport.log",
maxBytes=5000000,
backupCount=3,
encoding = "utf-8")
fileHandle.setFormatter(formatFile)
rootLog.addHandler(fileHandle)
# configures logging to console
# set console logger
console = logging.StreamHandler()
console.setLevel(logging.DEBUG) #toggle console level output with this line
# set format for console logger
consoleFormat = logging.Formatter('%(levelname)-6s %(message)s')
console.setFormatter(consoleFormat)
# add handler to root logger so console && file are written to
logging.getLogger('').addHandler(console)
log = logging.getLogger('reddit-paper')
#####################################################################
#REQUIRES url
#MODIFIES nothing
#EFFECTS returns a praw.Reddit instance if able to connect to the
# specified url; exits if not able to connect or the request times out
def Connected(url):
r = praw.Reddit(user_agent = USERAGENT)
try:
uaurl = urllib.request.Request(url,
headers={'User-Agent' : USERAGENT})
url = urllib.request.urlopen(uaurl,
timeout = 3,
cafile = 'cacert.pem')
content = url.read().decode('utf-8')
json.loads(content)
url.close()
Config.writeStatusBar("Connecting to Reddit...")
# Error that usually occurs when there is no internet connection
except URLError as e:
Config.writeStatusBar("Not connected to the internet.")
log.error("Not connected to the internet. Check "
"your internet connection and try again.")
log.debug("Error is: %s" % e)
sys.exit(0)
except (HTTPError, timeout, AttributeError, ValueError) as e:
Config.writeStatusBar("Not connected to reddit.com. Sign in to"
"internet and try again.")
log.error("You do not appear to be connected to Reddit.com."
" This is likely due to a redirect by the internet connection"
" you are on. Check to make sure no login is required and the"
" connection is stable, and then try again.")
log.debug("Error is: %s" % e)
sys.exit(0)
return r
####################################################################
#REQUIRES link entered by the user
#MODIFIES nothing
#EFFECTS Downloads the image specified by the user and sets it as the wallpaper
def Single_link(link):
if link:
SingleImg(link)
####################################################################
#REQUIRES img_link
#MODIFIES img_link
#EFFECTS Performs operations on url to derive image name and then
# returns the img_name
def General_parser(img_link):
if img_link == []:
return False
try:
remove_index = img_link.rindex('/')
except ValueError:
# occurs when index is not found
log.debug("'/' in img_link is not found", exc_info = True)
return False
image_name = img_link[remove_index + 1:]
# checks for file format ending, and appends .jpg
# if none is found
if image_name.rfind('.') == -1:
image_name = image_name + ".jpg"
log.debug("Image name is: {}".format(image_name))
index = image_name.rfind('.jpg?')
if index != -1:
# strips off '?1020a0747' from some image names
# that have misc. characters after the .jpg
image_name = image_name[:index + 4]
return image_name
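# For illustration (made-up url): General_parser('https://example.com/pics/photo.jpg?1020a0747')
# returns 'photo.jpg'; a link with no file extension gets '.jpg' appended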
####################################################################
#REQUIRES url
#MODIFIES url
#EFFECTS Returns the static download URL of the file, specific
# to Flickr. This SO post helped:
# https://stackoverflow.com/questions/21673323/download-flickr-images-of-specific-url
#
# A list of titles and how to determine size based on ending characters:
# _o (original file) is used here as it is the most reliable,
# although it is sometimes a very large file
# https://www.flickr.com/services/api/misc.urls.html
def Flickr_parse(url):
try:
# gets the page and reads the html into flickr_html
flickr_html = urllib.request.urlopen(url, cafile = 'cacert.pem').read()
# searches for static flickr url within webpage
flickr_html = flickr_html.decode('utf-8')
# at the moment, BeautifulSoup would be too difficult to
# use to parse the html for the link, as the link is not within
# standard html anyway. (It's located in 'Model Export' towards the
# bottom of the page)
img_link = re.findall(r"""
farm # farm is always in static img url
[^":]* # characters to not capture
_[o|k|h|b]\. # _o indicates original img per
# flickr standards
[jpg|png|gif]* # file format is either
# png, jpg, or gif
""", flickr_html, re.VERBOSE)[0]
url = 'https://' + img_link
# some urls come back with escaped backslashes, so remove them
url = url.replace('\\', '')
log.debug("img_link from flickr regex: %s", img_link)
#generates image_name from static url
return General_parser(img_link), url
except KeyboardInterrupt:
sys.exit(0)
# no links/an error occurred while finding links in html of page
except (IndexError,TypeError):
log.debug("Did not find any links in Flickr_parse")
# a UnicodeDecodeError is thrown when the url passed in is already
# a direct file link whose contents cannot be decoded as utf-8;
# in that case we just need to download the img normally anyway
except UnicodeDecodeError:
return General_parser(url), url
except Exception:
log.warning("Exception occured, or image does not fit"
" required size in Flickr_parse",
exc_info = True)
return False, False
####################################################################
#REQUIRES url
#MODIFIES url, image_name
#EFFECTS Returns the image_name and url of the correct link to
# download from. 500px.com sometimes 'protects' the photos
# so they are not as easily programmatically downloaded,
# however the links in the html provide the 'static' download
# link
def Five00px_parse(url):
try:
#refer to Flickr_parse for explanation of this method
px_html = urllib.request.urlopen(url, cafile = 'cacert.pem')
img_html = BeautifulSoup(px_html)
# finds the html with class 'the_photo' and returns the src of that element
img_link = img_html.select('.the_photo')[0].get('src')
url = img_link
return General_parser(img_link), url
except KeyboardInterrupt:
sys.exit(0)
except (IndexError,TypeError):
log.debug("No links found in Five00px_parse")
except UnicodeDecodeError:
return General_parser(url), url
except Exception:
log.warning("Exception occured in Five00px_parse",
exc_info = True)
return False, False
####################################################################
# Very similar to Five00px_parse and Flickr_parse; see those
# for details of how this method works
def Deviant_parse(url, regex):
try:
dev_html = urllib.request.urlopen(url, cafile = 'cacert.pem')
# direct image download link that must begin with
# fc or orig or pre
if regex[:2] == "fc" or regex[:4] == "orig" or\
regex[:3] == "pre" or regex[:3] == "img":
return General_parser(url), url
else:
img_html = BeautifulSoup(dev_html)
# finds all classes with 'dev-content-normal' and finds the src
# attribute of it
img_link = img_html.select('.dev-content-normal')[0].get('src')
url = img_link
return General_parser(url), url
except KeyboardInterrupt:
sys.exit(0)
except (IndexError, TypeError):
log.debug("No links found in Deviant_parse")
return False, False
# this exception is when the good img url to download is
# passed in. Since this url when opened is not html, it throws
# this error, so we know we must find the image title and return
# the url passed in
except UnicodeDecodeError:
return General_parser(url), url
except Exception:
log.warning("Exception occured in Deviant_parse",
exc_info = True)
return False, False
####################################################################
# REQUIRES url for earlycanvas parsing
# MODIFIES the link that gets passed as the download link
# EFFECTS Returns the direct link to download the image
def Early_canvas_parser(url):
html = urllib.request.urlopen(url, cafile = 'cacert.pem')
html = BeautifulSoup(html)
div = html.select('.item-image')[0]
url = div.findChildren()[0].get('src')
return url
####################################################################
# REQUIRES valid imgur url
# MODIFIES image_name
# EFFECTS Retrieves direct image link from imgur.com when posted
# as either an album, or gallery.
# An album example: https://imgur.com/a/dLB0
# A gallery example: https://imgur.com/gallery/fDdj6hw
def Imgur_parse(url, regex):
# check if it's a gif or not from imgur. These don't
# download/display
if (url.rfind(".gif") != -1) or (url.rfind(".gifv") != -1):
log.debug("Image is likely a gif or gifv, not downloading")
return False, False
# then check if it's a direct link
elif regex == "i.imgur.com":
image_name = General_parser(url)
return image_name, url
# check if an imgur.com/gallery link
elif (url.find('/gallery/') != -1):
image_name = General_parser(url)
url = "https://i.imgur.com/" + image_name
return image_name, url
# /a/ means an album in imgur standards
elif (url.find('/a/') != -1):
# have to find new url to download the first image from album
uaurl = urllib.request.Request(url, headers = {'User-Agent': USERAGENT})
imgur_html = urllib.request.urlopen(uaurl, cafile = 'cacert.pem')
soup = BeautifulSoup(imgur_html)
# | class=image w/ child <a> | gets href of this <a> child |
url = soup.select('.image a')[0].get('href')
url = "https:" + url
image_name = General_parser(url)
return image_name, url
# a regular imgur.com domain but no img type in url
elif regex == "imgur.com":
image_name = General_parser(url)
url = "https://i.imgur.com/" + image_name
return image_name, url
# if we get here, there's likely a url format error
else:
log.debug("Something went wrong in Imgur_parse")
return False, False
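# For illustration, assuming imgur keeps this url scheme: a gallery link such
# as https://imgur.com/gallery/fDdj6hw (from the example above) is rewritten by
# the gallery branch to https://i.imgur.com/fDdj6hw.jpg, since General_parser
# appends '.jpg' when the name has no extension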
####################################################################
#REQUIRES url of image to be renamed
#MODIFIES nothing
#EFFECTS Returns the image name and direct download URL of the photo
# being downloaded, derived from the long URL it comes in as
def Title_from_url(im):
try:
# extracts the domain from the url so we know
# which site-specific parser to use for the
# link
regex_result = re.findall(r'^(?:https?:\/\/)?(?:www\.)?([^\/]+)',\
im.link, re.IGNORECASE)
log.debug("Regex (domain) from URL is: %s ", regex_result)
# imgur domain
if regex_result[0] == "imgur.com" or \
regex_result[0] == "i.imgur.com":
# check if we encountered bad data such as a gif or gifv
image_name, url = Imgur_parse(im.link, regex_result[0])
if image_name:
return image_name, url, True
else:
return False, False, False
# staticflickr domain
elif (regex_result[0].find("staticflickr") != -1):
im.formatImgName()
return im.image_name, im.link, True
# flickr domain
elif (regex_result[0].find("flickr") != -1):
image_name, url = Flickr_parse(im.link)
return image_name, url, True
# 500px domain
elif (regex_result[0].find("500px.com") != -1):