Added docstring to all functions. 🎉

This commit is contained in:
2017-12-22 12:52:38 +01:00
parent 6bdf904a40
commit 98c05a380d
4 changed files with 195 additions and 160 deletions

View File

@@ -8,26 +8,41 @@ from urllib.error import URLError
logger = logging.getLogger('torrentSearch')
def build_url(ssl, baseUrl, path, args_dict=None):
    """
    Join the given parameters together into a complete url.

    :param bool ssl: whether the https scheme should be used instead of http
    :param path: the rest of the url path, either as an already-joined string
        or as a list of segments (e.g. ['search', 'lucifer', '0'])
    :type path: list or str
    :param str baseUrl: the start of the url (e.g. 'http://thepiratebay.org')
    :param dict args_dict: query parameters to append to the url
    :return: complete url based on the inputs
    :rtype: str
    """
    # A None default avoids the shared-mutable-default pitfall that the
    # previous {} (and the earlier []) default argument had.
    if args_dict is None:
        args_dict = {}
    url_parts = list(parse.urlparse(baseUrl))
    url_parts[0] = 'https' if ssl else 'http'
    # isinstance is the idiomatic type check (handles subclasses too)
    url_parts[2] = '/'.join(path) if isinstance(path, list) else path
    url_parts[4] = parse.urlencode(args_dict)
    return parse.urlunparse(url_parts)
def convert_query_to_percent_encoded_octets(input_query):
    """
    Percent-encode a query so it can be embedded in a URI.

    A list input is first joined with single spaces; urllib's quote() then
    encodes spaces (and other non-safe characters) as percent-encoded
    octets, e.g. ' ' becomes '%20'.

    :param input_query: the raw query, as a string or a list of words
    :type input_query: str or list
    :return: the percent-encoded query string
    :rtype: str
    """
    if isinstance(input_query, list):
        input_query = ' '.join(input_query)
    return parse.quote(input_query)
def fetch_url(url):
"""
Call and get output for a given url
:param str url: the url we want to make a request to
:return: a response object with contents and status code of the request
:rtype: http.client.HTTPResponse
"""
logger.debug('Fetching query: {}'.format(url))
req = request.Request(url, headers={'User-Agent': 'Mozilla/5.0'})
try:

View File

@@ -21,27 +21,25 @@ class Jackett(object):
self.page_limit = limit
self.ssl = ssl
def get_apikey(self):
    """
    Return the api key that was set in the initiator.

    :return: the configured api key
    """
    key = self.apikey
    logger.debug('Using api key: {}'.format(key))
    return key
def get_path(self):
    """
    Return the path that was set in the initiator.

    :return: the configured path
    :rtype: str
    """
    return self.path
def get_page_limit(self):
    """
    Return the page_limit that was set in the initiator.

    :return: the configured page limit
    """
    limit = self.page_limit
    logger.debug('Current page limit: {} pages'.format(limit))
    return limit
# Starts the call to getting result from our indexer
# query [string]
# returns [List of Torrent objects]
def search(self, query):
"""
Starts the call to getting result from our indexer
:param jackett.Jackett self: object instance
:param str query: query we want to search for
:return: list of results we found from scraping jackett output based on query
:rtype: list
"""
baseUrl = 'http://' + self.host
path = self.get_path()
url_args = {
@@ -57,10 +55,15 @@ class Jackett(object):
return self.parse_xml_for_torrents(res.read())
# def __init__(self, name, magnet=None, size=None, uploader=None, date=None,
# seed_count=None, leech_count=None, url=None):
def find_xml_attribute(self, xml_element, attr):
"""
Finds a specific XML attribute given a element name
:param jackett.Jackett self: object instance
:param xml.etree.ElementTree.Element xml_element: the xml tree we want to search
:param str attr: the attribute/element name we want to find in the xml tree
:return: the value of the element given the attr/element name
:rtype: str
"""
value = xml_element.find(attr)
if (value != None):
logger.debug('Found attribute: {}'.format(attr))
@@ -70,6 +73,13 @@ class Jackett(object):
return ''
def parse_xml_for_torrents(self, raw_xml):
"""
Finds a specific XML attribute given a element name
:param jackett.Jackett self: object instance
:param bytes raw_xml: the xml page returned by querying jackett
:return: all the torrents we found in the xml page
:rtype: list
"""
tree = ET.fromstring(raw_xml)
channel = tree.find('channel')
results = []

View File

@@ -21,20 +21,20 @@ class Piratebay(object):
self.page = 0
self.total_pages = -1
def get_path(self):
    """
    Return the path that was set in the initiator.

    :return: the configured path
    :rtype: str
    """
    return self.path
def get_page_limit(self):
    """
    Return the page_limit that was set in the initiator.

    :return: the configured page limit
    """
    return self.page_limit
# Starts the call to getting result from our indexer
# query [string]
# returns [List of Torrent objects]
def search(self, query):
"""
Starts the call to getting result from our thepiratebay site
:param piratebay.Piratebay self: object instance
:param str query: query we want to search for
:return: list of results we found from scraping thepiratebay site based on query
:rtype: list
"""
search_query = convert_query_to_percent_encoded_octets(query)
baseUrl = 'http://' + self.host
@@ -45,7 +45,6 @@ class Piratebay(object):
return self.parse_raw_page_for_torrents(res.read())
def removeHeader(self, bs4_element):
if ('header' in bs4_element['class']):
return bs4_element.find_next('tr')

View File

@@ -79,7 +79,9 @@ def main():
def getConfig():
"""
Read path and get configuration file with site settings
Returns config [configparser]
:return: config settings read from 'config.ini'
:rtype: configparser.ConfigParser
"""
config = configparser.ConfigParser()
config_dir = os.path.join(BASE_DIR, 'config.ini')
@@ -90,7 +92,10 @@ def getConfig():
def createJSONList(torrents):
"""
Iterates over all torrent objects in torrents and gets all attributes which are appended to a list
Returns: List of torrents with all their info in a JSON format
:param list torrents: list of torrent objects to serialize
:return: List of torrents with all their info in a JSON format
:rtype: str
"""
jsonList = []
for torrent in torrents:
@@ -129,7 +134,13 @@ def chooseCandidate(torrent_list):
def searchTorrentSite(config, query, site, print_result):
"""
Selects site based on input and finds torrents for that site based on query
Returns json list with results. If print_results is True in args then also prints the output to terminal
:param configparser.ConfigParser config: configuration with the site settings
:param str query: query to search search torrents for
:param str site: the site we want to index/scrape
:param boolean print_result: if the results should be printed to the terminal
:return: json list with results
:rtype: str
"""
logger.debug('Searching for query {} at {}'.format(query, site))