epam-python-courses-7-bsu · Sergey582 · Nov 18, 2019 · Nov 20, 2019 · Nov 20, 2019 · Nov 21, 2019
diff --git a/final_task/README.md b/final_task/README.md
@@ -1,3 +1,48 @@
-# Your readme here
-Some text.
-Checkout how to write this file using *markdown*.
+
+#### This program receives an RSS URL and prints the news in a human-readable format.
+
+- positional arguments:
++     source          RSS URL
+
+- optional arguments:
++     -h, --help      show this help message and exit
++     --version       Print version info
++     --json          Print result as JSON in stdout
++     --verbose       Outputs verbose status messages
++     --limit LIMIT   Limit news topics if this parameter provided
++     --date DATE     Search the cache for news by date, given in YYYYmmdd format
++     --to-html PATH  Convert the news to an html file
++     --to-pdf PATH   Convert the news to a pdf file
++     --colorize      Print news in multi-colored format
++     --clear         Clear the cached news
+
+
+
+-  Installation recommendations for rss-reader:
+1. Open a terminal
+2. Enter "pip install setuptools" or "pip3 install setuptools"
+3. Go to the folder final_task
+4. Enter "python3 setup.py install"
+5. The application is now installed
+6. To run the utility, type "rss-reader" in the terminal, followed by a space and the URL of the news feed
+- Example: rss-reader https://news.yahoo.com/rss
+
+- News caching:
++     To see the news history, pass the additional parameter --date
++     Example: rss-reader https://news.tut.by/rss/ --limit 2 --date 20191122
++     The cache can be searched by date and source, or by date only
+
+- Format converter:
+1. Use --to-pdf to save news in pdf format
+2. Use --to-html to save news in html format
+3. If there is no internet connection, the file is saved without images
+4. Enter the full path to the file
+5. If you enter a path to a directory, the news is saved to the file "your path/News.(pdf or html)"
+
+- If you enter --colorize, the utility prints its result in colorized mode.
+- If you enter --colorize with --json, the utility prints the JSON result in colorized mode.
+
+- If you enter --clear, all cached news will be deleted.
+
+
+
diff --git a/final_task/config.txt b/final_task/config.txt
@@ -0,0 +1,5 @@
+database postgres
+user postgres
+password 1
+host localhost
+port 5432
diff --git a/final_task/rss_reader/News.py b/final_task/rss_reader/News.py
@@ -0,0 +1,53 @@
+from dataclasses import dataclass
+import datetime
+import logging
+
+# Module-level logger for News.py; the methods below obtain their own named loggers.
+MODULE_LOGGER = logging.getLogger("rss_reader.News")
+
+
+@dataclass
+class News:
+    """
+        One news item: feed name, title, date, link, image info,
+        short summary and the list of links found in the news.
+    """
+    feed: str
+    title: str
+    date: datetime.datetime
+    link: str
+    info_about_image: str
+    briefly_about_news: str
+    links_from_news: list
+
+    def get_json(self):
+        """
+            Build a dict describing the news that can be dumped as json.
+            The date is stored as its str() representation.
+        """
+        log = logging.getLogger("rss_reader.News.get_json")
+        log.info("return news in json format")
+        return {
+            "Feed": self.feed,
+            "Title": self.title,
+            "Date": str(self.date),
+            "Link": self.link,
+            "Info about image": self.info_about_image,
+            "Briefly about news": self.briefly_about_news,
+            "Links": self.links_from_news,
+        }
+
+    def __str__(self):
+        """
+           Build the multi-line text that is printed to stdout for the news.
+           Empty links are skipped but still count towards the numbering.
+        """
+        log = logging.getLogger("rss_reader.News.__str__")
+        log.info("return str")
+        numbered_links = "".join(
+            "[" + str(position) + "] " + url + "\n"
+            for position, url in enumerate(self.links_from_news or [])
+            if url
+        )
+        rows = (
+            f"Feed: {self.feed}",
+            f"Title: {self.title} ",
+            f"Date: {self.date} ",
+            f"Link: {self.link}",
+            f"Info about image: {self.info_about_image}",
+            f"Briefly about news: {self.briefly_about_news}",
+            f"Links: \n{numbered_links}",
+        )
+        return "\n".join(rows)
diff --git a/final_task/rss_reader/__init__.py b/final_task/rss_reader/__init__.py
diff --git a/final_task/rss_reader/converter.py b/final_task/rss_reader/converter.py
@@ -0,0 +1,209 @@
+import fnmatch
+import logging
+import os
+import tempfile
+import textwrap
+from io import BytesIO
+
+import dominate
+import requests
+from PIL import Image
+from dominate import tags
+from reportlab.lib.pagesizes import A4
+from reportlab.pdfbase import pdfmetrics
+from reportlab.pdfbase.ttfonts import TTFont
+from reportlab.pdfgen.canvas import Canvas
+
+# Module-level logger for converter.py; the functions below obtain their own named loggers.
+MODULE_LOGGER = logging.getLogger("rss_reader.converter")
+
+
+def get_path(path: str, expansion_file: str) -> str:
+    """
+    Validate the entered path and return the path of the file to write.
+
+    If path is an existing directory, the file "News" + expansion_file inside
+    that directory is returned. Otherwise path is treated as a file path: it
+    must end with expansion_file and its parent directory must exist. A bare
+    file name without a directory part refers to the current directory.
+    :param path: path to a directory or to the target file
+    :param expansion_file: required file extension including the dot, e.g. ".pdf"
+    :return: path of the file the news should be saved to
+    :raises FileNotFoundError: if the extension does not match or the parent
+        directory does not exist
+    """
+    logger = logging.getLogger("rss_reader.converter.get_path")
+    logger.info("check path")
+    if os.path.isdir(path):
+        logger.info("path specified to directory")
+        # os.path.join uses the platform separator and avoids a doubled slash
+        return os.path.join(path, 'News' + expansion_file)
+    if not fnmatch.fnmatch(path, '*%s' % expansion_file):
+        logger.error("Invalid expansion ")
+        raise FileNotFoundError(f"Invalid expansion {path}")
+    # dirname() is empty for a bare file name such as "news.pdf";
+    # in that case the file goes to the current directory.
+    parent_directory = os.path.dirname(path) or os.curdir
+    if not os.path.isdir(parent_directory):
+        logger.error("File or directory not found")
+        raise FileNotFoundError(f"File or directory not found {path}")
+    return path
+
+
+def get_html(list_of_news: list):
+    """
+    Forms html content
+
+    The document head (stylesheet, script and inline style) is filled once;
+    every news item is then appended to the body as its own div with feed,
+    title, date, link, image info, summary, the list of links and, when a
+    second link is present, that link rendered as a clickable image.
+    :param list_of_news: news items exposing feed, title, date, link,
+        info_about_image, briefly_about_news and links_from_news
+    :return: dominate document holding the rendered news
+    """
+    logger = logging.getLogger("rss_reader.converter.get_html")
+    logger.info("getting html content")
+    doc = dominate.document(title='RSS READER')
+    # Fill the head outside the loop: doing it per news item repeats the
+    # stylesheet, script and style tags once for every entry.
+    with doc.head:
+        tags.link(rel='stylesheet', href='style.css')
+        tags.script(type='text/javascript', src='script.js')
+        tags.style("""\
+                     body {
+                         background-color: #F9F8F1;
+                         color: #2C232A;
+                         font-family: sans-serif;
+                         font-size: 2.6em;
+                         margin: 3em 1em;
+                     }
+
+                 """)
+
+    for news in list_of_news:
+        links = news.links_from_news or []
+        # The second link is used as the picture URL; it may be missing.
+        image_url = links[1] if len(links) > 1 else None
+        with doc:
+            with tags.div(id='header'):
+                tags.p("Feed: ", news.feed)
+                tags.p("Title: ", news.title)
+                tags.p("Date ", str(news.date))
+                # NOTE(review): str.title() title-cases the URL shown as link
+                # text (the href stays intact) - confirm this is intended.
+                tags.p("Link: ", tags.a(news.link.title(), href=news.link, target="_blank"))
+                tags.p("Info about image: ", news.info_about_image)
+                tags.p("Briefly about news: ", news.briefly_about_news)
+                tags.p("Links: ", )
+                for reference in links:
+                    if reference:
+                        tags.li(tags.a(reference.title(), href=reference, target="_blank"))
+                if image_url:
+                    tags.a(tags.img(
+                        src=image_url,
+                        width="200", height="200", alt=news.info_about_image),
+                        href=image_url, target="_blank")
+    logger.info("html content received")
+    return doc
+
+
+def conversion_of_news_in_html(path, list_of_news):
+    """
+    Convert the news to html and save the result
+    :param path: target file or directory, checked by get_path
+    :param list_of_news: news items passed to get_html
+    :return:
+    """
+    log = logging.getLogger("rss_reader.converter.conversion_of_news_in_html")
+    log.info("conversion of news in html")
+    target_file = get_path(path, ".html")
+    save_html(target_file, get_html(list_of_news))
+    log.info("conversion of news in html successful completed")
+
+
+def save_html(path, html_content):
+    """
+    Save news in file
+
+    The rendered document is written as UTF-8 so that non-ASCII news text
+    does not depend on the platform default encoding.
+    :param path: file the html is written to
+    :param html_content: object whose render() returns the html text
+    :return:
+    """
+    logger = logging.getLogger("rss_reader.converter.save_html")
+    try:
+        # Explicit encoding: the locale default may be unable to encode the text
+        with open(path, 'w', encoding='utf-8') as file:
+            file.write(html_content.render())
+        print("news successfully saved to file ", path)
+        logger.info("news successfully saved to file  ")
+    except MemoryError:
+        logger.error("not enough memory to save html file")
+        print("You do not have enough memory to save html file")
+
+def get_img(image_name, reference, timeout=10):
+    """
+    Download image in file
+
+    The picture is resized to 100x100, converted to RGB and saved as JPEG.
+    Failures are logged and reported through the return value.
+    :param image_name: path of the file the JPEG is written to
+    :param reference: URL of the picture
+    :param timeout: seconds to wait for the server before giving up
+    :return: True if image successfully downloaded
+    """
+    logger = logging.getLogger("rss_reader.converter.get_img")
+    logger.info("return img")
+    try:
+        # Without a timeout the request can wait on a silent server forever.
+        response = requests.get(reference, timeout=timeout)
+        img = Image.open(BytesIO(response.content))
+        img = img.resize((100, 100))
+        img = img.convert('RGB')
+        img.save(image_name, 'JPEG')
+    except requests.exceptions.Timeout:
+        logger.error("Picture server did not respond in time\n")
+    except requests.exceptions.ConnectionError:
+        logger.error("You do not have an internet connection\n"
+                     "your news will be saved in pdf without pictures")
+    except requests.exceptions.MissingSchema:
+        logger.error("Invalid url picture \n")
+    except OSError:
+        # Also covers remaining requests errors and unreadable image data
+        logger.error("cannot identify image\n")
+    else:
+        return True
+    return False
+
+
+def text_separator(text: str, break_long_words: bool) -> list:
+    """
+    Wrap the text into lines of at most 50 characters
+    :param text: text to wrap
+    :param break_long_words: whether words longer than a line may be split
+    :return: list of lines; a text without words gives one empty line
+    """
+    log = logging.getLogger("rss_reader.converter.text_separator")
+    wrapped_lines = textwrap.wrap(text, width=50, break_long_words=break_long_words)
+    if not wrapped_lines:
+        # Keep a single empty line when there is nothing to wrap
+        wrapped_lines = [""]
+    log.info("text successfully broken")
+    return wrapped_lines
+
+
+def print_text_in_pdf(canvas, text, x, y):
+    """
+    Draw the text on the canvas line by line, starting below y
+
+    The text is wrapped by text_separator without breaking long words. Each
+    line is drawn 25 units below the previous one; when y drops below 45 a
+    new page is started, the font is set again and y restarts at 800.
+    :param canvas: canvas providing showPage, setFont and drawString
+    :param text: text to draw
+    :param x: horizontal position of every line
+    :param y: vertical position above the first line
+    :return: vertical position 25 units below the last drawn line
+    """
+    log = logging.getLogger("rss_reader.converter.print_list_in_pdf")
+    log.info("print list in pdf")
+    for row in text_separator(text, False):
+        if y < 45:
+            canvas.showPage()
+            canvas.setFont('FreeSans', 19)
+            y = 800
+        y = y - 25
+        canvas.drawString(x, y, row)
+    return y - 25
+
+
+def conversion_of_news_in_pdf(path, list_of_news):
+    """
+    Render the news into a pdf file
+
+    For every news item the picture (when it can be downloaded) is drawn
+    first, followed by feed, title, date, link, image info and summary.
+    Downloaded pictures are kept in a temporary directory that is removed
+    once the pdf has been saved.
+    :param path: target file or directory, checked by get_path
+    :param list_of_news: news items exposing feed, title, date, link,
+        info_about_image, briefly_about_news and links_from_news
+    :return:
+    :raises FileNotFoundError: propagated from get_path for an invalid path
+    """
+    logger = logging.getLogger("rss_reader.converter.conversion_of_news_in_pdf")
+    correct_path = get_path(path, ".pdf")
+    canvas = Canvas(correct_path, pagesize=A4)
+    # NOTE(review): 'FreeSans.ttf' is given as a relative name - confirm where
+    # the font file is expected to live.
+    pdfmetrics.registerFont(TTFont('FreeSans', 'FreeSans.ttf'))
+    canvas.setFont('FreeSans', 19)
+    canvas.setTitle("RSS READER")
+    x = 10
+    y = 800
+    # A private temporary directory keeps scratch pictures out of the working
+    # directory and guarantees their removal even if drawing fails.
+    with tempfile.TemporaryDirectory() as picture_dir:
+        for index, news in enumerate(list_of_news):
+            canvas.setFont('FreeSans', 19)
+            links = news.links_from_news or []
+            # The second link is used as the picture URL; it may be missing.
+            picture_url = links[1] if len(links) > 1 else None
+            picture_file = os.path.join(picture_dir, f"tmp{index}.jpg")
+            if picture_url and get_img(picture_file, picture_url):
+                y -= 170
+                if y < 45:
+                    canvas.showPage()
+                    canvas.setFont('FreeSans', 19)
+                    y = 680
+                canvas.drawImage(picture_file, x, y, 150, 150)
+                y -= 40
+            y = print_text_in_pdf(canvas, news.feed, x, y)
+            y = print_text_in_pdf(canvas, news.title, x, y)
+            y = print_text_in_pdf(canvas, str(news.date), x, y)
+            y = print_text_in_pdf(canvas, news.link, x, y)
+            y = print_text_in_pdf(canvas, news.info_about_image, x, y)
+            y = print_text_in_pdf(canvas, news.briefly_about_news, x, y)
+            if y < 45:
+                canvas.showPage()
+                y = 800
+        logger.info("save news in pdf")
+        # Save while the pictures still exist on disk
+        canvas.save()
+    print("news successfully saved to file  ", correct_path)