# Daily-Dose/main.py
#
# File-listing metadata: 277 lines, 6.9 KiB, Python

import configparser
from datetime import date
import feedparser
from mdutils import MdUtils
from os import path
from shutil import copy
#################
# Configuration #
#################

# --- Output formats -------------------------------------------------------
# The main program refuses to run when pdf/html is requested without
# markdown, or when update_archive is requested without html.
markdown = True
pdf = False
html = True
update_archive = True

# --- HTML presentation ----------------------------------------------------
animations = True
html_stylesheet = "styles/simple.css"
# Values written into the "data-aos" attribute of the generated HTML.
title_animation = "fade-down"
heading_animation = "fade-right"
list_animation = "fade-left"
# NOTE(review): not referenced anywhere in the visible code - confirm
# whether it is still needed before removing.
ConvertToHTML = True

# --- Document naming ------------------------------------------------------
# Today's date formatted as "<day> <full month name>, <year>"; used as the
# base name of the generated files. og_title keeps the pristine value
# because the main program rebinds `title` while it runs.
og_title = date.today().strftime('%d %B, %Y')
title = og_title

# --- Feed sources ---------------------------------------------------------
# One digest is generated per configuration file listed here.
feed_configuration = [
    'feeds.ini',
    'covid.ini',
]

# Per configuration file: the id of the <ul> in index.html that lists past
# issues, the folder the HTML page is archived into, and the document title.
archive_configuration = {
    "feeds.ini": {
        "id": "daily-dose-list",
        "folder": "archive-daily-dose",
        "title": "Daily-Dose",
    },
    "covid.ini": {
        "id": "covid-19-list",
        "folder": "archive-covid-19",
        "title": "Covid-19 Sentry",
    },
}
#############
# Functions #
#############
def GetPosts(feed):
    """Fetch one RSS feed and return its filtered posts.

    The options are read from the section named *feed* of the module-level
    ``feeds`` object (the ``configparser.ConfigParser`` the main loop binds
    before calling this function):

    * ``URL``     - address handed to ``feedparser.parse`` (required).
    * ``IGNORE``  - list of words; an entry whose title or summary contains
      one of them (case-insensitively) is skipped. Default: no filtering.
    * ``SUMMARY`` - whether summaries are collected. Default: True.
    * ``ToRead``  - maximum number of posts to keep; -1 (or anything larger
      than the feed) means "all entries". Default: 5.
    * ``LINK``    - whether links are collected. Default: False.

    Args:
        feed: Name of the configuration section describing the feed.

    Returns:
        dict: integer keys ``0 .. n-1`` each map to
        ``{"post": {"title": bytes, "summary": bytes | None,
        "link": bytes | None}}`` (text is UTF-8 encoded), plus the keys
        ``"NoOfPosts"`` (int), ``"Summary"`` and ``"ShowLink"`` (the
        effective option values).

    Raises:
        SystemExit: with status 1 when the section has no ``URL`` option.
    """
    try:
        section = feeds[feed]
        URL = section["URL"]
    except KeyError:
        # The original message contained "%s" but never formatted it.
        print("Improper configuration for %s. No URL Specified" % feed)
        raise SystemExit(1)

    # NOTE(security): the option values below are passed to eval(), so the
    # .ini files must be trusted. If they only ever hold plain literals,
    # ast.literal_eval would be a safer replacement - confirm before changing.
    try:
        ToIgnore = eval(section["IGNORE"])
    except KeyError:
        ToIgnore = []
    try:
        ReadSummary = eval(section["SUMMARY"])
    except KeyError:
        ReadSummary = True
    try:
        ToRead = eval(section["ToRead"])
    except Exception:
        # Best effort, as before: a missing or unparsable value falls back to
        # the default. Unlike a bare "except:", this no longer swallows
        # SystemExit / KeyboardInterrupt.
        ToRead = 5
    try:
        ShowLink = eval(section["LINK"])
    except KeyError:
        ShowLink = False

    rss = feedparser.parse(URL)
    entries = rss.entries
    if ToRead == -1 or ToRead > len(entries):
        ToRead = len(entries)

    Posts = {}
    added = 0
    for entry in entries:
        if added == ToRead:
            break
        # Not every feed entry carries every element; a missing one is
        # treated as empty text instead of raising AttributeError.
        Title = str(getattr(entry, "title", ""))
        Summary = getattr(entry, "summary", "")
        title_lc = Title.lower()
        summary_lc = Summary.lower()
        if any(w.lower() in title_lc or w.lower() in summary_lc for w in ToIgnore):
            continue

        post = {
            "title": Title.encode('utf-8'),
            "summary": Summary.encode('utf-8') if ReadSummary else None,
            "link": getattr(entry, "link", "").encode('utf-8') if ShowLink else None,
        }
        Posts[added] = {"post": post}
        if not ReadSummary:
            # Legacy location of the "no summary" marker (it used to be
            # written here instead of under "post"); kept so existing
            # readers of this key keep working.
            Posts[added]["summary"] = None
        added += 1

    Posts["NoOfPosts"] = added
    Posts["Summary"] = ReadSummary
    Posts["ShowLink"] = ShowLink
    return Posts
def add_today(HomeFile,TagID,folder):
    """Archive today's HTML page and link it from the index page.

    The page name is the module-level ``og_title`` plus ".html". If that
    page is not yet inside *folder* it is copied there from the current
    directory. A ``<li><a href="./<folder>/<page>">og_title</a></li>`` item
    is then inserted at the top of the ``<ul>`` whose id is *TagID* in
    *HomeFile*, and *HomeFile* is rewritten.

    Args:
        HomeFile: Path of the HTML index file to update.
        TagID: ``id`` attribute of the ``<ul>`` that lists archived pages.
        folder: Archive folder, relative to the current directory.

    Raises:
        SystemExit: with status 1 when the page exists neither in *folder*
            nor in the current directory, or when the ``<ul>`` is missing.
    """
    # Imported locally so the function does not depend on the main program
    # having imported bs4 as a side effect of its HTML branch.
    from bs4 import BeautifulSoup

    page_name = og_title + ".html"
    archived_page = "./%s/" % folder + page_name

    if not path.exists(archived_page):
        if not path.exists(page_name):
            print("File does not exist!")
            raise SystemExit(1)
        copy(page_name, folder)

    with open(HomeFile) as fp:
        soup = BeautifulSoup(fp, 'html.parser')

    archive_list = soup.find('ul', {"id": TagID})
    if archive_list is None:
        # Previously this surfaced as an AttributeError on None.
        print('No <ul id="%s"> found in %s' % (TagID, HomeFile))
        raise SystemExit(1)

    # Running the script twice on the same day used to add a second,
    # identical entry; skip the update when the page is already listed.
    if archive_list.find('a', {"href": archived_page}) is not None:
        return

    entry = soup.new_tag('li')
    anchor = soup.new_tag('a', href=archived_page)
    anchor.string = og_title
    entry.append(anchor)
    archive_list.insert(0, entry)

    with open(HomeFile, 'w') as fp:
        fp.write(str(soup))
################
# Main Program #
################
# For every configuration file: fetch its feeds, write the digest as
# Markdown, optionally convert it to PDF/HTML with pandoc, decorate the HTML
# and finally link the page from the archive index.

# PDF and HTML are converted from the Markdown file, and the archive index
# links to the HTML page, so reject inconsistent settings up front.
if (pdf or html) and not markdown:
    print("Markdown should be True to convert to pdf/html")
    raise SystemExit(1)
if update_archive and not html:
    print("HTML is required to update archive")
    raise SystemExit(1)

for config in feed_configuration:
    title = og_title
    # `feeds` has to stay a module-level name: GetPosts() reads it.
    feeds = configparser.ConfigParser()
    # read() returns the list of files it could parse; empty means the file
    # is missing or unreadable. (The file used to be parsed a second time.)
    if not feeds.read(config):
        print("%s does not exist!"%config)
        raise SystemExit(1)
    print("Reading %s"%config)

    # sections() leaves out the implicit DEFAULT section.
    rss_feeds = feeds.sections()
    print("Read %s feeds from the configuration file" % str(len(rss_feeds)))
    print(rss_feeds)

    posts = {feed: GetPosts(feed) for feed in rss_feeds}

    base_name = title.strip()
    md_name = base_name + ".md"

    if markdown:
        mdfile = MdUtils(file_name=title,title=archive_configuration[config]['title'])
        for feed, feed_posts in posts.items():
            mdfile.new_header(level=1,title="From %s" % feed)
            with_summary = feed_posts["Summary"]
            with_link = feed_posts["ShowLink"]
            for idx in range(feed_posts["NoOfPosts"]):
                post = feed_posts[idx]["post"]
                mdfile.write("* **" + post["title"].decode('utf-8') + "**")
                if with_summary:
                    mdfile.write(" - ")
                    mdfile.write(post["summary"].decode('utf-8'))
                if with_link:
                    mdfile.write(" - [link](%s)" % post["link"].decode('utf-8'))
                # Items that carry a summary or link are separated by a
                # blank line; title-only items by a single newline.
                mdfile.write("\n\n" if (with_summary or with_link) else "\n")
        mdfile.new_line("\n")
        mdfile.new_table_of_contents(table_title='Contents', depth=2)
        mdfile.create_md_file()

    if pdf or html:
        import pypandoc

    if pdf:
        pypandoc.convert_file(
            md_name,
            'pdf',
            outputfile=base_name + ".pdf",
            extra_args=['-V', 'geometry:margin=1.5cm'],
        )

    if html:
        from bs4 import BeautifulSoup

        html_name = base_name + ".html"
        convert = pypandoc.convert_file(md_name,'html',outputfile=html_name,extra_args=['-s'])
        # An explicit check instead of `assert`, which is stripped under -O.
        if convert != '':
            raise RuntimeError("Unexpected pandoc output while writing %s" % html_name)

        # pandoc writes UTF-8, so do not depend on the platform default.
        with open(html_name, encoding="utf-8") as fp:
            soup = BeautifulSoup(fp,'html5lib')

        # A separate name: this used to rebind `title`, replacing the
        # file-name string with a tag object.
        title_tag = soup.new_tag('title')
        title_tag.string = archive_configuration[config]['title']
        soup.head.append(title_tag)

        viewport = soup.new_tag("meta",content="width=device-width, initial-scale=1.0")
        viewport.attrs["name"] = "viewport"
        soup.head.append(viewport)

        # The stylesheet is linked twice, relative to the page's directory
        # and to its parent - presumably so the same page works both next to
        # styles/ and from inside an archive folder (confirm).
        for stylesheet_href in (html_stylesheet, "../" + html_stylesheet):
            soup.head.append(soup.new_tag('link',href=stylesheet_href,rel='stylesheet'))

        if animations:
            aos_css = soup.new_tag('link',href='https://unpkg.com/aos@2.3.1/dist/aos.css',rel='stylesheet')
            soup.head.append(aos_css)
            aos_js = soup.new_tag('script',src="https://unpkg.com/aos@2.3.1/dist/aos.js")
            soup.head.append(aos_js)
            aos_script = soup.new_tag('script')
            aos_script.string = "AOS.init();"
            soup.body.append(aos_script)

            for feed in rss_feeds:
                # Hand-built guess at the id pandoc gives the "From <feed>"
                # heading. It can differ for names with other punctuation,
                # so a missing heading is skipped instead of crashing.
                heading_id = "from-" + feed.strip().replace(":","").replace(" ","-").lower()
                heading = soup.find("h1", {"id": heading_id})
                if heading is not None:
                    # Was hard-coded to 'fade-right', ignoring the setting.
                    heading['data-aos'] = heading_animation

            top_headings = soup.find_all("h1")
            if top_headings:
                top_headings[0]['data-aos'] = title_animation

            contents_heading = soup.find("h1",{"id":"contents"})
            if contents_heading is not None:
                contents_heading['data-aos'] = heading_animation
                contents_heading['data-aos-anchor-placement'] = "top-bottom"

            for paragraph in soup.find_all("p"):
                paragraph['data-aos'] = list_animation
                paragraph['data-aos-anchor-placement'] = "bottom-bottom"

            for item in soup.find_all("li"):
                # Only list items without a link inside them are animated.
                if item.a is None:
                    item['data-aos'] = list_animation
                    item['data-aos-anchor-placement'] = "bottom-bottom"

        with open(html_name, "w", encoding="utf-8") as outf:
            outf.write(str(soup))

    if update_archive:
        add_today('index.html',archive_configuration[config]["id"],folder=archive_configuration[config]["folder"])