-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathhtml_output.py
72 lines (56 loc) · 2.47 KB
/
html_output.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
import html
import sys
import webbrowser
from pathlib import Path

import numpy
import tldextract

import Json_output
#import client
#import html_text
# Name of the generated page, written to the current working directory.
OUTPUT_FILE = 'output_html.html'

# Static page prologue/epilogue. The charset declaration matches the UTF-8
# encoding used when the file is written, so browsers decode it correctly.
PAGE_HEAD = (
    '<html> \n<head>\n'
    '<meta charset="utf-8">\n'
    '<meta name="viewport" content="width=device-width, initial-scale=1.0">\n\n'
    '<link href="https://fonts.googleapis.com/css?family=Open+Sans" rel="stylesheet">\n\n'
    '<link rel="stylesheet" type="text/css" href="style.css">\n</head>\n<body>'
)
PAGE_TAIL = '</body>\n</html>'


def render_article_html(content, site_name):
    """Return the complete HTML page for one parsed article.

    Args:
        content: Mapping produced by ``Json_output.result`` (assumed to be a
            dict-like object supporting ``.get`` -- confirm against that
            module). Only the keys ``title``, ``date_published``, ``author``
            and ``content`` are read; each may be missing, ``None`` or empty,
            in which case the corresponding section is omitted.
        site_name: Display name of the source site; omitted when empty.

    Returns:
        The page markup as a single string.
    """
    pieces = [PAGE_HEAD]

    # Title. Plain-text fields are escaped because they originate from an
    # arbitrary web page and must not be able to inject markup.
    title = content.get('title')
    if title:
        pieces.append(
            '<div class="smart_article_title"><!-- DIV CONTAINER FOR TITLE -->\n'
            '<h1 align="center">%s</h1>\n</div> \n\n' % html.escape(str(title))
        )

    # Source site, publication date and author share one list; the list
    # element itself is always emitted, even when it ends up empty.
    meta_items = []
    if site_name:
        meta_items.append('<li>%s</li>\n' % html.escape(str(site_name)))

    # Values shorter than 9 characters (including str(None)) are treated as
    # "no date". Only the first 10 characters are shown -- presumably the
    # YYYY-MM-DD prefix of an ISO-8601 timestamp; verify against the API.
    published = str(content.get('date_published'))
    if len(published) >= 9:
        meta_items.append('<li>%s</li>\n' % html.escape(published[:10]))

    author = content.get('author')
    if author:
        meta_items.append('<li>%s</li>\n' % html.escape(str(author)))

    pieces.append(
        '<ul class="article_source_date_author">\n%s</ul>\n\n' % ''.join(meta_items)
    )

    # Main article body. This value is inserted verbatim because it is
    # expected to already be HTML markup.
    # NOTE(review): it is therefore trusted as-is; sanitize upstream if the
    # source pages are not trusted.
    body = content.get('content')
    if body:
        pieces.append(
            '<div class="smart_article_content">'
            '<!-- DIV CONTAINER FOR MAIN ARTICLE CONTENT -->\n%s\n</div> \n\n' % body
        )

    pieces.append(PAGE_TAIL)
    return ''.join(pieces)


def main():
    """Prompt for an article URL, render it to a local page and open it.

    Exits with a non-zero status and an error message on stderr when
    ``Json_output.result`` returns ``None``.
    """
    # NOTE(review): this credential is committed to source control; consider
    # rotating it and loading it from configuration instead.
    api_key = 'zEbEqMY846voNjx8urJPNdDW99amKrRnjbLXkZz0'
    url = input('Enter the article url').strip()

    content = Json_output.result(api_key, url)
    if content is None:
        # sys.exit with a string prints it to stderr and exits with status 1.
        sys.exit("ERROR: can't get a valid response from the API")

    # Join only the non-empty parts so a host without a public suffix
    # (e.g. "localhost") does not get a dangling dot.
    extracted = tldextract.extract(url)
    site_name = '.'.join(
        part for part in (extracted.domain, extracted.suffix) if part
    )

    page = render_article_html(content, site_name)

    out_path = Path(OUTPUT_FILE).resolve()
    # The context manager closes the file even if the write fails; the
    # explicit encoding avoids platform-dependent UnicodeEncodeError.
    with open(str(out_path), 'w', encoding='utf-8') as out_file:
        out_file.write(page)

    # webbrowser expects a URL; a bare relative filename is not portable.
    webbrowser.open_new_tab(out_path.as_uri())


if __name__ == '__main__':
    main()