-
Notifications
You must be signed in to change notification settings - Fork 0
/
application.py
83 lines (71 loc) · 2.15 KB
/
application.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
from flask import Flask,url_for,render_template,request
# NLP Pkgs
from spacy_summarization import text_summarizer
from nltk_summarization import nltk_summarizer
#from gensim.summarization import summarize
import spacy
nlp = spacy.load('en')
import time
#Web scrapping pkg
from bs4 import BeautifulSoup
# from urllib import urlopen
from urllib.request import urlopen
application = app = Flask(__name__)
# Home[2]
#Function
def readingTime(mytext):
total_words = len([token.text for token in nlp(mytext)])
estimated_time = total_words/265.0
return estimated_time
#Fetch data from url
def get_text(url):
page = urlopen(url)
soup = BeautifulSoup(page,"lxml")
#fetch all p tags and put them together
fetched_text = ''.join(map(lambda p:p.text,soup.find_all('p')))
return fetched_text
@app.route('/')
def index():
return render_template('index.html')
@app.route('/analyze', methods=['GET','POST'])
def analyze():
start = time.time()
if request.method == 'POST':
rawtext = request.form['rawtext']
final_reading_time = readingTime(rawtext)
#Summarization
final_summary = text_summarizer(rawtext)
# Time to read
summ_reading_time = readingTime(final_summary)
end = time.time()
final_time = end - start
return render_template('index.html',
ctext = rawtext,
final_summary = final_summary,
final_time = final_time,
final_reading_time = final_reading_time,
summary_reading_time = summ_reading_time)
@app.route('/analyze_url', methods=['GET','POST'])
def analyze_url():
start = time.time()
if request.method == 'POST':
raw_url = request.form['raw_url']
rawtext = get_text(raw_url)
final_reading_time = readingTime(rawtext)
#Summarization
final_summary = text_summarizer(rawtext)
# Time to read
summ_reading_time = readingTime(final_summary)
end = time.time()
final_time = end - start
return render_template('index.html',
ctext = rawtext,
final_summary = final_summary,
final_time = final_time,
final_reading_time = final_reading_time,
summary_reading_time = summ_reading_time)
@app.route('/compare_summary')
def compare_summary():
return render_template('compare_summary.html')
if __name__ == '__main__':
app.run(debug=True)