-
Notifications
You must be signed in to change notification settings - Fork 3
/
flask_app.py
132 lines (118 loc) · 4.69 KB
/
flask_app.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
import torch, os, gdown
from flask import Flask, render_template, request, send_from_directory, make_response, jsonify
from pipelines import pipeline
from transformers import AutoTokenizer
from summarizer import Summarizer
app = Flask(__name__)
if os.path.isfile('./models/quant-t5-base.pt'):
pass
else:
print('Downloading models...')
if not os.path.isdir('models'): os.mkdir('models')
url1 = 'https://drive.google.com/uc?id=1-3ahaSJEmQFhFBmHnlze_0xgDjSKlUYN'
url2 = 'https://drive.google.com/uc?id=1-3MCWlC5Cqt6btBQnWtoidLezn4ybwdA'
url3 = 'https://drive.google.com/uc?id=1-IojDSCb9CGG-FqkJn8rWDelCh0QGbBC'
output1 = "models/qa-gen-base-t5.pt"
output2 = "models/quant-t5-base.pt"
output3 = "models/distil-bert-base.pt"
gdown.download(url1, output1, quiet=True)
gdown.download(url2, output2, quiet=True)
gdown.download(url3, output3, quiet=True)
print('Models downloaded..')
device = 'cpu'
print("Device used:", device)
print('Loading models....')
t5_base = torch.load('models/quant-t5-base.pt', map_location=device) # summarizer, text_similarity
Tokenizer1 = AutoTokenizer.from_pretrained("t5-base" )
t5_small_qa_qg = torch.load('models/qa-gen-small-t5.pt', map_location=device) # questions answer generation
Tokenizer2 = AutoTokenizer.from_pretrained("valhalla/t5-small-qa-qg-hl" )
question_generator = pipeline("question-generation", model=t5_small_qa_qg, tokenizer=Tokenizer2,
ans_model=t5_small_qa_qg, ans_tokenizer=Tokenizer2, use_cuda=device)
print('Done!!')
org_answers = []
# capitilize text of summary
def capitilize_text(source):
stop, output = '.', ''
i,j = 0, 0
for i, w in enumerate(source):
if w == stop:
sen = source[j:i+1].capitalize()
j = i+2
output+=sen
output+=source[j:].capitalize()
return output
# summarize text
def get_summary(text):
try:
text = "summarize: "+text
tokenized_text = Tokenizer1.encode(text, return_tensors="pt")
summary_ids = t5_base.generate(tokenized_text, num_beams=4, no_repeat_ngram_size=2,
min_length=30,max_length=1000, early_stopping=True)
output = Tokenizer1.decode(summary_ids[0], skip_special_tokens=True)
except :
print('Error.....')
return output
# questions and answers
def get_questions(text):
result = question_generator(text)
return result
# compare answers by user and model
def comapare_answers(pred_answer):
correct = 0
for i in range(len(org_answers)):
try:
org_answers[i] = "mrpc sentence1: "+org_answers[i] # model answer
pred_answer[i] = ". sentence2: "+pred_answer[i] # user answer
print(org_answers[i], pred_answer[i])
tokenized_text = Tokenizer1.encode(org_answers[i]+pred_answer[i], return_tensors="pt")
summary_ids = t5_base.generate(tokenized_text)
output = Tokenizer1.decode(summary_ids[0], skip_special_tokens=True)
print(output)
if output == 'equivalent':
correct+=1
except:
continue
return correct
@app.route('/', methods=['GET', 'POST'])
# home page
def home():
return render_template('index.html')
@app.route("/generate/summarize", methods=["POST"])
def summarize():
print('Generating SUmmary.....')
req = request.get_json()
summary = get_summary(req['input_text'])
res = make_response(jsonify({"my_summary": capitilize_text(summary)}), 200)
return res
@app.route("/generate/thequestions", methods=["POST"])
def thequestions():
global org_answers
questions = []
req = request.get_json()
print('Generating SUmmary.....')
text = get_summary(req['input_text'])
print('Generating questions.....')
question_answers = get_questions(text)
print(question_answers)
for a in question_answers:
if len(a['question']) < 70:
questions.append(a['question'])
org_answers.append(a['answer'][6:])
res = make_response(jsonify({"my_questions": questions}), 200)
return res
@app.route('/verifyquestions/verifcation', methods=["POST"])
def verifcation():
global org_answers
print('Verifying answers.......')
pred_answers = request.get_json()
correct_ans = comapare_answers(pred_answers['predicted_answers'])
print('Answers verified.......')
correct_ans = 'You answered {} questions correctly!!'.format(correct_ans)
org_answers = []
my_response = make_response(jsonify({"num_of_correct": correct_ans}), 200)
return my_response
@app.route('/favicon.ico')
def favicon():
return send_from_directory(os.path.join(app.root_path, 'static'), 'favicon.ico', mimetype='image/vnd.microsoft.icon')
if __name__ == '__main__':
app.run()