Compare commits
18 Commits
Bug493-Gon
...
master
Author | SHA1 | Date |
---|---|---|
李思楠 | 8cbc7c9a0c | |
丁晟晔 | ff6286cf01 | |
丁晟晔 | 1d7e61d751 | |
顾涵 | 708a6a2821 | |
顾涵 | 688a198768 | |
寻宇灿 | 1543b3095d | |
寻宇灿 | c6bf323c60 | |
寻宇灿 | 03ccb3527a | |
Hui Lan | b41e1044bc | |
Hui Lan | 67e921ba60 | |
Hui Lan | a5c3564f15 | |
Hui Lan | 1295616d5b | |
俞黄焘 | c151a0efaa | |
顾涵 | 030b89706e | |
Hui Lan | 349488167b | |
俞黄焘 | 39d96014d9 | |
顾涵 | acd8db6e3e | |
顾涵 | 9f3f5b43e1 |
|
@ -7,7 +7,7 @@ import random, glob
|
||||||
import hashlib
|
import hashlib
|
||||||
from datetime import datetime
|
from datetime import datetime
|
||||||
from flask import Flask, request, redirect, render_template, url_for, session, abort, flash, get_flashed_messages
|
from flask import Flask, request, redirect, render_template, url_for, session, abort, flash, get_flashed_messages
|
||||||
from difficulty import get_difficulty_level, text_difficulty_level, user_difficulty_level
|
from difficulty import get_difficulty_level_for_user, text_difficulty_level, user_difficulty_level
|
||||||
|
|
||||||
|
|
||||||
path_prefix = '/var/www/wordfreq/wordfreq/'
|
path_prefix = '/var/www/wordfreq/wordfreq/'
|
||||||
|
@ -53,7 +53,7 @@ def get_today_article(user_word_list, visited_articles):
|
||||||
# Choose article according to reader's level
|
# Choose article according to reader's level
|
||||||
d1 = load_freq_history(path_prefix + 'static/frequency/frequency.p')
|
d1 = load_freq_history(path_prefix + 'static/frequency/frequency.p')
|
||||||
d2 = load_freq_history(path_prefix + 'static/words_and_tests.p')
|
d2 = load_freq_history(path_prefix + 'static/words_and_tests.p')
|
||||||
d3 = get_difficulty_level(d1, d2)
|
d3 = get_difficulty_level_for_user(d1, d2)
|
||||||
|
|
||||||
d = None
|
d = None
|
||||||
result_of_generate_article = "not found"
|
result_of_generate_article = "not found"
|
||||||
|
|
|
@ -8,6 +8,7 @@
|
||||||
import pickle
|
import pickle
|
||||||
import math
|
import math
|
||||||
from wordfreqCMD import remove_punctuation, freq, sort_in_descending_order, sort_in_ascending_order
|
from wordfreqCMD import remove_punctuation, freq, sort_in_descending_order, sort_in_ascending_order
|
||||||
|
import snowballstemmer
|
||||||
|
|
||||||
|
|
||||||
def load_record(pickle_fname):
|
def load_record(pickle_fname):
|
||||||
|
@ -17,40 +18,50 @@ def load_record(pickle_fname):
|
||||||
return d
|
return d
|
||||||
|
|
||||||
|
|
||||||
def difficulty_level_from_frequency(word, d):
|
def convert_test_type_to_difficulty_level(d):
|
||||||
level = 1
|
"""
|
||||||
if not word in d:
|
对原本的单词库中的单词进行难度评级
|
||||||
return level
|
:param d: 存储了单词库pickle文件中的单词的字典
|
||||||
|
:return:
|
||||||
|
"""
|
||||||
|
result = {}
|
||||||
|
L = list(d.keys()) # in d, we have test types (e.g., CET4,CET6,BBC) for each word
|
||||||
|
|
||||||
if 'what' in d:
|
for k in L:
|
||||||
ratio = (d['what']+1)/(d[word]+1) # what is a frequent word
|
if 'CET4' in d[k]:
|
||||||
level = math.log( max(ratio, 1), 2)
|
result[k] = 4 # CET4 word has level 4
|
||||||
|
elif 'OXFORD3000' in d[k]:
|
||||||
|
result[k] = 5
|
||||||
|
elif 'CET6' in d[k] or 'GRADUATE' in d[k]:
|
||||||
|
result[k] = 6
|
||||||
|
elif 'OXFORD5000' in d[k] or 'IELTS' in d[k]:
|
||||||
|
result[k] = 7
|
||||||
|
elif 'BBC' in d[k]:
|
||||||
|
result[k] = 8
|
||||||
|
|
||||||
level = min(level, 8)
|
return result # {'apple': 4, ...}
|
||||||
return level
|
|
||||||
|
|
||||||
|
|
||||||
def get_difficulty_level(d1, d2):
|
def get_difficulty_level_for_user(d1, d2):
|
||||||
d = {}
|
"""
|
||||||
L = list(d1.keys()) # in d1, we have frequency for each word
|
d2 来自于词库的35511个已标记单词
|
||||||
L2 = list(d2.keys()) # in d2, we have test types (e.g., CET4,CET6,BBC) for each word
|
d1 用户不会的词
|
||||||
L.extend(L2)
|
在d2的后面添加单词,没有新建一个新的字典
|
||||||
L3 = list(set(L)) # L3 contains all words
|
"""
|
||||||
for k in L3:
|
# TODO: convert_test_type_to_difficulty_level() should not be called every time. Each word's difficulty level should be pre-computed.
|
||||||
if k in d2:
|
d2 = convert_test_type_to_difficulty_level(d2) # 根据d2的标记评级{'apple': 4, 'abandon': 4, ...}
|
||||||
if 'CET4' in d2[k]:
|
stemmer = snowballstemmer.stemmer('english')
|
||||||
d[k] = 4 # CET4 word has level 4
|
|
||||||
elif 'CET6' in d2[k]:
|
|
||||||
d[k] = 6
|
|
||||||
elif 'BBC' in d2[k]:
|
|
||||||
d[k] = 8
|
|
||||||
if k in d1: # BBC could contain easy words that are not in CET4 or CET6. So 4 is not reasonable. Recompute difficulty level.
|
|
||||||
d[k] = min(difficulty_level_from_frequency(k, d1), d[k])
|
|
||||||
elif k in d1:
|
|
||||||
d[k] = difficulty_level_from_frequency(k, d1)
|
|
||||||
|
|
||||||
return d
|
|
||||||
|
|
||||||
|
for k in d1: # 用户的词
|
||||||
|
if k in d2: # 如果用户的词以原型的形式存在于词库d2中
|
||||||
|
continue # 无需评级,跳过
|
||||||
|
else:
|
||||||
|
stem = stemmer.stemWord(k)
|
||||||
|
if stem in d2: # 如果用户的词的词根存在于词库d2的词根库中
|
||||||
|
d2[k] = d2[stem] # 按照词根进行评级
|
||||||
|
else:
|
||||||
|
d2[k] = 3 # 如果k的词根都不在,那么就当认为是3级
|
||||||
|
return d2
|
||||||
|
|
||||||
|
|
||||||
def revert_dict(d):
|
def revert_dict(d):
|
||||||
|
@ -62,9 +73,10 @@ def revert_dict(d):
|
||||||
for k in d:
|
for k in d:
|
||||||
if type(d[k]) is list: # d[k] is a list of dates.
|
if type(d[k]) is list: # d[k] is a list of dates.
|
||||||
lst = d[k]
|
lst = d[k]
|
||||||
elif type(d[k]) is int: # for backward compatibility. d was sth like {'word':1}. The value d[k] is not a list of dates, but a number representing how frequent this word had been added to the new word book.
|
elif type(d[
|
||||||
|
k]) is int: # for backward compatibility. d was sth like {'word':1}. The value d[k] is not a list of dates, but a number representing how frequent this word had been added to the new word book.
|
||||||
freq = d[k]
|
freq = d[k]
|
||||||
lst = freq*['2021082019'] # why choose this date? No particular reason. I fixed the bug on this date.
|
lst = freq * ['2021082019'] # why choose this date? No particular reason. I fixed the bug on this date.
|
||||||
|
|
||||||
for time_info in lst:
|
for time_info in lst:
|
||||||
date = time_info[:10] # until hour
|
date = time_info[:10] # until hour
|
||||||
|
@ -79,7 +91,8 @@ def user_difficulty_level(d_user, d):
|
||||||
d_user2 = revert_dict(d_user) # key is date, and value is a list of words added in that date
|
d_user2 = revert_dict(d_user) # key is date, and value is a list of words added in that date
|
||||||
count = 0
|
count = 0
|
||||||
geometric = 1
|
geometric = 1
|
||||||
for date in sorted(d_user2.keys(), reverse=True): # most recently added words are more important while determining user's level
|
for date in sorted(d_user2.keys(),
|
||||||
|
reverse=True): # most recently added words are more important while determining user's level
|
||||||
lst = d_user2[date] # a list of words
|
lst = d_user2[date] # a list of words
|
||||||
lst2 = [] # a list of tuples, (word, difficulty level)
|
lst2 = [] # a list of tuples, (word, difficulty level)
|
||||||
for word in lst:
|
for word in lst:
|
||||||
|
@ -87,17 +100,17 @@ def user_difficulty_level(d_user, d):
|
||||||
lst2.append((word, d[word]))
|
lst2.append((word, d[word]))
|
||||||
|
|
||||||
lst3 = sort_in_ascending_order(lst2) # easiest tuple first
|
lst3 = sort_in_ascending_order(lst2) # easiest tuple first
|
||||||
#print(lst3)
|
# print(lst3)
|
||||||
for t in lst3:
|
for t in lst3:
|
||||||
word = t[0]
|
word = t[0]
|
||||||
hard = t[1]
|
hard = t[1]
|
||||||
#print('WORD %s HARD %4.2f' % (word, hard))
|
# print('WORD %s HARD %4.2f' % (word, hard))
|
||||||
geometric = geometric * (hard)
|
geometric = geometric * (hard)
|
||||||
count += 1
|
count += 1
|
||||||
if count >= 10:
|
if count >= 10:
|
||||||
return geometric**(1/count)
|
return geometric ** (1 / count)
|
||||||
|
|
||||||
return geometric**(1/max(count,1))
|
return geometric ** (1 / max(count, 1))
|
||||||
|
|
||||||
|
|
||||||
def text_difficulty_level(s, d):
|
def text_difficulty_level(s, d):
|
||||||
|
@ -105,13 +118,14 @@ def text_difficulty_level(s, d):
|
||||||
L = freq(s)
|
L = freq(s)
|
||||||
|
|
||||||
lst = [] # a list of tuples, each tuple being (word, difficulty level)
|
lst = [] # a list of tuples, each tuple being (word, difficulty level)
|
||||||
|
stop_words = {'the':1, 'and':1, 'of':1, 'to':1, 'what':1, 'in':1, 'there':1, 'when':1, 'them':1, 'would':1, 'will':1, 'out':1, 'his':1, 'mr':1, 'that':1, 'up':1, 'more':1, 'your':1, 'it':1, 'now':1, 'very':1, 'then':1, 'could':1, 'he':1, 'any':1, 'some':1, 'with':1, 'into':1, 'you':1, 'our':1, 'man':1, 'other':1, 'time':1, 'was':1, 'than':1, 'know':1, 'about':1, 'only':1, 'like':1, 'how':1, 'see':1, 'is':1, 'before':1, 'such':1, 'little':1, 'two':1, 'its':1, 'as':1, 'these':1, 'may':1, 'much':1, 'down':1, 'for':1, 'well':1, 'should':1, 'those':1, 'after':1, 'same':1, 'must':1, 'say':1, 'first':1, 'again':1, 'us':1, 'great':1, 'where':1, 'being':1, 'come':1, 'over':1, 'good':1, 'himself':1, 'am':1, 'never':1, 'on':1, 'old':1, 'here':1, 'way':1, 'at':1, 'go':1, 'upon':1, 'have':1, 'had':1, 'without':1, 'my':1, 'day':1, 'be':1, 'but':1, 'though':1, 'from':1, 'not':1, 'too':1, 'another':1, 'this':1, 'even':1, 'still':1, 'her':1, 'yet':1, 'under':1, 'by':1, 'let':1, 'just':1, 'all':1, 'because':1, 'we':1, 'always':1, 'off':1, 'yes':1, 'so':1, 'while':1, 'why':1, 'which':1, 'me':1, 'are':1, 'or':1, 'no':1, 'if':1, 'an':1, 'also':1, 'thus':1, 'who':1, 'cannot':1, 'she':1, 'whether':1} # ignore these words while computing the article's difficulty level
|
||||||
for x in L:
|
for x in L:
|
||||||
word = x[0]
|
word = x[0]
|
||||||
if word in d:
|
if word not in stop_words and word in d:
|
||||||
lst.append((word, d[word]))
|
lst.append((word, d[word]))
|
||||||
|
|
||||||
lst2 = sort_in_descending_order(lst) # most difficult words on top
|
lst2 = sort_in_descending_order(lst) # most difficult words on top
|
||||||
#print(lst2)
|
# print(lst2)
|
||||||
count = 0
|
count = 0
|
||||||
geometric = 1
|
geometric = 1
|
||||||
for t in lst2:
|
for t in lst2:
|
||||||
|
@ -120,23 +134,19 @@ def text_difficulty_level(s, d):
|
||||||
geometric = geometric * (hard)
|
geometric = geometric * (hard)
|
||||||
count += 1
|
count += 1
|
||||||
if count >= 20: # we look for n most difficult words
|
if count >= 20: # we look for n most difficult words
|
||||||
return geometric**(1/count)
|
return geometric ** (1 / count)
|
||||||
|
|
||||||
return geometric**(1/max(count,1))
|
|
||||||
|
|
||||||
|
return geometric ** (1 / max(count, 1))
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
|
|
||||||
|
|
||||||
d1 = load_record('frequency.p')
|
d1 = load_record('frequency.p')
|
||||||
#print(d1)
|
# print(d1)
|
||||||
|
|
||||||
d2 = load_record('words_and_tests.p')
|
d2 = load_record('words_and_tests.p')
|
||||||
#print(d2)
|
# print(d2)
|
||||||
|
|
||||||
|
d3 = get_difficulty_level_for_user(d1, d2)
|
||||||
d3 = get_difficulty_level(d1, d2)
|
|
||||||
|
|
||||||
s = '''
|
s = '''
|
||||||
South Lawn
|
South Lawn
|
||||||
|
@ -197,7 +207,6 @@ Amidst the aftermath of this shocking referendum vote, there is great uncertaint
|
||||||
|
|
||||||
'''
|
'''
|
||||||
|
|
||||||
|
|
||||||
s = '''
|
s = '''
|
||||||
British Prime Minister Boris Johnson walks towards a voting station during the Brexit referendum in Britain, June 23, 2016. (Photo: EPA-EFE)
|
British Prime Minister Boris Johnson walks towards a voting station during the Brexit referendum in Britain, June 23, 2016. (Photo: EPA-EFE)
|
||||||
|
|
||||||
|
@ -218,7 +227,6 @@ The prime minister was forced to ask for an extension to Britain's EU departure
|
||||||
Johnson has repeatedly pledged to finalize the first stage, a transition deal, of Britain's EU divorce battle by Oct. 31. A second stage will involve negotiating its future relationship with the EU on trade, security and other salient issues.
|
Johnson has repeatedly pledged to finalize the first stage, a transition deal, of Britain's EU divorce battle by Oct. 31. A second stage will involve negotiating its future relationship with the EU on trade, security and other salient issues.
|
||||||
'''
|
'''
|
||||||
|
|
||||||
|
|
||||||
s = '''
|
s = '''
|
||||||
Thank you very much. We have a Cabinet meeting. We’ll have a few questions after grace. And, if you would, Ben, please do the honors.
|
Thank you very much. We have a Cabinet meeting. We’ll have a few questions after grace. And, if you would, Ben, please do the honors.
|
||||||
|
|
||||||
|
@ -233,17 +241,11 @@ We need — for our farmers, our manufacturers, for, frankly, unions and non-uni
|
||||||
|
|
||||||
'''
|
'''
|
||||||
|
|
||||||
|
# f = open('bbc-fulltext/bbc/entertainment/001.txt')
|
||||||
|
|
||||||
|
|
||||||
#f = open('bbc-fulltext/bbc/entertainment/001.txt')
|
|
||||||
f = open('wordlist.txt')
|
f = open('wordlist.txt')
|
||||||
s = f.read()
|
s = f.read()
|
||||||
f.close()
|
f.close()
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
print(text_difficulty_level(s, d3))
|
print(text_difficulty_level(s, d3))
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -7,6 +7,7 @@ css:
|
||||||
js:
|
js:
|
||||||
head: # 在页面加载之前加载
|
head: # 在页面加载之前加载
|
||||||
- ../static/js/jquery.js
|
- ../static/js/jquery.js
|
||||||
|
- ../static/js/read.js
|
||||||
- ../static/js/word_operation.js
|
- ../static/js/word_operation.js
|
||||||
bottom: # 在页面加载完之后加载
|
bottom: # 在页面加载完之后加载
|
||||||
- ../static/js/fillword.js
|
- ../static/js/fillword.js
|
||||||
|
|
|
@ -1,9 +1,5 @@
|
||||||
let isRead = true;
|
let isRead = true;
|
||||||
let isChoose = true;
|
let isChoose = true;
|
||||||
let reader = window.speechSynthesis; // 全局定义朗读者,以便朗读和暂停
|
|
||||||
let current_position = 0; // 朗读文本的当前位置
|
|
||||||
let original_position = 0; // 朗读文本的初始位置
|
|
||||||
let to_speak = ""; // 朗读的初始内容
|
|
||||||
|
|
||||||
function getWord() {
|
function getWord() {
|
||||||
return window.getSelection ? window.getSelection() : document.selection.createRange().text;
|
return window.getSelection ? window.getSelection() : document.selection.createRange().text;
|
||||||
|
@ -11,7 +7,7 @@ function getWord() {
|
||||||
|
|
||||||
function fillInWord() {
|
function fillInWord() {
|
||||||
let word = getWord();
|
let word = getWord();
|
||||||
if (isRead) read(word);
|
if (isRead) Reader.read(word, inputSlider.value);
|
||||||
if (!isChoose) return;
|
if (!isChoose) return;
|
||||||
const element = document.getElementById("selected-words");
|
const element = document.getElementById("selected-words");
|
||||||
element.value = element.value + " " + word;
|
element.value = element.value + " " + word;
|
||||||
|
@ -19,50 +15,17 @@ function fillInWord() {
|
||||||
|
|
||||||
document.getElementById("text-content").addEventListener("click", fillInWord, false);
|
document.getElementById("text-content").addEventListener("click", fillInWord, false);
|
||||||
|
|
||||||
function makeUtterance(str, rate) {
|
const sliderValue = document.getElementById("rangeValue");
|
||||||
let msg = new SpeechSynthesisUtterance(str);
|
const inputSlider = document.getElementById("rangeComponent");
|
||||||
msg.rate = rate;
|
|
||||||
msg.lang = "en-US"; // TODO: add language options menu
|
|
||||||
msg.onboundary = ev => {
|
|
||||||
if (ev.name == "word") {
|
|
||||||
current_position = ev.charIndex;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
return msg;
|
|
||||||
}
|
|
||||||
|
|
||||||
const sliderValue = document.getElementById("rangeValue"); // 显示值
|
|
||||||
const inputSlider = document.getElementById("rangeComponent"); // 滑块元素
|
|
||||||
inputSlider.oninput = () => {
|
inputSlider.oninput = () => {
|
||||||
let value = inputSlider.value; // 获取滑块的值
|
let value = inputSlider.value;
|
||||||
sliderValue.textContent = value + '×';
|
sliderValue.textContent = value + '×';
|
||||||
if (!reader.speaking) return;
|
|
||||||
reader.cancel();
|
|
||||||
let msg = makeUtterance(to_speak.substring(original_position + current_position), value);
|
|
||||||
original_position = original_position + current_position;
|
|
||||||
current_position = 0;
|
|
||||||
reader.speak(msg);
|
|
||||||
};
|
};
|
||||||
|
|
||||||
function read(s) {
|
|
||||||
to_speak = s.toString();
|
|
||||||
original_position = 0;
|
|
||||||
current_position = 0;
|
|
||||||
let msg = makeUtterance(to_speak, inputSlider.value);
|
|
||||||
reader.speak(msg);
|
|
||||||
}
|
|
||||||
|
|
||||||
function onReadClick() {
|
function onReadClick() {
|
||||||
isRead = !isRead;
|
isRead = !isRead;
|
||||||
if (!isRead) {
|
|
||||||
reader.cancel();
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
function onChooseClick() {
|
function onChooseClick() {
|
||||||
isChoose = !isChoose;
|
isChoose = !isChoose;
|
||||||
}
|
}
|
||||||
|
|
||||||
function stopRead() {
|
|
||||||
reader.cancel();
|
|
||||||
}
|
|
|
@ -0,0 +1,35 @@
|
||||||
|
var Reader = (function() {
|
||||||
|
let reader = window.speechSynthesis;
|
||||||
|
let current_position = 0;
|
||||||
|
let original_position = 0;
|
||||||
|
let to_speak = "";
|
||||||
|
|
||||||
|
function makeUtterance(str, rate) {
|
||||||
|
let msg = new SpeechSynthesisUtterance(str);
|
||||||
|
msg.rate = rate;
|
||||||
|
msg.lang = "en-US";
|
||||||
|
msg.onboundary = ev => {
|
||||||
|
if (ev.name == "word") {
|
||||||
|
current_position = ev.charIndex;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return msg;
|
||||||
|
}
|
||||||
|
|
||||||
|
function read(s, rate) {
|
||||||
|
to_speak = s.toString();
|
||||||
|
original_position = 0;
|
||||||
|
current_position = 0;
|
||||||
|
let msg = makeUtterance(to_speak, rate);
|
||||||
|
reader.speak(msg);
|
||||||
|
}
|
||||||
|
|
||||||
|
function stopRead() {
|
||||||
|
reader.cancel();
|
||||||
|
}
|
||||||
|
|
||||||
|
return {
|
||||||
|
read: read,
|
||||||
|
stopRead: stopRead
|
||||||
|
};
|
||||||
|
})();
|
|
@ -62,6 +62,13 @@ function delete_word(theWord) {
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
|
|
||||||
|
function read_word(theWord) {
|
||||||
|
let to_speak = $("#word_" + theWord).text();
|
||||||
|
original_position = 0;
|
||||||
|
current_position = 0;
|
||||||
|
Reader.read(to_speak, inputSlider.value);
|
||||||
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* interface Word {
|
* interface Word {
|
||||||
* word: string,
|
* word: string,
|
||||||
|
@ -95,6 +102,7 @@ function wordTemplate(word) {
|
||||||
<a class="btn btn-success" onclick="familiar('${word.word}')" role="button">熟悉</a>
|
<a class="btn btn-success" onclick="familiar('${word.word}')" role="button">熟悉</a>
|
||||||
<a class="btn btn-warning" onclick="unfamiliar('${word.word}')" role="button">不熟悉</a>
|
<a class="btn btn-warning" onclick="unfamiliar('${word.word}')" role="button">不熟悉</a>
|
||||||
<a class="btn btn-danger" onclick="delete_word('${word.word}')" role="button">删除</a>
|
<a class="btn btn-danger" onclick="delete_word('${word.word}')" role="button">删除</a>
|
||||||
|
<a class="btn btn-info" onclick="read_word('${word.word}')" role="button">朗读</a>
|
||||||
</p>`;
|
</p>`;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
Binary file not shown.
|
@ -5,6 +5,8 @@
|
||||||
<meta name="viewport"
|
<meta name="viewport"
|
||||||
content="width=device-width, initial-scale=1.0, minimum-scale=0.5, maximum-scale=3.0, user-scalable=yes"/>
|
content="width=device-width, initial-scale=1.0, minimum-scale=0.5, maximum-scale=3.0, user-scalable=yes"/>
|
||||||
<meta name="format-detection" content="telephone=no"/>
|
<meta name="format-detection" content="telephone=no"/>
|
||||||
|
<link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.1/dist/css/bootstrap.min.css" rel="stylesheet">
|
||||||
|
<script src="https://cdn.jsdelivr.net/npm/bootstrap@5.3.1/dist/js/bootstrap.bundle.min.js"></script>
|
||||||
|
|
||||||
{{ yml['header'] | safe }}
|
{{ yml['header'] | safe }}
|
||||||
{% if yml['css']['item'] %}
|
{% if yml['css']['item'] %}
|
||||||
|
@ -26,12 +28,40 @@
|
||||||
}
|
}
|
||||||
|
|
||||||
@keyframes shakes {
|
@keyframes shakes {
|
||||||
10%, 90% { transform: translate3d(-1px, 0, 0); }
|
10%, 90% {
|
||||||
20%, 50% { transform: translate3d(+2px, 0, 0); }
|
transform: translate3d(-1px, 0, 0);
|
||||||
30%, 70% { transform: translate3d(-4px, 0, 0); }
|
|
||||||
40%, 60% { transform: translate3d(+4px, 0, 0); }
|
|
||||||
50% { transform: translate3d(-4px, 0, 0); }
|
|
||||||
}
|
}
|
||||||
|
20%, 50% {
|
||||||
|
transform: translate3d(+2px, 0, 0);
|
||||||
|
}
|
||||||
|
30%, 70% {
|
||||||
|
transform: translate3d(-4px, 0, 0);
|
||||||
|
}
|
||||||
|
40%, 60% {
|
||||||
|
transform: translate3d(+4px, 0, 0);
|
||||||
|
}
|
||||||
|
50% {
|
||||||
|
transform: translate3d(-4px, 0, 0);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
.lead {
|
||||||
|
font-size: 22px;
|
||||||
|
font-family: Helvetica, sans-serif;
|
||||||
|
white-space: pre-wrap;
|
||||||
|
}
|
||||||
|
|
||||||
|
.arrow {
|
||||||
|
padding: 0;
|
||||||
|
font-size: 20px;
|
||||||
|
line-height: 21px;
|
||||||
|
display: inline-block;
|
||||||
|
}
|
||||||
|
|
||||||
|
.arrow:hover {
|
||||||
|
cursor: pointer;
|
||||||
|
}
|
||||||
|
|
||||||
</style>
|
</style>
|
||||||
</head>
|
</head>
|
||||||
<body>
|
<body>
|
||||||
|
@ -45,47 +75,64 @@
|
||||||
<a class="btn btn-secondary" href="/reset" role="button" onclick="stopRead()">重设密码</a>
|
<a class="btn btn-secondary" href="/reset" role="button" onclick="stopRead()">重设密码</a>
|
||||||
|
|
||||||
</p>
|
</p>
|
||||||
{# {% for message in flashed_messages %}#} {# 根据user_service.userpage,取消了参数flashed_messages,因此注释了这段代码 #}
|
{% for message in get_flashed_messages() %}
|
||||||
{# <div class="alert alert-warning" role="alert">Congratulations! {{ message }}</div>#}
|
<div class="alert alert-warning alert-dismissible fade show" role="alert">
|
||||||
{# {% endfor %}#}
|
{{ message }}
|
||||||
|
<button type="button" class="btn-close" data-bs-dismiss="alert" aria-label="Close"></button>
|
||||||
|
</div>
|
||||||
|
{% endfor %}
|
||||||
|
|
||||||
<button class="btn btn-success" id="load_next_article" onclick="load_next_article()"> 下一篇 Next Article </button>
|
<button class="arrow" id="load_next_article" onclick="load_next_article();Reader.stopRead()"
|
||||||
<button class="btn btn-success" id="load_pre_article" onclick="load_pre_article()" > 上一篇 Previous Article </button>
|
title="下一篇 Next Article">⇨
|
||||||
|
</button>
|
||||||
|
<button class="arrow" id="load_pre_article" onclick="load_pre_article();Reader.stopRead()" style="display: none"
|
||||||
|
title="上一篇 Previous Article">⇦
|
||||||
|
</button>
|
||||||
|
|
||||||
<p><b>阅读文章并回答问题</b></p>
|
<p><b>阅读文章并回答问题</b></p>
|
||||||
<div id="text-content">
|
<div id="text-content">
|
||||||
<div id="found">
|
<div id="found">
|
||||||
<div class="alert alert-success" role="alert">According to your word list, your level is <span class="badge bg-success" id="user-level">{{ today_article["user_level"] }}</span> and we have chosen an article with a difficulty level of <span class="badge bg-success" id="text_level">{{ today_article["text_level"] }}</span> for you.</div>
|
<div class="alert alert-success" role="alert">According to your word list, your level is <span
|
||||||
|
class="text-decoration-underline" id="user_level">{{ today_article["user_level"] }}</span> and we
|
||||||
|
have chosen an article with a difficulty level of <span class="text-decoration-underline"
|
||||||
|
id="text_level">{{ today_article["text_level"] }}</span>
|
||||||
|
for you.
|
||||||
|
</div>
|
||||||
<p class="text-muted" id="date">Article added on: {{ today_article["date"] }}</p><br/>
|
<p class="text-muted" id="date">Article added on: {{ today_article["date"] }}</p><br/>
|
||||||
<div class="p-3 mb-2 bg-light text-dark"><br/>
|
<div class="p-3 mb-2 bg-light text-dark" style="margin: 0 0.5%;"><br/>
|
||||||
<p class="display-5" id="article_title">{{ today_article["article_title"] }}</p><br/>
|
<p class="display-6" id="article_title">{{ today_article["article_title"] }}</p><br/>
|
||||||
<p class="lead"><font id="article" size=2>{{ today_article["article_body"] }}</font></p><br/>
|
<p class="lead"><font id="article">{{ today_article["article_body"] }}</font></p><br/>
|
||||||
|
<div>
|
||||||
<p><small class="text-muted" id="source">{{ today_article['source'] }}</small></p><br/>
|
<p><small class="text-muted" id="source">{{ today_article['source'] }}</small></p><br/>
|
||||||
|
</div>
|
||||||
|
|
||||||
<p><b id="question">{{ today_article['question'] }}</b></p><br/>
|
<p><b id="question">{{ today_article['question'] }}</b></p><br/>
|
||||||
<script type="text/javascript">
|
<script type="text/javascript">
|
||||||
function toggle_visibility(id) { {# https://css-tricks.com/snippets/javascript/showhide-element/#}
|
function toggle_visibility(id) { {# https://css-tricks.com/snippets/javascript/showhide-element/#}
|
||||||
const e = document.getElementById(id);
|
const e = document.getElementById(id);
|
||||||
if(e.style.display === 'block')
|
if (e.style.display === 'block')
|
||||||
e.style.display = 'none';
|
e.style.display = 'none';
|
||||||
else
|
else
|
||||||
e.style.display = 'block';
|
e.style.display = 'block';
|
||||||
}
|
}
|
||||||
</script>
|
</script>
|
||||||
<button onclick="toggle_visibility('answer');">ANSWER</button>
|
<button onclick="toggle_visibility('answer');">ANSWER</button>
|
||||||
<div id="answer" style="display:none;">{{ today_article['answer'] }}</div><br/>
|
<div id="answer" style="display:none;">{{ today_article['answer'] }}</div>
|
||||||
|
<br/>
|
||||||
</div>
|
</div>
|
||||||
</div>
|
</div>
|
||||||
<div class="alert alert-success" role="alert" id="not_found" style="display:none;">
|
<div class="alert alert-success" role="alert" id="not_found" style="display:none;">
|
||||||
<p class="text-muted"><span class="badge bg-success">Notes:</span><br>No article is currently available for you. You can try again a few times or mark new words in the passage to improve your level.</p>
|
<p class="text-muted"><span class="badge bg-success">Notes:</span><br>No article is currently available for
|
||||||
|
you. You can try again a few times or mark new words in the passage to improve your level.</p>
|
||||||
</div>
|
</div>
|
||||||
<div class="alert alert-success" role="alert" id="read_all" style="display:none;">
|
<div class="alert alert-success" role="alert" id="read_all" style="display:none;">
|
||||||
<p class="text-muted"><span class="badge bg-success">Notes:</span><br>You've read all the articles.</p>
|
<p class="text-muted"><span class="badge bg-success">Notes:</span><br>You've read all the articles.</p>
|
||||||
</div>
|
</div>
|
||||||
</div>
|
</div>
|
||||||
|
|
||||||
<input type="checkbox" onclick="toggleHighlighting()" checked/>生词高亮
|
<input type="checkbox" id="highlightCheckbox" onclick="toggleHighlighting()"/>生词高亮
|
||||||
<input type="checkbox" onclick="onReadClick()" checked/>大声朗读
|
<input type="checkbox" id="readCheckbox" onclick="onReadClick()"/>大声朗读
|
||||||
<input type="checkbox" onclick="onChooseClick()" checked/>划词入库
|
<input type="checkbox" id="chooseCheckbox" onclick="onChooseClick()"/>划词入库
|
||||||
<div class="range">
|
<div class="range">
|
||||||
<div class="field">
|
<div class="field">
|
||||||
<div class="sliderValue">
|
<div class="sliderValue">
|
||||||
|
@ -97,8 +144,8 @@
|
||||||
<p><b>收集生词吧</b> (可以在正文中划词,也可以复制黏贴)</p>
|
<p><b>收集生词吧</b> (可以在正文中划词,也可以复制黏贴)</p>
|
||||||
<form method="post" action="/{{ username }}/userpage">
|
<form method="post" action="/{{ username }}/userpage">
|
||||||
<textarea name="content" id="selected-words" rows="10" cols="120"></textarea><br/>
|
<textarea name="content" id="selected-words" rows="10" cols="120"></textarea><br/>
|
||||||
<input type="submit" value="把生词加入我的生词库"/>
|
<button class="btn btn-primary btn-lg" type="submit" onclick="Reader.stopRead()">把生词加入我的生词库</button>
|
||||||
<input type="reset" value="清除"/>
|
<button class="btn btn-primary btn-lg" type="reset" onclick="clearSelectedWords()">清除</button>
|
||||||
</form>
|
</form>
|
||||||
{% if session.get['thisWord'] %}
|
{% if session.get['thisWord'] %}
|
||||||
<script type="text/javascript">
|
<script type="text/javascript">
|
||||||
|
@ -126,13 +173,15 @@
|
||||||
{% set freq = x[1] %}
|
{% set freq = x[1] %}
|
||||||
{% if session.get('thisWord') == x[0] and session.get('time') == 1 %}
|
{% if session.get('thisWord') == x[0] and session.get('time') == 1 %}
|
||||||
{% endif %}
|
{% endif %}
|
||||||
<p id='p_{{ word }}' class="new-word" >
|
<p id='p_{{ word }}' class="new-word">
|
||||||
<a id="word_{{ word }}" class="btn btn-light" href='http://youdao.com/w/eng/{{ word }}/#keyfrom=dict2.index'
|
<a id="word_{{ word }}" class="btn btn-light"
|
||||||
|
href='http://youdao.com/w/eng/{{ word }}/#keyfrom=dict2.index'
|
||||||
role="button">{{ word }}</a>
|
role="button">{{ word }}</a>
|
||||||
( <a id="freq_{{ word }}" title="{{ word }}">{{ freq }}</a> )
|
( <a id="freq_{{ word }}" title="{{ word }}">{{ freq }}</a> )
|
||||||
<a class="btn btn-success" onclick="familiar('{{ word }}')" role="button">熟悉</a>
|
<a class="btn btn-success" onclick="familiar('{{ word }}')" role="button">熟悉</a>
|
||||||
<a class="btn btn-warning" onclick="unfamiliar('{{ word }}')" role="button">不熟悉</a>
|
<a class="btn btn-warning" onclick="unfamiliar('{{ word }}')" role="button">不熟悉</a>
|
||||||
<a class="btn btn-danger" onclick="delete_word('{{ word }}')" role="button">删除</a>
|
<a class="btn btn-danger" onclick="delete_word('{{ word }}')" role="button">删除</a>
|
||||||
|
<a class="btn btn-info" onclick="read_word('{{ word }}')" role="button">朗读</a>
|
||||||
</p>
|
</p>
|
||||||
{% endfor %}
|
{% endfor %}
|
||||||
</div>
|
</div>
|
||||||
|
@ -146,60 +195,127 @@
|
||||||
{% endfor %}
|
{% endfor %}
|
||||||
{% endif %}
|
{% endif %}
|
||||||
<script type="text/javascript">
|
<script type="text/javascript">
|
||||||
function load_next_article(){
|
window.onload = function () { // 页面加载时执行
|
||||||
|
const settings = {
|
||||||
|
// initialize settings from localStorage
|
||||||
|
highlightChecked: localStorage.getItem('highlightChecked') !== 'false', // localStorage stores strings, default to true. same below
|
||||||
|
readChecked: localStorage.getItem('readChecked') !== 'false',
|
||||||
|
chooseChecked: localStorage.getItem('chooseChecked') !== 'false',
|
||||||
|
rangeValue: localStorage.getItem('rangeValue') || '1',
|
||||||
|
selectedWords: localStorage.getItem('selectedWords') || ''
|
||||||
|
};
|
||||||
|
|
||||||
|
const elements = {
|
||||||
|
highlightCheckbox: document.querySelector('#highlightCheckbox'),
|
||||||
|
readCheckbox: document.querySelector('#readCheckbox'),
|
||||||
|
chooseCheckbox: document.querySelector('#chooseCheckbox'),
|
||||||
|
rangeComponent: document.querySelector('#rangeComponent'),
|
||||||
|
rangeValueDisplay: document.querySelector('#rangeValue'),
|
||||||
|
selectedWordsInput: document.querySelector('#selected-words')
|
||||||
|
};
|
||||||
|
// 应用设置到页面元素
|
||||||
|
elements.highlightCheckbox.checked = settings.highlightChecked;
|
||||||
|
elements.readCheckbox.checked = settings.readChecked;
|
||||||
|
elements.chooseCheckbox.checked = settings.chooseChecked;
|
||||||
|
elements.rangeComponent.value = settings.rangeValue;
|
||||||
|
elements.rangeValueDisplay.textContent = `${settings.rangeValue}x`;
|
||||||
|
elements.selectedWordsInput.value = settings.selectedWords;
|
||||||
|
|
||||||
|
// 刷新页面或进入页面时判断,若不是首篇文章,则上一篇按钮可见
|
||||||
|
if (sessionStorage.getItem('pre_page_button') !== 'display' && sessionStorage.getItem('pre_page_button')) {
|
||||||
|
$('#load_pre_article').show();
|
||||||
|
}
|
||||||
|
|
||||||
|
// 事件监听器
|
||||||
|
elements.selectedWordsInput.addEventListener('input', () => {
|
||||||
|
localStorage.setItem('selectedWords', elements.selectedWordsInput.value);
|
||||||
|
});
|
||||||
|
|
||||||
|
elements.rangeComponent.addEventListener('input', () => {
|
||||||
|
const rangeValue = elements.rangeComponent.value;
|
||||||
|
elements.rangeValueDisplay.textContent = `${rangeValue}x`;
|
||||||
|
localStorage.setItem('rangeValue', rangeValue);
|
||||||
|
});
|
||||||
|
};
|
||||||
|
|
||||||
|
// Forget the saved word selection: remove the 'selectedWords' entry from
// localStorage and blank the #selected-words input on the page.
function clearSelectedWords() {
    const wordsInput = document.querySelector('#selected-words');
    localStorage.removeItem('selectedWords');
    wordsInput.value = '';
}
|
||||||
|
|
||||||
|
|
||||||
|
function load_next_article() {
|
||||||
|
$("#load_next_article").prop("disabled", true)
|
||||||
$.ajax({
|
$.ajax({
|
||||||
url: '/get_next_article/{{username}}',
|
url: '/get_next_article/{{username}}',
|
||||||
dataType: 'json',
|
dataType: 'json',
|
||||||
success: function(data) {
|
success: function (data) {
|
||||||
// 更新页面内容
|
// 更新页面内容
|
||||||
if(data['today_article']){
|
if (data['today_article']) {
|
||||||
update(data['today_article']);
|
update(data['today_article']);
|
||||||
check_pre(data['visited_articles']);
|
check_pre(data['visited_articles']);
|
||||||
check_next(data['result_of_generate_article']);
|
check_next(data['result_of_generate_article']);
|
||||||
}
|
}
|
||||||
|
}, complete: function (xhr, status) {
|
||||||
|
$("#load_next_article").prop("disabled", false)
|
||||||
}
|
}
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
function load_pre_article(){
|
|
||||||
|
function load_pre_article() {
|
||||||
$.ajax({
|
$.ajax({
|
||||||
url: '/get_pre_article/{{username}}',
|
url: '/get_pre_article/{{username}}',
|
||||||
dataType: 'json',
|
dataType: 'json',
|
||||||
success: function(data) {
|
success: function (data) {
|
||||||
// 更新页面内容
|
// 更新页面内容
|
||||||
if(data['today_article']){
|
if (data['today_article']) {
|
||||||
update(data['today_article']);
|
update(data['today_article']);
|
||||||
check_pre(data['visited_articles']);
|
check_pre(data['visited_articles']);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
function update(today_article){
|
|
||||||
$('#user-level').html(today_article['user_level']);
|
function update(today_article) {
|
||||||
|
$('#user_level').html(today_article['user_level']);
|
||||||
$('#text_level').html(today_article["text_level"]);
|
$('#text_level').html(today_article["text_level"]);
|
||||||
$('#date').html('Article added on: '+today_article["date"]);
|
$('#date').html('Article added on: ' + today_article["date"]);
|
||||||
$('#article_title').html(today_article["article_title"]);
|
$('#article_title').html(today_article["article_title"]);
|
||||||
$('#article').html(today_article["article_body"]);
|
$('#article').html(today_article["article_body"]);
|
||||||
$('#source').html(today_article['source']);
|
$('#source').html(today_article['source']);
|
||||||
$('#question').html(today_article["question"]);
|
$('#question').html(today_article["question"]);
|
||||||
$('#answer').html(today_article["answer"]);
|
$('#answer').html(today_article["answer"]);
|
||||||
|
document.querySelector('#text_level').classList.add('mark'); // highlight text difficult level for 2 seconds
|
||||||
|
setTimeout(() => {
|
||||||
|
document.querySelector('#text_level').classList.remove('mark');
|
||||||
|
}, 2000);
|
||||||
|
document.querySelector('#user_level').classList.add('mark'); // do the same thing for user difficulty level
|
||||||
|
setTimeout(() => {
|
||||||
|
document.querySelector('#user_level').classList.remove('mark');
|
||||||
|
}, 2000);
|
||||||
}
|
}
|
||||||
<!-- 检查是否存在上一篇或下一篇,不存在则对应按钮隐藏-->
|
|
||||||
function check_pre(visited_articles){
|
// Check whether a previous or next article exists; if not, hide the corresponding button
|
||||||
if((visited_articles=='')||(visited_articles['index']<=0)){
|
function check_pre(visited_articles) {
|
||||||
|
if ((visited_articles == '') || (visited_articles['index'] <= 0)) {
|
||||||
$('#load_pre_article').hide();
|
$('#load_pre_article').hide();
|
||||||
}else{
|
sessionStorage.setItem('pre_page_button', 'display')
|
||||||
|
} else {
|
||||||
$('#load_pre_article').show();
|
$('#load_pre_article').show();
|
||||||
|
sessionStorage.setItem('pre_page_button', 'show')
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
function check_next(result_of_generate_article){
|
|
||||||
if(result_of_generate_article == "found"){
|
function check_next(result_of_generate_article) {
|
||||||
$('#found').show();$('#not_found').hide();
|
if (result_of_generate_article == "found") {
|
||||||
|
$('#found').show();
|
||||||
|
$('#not_found').hide();
|
||||||
$('#read_all').hide();
|
$('#read_all').hide();
|
||||||
}else if(result_of_generate_article == "not found"){
|
} else if (result_of_generate_article == "not found") {
|
||||||
$('#found').hide();
|
$('#found').hide();
|
||||||
$('#not_found').show();
|
$('#not_found').show();
|
||||||
$('#read_all').hide();
|
$('#read_all').hide();
|
||||||
}else{
|
} else {
|
||||||
$('#found').hide();
|
$('#found').hide();
|
||||||
$('#not_found').hide();
|
$('#not_found').hide();
|
||||||
$('#read_all').show();
|
$('#read_all').show();
|
||||||
|
|
|
@ -0,0 +1,85 @@
|
||||||
|
''' Contributed by Lin Junhong et al. 2023-06.'''
|
||||||
|
|
||||||
|
from selenium import webdriver
|
||||||
|
from selenium.webdriver.common.desired_capabilities import DesiredCapabilities
|
||||||
|
|
||||||
|
from selenium.webdriver.support.ui import WebDriverWait
|
||||||
|
from selenium.webdriver.support import expected_conditions as EC
|
||||||
|
from selenium.common.exceptions import UnexpectedAlertPresentException, NoAlertPresentException
|
||||||
|
import random, time
|
||||||
|
import string
|
||||||
|
|
||||||
|
# Initialize the webdriver.
# Alternative kept for reference: connect to a remote Selenium server instead
# of launching a local chromedriver.
# driver = webdriver.Remote('http://localhost:4444/wd/hub', DesiredCapabilities.CHROME)
# driver.implicitly_wait(10)
# A raw string is used so every backslash in the Windows path is literal; the
# previous literal relied on invalid escape sequences (\A, \L, \P), which
# newer Python versions warn about. The resulting path is unchanged.
# NOTE(review): this path is machine-specific — adjust it to the local chromedriver location.
driver = webdriver.Chrome(r"C:\Users\12993\AppData\Local\Programs\Python\Python38\chromedriver.exe")
|
||||||
|
|
||||||
|
|
||||||
|
def test_next_article():
    """Log in at http://118.25.96.118:90 and click "next article" 50 times.

    Uses the module-level ``driver``. Failed assertions and Selenium errors
    propagate to the test runner; they were previously caught and printed,
    which made the test pass no matter what happened.

    NOTE(review): presumably the account 'abcdefg' already exists on that
    server — confirm before relying on this test.
    """
    driver.get("http://118.25.96.118:90")
    assert 'English Pal -' in driver.page_source

    # Open the login page through the '登录' (log in) link.
    driver.find_element_by_link_text('登录').click()

    uname = 'abcdefg'
    password = 'abcdefg'
    driver.find_element_by_id('username').send_keys(uname)
    driver.find_element_by_id('password').send_keys(password)
    driver.find_element_by_xpath('/html/body/div/button').click()  # the login button

    time.sleep(0.5)  # short pause before checking the page title
    assert 'EnglishPal Study Room for ' + uname in driver.title

    # Click the "next article" button repeatedly with a short pause between
    # clicks; the element is looked up again on every iteration.
    for _ in range(50):
        time.sleep(0.1)
        driver.find_element_by_xpath('//*[@id="load_next_article"]').click()
|
||||||
|
|
||||||
|
|
||||||
|
def test_local_next_article():
    """Register on http://127.0.0.1:5000 and click "next article" 50 times.

    Uses the module-level ``driver``. Failed assertions and Selenium errors
    propagate to the test runner; they were previously caught and printed,
    which made the test pass no matter what happened.
    """
    # Imported locally: WebDriverWait.until() raises TimeoutException when the
    # awaited condition does not become true in time.
    from selenium.common.exceptions import TimeoutException

    driver.get("http://127.0.0.1:5000")
    assert 'English Pal -' in driver.page_source

    # Open the sign-up page through the '注册' (register) link.
    driver.find_element_by_link_text('注册').click()

    uname = 'abcdefg'
    password = 'abcdefg'
    driver.find_element_by_id('username').send_keys(uname)
    driver.find_element_by_id('password').send_keys(password)
    driver.find_element_by_id('password2').send_keys(password)  # password confirmation

    time.sleep(0.5)
    driver.find_element_by_class_name('btn').click()  # the submit button
    time.sleep(0.5)

    # Accept an alert if one shows up within a second. The absence of an alert
    # is not an error, so the wait's timeout is ignored along with the
    # alert-related exceptions.
    try:
        WebDriverWait(driver, 1).until(EC.alert_is_present())
        driver.switch_to.alert.accept()
    except (TimeoutException, UnexpectedAlertPresentException, NoAlertPresentException):
        pass

    time.sleep(0.5)
    assert 'EnglishPal Study Room for ' + uname in driver.title

    # Click the "next article" button repeatedly with a short pause between
    # clicks; the element is looked up again on every iteration.
    for _ in range(50):
        time.sleep(0.1)
        driver.find_element_by_xpath('//*[@id="load_next_article"]').click()
|
|
@ -39,7 +39,7 @@ def file2str(fname):#文件转字符
|
||||||
|
|
||||||
|
|
||||||
def remove_punctuation(s): # 这里是s是形参 (parameter)。函数被调用时才给s赋值。
|
def remove_punctuation(s): # 这里是s是形参 (parameter)。函数被调用时才给s赋值。
|
||||||
special_characters = '\_©~<=>+-/[]*&$%^@.,?!:;#()"“”—‘’{}|' # 把里面的字符都去掉
|
special_characters = '\_©~<=>+/[]*&$%^@.,?!:;#()"“”—‘’{}|' # 把里面的字符都去掉
|
||||||
for c in special_characters:
|
for c in special_characters:
|
||||||
s = s.replace(c, ' ') # 防止出现把 apple,apple 移掉逗号后变成 appleapple 情况
|
s = s.replace(c, ' ') # 防止出现把 apple,apple 移掉逗号后变成 appleapple 情况
|
||||||
s = s.replace('--', ' ')
|
s = s.replace('--', ' ')
|
||||||
|
|
|
@ -1,4 +1,8 @@
|
||||||
Flask==1.1.2
|
Flask==2.0.3
|
||||||
selenium==3.141.0
|
selenium==3.141.0
|
||||||
PyYAML~=6.0
|
PyYAML~=6.0
|
||||||
pony==0.7.16
|
pony==0.7.16
|
||||||
|
snowballstemmer==2.2.0
|
||||||
|
Werkzeug==2.2.2
|
||||||
|
|
||||||
|
pytest~=8.1.1
|
Loading…
Reference in New Issue