from src.unmask import umaskall
import ipywidgets as widgets
# Input area, pre-filled with a sample sentence.
text = widgets.Textarea(
    value="it _is a [RB] useful _",
    layout=widgets.Layout(width='100%', height="10em"),
)

# Top-K is exposed twice: a numeric box and a slider whose values are
# linked with jslink so that editing either one updates the other.
top_k = widgets.IntText(
    layout=widgets.Layout(width='10%'),
)
top_k2 = widgets.IntSlider(
    value=10,
    min=1,
    max=100,
    step=1,
    description="Top-K",
    readout=False,
    style={'description_width': 'auto'},
    layout=widgets.Layout(width='90%'),
)
widgets.jslink((top_k2, 'value'), (top_k, 'value'))

# Boolean options forwarded to umaskall() by the "Go" handler.
split_stences = widgets.Checkbox(
    description="stence by stence",
    value=True,
    indent=False,
)
single_mask = widgets.Checkbox(
    description="one blank at a time",
    value=False,
    indent=False,
)
import codecs
# Upload button limited to a single .txt file.
file = widgets.FileUpload(
    accept=".txt",
    multiple=False,
    description="Load File",
)
def on_upload_change(change):
    """Copy an uploaded file into the text area and trigger the "Go" action.

    ``change`` is the notification dict handed over by the widget observer;
    only its ``'owner'`` entry (the upload widget) is used.  Nothing happens
    when the decoded content is empty.
    """
    uploaded_text = get_content(change['owner'])
    if uploaded_text:
        text.value = uploaded_text
        # Behave as if the user had pressed the button themselves.
        on_button_clicked(button)
# Older ipywidgets bump a private ``_counter`` trait on every upload, while
# newer releases no longer define it and only update ``value``.  Observing a
# trait that does not exist never fires, so pick whichever one this widget
# actually has.
file.observe(
    on_upload_change,
    names='_counter' if file.has_trait('_counter') else 'value',
)
def get_content(file):
    """Return the first uploaded file's content decoded as UTF-8 text.

    ``file`` is the upload widget.  Its ``value`` is accepted in two shapes:
    a dict whose values are per-file records, or a sequence of per-file
    records (presumably the ipywidgets 7 and 8 layouts respectively -- verify
    against the installed version).  Each record's ``'content'`` entry holds
    the raw bytes.

    Returns:
        The decoded text, or ``""`` when no file has been uploaded.

    Raises:
        UnicodeDecodeError: if the content is not valid UTF-8.
    """
    uploads = file.value
    # An empty dict/tuple means nothing was uploaded; indexing it would raise
    # StopIteration / IndexError, so report "no content" instead.
    if not uploads:
        return ""
    if isinstance(uploads, dict):
        record = next(iter(uploads.values()))
    else:
        record = uploads[0]
    return codecs.decode(record['content'], encoding="utf-8")
import sys
class MyWriter:
    """Write-only "tee" that sends text to ``sys.stdout`` and to a log file."""

    def __init__(self, file):
        # ``file`` is any object offering write()/flush()/close(), e.g. an
        # open text file.
        self.logfile = file

    def write(self, text):
        """Write ``text`` to the current ``sys.stdout`` and to the log file."""
        sys.stdout.write(text)
        self.logfile.write(text)

    def flush(self):
        """Flush both destinations so callers can treat this as a stream."""
        sys.stdout.flush()
        self.logfile.flush()

    def close(self):
        """Close the log file; ``sys.stdout`` is flushed but left open.

        ``sys.stdout`` is shared by the whole process, so closing it here
        would break every later print.
        """
        sys.stdout.flush()
        self.logfile.close()
# "Go" button that starts a run.
button = widgets.Button(
    icon="arrow-alt-circle-right",
    button_style="success",
    description="Go",
    layout=widgets.Layout(width='30%'),
)

# Output area used to capture what the click handler prints.
out = widgets.Output()
@out.capture()
def on_button_clicked(b):
    """Run ``umaskall`` on the current text with the options from the widgets.

    Output is captured by ``out`` (cleared first) and, through ``MyWriter``,
    also written to ``output-holly_cloze.txt``, which is overwritten on each
    run.  ``b`` is the clicked button and is not used.
    """
    out.clear_output()
    options = {
        "top_k": top_k.value,
        "split_stences": split_stences.value,
        "single_mask": single_mask.value,
    }
    with open("output-holly_cloze.txt", mode='w', encoding="utf-8") as log_file:
        tee = MyWriter(log_file)
        umaskall(text.value, io=tee, **options)
# Arrange the controls in rows: Top-K inputs, option checkboxes, actions.
tpk = widgets.HBox(children=[top_k2, top_k])
chb = widgets.HBox(children=[split_stences, single_mask])
btn = widgets.HBox(children=[button, file])

# Wire the "Go" button to its handler, then render the whole UI.
button.on_click(on_button_clicked)
display(tpk, chb, text, btn, out)
- `_` 开头,如:`It's a _great tool` 或 `It's 1pretty 2useful`
- `|` 表示逻辑或,如:`it is a [RB] useful __.` 或 `[NN|PRP] is [adj]`
- `\`,如:`I am _` 和 `I am _\` 的区别
- `split_stences` 控制自动拆分成单句或段落多次输入

Tag | Description | 释义 | 例子 |
---|---|---|---|
ADJ | adjective | 形容词 | new, good, high, special, big, local |
ADP | adposition | 介词 | on, of, at, with, by, into, under |
ADV | adverb | 副词 | really, already, still, early, now |
CONJ | conjunction | 连词 | and, or, but, if, while, although |
DET | determiner, article | 限定词 | the, a, some, most, every, no, which |
NOUN | noun | 名词 | year, home, costs, time, Africa |
NUM | numeral | 数词 | twenty-four, fourth, 1991, 14:24 |
PRT | particle | 虚词 | at, on, out, over per, that, up, with |
PRON | pronoun | 代词 | he, their, her, its, my, I, us |
VERB | verb | 动词 | is, say, told, given, playing, would |
. | punctuation marks | 标点符号 | . , ; ! |
X | other | 其它 | ersatz, esprit, dunno, gr8, univeristy |

Tag | Description | 释义 | 例子 |
---|---|---|---|
CC | Coordinating conjunction | 连词 | and, or,but, if, while,although |
CD | Cardinal number | 数词 | twenty-four, fourth, 1991,14:24 |
DT | Determiner | 限定词 | the, a, some, most,every, no |
EX | Existential there | 存在量词 | there, there’s |
FW | Foreign word | 外来词 | dolce, ersatz, esprit, quo,maitre |
IN | Preposition or subordinating conjunction | 介词连词 | on, of,at, with,by,into, under |
JJ | Adjective | 形容词 | new,good, high, special, big, local |
JJR | Adjective, comparative | 比较级词语 | bleaker braver breezier briefer brighter brisker |
JJS | Adjective, superlative | 最高级词语 | calmest cheapest choicest classiest cleanest clearest |
LS | List item marker | 标记 | A A. B B. C C. D E F First G H I J K |
MD | Modal | 情态动词 | can cannot could couldn’t |
NN | Noun, singular or mass | 名词 | year,home, costs, time, education |
NNS | Noun, plural | 名词复数 | undergraduates scotches |
NNP | Proper noun, singular | 专有名词 | Alison,Africa,April,Washington |
NNPS | Proper noun, plural | 专有名词复数 | Americans Americas Amharas Amityvilles |
PDT | Predeterminer | 前限定词 | all both half many |
POS | Possessive ending | 所有格标记 | ' 's |
PRP | Personal pronoun | 人称代词 | hers herself him himself hisself |
PRP$ | Possessive pronoun | 所有格 | her his mine my our ours |
RB | Adverb | 副词 | occasionally unabatingly maddeningly |
RBR | Adverb, comparative | 副词比较级 | further gloomier grander |
RBS | Adverb, superlative | 副词最高级 | best biggest bluntest earliest |
RP | Particle | 虚词 | aboard about across along apart |
SYM | Symbol | 符号 | % & ’ ” ”. ) ) |
TO | to | 词to | to |
UH | Interjection | 感叹词 | Goodbye Goody Gosh Wow |
VB | Verb, base form | 动词 | ask assemble assess |
VBD | Verb, past tense | 动词过去式 | dipped pleaded swiped |
VBG | Verb, gerund or present participle | 动词现在分词 | telegraphing stirring focusing |
VBN | Verb, past participle | 动词过去分词 | multihulled dilapidated aerosolized |
VBP | Verb, non-3rd person singular present | 动词现在式非第三人称时态 | predominate wrap resort sue |
VBZ | Verb, 3rd person singular present | 动词现在式第三人称时态 | bases reconstructs marks |
WDT | Wh-determiner | Wh限定词 | who,which,when,what,where,how |
WP | Wh-pronoun | WH代词 | that what whatever |
WP$ | Possessive wh-pronoun | WH代词所有格 | whose |
WRB | Wh-adverb | WH副词 |