7
from IPython.display import HTML
8
from tqdm.notebook import tqdm as log_progress
10
from naeval.const import (
11
NEWS, WIKI, FICTION, SOCIAL, POETRY,
15
from naeval.io import (
22
from naeval.record import (
26
from naeval.dataset import sample
27
from naeval.readme import patch_readme
28
from naeval.lemma.datasets import load_dataset
29
from naeval.lemma.markup import (
34
# Directory of the corus-data "gramru" files under the user's home directory.
# NOTE(review): `expanduser` is presumably os.path.expanduser (its import is
# not visible in this chunk) — confirm.
CORUS_DATA_DIR = expanduser('~/proj/corus-data/gramru')
37
'dev/GramEval2020-RuEval2017-Lenta-news-dev.conllu',
38
'train/MorphoRuEval2017-Lenta-train.conllu',
41
'dev/GramEval2020-GSD-wiki-dev.conllu',
42
'train/GramEval2020-GSD-train.conllu'
45
'dev/GramEval2020-SynTagRus-dev.conllu',
46
'train/GramEval2020-SynTagRus-train-v2.conllu',
47
'train/MorphoRuEval2017-JZ-gold.conllu'
50
'dev/GramEval2020-RuEval2017-social-dev.conllu',
51
'train/GramEval2020-Taiga-social-train.conllu',
52
'train/MorphoRuEval2017-VK-gold.conllu'
55
'dev/GramEval2020-Taiga-poetry-dev.conllu',
56
'train/GramEval2020-Taiga-poetry-train.conllu'
60
# The five dataset constants imported from naeval.const, in a fixed order.
DATASETS = [NEWS, WIKI, FICTION, SOCIAL, POETRY]
62
# Lemma data directory inside the local naeval project checkout.
# NOTE(review): how this directory is read or written is not visible in this
# chunk — confirm against the code that uses it.
DATA_DIR = expanduser('~/proj/naeval/data/lemma')
64
# Path to the naeval project's README.md.
# NOTE(review): presumably the file handed to `patch_readme` — confirm.
README = expanduser('~/proj/naeval/README.md')