% Kocoń and Gawor (2018), Schedae Informaticae, vol. 27, pp. 93--106.
% The citation key is an opaque UUID and is kept unchanged so existing citations still resolve.
% Acronyms and proper nouns in the title are brace-protected against style-driven lowercasing.
@article{7def8004-8d87-4f98-b356-2afd61be8d6a,
  author   = {Kocoń, Jan and Gawor, Michał},
  title    = {Evaluating {KGR10} {Polish} Word Embeddings in the Recognition of Temporal Expressions Using {BiLSTM-CRF}},
  journal  = {Schedae Informaticae},
  volume   = {27},
  year     = {2018},
  pages    = {93--106},
  issn     = {1732-3916},
  doi      = {10.4467/20838476SI.18.008.10413},
  url      = {https://ejournals.eu/en/journal/schedae-informaticae/article/evaluating-kgr10-polish-word-embeddings-in-the-recognition-of-temporal-expressions-using-bilstm-crf},
  keywords = {word embeddings; temporal expressions; recognition; TimeML; CRF; LSTM; BiLSTM; KGR10; FastText},
  abstract = {The article introduces a new set of Polish word embeddings, built using KGR10 corpus, which contains more than 4 billion words. These embeddings are evaluated in the problem of recognition of temporal expressions (timexes) for the Polish language. We described the process of KGR10 corpus creation and a new approach to the recognition problem using Bidirectional Long-Short Term Memory (BiLSTM) network with additional CRF layer, where specific embeddings are essential. We presented experiments and conclusions drawn from them.},
}