@CONFERENCE\{IMM2017-07029, author = "F. {\AA}. Nielsen and L. K. Hansen", title = "Open semantic analysis: The case of word level semantics in Danish", year = "2017", month = "nov", keywords = "Danish, embedding, word2vec", booktitle = "8th Language \& Technology Conference: Human Language Technologies as a Challenge for Computer Science and Linguistics", volume = "", series = "", editor = "", publisher = "", organization = "", address = "", url = "http://www2.compute.dtu.dk/pubdb/pubs/7029-full.html", abstract = "The present research is motivated by the need for accessible and efficient tools for automated semantic analysis in Danish. We are inter- ested in tools that are completely open, so they can be used by a critical public, in public administration, non-governmental organizations and businesses. We describe data-driven models for Danish semantic relatedness, word intrusion and sentiment prediction. Open Danish corpora were assembled and unsupervised learning implemented for explicit semantic analysis and with Gensim’s Word2vec model. We evaluate the performance of the two models on three different annotated word datasets. We test the semantic representations’ alignment with single word sentiment using supervised learning. We find that logistic regression and large random forests perform well with Word2vec features." }