% Conference contribution by Hagen, Jannidis and Witt in the 2022
% "Graphs and Networks in the Humanities" volume (see booktitle).
% NOTE(review): pages = {7} may be a total page count rather than a page
% range; confirm against the publication before relying on it.
@incollection{HagenJannidisWitt2022,
  author    = {Hagen, Thora and Jannidis, Fotis and Witt, Andreas},
  title     = {Word sense alignment and disambiguation for historical encyclopedias},
  editor    = {Andrews, Tara and Diehr, Franziska and Efer, Thomas and Kuczera, Andreas and van Zundert, Joris},
  booktitle = {Graphs and Networks in the Humanities 2022. Technologies, Models, Analyses, and Visualizations. 6th International Conference, 3. - 4. February 2022, Online},
  publisher = {Leibniz-Institut f{\"u}r Deutsche Sprache (IDS)},
  year      = {2022},
  pages     = {7},
  url       = {https://graphentechnologien.hypotheses.org/files/2022/01/Word_Sense_Alignment_and_Disambiguation_for_Historical_etc-Hagen_Jannidis_Witt.pdf},
  language  = {en},
  subject   = {Semasiologie},
  abstract  = {This paper will address the challenge of creating a knowledge graph from a corpus of historical encyclopedias with a special focus on word sense alignment (WSA) and disambiguation (WSD). More precisely, we examine WSA and WSD approaches based on article similarity to link messy historical data, utilizing Wikipedia as a ground-truth component - as the lack of a critical overlap in content paired with the amount of variation between and within the encyclopedias does not allow for choosing a "baseline" encyclopedia to align the others to. Additionally, we are comparing the disambiguation performance of conservative methods like the Lesk algorithm to more recent approaches, i.e. using language models to disambiguate senses.},
}