@conference{1850062862013, author = "Annamaria Mesaros and Toni Heittola and Kalle Palom{\"a}ki", abstract = "A common problem of freely annotated or user contributed audio databases is the high variability of the labels, related to homonyms, synonyms, plurals, etc. Automatically re-labeling audio data based on audio similarity could offer a solution to this problem. This paper studies the relationship between audio and labels in a sound event database, by evaluating semantic similarity of labels of acoustically similar sound event instances. The assumption behind the study is that acoustically similar events are annotated with semantically similar labels. Indeed, for 43% of the tested data, there was at least one in ten acoustically nearest neighbors having a synonym as label, while the closest related term is on average one level higher or lower in the semantic hierarchy.", booktitle = "Proceedings of the 2013 IEEE International Conference on Acoustics, Speech and Signal Processing", doi = "https://dx.doi.org/10.1109/ICASSP.2013.6637761", isbn = "978-1-4799-0356-6", keywords = "audio similarity;semantic similarity;sound events", pages = "813-817", publisher = "IEEE Computer Society", title = "{A}nalysis of acoustic-semantic relationship for diversely annotated real-world audio data", url = "https://www.cs.tut.fi/~mesaros/pubs/mesaros_icassp2013_cr.pdf", year = "2013", }