@inproceedings{d34df823437f4cf68a854deb18fa2ed7,
title = "Euclidean embedding of co-occurrence data",
abstract = "Embedding algorithms search for low dimensional structure in complex data, but most algorithms only handle objects of a single type for which pairwise distances are specified. This paper describes a method for embedding objects of different types, such as images and text, into a single common Euclidean space based on their co-occurrence statistics. The joint distributions are modeled as exponentials of Euclidean distances in the low-dimensional embedding space, which links the problem to convex optimization over positive semidefinite matrices. The local structure of our embedding corresponds to the statistical correlations via random walks in the Euclidean space. We quantify the performance of our method on two text datasets, and show that it consistently and significantly outperforms standard methods of statistical correspondence modeling, such as multidimensional scaling and correspondence analysis.",
author = "Amir Globerson and Gal Chechik and Fernando Pereira and Naftali Tishby",
year = "2005",
language = "אנגלית",
isbn = "0262195348",
series = "Advances in Neural Information Processing Systems",
publisher = "Neural information processing systems foundation",
booktitle = "Advances in Neural Information Processing Systems 17 - Proceedings of the 2004 Conference, NIPS 2004",
note = "null ; Conference date: 13-12-2004 Through 16-12-2004",
}