The t-distributed Stochastic Neighbor Embedding (tSNE) algorithm has become
in recent years one of the most used and insightful techniques for the
exploratory data analysis of high-dimensional data. tSNE reveals clusters of
high-dimensional data points at different scales while it requires only minimal
tuning of its parameters. Despite these advantages, the computational
complexity of the algorithm limits its application to relatively small
datasets. To address this problem, several evolutions of tSNE have been
developed in recent years, mainly focusing on the scalability of the similarity
computations between data points. However, these contributions are insufficient
to achieve interactive rates when visualizing the evolution of the tSNE
embedding for large datasets. In this work, we present a novel approach to the
minimization of the tSNE objective function that heavily relies on modern
graphics hardware and has linear computational complexity. Our technique does
not only beat the state of the art, but can even be executed on the client side
in a browser. We propose to approximate the repulsion forces between data
points using adaptive-resolution textures that are drawn at every iteration
with WebGL. This approximation allows us to reformulate the tSNE minimization
problem as a series of tensor operation that are computed with TensorFlow.js, a
JavaScript library for scalable tensor computations.
%0 Generic
%1 pezzotti2018linear
%A Pezzotti, Nicola
%A Mordvintsev, Alexander
%A Hollt, Thomas
%A Lelieveldt, Boudewijn P. F.
%A Eisemann, Elmar
%A Vilanova, Anna
%D 2018
%K 2018 arxiv clustering google visualization
%T Linear tSNE optimization for the Web
%U http://arxiv.org/abs/1805.10817
%X The t-distributed Stochastic Neighbor Embedding (tSNE) algorithm has become
in recent years one of the most used and insightful techniques for the
exploratory data analysis of high-dimensional data. tSNE reveals clusters of
high-dimensional data points at different scales while it requires only minimal
tuning of its parameters. Despite these advantages, the computational
complexity of the algorithm limits its application to relatively small
datasets. To address this problem, several evolutions of tSNE have been
developed in recent years, mainly focusing on the scalability of the similarity
computations between data points. However, these contributions are insufficient
to achieve interactive rates when visualizing the evolution of the tSNE
embedding for large datasets. In this work, we present a novel approach to the
minimization of the tSNE objective function that heavily relies on modern
graphics hardware and has linear computational complexity. Our technique does
not only beat the state of the art, but can even be executed on the client side
in a browser. We propose to approximate the repulsion forces between data
points using adaptive-resolution textures that are drawn at every iteration
with WebGL. This approximation allows us to reformulate the tSNE minimization
problem as a series of tensor operation that are computed with TensorFlow.js, a
JavaScript library for scalable tensor computations.
@misc{pezzotti2018linear,
abstract = {The t-distributed Stochastic Neighbor Embedding (tSNE) algorithm has become
in recent years one of the most used and insightful techniques for the
exploratory data analysis of high-dimensional data. tSNE reveals clusters of
high-dimensional data points at different scales while it requires only minimal
tuning of its parameters. Despite these advantages, the computational
complexity of the algorithm limits its application to relatively small
datasets. To address this problem, several evolutions of tSNE have been
developed in recent years, mainly focusing on the scalability of the similarity
computations between data points. However, these contributions are insufficient
to achieve interactive rates when visualizing the evolution of the tSNE
embedding for large datasets. In this work, we present a novel approach to the
minimization of the tSNE objective function that heavily relies on modern
graphics hardware and has linear computational complexity. Our technique does
not only beat the state of the art, but can even be executed on the client side
in a browser. We propose to approximate the repulsion forces between data
points using adaptive-resolution textures that are drawn at every iteration
with WebGL. This approximation allows us to reformulate the tSNE minimization
problem as a series of tensor operation that are computed with TensorFlow.js, a
JavaScript library for scalable tensor computations.},
added-at = {2018-06-10T09:48:56.000+0200},
author = {Pezzotti, Nicola and Mordvintsev, Alexander and Hollt, Thomas and Lelieveldt, Boudewijn P. F. and Eisemann, Elmar and Vilanova, Anna},
biburl = {https://www.bibsonomy.org/bibtex/263695b63e612ea34d9578b46dce7ca18/achakraborty},
description = {[1805.10817] Linear tSNE optimization for the Web},
interhash = {8c531b7df0e64d3552e490deb7dff30f},
intrahash = {63695b63e612ea34d9578b46dce7ca18},
keywords = {2018 arxiv clustering google visualization},
note = {cite arxiv:1805.10817},
timestamp = {2018-06-10T09:48:56.000+0200},
title = {Linear tSNE optimization for the Web},
url = {http://arxiv.org/abs/1805.10817},
year = 2018
}