% Journal article: Baldi (2012), Boolean autoencoders and hypercube clustering.
% NOTE(review): the original record had empty volume/number/note fields, which
% have been dropped. Pages 1--21 look like provisional (online-first)
% pagination -- TODO confirm volume, issue and final page range against the
% publisher record and add them (plus a doi field) once verified.
@article{baldi2012boolean,
  author   = {Baldi, P.},
  title    = {{Boolean} autoencoders and hypercube clustering complexity},
  journal  = {Designs, Codes and Cryptography},
  pages    = {1--21},
  year     = {2012},
  keywords = {Autoencoders, Clustering, Boolean circuits, Computational complexity},
  abstract = {We introduce and study the properties of Boolean autoencoder circuits. In particular, we show that the Boolean autoencoder circuit problem is equivalent to a clustering problem on the hypercube. We show that clustering $m$ binary vectors on the $n$-dimensional hypercube into $k$ clusters is NP-hard, as soon as the number of clusters scales like $m^\epsilon$ ($\epsilon > 0$), and thus the general Boolean autoencoder problem is also NP-hard. We prove that the linear Boolean autoencoder circuit problem is also NP-hard, and so are several related problems such as: subspace identification over finite fields, linear regression over finite fields, even/odd set intersections, and parity circuits. The emerging picture is that autoencoder optimization is NP-hard in the general case, with a few notable exceptions including the linear cases over infinite fields or the Boolean case with fixed size hidden layer. However learning can be tackled by approximate algorithms, including alternate optimization, suggesting a new class of learning algorithms for deep networks, including deep networks of threshold gates or artificial neurons.},
}