-
Notifications
You must be signed in to change notification settings - Fork 55
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
added auto shapes #175
base: develop
Are you sure you want to change the base?
added auto shapes #175
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -3,20 +3,129 @@ | |
from itertools import count | ||
import numpy as np | ||
from keras.engine.topology import Layer | ||
from keras.engine.base_layer import InputSpec | ||
from keras.layers import Activation | ||
import t3f | ||
import tensorflow as tf | ||
from sympy.utilities.iterables import multiset_partitions | ||
from sympy.ntheory import factorint | ||
from itertools import cycle, islice | ||
from scipy.stats import entropy | ||
|
||
|
||
MODES = ['ascending', 'descending', 'mixed'] | ||
CRITERIONS = ['entropy', 'var'] | ||
|
||
|
||
def _to_list(p): | ||
res = [] | ||
for k, v in p.items(): | ||
res += [k, ] * v | ||
return res | ||
|
||
|
||
def _roundup(n, k): | ||
return int(np.ceil(n / 10**k)) * 10**k | ||
|
||
|
||
def _roundrobin(*iterables): | ||
"roundrobin('ABC', 'D', 'EF') --> A D E B F C" | ||
# Recipe credited to George Sakkis | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Are you obeying the license of this code if it is not you who wrote it? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. This is from the examples here https://docs.python.org/2.7/library/itertools.html#recipes |
||
pending = len(iterables) | ||
nexts = cycle(iter(it).__next__ for it in iterables) | ||
while pending: | ||
try: | ||
for next in nexts: | ||
yield next() | ||
except StopIteration: | ||
pending -= 1 | ||
nexts = cycle(islice(nexts, pending)) | ||
|
||
|
||
def _get_all_factors(n, d=3, mode='ascending'):
    """Enumerate the distinct factorizations of ``n`` into ``d`` factors.

    Each factorization is a tuple of ``d`` ints whose product is ``n``,
    ordered according to ``mode`` ('ascending', 'descending', or 'mixed',
    which interleaves the smaller and larger halves).
    """
    primes = _factorint2(n)
    # Pad with ones so a partition into d parts always exists.
    if len(primes) < d:
        primes += [1] * (d - len(primes))

    if mode == 'ascending':
        def prepr(partition):
            return tuple(sorted(np.prod(part) for part in partition))
    elif mode == 'descending':
        def prepr(partition):
            return tuple(sorted((np.prod(part) for part in partition),
                                reverse=True))
    elif mode == 'mixed':
        def prepr(partition):
            products = sorted(np.prod(part) for part in partition)
            half = len(products) // 2
            # Interleave the small half with the large half.
            return tuple(_roundrobin(products[:half], products[half:]))
    else:
        raise ValueError('Wrong mode specified, only {} are available'.format(MODES))

    # A set collapses partitions that map to the same ordered tuple.
    unique = {prepr(partition) for partition in multiset_partitions(primes, d)}
    return list(unique)
|
||
|
||
def _factorint2(p):
    """Return the prime factorization of ``p`` as a flat list of primes."""
    prime_powers = factorint(p)
    return _to_list(prime_powers)
|
||
|
||
def auto_shape(n, d=3, criterion='entropy', mode='ascending'):
    """Pick the most balanced factorization of ``n`` into ``d`` factors.

    Candidates come from ``_get_all_factors``; the one maximizing the
    chosen ``criterion`` ('entropy' of the factors, or negative 'var')
    is returned as a list of ints.
    """
    candidates = _get_all_factors(n, d=d, mode=mode)
    if criterion == 'entropy':
        scores = [entropy(candidate) for candidate in candidates]
    elif criterion == 'var':
        scores = [-np.var(candidate) for candidate in candidates]
    else:
        raise ValueError('Wrong criterion specified, only {} are available'.format(CRITERIONS))

    best = int(np.argmax(scores))
    return list(candidates[best])
|
||
|
||
def suggest_shape(n, d=3, criterion='entropy', mode='ascending'):
    """Suggest a ``d``-factor shape for ``n`` or a rounded-up neighbor of it.

    Tries rounding ``n`` up at every decimal position, scores the best
    factorization of each rounded value with ``criterion`` ('entropy' or
    'var'), and returns the winning factorization.

    Note: the original recomputed ``auto_shape`` (which re-enumerates all
    multiset partitions) a second time for the winning candidate; here each
    candidate shape is computed once and cached.

    Args:
        n: an int, the dimension to factorize (possibly after rounding up).
        d: an int, the number of factors in the shape.
        criterion: string, 'entropy' or 'var'.
        mode: string, factor ordering passed through to ``auto_shape``.

    Returns:
        A list of ``d`` ints whose product is ``n`` rounded up at some
        decimal position.

    Raises:
        ValueError: if ``criterion`` is not one of CRITERIONS.
    """
    weights = []
    shapes = []
    for i in range(len(str(n))):
        shape = auto_shape(_roundup(n, i), d=d, mode=mode, criterion=criterion)
        shapes.append(shape)
        if criterion == 'entropy':
            weights.append(entropy(shape))
        elif criterion == 'var':
            weights.append(-np.var(shape))
        else:
            raise ValueError('Wrong criterion specified, only {} are available'.format(CRITERIONS))

    best = int(np.argmax(weights))
    return shapes[best]
|
||
|
||
class KerasDense(Layer): | ||
_counter = count(0) | ||
|
||
def __init__(self, input_dims, output_dims, tt_rank=2, | ||
def __init__(self, units=None, d=None, use_auto_shape=True, mode='mixed', | ||
criterion='entropy', in_dims=None, out_dims=None, tt_rank=8, | ||
activation=None, use_bias=True, kernel_initializer='glorot', | ||
bias_initializer=0.1, **kwargs): | ||
"""Creates a TT-Matrix based Dense Keras layer. | ||
If in_dim, out_dim and d are provided, will determine the (quasi)optimal | ||
factorizations automatically using 'mode' factorization style, and 'criterion' | ||
for optimality. Default settings are recommended. | ||
Otherwise, the desired factorizations has to be specified as input_dims | ||
and output_dims lists. | ||
|
||
Args: | ||
in_dim: an int, number of input neurons | ||
out_dim: an int, number of output neurons | ||
d: number of factors in shape factorizations | ||
mode: string, specifies the way of factorizing in_dim and out_dim. | ||
Possible values are 'ascending', 'descending', 'mixed'. | ||
criterion: string, specifies the shape optimality criterion. | ||
Possible values are 'entropy', 'var'. | ||
input_dims: an array, tensor shape of the matrix row index | ||
ouput_dims: an array, tensor shape of the matrix column index | ||
tt_rank: a number or an array, desired tt-rank of the TT-Matrix | ||
|
@@ -36,8 +145,29 @@ def __init__(self, input_dims, output_dims, tt_rank=2, | |
unknown. | ||
""" | ||
self.counter = next(self._counter) | ||
self.tt_shape = [input_dims, output_dims] | ||
self.output_dim = np.prod(output_dims) | ||
if use_auto_shape: | ||
if units and d: | ||
out_dims = auto_shape(units, d=d, mode=mode, criterion=criterion) | ||
# in_dims are not known yet | ||
self.tt_shape = None | ||
else: | ||
raise ValueError('If auto_shape=True, you have to provide units and d,\ | ||
got {} and {}'.format(units, d)) | ||
|
||
if not use_auto_shape: | ||
if in_dims and out_dims: | ||
self.tt_shape = [in_dims, out_dims] | ||
else: | ||
raise ValueError('If auto_shape=False you have to provide \ | ||
the desired factorizations in_dims and out_dims, \ | ||
got {} and {}'.format(in_dims, out_dims)) | ||
self.in_dims = in_dims | ||
self.out_dims = out_dims | ||
self.use_auto_shape = use_auto_shape | ||
self.d = d | ||
self.mode = mode | ||
self.criterion = criterion | ||
self.output_dim = np.prod(out_dims) | ||
self.tt_rank = tt_rank | ||
self.activation = activation | ||
self.use_bias = use_bias | ||
|
@@ -46,6 +176,18 @@ def __init__(self, input_dims, output_dims, tt_rank=2, | |
super(KerasDense, self).__init__(**kwargs) | ||
|
||
def build(self, input_shape): | ||
|
||
if self.use_auto_shape: | ||
self.in_dims = auto_shape(input_shape[1], | ||
mode=self.mode, | ||
criterion=self.criterion, | ||
d=self.d) | ||
self.tt_shape = [self.in_dims, self.out_dims] | ||
else: | ||
if input_shape[1] != np.prod(self.in_dims): | ||
raise ValueError('Input shape factorization does not \ | ||
match the actual input shape') | ||
|
||
if self.kernel_initializer == 'glorot': | ||
initializer = t3f.glorot_initializer(self.tt_shape, | ||
tt_rank=self.tt_rank) | ||
|
@@ -71,6 +213,8 @@ def build(self, input_shape): | |
if self.b is not None: | ||
self.trainable_weights.append(self.b) | ||
|
||
self.built = True | ||
|
||
def call(self, x): | ||
res = t3f.matmul(x, self.matrix) | ||
if self.use_bias: | ||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Docstring here and everywhere with the style