scikit_tt/tensor_train.py

# -*- coding: utf-8 -*- 

import scikit_tt.utils as utl
import time as _time
import numpy as np
from scipy import linalg
from typing import List, Tuple, Union, Optional


class TT(object):
    """
    Tensor train class

    Tensor trains [1]_ are defined in terms of different attributes. That is, a tensor train with order ``d`` is 
    given by a list of 4-dimensional tensors

        ``[cores[0] , ..., cores[d-1]]``,

    where ``cores[i]`` is an ndarray with dimensions

        ``ranks[i] x row_dims[i] x col_dims[i] x ranks[i+1]``.

    No distinction is made between tensor trains and tensor-train operators, i.e., a classical tensor train is
    represented by cores with column dimensions equal to 1.

    An instance of the tensor train class can be initialized either from a list of cores, i.e. ``t = TT(cores)`` 
    where ``cores`` is a list as described above, or from a full tensor representation, i.e. ``t = TT(x)`` where 
    ``x`` is an ndarray with dimensions 

        ``row_dims[0] x ... x row_dims[-1] x col_dims[0] x ... x col_dims[-1]``.

    In the latter case, the tensor is decomposed into the TT format. For more information on the implemented tensor
    operations, we refer to [2]_.

    Attributes
    ----------
    order : int
        Order of the tensor train
    row_dims : list[int]
        List of the row dimensions of the tensor train
    col_dims : list[int]
        List of the column dimensions of the tensor train
    ranks : list[int]
        List of the ranks of the tensor train
    cores : list[np.ndarray]
        List of the cores of the tensor train

    Methods
    -------
    print(t)
        String representation of tensor trains
    +
        Sum of two tensor trains
    -
        Difference of two tensor trains
    *
        Multiplication of tensor trains and scalars
    @/dot(t,u)
        Multiplication of two tensor trains
    tensordot
        Index contraction between two tensor trains
    rank_tensordot
        Index contraction between TT and matrix along the rank-dimension
    concatenate
        Concatenate cores of two TT
    transpose
        Transpose of a tensor train
    rank_transpose
        Rank-transpose of a tensor train
    conj
        Complex conjugate of a tensor train
    isoperator
        Check if a given tensor train is an operator
    copy
        Deep copy of a tensor train
    element
        Element of t at given indices
    full
        Convert tensor train to full format
    matricize
        Matricization of a tensor train
    ortho_left
        Left-orthonormalization of a tensor train
    ortho_right
        Right-orthonormalization of a tensor train
    ortho
        Left- and right-orthonormalization of a tensor train
    norm
        Norm of a tensor train
    tt2qtt
        Conversion from TT format into QTT format
    qtt2tt
        Conversion from QTT format into TT format
    svd
        Computation of a global SVD of a tensor train
    pinv
        Computation of the pseudoinverse of a tensor train
    diag
        Construction of diagonal MPO from MPS
    squeeze
        Squeeze TT decomposition
    zeros 
        Tensor train filled with zeros
    ones
        Tensor train filled with ones
    eye
        Identity tensor train
    unit
        Canonical unit tensor
    rand
        Random tensor train
    canonical
        Full-rank tensor train consisting of tensor products of the canonical basis
    uniform
       Uniformly distributed tensor train 
    residual_error
        Compute the residual error ||A@x-b|| in TT format. 

    References
    ----------
    .. [1] I. V. Oseledets, "Tensor-Train Decomposition", SIAM Journal on Scientific Computing 33 (5), 2011
    .. [2] P. Gelß. "The Tensor-Train Format and Its Applications: Modeling and Analysis of Chemical Reaction
           Networks, Catalytic Processes, Fluid Flows, and Brownian Dynamics", Freie Universität Berlin, 2017
    
    Examples
    --------
    Construct tensor train from list of cores:

    >>> import numpy as np
    >>> from scikit_tt.tensor_train import TT
    >>>
    >>> cores = [np.random.rand(1, 2, 3, 4), np.random.rand(4, 3, 2, 1)]
    >>> t = TT(cores)
    >>> print(t)
    >>> ...

    Construct tensor train from ndarray:

    >>> import numpy as np
    >>> from scikit_tt.tensor_train import TT
    >>>
    >>> x = np.random.rand(1, 2, 3, 4, 5, 6)
    >>> t = TT(x) 
    >>> print(t)
    >>> ...

    """

    def __init__(self, x: Union[List[np.ndarray], np.ndarray],
                 threshold: float=0,
                 max_rank:  int=np.inf,
                 progress:  bool=False,
                 string:    str=None):
        """
        Construct a tensor train from a list of cores or by decomposing a full tensor.

        Parameters
        ----------
        x : list[np.ndarray] or np.ndarray
            either a list of 4-dimensional TT cores or a full tensor with dimensions
            ``row_dims[0] x ... x row_dims[-1] x col_dims[0] x ... x col_dims[-1]``
        threshold : float, optional
            threshold for reduced SVD decompositions, default is 0
        max_rank : int, optional
            maximum rank of the left-orthonormalized tensor train, default is np.inf
        progress : bool, optional
            forwarded as ``show`` to ``utl.progress`` while a full tensor is decomposed, default is False
        string : str, optional
            label forwarded to ``utl.progress``; if None (default), 'HOSVD' is used

        Raises
        ------
        TypeError
            if x is neither a list of ndarray nor a single ndarray
        ValueError
            if list elements of x are not 4-dimensional tensors or shapes do not match
        ValueError
            if number of dimensions of the ndarray x is not a multiple of 2
        """

        # NOTE: np.inf is used instead of the alias np.infty, which was removed in NumPy 2.0;
        # both names denote the same floating-point infinity, so callers are unaffected.

        # initialize from list of cores
        if isinstance(x, list):

            # check if orders of list elements are correct
            if not np.all([x[i].ndim == 4 for i in range(len(x))]):
                raise ValueError('List elements must be 4-dimensional arrays.')

            # check if ranks are correct (right rank of a core equals left rank of its successor)
            if not np.all([x[i].shape[3] == x[i + 1].shape[0] for i in range(len(x) - 1)]):
                raise ValueError('Shapes of list elements do not match.')

            # define order, row dimensions, column dimensions, ranks, and cores
            self.order = len(x)
            self.row_dims = [x[i].shape[1] for i in range(self.order)]
            self.col_dims = [x[i].shape[2] for i in range(self.order)]
            self.ranks = [x[i].shape[0] for i in range(self.order)] + [x[-1].shape[3]]
            self.cores = x  # the list is stored as given, not copied

            # rank reduction (only if requested)
            if threshold != 0 or max_rank != np.inf:
                self.ortho(threshold=threshold, max_rank=max_rank)

            return

        # anything else has to be a full array
        if not isinstance(x, np.ndarray):
            raise TypeError('Parameter must be either a list of cores or an ndarray.')

        # check if order of ndarray is a multiple of 2
        if np.mod(x.ndim, 2) != 0:
            raise ValueError('Number of dimensions must be a multiple of 2.')

        # show progress
        if string is None:
            string = 'HOSVD'
        start_time = utl.progress(string, 0, show=progress)

        # define order, row dimensions, column dimensions, ranks, and cores
        order = len(x.shape) // 2
        row_dims = x.shape[:order]
        col_dims = x.shape[order:]
        ranks = [1] * (order + 1)
        cores = []

        # permute dimensions, e.g., for order = 4: p = [0, 4, 1, 5, 2, 6, 3, 7]
        p = [order * j + i for i in range(order) for j in range(2)]
        y = np.transpose(x, p).copy()

        # decompose the full tensor
        for i in range(order - 1):
            # reshape residual tensor
            m = ranks[i] * row_dims[i] * col_dims[i]
            n = np.prod(row_dims[i + 1:]) * np.prod(col_dims[i + 1:])
            y = np.reshape(y, [m, n])

            # apply SVD in order to isolate modes
            [u, s, v] = linalg.svd(y, full_matrices=False)

            # rank reduction: drop singular values that are small relative to the largest one
            if threshold != 0:
                indices = np.where(s / s[0] > threshold)[0]
                u = u[:, indices]
                s = s[indices]
                v = v[indices, :]
            # rank reduction: keep at most max_rank singular values
            if max_rank != np.inf:
                u = u[:, :np.minimum(u.shape[1], max_rank)]
                s = s[:np.minimum(s.shape[0], max_rank)]
                v = v[:np.minimum(v.shape[0], max_rank), :]

            # define new TT core
            ranks[i + 1] = u.shape[1]
            cores.append(np.reshape(u, [ranks[i], row_dims[i], col_dims[i], ranks[i + 1]]))

            # set new residual tensor
            y = np.diag(s).dot(v)

            # show progress
            utl.progress(string, 100 * (i + 1) / order, cpu_time=_time.time() - start_time, show=progress)

        # define last TT core
        cores.append(np.reshape(y, [ranks[-2], row_dims[-1], col_dims[-1], 1]))

        # initialize tensor train from the computed cores (no further rank reduction)
        self.__init__(cores)

        # show progress
        utl.progress(string, 100, cpu_time=_time.time() - start_time, show=progress)

    def __repr__(self):
        """
        String representation of tensor trains.

        Returns
        -------
        str
            multi-line summary listing order, row dimensions, column dimensions, and ranks of self
        """

        # attribute values substituted into the named placeholders below
        fields = dict(d=self.order, m=self.row_dims, n=self.col_dims, r=self.ranks)

        # the first entry is empty so that the joined text starts with a line break
        template = '\n'.join(['',
                              'Tensor train with order    = {d}, ',
                              '                  row_dims = {m}, ',
                              '                  col_dims = {n}, ',
                              '                  ranks    = {r}'])

        return template.format(**fields)

    def __add__(self, tt_add: 'TT') -> 'TT':
        """
        Sum of two tensor trains.

        Add two given tensor trains with same row and column dimensions. The cores of the sum are built by
        placing the cores of self and tt_add into separate blocks of larger zero-initialized cores; the outer
        ranks of the result are fixed to 1.

        Parameters
        ----------
        tt_add : TT
            tensor train which is added to self

        Returns
        -------
        TT
            sum of tt_add and self

        Raises
        ------
        TypeError
            if tt_add is not an instance of the TT class
        ValueError
            if dimensions of both tensor trains do not match
        """

        if not isinstance(tt_add, TT):
            raise TypeError('Unsupported parameter.')

        # check if row and column dimension are equal
        if self.row_dims != tt_add.row_dims or self.col_dims != tt_add.col_dims:
            raise ValueError('Tensor trains must have the same dimensions')

        # define order and ranks: inner ranks add up, outer ranks stay 1
        order = self.order
        ranks = [1] + [self.ranks[i] + tt_add.ranks[i] for i in range(1, order)] + [1]
        cores = []

        # construct cores
        for i in range(order):
            # set core to zero array (complex if one of the summands is complex)
            if np.iscomplexobj(self.cores[i]) or np.iscomplexobj(tt_add.cores[i]):
                core = np.zeros([ranks[i], self.row_dims[i], self.col_dims[i], ranks[i + 1]], dtype=complex)
            else:
                core = np.zeros([ranks[i], self.row_dims[i], self.col_dims[i], ranks[i + 1]])

            # insert core of self into the leading block
            core[0:self.ranks[i], :, :, 0:self.ranks[i + 1]] = self.cores[i]

            # insert core of tt_add into the trailing block; for order >= 2 both blocks are disjoint, but for
            # order 1 they coincide (all ranks are 1), so the entries have to be accumulated, not overwritten
            r_1 = ranks[i] - tt_add.ranks[i]
            r_3 = ranks[i + 1] - tt_add.ranks[i + 1]
            core[r_1:ranks[i], :, :, r_3:ranks[i + 1]] += tt_add.cores[i]

            cores.append(core)

        return TT(cores)

    def __sub__(self, tt_sub: 'TT') -> 'TT':
        """
        Difference of two tensor trains.

        Subtract tt_sub from self. The difference is expressed as the sum of self and the negated tt_sub.

        Parameters
        ----------
        tt_sub : TT
            tensor train which is subtracted from self

        Returns
        -------
        TT
            difference of self and tt_sub (self - tt_sub)

        Raises
        ------
        TypeError
            if tt_sub is not an instance of the TT class
        ValueError
            if dimensions of both tensor trains do not match
        """

        # scalar multiplication already returns a new tensor train, so tt_sub is left untouched and no extra
        # deep copy is needed; for operands that are not tensor trains, the addition raises the TypeError
        return self + tt_sub * (-1)

    def __mul__(self, scalar: Union[int, float, complex]) -> 'TT':
        """
        Multiplication of a tensor train by a scalar from the right, i.e. ``self * scalar``.

        Only the first core is scaled, which scales the whole tensor represented by the train.

        Parameters
        ----------
        scalar : int or float or complex
            scalar value for the multiplication; NumPy scalar types (instances of np.number) are accepted as well

        Returns
        -------
        TT
            product of self and scalar (self is not modified)

        Raises
        ------
        TypeError
            if scalar is neither int nor float nor complex nor a NumPy number
        """

        # validate first so that no deep copy is made for unsupported arguments
        if not isinstance(scalar, (int, float, complex, np.number)):
            raise TypeError('Unsupported parameter.')

        # copy self
        tt_prod = self.copy()

        # multiply first core by scalar
        tt_prod.cores[0] = scalar * tt_prod.cores[0]

        return tt_prod

    def __rmul__(self, scalar: Union[int, float, complex]) -> 'TT':
        """
        Multiplication of a tensor train by a scalar from the left, i.e. ``scalar * self``.

        Parameters
        ----------
        scalar : int or float or complex
            scalar value for the multiplication

        Returns
        -------
        TT
            product of scalar and self (self is not modified)

        Raises
        ------
        TypeError
            if scalar is not supported by ``self * scalar``
        """

        # scalar multiplication is commutative; ``self * scalar`` already works on a copy of self, so copying
        # here as well would only duplicate all cores a second time
        return self * scalar

    def __matmul__(self, tt_mul: 'TT') -> 'TT':
        """
        Multiplication of tensor trains.

        Use the operator form ``T @ U`` (Python 3.5 and higher) or, equivalently, ``T.dot(U)``. The product is
        computed core by core: the column index of each core of self is contracted with the row index of the
        corresponding core of tt_mul, and the ranks of both cores are merged.

        Parameters
        ----------
        tt_mul : TT
            tensor train which is multiplied with self

        Returns
        -------
        TT
            product of self and tt_mul; if all row and column dimensions of the product are equal to 1, the
            single element returned by ``element`` is given back instead of a tensor train

        Raises
        ------
        TypeError
            if tt_mul is not an instance of the TT class
        ValueError
            if column dimensions of self do not match row dimensions of tt_mul
        """

        def core_multiplication(core_1: np.ndarray, core_2: np.ndarray):
            """
            Multiply two 4-dimensional cores with shapes (r1 x m x n x r2) and (s1 x n x p x s2).

            Returns the product core with shape (r1 * s1 x m x p x r2 * s2).
            """

            r_left, r_right = core_1.shape[0], core_1.shape[-1]
            s_left, s_right = core_2.shape[0], core_2.shape[-1]

            # index grids over the rank axes of both cores
            rows_1 = np.arange(r_left, dtype=np.intp)[:, None]
            cols_1 = np.arange(r_right, dtype=np.intp)[None, :]
            rows_2 = np.arange(s_left, dtype=np.intp)[:, None]
            cols_2 = np.arange(s_right, dtype=np.intp)[None, :]

            # advanced indexing moves both rank axes to the front: (r1, r2, m, n) and (s1, s2, n, p)
            front_1 = core_1[rows_1, :, :, cols_1]
            front_2 = core_2[rows_2, :, :, cols_2]

            # batched matrix product over the broadcast rank axes: (r1, s1, r2, s2, m, p)
            batched = front_1[:, None, :, None, :, :] @ front_2[None, :, None, :, :, :]

            # merge left ranks and right ranks, then move the merged right rank to the last axis
            merged = batched.reshape(r_left * s_left, r_right * s_right, core_1.shape[1], core_2.shape[2])

            return merged.transpose(0, 2, 3, 1)

        if not isinstance(tt_mul, TT):
            raise TypeError('Unsupported argument.')

        # check if dimensions match
        if self.col_dims != tt_mul.row_dims:
            raise ValueError('Dimensions do not match.')

        # multiply TT cores and define product tensor
        product_cores = []
        for i in range(self.order):
            product_cores.append(core_multiplication(self.cores[i], tt_mul.cores[i]))
        tt_prod = TT(product_cores)

        # set tt_prod to scalar if all dimensions are equal to 1
        if np.prod(tt_prod.row_dims) == 1 and np.prod(tt_prod.col_dims) == 1:
            return tt_prod.element([0] * tt_prod.order * 2)

        return tt_prod

    def dot(self, tt_mul: 'TT') -> 'TT':
        """
        Multiplication of tensor trains.

        Method-call spelling of the ``@`` operator; the work is delegated to ``__matmul__``.

        Parameters
        ----------
        tt_mul : TT
            tensor train which is multiplied with self

        Returns
        -------
        tt_prod : TT or float
            product of self and tt_mul
        """

        return self.__matmul__(tt_mul)

    def tensordot(self, other: 'TT', 
                  num_axes: int, 
                  mode: str='last-first',
                  overwrite: bool=False) -> 'TT':
        """
        Computes index contraction between self and other.

        The axes for contraction have to be the last or the first axes of self and other. Thus, there are 4 modes of
        operation: 'last-first', 'last-last', 'first-last' and 'first-first'. The sequence of not contracted cores of
        self is always maintained (cf. the 2nd example below).
        For saving memory, you can choose to overwrite self with the tensordot.

        The contracted cores are paired in ascending order, i.e. core ``first_idx_self + i`` of self is contracted
        with core ``first_idx_other + i`` of other over both the row and the column index. The result of the
        contraction is a matrix over the two remaining open ranks, which is merged into a neighboring core.

        Parameters
        ----------
        other : TT
            tensor train which is contracted with self
        num_axes : int
            number of axes that should be contracted
        mode : {'last-first', 'last-last', 'first-last', 'first-first'}, optional
            location of the axes for contraction on self-other
        overwrite : bool, optional
            whether to overwrite self or not
            
        Returns
        -------
        TT
            tensordot(self, other)

        Raises
        ------
        ValueError
            if mode is unknown
        ValueError
            if num_axes exceeds the order of self or other
        ValueError
            if row or column dimensions of the contracted cores do not match
        ValueError
            if the outer ranks of self and other at the contracted ends are not equal to 1

        Notes
        -----
        Cores of self and other which are not merged with the contraction result are placed into the result
        without being copied (or only rank-transposed), so the result may share memory with self and other even
        if overwrite is False.

        Examples
        --------
        Example for mode='last-first':
        >>> import scikit_tt.tensor_train as tt
        >>> t = tt.ones([1, 2, 3, 4], [5, 6, 7, 8], ranks=[1, 2, 4, 3, 1])
        >>> u = tt.ones([3, 4, 5], [7, 8, 2], ranks=[1, 7, 8, 1])
        >>> t.tensordot(u, 2)

        Tensor train with order    = 3,
                  row_dims = [1, 2, 5],
                  col_dims = [5, 6, 2],
                  ranks    = [1, 2, 8, 1]

        Example for mode='last-last'
        >>> t = tt.ones([2, 3, 4, 5], [1, 1, 1, 1], ranks=3)
        >>> u = tt.ones([7, 6, 4, 5], [1, 1, 1, 1], ranks=2)
        >>> t.tensordot(u, 2, mode='last-last')

        Tensor train with order    = 4,
                  row_dims = [2, 3, 6, 7],
                  col_dims = [1, 1, 1, 1],
                  ranks    = [1, 3, 2, 2, 1]

        As you can see, the sequence of not contracted cores of t (2, 3) is maintained. The sequence of the not
        contracted cores of u (7, 6) is reversed and the cores rank-transposed to fit together.
        """

        # define first and last core indices for contraction
        if mode == 'last-first':
            first_idx_self = self.order - num_axes
            first_idx_other = 0
            last_idx_self = self.order - 1
            last_idx_other = num_axes - 1
        elif mode == 'first-last':
            first_idx_self = 0
            first_idx_other = other.order - num_axes
            last_idx_self = num_axes - 1
            last_idx_other = other.order - 1
        elif mode == 'first-first':
            first_idx_self = 0
            first_idx_other = 0
            last_idx_other = num_axes - 1
            last_idx_self = num_axes - 1
        elif mode == 'last-last':
            first_idx_self = self.order - num_axes
            first_idx_other = other.order - num_axes
            last_idx_self = self.order - 1
            last_idx_other = other.order - 1
        else:
            raise ValueError('unknown mode')

        # check dimensions for contraction
        if num_axes > self.order or num_axes > other.order:
            raise ValueError('num_axes is too big')
        if self.row_dims[first_idx_self:last_idx_self + 1] != other.row_dims[first_idx_other:last_idx_other + 1] or \
                self.col_dims[first_idx_self:last_idx_self + 1] != other.col_dims[first_idx_other:last_idx_other + 1]:
            raise ValueError('axes do not match')

        # check if the needed ranks are 1 (the outer rank at each contracted end is dropped by indexing with 0 below)
        if mode == 'last-first':
            if self.ranks[-1] != 1 or other.ranks[0] != 1:
                raise ValueError('last rank of self and first rank of other have to be 1')
        elif mode == 'last-last':
            if self.ranks[-1] != 1 or other.ranks[-1] != 1:
                raise ValueError('last rank of self and last rank of other have to be 1')
        elif mode == 'first-last':
            if self.ranks[0] != 1 or other.ranks[-1] != 1:
                raise ValueError('first rank of self and last rank of other have to be 1')
        else:  # mode == 'first-first':
            if self.ranks[0] != 1 or other.ranks[0] != 1:
                raise ValueError('first rank of self and first rank of other have to be 1')

        # choose the result object: either self (overwrite) or a fresh TT whose attributes are all replaced below
        # NOTE(review): `ones` is not defined in this part of the file - presumably the module-level constructor
        # for tensor trains filled with ones; it only serves as a placeholder object here, self is not copied
        if overwrite is False:
            tdot = ones([1], [1], 1)  # placeholder
        else:
            tdot = self

        # calculate the contraction
        # contract row and column index of the first pair of cores
        M = np.tensordot(self.cores[first_idx_self], other.cores[first_idx_other], axes=([1, 2], [1, 2]))
        # M.shape (r_0, r_1, s_0, s_1)

        # successively absorb the remaining pairs of cores
        for i in range(1, num_axes):
            M_new = np.tensordot(self.cores[first_idx_self + i], other.cores[first_idx_other + i],
                                 axes=([1, 2], [1, 2]))
            # M_new.shape (r_{i-1}, r_i, s_{i-1}, s_i)
            M = np.tensordot(M, M_new, axes=([1, 3], [0, 2]))  # shape (r_0, s_0, r_i, s_i)
            M = np.transpose(M, [0, 2, 1, 3])  # shape (r_0, r_i, s_0, s_i)

        # drop the two outer ranks (checked to be 1 above), which leaves a matrix over the two open ranks
        if mode == 'last-first':
            M = M[:, 0, 0, :]  # shape (r_0, s_{num_axes})
        elif mode == 'last-last':
            M = M[:, 0, :, 0]  # shape (r_0, s_0)
        elif mode == 'first-last':
            M = M[0, :, :, 0]  # shape (r_{num_axes}, s_0)
        else:  # first-first
            M = M[0, :, 0, :]  # shape (r_{num_axes}, s_{num_axes})

        # build the cores
        if num_axes == self.order and num_axes == other.order:  # complete contraction over both
            # no core is left, so M itself becomes a single core with row and column dimension 1
            tdot.cores = [M[:, np.newaxis, np.newaxis, :]]

        elif num_axes == self.order:  # complete contraction over self -> merge M into other
            tdot.cores = []
            if mode == 'last-first':
                tdot.cores.append(np.tensordot(M, other.cores[last_idx_other + 1], axes=([1], [0])))
                tdot.cores.extend(other.cores[last_idx_other + 2:])  # append the remaining cores of other
            elif mode == 'last-last':
                tdot.cores.append(np.tensordot(other.cores[first_idx_other - 1], M, axes=([3], [1])))
                tdot.cores.extend(other.cores[:first_idx_other - 1][::-1])  # append the remaining cores of other
                for i in range(len(tdot.cores)):  # they need to be rank-transposed
                    tdot.cores[i] = np.transpose(tdot.cores[i], [3, 1, 2, 0])
            elif mode == 'first-last':
                tdot.cores.append(np.tensordot(other.cores[first_idx_other - 1], M, axes=([3], [1])))
                tdot.cores = other.cores[:first_idx_other - 1] + tdot.cores  # prepend the remaining cores of other
            else:  # mode = 'first-first', merge M into last core of other
                tdot.cores.append(np.tensordot(M, other.cores[last_idx_other + 1], axes=([1], [0])))
                tdot.cores = other.cores[last_idx_other + 2:][::-1] + tdot.cores  # prepend the remaining cores of other
                for i in range(len(tdot.cores)):  # they need to be rank-transposed
                    tdot.cores[i] = np.transpose(tdot.cores[i], [3, 1, 2, 0])

        else:  # merge M into tdot
            # self keeps at least one core: M is merged into the core of self adjacent to the contracted ones
            if mode == 'last-first':
                tdot.cores = self.cores[:first_idx_self] + other.cores[last_idx_other + 1:]
                tdot.cores[first_idx_self - 1] = np.tensordot(tdot.cores[first_idx_self - 1], M, axes=([3], [0]))
            elif mode == 'last-last':
                tdot.cores = self.cores[:first_idx_self]
                tdot.cores[first_idx_self - 1] = np.tensordot(tdot.cores[first_idx_self - 1], M, axes=([3], [0]))
                tdot.cores.extend(other.cores[:first_idx_other][::-1])  # append the remaining cores of other
                for i in range(first_idx_self, len(tdot.cores)):  # they need to be rank-transposed
                    tdot.cores[i] = np.transpose(tdot.cores[i], [3, 1, 2, 0])
            elif mode == 'first-last':
                tdot.cores = self.cores[last_idx_self + 1:]
                tdot.cores[0] = np.tensordot(M, tdot.cores[0], axes=([0], [0]))
                tdot.cores = other.cores[:first_idx_other] + tdot.cores
            else:  # first-first
                tdot.cores = self.cores[last_idx_self + 1:]
                tdot.cores[0] = np.tensordot(M, tdot.cores[0], axes=([0], [0]))
                tdot.cores = other.cores[last_idx_other + 1:][::-1] + tdot.cores
                for i in range(other.order - num_axes):  # they need to be rank-transposed
                    tdot.cores[i] = np.transpose(tdot.cores[i], [3, 1, 2, 0])

        # define new order, row dimensions, column dimensions and ranks
        tdot.order = len(tdot.cores)
        tdot.row_dims = [tdot.cores[i].shape[1] for i in range(tdot.order)]
        tdot.col_dims = [tdot.cores[i].shape[2] for i in range(tdot.order)]
        tdot.ranks = [tdot.cores[i].shape[0] for i in range(tdot.order)] + [tdot.cores[-1].shape[3]]

        return tdot

    def rank_tensordot(self, matrix: np.ndarray, 
                       mode: str='last', 
                       overwrite: bool=False) -> 'TT':
        """
        Contract the first or last rank axis of self with a 2D array.

        For mode 'last', the last rank axis of the last core is contracted with the first axis of matrix; for
        mode 'first', the second axis of matrix is contracted with the first rank axis of the first core. Thus,
        this method is only useful in the unusual case where self.ranks[0] or self.ranks[-1] != 1. For example,
        these type of TT's appear as an output of the TT.svd method.

        Parameters
        ----------
        matrix: np.ndarray
            2D array
        mode: string
            one of the following: 'last', 'first'
        overwrite: bool
            whether to overwrite self or not, default is False

        Returns
        -------
        tdot : TT
            tensordot of self and matrix along the first/last rank axis of the first/last core of self

        Raises
        ------
        ValueError
            if matrix is not 2-dimensional, if mode is unknown, or if the contracted dimensions do not match
        """

        if len(matrix.shape) != 2:
            raise ValueError('argument matrix has to be 2D-Array')
        if mode not in ('last', 'first'):
            raise ValueError('unknown mode')

        # work on self or on a copy of self
        tdot = self.copy() if overwrite is False else self

        contract_last = (mode == 'last')

        # position of the affected core and the matrix dimension which has to equal its open rank
        core_idx = -1 if contract_last else 0
        required = matrix.shape[0] if contract_last else matrix.shape[1]
        if tdot.ranks[core_idx] != required:
            raise ValueError('dimensions do not match')

        if contract_last:
            # (r, m, n, k) x (k, l) -> (r, m, n, l)
            tdot.cores[-1] = np.tensordot(tdot.cores[-1], matrix, axes=([3], [0]))
        else:
            # (l, k) x (k, m, n, r) -> (l, m, n, r)
            tdot.cores[0] = np.tensordot(matrix, tdot.cores[0], axes=([1], [0]))

        # outer ranks may have changed
        tdot.ranks = [core.shape[0] for core in tdot.cores[:tdot.order]] + [tdot.cores[-1].shape[3]]

        return tdot

    def concatenate(self, other: Union['TT', List[np.ndarray]],
                    overwrite: bool=False) -> 'TT':
        """
        Expand the list of cores of self by appending more cores.

        If other is a TT, concatenate the cores of self and the cores of other.
        If other is a list of cores, the cores are appended to self.cores; an empty list appends nothing.
        For example, this method can be used to reconstruct the original tensor from u,s,v from TT.svd.

        The appended core arrays are not copied, i.e. the result shares them with other.

        Parameters
        ----------
        other : TT or list[np.ndarray]
            tensor train or list of 4-dimensional cores to append
        overwrite : bool, optional
            whether to overwrite self or not, default is False

        Returns
        -------
        TT
            tensor train consisting of the cores of self followed by the cores of other

        Raises
        ------
        TypeError
            if other is neither a TT nor a list
        ValueError
            if list elements of other are not 4-dimensional or their shapes do not match
        ValueError
            if the last rank of self does not match the first rank of other
        """

        # validate the cores to append before self is copied or modified
        if isinstance(other, TT):
            if self.ranks[-1] != other.ranks[0]:
                raise ValueError('ranks do not match!')
            new_cores = other.cores

        elif isinstance(other, list):
            # check if orders of list elements are correct
            if not all([core.ndim == 4 for core in other]):
                raise ValueError('list elements must be 4-dimensional arrays')
            # check if ranks are correct
            if not all([other[i].shape[3] == other[i + 1].shape[0] for i in range(len(other) - 1)]):
                raise ValueError('Shapes of list elements do not match.')
            # an empty list has no first core to compare with
            if other and self.ranks[-1] != other[0].shape[0]:
                raise ValueError('ranks do not match!')
            new_cores = other

        else:
            raise TypeError('Parameter must be either a TT or a list of cores.')

        # copy self
        tt = self.copy() if overwrite is False else self

        tt.cores.extend(new_cores)

        # update order, row dimensions, column dimensions and ranks
        tt.order = len(tt.cores)
        tt.row_dims = [core.shape[1] for core in tt.cores]
        tt.col_dims = [core.shape[2] for core in tt.cores]
        tt.ranks = [core.shape[0] for core in tt.cores] + [tt.cores[-1].shape[3]]

        return tt

    def transpose(self, 
                  cores: Optional[List[int]]=None, 
                  conjugate: bool=False,
                  overwrite: bool=False) -> 'TT':
        """
        Transpose of tensor trains.

        For every selected core, the row and the column axis are interchanged (optionally followed by a complex
        conjugation) and the corresponding entries of row_dims and col_dims are swapped.

        Parameters
        ----------
        cores : list[int], optional
            cores which should be transposed, if cores=None (default), all cores are transposed
        conjugate : bool, optional
            whether to compute the conjugate transpose, default is False
        overwrite : bool, optional
            whether to overwrite self or not, default is False

        Returns
        -------
        TT
            transpose of self

        Examples
        --------
        >>> import scikit_tt.tensor_train as tt
        >>> t = tt.ones([1, 2, 3], [4, 5, 6], ranks=[1, 7, 8, 1])
        >>> t.transpose()

        Tensor train with order    = 3,
                          row_dims = [4, 5, 6],
                          col_dims = [1, 2, 3],
                          ranks    = [1, 7, 8, 1]

        >>> t.transpose(cores=[0, 1])

        Tensor train with order    = 3,
                          row_dims = [4, 5, 3],
                          col_dims = [1, 2, 6],
                          ranks    = [1, 7, 8, 1]
        """

        # core numbers to process (all cores by default)
        selected = np.arange(0, self.order) if cores is None else cores

        # work on self or on a copy of self
        tt_transpose = self.copy() if overwrite is False else self

        for idx in range(self.order):

            if not np.isin(idx, selected):
                continue

            # permute second and third dimension of the core, then conjugate if requested
            swapped = np.transpose(tt_transpose.cores[idx], [0, 2, 1, 3])
            tt_transpose.cores[idx] = np.conj(swapped) if conjugate else swapped

            # interchange row and column dimensions
            tt_transpose.row_dims[idx], tt_transpose.col_dims[idx] = \
                tt_transpose.col_dims[idx], tt_transpose.row_dims[idx]

        return tt_transpose

    def rank_transpose(self, overwrite: bool=False) -> 'TT':
        """
        Computes the rank-transposed of self.

        The rank-transposed consists of the cores of self in reversed order, where the first and the last
        (rank) axis of every core are interchanged so that neighboring cores fit together again.

        Parameters
        ----------
        overwrite : bool, optional
            whether to overwrite self or not, default is False

        Returns
        -------
        TT
            rank-transpose of self

        Examples
        --------
        >>> import scikit_tt.tensor_train as tt
        >>> t = tt.ones([1, 2, 3], [4, 5, 6], ranks=[1, 7, 8, 1])
        >>> t.rank_transpose()

        Tensor train with order    = 3,
                  row_dims = [3, 2, 1],
                  col_dims = [6, 5, 4],
                  ranks    = [1, 8, 7, 1]
        """

        # work on self or on a copy of self
        result = self.copy() if overwrite is False else self

        # reverse the core sequence and swap the rank axes of each core; slice assignment keeps the
        # existing list objects in place
        result.cores[:] = [np.transpose(core, [3, 1, 2, 0]) for core in reversed(result.cores)]

        # dimensions and ranks follow the reversed core sequence
        for attribute in (result.row_dims, result.col_dims, result.ranks):
            attribute.reverse()

        return result

    def conj(self, overwrite: bool=False) -> 'TT':
        """
        Complex conjugate of tensor trains.

        Parameters
        ----------
        overwrite : bool, optional
            whether to overwrite self or not, default is False

        Returns
        -------
        TT
            complex conjugate of self
        """

        # copy self
        if overwrite is False:
            tt_conj = self.copy()
        else:
            tt_conj = self

        # conjugate each core
        for i in range(self.order):
            tt_conj.cores[i] = np.conj(tt_conj.cores[i])

        return tt_conj

    def isoperator(self) -> bool:
        """
        Operator check.

        Returns
        -------
        bool
            true if self is a TT operator
        """

        # check if all row dimensions or column dimensions of self are equal to 1
        op_bool = not (all([i == 1 for i in self.row_dims]) or all([i == 1 for i in self.col_dims]))

        return op_bool

    def copy(self) -> 'TT':
        """
        Deep copy of tensor trains.

        Returns
        -------
        TT
            deep copy of self
        """

        # copy TT cores
        cores = [self.cores[i].copy() for i in range(self.order)]

        # define copied version of self
        tt_copy = TT(cores)

        return tt_copy

    def element(self, indices: List[int]) -> float:
        """
        Single element of tensor trains.

        Parameters
        ----------
        indices : list[int]
            indices of a single entry of self ([x_1, ..., x_d, y_1, ..., y_d])

        Returns
        -------
        float
            single entry of self

        Raises
        ------
        TypeError
            if indices is not a list[int]
        ValueError
            if length of indices does not match the order of self
        IndexError
            if one or more indices are out of range
        """

        if isinstance(indices, list):

            # check is all indices are ints
            if np.all([isinstance(indices[i], (int, np.int32, np.int64)) for i in range(len(indices))]):

                # check if length of indices is correct
                if len(indices) == 2 * self.order:

                    # check if indices are in range
                    if np.all([indices[i] >= 0 for i in range(2 * self.order)]) and \
                            np.all([indices[i] < self.row_dims[i] for i in range(self.order)]) and \
                            np.all([indices[i + self.order] < self.col_dims[i] for i in range(self.order)]):

                        # construct matrix for first row and column indices
                        entry = np.squeeze(self.cores[0][:, indices[0], indices[self.order], :]).reshape(1,
                                                                                                         self.ranks[1])

                        # multiply with respective matrices for the following indices
                        for i in range(1, self.order):
                            entry = entry.dot(
                                np.squeeze(self.cores[i][:, indices[i], indices[self.order + i], :]).reshape(
                                    self.ranks[i], self.ranks[i + 1]))

                        entry = entry[0, 0]

                        return entry

                    else:
                        raise IndexError('Indices out of range.')

                else:
                    raise ValueError('Number of indices must be twice the order of the tensor train.')

            else:
                raise TypeError('Indices must be integers.')

        else:
            raise TypeError('Unsupported parameter.')

    def full(self) -> np.ndarray:
        """
        Conversion to full format.

        Returns
        -------
        full_tensor : np.ndarray
            full tensor representation of self (dimensions: m_1 x ... x m_d x n_1 x ... x n_d)
        """
        if self.ranks[0] != 1 or self.ranks[-1] != 1:
            raise ValueError("The first and last rank have to be 1!")

        # reshape first core
        full_tensor = self.cores[0].reshape(self.row_dims[0] * self.col_dims[0], self.ranks[1])

        for i in range(1, self.order):
            # contract full_tensor with next TT core and reshape
            full_tensor = full_tensor.dot(self.cores[i].reshape(self.ranks[i],
                                                                self.row_dims[i] * self.col_dims[i] * self.ranks[
                                                                    i + 1]))
            full_tensor = full_tensor.reshape(np.prod(self.row_dims[:i + 1]) * np.prod(self.col_dims[:i + 1]),
                                              self.ranks[i + 1])

        # reshape and transpose full_tensor
        p = [None] * 2 * self.order
        p[::2] = self.row_dims
        p[1::2] = self.col_dims
        q = [2 * i for i in range(self.order)] + [1 + 2 * i for i in range(self.order)]
        full_tensor = full_tensor.reshape(p).transpose(q)

        return full_tensor

    def matricize(self) -> np.ndarray:
        """
        Matricization of tensor trains.

        If self is a TT operator, then tt_mat is a matrix. Otherwise, the result is a vector.

        Returns
        -------
        np.ndarray
            matricization of self
        """

        # reshape first core
        tt_mat = self.cores[0].reshape(self.row_dims[0], self.col_dims[0], self.ranks[1])

        for i in range(1, self.order):
            # contract tt_mat with next TT core, permute and reshape
            tt_mat = np.tensordot(tt_mat, self.cores[i], axes=(2, 0))
            tt_mat = tt_mat.transpose([0, 2, 1, 3, 4]).reshape((np.prod(self.row_dims[:i + 1]),
                                                               np.prod(self.col_dims[:i + 1]), self.ranks[i + 1]))

        # reshape into vector or matrix
        m = np.prod(self.row_dims)
        n = np.prod(self.col_dims)
        if n == 1:
            tt_mat = tt_mat.reshape(m)
        else:
            tt_mat = tt_mat.reshape(m, n)

        return tt_mat

    def ortho_left(self, start_index: int=0, 
                   end_index: Optional[int]=None, 
                   threshold: float=0.0, 
                   max_rank: int=np.inf, 
                   progress: bool=False, 
                   string: str='Left-orthonormalization') -> 'TT':
        """
        Left-orthonormalization of tensor trains.

        For every core from start_index to end_index (inclusive), an SVD of the left unfolding is
        computed. The core is replaced by the (optionally truncated) left singular vectors and the
        remaining factor is contracted into the next core. Self is modified in place.

        Parameters
        ----------
        start_index : int, optional
            start index for orthonormalization, default is 0
        end_index : int, optional
            end index for orthonormalization, default is the index of the penultimate core
        threshold : float, optional
            threshold for reduced SVD decompositions (relative to the largest singular value),
            default is 0
        max_rank : int, optional
            maximum rank of the left-orthonormalized tensor train, default is np.inf
        progress : bool, optional
            whether to show progress bar, default is False
        string : string, optional
            title of the progress bar if progress is True

        Returns
        -------
        TT
            left-orthonormalized representation of self (self itself, modified in place)

        Raises
        ------
        TypeError
            if start_index or end_index are not integers
        ValueError
            if threshold is less than 0
        ValueError
            if max_rank is not a positive integer
        """

        # show progress
        start_time = utl.progress(string, 0, show=progress)

        # set end_index to the index of the penultimate core if not otherwise defined
        if end_index is None:
            end_index = self.order - 2

        # argument validation; the accepted types match those of ortho_right
        int_types = (int, np.int32, np.int64)
        if not (isinstance(start_index, int_types) and isinstance(end_index, int_types)):
            raise TypeError('Start and end indices must be integers.')

        if not (isinstance(threshold, int_types + (float, np.float32, np.float64)) and threshold >= 0):
            raise ValueError('Threshold must be greater or equal 0.')

        # np.inf instead of the alias np.infty, which was removed in NumPy 2.0
        if not ((isinstance(max_rank, int_types) and max_rank > 0) or max_rank == np.inf):
            raise ValueError('Maximum rank must be a positive integer.')

        for i in range(start_index, end_index + 1):

            # left unfolding of the ith TT core
            unfolding = self.cores[i].reshape(self.ranks[i] * self.row_dims[i] * self.col_dims[i],
                                              self.ranks[i + 1])

            # apply SVD to the unfolding; the first attempt must not overwrite its input because
            # the fallback driver has to see the unmodified data
            try:
                [u, s, v] = linalg.svd(unfolding, full_matrices=False, overwrite_a=False,
                                       check_finite=False)
            except (linalg.LinAlgError, ValueError):
                # default LAPACK driver failed, retry with the 'gesvd' driver
                [u, s, v] = linalg.svd(unfolding, full_matrices=False, overwrite_a=True,
                                       check_finite=False, lapack_driver='gesvd')

            # rank reduction
            if threshold != 0:
                indices = np.where(s / s[0] > threshold)[0]
                u = u[:, indices]
                s = s[indices]
                v = v[indices, :]
            if max_rank != np.inf:
                u = u[:, :np.minimum(u.shape[1], max_rank)]
                s = s[:np.minimum(s.shape[0], max_rank)]
                v = v[:np.minimum(v.shape[0], max_rank), :]

            # define updated rank and core
            self.ranks[i + 1] = u.shape[1]
            self.cores[i] = u.reshape(self.ranks[i], self.row_dims[i], self.col_dims[i], self.ranks[i + 1])

            # shift non-orthonormal part to next core
            self.cores[i + 1] = np.tensordot(np.diag(s).dot(v), self.cores[i + 1], axes=(1, 0))

            # show progress
            utl.progress(string + '... r=' + str(self.ranks[i + 1]),
                         100 * (i - start_index + 1) / (end_index - start_index + 1),
                         cpu_time=_time.time() - start_time, show=progress)

        return self

    def ortho_right(self, start_index: Optional[int]=None, 
                    end_index: int=1, 
                    threshold: float=0, 
                    max_rank: int=np.infty) -> 'TT':
        """
        Right-orthonormalization of tensor trains.

        Parameters
        ----------
        start_index : int, optional
            start index for orthonormalization, default is the index of the last core
        end_index : int, optional
            end index for orthonormalization, default is 1
        threshold : float, optional
            threshold for reduced SVD decompositions, default is 0
        max_rank : int, optional
            maximum rank of the left-orthonormalized tensor train, default is np.infty

        Returns
        -------
        TT
            right-orthonormalized representation of self

        Raises
        ------
        TypeError
            if start_index or end_index are not integers
        ValueError
            if threshold is less than 0
        ValueError
            if max_rank is not a positive integer
        """

        # set start_index to the index of the last core if not otherwise defined
        if start_index is None:
            start_index = self.order - 1

        if isinstance(start_index, (int, np.int32, np.int64)) and isinstance(end_index, (int, np.int32, np.int64)):

            if isinstance(threshold, (int, np.int32, np.int64, float, np.float32, np.float64)) and threshold >= 0:

                if (isinstance(max_rank, (int, np.int32, np.int64)) and max_rank > 0) or max_rank == np.infty:

                    for i in range(start_index, end_index - 1, -1):

                        # apply SVD to ith TT core
                        try:
                            [u, s, v] = linalg.svd(self.cores[i].reshape(self.ranks[i],
                                                                         self.row_dims[i] * self.col_dims[i] *
                                                                         self.ranks[i + 1]), full_matrices=False,
                                                   overwrite_a=True, check_finite=False)
                        except:
                            [u, s, v] = linalg.svd(self.cores[i].reshape(self.ranks[i],
                                                                         self.row_dims[i] * self.col_dims[i] *
                                                                         self.ranks[i + 1]), full_matrices=False,
                                                   overwrite_a=True, check_finite=False, lapack_driver='gesvd')

                        # rank reduction
                        if threshold != 0:
                            indices = np.where(s / s[0] > threshold)[0]
                            u = u[:, indices]
                            s = s[indices]
                            v = v[indices, :]
                        if max_rank != np.infty:
                            u = u[:, :np.minimum(u.shape[1], max_rank)]
                            s = s[:np.minimum(s.shape[0], max_rank)]
                            v = v[:np.minimum(v.shape[0], max_rank), :]

                        # define updated rank and core
                        self.ranks[i] = v.shape[0]
                        self.cores[i] = v.reshape(self.ranks[i], self.row_dims[i], self.col_dims[i], self.ranks[i + 1])

                        # shift non-orthonormal part to previous core
                        self.cores[i - 1] = self.cores[i - 1].reshape(
                            self.ranks[i - 1] * self.row_dims[i - 1] * self.col_dims[i - 1],
                            self.cores[i - 1].shape[3]).dot(u).dot(np.diag(s))
                        self.cores[i - 1] = self.cores[i - 1].reshape(self.ranks[i - 1], self.row_dims[i - 1],
                                                                      self.col_dims[i - 1], self.ranks[i])

                    return self

                else:
                    raise ValueError('Maximum rank must be a positive integer.')

            else:
                raise ValueError('Threshold must be greater or equal 0.')

        else:
            raise TypeError('Start and end indices must be integers.')

    def ortho(self, threshold: float=0, max_rank: int=np.inf) -> 'TT':
        """
        Left- and right-orthonormalization of tensor trains.

        Self is first left-orthonormalized (with the given threshold but without a rank bound)
        and then right-orthonormalized (with the given threshold and max_rank). Both sweeps modify
        self in place.

        Parameters
        ----------
        threshold : float, optional
            threshold for reduced SVD decompositions, default is 0
        max_rank : int, optional
            maximum rank applied during the right-orthonormalization, default is np.inf

        Returns
        -------
        TT
           right-orthonormalized representation of self (self itself, modified in place)

        Raises
        ------
        ValueError
            if threshold is less than 0
        ValueError
            if max_rank is not a positive integer
        """

        if not (isinstance(threshold, (int, np.int32, np.int64, float, np.float32, np.float64))
                and threshold >= 0):
            raise ValueError('Threshold must be greater or equal 0.')

        # np.inf instead of the alias np.infty, which was removed in NumPy 2.0
        if not ((isinstance(max_rank, (int, np.int32, np.int64)) and max_rank > 0) or max_rank == np.inf):
            raise ValueError('Maximum rank must be a positive integer.')

        # left- and right-orthonormalize self; the rank bound is only applied in the second sweep
        self.ortho_left(threshold=threshold, max_rank=np.inf).ortho_right(threshold=threshold,
                                                                          max_rank=max_rank)

        return self

    def norm(self, p: int=2) -> float:
        """
        Norm of tensor trains.

        Counterpart of matrix and vector norms. This function is able to return four different norms of tensor trains.

        Parameters
        ----------
        p : int
            order of the norm

        Returns
        -------
        float
            norm of self

        Notes
        -----
        The following norms can be calculated:

        ==== ====================== ===============================
        p    norm for tensor trains norm for tensor-train operators
        ==== ====================== ===============================
        1    Manhattan norm         maximum absolute column sum
        2    Eucildean norm         Frobenius norm
        ==== ====================== ===============================

        For the Manhattan norm, it is assumed that all entries of the tensor train are non-negative. The same holds for
        TT operators when computing the maximum column sum.

        Raises
        ------
        ValueError
            if p is not equal to 1 or 2

        Examples
        --------
        >>> import scikit_tt.tensor_train as tt
        >>> t = tt.ones([2, 2, 2], [3, 3, 3], ranks=4)
        >>> t.norm(p=1)
        128.0
        >>> t.norm(p=2)
        235.15101530718508
        """

        # copy self
        tt_tensor = self.copy()

        if p == 1:

            # Manhattan norm and maximum absolute column sum
            # ----------------------------------------------

            # transpose if necessary
            if all([i == 1 for i in self.row_dims]):
                tt_tensor = tt_tensor.transpose()

            # sum over row axes
            tt_tensor.cores = [
                np.sum(tt_tensor.cores[i], axis=1).reshape((tt_tensor.ranks[i], 1, tt_tensor.col_dims[i],
                                                           tt_tensor.ranks[i + 1])) for i in
                range(tt_tensor.order)]

            # define new row dimensions
            tt_tensor.row_dims = [1] * tt_tensor.order

            # matricize tensor train
            tt_tensor = tt_tensor.matricize()

            # compute norm
            norm = np.max(tt_tensor)

            return norm

        elif p == 2:

            # reshape cores if self is a TT operator
            if self.isoperator():
                cores = [
                    tt_tensor.cores[i].reshape(tt_tensor.ranks[i], tt_tensor.row_dims[i] * tt_tensor.col_dims[i], 1,
                                               tt_tensor.ranks[i + 1]) for i in range(tt_tensor.order)]
                tt_tensor = TT(cores)

            # Euclidean norm
            # --------------

            # right-orthonormalize tt_tensor
            tt_tensor = tt_tensor.ortho_right()

            # compute norm from first core
            norm = np.linalg.norm(
                tt_tensor.cores[0].reshape(tt_tensor.row_dims[0] * tt_tensor.col_dims[0] * tt_tensor.ranks[1]))

            return norm

        else:
            raise ValueError('p must be 1 or 2.')

    def tt2qtt(self, 
               row_dims: List[List[int]], 
               col_dims: List[List[int]], 
               threshold: float=0) -> 'TT':
        """
        Conversion from TT format into QTT format.

        Split the TT cores of a given tensor train in order to obtain a QTT representation.

        Example:

        Given a tensor train t with row dimensions m_1, ..., m_d and column dimensions n_1, ...,n_d,

            t_qtt = tt2qtt(t, [M_1, ..., M_d], [N_1, ..., N_d])

        defines a new instance of the TT class with dimensions given by the lists M_1, ..., M_d and N_1, ..., N_d,
        respectively. M_i and N_i are lists of ints such that np.prod(M_i) = m_i and np.prod(N_i)=n_i.

        Parameters
        ----------
        row_dims : list[list[int]]
            row dimensions for the QTT representation
        col_dims : list[list[int]]
            col dimensions for the QTT representation
        threshold : float, optional
            threshold for reduced SVD decompositions, default is 0

        Returns
        -------
        TT
            QTT representation of self
        """

        # define QTT cores and copy self
        qtt_cores = []
        tt_tensor = self.copy()

        # split TT cores of self
        # ----------------------

        for i in range(self.order):

            # define core, rank, row_dim, and col_dim
            core = tt_tensor.cores[i]
            rank = tt_tensor.ranks[i]
            row_dim = tt_tensor.row_dims[i]
            col_dim = tt_tensor.col_dims[i]

            # begin splitting
            for j in range(len(row_dims[i]) - 1):

                # set new row_dim and col_dim for reshape
                row_dim = int(row_dim / row_dims[i][j])
                col_dim = int(col_dim / col_dims[i][j])

                # reshape and transpose core
                core = core.reshape(rank, row_dims[i][j], row_dim, col_dims[i][j], col_dim,
                                    tt_tensor.ranks[i + 1]).transpose([0, 1, 3, 2, 4, 5])

                # apply SVD in order to split core
                [u, s, v] = linalg.svd(
                    core.reshape(rank * row_dims[i][j] * col_dims[i][j], row_dim * col_dim * tt_tensor.ranks[i + 1]),
                    full_matrices=False, overwrite_a=True, check_finite=False, lapack_driver='gesvd')

                # rank reduction
                if threshold != 0:
                    indices = np.where(s / s[0] > threshold)[0]
                    u = u[:, indices]
                    s = s[indices]
                    v = v[indices, :]

                # define QTT core
                qtt_cores.append(u.reshape(rank, row_dims[i][j], col_dims[i][j], s.shape[0]))

                # update residual core and rank
                core = np.diag(s).dot(v)
                rank = s.shape[0]

            # define last QTT core
            qtt_cores.append(core.reshape(rank, row_dim, col_dim, tt_tensor.ranks[i + 1]))

        # define quantized tensor train
        qtt_tensor = TT(qtt_cores)

        return qtt_tensor

    def qtt2tt(self, merge_numbers: List[int]) -> 'TT':
        """
        Conversion from QTT format into TT format.

        Contract the QTT cores of a given quantized tensor train in order to obtain a TT representation.

        Example:

        Given a quantized tensor train t with d cores,

            t_tt = qtt2tt(t, [c_1, ..., c_e])

        defines a new instance of the TT class with order e, i.e. qtt2tt merges the first c_1 cores, the second c_2
        cores, and so on.

        Parameters
        ----------
        merge_numbers : list[int]
            list of core numbers for contractions

        Returns
        -------
        TT
            TT representation of self
        """

        # define TT cores and copy self
        tt_cores = []
        qtt_tensor = self.copy()

        # contract cores of self
        # ----------------------

        # first index
        k = 0

        for i in range(len(merge_numbers)):

            # set new QTT core
            core = qtt_tensor.cores[k]

            # begin contractions
            for j in range(k + 1, k + merge_numbers[i]):
                # contract with next core and reshape
                core = np.tensordot(core, qtt_tensor.cores[j], axes=(3, 0)).transpose((0, 1, 3, 2, 4, 5))
                core = core.reshape((core.shape[0], core.shape[1] * core.shape[2], core.shape[3] * core.shape[4],
                                    core.shape[5]))

            # define TT core
            tt_cores.append(core)

            # increase contraction index
            k = k + merge_numbers[i]

        # define tensor train
        tt_tensor = TT(tt_cores)

        return tt_tensor

    def svd(self, 
            index:     int, 
            threshold: float=0.0, 
            max_rank:  int=np.infty, 
            ortho_l:   bool=True, 
            ortho_r:   bool=True, 
            overwrite: bool=False) -> Tuple['TT', 'TT', 'TT']: 
        """
        Computation of a global SVD of a tensor train.
        Construct a singular value decomposition of a (non-operator) tensor train t in the form of tensor networks u, s,
        and v such that, by contraction, t=u*diag(s)*v. See [1]_ and [2]_ for details.

        Parameters
        ----------
        index : int
            the cores 0 to index-1 represent the row dimensions and index to order-1 the column dimensions of the
            unfolded version of self
        threshold : float, optional
            threshold for reduced SVD decompositions, default is 0
        max_rank : int, optional
            maximal rank of reduced svd
        ortho_l: bool, optional
            whether to apply left-orthonormalization or not, default is True
        ortho_r : bool, optional
            whether to apply right-orthonormalization or not, default is True
        overwrite : bool, optional
            whether to overwrite self or not, default is False
        Returns
        -------
        u : TT
            left-orthonormal part of the global SVD
        s : np.ndarray
            vector of singular values of the global SVD
        v : TT
            right-orthonormal part of the global SVD
        References
        ----------
        .. [1] P. Gelß. "The Tensor-Train Format and Its Applications: Modeling and Analysis of Chemical Reaction
               Networks, Catalytic Processes, Fluid Flows, and Brownian Dynamics", Freie Universität Berlin, 2017
        .. [2] S. Klus, P. Gelß, S. Peitz, C. Schütte, "Tensor-based Dynamic Mode Decomposition", Nonlinearity 31 (7),
               2018
        """

        # copy self
        if overwrite is False:
            t = self.copy()
        else:
            t = self

        # left-orthonormalize cores 0 to index-2
        if ortho_l is True:
            t = t.ortho_left(end_index=index - 2, threshold=threshold, max_rank=max_rank)

        # right-orthonormalize cores index to order -1
        if ortho_r is True:
            t = t.ortho_right(end_index=index, threshold=threshold, max_rank=max_rank)

        # decompose (index-1)th core
        [u, s, v] = linalg.svd(t.cores[index - 1].reshape(t.ranks[index - 1] * t.row_dims[index - 1], t.ranks[index]),
                               full_matrices=False, overwrite_a=True, check_finite=False, lapack_driver='gesvd')

        # rank reduction
        if threshold != 0:
            indices = np.where(s / s[0] > threshold)[0]
            u = u[:, indices]
            s = s[indices]
            v = v[indices, :]
        if max_rank != np.infty:
            u = u[:, :np.minimum(u.shape[1], max_rank)]
            s = s[:np.minimum(s.shape[0], max_rank)]
            v = v[:np.minimum(v.shape[0], max_rank), :]

        # set new rank
        t.ranks[index] = u.shape[1]

        # update (index-1)th core
        t.cores[index - 1] = u.reshape(t.ranks[index - 1], t.row_dims[index - 1], 1, t.ranks[index])

        # update (index)th core
        t.cores[index] = np.tensordot(v, t.cores[index], axes=(1, 0))

        # contruct orthonormal parts of the global SVD
        u = TT(t.cores[:index])
        v = TT(t.cores[index:])

        return u, s, v

    def pinv(self, 
             index:     int, 
             threshold: float=0.0, 
             ortho_l:   bool=True,
             ortho_r:   bool=True,
             overwrite: bool=False) -> 'TT':
        """
        Computation of the pseudoinverse of a tensor train.

        Construct the pseudoinverse of a (non-operator) tensor train by a global SVD. See [1]_, [2]_ and [3]_ for
        details.

        Parameters
        ----------
        index : int
            the cores 0 to index-1 represent the row dimensions and index to order-1 the column dimensions of the
            unfolded version of self
        threshold : float, optional
            threshold for reduced SVD decompositions, default is 0
        ortho_l : bool, optional
            whether to apply left-orthonormalization or not, default is True
        ortho_r : bool, optional
            whether to apply right-orthonormalization or not, default is True
        overwrite : bool, optional
            whether to overwrite self or not, default is False

        Returns
        -------
        TT
            pseudoinverse of a given tensor train

        References
        ----------
        .. [1] P. Gelß. "The Tensor-Train Format and Its Applications: Modeling and Analysis of Chemical Reaction
               Networks, Catalytic Processes, Fluid Flows, and Brownian Dynamics", Freie Universität Berlin, 2017
        .. [2] S. Klus, P. Gelß, S. Peitz, C. Schütte, "Tensor-based Dynamic Mode Decomposition", Nonlinearity 31 (7),
               2018
        .. [3] P. Gelß, S. Klus, J. Eisert, C. Schütte, "Multidimensional Approximation of Nonlinear Dynamical Systems",
               arXiv:1809.02448, 2018
        """

        # compute gloabl SVD of self
        u, s, v = TT.svd(self, index, threshold=threshold, ortho_l=ortho_l, ortho_r=ortho_r, overwrite=overwrite)

        # define core list
        cores = u.cores + v.cores

        # contract s with (index)th core
        cores[index] = np.tensordot(np.diag(np.reciprocal(s)), cores[index], axes=(1, 0))

        # define tensor train
        p_inv = TT(cores)

        return p_inv
    
    def diag(self, t: 'TT', diag_list: List) -> 'TT':
        """
        Construction of diagonal MPO from MPS.

        Parameters
        ----------
        t: TT
            MPS decomposition
        diag_list: list
            cores to diagonalize

        Returns
        -------
        t_diag: TT
            MPO decomposition
        """

        cores = t.cores.copy()

        for i in diag_list:
            r1, d, _, r2 = cores[i].shape
            core_diag = np.zeros([r1,d,d,r2], dtype=complex)
            for k in range(r1):
                for l in range(r2):
                    core_diag[k,:,:,l] = np.diag(np.squeeze(cores[i][k,:,0,l]))
            cores[i] = core_diag

        t_diag = TT(cores)

        return t_diag
    

    def squeeze(self) -> 'TT':
        """
        Squeeze TT decomposition.

        Contract cores with row and column dimension 1 with neighboring cores.

        Parameters
        ----------
        t: TT
            TT decomposition

        Returns
        -------
        t_squeeze: TT
            Equivalent TT decomposition of the input tensor, all cores have either row
            or column dimension (or both) larger than 1.
        """

        # find cores with row and column dimension equal to 1
        no_mode_list = []
        for i in range(self.order):
            if self.row_dims[i] == 1 and self.col_dims[i] == 1:
                no_mode_list.append(i)

        # cores with row or column dimension (or both) larger than 1
        mode_list = list(np.setdiff1d(np.arange(self.order), no_mode_list))

        # append t.order for later loop
        mode_list += [self.order]

        # define core list
        cores = []

        # if first cores have row and column dimension equal to 1,
        # contract from the left with first relevant core
        if mode_list[0]>0:
            core_tmp = self.cores[0][0,0,0,:][None,:]
            for i in range(1,mode_list[0]):
                core_tmp = core_tmp@self.cores[i][:,0,0,:]
            self.cores[mode_list[0]] = np.tensordot(core_tmp, self.cores[mode_list[0]], axes=(1,0))

        # contract cores with row and column dimension with relevant cores from the right
        for i in range(len(mode_list)-1):
            core_tmp = self.cores[mode_list[i]]
            for j in range(mode_list[i]+1,mode_list[i+1]):
                core_tmp = core_tmp@self.cores[j][:,0,0,:]
            cores.append(core_tmp)

        # construct squeezed TT decomposition
        t_squeeze = TT(cores)

        return t_squeeze


# construction of specific tensor-train decompositions
# ----------------------------------------------------

def zeros(row_dims: List[int], col_dims: List[int], ranks: Union[int, List[int]]=1) -> 'TT':
    """
    Construct a tensor train whose cores contain only zeros.

    Parameters
    ----------
    row_dims : list[int]
        row dimensions of the cores
    col_dims : list[int]
        column dimensions of the cores
    ranks : int or list[int], optional
        either the complete list of ranks or a single number that is used for all inner ranks
        (the outer ranks are then set to 1), default is 1

    Returns
    -------
    TT
        tensor train with all core entries equal to zero
    """

    order = len(row_dims)

    # expand a single rank to the complete rank list [1, r, ..., r, 1]
    if not isinstance(ranks, list):
        ranks = [1] + [ranks] * (order - 1) + [1]

    # the i-th core has shape ranks[i] x row_dims[i] x col_dims[i] x ranks[i+1]
    cores = []
    for i in range(order):
        shape = (ranks[i], row_dims[i], col_dims[i], ranks[i + 1])
        cores.append(np.zeros(shape))

    return TT(cores)


def ones(row_dims: List[int], col_dims: List[int], ranks: Union[int, List[int]]=1) -> 'TT':
    """
    Construct a tensor train whose cores contain only ones.

    Parameters
    ----------
    row_dims : list[int]
        row dimensions of the cores
    col_dims : list[int]
        column dimensions of the cores
    ranks : int or list[int], optional
        either the complete list of ranks or a single number that is used for all inner ranks
        (the outer ranks are then set to 1), default is 1

    Returns
    -------
    TT
        tensor train with all core entries equal to one
    """

    num_cores = len(row_dims)

    # a scalar rank stands for the rank list [1, r, ..., r, 1]
    if not isinstance(ranks, list):
        inner_ranks = [ranks] * (num_cores - 1)
        ranks = [1] + inner_ranks + [1]

    # build the cores one after another, core k is of shape ranks[k] x row_dims[k] x col_dims[k] x ranks[k+1]
    cores = []
    for k in range(num_cores):
        cores.append(np.ones((ranks[k], row_dims[k], col_dims[k], ranks[k + 1])))

    return TT(cores)


def eye(dims: List[int]) -> 'TT':
    """
    Construct the identity operator in TT format.

    Every core has shape ``1 x dims[i] x dims[i] x 1`` and contains an identity matrix.

    Parameters
    ----------
    dims : list[int]
        row (and, at the same time, column) dimensions of the cores

    Returns
    -------
    TT
        identity tensor train with all ranks equal to 1
    """

    cores = []
    for dim in dims:
        # rank-one core whose only matrix slice is the identity
        core = np.zeros([1, dim, dim, 1])
        core[0, :, :, 0] = np.eye(dim)
        cores.append(core)

    return TT(cores)


def unit(dims: List[int], inds: List[int]) -> 'TT':
    """
    Canonical unit tensor.

    Construct a rank-one tensor train with column dimensions 1 in which, for every core, exactly
    the entry at the given row index is set to 1.

    Parameters
    ----------
    dims : list[int]
        row dimensions of the tensor train
    inds : list[int]
        row index of the 1 in each core

    Returns
    -------
    TT
        unit tensor train
    """

    # start from the all-zero tensor train with column dimensions 1 (and default ranks)
    tt_unit = zeros(dims, [1 for _ in dims])

    # place a single 1 in every core
    for k in range(tt_unit.order):
        core = tt_unit.cores[k]
        core[0, inds[k], 0, 0] = 1

    return tt_unit


def rand(row_dims : List[int], col_dims: List[int], ranks: Union[int, List[int]]=1) -> 'TT':
    """
    Construct a tensor train with random cores.

    The core entries are drawn with ``np.random.rand``, one core after another starting with the first.

    Parameters
    ----------
    row_dims : list[int]
        row dimensions of the cores
    col_dims : list[int]
        column dimensions of the cores
    ranks : int or list[int], optional
        either the complete list of ranks or a single number that is used for all inner ranks
        (the outer ranks are then set to 1), default is 1

    Returns
    -------
    TT
        random tensor train
    """

    order = len(row_dims)

    # turn a scalar rank into the rank list [1, r, ..., r, 1]
    if not isinstance(ranks, list):
        ranks = [1] + [ranks] * (order - 1) + [1]

    # draw the cores in ascending order, core i has shape ranks[i] x row_dims[i] x col_dims[i] x ranks[i+1]
    cores = []
    for i in range(order):
        core = np.random.rand(ranks[i], row_dims[i], col_dims[i], ranks[i + 1])
        cores.append(core)

    return TT(cores)


def canonical(row_dims: List[int], max_rank: int) -> 'TT':
    """
    Full-rank tensor train consisting of tensor products of the canonical basis.

    The cores of the left half and of the right half are reshaped rectangular identity matrices
    whose ranks grow towards the middle until they are capped by ``max_rank``. If the order is
    odd, the middle core is a reshaped rectangular identity connecting both halves.

    Note that for even order the last core of the left half and the first core of the right half
    are neighbors, i.e. their ranks only match if the rank accumulated over the left half equals
    the rank accumulated over the right half (e.g. if the row dimensions are symmetric).

    Parameters
    ----------
    row_dims : list[int]
        list of row dimensions of the canonical tensor train
    max_rank : int
        maximum rank of the TT decomposition

    Returns
    -------
    TT
        canonical tensor train (all column dimensions are 1)
    """

    order = len(row_dims)
    half = order // 2
    cores = [None] * order

    # left half: ranks grow from left to right
    rank_left = 1
    for i in range(half):
        num_rows = rank_left * row_dims[i]
        rank_next = np.amin([num_rows, max_rank])
        cores[i] = np.eye(num_rows, rank_next).reshape((rank_left, row_dims[i], 1, rank_next))
        rank_left = rank_next

    # right half: ranks grow from right to left
    rank_right = 1
    for i in range(1, half + 1):
        dim = row_dims[-i]
        rank_next = np.amin([rank_right * dim, max_rank])
        cores[-i] = np.eye(rank_next, dim * rank_right).reshape([rank_next, dim, 1, rank_right])
        rank_right = rank_next

    # odd order: the middle core links the ranks of both halves
    if order % 2 == 1:
        middle = np.eye(rank_left * row_dims[half], rank_right)
        cores[half] = middle.reshape([rank_left, row_dims[half], 1, rank_right])

    return TT(cores)


def uniform(row_dims: List[int], ranks: Union[int, List[int]]=1, norm: float=1) -> 'TT':
    """
    Uniformly distributed tensor train.

    All cores are constant arrays (column dimension 1) filled with the same value, which is chosen
    such that the resulting tensor train has the requested norm.

    Parameters
    ----------
    row_dims : list[int]
        list of row dimensions of the uniformly distributed tensor train
    ranks : int or list[int], optional
        either the complete list of ranks or a single number that is used for all inner ranks
        (the outer ranks are then set to 1), default is 1
    norm : float, optional
        norm of the uniformly distributed tensor train, default is 1

    Returns
    -------
    TT
        uniformly distributed tensor train
    """

    order = len(row_dims)

    # a scalar rank stands for the rank list [1, r, ..., r, 1]
    if not isinstance(ranks, list):
        ranks = [1] + [ranks] * (order - 1) + [1]

    # norm of the tensor train whose cores are filled with ones
    norm_of_ones = np.sqrt(np.prod(row_dims)) * np.prod(ranks)

    # distribute the required scaling evenly over all cores
    factor = (norm / norm_of_ones) ** np.true_divide(1, order)

    # constant cores of shape ranks[i] x row_dims[i] x 1 x ranks[i+1]
    cores = []
    for i in range(order):
        cores.append(factor * np.ones([ranks[i], row_dims[i], 1, ranks[i + 1]]))

    return TT(cores)


def residual_error(operator: 'TT', lhs: 'TT', rhs: 'TT') -> float:
    """
    Compute the residual error ||A@x-b|| in TT format. Since the ranks of A@x may be too large for storing
    the complete tensor train, the residual error is computed in a core-wise manner.

    The cores of A@x-b are assembled one at a time. After each core (except the last one), an SVD is
    applied and only the factor ``diag(s) @ v`` is carried over to the next core; the dropped factor has
    orthonormal columns and therefore does not change the norm.

    Parameters
    ----------
    operator : TT
        TT operator
    lhs : TT
        left-hand side in TT format, i.e. the tensor train x the operator is applied to
        (its cores are reshaped assuming column dimensions equal to 1)
    rhs : TT
        right-hand side in TT format (its cores are reshaped assuming column dimensions equal to 1)

    Returns
    -------
    error : float
        residual error

    Raises
    ------
    ValueError
        if the operator has no cores
    """

    order = operator.order
    if order < 1:
        raise ValueError('Tensor trains must consist of at least one core.')

    # factor carried over from the cores already processed
    M = None

    for i in range(order):

        # i-th core of A@x: contract column index of A with row index of x and merge the ranks
        Ax = np.tensordot(operator.cores[i], lhs.cores[i], axes=(2, 1)).transpose([0, 3, 1, 4, 2, 5])
        Ax = Ax.reshape([operator.ranks[i] * lhs.ranks[i],
                         operator.row_dims[i],
                         operator.ranks[i + 1] * lhs.ranks[i + 1]])

        # i-th core of b without column dimension
        b = rhs.cores[i].reshape(rhs.ranks[i], rhs.row_dims[i], rhs.ranks[i + 1])

        is_first = (i == 0)
        is_last = (i == order - 1)

        # i-th core of A@x-b
        if is_first and is_last:
            # only one core: the residual is given directly
            core = Ax - b
        elif is_first:
            # the sign of b is put into the first core
            core = np.concatenate((Ax, -b), axis=2)
        elif is_last:
            core = np.concatenate((Ax, b), axis=0)
        else:
            # block-diagonal arrangement of both cores with respect to the ranks
            core_1 = np.concatenate((Ax, np.zeros([Ax.shape[0], Ax.shape[1], b.shape[2]])), axis=2)
            core_2 = np.concatenate((np.zeros([b.shape[0], b.shape[1], Ax.shape[2]]), b), axis=2)
            core = np.concatenate((core_1, core_2), axis=0)

        # absorb the factor of the previous cores
        if not is_first:
            core = np.tensordot(M, core, axes=(1, 0))

        # the norm of the last (fully contracted) core is the residual error
        if is_last:
            return np.linalg.norm(core.flatten())

        # drop the orthonormal factor and pass diag(s) @ v to the next core
        _, s, v = linalg.svd(core.reshape([core.shape[0] * core.shape[1], core.shape[2]]),
                             full_matrices=False, overwrite_a=True, check_finite=False,
                             lapack_driver='gesvd')
        M = np.diag(s).dot(v)