# current input one-hot vector dimension
16*128*2+32*16+100

4708


# computation of the number of octaves needed for the encoding
import numpy as np
np.ceil(128/12.)

11.0


# dimensionality analysis -> basic (one)-hot encoding
16 + 11 + 12 + 2

41


2**8, 2**5

(256, 32)


f = (1./600)
fs = f/2
f,fs

(0.0016666666666666668, 0.0008333333333333334)


def get_upper_pow2(M):
    """Find the first power of two that is strictly greater than ``M``.

    @param M: value to bound from above
    @return tuple ``(n, i)`` where ``i == 2**n`` is the smallest power of
            two with ``i > M``; ``(0, 1)`` when ``M < 1``
    """
    exponent = 0
    # Grow the exponent until 2**exponent exceeds M.
    while (1 << exponent) <= M:
        exponent += 1
    return exponent, 1 << exponent

def get_lower_pow2(M):
    """Find the exponent of the largest power of two not exceeding ``M``.

    NOTE: the second element of the result is the first power of two that is
    strictly greater than ``M`` (i.e. ``2**(n + 1)``), not ``2**n``.

    @param M: value to bound from below
    @return tuple ``(n, i)`` with ``2**n <= M < i`` and ``i == 2**(n + 1)``;
            ``(-1, 1)`` when ``M < 1``
    """
    doublings = 0
    # Count how many doublings of 1 are needed to exceed M.
    while (1 << doublings) <= M:
        doublings += 1
    return doublings - 1, 1 << doublings


# For clip lengths of 1..10 minutes, show how many bits (and which power of
# two) are needed to index every millisecond of the clip.
for m in range (1,11): # iterating to show the vector dimension needed for each minute increment resolution
    M = m * 60 * 1000 # m minutes * 60 seconds per minute * 1000 ms per second -> duration in milliseconds
    n,i = get_upper_pow2(M)  # n: exponent, i: first power of two strictly greater than M
    print( m, n, i)  # columns: minutes, exponent, power of two

1 16 65536
2 17 131072
3 18 262144
4 18 262144
5 19 524288
6 19 524288
7 19 524288
8 19 524288
9 20 1048576
10 20 1048576


# and the smallest resolution:
get_lower_pow2(5)

(2, 8)


def get_upper_pow2(M):
    """Return the exponent of the first power of two strictly above ``M``.

    @param M: value to bound from above
    @return smallest integer ``n >= 0`` such that ``2**n > M``
    """
    power, exponent = 1, 0
    while power <= M:
        # Double the candidate and track its exponent in lockstep.
        power, exponent = power * 2, exponent + 1
    return exponent


def get_lower_pow2(m):
    """Return the exponent of the largest power of two not exceeding ``m``.

    @param m: value to bound from below
    @return largest integer ``n`` such that ``2**n <= m``; ``-1`` when ``m < 1``
    """
    power, exponent = 1, -1
    while power <= m:
        # Each doubling that still fits under m raises the exponent by one.
        power, exponent = power * 2, exponent + 1
    return exponent


class Lin2WaveEncoder():
    """
    Fourier Series Inspired Approximation of a linear function encoding.
    Takes the linear function as one period of a SawTooth-Wave and encodes
    the period with enough elements to approximate the function with the
    resolution needed for a (close to) perfect reconstruction of the input.

    One sinusoid is used per power-of-two period between the resolution
    implied by ``min_val`` and the range implied by ``max_val``.
    """
    def __init__(self, min_val, max_val, neg_allowed=True):
        """
        @param min_val: minimum value to encode
        @param max_val: maximum value to encode
        @param neg_allowed=True : allow negative values in the encoded vector. If False
                        will move the sinusoids to the range [0,1]
        """
        self.min = min_val
        self.max = max_val
        self.neg_allowed = neg_allowed
        # Built-in max() on purpose: np.max(a, b) treats ``b`` as the reduction
        # axis instead of a second operand, so it does not compare the values.
        # Relies on the exponent-only get_lower_pow2 / get_upper_pow2 helpers.
        self.n_low = max(1, get_lower_pow2(min_val))
        self.n_high = get_upper_pow2(max_val)
        self.n = self.n_high - self.n_low  # number of sinusoids in the encoding
        exponents = range(self.n_low, self.n_high)
        # Each period indicates a resolution level, this allows for different (time) scales.
        # Periods are chosen according to sampling -> maybe thirds and fifths of each
        # should be added to allow for more complex time pattern compositions.
        self.periods = [2**i for i in exponents]
        # Fourier divisor coefficients of the Series (just counting the elements)
        self.coefficients = [2*i for i in exponents]
        print(self.coefficients, self.periods)


    def encode(self, x):
        """
        @param x: input values to encode (scalar or array-like)
        @return array with one leading row per sinusoid, each row holding that
                sinusoid evaluated at the points of x; values lie in [-1,1],
                or in [0,1] when neg_allowed is False
        """
        # asarray so that lists are multiplied element-wise rather than repeated
        x = np.asarray(x)
        # Base term of a SawTooth Wave of period T Fourier Series.
        # NOTE: the original author observed that sin(x / T), i.e. without the
        # constant n, seemed to work better for the mix.
        ret = np.stack([np.sin(n * x / T)
                        for n, T in zip(self.coefficients, self.periods)])
        if not self.neg_allowed:
            ret = (ret + 1. ) / 2.  # pull all the encoded values in range [0,1]
        return ret

    def decode(self, vec):
        """
        @param vec: multi-dimensional input vector to decode into the original signal;
                    the first axis indexes the sinusoids, as returned by encode
        @return weighted sum of the components along the first axis
        """
        vec = np.asarray(vec)
        if not self.neg_allowed:
            # Undo the [0,1] remapping per component BEFORE the weighted sum:
            # the weights do not sum to one, so doing it afterwards would not
            # invert what encode() did.
            vec = (vec * 2.) - 1.
        # Scale factor of each term: T / n
        scale_factor = np.array([T / n for n, T in zip(self.coefficients, self.periods)])
        return np.sum(vec * scale_factor[:, None], axis=0)


# max_val = 1,000,000 -> 19 sinusoids (periods 2**1 .. 2**19, see the printed lists).
# NOTE(review): the earlier "10 seconds max -> 13 parameters" remark matches
# max_val = 10000 (presumably milliseconds) — confirm which range is intended.
we = Lin2WaveEncoder(1,1000000)

[2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30, 32, 34, 36, 38] [2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384, 32768, 65536, 131072, 262144, 524288]


l_short = np.linspace(0,np.pi,10000)  # for short periods the reconstruction works great -> this is already usable if the input is scaled to these kind of elements
l_long = np.linspace(0,10000,1000)  # for long periods this starts to work less and less well


import matplotlib.pyplot as plt
%matplotlib inline


plt.plot(l_short)

[<matplotlib.lines.Line2D at 0x7f47ffe61940>]


plt.plot(l_long)

[<matplotlib.lines.Line2D at 0x7f480802bf28>]


el_short = we.encode(l_short)
el_long  = we.encode(l_long)


el_short.shape, el_long.shape

((13, 10000), (13, 1000))


# Decode the *encoded* signals (not the raw inputs) so the plots below show
# the actual encode -> decode round trip.
dl_short = we.decode(el_short)
dl_long  = we.decode(el_long)


dl_short.shape, dl_long.shape

((10000,), (1000,))


plt.plot(dl_short)

[<matplotlib.lines.Line2D at 0x7f4808024278>]


plt.clf()
plt.plot(dl_long)

[<matplotlib.lines.Line2D at 0x7f4807f87978>]


def fourier10000(x, period=10000, n_terms=10):
    """Evaluate the truncated sine series of a sawtooth wave.

    Computes ``sum_{k=1..n_terms} -(period / (k*pi)) * sin(2*pi*k*x / period)``.
    With the defaults this is the 10-term series for period 10000 that was
    previously written out by hand (no constant term is included).

    @param x: scalar or array-like of points at which to evaluate the series
    @param period: period of the sawtooth wave (default 10000)
    @param n_terms: number of sine harmonics to sum (default 10)
    @return series value(s), with the same shape as ``x``
    """
    x = np.asarray(x, dtype=float)
    # Put the harmonic index on a new leading axis so it broadcasts against
    # x of any shape, then collapse that axis with the sum.
    k = np.arange(1, n_terms + 1).reshape((-1,) + (1,) * x.ndim)
    terms = -(period / (k * np.pi)) * np.sin(2 * np.pi * k * x / period)
    return terms.sum(axis=0)


fel_short = fourier10000(l_short)
fel_long = fourier10000(l_long)


plt.plot(fel_short)

[<matplotlib.lines.Line2D at 0x7f4807efb668>]


plt.plot(fel_long)

[<matplotlib.lines.Line2D at 0x7f4807ee05c0>]


import sympy
from sympy import fourier_series, pi
from sympy import abc
from sympy.plotting import plot as spplot


M = 1 # seconds
sm = fourier_series(abc.x, (abc.x, 0, M))
sm10k = fourier_series(abc.x, (abc.x, 0, 10000))


sm.truncate(10)

-sin(2*pi*x)/pi - sin(4*pi*x)/(2*pi) - sin(6*pi*x)/(3*pi) - sin(8*pi*x)/(4*pi) - sin(10*pi*x)/(5*pi) - sin(12*pi*x)/(6*pi) - sin(14*pi*x)/(7*pi) - sin(16*pi*x)/(8*pi) - sin(18*pi*x)/(9*pi) - sin(20*pi*x)/(10*pi)


from sympy import lambdify


fsm = lambdify(abc.x, sm.truncate(10), "numpy")


fsm(1)

7.796343665038751e-16


sm.truncate(10).args

(-sin(2*pi*x)/pi,
 -sin(4*pi*x)/(2*pi),
 -sin(6*pi*x)/(3*pi),
 -sin(8*pi*x)/(4*pi),
 -sin(10*pi*x)/(5*pi),
 -sin(12*pi*x)/(6*pi),
 -sin(14*pi*x)/(7*pi),
 -sin(16*pi*x)/(8*pi),
 -sin(18*pi*x)/(9*pi),
 -sin(20*pi*x)/(10*pi))


sm.truncate(10).args[0].args

(-1, 1/pi, sin(2*pi*x))


sm10k.truncate(10).args

(-10000*sin(pi*x/5000)/pi,
 -5000*sin(pi*x/2500)/pi,
 -2500*sin(pi*x/1250)/pi,
 -2000*sin(pi*x/1000)/pi,
 -1250*sin(pi*x/625)/pi,
 -1000*sin(pi*x/500)/pi,
 -10000*sin(3*pi*x/5000)/(3*pi),
 -10000*sin(7*pi*x/5000)/(7*pi),
 -10000*sin(9*pi*x/5000)/(9*pi),
 -5000*sin(3*pi*x/2500)/(3*pi))


f1 = sm10k.truncate(10).args[0]


# np.prod replaces np.product (deprecated alias, removed in NumPy 2.0);
# multiplies every factor of the term except the trailing sin(...)
np.prod(f1.args[:-1])

-10000/pi


# For each series term: (symbolic coefficient, numpy-callable for its sin(...) factor).
# np.prod replaces np.product (deprecated alias, removed in NumPy 2.0).
coef_fact = [ (np.prod(f.args[:-1]),  lambdify(abc.x, f.args[-1], "numpy")  ) for f in sm10k.truncate(10).args]


z1,z2 = zip(*coef_fact)

z1

(-10000/pi,
 -5000/pi,
 -2500/pi,
 -2000/pi,
 -1250/pi,
 -1000/pi,
 -10000/(3*pi),
 -10000/(7*pi),
 -10000/(9*pi),
 -5000/(3*pi))


lambdify(abc.x, z1[0], "numpy")(0)

-3183.098861837907


pi.evalf()

3.14159265358979


sm10k.truncate(10)

-10000*sin(pi*x/5000)/pi - 5000*sin(pi*x/2500)/pi - 10000*sin(3*pi*x/5000)/(3*pi) - 2500*sin(pi*x/1250)/pi - 2000*sin(pi*x/1000)/pi - 5000*sin(3*pi*x/2500)/(3*pi) - 10000*sin(7*pi*x/5000)/(7*pi) - 1250*sin(pi*x/625)/pi - 10000*sin(9*pi*x/5000)/(9*pi) - 1000*sin(pi*x/500)/pi


sm.scale(10000).truncate(10)

-10000*sin(2*pi*x)/pi - 5000*sin(4*pi*x)/pi - 10000*sin(6*pi*x)/(3*pi) - 2500*sin(8*pi*x)/pi - 2000*sin(10*pi*x)/pi - 5000*sin(12*pi*x)/(3*pi) - 10000*sin(14*pi*x)/(7*pi) - 1250*sin(16*pi*x)/pi - 10000*sin(18*pi*x)/(9*pi) - 1000*sin(20*pi*x)/pi


sm.truncate(10).evalf(1)

-0.3*sin(2*pi*x) - 0.2*sin(4*pi*x) - 0.1*sin(6*pi*x) - 0.08*sin(8*pi*x) - 0.06*sin(10*pi*x) - 0.05*sin(12*pi*x) - 0.05*sin(14*pi*x) - 0.04*sin(16*pi*x) - 0.04*sin(18*pi*x) - 0.03*sin(20*pi*x)


s = fourier_series(abc.x, (abc.x, 0, pi))


s.scale(10).truncate(10)

-10*sin(2*x) - 5*sin(4*x) - 10*sin(6*x)/3 - 5*sin(8*x)/2 - 2*sin(10*x) - 5*sin(12*x)/3 - 10*sin(14*x)/7 - 5*sin(16*x)/4 - 10*sin(18*x)/9 - sin(20*x)


s.truncate(20)

-sin(2*x) - sin(4*x)/2 - sin(6*x)/3 - sin(8*x)/4 - sin(10*x)/5 - sin(12*x)/6 - sin(14*x)/7 - sin(16*x)/8 - sin(18*x)/9 - sin(20*x)/10 - sin(22*x)/11 - sin(24*x)/12 - sin(26*x)/13 - sin(28*x)/14 - sin(30*x)/15 - sin(32*x)/16 - sin(34*x)/17 - sin(36*x)/18 - sin(38*x)/19 - sin(40*x)/20

MIDI encoding analysis¶

TLDR:¶

Introduction¶

Basic Idea Description¶

Codes:¶

Encoding Problems & Questions¶

Feature candidates for One-hot Encoding¶

Velocity encoding¶

One-Hot encoding of Velocity¶

Sinusoidal (Fourier Inspired) Encoding of Velocity¶

Time encoding¶

Why not linear encoding?¶

Time resolution Analysis¶

Time encoding details¶

Intuition¶

Reference Formulas¶

Hypothesis (not yet proven; work in progress)¶

WARNING¶

Other tools (python)¶