irpjast/testing_svd.org

#+TITLE: Testing Svd
#+title:     Testing SVD
#+author:    Vijay Gopal Chilkuri
#+email:     vijay.gopal.c@gmail.com

* Generate a block random distribution of positions

Here's a small function to generate random points inside a 3D box of given length.

#+name: generate3Dpoints
#+begin_src python


def get_sphere_distribution(n, dmin, Ls, maxiter=1e4, allow_wall=True):
    """Get random points in a box with given dimensions and minimum separation.

    Parameters:

    - n: number of points
    - dmin: minimum distance
    - Ls: dimensions of box, shape (3,) array
    - maxiter: maximum number of iterations.
    - allow_wall: whether to allow points on wall;
       (if False: points need to keep distance dmin/2 from the walls.)

    Return:

    - ps: array (n, 3) of point positions,
      with 0 <= ps[:, i] < Ls[i]
    - n_iter: number of iterations
    - dratio: average nearest-neighbor distance, divided by dmin.

    Note: with a fill density (sphere volume divided by box volume) above about
    0.53, it takes very long. (Random close-packed spheres have a fill density
    of 0.64).

    Author: Han-Kwang Nienhuys (2020)
    Copying: BSD, GPL, LGPL, CC-BY, CC-BY-SA
    See Stackoverflow: https://stackoverflow.com/a/62895898/6228891
    """
    Ls = np.array(Ls).reshape(3)
    if not allow_wall:
        Ls -= dmin

    # filling factor; 0.64 is for random close-packed spheres
    # This is an estimate because close packing is complicated near the walls.
    # It doesn't work well for small L/dmin ratios.
    sphere_vol = np.pi/6*dmin**3
    box_vol = np.prod(Ls + 0.5*dmin)
    fill_dens = n*sphere_vol/box_vol
    if fill_dens > 0.64:
        msg = f'Too many to fit in the volume, density {fill_dens:.3g}>0.64'
        raise ValueError(msg)

    # initial try
    ps = np.random.uniform(size=(n, 3)) * Ls

    # distance-squared matrix (diagonal is self-distance, don't count)
    dsq = ((ps - ps.reshape(n, 1, 3))**2).sum(axis=2)
    dsq[np.arange(n), np.arange(n)] = np.infty

    for iter_no in range(int(maxiter)):
        # find points that have too close neighbors
        close_counts = np.sum(dsq < dmin**2, axis=1)  # shape (n,)
        n_close = np.count_nonzero(close_counts)
        if n_close == 0:
            break

        # Move the one with the largest number of too-close neighbors
        imv = np.argmax(close_counts)

        # new positions
        newp = np.random.uniform(size=3)*Ls
        ps[imv]= newp

        # update distance matrix
        new_dsq_row = ((ps - newp.reshape(1, 3))**2).sum(axis=-1)
        dsq[imv, :] = dsq[:, imv] = new_dsq_row
        dsq[imv, imv] = np.inf
    else:
        raise RuntimeError(f'Failed after {iter_no+1} iterations.')

    if not allow_wall:
        ps += dmin/2

    dratio = (np.sqrt(dsq.min(axis=1))/dmin).mean()
    return ps, iter_no+1, dratio
#+end_src

A function that generates a block random set of points

#+name: generateBlocks
#+begin_src python :noweb yes

<<generate3Dpoints>>

def generateBlockRandomPointsAtShftApart(n,L1,dmin,shift):
    """
    Parameters:

    - n: number of points
    - L1: dimensions of box, shape (3,) array
    - dmin: minimum intra block distance
    - shift: inter block distance

    Return:

    - r: array (n, 3) of point positions,

    """

    Ls = np.array([L1,L1,L1]) # lengths of the box

    # Quadrant +,+
    dist11,a,b = get_sphere_distribution(n,dmin,Ls)
    dist11 += np.array([shift,shift,0.0])

    # Quadrant -,+
    dist21,a,b = get_sphere_distribution(n,dmin,Ls)
    dist21 += np.array([-shift,shift,0.0])

    # Quadrant +,-
    dist12,a,b = get_sphere_distribution(n,dmin,Ls)
    dist12 += np.array([shift,-shift,0.0])

    # Quadrant -,-
    dist22,a,b = get_sphere_distribution(n,dmin,Ls)
    dist22 += np.array([-shift,-shift,0.0])

    xs = np.concatenate((dist11[:,0],dist12[:,0],dist21[:,0],dist22[:,0]))
    ys = np.concatenate((dist11[:,1],dist12[:,1],dist21[:,1],dist22[:,1]))
    zs = np.concatenate((dist11[:,2],dist12[:,2],dist21[:,2],dist22[:,2]))

    return((np.array((xs,ys,zs))).T)
#+end_src

#+RESULTS: generateBlocks
#+begin_example
None
#+end_example

#+begin_src python :noweb yes :results file :exports results
import numpy as np
# matplotlib related
import matplotlib.pyplot as plt

<<generateBlocks>>

L1 = 1.0
n = 100 # number of points
dmin = 0.1 # min dist between points
Ls = np.array([L1,L1,L1]) # lengths of the box
shift = -10.0
kappa = 2.0

rlist = generateBlockRandomPointsAtShftApart(n,L1,dmin,shift)
print(rlist.shape)

fig = plt.figure()
ax = fig.add_subplot(111, projection='3d')

xs = rlist.T[0]
ys = rlist.T[1]
zs = rlist.T[2]
ax.scatter(xs, ys, zs, marker='o')

fig.savefig('/tmp/test8.png')
#plt.show()
return '/tmp/test8.png'
#+end_src

#+RESULTS:
[[file:/tmp/test8.png]]

#+begin_src python :noweb yes :results file :exports results

# matplotlib related
import matplotlib.pyplot as plt
# linear algebra
import numpy as np

<<generate3Dpoints>>

shift = -1.0

# Quadrant +,+
L1 = 1.0
n = 50 # number of points
dmin = 0.1 # min dist between points
Ls = np.array([L1,L1,L1]) # lengths of the box
dist11,a,b = get_sphere_distribution(n,dmin,Ls)
dist11 += np.array([shift,shift,0.0])

# Quadrant -,+
L1 = 1.0
n = 50 # number of points
dmin = 0.1 # min dist between points
Ls = np.array([L1,L1,L1]) # lengths of the box
dist21,a,b = get_sphere_distribution(n,dmin,Ls)
dist21 += np.array([-shift,shift,0.0])

# Quadrant +,-
L1 = 1.0
n = 50 # number of points
dmin = 0.1 # min dist between points
Ls = np.array([L1,L1,L1]) # lengths of the box
dist12,a,b = get_sphere_distribution(n,dmin,Ls)
dist12 += np.array([shift,-shift,0.0])

# Quadrant -,-
L1 = 1.0
n = 50 # number of points
dmin = 0.1 # min dist between points
Ls = np.array([L1,L1,L1]) # lengths of the box
dist22,a,b = get_sphere_distribution(n,dmin,Ls)
dist22 += np.array([-shift,-shift,0.0])


fig = plt.figure()
ax = fig.add_subplot(111, projection='3d')

xs = np.concatenate((dist11[:,0],dist12[:,0],dist21[:,0],dist22[:,0]))
ys = np.concatenate((dist11[:,1],dist12[:,1],dist21[:,1],dist22[:,1]))
zs = np.concatenate((dist11[:,2],dist12[:,2],dist21[:,2],dist22[:,2]))
ax.scatter(xs, ys, zs, marker='o')

fig.savefig('/tmp/test3.png')
#plt.show()
return '/tmp/test3.png'
#+end_src

#+RESULTS:
[[file:/tmp/test3.png]]

* Is the SVD decomposition of distances really useful ?

The problem is the following:

** Given a metric F(r1,r2) finding the best representatin of F(r1,r2)

*** Slater metric

The metric can be a scaled distance such as

\[
F(r_1,r_2) = \exp(-\kappa(|r_1 - r_2|))
\]

Where,\(\kappa\) is the rate of the breadth of the slater.

#+begin_src python :results file :exports results
# matplotlib related
import matplotlib
import matplotlib.pyplot as plt
# linear algebra
import numpy

# Data for plotting

kappa  = 1.0/2.0
xstart = 0.0
xend   = 2.0
xstep  = 0.1
s = numpy.array(list(map(lambda x : numpy.exp(-x * numpy.arange(xstart,xend,xstep)), [100, 25, 10,5,2,1]))).T
#s = numpy.exp(-kappa * numpy.arange(0,1,0.1))
t = numpy.arange(xstart,xend,xstep)

fig, ax = plt.subplots()
ax.plot(t, s)

ax.set(xlabel=r'$r_{12}$', ylabel=r'$F(r_1,r_2)$',
       title='Comparison of Kappa')
#ax.set_yscale('log')
ax.grid()

fig.savefig('/tmp/test1.png')
#plt.show()
return '/tmp/test1.png'
#+end_src

#+RESULTS:
[[file:/tmp/test1.png]]


*** Gaussian metric

The metric can be a scaled distance such as

\[
F(r_1,r_2) = \exp(-\kappa(|r_1 - r_2|^2))
\]

Where,\(\kappa\) is the rate of the breadth of the gaussian.

#+begin_src python :results file :exports results
# matplotlib related
import matplotlib
import matplotlib.pyplot as plt
# linear algebra
import numpy

# Data for plotting

kappa  = 1.0/2.0
xstart = 0.0
xend   = 2.0
xstep  = 0.1
s = numpy.array(list(map(lambda x : numpy.exp(-x * numpy.power(numpy.arange(xstart,xend,xstep),2)), [100, 25, 10,5,2,1]))).T
#s = numpy.exp(-kappa * numpy.arange(0,1,0.1))
t = numpy.arange(xstart,xend,xstep)


fig, ax = plt.subplots()
ax.plot(t, s)

ax.set(xlabel=r'$r_{12}$', ylabel=r'$F(r_1,r_2)$',
       title='Comparison of Kappa')
#ax.set_yscale('log')
ax.grid()

fig.savefig('/tmp/test2.png')
#plt.show()
return '/tmp/test2.png'
#+end_src

#+RESULTS:
[[file:/tmp/test2.png]]

* Generating a box of electrons centered around nucleii

** Generate randomly distributed nucleii

The nucleii will serve as anchors for the screening of distances for calculating the
screened \(\tilde{F}(r_1,r_2)\) metric.


* Calculating SVD of the distance vector

** Slater metric

Calculate the matrix of the \(F(r_1,r_2)\) metric i.e. the slater metric.

#+begin_src python :noweb yes :results file :exports results
import numpy as np
from functools import reduce
import matplotlib.pyplot as plt

<<generateBlocks>>

L1 = 1.0
n = 10 # number of points
dmin = 0.01 # min dist between points
Ls = np.array([L1,L1,L1]) # lengths of the box
shift = -1.0
kappa = 0.6

rlist = generateBlockRandomPointsAtShftApart(n,L1,dmin,shift)
print(rlist.shape)

rij = np.zeros(shape=(rlist.shape[0],rlist.shape[0]))

def funcF(x,y):
    return(np.exp(-kappa * np.linalg.norm(x-y)))

rij = np.array([[funcF(xval, yval) for yval in rlist] for xval in rlist])

u,d,vt = np.linalg.svd(rij)
#print(d)
#plt.imshow(rij)
#plt.colorbar()
#plt.show()
plt.plot(range(d.shape[0]),d)
plt.yscale('log')
plt.savefig('/tmp/plot3.png')
return '/tmp/plot3.png'
#+end_src

#+RESULTS:
[[file:/tmp/plot3.png]]

#+begin_src python :results output
import numpy
a = numpy.array([[1,2,3],[4,5,6],[7,8,9]])
b = numpy.array([[11,12,13],[14,15,16],[17,18,19]])
print(list(zip(a,b))[0][1])
print(numpy.square(a[:,0]))

def stepExp(a):
    def myexp(x):
        if numpy.abs(x) > 1e+0:
            return numpy.zeros_like(x)
        else:
            return numpy.exp(x)

    res = numpy.array([[myexp(x) for x in y] for y in a])
    return(res)

print(numpy.exp(a))
print(stepExp(a))
#+end_src

#+RESULTS:
#+begin_example
[11 12 13]
[ 1 16 49]
[[2.71828183e+00 7.38905610e+00 2.00855369e+01]
 [5.45981500e+01 1.48413159e+02 4.03428793e+02]
 [1.09663316e+03 2.98095799e+03 8.10308393e+03]]
[[2.71828183 0.         0.        ]
 [0.         0.         0.        ]
 [0.         0.         0.        ]]
#+end_example

** Gaussian metric

Calculate the matrix of the \(FG(r_1,r_2)\) metric i.e. the gaussian metric.

#+begin_src python :noweb yes :results file :exports results
import numpy as np
from functools import reduce
import matplotlib.pyplot as plt

<<generateBlocks>>

L1 = 1.0
n = 100 # number of points
dmin = 0.1 # min dist between points
Ls = np.array([L1,L1,L1]) # lengths of the box
shift = -10.0
kappa = 2.0

rlist = generateBlockRandomPointsAtShftApart(n,L1,dmin,shift)
print(rlist.shape)

rij = np.zeros(shape=(rlist.shape[0],rlist.shape[0]))

def funcF(x,y):
    return(np.exp(-kappa * np.linalg.norm(x-y)))

def funcFG(x,y):
    return(np.exp(-kappa * np.square(np.linalg.norm(x-y))))

def funcFGD(x,y):
    rij = np.exp(-kappa * 0.1 * np.square(np.linalg.norm(x-y)))
    return(rij)

rijSlater = np.array([[funcF(xval, yval) for yval in rlist] for xval in rlist])
rijGaussian = np.array([[funcFG(xval, yval) for yval in rlist] for xval in rlist])
rijDeltafn = np.array([[funcFGD(xval, yval) for yval in rlist] for xval in rlist])

u,dS,vt = np.linalg.svd(rijSlater)
dS = dS/np.linalg.norm(dS)
u,dG,vt = np.linalg.svd(rijGaussian)
dG = dG/np.linalg.norm(dG)
u,dGD,vt = np.linalg.svd(rijDeltafn)
dGD = dGD/np.linalg.norm(dGD)

#print(d)
#plt.imshow(rij)
#plt.colorbar()
#plt.show()
plt.plot(range(dG.shape[0]),np.array([dS,dG,dGD]).T)
plt.yscale('log')
plt.savefig('/tmp/plot4.png')
return '/tmp/plot4.png'
#+end_src

#+RESULTS:
[[file:/tmp/plot4.png]]

** Palying around

Calculate the matrix of the \(FG(r_1,r_2)\) metric i.e. the gaussian metric.

#+begin_src python :noweb yes :results file :exports results
import numpy as np
from functools import reduce
import matplotlib.pyplot as plt

<<generateBlocks>>

L1 = 1.0
n = 100 # number of points
dmin = 0.1 # min dist between points
Ls = np.array([L1,L1,L1]) # lengths of the box
shift = -1.0
kappa = 2.0

rlist = generateBlockRandomPointsAtShftApart(n,L1,dmin,shift)
print(rlist.shape)

rij = np.zeros(shape=(rlist.shape[0],rlist.shape[0]))


def funcF(x,y):
    rij = np.exp(-kappa * np.linalg.norm(x-y))
    return(rij)

def funcFG(x,y):
    rij = np.exp(-kappa * np.square(np.linalg.norm(x-y)))
    return(rij)

def myexp(x):
    if np.abs(x) > 1e-0:
        return np.exp(-x)
    else:
        return np.exp(x)

def funcFGD(x,y):
    rij = myexp(-kappa * np.square(np.linalg.norm(x-y)))
    return(rij)

rijSlater = np.array([[funcF(xval, yval) for yval in rlist] for xval in rlist])
#rijSlater = rijSlater/np.max(rijSlater)
rijGaussian = np.array([[funcFG(xval, yval) for yval in rlist] for xval in rlist])
#rijGaussian = rijGaussian/np.max(rijGaussian)
rijDeltafn = np.array([[funcFGD(xval, yval) for yval in rlist] for xval in rlist])
#rijDeltafn = rijDeltafn/np.max(rijDeltafn)

u,dS,vt = np.linalg.svd(rijSlater)
dS = dS/np.linalg.norm(dS)
u,dG,vt = np.linalg.svd(rijGaussian)
dG = dG/np.linalg.norm(dG)
u,dGD,vt = np.linalg.svd(rijDeltafn)
dGD = dGD/np.linalg.norm(dGD)

#print(d)
#plt.imshow(rij)
#plt.colorbar()
#plt.show()
plt.plot(range(dG.shape[0]),np.array([dS,dG,dGD]).T)
plt.yscale('log')
plt.savefig('/tmp/plot5.png')
return '/tmp/plot5.png'
#+end_src

#+RESULTS:
[[file:/tmp/plot5.png]]
#+begin_src python :results file :exports results
import numpy
import matplotlib.pyplot as plt

def myexp2(x):
    if numpy.abs(x) > 1e-0:
        return numpy.exp(-x)
    else:
        return numpy.exp(x)

def myexp(x):
    return(numpy.array([myexp2(y) for y in x]))

kappa  = 1.0/2.0
xstart = 0.0
xend   = 2.0
xstep  = 0.1
s = numpy.array(list(map(lambda x : myexp(-x * numpy.power(numpy.arange(xstart,xend,xstep),2)), [10,5,1,0.5,0.1]))).T
#s = numpy.exp(-kappa * numpy.arange(0,1,0.1))
t = numpy.arange(xstart,xend,xstep)


fig, ax = plt.subplots()
ax.plot(t, s)

ax.set(xlabel=r'$r_{12}$', ylabel=r'$F(r_1,r_2)$',
       title='Comparison of Kappa')
ax.set_yscale('log')
ax.grid()

fig.savefig('/tmp/test7.png')
#plt.show()
return '/tmp/test7.png'
#+end_src

#+RESULTS:
[[file:/tmp/test7.png]]

** Testing SVD for custom matrices

#+begin_src python :results output
import numpy
import matplotlib.pyplot as plt

a = numpy.array([[0,100,200],[100,0,200],[100,200,0]])
b = numpy.exp(-a)
print("Matrix A")
print(a)
print("Matrix Exp(A)")
print(numpy.around(b,10))
u,d,vt = numpy.linalg.svd(a)
d = d/numpy.linalg.norm(d)
print("Singular values of A")
print(numpy.around(d,3))
print("Singular vectors of A")
print(numpy.around(u,3))
u,d,vt = numpy.linalg.svd(b)
d = d/numpy.linalg.norm(d)
print("Singular values of Exp(A)")
print(numpy.around(d,3))
print("Singular vectors of Exp(A)")
print(numpy.around(u,3))
#+end_src

#+RESULTS:
#+begin_example
Matrix A
[[  0 100 200]
 [100   0 200]
 [100 200   0]]
Matrix Exp(A)
[[1. 0. 0.]
 [0. 1. 0.]
 [0. 0. 1.]]
Singular values of A
[0.813 0.53  0.24 ]
Singular vectors of A
[[-0.67   0.142  0.728]
 [-0.626  0.42  -0.657]
 [-0.399 -0.896 -0.193]]
Singular values of Exp(A)
[0.577 0.577 0.577]
Singular vectors of Exp(A)
[[-1.     0.    -0.   ]
 [-0.    -0.894 -0.447]
 [-0.    -0.447  0.894]]
#+end_example