A simple Monte Carlo example¶
Getting started¶
First get yourself set up with Python. You can use Google Colab through your own Google account or your CMU Andrew account, or you can install Python locally and run it on your computer.
Installing Python and Jupyter.¶
I prefer installing it locally. It runs about 10--50 times faster locally, even on my 5-year-old computer. You will need the following installed on your computer to run it locally:
- Python. (If you haven't used Python before, do a quick read through of the Beginner's Guide.)
- NumPy and SciPy (two numerical libraries), and matplotlib for plotting. (Both numpy and scipy recommend installing through Anaconda; your mileage may vary.)
- tqdm. (Technically this is not needed, but it's useful to show progress when you are iterating through a long loop -- something we will do often.) You may also need ipywidgets.
- Jupyter, in order to run your notebook.
You may already have each of these installed on your system, and your OS may have a simple way to install them directly. Once you have everything installed, launch Jupyter and load this notebook. In the menu, do Run → Restart Kernel and Run All Cells.
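If you want a quick sanity check that everything is importable before running the whole notebook, something like the following works in any Python session (the __version__ attribute is standard for all of these packages):
# Quick check that the required packages are installed.
import numpy, scipy, matplotlib, tqdm, ipywidgets
for module in (numpy, scipy, matplotlib, tqdm, ipywidgets):
    print( f'{module.__name__} {module.__version__}' )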
Using Colab¶
If you can't install it locally, then try using Colab. This is much, much slower, even if your own computer is old, so do this only if you can't get a local install working. Open https://colab.research.google.com/ and sign in, then import this notebook and open it. From Runtime at the top right, click Connect to a hosted runtime. After it connects, the Runtime menu should have a Run all option; click that.
Checking it works¶
Whichever method you use, you should run this notebook yourself and make sure the output looks similar to the HTML version posted on the class website. The notebook should run without any error messages. Don't worry about understanding what it does; we will step through it slowly in class.
%matplotlib inline
import numpy as np, matplotlib as mpl, scipy as sp
from matplotlib import pylab, mlab, pyplot as plt
from tqdm.notebook import tqdm, trange
from numpy import sqrt, pi, exp, log, floor, ceil, sin, cos
from numpy.linalg import norm
rng = np.random.default_rng()   # random number generator used throughout
Computing π¶
# Compute π by finding the area of the unit circle by quadrature.
N = 10000
# Divide [-1, 1]^2 into (roughly) N squares, and find their centers.
V = np.linspace( -1, 1, num=int(sqrt(N)) )
dx = V[1] - V[0]
V = dx/2 + V[:-1]
(xx, yy) = np.meshgrid( V, V)
plt.gca().add_artist( plt.Circle( (0, 0), 1, color='C1', alpha=.2, ec='k' ) )
plt.scatter( xx, yy, s=.5 )
n_inside = np.sum( sqrt( xx**2 + yy**2 ) < 1 )
_ = plt.title( f'$π \\approx {n_inside * dx**2}$' )
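As a rough error estimate for this grid: with about $\sqrt{N} = 100$ points per axis the spacing is $dx \approx 0.02$, and only the cells straddling the circle (roughly $2\pi/dx \approx 300$ of them, each of area $dx^2$) can be counted incorrectly. So the error is at most about $2\pi \, dx \approx 0.13$, and in practice much smaller since over- and under-counts largely cancel. This bound scales like $1/\sqrt{N}$ in two dimensions; in dimension $d$ it degrades to $1/N^{1/d}$, a point we return to at the end.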
# Compute π by choosing N random points uniformly in the square [-1, 1]^2 and
# checking how many lie inside the unit circle.  The fraction inside approaches
# (area of circle) / (area of square) = π/4, so π ≈ 4 * n_inside / N.
P = rng.uniform( low=-1, high=1, size=(2,N) )
plt.gca().add_artist( plt.Circle( (0, 0), 1, color='C1', alpha=.2, ec='k' ) )
plt.scatter( P[0], P[1], s=.1 )
n_inside = np.sum( norm(P, axis=0 ) < 1 )
_ = plt.title( f'{n_inside/N*100 :.2f}% points inside unit circle. $π \\approx {4*n_inside/N}$' )
%%time
P = rng.uniform( low=-1, high=1, size=(N, 2) )
NN = np.arange( 1, N+1, dtype=int )
π_approx = 4 * np.cumsum( norm(P,axis=1) < 1 ) / NN
CPU times: user 3.48 ms, sys: 16 μs, total: 3.49 ms Wall time: 2.16 ms
N0 = int(N//10)
plt.plot( NN[N0:], π_approx[N0:] )
_ = plt.title( 'Approximation of π as $N$ increases' )
Above we chose all $N$ points at the same time in the line
P = rng.uniform( low=-1, high=1, size=(N, 2) )
NumPy does that much faster than if you ran your own for loop, choosing one point (two random numbers) at a time. Let's do it that way and see how long it takes.
%%time
N = 10**6
# Memory friendly, but slow (in Python), way of computing π one point at a time.
n_inside = 0
prog = tqdm( range( N ), bar_format="{l_bar}{bar} {elapsed}<{remaining}, {rate_fmt}{postfix}" )
for n in prog:
    P = rng.uniform( -1, 1, size=2 )
    n_inside += ( norm(P) < 1 )
    prog.set_description_str( f'π≈{4*n_inside/(n+1):.6f}, error≈{abs( 4*n_inside/(n+1) - pi):.3e}', refresh=False )
CPU times: user 7.83 s, sys: 132 ms, total: 7.96 s Wall time: 7.91 s
On my computer it was a lot faster to choose all the points in one shot than to choose them one by one. The downside of choosing all the points in one shot is that it consumes a lot of memory. It's relatively common to choose $N \approx 10^9$, for instance; if you do that in one shot, it will cost you about 8GB of memory (8 bytes per double-precision number). If that's close to how much memory you have available, it's going to slow down your computer a lot.
One compromise is to do the MC simulation in chunks. That is, pick a small chunk_size, drop chunk_size points randomly, tally how many land inside, and iterate.
%%time
# Faster, memory friendly way of computing π in chunks.
# Can get even faster by parallelizing, but don't get carried away just yet.
chunk_size = int(N//100)
n_chunks = N // chunk_size # Choose N to be a multiple of chunk_size
n_inside = 0
prog = tqdm( range( n_chunks ), bar_format="{l_bar}{bar} {elapsed}<{remaining}, {rate_fmt}{postfix}" )
for n in prog:
    P = rng.uniform( -1, 1, size=(2, chunk_size) )
    n_inside += np.sum( norm(P, axis=0) < 1 )
    π_approx = n_inside / (n+1) / chunk_size * 4
    prog.set_description_str( f'π={π_approx:.6f}, error≈{abs(π_approx - pi):.3e}', refresh=False )
print( f'Memory used ≈ {P.nbytes / 2**20}mb' )
Memory used ≈ 0.152587890625mb CPU times: user 32.5 ms, sys: 72 μs, total: 32.6 ms Wall time: 31.2 ms
Visualizing the error as N gets large¶
Perform n_trials MC simulations for a large N, and visualize the error as N gets large.
n_trials = 10**3
N = 10**6
chunk_size = 10**4
NN = np.arange( chunk_size, N, chunk_size )
# Size of the results array π_approx (the temporary array P below is larger).
print( f'Roughly {len(NN) * n_trials * 8 / 2**20:.3f}mb memory required.' )
Roughly 0.755mb memory required.
π_approx = np.empty( (len(NN), n_trials) )
for i, n in tqdm( enumerate(NN), total=len(NN) ):
    # One more chunk of points for every trial at once: P has shape (2, chunk_size, n_trials).
    P = rng.uniform( -1, 1, size=(2, chunk_size, n_trials) )
    n_inside = np.sum( norm(P, axis=0) < 1, axis=0 )
    # Running average: after this chunk each trial has used n = NN[i] points in total,
    # and π_approx[i] = 4 * (total number inside) / n.
    if i == 0: π_approx[i] = n_inside / n * 4
    else: π_approx[i] = ( NN[i-1] * π_approx[i-1] + n_inside * 4 ) / n
π_avg = np.mean( π_approx, axis=-1 )
σ = np.std( π_approx, axis=-1 )
plt.fill_between( NN, π_avg - σ, π_avg + σ, alpha=.3, label='Std Dev' )
for n in sorted( rng.choice( n_trials, replace=False, size=3 ) ):
    plt.plot( NN, π_approx[:, n], alpha=.6, label=f'Trial {n+1}' )
plt.plot( NN, π_avg, label='Average' )
_ = plt.title( f'Approximation of π for {n_trials} trials' )
plt.legend()
plt.loglog( NN, σ, label='σ' )
a = np.polyfit( log(NN), log(σ), 1 )
plt.loglog( NN, exp( a[0]*log(NN) + a[1] ), '--', alpha=.5, label=f'${exp(a[1]):.2f}\\, N^{{ {a[0]:.3f} }}$' )
_= plt.xlabel( 'log $N$' )
_ = plt.title( f'log log plot of σ vs $N$' )
plt.legend()
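The fitted slope should come out close to $-1/2$: each sample point lands inside the circle with probability $\pi/4$, so by the central limit theorem the estimator $\frac{4}{N} \sum_{n=1}^N \mathbf{1}_{\{|X_n| < 1\}}$ has variance
$$ \frac{16}{N} \cdot \frac{\pi}{4} \Big( 1 - \frac{\pi}{4} \Big) = \frac{\pi (4 - \pi)}{N}, $$
i.e. standard deviation $\sqrt{\pi(4-\pi)} \, N^{-1/2} \approx 1.64 \, N^{-1/2}$. This is the $1/\sqrt{N}$ error rate of Monte Carlo methods.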
Volume of a $d$-dimensional ball¶
Let's now compute the volume of a $d$-dimensional ball in two ways.
- By quadrature: Divide the cube $[-1, 1]^d$ into (roughly) $N$ smaller cubes of equal side length, and count how many have their centers inside the unit ball.
- By Monte Carlo simulation: Choose $N$ points uniformly at random in $[-1, 1]^d$ and count how many lie inside the unit ball:
$$ \text{vol}(B(0, 1)) = \int_{[-1,1]^d} \mathbf{1}_{B(0, 1)}(x) \, dx = 2^d \lim_{N \to \infty} \frac{1}{N} \sum_{n = 1}^N \mathbf{1}_{B(0,1)}(X_n), $$
where $X_1, X_2, \dots$ are independent and uniformly distributed on $[-1, 1]^d$.
# Compute by quadrature.
N = 10**7 #Warning -- start with N small, and ensure you have enough memory.
d = 10
V_1d = np.linspace( -1, 1, num=int( ceil(N**(1/d)) ) )
dx = V_1d[1] - V_1d[0]
V_1d = dx/2 + V_1d[:-1] # Centers of squares in one axis
V = [ V_1d for _ in range(d) ]
xx = np.meshgrid( *V ) # Centers of squares in d dim
n_inside = np.sum( norm(xx, axis=0) < 1 )
vol = n_inside * dx**d
# Closed form volume from Wikipedia: https://en.wikipedia.org/wiki/Volume_of_an_n-ball
exact_vol = pi**(d/2) / sp.special.gamma( d/2 + 1 )
print( f'd={d}, Computed vol={vol:.3f}, exact vol={exact_vol:.3f}, error={abs(vol - exact_vol):.2e}' )
print( f'Memory used ≈ {d*xx[0].nbytes / 2**20}mb' )
del xx
d=10, Computed vol=3.071, exact vol=2.550, error=5.21e-01 Memory used ≈ 745.0580596923828mb
# Compute by Monte Carlo
d = 10
N = 10**7
exact_vol = pi**(d/2) / sp.special.gamma( d/2 + 1 )
chunk_size = 10**5
n_chunks = N // chunk_size # Choose N to be a multiple of chunk_size
n_inside = 0
prog = tqdm( range( n_chunks ), bar_format="{l_bar}{bar} {elapsed}<{remaining}, {rate_fmt}{postfix}" )
for n in prog:
    P = rng.uniform( -1, 1, size=(d, chunk_size) )
    n_inside += np.sum( norm(P, axis=0) < 1 )
    vol = n_inside / (n+1) / chunk_size * 2**d
    prog.set_description_str( f'vol={vol:.6f}, error≈{abs(vol-exact_vol):.3e}', refresh=False )
print( f'd={d}, Computed vol={vol:.6f}, exact vol={exact_vol:.6f}, error={abs(vol - exact_vol):.2e}' )
print( f'Memory used ≈ {P.nbytes / 2**20}mb' )
d=10, Computed vol=2.565734, exact vol=2.550164, error=1.56e-02 Memory used ≈ 7.62939453125mb
A few takeaways¶
- Quadrature works better in low dimensions (1 and 2).
- Quadrature becomes worse in higher dimensions: the error behaves like $1/N^{1/d}$. (With $N = 10^7$ and $d = 10$ that is only about 5 grid points along each axis, which explains the large error above.)
- Monte Carlo works better in higher dimensions: the error behaves like $1/\sqrt{N}$, independently of the dimension.
Practically, the above Monte Carlo method works up to about dimension 10--15, depending on how large you can make $N$. Beyond that, the ratio of the volume of the unit ball to the volume of the bounding box decreases exponentially with $d$, so in order to obtain a reasonable estimate you have to increase $N$ a lot to compensate. This is known as the curse of dimensionality, and you can read about it on Wikipedia.
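To see how quickly this bites, the following short computation (reusing pi and sp from the imports at the top) prints the fraction of the bounding cube $[-1, 1]^d$ occupied by the unit ball, i.e. the probability that a uniformly chosen point lands inside it. It drops from roughly $0.8$ when $d = 2$ to below $10^{-7}$ by $d = 20$.
# Fraction of the cube [-1, 1]^d occupied by the unit ball.  This is the
# probability that a uniform sample from the cube lands inside the ball.
for d in (2, 5, 10, 15, 20):
    ball_vol = pi**(d/2) / sp.special.gamma( d/2 + 1 )
    print( f'd={d:2d}: vol(ball) / vol(cube) = {ball_vol / 2**d:.2e}' )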
Note that in high dimensions most of your sample points lie outside the unit ball. You can get better results by tuning your sampling distribution, as sketched below.
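One standard way of doing this is importance sampling: draw the points from a proposal density $p$ that is concentrated near the ball, and average $\mathbf{1}_{B(0,1)}(X)/p(X)$ instead of counting hits. Below is a minimal sketch (reusing rng, np, sp and the functions imported at the top); the Gaussian proposal with scale $1/\sqrt{d}$ (chosen so a typical sample has norm close to 1) and the variable names are illustrative choices, not part of the notes above.
# Importance sampling sketch:  vol(B) = E[ 1_B(X) / p(X) ]  for X drawn from p.
# Here p is a centered Gaussian with standard deviation s = 1/sqrt(d) in each coordinate.
d = 20
N = 10**5
s = 1 / sqrt(d)
X = rng.normal( 0, s, size=(N, d) )
r2 = np.sum( X**2, axis=1 )
log_p = -d/2 * log( 2*pi*s**2 ) - r2 / (2*s**2)    # log of the proposal density at each sample
weights = np.where( r2 < 1, exp(-log_p), 0. )      # 1_B(X) / p(X)
vol = np.mean( weights )
exact_vol = pi**(d/2) / sp.special.gamma( d/2 + 1 )
print( f'd={d}, Computed vol={vol:.6f}, exact vol={exact_vol:.6f}, error={abs(vol - exact_vol):.2e}' )
With plain uniform sampling from the cube, essentially none of the $10^5$ points would land inside the ball when $d = 20$; the Gaussian proposal puts roughly half of them inside, at the cost of having to weight each hit by $1/p(X)$.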