A simple Monte Carlo example¶

Getting started¶

First get yourself set up with Python. You can use [Google Colab](https://colab.google/) with your own Google account or your CMU Andrew account, or you can install Python locally and run it on your computer.

Using Colab¶

Open https://colab.research.google.com/, and sign in. Then import this notebook.

Installing locally¶

I prefer installing it locally, but your mileage may vary. To run the notebook locally you will need the following installed (one possible install command is sketched after this list):

  1. Python. (If you haven't used Python before, do a quick read-through of the Beginner's Guide.)
  2. NumPy and SciPy (two numerical libraries), and matplotlib for plotting. (Both NumPy and SciPy recommend installing through Anaconda; your mileage may vary.)
  3. tqdm. (Technically this is not needed, but it's useful to show progress when you are iterating through a long loop -- something we will do often.)
  4. Jupyter, in order to run your notebook.
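
If you use pip, the following installs everything at once (a sketch, and only one of many ways; conda users would use conda install instead):

In [ ]:
# One possible install command; the ! prefix runs it from a notebook cell.
# Drop the ! to run it in a terminal instead. Adjust to your package manager.
!pip install numpy scipy matplotlib tqdm jupyter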

You may already have each of these installed on your system, and your OS may have a simple way to install these directly. Once you have everything installed, launch Jupyter and load this notebook. In the menu, select Run → Restart Kernel and Run All Cells.

Running this notebook¶

Whichever method you use, you should run this notebook yourself and make sure the output looks similar to the HTML version posted on the class website. Once this notebook is loaded in Jupyter, go to the menu and select Run → Restart Kernel and Run All Cells. The notebook should run without any error messages (a warning about %pylab being deprecated is OK).

Don't worry about understanding what it does yet; we will step through it slowly in class.

In [1]:
%pylab inline
from tqdm.notebook import tqdm, trange
import scipy as sp

rng = random.default_rng()
%pylab is deprecated, use %matplotlib inline and import the required libraries.
Populating the interactive namespace from numpy and matplotlib
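
The deprecation warning is harmless. If you prefer explicit imports, the following is roughly the equivalent of what this notebook actually uses from %pylab (a sketch; %pylab pulls in many more names than these):

In [ ]:
# Explicit equivalents of the %pylab names used in this notebook (a sketch).
%matplotlib inline
from numpy import (linspace, meshgrid, arange, cumsum, sqrt, exp, log, pi,
                   sum, mean, std, empty, polyfit, ceil, random)
from numpy.linalg import norm
from matplotlib.pyplot import (gca, scatter, plot, loglog, fill_between,
                               title, xlabel, legend, Circle)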

Computing π¶

In [2]:
# Compute π by finding the area of the unit circle by quadrature.
N = 10000

# Divide [-1, 1]^2 into (roughly) N squares, and find their centers.
V = linspace( -1, 1, num=int(sqrt(N)) )
dx = V[1] - V[0]
V = dx/2 + V[:-1]
(xx, yy) = meshgrid( V, V)

gca().add_artist( Circle( (0, 0), 1, color='C1', alpha=.2, ec='k' ) )
scatter( xx, yy, s=.5 )

n_inside = sum( sqrt( xx**2 + yy**2 ) < 1 )
_ = title( f'$π \\approx {n_inside * dx**2}$' )
[Figure: quadrature grid points and the unit circle; the title shows the resulting approximation of π]
In [3]:
# Compute π by choosing random points in the square [-1, 1]^2, and checking how many lie inside the unit circle
N = 10000
P = rng.uniform( low=-1, high=1, size=(2,N) )

gca().add_artist( Circle( (0, 0), 1, color='C1', alpha=.2, ec='k' ) )
scatter( P[0], P[1], s=.5 )

n_inside = sum( norm(P, axis=0 ) < 1 )
_ = title( f'{n_inside/N*100 :.2f}% points inside unit circle. $π \\approx {4*n_inside/N}$' )
[Figure: random points in the square and the unit circle; the title shows the fraction inside and the approximation of π]
In [4]:
%%time

N = 10**6
P = rng.uniform( low=-1, high=1, size=(N, 2) )
NN = arange( 1, N+1, dtype=int )
π_approx = 4 * cumsum( norm(P,axis=1) < 1 ) / NN
CPU times: user 24 ms, sys: 17.1 ms, total: 41.1 ms
Wall time: 39.9 ms
In [5]:
plot( NN[1000:], π_approx[1000:] )
_ = title( 'Approximation of π as $N$ increases' )
[Figure: approximation of π as N increases]

Above we chose all $N$ points at the same time in the line

P = rng.uniform( low=-1, high=1, size=(N, 2) )

NumPy does that much faster than if you ran your own for loop, choosing one point (two coordinates) at a time. Let's do it one point at a time and see how long it takes.

In [6]:
%%time

# Memory friendly, but slow (in Python) way of computing
N = 10**6
n_inside = 0
prog = tqdm( range( N ), bar_format="{l_bar}{bar} {elapsed}<{remaining}, {rate_fmt}{postfix}" )
for n in prog:
    P = rng.uniform( -1, 1, size=2 )
    n_inside += ( norm(P) < 1 )
    prog.set_description_str( f'π≈{4*n_inside/(n+1):.6f}, error≈{abs( 4*n_inside/(n+1) - pi):.3e}', refresh=False )
CPU times: user 5.29 s, sys: 83.2 ms, total: 5.38 s
Wall time: 5.31 s

On my computer it was a lot faster to choose all points in one shot than to choose them one by one. The downside of choosing all points in one shot is that it consumes a lot of memory. It's relatively common to choose $N \approx 10^9$, for instance; if you do that in one shot, it will cost you about 16GB of memory (two float64 coordinates per point, at 8 bytes each). If that's close to how much memory you have available, it's going to slow down your computer a lot.
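
As a quick sanity check of that number (my arithmetic, not output from this notebook):

In [ ]:
# Memory needed to draw N points in 2D as float64, computed without allocating anything.
N = 10**9
print( f'{N * 2 * 8 / 1e9:.0f}GB' )   # 2 coordinates/point × 8 bytes/coordinate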

One compromise is to do the MC simulation in chunks. That is, pick a small chunk_size, sample chunk_size random points at a time, and iterate.

In [7]:
%%time
# Faster, memory friendly way of computing
# Can get even faster by parallelizing, but don't get carried away.

N = 10**8
chunk_size = 10**5
n_chunks = N // chunk_size # Choose N to be a multiple of chunk_size

n_inside = 0
prog = tqdm( range( n_chunks ), bar_format="{l_bar}{bar} {elapsed}<{remaining}, {rate_fmt}{postfix}" )
for n in prog:
    P = rng.uniform( -1, 1, size=(2, chunk_size) )
    n_inside += sum( norm(P, axis=0) < 1 )

    π_approx = n_inside / (n+1) / chunk_size * 4
    prog.set_description_str( f'π={π_approx:.6f}, error≈{abs(π_approx - pi):.3e}', refresh=False )

print( f'Memory used ≈ {P.nbytes / 2**20}mb' )
Memory used ≈ 1.52587890625mb
CPU times: user 1.09 s, sys: 6.46 ms, total: 1.09 s
Wall time: 1.09 s

Visualizing the error as N gets large¶

Perform n_trials independent MC simulations, and visualize how the error behaves as N gets large.

In [8]:
n_trials = 10**3
N = 10**6
chunk_size = 10**4
NN = arange( chunk_size, N, chunk_size )

print( f'Roughly {len(NN) * n_trials * 8 / 2**20:.3f}mb memory required.' )
Roughly 0.755mb memory required.
In [9]:
π_approx = empty( (len(NN), n_trials) )

for i, n in tqdm( enumerate(NN), total=len(NN) ):
    P = rng.uniform( -1, 1, size=(2, chunk_size, n_trials) )
    n_inside = sum( norm(P, axis=0) < 1, axis=0 )
    if i == 0: π_approx[i] = n_inside / n * 4
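    # Running average: fold this chunk's counts into the estimate built from the first NN[i-1] points.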
    else: π_approx[i] = (NN[i-1]* π_approx[i-1] + n_inside *4 ) / n

π_avg = mean( π_approx, axis=-1 )
σ = std( π_approx, axis=-1 )
In [10]:
fill_between( NN, π_avg - σ, π_avg + σ, alpha=.3, label='Std Dev' )
for n in range( 3 ):
    plot( NN, π_approx[:, n], alpha=.6, label=f'Trial {n+1}' )

plot( NN, π_avg, label='Average' )
_ = title( f'Approximation of π for {n_trials} trials' )
legend()
Out[10]:
<matplotlib.legend.Legend at 0x7ff9c0381ed0>
[Figure: three individual trials, their average, and a ±σ band, plotted against N]
In [11]:
loglog( NN, σ, label='σ' )

a = polyfit( log(NN), log(σ), 1 )
loglog( NN, exp( a[0]*log(NN) + a[1] ), '--', alpha=.5, label=f'${exp(a[1]):.2f}\\, N^{{ {a[0]:.3f} }}$' )

_ = xlabel( 'log $N$' )
_ = title( 'log-log plot of σ vs $N$' )
legend()
Out[11]:
<matplotlib.legend.Legend at 0x7ff9c0281190>
[Figure: log-log plot of σ vs N, with the fitted power law]

Volume of a $d$-dimensional ball¶

Let's now compute the volume of a $d$-dimensional ball in two ways.

  1. By quadrature: Divide the $d$-dimensional cube $[-1, 1]^d$ into (roughly) $N$ cubes of equal side length, and count how many have centers inside the unit ball.

  2. By Monte Carlo simulation: Randomly choose $N$ points uniformly from the cube and count how many lie inside the unit ball:

$$ \text{vol}(B(0, 1)) = \int_{[-1,1]^d} \mathbf{1}_{B(0, 1)}(x) \, dx = \lim_{N \to \infty} \frac{2^d}{N} \sum_{n = 1}^N \mathbf{1}_{B(0,1)}(X_n), $$

where the points $X_n$ are independent and uniformly distributed on $[-1, 1]^d$.
In [12]:
# Compute by quadrature.
N = 10**7 #Warning -- start with N small, and ensure you have enough memory.
d = 10

V_1d = linspace( -1, 1, num=int( ceil(N**(1/d)) ) )
dx = V_1d[1] - V_1d[0]
V_1d = dx/2 + V_1d[:-1] # Centers of squares in one axis

V = [ V_1d for _ in range(d) ]
xx = meshgrid( *V ) # Centers of squares in d dim

n_inside = sum( norm(xx, axis=0) < 1 )
vol = n_inside * dx**d

# Closed form volume from Wikipedia: https://en.wikipedia.org/wiki/Volume_of_an_n-ball
exact_vol = pi**(d/2) / sp.special.gamma( d/2 + 1 )
print( f'd={d}, Computed vol={vol:.3f}, exact vol={exact_vol:.3f}, error={abs(vol - exact_vol):.2e}' )
print( f'Memory used ≈ {d*xx[0].nbytes / 2**20}mb' )

del xx
d=10, Computed vol=3.071, exact vol=2.550, error=5.21e-01
Memory used ≈ 745.0580596923828mb
In [13]:
# Compute by Monte Carlo
d = 10
N = 10**7

exact_vol = pi**(d/2) / sp.special.gamma( d/2 + 1 )

chunk_size = 10**5
n_chunks = N // chunk_size # Choose N to be a multiple of chunk_size

n_inside = 0
prog = tqdm( range( n_chunks ), bar_format="{l_bar}{bar} {elapsed}<{remaining}, {rate_fmt}{postfix}" )
for n in prog:
    P = rng.uniform( -1, 1, size=(d, chunk_size) )
    n_inside += sum( norm(P, axis=0) < 1 )

    vol = n_inside / (n+1) / chunk_size * 2**d
    prog.set_description_str( f'vol={vol:.6f}, error≈{abs(vol-exact_vol):.3e}', refresh=False )

print( f'd={d}, Computed vol={vol:.3f}, exact vol={exact_vol:.3f}, error={abs(vol - exact_vol):.2e}' )
print( f'Memory used ≈ {P.nbytes / 2**20}mb' )
d=10, Computed vol=2.549, exact vol=2.550, error=9.16e-04
Memory used ≈ 7.62939453125mb

A few takeaways¶

  1. Quadrature works better in low dimensions (1 and 2).
  2. Quadrature becomes worse in higher dimensions: the error behaves like $1/N^{1/d}$.
  3. Monte Carlo works better in higher dimensions: the error behaves like $1/\sqrt{N}$. (See the back-of-the-envelope comparison below.)
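
To see what these rates mean (my arithmetic, using the rates above): to reach an error of about $\epsilon$, quadrature needs $N \sim \epsilon^{-d}$ points, while Monte Carlo needs $N \sim \epsilon^{-2}$ regardless of $d$.

In [ ]:
# Points needed for error ≈ ε, using the rates above (illustrative only).
ε, d = 1e-2, 10
print( f'Quadrature:  N ~ ε**-d = {ε**-d:.0e}' )    # error ~ N**(-1/d)
print( f'Monte Carlo: N ~ ε**-2 = {ε**-2:.0e}' )    # error ~ N**(-1/2)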

Practically, the above Monte Carlo method works until about dimension 10–15, depending on how large you can make $N$. Beyond that, the volume of the unit ball is extremely small (it decreases exponentially with $d$), so in order to make the relative error small you have to increase $N$ a lot to compensate. This is known as the curse of dimensionality, and you can read about it on Wikipedia.
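
You can see how quickly the ball shrinks relative to the cube using the closed-form volume from above:

In [ ]:
# Fraction of the cube [-1, 1]^d occupied by the unit ball, for a few d.
for d in (2, 5, 10, 20):
    frac = pi**(d/2) / sp.special.gamma( d/2 + 1 ) / 2**d
    print( f'd={d:2}: fraction of cube inside ball ≈ {frac:.2e}' )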

Note that in high dimensions most of your sample points lie outside the unit ball. You can get better results by tuning your sampling distribution; this is known as importance sampling.
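
For instance, here is a minimal importance sampling sketch (not part of the original notebook; the Gaussian proposal and the width σ are hypothetical tuning choices): sample from a distribution concentrated near the ball, and reweight each point by the sampling density.

In [ ]:
# Importance sampling sketch: vol(B) = E[ 1_B(X) / q(X) ] when X has density q.
# Assumptions: Gaussian proposal with σ tuned by hand for d = 10.
d, N, σ = 10, 10**6, 0.35
X = rng.normal( scale=σ, size=(N, d) )
r2 = sum( X**2, axis=1 )
q = (2*pi*σ**2)**(-d/2) * exp( -r2 / (2*σ**2) )   # proposal density at each sample
vol = mean( (r2 < 1) / q )
print( f'vol ≈ {vol:.3f}, exact ≈ {pi**(d/2) / sp.special.gamma(d/2 + 1):.3f}' )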
