Part 3: Analysis
In this post we will analyze the data generated in the previous posts. In a perfect zero-noise setting, we might expect a power law decay [1, 2] in the NRMSE with the number of signals. When the effect of noise is factored in, the behavior of the system changes, reflecting the degraded effectiveness of each signal due to the noise. We will empirically observe the form of this degradation, as well as offer a simple analytic model.
[1] - Kaplan, Jared, et al. "Scaling laws for neural language models." arXiv preprint arXiv:2001.08361 (2020).
[2] - Hoffmann, Jordan, et al. "Training compute-optimal large language models." arXiv preprint arXiv:2203.15556 (2022).
A simple model is to assume that each sample is corrupted with noise with some probability $p$. This degradation can then be quantified by counting combinations of signals that remain unaffected by noise. Using simple combinatorial logic, there are ${n \choose k}$ product signals we can form by multiplying together subsets of $k$ of the $n$ signals, and the probability that such a product remains noise-free is $(1-p)^k$. That is, the expected number of uncorrupted signals $s(n)$ is given roughly as:
$s(n) = \sum_{k=1}^n {n\choose k} (1-p)^k$
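As a quick sanity check, here is a small snippet that evaluates $s(n)$ directly; the particular values of $n$ and $p$ below are arbitrary and chosen only for illustration.
from math import comb

def expected_uncorrupted_signals(n, p):
    """s(n) = sum_{k=1}^{n} (n choose k) (1 - p)^k."""
    return sum(comb(n, k) * (1 - p)**k for k in range(1, n + 1))

# Arbitrary illustrative values of the noise probability p and number of signals n.
for p in (0.1, 0.5, 0.9):
    print(f"p = {p}:", [round(expected_uncorrupted_signals(n, p), 1) for n in (5, 10, 20)])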
When the summands in $s(n)$ above are sharply peaked around a single value of $k$, the expected number of uncorrupted signals will consequently scale polynomially in $n$, since ${n \choose k} = \frac{n(n-1)\cdots(n-k+1)}{k!}$ is a degree-$k$ polynomial in $n$. Of course, if the peak $k$ is proportional to $n$, then the sum is in fact exponential; whether this happens depends on how large $p$ is, and we discuss this below. Intuitively, there is a trade-off between the growth of the binomial coefficient and the decay due to the exponentiated probability, which produces a peak in the summands. Below we plot the values of the terms ${n \choose k}(1-p)^k$ for each noise level, normalized so that the curves are comparable.
import numpy as np
from math import comb
import matplotlib.pyplot as plt
import scipy.linalg

num_points = 10   # number of noise strengths to sweep over
num_terms = 100   # n, the total number of signals
p_values = np.linspace(.05, 1, num_points)
# Terms (n choose k)(1-p)^k for k = 1..n, one column per noise strength p.
vals = np.array([[comb(num_terms, i + 1) * (1 - p)**(i + 1) for i in range(num_terms)] for p in p_values]).T
# Normalize each column so the curves are comparable (small constant added for numerical stability).
vals /= (scipy.linalg.norm(vals, axis=0) + .01)
# Peak index (the dominant degree k) for each noise strength.
np.argmax(vals, axis=0)
plt.plot(vals, label=np.round(p_values, 2))
plt.xlabel('polynomial power k')
plt.ylabel('normalized value, proportional to (n choose k)(1-p)^k')
plt.title('Counting the expected number of signals associated with binomial coefficients')
plt.legend(title='noise strength')
plt.savefig('fig1')
from PIL import Image
img = Image.open('fig1.png');
img.convert("RGB")
We can then take the index of the maximum term and plot the relationship between that peak index, i.e. the degree $k$ with the largest expected number of uncorrupted signals, and the noise strength. As the noise increases, the distribution shifts to the left, and at $p=1$ all signals are corrupted. As $p$ approaches $0$, the number of uncorrupted signals grows exponentially, because the peak sits near $k = n/2$ and ${n \choose n/2}$ is approximately exponential in $n$. Hence the scaling is not monomial for small probabilities, and we will ignore that regime for the rest of this notebook (the sweeps start at $p=.05$).
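For reference, a standard Stirling-type estimate for the central binomial coefficient (taking $n$ even) makes the exponential growth explicit:
${n \choose n/2} \approx 2^n \sqrt{\frac{2}{\pi n}}$
so when essentially every subset survives the noise, the middle terms alone already contribute exponentially many signals.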
plt.plot(p_values, np.argmax(vals, axis=0))
plt.title("peak index of binomial coefficients vs. noise")
plt.xlabel("noise strength")
plt.ylabel("index");
We see that as the noise strength increases, the terms become peaked around a lower-degree polynomial. That is, noise effectively degrades the combinatorial sum to a low-degree monomial.
In this notebook, we have thus far assumed that with some probability $p$ the signal is completely corrupted, whereas in the code in the previous post we used a probability $q$ of an error on a single output value. One simple change that might make this model more realistic is to consider the functional relationship between $p$ and $q$. If the reservoir has a memory of length $T$, that is, it can only remember the past $T$ inputs, and these errors are independent, we might expect a relationship like $q^T = p$. Hence, to compare with our plots later on, which are a function of the per-datum error rate, we might instead plot against $p^{1/T}$. Below we plot this for $T=10$, i.e. a scaling of $p^{1/10}$.
vals = np.array([[comb(num_terms, i + 1) * (1 - p**.1)**(i + 1) for i in range(num_terms)] for p in p_values]).T
vals /= (scipy.linalg.norm(vals, axis=0)+.01) #adding small number just for numerical stability
np.argmax(vals, axis=0)
plt.plot(p_values, np.argmax(vals, axis=0))
plt.title("peak index of binomial coefficients vs. noise")
plt.xlabel("noise strength")
plt.ylabel("index");
Now for the fun part: does this agree with our data? We consider a simple power-law model for the performance, $\mathrm{NRMSE}(n) = \frac{a}{n^b} + c$, where $n$ is the reservoir size, $a$ is a constant set by the performance at some particular reservoir size (e.g. $n=1$), and $b$ is the decay exponent we are interested in. We fix the asymptote $c$ by hand; it could in principle be fit as well, but for consistency and ease we set it by eye. This asymptote is not the focus of this tutorial, and so will not be studied in detail, but it may be attributed to the span of the reservoir's natural functions, given by the neural activations and their product signals, not fully containing the desired NARMA10 function. This could be the case if, for instance, the NARMA10 series varied much more rapidly than a typical neural activation, or required more memory than the reservoir can provide.
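To build intuition before fitting, the cell below simply plots this model for a few decay exponents $b$; the values of $a$, $b$, and $c$ here are arbitrary and only meant to show the shape of the curves ($c=0.8$ matches the asymptote we set by eye below).
import numpy as np
import matplotlib.pyplot as plt

n = np.linspace(1, 7, 200)
a, c = 0.2, 0.8               # illustrative amplitude and asymptote
for b in (0.5, 1.0, 2.0):     # illustrative decay exponents
    plt.plot(n, a / n**b + c, label=f'b = {b}')
plt.xlabel('Reservoir Size')
plt.ylabel('NRMSE (model)')
plt.title('Shape of a/n^b + c for a few decay exponents')
plt.legend()
plt.show()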
Now we are going to load the data from the simulations in the last post, and see how well it agrees with this simple analysis.
# Necessary imports
import pickle
import matplotlib.pyplot as plt
import numpy as np
from scipy.optimize import curve_fit
from scipy.special import factorial
from math import comb
# Load the dataset
file_name = 'webpost.pkl'
with open(file_name, 'rb') as f:
    data = pickle.load(f)
# To start, we organize the data we've gathered, extracting minimum values associated with each noise.
min_values_by_noise = {}
for (noise, _), pairs in data.items():
    if noise not in min_values_by_noise:
        min_values_by_noise[noise] = {}
    for x, y in pairs:
        min_values_by_noise[noise][x] = min(y, min_values_by_noise[noise].get(x, y))
# Reduce the data for plotting
reduced_data = {}
for noise, x_y_pairs in min_values_by_noise.items():
    x_values_sorted = sorted(x_y_pairs.keys())
    y_values_sorted = [x_y_pairs[x] for x in x_values_sorted]
    reduced_data[noise] = y_values_sorted
    plt.plot(x_values_sorted, y_values_sorted, marker='x', color='r')
# Plot the theoretical curves and compare them to the numerical data
alpha = 0.2
x = np.linspace(0, 7, 100)
# Generate and plot theoretical lines
asymptote = .8
num = 1000
for i in range(4, num, int(num/20)):
    plt.plot(x, (1-asymptote)/(x/1000 + 1)**(i/2) + asymptote, alpha=alpha, color='k')
# Final plot settings
plt.title('Loss vs. Reservoir Size')
plt.xlabel('Reservoir Size')
plt.ylabel('Loss')
plt.plot([], [], marker='x', color='r', label='Numerics')
plt.plot([], [], color='k', label='Theory')
plt.legend()
plt.savefig('fig2')
plt.clf()
# Now, we fit the data to a model and find actual parameters.
def model(x, a, b):
    return a/x**b + asymptote
fits = []
# Perform the fit for each dataset
for key in reduced_data:
    x = np.array(sorted(min_values_by_noise[key].keys()))
    y = np.array(reduced_data[key])
    popt, pcov = curve_fit(model, x, y, maxfev=1000000, p0=(1, 1))
    fits.append((key, popt))
    x_fine = np.linspace(1, 7, 400)
    # Plot the fitted function
    plt.scatter(x, y)
    plt.plot(x_fine, model(x_fine, *popt), 'r-')
plt.xlabel('Reservoir Size')
plt.ylabel('Loss')
plt.title('Loss vs. Reservoir Size, Fits')
plt.savefig('fig3')
plt.clf();
from PIL import Image
img = Image.open('fig2.png');
img.convert("RGB")
Note that the fit becomes worse at the bottom. These are the curves where the approximation breaks down, and where the functional form should become approximately exponential. The rest of the lines look similar enough for the purpose of this tutorial, and we have omitted serious statistical analysis - error bars would be helpful! We can perform numerical fits to this model, and plot the fit parameters against the model we described above for the polynomial powers.
img = Image.open('fig3.png');
img.convert("RGB")
It's not bad! We again note the divergence from the fit at the bottom, which also appears to be systematic for large reservoir sizes. Since we have made a few decisions by hand, like the asymptote, and not computed error bars, I would take these defects with a grain of salt.
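Since we skipped error bars, here is a minimal sketch of how one might estimate them from the repeated runs, assuming the second component of each key in `data` indexes independent runs; the spread shown is the run-to-run standard deviation of all NRMSE values, which is only indicative since the analysis above uses the minimum over runs.
from collections import defaultdict
import numpy as np
import matplotlib.pyplot as plt

# Collect every NRMSE value per (noise, reservoir size) across runs.
samples = defaultdict(list)
for (noise, _), pairs in data.items():
    for size, nrmse in pairs:
        samples[(noise, size)].append(nrmse)
stats = {k: (np.mean(v), np.std(v)) for k, v in samples.items()}

# Example: mean +/- std for one noise level (whichever sorts first).
some_noise = sorted({k[0] for k in stats})[0]
sizes = sorted(k[1] for k in stats if k[0] == some_noise)
means = [stats[(some_noise, s)][0] for s in sizes]
stds = [stats[(some_noise, s)][1] for s in sizes]
plt.errorbar(sizes, means, yerr=stds, fmt='o')
plt.xlabel('Reservoir Size')
plt.ylabel('Loss')
plt.title(f'Run-to-run spread at noise = {some_noise}')
plt.show()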
In the following cell we extract the fit parameters and compare them to our simple model.
# We analyze the decay power versus noise power and plot the results.
# Extract the fitting parameters
xs = [fit[0] for fit in fits]
ys = [fit[1] for fit in fits]
# Sort the fits for plotting
xys = sorted(zip(xs, ys), key=lambda x: x[0])
xs = [el[0] for el in xys]
ys = [el[1] for el in xys]
# Select the range for plotting
c, d = 12, -1
x = xs[c:d]
y = (np.array(ys).T)[1][c:d]
We saw earlier that the fits do not do particularly well for the bottom curves, where we expect the behavior to be exponential and hence not well fit by a single monomial, so we drop those points using the slice indices $c$ and $d$. Now we regenerate the analytic model from above.
# Generate a smooth line for the heuristic argument
x_fine = np.linspace(min(x), max(x), 100)
scale = 100
num = len(x_fine)
p_values = np.linspace(.05, 1, num)
vals = np.array([[comb(scale, i + 1) * (1 - p**.1)**(i + 1) for i in range(scale)] for p in p_values]).T
offset = 3
max_power = offset + np.argmax(vals, axis=0)
A few details:
- As noted before, we have adjusted the sensitivity to $p$ to instead be $p^{1/10}$. As mentioned, the noise model in the simulations wasn't as simple as the one proposed here; we added Gaussian noise to each point in the time series independently, so it isn't surprising that the system is more sensitive to the noise.
- The range of $p$ itself is off by a factor of ten (the noise values we actually simulated were about ten times smaller), which amounts to a rescaling and should depend on the details of the noise model, i.e. Gaussian noise should behave differently than uniform noise.
- We have parameterized the model with an offset of the peak index (fit by hand), which could be attributed to the width of the distributions.
Now we plot the comparison!
# Plot the decay power
plt.scatter(x, y/y[0], label="Data")
# Plot the heuristic line
plt.plot(x_fine, max_power/max_power[0], label="Heuristic Prediction")
plt.legend()
plt.title("Fit Polynomial Decays vs. Heuristic Prediction")
plt.xlabel("noise strength")
plt.ylabel("power law scaling coefficient\n normalized to first point")
plt.savefig('fig4')
plt.clf()
# A small noise rate becomes non-meaningful at some point. With only 1000 points, the ability to distinguish errors diminishes.
# In a zero-noise scenario, behavior tends towards an exponential decay; detecting deviations from this trend requires larger reservoir sizes.
from PIL import Image
img = Image.open('fig4.png');
img.convert("RGB")
And we see rough agreement! This is a simple model, but it highlights how we might expect exponential scaling to arise in the zero-noise limit, and polynomial scaling in the noisy setting. In fact, while this model is simple enough that the exponential reduction in performance can be analytically predicted, understanding the general behavior in the presence of more general noise is more complicated, and is the subject of the theory developed in [3].
[3] - Polloreno, Anthony M. "Limits to Reservoir Learning."
So, in summary: in this blog post we started with a simple learning model given by echo state networks and introduced the standard computational task NARMA10. We then identified a small collection of tunable and interpretable parameters, fixed most of them except for the error rate and the reservoir size, and used them to get a better understanding of how these systems perform. Thanks for reading!