#!/usr/bin/env python
# -----------------------------------------------------------------------------------
#
# Python macro for illustration of the Central Limit Theorem (CLT).
#
# Random numbers from different distributions (but with RMS = 1) are added to a sum,
# and many such sums are plotted. As dictated by the CLT, their distribution turns
# out to be Gaussian.
# The example also illustrates how widths (and therefore uncertainties) are added in
# quadrature, as one has to divide the sum by the square root of the number of random
# numbers that went into the sum in order to get a Gaussian of unit width (when using
# random numbers of unit width, i.e. RMS = 1).
#
# For more information on the Central Limit Theorem, see:
#   R. Barlow: page 49
#   G. Cowan: page 33
#   http://en.wikipedia.org/wiki/Central_limit_theorem
#
# Run this macro by:
#   From prompt: > ./CentralLimit.py
#
# Author: Troels C. Petersen (NBI)
# Email:  petersen@nbi.dk
# Date:   11th of November 2017
#
# -----------------------------------------------------------------------------------

from __future__ import division, print_function
import numpy as np
import matplotlib.pyplot as plt
from iminuit import Minuit
from probfit import BinnedLH      # , UnbinnedLH, BinnedChi2, Chi2Regression, Extended

plt.close('all')

r = np.random          # Random generator
r.seed(42)             # Set a random seed (but a fixed one - more on that later.)

Nexperiments = 1000    # Number of sums produced
Nuniform     = 10      # Number of uniform numbers used in sum
Nexponential = 10      # Number of exponential numbers used in sum
Ncauchy      = 10      # Number of Cauchy numbers used in sum

pi = 3.14159265358979323846264338328   # Self-explanatory!!!
pi = np.pi                             # Another way of doing it - probably better!

verbose = True         # Print some numbers or not?
Nverbose = 10          # If so, how many?
SavePlots = True       # Save the plots produced to file(s)?


# =============================================================================
#  Initial functions
# =============================================================================

# Function to create a nice string output:
def nice_string_output(names, values, extra_spacing = 2):
    max_values = len(max(values, key=len))
    max_names = len(max(names, key=len))
    string = ""
    for name, value in zip(names, values):
        string += "{0:s} {1:>{spacing}} \n".format(name, value,
                  spacing = extra_spacing + max_values + max_names - len(name))
    return string[:-2]


#----------------------------------------------------------------------------------
# Loop over process:
#----------------------------------------------------------------------------------

N3sigma = 0            # Counter for the number of produced sums, that fall outside +-3 sigma

x_Uniform = []
x_Exponential = []
x_Cauchy = []
x_Sum = []

for iexp in range( Nexperiments ) :

    if (iexp % 100 == 0) :
        print("At iexp : ", iexp)                   # Show progress!

    sum_value = 0.0    # sum_value is the number we are going to add random numbers to!
                       # According to the CLT, it should be Gaussianly distributed.

    # Generating uniform numbers (with mean 0, and RMS of 1):
    for i in range( Nuniform ) :
        x = np.sqrt(12.0) * (r.uniform() - 0.5)     # Uniform between +-sqrt(3). Why?
        sum_value += x
        x_Uniform.append(x)
        if (verbose and iexp == 0 and i < Nverbose) :
            print("  Uniform:      {0:7.4f}".format(x))

    # Generating exponential numbers (with mean 0, and RMS of 1):
    for i in range( Nexponential ) :
        x = -np.log( r.uniform() ) - 1.0            # Exponential starting at -1. Why?
        # x = r.exponential() - 1.0                 # Alternative way to produce x exponentially.
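        # If u is uniform in (0,1), then -log(u) is exponentially distributed with
        # mean 1 (inverse-transform sampling), which is also what r.exponential()
        # draws from directly - hence the two lines above are equivalent.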
        sum_value += x
        x_Exponential.append(x)
        if (verbose and iexp == 0 and i < Nverbose) :
            print("  Exponential:  {0:7.4f}".format(x))

    # Generating numbers according to a Cauchy distribution (1 / (1 + x^2)):
    for i in range( Ncauchy ) :
        x = np.tan(pi * (r.uniform() - 0.5))        # Cauchy with mean 0
        # x = r.standard_cauchy()                   # Alternative way to produce x according to Cauchy PDF.
        sum_value += x
        x_Cauchy.append(x)
        if (verbose and iexp == 0 and i < Nverbose) :
            print("  Cauchy:       {0:7.4f}".format(x))

    Ntotal = Nuniform + Nexponential + Ncauchy
    sum_value = sum_value / np.sqrt( Ntotal )       # Ask yourself, why I divide by sqrt(N)?

    x_Sum.append(sum_value)
    if not (-3.0 < sum_value < 3.0) :
        N3sigma += 1

x_Uniform = np.array(x_Uniform)
x_Exponential = np.array(x_Exponential)
x_Cauchy = np.array(x_Cauchy)
x_Sum = np.array(x_Sum)


#----------------------------------------------------------------------------------
# Draw the input distributions:
#----------------------------------------------------------------------------------

Nbins = 240
x_ranges = [(-2.5, 2.5), (-1.5, 5.5), (-6, 6)]

fig, ax = plt.subplots(nrows=1, ncols=3, figsize=(12, 6))
x_all = [x_Uniform, x_Exponential, x_Cauchy]
titles = ['Uniform', 'Exponential', 'Cauchy']

for ax_i, x, title, x_range in zip(ax, x_all, titles, x_ranges):
    ax_i.hist(x, bins=Nbins, range=x_range, histtype='step')
    ax_i.set_title(title)
    ymax = ax_i.get_ylim()[1]*1.2
    ax_i.set_ylim(0, ymax)

    names = ['Entries', 'Mean', 'Std. Dev.', 'Std. Dev. in interval']
    values = [ "{:d}".format(len(x)),
               "{:.3f}".format(x.mean()),
               "{:.3f}".format(x.std(ddof=1)),
               "{:.3f}".format(x[(x_range[0] < x) & (x < x_range[1])].std(ddof=1)),
               ]
    ax_i.text(0.02, 0.97, nice_string_output(names, values), family='monospace',
              transform=ax_i.transAxes, fontsize=10, verticalalignment='top')

fig.tight_layout()
if (SavePlots) :
    fig.savefig('InputDistributions.pdf')           # Output file name can be chosen freely.


#----------------------------------------------------------------------------------
# Plot the sums and fit them to a Gaussian:
#----------------------------------------------------------------------------------

xmin, xmax = -4.0, 4.0    # Range used for the histogram and the fit (a reasonable choice).
Nbins = 100

def gauss_extended(x, N, mu, sigma) :
    """Gaussian distribution scaled to N entries (extended PDF)."""
    return N / np.sqrt(2.0 * pi) / sigma * np.exp(-0.5 * (x - mu)**2 / sigma**2)

# Binned (extended) likelihood fit of the sums to a Gaussian:
binned_likelihood = BinnedLH(gauss_extended, x_Sum, bins=Nbins, bound=(xmin, xmax), extended=True)
minuit = Minuit(binned_likelihood, N=Nexperiments, mu=0.0, sigma=1.0, pedantic=False)   # Starting values
minuit.migrad()                                     # Perform the actual fit
fit_N, fit_mu, fit_sigma = minuit.args              # Fitted values of the parameters

fig2, ax2 = plt.subplots(figsize=(10, 6))
y_counts, bin_edges, _ = ax2.hist(x_Sum, bins=Nbins, range=(xmin, xmax), histtype='step')
ax2.set_title('Distribution of sums')

x_centers = 0.5 * (bin_edges[1:] + bin_edges[:-1])  # Bin centers
sy_counts = np.sqrt(y_counts)                       # Poisson uncertainty on each bin count

binwidth = (xmax - xmin) / Nbins
Nscale = binwidth             # Scale between the extended PDF (per unit x) and counts per bin

x_fit = np.linspace(xmin, xmax, 1000)
ax2.plot(x_fit, Nscale * gauss_extended(x_fit, fit_N, fit_mu, fit_sigma), '-')

# Calculate the chi2 value of the fit, comparing histogram and fitted function bin by bin:
chi2_val = 0
N_NotEmptyBin = 0
for x, y, sy in zip(x_centers, y_counts, sy_counts) :
    if (sy > 0) :
        f = Nscale * gauss_extended(x, fit_N, fit_mu, fit_sigma)   # calc the model value
        residual = ( y - f ) / sy       # find the uncertainty-weighted residual
        chi2_val += residual**2         # the chi2-value is the squared residual
        N_NotEmptyBin += 1              # count the bin as non-empty since sy > 0 (and thus y > 0)

# Here we find the number of degrees of freedom, which is the number of
# elements in the fit (non-empty bins) minus the number of fitting parameters:
N_DOF = N_NotEmptyBin - len(minuit.args)

from scipy import stats
chi2_prob = stats.chi2.sf(chi2_val, N_DOF)          # The chi2 probability given N_DOF degrees of freedom

names = ['Entries', 'Mean in interval', 'Std. Dev. in interval', 'Chi2/DOF', 'Prob', 'N', 'mu', 'sigma']   # + minuit.parameters
values = [ "{:d}".format(len(x_Sum)),
           "{:.3f}".format(x_Sum[(xmin < x_Sum) & (x_Sum < xmax)].mean()),
           "{:.3f}".format(x_Sum[(xmin < x_Sum) & (x_Sum < xmax)].std(ddof=1)),
           "{:.3f} / {:d}".format(chi2_val, N_DOF),
           "{:.3f}".format(chi2_prob),
           "{:.1f}".format(fit_N),
           "{:.3f}".format(fit_mu),
           "{:.3f}".format(fit_sigma),
           ]
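
# ----------------------------------------------------------------------------------
# A small standalone cross-check of the quadrature rule described in the header:
# the width of a sum of N independent variables, each with RMS = 1, grows as sqrt(N),
# which is why the sums above were divided by sqrt(Ntotal) to obtain unit width.
# The snippet uses plain uniform numbers only; the names n_terms and n_sums are local
# to this check and not part of the analysis above.
n_terms = 30
n_sums = 10000
u = np.sqrt(12.0) * (r.uniform(size=(n_sums, n_terms)) - 0.5)    # unit-RMS uniform numbers
print("RMS of raw sums:       {:.3f}  (expect ~sqrt({:d}) = {:.3f})".format(
      u.sum(axis=1).std(ddof=1), n_terms, np.sqrt(n_terms)))
print("RMS of sums / sqrt(N): {:.3f}  (expect ~1)".format(
      (u.sum(axis=1) / np.sqrt(n_terms)).std(ddof=1)))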