#!/usr/bin/env python
from scipy import optimize
from math import pow, log, exp, sqrt
from random import random, normalvariate
import copy
import numpy
import sys

verbose = False
_use_fmin = False
############################################################################
# Begin model-specific initialization code
############################################################################

############################################################################
# Here we declare a "class" that allows us to bundle together different pieces
#   of information about our data in a convenient bundle.  The read_data
#   function and simulate_data function will create "Skink" objects and
#   store them in a list.
#
# Specifically, the data_list will have an element for each mating group.
#
# Each of these elements will consist of three lists - one for each diet
#   treatment.  Specifically, if group_data is the data for one mating group
#   (foursome), then:
#       group_data[0] will be a list of individuals exposed to the "Small"
#           insect diet,
#       group_data[1] will be a list of individuals exposed to the "Medium"
#           insect diet, and
#       group_data[2] will be a list of individuals exposed to the "Large"
#           insect diet.
#   Each of these lists will be a list of "Skink" objects.
#
# If s1 and s2 refer to two different Skink objects, then you can see if they
#   share a mother using code like this:
#
#   if s1.mom == s2.mom:
#       here is a block of code to execute for shared mothers
#   else:
#       here is a block of code to execute for distinct mothers
#
# Note that we use the "." operator to examine an attribute inside the "Skink"
#   objects.  The objects are just a convenient way to keep info on mom, dad,
#   treatment, and y-value (the dependent variable, growth rate) bundled
#   together.
############################################################################
class Skink(object):
    def __init__(self, mom, dad, treatment, y):
        self.mom = mom
        self.dad = dad
        self.treatment = treatment
        self.y = y

    def __repr__(self):
        return "Skink(mom=" + str(self.mom) + ", dad=" + str(self.dad) + ", treatment=" + str(self.treatment) + ", y=" + str(self.y) + ")"

    def __str__(self):
        return self.__repr__()
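# Example (illustrative only): constructing and inspecting a Skink object.
#
#   s = Skink(mom=1, dad=2, treatment=0, y=0.37)
#   s.treatment       # -> 0, the numerical code for the "Small" diet
#   s.mom == 1        # -> True
#   str(s)            # -> 'Skink(mom=1, dad=2, treatment=0, y=0.37)'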
# This is a list of values to try for the numerical optimizer.  The length of
#   this list is also used by some functions to determine the dimensionality
#   of the model.
initial_parameter_guess = [10.0, 10.0, 10.0, 1, 4]

# This is a list of parameter names to show.  Modify this based on what order
#   you want to use for the parameter list.  It does not matter which order
#   you choose, but you need to know what the program thinks of as the first,
#   second, ... parameters so that the output will make sense and so that the
#   code that unpacks the parameter list will know which element is which.
# You should put the names in quotes, so the line would look like:
#
#   parameter_names = ['mu', 'sigma']
#
#   for inference under the normal model.
#
parameter_names = ['mu_S', 'mu_M', 'mu_L', 'var_G', 'var_Error']

# This version of the program will use the L-BFGS constrained optimization
#   approach to maximize the likelihood.
# Here we'll specify bounds for each of the parameters as pairs (min, max)
#   that give the minimum and maximum value.  If a parameter is unbounded in
#   one direction we can simply list None as that bound.
# Allowing var_Error to be 0 can result in numerical problems as the lnL goes
#   to very small numbers.  Putting a lower bound on it avoids this.
min_var_error = 1e-6
parameter_bounds = [(None, None),
                    (None, None),
                    (None, None),
                    (0.0, None),
                    (min_var_error, None),
                    ]

# We expect the number of parameters to be the same in both lists.  This is a
#   sanity check that helps us see if we made a mistake.
#
assert(len(initial_parameter_guess) == len(parameter_names))
############################################################################
# End model-specific initialization code
############################################################################

def calculate_incidence_row_for_indiv(skink):
    '''This function should return a python list.  This list will be a single
    row in the incidence matrix.  It should contain a coefficient (e.g. 1 or 0)
    for each of the parameters that appears in the equation of the linear
    predictor for this particular skink.

    The incidence matrix will be multiplied by a vector of parameter values,
    so the length of each row that you return here should be equal to the
    number of fixed-effect parameters.
    '''
    treatment = skink.treatment
    mom = skink.mom
    dad = skink.dad
    # If you were to want a row that is [1, 2, 0]
    #   then you could substitute:
    #
    #   INCIDENCE_MATRIX_ROW = [1, 2, 0]
    #
    #   or you could build the list one element at a time:
    #
    #   INCIDENCE_MATRIX_ROW = []
    #   INCIDENCE_MATRIX_ROW.append(1)
    #   INCIDENCE_MATRIX_ROW.append(2)
    #   INCIDENCE_MATRIX_ROW.append(0)
    #
    INCIDENCE_MATRIX_ROW = []
    # YOU WILL NEED SOME CODE AROUND HERE TO FILL IN THE ROW OF THE
    #   INCIDENCE MATRIX FOR THIS SKINK.
    return INCIDENCE_MATRIX_ROW

# You should not need to alter this next line.
the_incidence_matrix = None

def ln_likelihood(the_data, param_list):
    '''Calculates the log-likelihood of the parameter values in `param_list`
    based on `the_data`.
    '''
    global the_incidence_matrix
    if verbose:
        sys.stderr.write('param = ' + str(param_list) + '\n')
    ############################################################################
    # Begin model-specific log-likelihood code
    ############################################################################
    first_p, second_p, third_p, fourth_p, fifth_p = param_list
    mu0 = first_p
    mu1 = second_p
    mu2 = third_p
    var_g = fourth_p
    var_error = fifth_p
    # The data is stored in multiple forms.  They will be explained below as
    #   needed.  You should not have to change the next 4 lines...
    blocked_by_foursome = the_data[0]
    observed_values = the_data[1]
    foursome_sizes = the_data[2]
    flattened_data = the_data[3]
    # Do our "sanity-checking" to make sure that we are in the legal range of
    #   the parameters.
    #
    for p in param_list:
        if p != p:
            return float('-inf')
    if var_g < 0.0:
        return float('-inf')
    if var_error < 0.0:
        return float('-inf')
    # FIXED_EFFECT_LIST is where you list the parameters that are multiplied
    #   by the incidence matrix.
    FIXED_EFFECT_LIST = []
    # This next line creates a column vector, to be multiplied by the incidence
    #   matrix (you should not have to change this).
    fixed_effects = numpy.matrix(FIXED_EFFECT_LIST).transpose()
    # This calculates a vector of expected values from the fixed effects and
    #   incidence matrix (you should not have to change this).
    expected_values = the_incidence_matrix*fixed_effects
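    # ------------------------------------------------------------------------
    # Illustrative sketch (one possible parameterization, not the only valid
    #   one): if the three fixed effects are simply the treatment means, then
    #   FIXED_EFFECT_LIST above could be [mu0, mu1, mu2], and
    #   calculate_incidence_row_for_indiv could return a 0/1 indicator row:
    #
    #       if treatment == 0:
    #           INCIDENCE_MATRIX_ROW = [1, 0, 0]
    #       elif treatment == 1:
    #           INCIDENCE_MATRIX_ROW = [0, 1, 0]
    #       else:
    #           INCIDENCE_MATRIX_ROW = [0, 0, 1]
    #
    #   With that choice, the_incidence_matrix*fixed_effects is a column with
    #   one entry per skink, holding that skink's treatment mean.
    # ------------------------------------------------------------------------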
    # Because the values for the skinks from different foursomes will have a
    #   covariance of 0, most of the covariance matrix will be 0's, and we can
    #   create it in block-diagonal form that is easier to work with (and
    #   results in much faster calculations).
    # Here we will create a list of matrices.  These will be the non-zero
    #   blocks along the diagonal of the covariance matrix.
    # You won't have to change this next line.
    non_zero_covariance_blocks = list()
    # YOU MAY WANT TO HAVE SOME CALCULATIONS HERE FOR TERMS THAT WILL OCCUR
    #   MANY TIMES IN THE COVARIANCE MATRIX...

    # Here we walk over the data set one foursome at a time.
    for foursome_index, foursome_data in enumerate(flattened_data):
        # num_in_foursome will hold the number of skinks from this foursome
        #   from all parental combinations and treatments.
        num_in_foursome = foursome_sizes[foursome_index]
        # Make an empty covariance matrix for this foursome (no need to change this).
        empty_row = [None]*num_in_foursome
        # Make an empty matrix by copying the empty row num_in_foursome times
        #   (you don't have to change this line).
        foursome_cov = [copy.copy(empty_row) for i in xrange(num_in_foursome)]
        for i, skink_i in enumerate(foursome_data):
            for j in range(i, num_in_foursome):
                skink_j = foursome_data[j]
                ################################################################
                # Here we need to fill in foursome_cov[i][j] with the
                #   covariance for skink_i and skink_j.
                #
                # We'll do this by examining the attributes (such as skink_i.mom
                #   and skink_i.dad) in skink_i and skink_j to fill in
                #   cov_element, and then storing cov_element.
                ################################################################
                # cov_element = SOMETHING GOES HERE.  YOU WILL NEED STATEMENTS
                #   LIKE "if i == j:" and "if skink_i.mom == skink_j.mom:"
                cov_element = None
                ################################################################
                # This is where we store the covariance element (the cov matrix
                #   is symmetric, so we store it in (i, j) and (j, i)).
                # If you calculated the covariance and stored it in the variable
                #   called cov_element, then you should not have to change this.
                ################################################################
                foursome_cov[i][j] = cov_element
                foursome_cov[j][i] = cov_element
        # Append this non-zero part of the covariance matrix to a list that
        #   will be used to represent a block-diagonal matrix for all
        #   measurements.
        # First we'll convert it from a python list of lists to a numpy matrix
        #   (you should not have to change this).
        numpy_fam_cov = numpy.matrix(foursome_cov)
        non_zero_covariance_blocks.append(numpy_fam_cov)
    # Here we calculate the inverse (exploiting the block-diagonal structure).
    inverse_var = invert_block_diagonal(non_zero_covariance_blocks)
    # Here we calculate the log of the determinant (exploiting the block-diagonal structure).
    ln_determinant = ln_determinant_block_diagonal(non_zero_covariance_blocks)
    # We can calculate residuals by subtracting observed_values from
    #   expected_values.  When we convert the python lists of values to
    #   numpy.matrix objects, we get a column matrix.
    residuals_column = expected_values - observed_values
    # We can transpose the column vector of residuals to get a row...
    residuals_row = residuals_column.transpose()
    scaled_dev_sq = residuals_row*inverse_var*residuals_column
    ln_l = -0.5*(ln_determinant + float(scaled_dev_sq))
    if verbose:
        sys.stderr.write('ln_l = ' + str(ln_l) + '\n')
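    # ------------------------------------------------------------------------
    # Illustrative sketch for the covariance elements in the double loop above
    #   (this assumes the parental contribution is modeled as a dam effect
    #   plus a sire effect, each with variance var_g/2; that is one possible
    #   reading of var_G, so adapt it to the model you actually intend):
    #
    #       if i == j:
    #           cov_element = var_g + var_error        # a skink with itself
    #       elif skink_i.mom == skink_j.mom and skink_i.dad == skink_j.dad:
    #           cov_element = var_g                    # full sibs
    #       elif skink_i.mom == skink_j.mom or skink_i.dad == skink_j.dad:
    #           cov_element = var_g/2.0                # half sibs
    #       else:
    #           cov_element = 0.0                      # no shared parent
    #
    # Note that ln_l above omits the constant -0.5*n*log(2*pi) of the
    #   multivariate-normal log-density; that constant cancels out of the
    #   likelihood-ratio comparisons made by this script.
    # ------------------------------------------------------------------------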
    # This is how we send the result back to the function that called this
    #   function.
    return ln_l
############################################################################
# End model-specific log-likelihood code
############################################################################

def simulate_data(template_data, param_list):
    '''Simulate a data set of the same size as `template_data`, but under a
    model described by the parameter values in `param_list`.
    '''
    ############################################################################
    # Begin model-specific simulation code
    ############################################################################
    first_p, second_p, third_p, fourth_p, fifth_p = param_list
    mu0 = first_p
    mu1 = second_p
    mu2 = third_p
    var_g = fourth_p
    var_error = fifth_p
    # Here we'll grab the form of the data in which, for each family, there is
    #   a list of all of the Skinks in that family.  We can use the skink.mom,
    #   skink.dad, and skink.treatment attributes of each Skink to figure out
    #   mom, dad, and treatment.
    # You should not have to change this line.
    by_foursome_list = template_data[3]
    # YOU MIGHT WANT TO CALCULATE SOME QUANTITIES HERE THAT ARE USED IN ALL
    #   SIMULATIONS.

    ####################################################################
    # We'll walk through each foursome, simulating new values for the response "y".
    #
    # NOTE: We are going to modify the data "in-place" in this simulation (unlike
    #   previous simulations where we left the original data untouched).
    ####################################################################
    for foursome_data in by_foursome_list:
        # YOU WILL NEED SOME CODE AROUND HERE TO SIMULATE RANDOM VARIABLES FOR
        #   THIS FOURSOME.

        ####################################################################
        # We'll walk through each skink in the foursome and simulate a value...
        ####################################################################
        for skink in foursome_data:
            treatment = skink.treatment
            mom = skink.mom
            dad = skink.dad
            ########################################
            # At this point the variables "treatment", "mom" and "dad" all
            #   refer to the current skink in the current foursome.
            # If you draw a random value for the dependent variable and store
            #   it in skink.y, then the simulation will be complete.
            # SIM_VALUE = YOU WILL NEED SOME CODE AROUND HERE TO SIMULATE A
            #   RESPONSE FOR THIS SKINK.
            SIM_VALUE = None
            ####################################################################
            # Here we can record SIM_VALUE as this skink's response.  This will
            #   complete our simulation of a dependent variable for this
            #   individual skink.
            ####################################################################
            skink.y = SIM_VALUE
    # You won't need to change the next line, but I'll explain it anyway...
    # This is a bit cryptic.  Our simulation has been modifying the Skink
    #   objects in by_foursome_list.  Because these *same* Skink objects are
    #   also stored in the first element of template_data (in a form that more
    #   clearly reveals the factorial nature of the study), we can call
    #   process_data on template_data[0] to transform the simulated data to
    #   make it easier to process each simulation.
    # process_data is also called by read_data.  So we are really just using
    #   this function to put our simulations into the same structure as the
    #   original data.
    return process_data(template_data[0])
############################################################################
# End model-specific simulation code
############################################################################
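# ----------------------------------------------------------------------------
# Illustrative sketch for simulate_data (one way to fill in the placeholders
#   above, consistent with the dam-plus-sire reading of var_G sketched in
#   ln_likelihood; mom_effect and dad_effect are hypothetical names):
#
#   For each foursome, draw one effect per parent:
#
#       mom_effect = {}
#       dad_effect = {}
#       for skink in foursome_data:
#           if skink.mom not in mom_effect:
#               mom_effect[skink.mom] = normalvariate(0.0, sqrt(var_g/2.0))
#           if skink.dad not in dad_effect:
#               dad_effect[skink.dad] = normalvariate(0.0, sqrt(var_g/2.0))
#
#   and then, for each skink in the inner loop:
#
#       treatment_mean = [mu0, mu1, mu2][skink.treatment]
#       SIM_VALUE = (treatment_mean
#                    + mom_effect[skink.mom]
#                    + dad_effect[skink.dad]
#                    + normalvariate(0.0, sqrt(var_error)))
# ----------------------------------------------------------------------------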
def calculate_incidence_matrix(the_data):
    '''This function is called to fill in the incidence matrix for the model.
    You should not need to touch this code.  It calls
    calculate_incidence_row_for_indiv repeatedly to actually fill the matrix.
    '''
    global the_incidence_matrix
    the_incidence_matrix_row_list = []
    for foursome_index, foursome_data in enumerate(the_data):
        for treatment_index, indiv_data in enumerate(foursome_data):
            for indiv in indiv_data:
                the_incidence_matrix_row = calculate_incidence_row_for_indiv(indiv)
                the_incidence_matrix_row_list.append(the_incidence_matrix_row)
    the_incidence_matrix = numpy.matrix(the_incidence_matrix_row_list)

def block_diag(*arrs):
    """Create a new diagonal matrix from the provided arrays.

    Parameters
    ----------
    a, b, c, ... : ndarray
        Input arrays.

    Returns
    -------
    D : ndarray
        Array with a, b, c, ... on the diagonal.

    Code from http://mail.scipy.org/pipermail/scipy-user/attachments/20090520/f30c0928/attachment.obj
    posted by Stefan van der Walt
    http://mail.scipy.org/pipermail/scipy-user/2009-May/021101.html
    """
    arrs = [numpy.asarray(a) for a in arrs]
    shapes = numpy.array([a.shape for a in arrs])
    out = numpy.zeros(numpy.sum(shapes, axis=0))
    r, c = 0, 0
    for i, (rr, cc) in enumerate(shapes):
        out[r:r + rr, c:c + cc] = arrs[i]
        r += rr
        c += cc
    return out

def invert_block_diagonal(block_list):
    inv_block_list = []
    for block in block_list:
        inv_block = numpy.linalg.inv(block)
        inv_block_list.append(inv_block)
    return block_diag(*inv_block_list)

def ln_determinant_block_diagonal(block_list):
    det = 0.0
    for block in block_list:
        det = det + log(numpy.linalg.det(block))
    return det
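# Example (illustrative) of the block-diagonal helpers above:
#
#   b1 = numpy.matrix([[2.0, 1.0],
#                      [1.0, 2.0]])
#   b2 = numpy.matrix([[3.0]])
#   invert_block_diagonal([b1, b2])          # 3x3 inverse of the block-diagonal matrix
#   ln_determinant_block_diagonal([b1, b2])  # log(3) + log(3), since det(b1) = 3 and det(b2) = 3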
def calc_global_ml_solution(data, initial_point=None):
    '''Uses SciPy's optimize.fmin_l_bfgs_b (or optimize.fmin) to find the MLEs.

    The search starts from `initial_point` (or from initial_parameter_guess if
    no starting point is supplied).  Returns a list of the parameter MLEs with
    the maximized lnL appended as the last element.
    '''

    def scipy_ln_likelihood(x):
        '''SciPy minimizes functions.  We want to maximize the likelihood.
        This function adapts our ln_likelihood function to the minimization
        context by returning the negative log-likelihood.

        We use this function with SciPy's minimization routine (minimizing the
        negative log-likelihood will maximize the log-likelihood).
        '''
        return -ln_likelihood(data, x)

    if initial_point is None:
        x0 = initial_parameter_guess
    else:
        x0 = initial_point
    if _use_fmin:
        solution = list(optimize.fmin(scipy_ln_likelihood, x0, xtol=1e-8, disp=False))
    else:
        opt_blob = optimize.fmin_l_bfgs_b(scipy_ln_likelihood,
                                          x0,
                                          bounds=parameter_bounds,
                                          approx_grad=True,
                                          epsilon=1e-8,
                                          disp=False)
        solution = list(opt_blob[0])
    ln_l = -scipy_ln_likelihood(solution)
    solution.append(ln_l)
    return solution

def calc_null_ml_solution(data, param_constraints, initial_point=None):
    '''This function allows us to optimize those parameters that are set to
    None in the list `param_constraints`.  Other parameters are forced to
    assume the value listed in `param_constraints`.
    '''
    x0 = []
    adaptor_list = []
    constr_bounds = []
    for i, val in enumerate(initial_parameter_guess):
        if i >= len(param_constraints) or param_constraints[i] == None:
            if initial_point is None:
                x0.append(val)
            else:
                x0.append(initial_point[i])
            constr_bounds.append(parameter_bounds[i])
            adaptor_list.append(None)
        else:
            adaptor_list.append(param_constraints[i])

    def intercalate_constraints(x):
        p = []
        x_index = 0
        for el in adaptor_list:
            if el is None:
                p.append(x[x_index])
                x_index = x_index + 1
            elif isinstance(el, list):
                assert(len(el) == 1)
                assert(el[0] < len(p))
                p.append(p[el[0]])
            else:
                p.append(el)
        return p

    def constrained_scipy_ln_likelihood(x):
        all_params = intercalate_constraints(x)
        return -ln_likelihood(data, all_params)

    if len(x0) > 0:
        if _use_fmin:
            solution = optimize.fmin(constrained_scipy_ln_likelihood,
                                     x0,
                                     xtol=1e-8,
                                     disp=False)
        else:
            opt_blob = optimize.fmin_l_bfgs_b(constrained_scipy_ln_likelihood,
                                              x0,
                                              bounds=constr_bounds,
                                              approx_grad=True,
                                              epsilon=1e-8,
                                              disp=False)
            solution = opt_blob[0]
        all_params = intercalate_constraints(solution)
    else:
        all_params = list(param_constraints)
    ln_l = ln_likelihood(data, all_params)
    all_params = list(all_params)
    all_params.append(ln_l)
    return all_params

def calc_lrt_statistic(data, null_params, initial_point=None):
    '''Returns (the log-likelihood ratio test statistic,
                the list of MLEs of all parameters and lnL at the global ML point,
                the list of MLEs of all parameters and lnL under the null)
    for `data`, with the null hypothesis being the parameters constrained to
    be at the values specified in the list `null_params`.
    '''
    # First we calculate the global and null solutions.
    #
    global_mle = calc_global_ml_solution(data, initial_point=initial_point)
    null_mle = calc_null_ml_solution(data, null_params, initial_point=initial_point)
    # The log-likelihood is returned as the last element of the list by these
    #   functions.  We can access this element by referring to element -1 using
    #   the list indexing syntax - which is [] braces:
    #
    global_max_ln_l = global_mle[-1]
    null_max_ln_l = null_mle[-1]
    # Now we can calculate the likelihood ratio test statistic, and return it
    #   as well as the global and null solutions.
    #
    lrt = -2*(null_max_ln_l - global_max_ln_l)
    return lrt, global_mle, null_mle
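# Example (illustrative) null-hypothesis constraint lists for calc_lrt_statistic:
#
#   null_params = [None, None, None, 0.0, None]   # H0: var_G = 0
#   null_params = [None, [0], [0], None, None]    # H0: mu_S = mu_M = mu_L
#
# None means the parameter is free under the null, a number fixes it at that
#   value, and [n] forces it to equal parameter number n (this mirrors the
#   "Equals<n>" command-line syntax parsed in the __main__ block below).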
def process_data(data_set):
    '''To make it easier to deal with the data, we'll calculate a few
    summaries of the data.  Four items will be returned: the data_set, the
    observations (as a column matrix), the number of individuals in each
    mating group, and a flattened list of the skinks in each mating group.
    '''
    block_sizes = []
    observed_values = []
    flattened_data = []
    for group_data in data_set:
        sz = 0
        flat = []
        for group_treatment_data in group_data:
            sz = sz + len(group_treatment_data)
            flat.extend(group_treatment_data)
            for skink in group_treatment_data:
                observed_values.append(skink.y)
        flattened_data.append(flat)
        block_sizes.append(sz)
    observed_values = numpy.matrix(observed_values).transpose()
    return data_set, observed_values, block_sizes, flattened_data

def read_data(filepath):
    '''Reads `filepath` as a comma-separated csv file and returns the
    processed (four-element) form of the data produced by process_data.
    '''
    import os
    import csv
    import itertools
    if not os.path.exists(filepath):
        raise ValueError('The file "' + filepath + '" does not exist')
    TREATMENT_CODES = 'SML'
    MAX_TREATMENT_VALUE = len(TREATMENT_CODES) - 1
    # Here we create a csv reader and tell it that a comma is the column delimiter.
    entries = csv.reader(open(filepath, 'rU'), delimiter=',')
    # Here we check that the file has the headers that we expect.
    first_row = entries.next()
    expected_headers = ['mating group (foursome)', 'mom', 'dad', 'treatment', 'y (growth rate)']
    for got, expected in itertools.izip(first_row, expected_headers):
        if got.lower().strip() != expected:
            raise ValueError('Error reading "' + filepath + '": expecting a column labelled "' + expected + '", but found "' + got + '" instead.')
    # It is not too hard to have this loop put the data in the right spot in
    #   the matrix, so that the data file can be somewhat flexible.
    by_family = {}
    for n, row in enumerate(entries):
        fam_id, mom_id, dad_id, treatment_code, value = row
        try:
            fam_id = int(fam_id)
        except:
            raise ValueError("Error reading data row " + str(1 + n) + ' of "' + filepath + '": expecting an integer for the family ID, but got ' + str(fam_id))
        try:
            mom_id = int(mom_id)
        except:
            raise ValueError("Error reading data row " + str(1 + n) + ' of "' + filepath + '": expecting an integer for the mom ID, but got ' + str(mom_id))
        try:
            dad_id = int(dad_id)
        except:
            raise ValueError("Error reading data row " + str(1 + n) + ' of "' + filepath + '": expecting an integer for the dad ID, but got ' + str(dad_id))
        try:
            treatment_id = TREATMENT_CODES.index(treatment_code.upper())
            assert(treatment_id >= 0 and treatment_id <= MAX_TREATMENT_VALUE)
        except:
            raise ValueError("Error reading data row " + str(1 + n) + ' of "' + filepath + '": expecting a single-letter code (one of "' + TREATMENT_CODES + '") for the treatment, but got ' + str(treatment_code))
        try:
            value = float(value)
        except:
            raise ValueError("Error reading data row " + str(1 + n) + ' of "' + filepath + '": expecting a number for the trait value, but got ' + str(value))
        # A new family corresponds to an empty list of individuals for each of
        #   the treatments.  So we can create a list of empty lists (one per
        #   treatment) as the "blank" entry.
        empty_family_entry = [[] for i in range(MAX_TREATMENT_VALUE + 1)]
        fam_array = by_family.setdefault(fam_id, empty_family_entry)
        # Now we grab the appropriate list for this treatment.
        list_for_fam_treatment = fam_array[treatment_id]
        list_for_fam_treatment.append(Skink(mom=mom_id, dad=dad_id, treatment=treatment_id, y=value))

    fam_keys = by_family.keys()
    fam_keys.sort()
    # Now we'll sort the data matrix and print some status information.
    status_stream = sys.stdout
    status_stream.write("Data read for " + str(len(fam_keys)) + " families...\n")
    full_data = []
    for i, fam_id in enumerate(fam_keys):
        treatments_list = by_family[fam_id]
        status_stream.write("  Mating group index=" + str(i) + " (id in datafile = " + str(fam_id) + "):\n")
        full_data.append(treatments_list)
        for treat_ind, indiv_list in enumerate(treatments_list):
            treatment_code = TREATMENT_CODES[treat_ind]
            status_stream.write('    ' + str(len(indiv_list)) + ' individuals with treatment code "' + treatment_code + '" (numerical code ' + str(treat_ind) + ')\n')
    return process_data(full_data)

def print_help():
    num_args_expected = 2 + len(initial_parameter_guess)
    output_stream = sys.stdout
    output_stream.write('Expecting ' + str(num_args_expected) + ''' arguments.
    The last argument should be the number of parametric bootstrapping replicates.
    The first argument should be the path (filename) of the data file (which
        should be a comma-separated csv file).
    The intervening arguments should be values of the parameters in the null
        hypothesis (or 'None' to indicate that the parameter is not constrained
        in the null hypothesis).

    The order of the parameters in this constraint statement is:
        ''')
    for p in parameter_names:
        output_stream.write(p + ' ')
    assert len(initial_parameter_guess) > 0
    if len(initial_parameter_guess) == 1:
        c_name = parameter_names[0]
        c_val = str(initial_parameter_guess[0])
        parg_list = [c_val]
    else:
        c_name = parameter_names[1]
        c_val = str(initial_parameter_guess[1])
        parg_list = ['None'] * len(initial_parameter_guess)
        parg_list[1] = str(initial_parameter_guess[1])
    output_stream.write('''

    So if the data were in test.csv, and you wanted to perform 1000 simulations
        and test the hypothesis that:
            ''' + c_name + ' = ' + c_val + '''
        then you would use the arguments:

test.csv ''' + ' '.join(parg_list) + ''' 1000
''')

if __name__ == '__main__':
    # user-interface and sanity checking...
    try:
        filepath = sys.argv[1]
        arguments = sys.argv[2:]
        if len(arguments) < 1 + len(initial_parameter_guess):
            print len(arguments)
            print_help()
            sys.exit(1)
    except Exception, e:
        print 'Error:', e, '\n'
        print_help()
        sys.exit(1)

    real_data = read_data(filepath)
    calculate_incidence_matrix(real_data[0])

    # The number of simulations is the last argument...
    #
    n_sims = int(arguments[-1])
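    # For concreteness, an illustrative invocation (the script name here is
    #   whatever you saved this file as):
    #
    #       python skink_analysis.py test.csv None None None 0.0 None 1000
    #
    #   would read the data from test.csv, test the null hypothesis that
    #   var_G = 0 (the other four parameters are left unconstrained), and use
    #   1000 parametric bootstrap replicates.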
    # The "middle" arguments will be constraints on the parameters.
    # We'll store the number for every argument that can be interpreted as a
    #   number.  If the argument can't be turned into a number then we'll
    #   reach the except block.  In that case we'll insert None into the list
    #   to indicate that the parameter is not constrained.
    #
    null_params = []
    for arg in arguments[:-1]:  # this walks through all arguments except the last
        try:
            p = float(arg)
            null_params.append(p)
        except:
            try:
                if arg.upper() == 'NONE':
                    null_params.append(None)
                elif arg.upper().startswith("EQUALS"):
                    n = int(arg[len("EQUALS"):])
                    if n == len(null_params):
                        sys.exit("You can't constrain a parameter to be equal to itself")
                    if n > len(null_params):
                        sys.exit("You can't constrain a parameter to be equal to a \"later\" parameter (one with a higher index)")
                    if n < len(null_params) and isinstance(null_params[n], list):
                        sys.exit("You can't constrain a parameter to be equal to a parameter that itself is constrained to be equal to a third parameter")
                    null_params.append([n])
                else:
                    raise
            except SystemExit:
                raise
            except:
                print_help()
                sys.exit("Expecting a parameter value to be a number, None, or Equals<n> where <n> is replaced by the index of the parameter that is constrained to have the same value (the first parameter is numbered 0)")

    print "null_params =", null_params

    # Call a function to maximize the log-likelihood under the unconstrained
    #   and null conditions.  This returns the LRT statistic and the parameter
    #   estimates as lists.
    #
    lrt, mle_list, null_mle_list = calc_lrt_statistic(real_data, null_params)

    # We can "unpack" the lists into separate variables to make it easier to
    #   report the results.
    ln_l = mle_list[-1]
    ln_l_null = null_mle_list[-1]

    for n, param_name in enumerate(parameter_names):
        print "MLE of", param_name, "=", mle_list[n]
    print "lnL at MLEs =", ln_l
    print "L at MLEs =", exp(ln_l)

    for n, param_name in enumerate(parameter_names):
        v = null_mle_list[n]
        if null_params[n] is None:
            print "Under the null, the MLE of", param_name, "=", v
        elif isinstance(null_params[n], list):
            constrained_index = null_params[n][0]
            print "Under the null,", param_name, "is constrained to be equal to", parameter_names[constrained_index], "(", null_mle_list[constrained_index], ")"
        else:
            print "Under the null,", param_name, "is constrained to be", v
    print "lnL at null =", ln_l_null
    print "L at null =", exp(ln_l_null)
    print
    print "2 * log-likelihood ratio =", lrt
    print

    # Do parametric bootstrapping to produce the null distribution of the LRT
    #   statistic.
    #
    if n_sims < 1:
        sys.exit(0)
    print "Generating null distribution of LRT..."

    param_boot_lrt_filename = "ParametricBootstrapLRT.csv"
    sys.stderr.write("About to overwrite the contents of " + param_boot_lrt_filename + "\n")
    # Here we open a file.  'w' means that we open it for the purpose of writing.
    #
    param_boot_lrt_file = open(param_boot_lrt_filename, 'w')
    # Here we will write a tab-separated "header" to the file so that each
    #   column has a name.  We use special "escape" codes to indicate tab and
    #   newline characters:  \t means tab and \n means newline.
    param_boot_lrt_file.write("SimRepNumber\tLRT\n")

    param_boot_param_est_filename = "ParametricBootstrapParam.csv"
    sys.stderr.write("About to overwrite the contents of " + param_boot_param_est_filename + "\n")
    param_boot_param_est_file = open(param_boot_param_est_filename, 'w')
    # This is a cute, cryptic syntax for creating a line of text that consists
    #   of all of the strings in the list, joined together with a tab
    #   character.  In this case we use the list of parameter names.
    param_header = '\t'.join(parameter_names)
    param_boot_param_est_file.write("SimRepNumber\t" + param_header + "\n")

    # We'll write the simulated LRT values to the "standard error stream".
    sys.stderr.write("rep\tlrt\n")
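    # Illustrative sketch (one way to fill in the file-writing placeholder in
    #   the loop below; it records the simulated LRT and, for example, the
    #   unconstrained MLEs from each simulated data set):
    #
    #       param_boot_lrt_file.write(str(i + 1) + '\t' + str(sim_lrt) + '\n')
    #       est_strings = [str(v) for v in sim_mle_list[:-1]]
    #       param_boot_param_est_file.write(str(i + 1) + '\t' + '\t'.join(est_strings) + '\n')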
    # null_dist will be a list that holds all of the simulated LRT values.  We
    #   use [] to create an empty list.
    #
    null_dist = []
    # A "for loop" will repeat the following instructions n_sims times.
    #
    sim_params = null_mle_list[:-1]
    for i in range(n_sims):
        # This simulates a data set assuming that the parameters are at the
        #   values that they take under the null hypothesis (since we want the
        #   null distribution of the test statistic).
        #
        sim_data = simulate_data(real_data, sim_params)

        # Calculate the LRT on the simulated data using the same functions
        #   that we used when we analyzed the real data.
        #
        sim_lrt, sim_mle_list, sim_null = calc_lrt_statistic(sim_data,
                                                             null_params,
                                                             initial_point=sim_params)

        # YOU WILL NEED TO ADD SOME CODE HERE TO CALL param_boot_lrt_file.write
        #   AND param_boot_param_est_file.write WITH A STRING THAT CONTAINS THE
        #   APPROPRIATE INFORMATION.  PUT A \t BETWEEN EACH ITEM THAT SHOULD BE
        #   IN A SEPARATE COLUMN.  PUT A \n AT THE END OF THE LINE.  YOU WILL
        #   HAVE TO USE str(x) TO CONVERT A NUMBER, x, TO A STRING THAT CAN BE
        #   WRITTEN TO THE FILE.

        # Add the simulated LRT to our null distribution.
        #
        null_dist.append(sim_lrt)

        # Write the value to the standard error stream.  The str() function
        #   converts numbers to strings so that they can be written to the
        #   output stream.
        #
        sys.stderr.write(str(i + 1))
        sys.stderr.write('\t')
        sys.stderr.write(str(sim_lrt))
        sys.stderr.write('\n')

    # We want the most extreme (largest) values of the LRT from the
    #   simulations.  If we sort the list in descending order, then these
    #   values will be at the front of the list (available by indexing the
    #   list with small numbers).
    #
    null_dist.sort(reverse=True)

    # We can report the value of the LRT that is exceeded by only 5% of the
    #   simulated values...
    #
    n_for_p_point05 = int(0.05*n_sims)
    print "5% critical value is approx =", null_dist[n_for_p_point05]

    # And we can calculate the P-value for our data by counting the number of
    #   simulated replicates that are more extreme than our observed data.
    # We do this by starting a counter at 0, walking through the stored null
    #   distribution, and adding 1 to our counter every time we see a
    #   simulated LRT that is at least as extreme as the "real" LRT.
    #
    n_more_extreme = 0
    for v in null_dist:
        if v >= lrt:
            n_more_extreme = n_more_extreme + 1
        else:
            break

    # Then we express this count of the number more extreme as a probability
    #   that a simulated value would be more extreme than the real data.
    #
    print "Approx P-value =", n_more_extreme/float(n_sims)