diff --git a/OptionSelect/create_excel.py b/OptionSelect/create_excel.py
new file mode 100644
index 0000000..4c98bf8
--- /dev/null
+++ b/OptionSelect/create_excel.py
@@ -0,0 +1,35 @@
+# -*- coding: utf-8 -*-
+"""
+Created on Fri Feb 12 15:14:24 2016
+
+@author: Calvin
+
+MRI prep script. This script should be run before anything else is done, preferably before the subject arrives.
+It creates the excel file into which the elicited preference ranks are entered and records the subject ID in options_to_edit.txt.
+"""
+
+import pandas as pd
+import numpy as np
+import os
+import xlwt
+
+check1 = 'no' #initialize while loop variables
+check2 = 'no'
+
+print('Current directory is: ' + os.getcwd())
+while check1!='yes': #check if path is okay (interrupt the script and change directory if it is not)
+    check1 = input("Is this path correct? Enter yes if correct: \n")
+
+while check2 != 'yes': #request SID and prompt for okay; anything that is not a whole number is asked for again
+    SID = input('Enter subject ID (digits only): ').strip()
+    check2 = input('Is '+ SID+  ' correct?\nEnter yes if correct:\n') if SID.isdecimal() else 'no'
+SID = int(SID) #normalise before any file is written so the name matches 'rank'+str(SID)+'.xls' rebuilt by ga_multi.py
+
+num_range = np.arange(2,62).astype('str') #spreadsheet rows 2-61 hold the 60 ranks (row 1 is the header)
+logic_vec = [xlwt.Formula('IF(B'+x+'=C'+x+',2,IF(C'+x+'=0,1,3))') for x in num_range] #type: 2 if item1=item2, 1 if item2=0, else 3
+
+empty_frame = pd.DataFrame(columns = ['rank', 'item1', 'item2', 'type']) #creates data frame
+empty_frame['rank'] = range(60) #populates dataframe
+empty_frame['type']=logic_vec
+empty_frame.to_excel('rank'+str(SID)+'.xls', index = False) #saves dataframe
+np.savetxt('options_to_edit.txt', [SID], fmt='%1.0f') #hands the subject ID over to ga_multi.py
\ No newline at end of file
diff --git a/OptionSelect/ga_multi copy.py b/OptionSelect/ga_multi copy.py
deleted file mode 100644
index 7cbe86a..0000000
--- a/OptionSelect/ga_multi copy.py	
+++ /dev/null
@@ -1,293 +0,0 @@
-# -*- coding: utf-8 -*-
-"""
-Created on Thu Aug 13 13:01:21 2015
-@author: Calvin
-"""
-
-#%%==========imports and constants=================%%#
-import numpy as np
-import pandas as pd
-from deap import base, creator, tools
-import matplotlib.pyplot as plt
-from scipy.stats import kstest, ks_2samp
-import random, operator, seaborn
-import multiprocessing as mp
-import json
-import os
-
-#os.chdir('C:\Users\Calvin\Documents\GitHub\Nypype_Workflows\MVPA')
-
-# Define the location of the csv file with modeled preferences, should make relative
-# Three col CSV (Item-Code, Option-Type, Value)
-csv_filepath='rank000.csv'
-
-
-#%% Magic Numbers
-#nepochs-number of epochs, ngen-number of generations in an epoch
-#cxpb- probability of a cross over occuring in one chromosome of a mating pair
-#mutpb- probability of at each nucleotide of a mutation
-#number of individuals to put in HOF in each epoc
-nepochs, ngen, npop, cxpb, mutpb =2,30,100, 0.1, 0.05
-    
-HOFsize=1
-
-HallOfFame=[]
-
-SID='a03'
-n_single=20 #1 number of possibilities for singleton
-n_hetero=15 #2 number of possibilities for the heterogenous bundle
-n_homo=22 #3 number of possibilities for the homogeneous scaling
-n_genome=n_single+n_hetero+n_homo #total number of possibilities for all cases
-n_target=10 #Desired number in each chromosome
-
-chromosomeDict={0:n_single, 1:n_hetero, 2:n_homo}
-
-#Define the seed for the random number generator for replication purposes
-random.seed(1)
-np.random.seed(1)
-
-#%%===========define fitness and functions=================%%#
-uni=np.random.uniform(0,60,500)
-
-def evalFit(individual): 
-    """ A weighted total of fitness scores to be maximized
-    RangeCost-maximum to minimum
-    SimilarityCost - number of items in both singleton and homogenous scaling
-    UniformCost- Uses KS divergence to indicate distance of distribution of values from uniform distribution
-    DistanceCost- Uses KS divergence to indicate differences between distributions
-    Cost currently is a simple weightable summation, might be changed to F score"""
-    indiv=genoToPheno(individual)
-    #####similarityCost=np.sum(np.in1d(individual[0][0],[ bundleLookup[k] for k in individual[0][1] ]))
-    similarityCost=np.sum(np.in1d([singletonLookup[k] for k in individual[0][0]],[ bundleLookup[k] for k in individual[0][1] ]))
-    similarity2=np.sum([np.sum(c)>1 for c in [np.in1d(p,[singletonLookup[k] for k in individual[0][0]]) for p in [ bundleLookup2[w] for w in individual[0][2] ]]])
-    #similarityCost=   np.sum([np.sum(c)>1 for c in [np.in1d(k,x) for k in y]])
-    #x is singelton, y is array of tuples of constituent items
-    ######similarity2=np.sum([np.sum(c)>1 for c in [np.in1d(p,individual[0][0]) for p in [ bundleLookup2[w] for w in individual[0][2] ]]])
-    rangeCost=(np.ptp(indiv[0])+np.ptp(indiv[1])+np.ptp(indiv[2]))/125
-    uniformCost=1/(kstest(indiv[0],'uniform')[0]+kstest(indiv[1],'uniform')[0]+kstest(indiv[2],'uniform')[0])
-    #uniformCost=(ks_2samp(indiv[0], uni)[1]+ks_2samp(indiv[1], uni)[1]+ks_2samp(indiv[2], uni)[1])    
-    distanceCost=(ks_2samp(indiv[0], indiv[1])[1]+ks_2samp(indiv[1], indiv[2])[1]+ks_2samp(indiv[2], indiv[0])[1])
-    cost=20*rangeCost+30*uniformCost+10*distanceCost+similarityCost+similarity2   
-    return (cost,)
-
-def getSims(individual):
-    similarityCost=np.sum(np.in1d([singletonLookup[k] for k in individual[0][0]],[ bundleLookup[k] for k in individual[0][1] ]))
-    similarity2=np.sum([np.sum(c)>1 for c in [np.in1d(p,[singletonLookup[k] for k in individual[0][0]]) for p in [ bundleLookup2[w] for w in individual[0][2] ]]])
-    print similarityCost
-    print similarity2
-    
-
-# Creates the initial generation      
-def createIndividual():
-    """Creates a random individual with 11 singleton, 10 het. bundle, 10 hom. scale"""    
-    return [random.sample(valueDictionary[1].keys(),n_target+1),
-               random.sample(valueDictionary[2].keys(),n_target),
-                random.sample(valueDictionary[3].keys(),n_target)]
-
-
-# Crossover algorithm          
-def nonReplicatingCross(ind1, ind2):
-    """Performs a crossover in-place"""
-    """Highly in need of new documentation"""
-    chromosomeNumber = random.randint(0,2)
-    indLength = len(ind1[chromosomeNumber])
-    cxpoint = random.randint(1,indLength-1)
-    child1 = np.zeros(indLength) #create a child array to use
-    child2 = np.zeros(indLength)
-    child1[0:cxpoint]=ind1[chromosomeNumber][0:cxpoint] #do the first half of the crossover
-    child2[0:cxpoint]=ind2[chromosomeNumber][0:cxpoint]
-    try:
-        child1[child1==0]=[x for x in ind2[chromosomeNumber] if x not in child1][0:len(child1[child1==0])]
-    except ValueError:
-        pass
-    if (child1[child1==0]!=[]) or (child1[child1==0]==[0]):
-        child1[child1==0]=random.sample([x for x in valueDictionary[chromosomeNumber+1].keys() if x not in child1], np.sum(np.where(child1==0, 1, 0)))
-    try:
-        child2[child2==0]=[x for x in ind1[chromosomeNumber] if x not in child2][0:len(child2[child2==0])]
-    except ValueError:
-        pass
-    if (child2[child2==0]!=[]) or (child2[child2==0]==[0]):
-        child2[child2==0]=random.sample([x for x in valueDictionary[chromosomeNumber+1].keys() if x not in child2], np.sum(np.where(child2==0, 1, 0)))
-    ind1[chromosomeNumber]=child1  #copy the child array onto the parent array (in place modification)
-    ind2[chromosomeNumber]=child2
-    
-    return ind1, ind2
-  
-#Mutation algorithm      
-def nonReplicatingMutate(ind,indpb):
-    """Mutates an individual in place"""
-    ind=np.asarray(ind) #copy indiviudal into numpy array
-    for chro in range(0,3):
-        for i in range(1,len(ind[chro])):
-                if random.random() < indpb: #for each nucleotide, use roulette to see if there is a mutation
-                            ind[chro][i]=(random.sample([x for x in valueDictionary[chro+1].keys() if x not in ind[chro]],1))[0]                                
-    return ind
-    del ind
-    
-#Maps genotype onto phenotype (item number onto value)    
-def genoToPheno(individual):
-    #print individual
-    indiv=[np.zeros(n_target+1), np.zeros(n_target), np.zeros(n_target)]
-    for chro in range(0,3):
-        for i in range(len(individual[0][chro])):
-            indiv[chro][i]=valueDictionary[chro+1][int(individual[0][chro][i])]
-    return indiv
-
-#stores top n individuals of an epoch in a list    
-def custHallOfFame(population,maxaddsize):
-    for i in tools.selBest(population, k=maxaddsize): 
-        HallOfFame.append(i)
-
-#checks for human error in value entry
-def inputErrorCheck(raw_data):
-    if not raw_data[['item1', 'item2']].applymap(np.isreal).all().all():
-        raise ValueError('Custom error, ask CL : Some item value is not a number')
-    if [raw_data['index']>60].any:
-        raise ValueError("Custom error, ask CL : An item index is > 60")
-    for bundleType in range(1,4):
-        if raw_data[raw_data['type']==bundleType].duplicated(subset=['item1', 'item2']).any():
-            print raw_data[raw_data['type']==bundleType].duplicated(subset=['item1', 'item2'])
-            raise ValueError('Custom error, ask CL : Some item value is duplicated')
-    
-    
-
-#%%==============import data from csv======================%%#
-raw_choice_dataset = pd.read_csv(csv_filepath, sep=',', header=0)
-
-raw_choice_dataset=raw_choice_dataset[raw_choice_dataset['SID']==SID]
-
-valueDictionary={}
-for x in range(1,4):
-  #Create a dictionary/hashtable associating the unique ID assigned to each singleton or bundle to its modeled value
-    placeholderValueDictionary={}
-    for rows in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==x].iterrows():
-        #rows[1][6]=rows[1][2] # change this once modeling is done
-        placeholderValueDictionary[int(rows[1]['index'])] =float(rows[1]['index'])
-    valueDictionary[x]=placeholderValueDictionary
-    
-singletonLookup={}
-for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==1].iterrows():
-    singletonLookup[int(x[1]['index'])]=int(x[1]['item1'])
-
-bundleLookup={}
-for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==2].iterrows():
- #create a dictionary/hastable that gives constituent item in homogeneous bundles
-    bundleLookup[int(x[1]['index'])]=int(x[1]['item1'])
-    
-bundleLookup2={}
-for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==3].iterrows():
-    bundleLookup2[int(x[1]['index'])]=(int(x[1]['item1']),int(x[1]['item2']))
-#%%===============initialize toolbox=======================%%#
-creator.create("FitnessMax", base.Fitness, weights=(1.0,))
-creator.create("Individual", list, typecode="d", fitness=creator.FitnessMax)
-
-stats = tools.Statistics(key=operator.attrgetter("fitness.values"))
-stats.register("max", np.max)
-stats.register("mean", np.mean)
-stats.register("min", np.min)
-
-toolbox = base.Toolbox()
-
-toolbox.register("HOF", custHallOfFame, maxaddsize=HOFsize)
-toolbox.register("create_individual", createIndividual)
-toolbox.register("individuals", tools.initRepeat, creator.Individual,
-                 toolbox.create_individual, n=1) 
-toolbox.register("population", tools.initRepeat, list, toolbox.individuals)
-
-toolbox.register("evaluate", evalFit)
-
-toolbox.register("mate", nonReplicatingCross)
-toolbox.register("mutate", nonReplicatingMutate, indpb=.1)
-toolbox.register("select", tools.selTournament, tournsize=2)
-
-
-#toolbox.register('map', futures.map)
-
-s= tools.Statistics()
-s.register("max", np.max)
-s.register("mean", np.mean)
-
-log=tools.Logbook()
-
-def main_program(pop):    
-    fitnesses = toolbox.map(toolbox.evaluate, pop) # eval. fitness of pop
-    for ind, fit in zip(pop, fitnesses):
-        ind.fitness.values = fit
-    
-    for g in range(ngen):  
-        if g%5==0:
-            print str(g) + ' of ' + str(ngen)       
-        offspring = toolbox.select(pop, len(pop)) #select which individuals to mate
-        offspring = map(toolbox.clone, offspring)
-        
-        for child1, child2 in zip(offspring[::2], offspring[1::2]): #determine whether to have a cross over
-            if random.random() < cxpb:
-                child1[0], child2[0] = toolbox.mate(child1[0], child2[0])
-                del child1.fitness.values, child2.fitness.values
-    
-        for mutant in offspring: #determine whether to mutate
-            if random.random() < mutpb:
-                mutant[0]=toolbox.mutate(mutant[0])
-                del mutant.fitness.values      
-        
-        invalids = [ind for ind in offspring if not ind.fitness.valid] #assign fitness scores to new offspring
-        fitnesses = toolbox.map(toolbox.evaluate, invalids)
-        for ind, fit in zip(invalids, fitnesses):
-            ind.fitness.values = fit  
-        
-        log.record(gen=g,**stats.compile(pop))
-        pop[:] = offspring #update population with offspring    
-    return tools.selBest(pop,k=1)[0][0]
-
-#%%======================main==============================%%#
-if __name__ == '__main__':  
-    print 'GA algorithm starting with the following settings:'
-    print 'nepochs = ' + str(nepochs) + ' ngen = ' + str(ngen) + ' npop = ' + str(npop)
-    print 'cxpb = ' + str(cxpb) + ' mutpb = ' + str(mutpb)
-    answer = input('Are the following settings okay? (0/1)  ')
-    if answer == 0:
-        raise ValueError('Custom Error: Please change settings in script file')    
-    
-    print 'initializing processing pool'
-    return_var= []
-    processes = []
-    pool = mp.Pool(processes = 8)
-    pop_pool = [toolbox.population(n=npop) for x in range(8)]
-    results = pool.map(main_program,pop_pool)
-    pool.close()
-    print 'pool finished, outputing to JSON'    
-    
-    results = [[np.sort(x[0]),np.sort(x[1]),np.sort(x[2])] for x in results]
-    
-    resultsFit = [evalFit([x]) for x in results]
-    maxIndex = np.argmax(resultsFit)
-    
-    bestIndividual = results[maxIndex]
-    
-    singletonTransed = [singletonLookup[item] for item in bestIndividual[0]]
-    median = singletonTransed[5]
-    singletonTransed = np.delete(singletonTransed, 5).tolist()
-    homoTransed = [bundleLookup[item] for item in bestIndividual[1]]
-    heteroTransed = [bundleLookup2[item] for item in bestIndividual[2]]
-    
-    outputData = { 'singleton' : singletonTransed, 'homo' : homoTransed, 'hetero' : heteroTransed, 'median' : median }
-    outputData = json.dumps(outputData)
-    with open('jsonOut.txt', 'w') as outfile:
-        outfile.write(str(outputData))
-        
-    outputDataFull = np.hstack((bestIndividual[0], bestIndividual[1],bestIndividual[2]))
-    outputDataFull = np.sort(outputDataFull)
-    transedFullData = []
-    for x in outputDataFull:
-        if x in singletonLookup.keys():
-            transedFullData.append(singletonLookup[x])
-        if x in bundleLookup.keys():
-            transedFullData.append(bundleLookup[x])
-        if x in bundleLookup2.keys():
-            transedFullData.append(bundleLookup2[x])
-        else:
-            raise ValueError('Custom error: item in outputData JSON was not in any value dictionary')
-    outputData = { 'options' : transedFullData}
-    outputData = json.dumps(outputData)
-    with open('jsonOutExtended.txt', 'w') as outfile:
-        outfile.write(str(outputData))
\ No newline at end of file
diff --git a/OptionSelect/ga_multi.py b/OptionSelect/ga_multi.py
index d4e8493..254ddb3 100644
--- a/OptionSelect/ga_multi.py
+++ b/OptionSelect/ga_multi.py
@@ -1,296 +1,310 @@
-# -*- coding: utf-8 -*-
-"""
-Created on Thu Aug 13 13:01:21 2015
-
-@author: Calvin
-"""
-
-#%%==========imports and constants=================%%#
-import numpy as np
-import pandas as pd
-from deap import base, creator, tools
-import matplotlib.pyplot as plt
-from scipy.stats import kstest, ks_2samp
-import random, operator, seaborn
-import multiprocessing as mp
-import json
-import os
-
-os.chdir('/Users/Dalton/Documents/Projects/BundledOptionsExp/Collection/OptionSelect')
-
-# Define the location of the csv file with modeled preferences, should make relative
-# Three col CSV (Item-Code, Option-Type, Value)
-csv_filepath='rank3306.csv'
-
-
-#%% Magic Numbers
-#nepochs-number of epochs, ngen-number of generations in an epoch
-#cxpb- probability of a cross over occuring in one chromosome of a mating pair
-#mutpb- probability of at each nucleotide of a mutation
-#number of individuals to put in HOF in each epoc
-nepochs, ngen, npop, cxpb, mutpb =2,80,2000, 0.1, 0.05
-    
-HOFsize=1
-
-HallOfFame=[]
-
-SID='a03'
-n_single=20 #1 number of possibilities for singleton
-n_hetero=15 #2 number of possibilities for the heterogenous bundle
-n_homo=22 #3 number of possibilities for the homogeneous scaling
-n_genome=n_single+n_hetero+n_homo #total number of possibilities for all cases
-n_target=10 #Desired number in each chromosome
-
-chromosomeDict={0:n_single, 1:n_hetero, 2:n_homo}
-
-#Define the seed for the random number generator for replication purposes
-random.seed(1)
-np.random.seed(1)
-
-#%%===========define fitness and functions=================%%#
-uni=np.random.uniform(0,60,500)
-
-def evalFit(individual): 
-    """ A weighted total of fitness scores to be maximized
-    RangeCost-maximum to minimum
-    SimilarityCost - number of items in both singleton and homogenous scaling
-    UniformCost- Uses KS divergence to indicate distance of distribution of values from uniform distribution
-    DistanceCost- Uses KS divergence to indicate differences between distributions
-    Cost currently is a simple weightable summation, might be changed to F score"""
-    indiv=genoToPheno(individual)
-    #####similarityCost=np.sum(np.in1d(individual[0][0],[ bundleLookup[k] for k in individual[0][1] ]))
-    similarityCost=np.sum(np.in1d([singletonLookup[k] for k in individual[0][0]],[ bundleLookup[k] for k in individual[0][1] ]))
-    similarity2=np.sum([np.sum(c)>1 for c in [np.in1d(p,[singletonLookup[k] for k in individual[0][0]]) for p in [ bundleLookup2[w] for w in individual[0][2] ]]])
-    #similarityCost=   np.sum([np.sum(c)>1 for c in [np.in1d(k,x) for k in y]])
-    #x is singelton, y is array of tuples of constituent items
-    ######similarity2=np.sum([np.sum(c)>1 for c in [np.in1d(p,individual[0][0]) for p in [ bundleLookup2[w] for w in individual[0][2] ]]])
-    rangeCost=(np.ptp(indiv[0])+np.ptp(indiv[1])+np.ptp(indiv[2]))/125
-    uniformCost=1/(kstest(indiv[0],'uniform')[0]+kstest(indiv[1],'uniform')[0]+kstest(indiv[2],'uniform')[0])
-    #uniformCost=(ks_2samp(indiv[0], uni)[1]+ks_2samp(indiv[1], uni)[1]+ks_2samp(indiv[2], uni)[1])    
-    distanceCost=(ks_2samp(indiv[0], indiv[1])[1]+ks_2samp(indiv[1], indiv[2])[1]+ks_2samp(indiv[2], indiv[0])[1])
-    cost=20*rangeCost+30*uniformCost+10*distanceCost+similarityCost+similarity2   
-    return (cost,)
-
-def getSims(individual):
-    similarityCost=np.sum(np.in1d([singletonLookup[k] for k in individual[0][0]],[ bundleLookup[k] for k in individual[0][1] ]))
-    similarity2=np.sum([np.sum(c)>1 for c in [np.in1d(p,[singletonLookup[k] for k in individual[0][0]]) for p in [ bundleLookup2[w] for w in individual[0][2] ]]])
-    print similarityCost
-    print similarity2
-    
-
-# Creates the initial generation      
-def createIndividual():
-    """Creates a random individual with 11 singleton, 10 het. bundle, 10 hom. scale"""    
-    return [random.sample(valueDictionary[1].keys(),n_target+1),
-               random.sample(valueDictionary[2].keys(),n_target),
-                random.sample(valueDictionary[3].keys(),n_target)]
-
-
-# Crossover algorithm          
-def nonReplicatingCross(ind1, ind2):
-    """Performs a crossover in-place"""
-    """Highly in need of new documentation"""
-    chromosomeNumber = random.randint(0,2)
-    indLength = len(ind1[chromosomeNumber])
-    cxpoint = random.randint(1,indLength-1)
-    child1 = np.zeros(indLength) #create a child array to use
-    child2 = np.zeros(indLength)
-    child1[0:cxpoint]=ind1[chromosomeNumber][0:cxpoint] #do the first half of the crossover
-    child2[0:cxpoint]=ind2[chromosomeNumber][0:cxpoint]
-    try:
-        child1[child1==0]=[x for x in ind2[chromosomeNumber] if x not in child1][0:len(child1[child1==0])]
-    except ValueError:
-        pass
-    if (child1[child1==0]!=[]) or (child1[child1==0]==[0]):
-        child1[child1==0]=random.sample([x for x in valueDictionary[chromosomeNumber+1].keys() if x not in child1], np.sum(np.where(child1==0, 1, 0)))
-    try:
-        child2[child2==0]=[x for x in ind1[chromosomeNumber] if x not in child2][0:len(child2[child2==0])]
-    except ValueError:
-        pass
-    if (child2[child2==0]!=[]) or (child2[child2==0]==[0]):
-        child2[child2==0]=random.sample([x for x in valueDictionary[chromosomeNumber+1].keys() if x not in child2], np.sum(np.where(child2==0, 1, 0)))
-    ind1[chromosomeNumber]=child1  #copy the child array onto the parent array (in place modification)
-    ind2[chromosomeNumber]=child2
-    
-    return ind1, ind2
-  
-#Mutation algorithm      
-def nonReplicatingMutate(ind,indpb):
-    """Mutates an individual in place"""
-    ind=np.asarray(ind) #copy indiviudal into numpy array
-    for chro in range(0,3):
-        for i in range(1,len(ind[chro])):
-                if random.random() < indpb: #for each nucleotide, use roulette to see if there is a mutation
-                            ind[chro][i]=(random.sample([x for x in valueDictionary[chro+1].keys() if x not in ind[chro]],1))[0]                                
-    return ind
-    del ind
-    
-#Maps genotype onto phenotype (item number onto value)    
-def genoToPheno(individual):
-    #print individual
-    indiv=[np.zeros(n_target+1), np.zeros(n_target), np.zeros(n_target)]
-    for chro in range(0,3):
-        for i in range(len(individual[0][chro])):
-            indiv[chro][i]=valueDictionary[chro+1][int(individual[0][chro][i])]
-    return indiv
-
-#stores top n individuals of an epoch in a list    
-def custHallOfFame(population,maxaddsize):
-    for i in tools.selBest(population, k=maxaddsize): 
-        HallOfFame.append(i)
-
-#checks for human error in value entry
-def inputErrorCheck(raw_data):
-    if not raw_data[['item1', 'item2']].applymap(np.isreal).all().all():
-        raise ValueError('Custom error, ask CL : Some item value is not a number')
-    if [raw_data['index']>60].any:
-        raise ValueError("Custom error, ask CL : An item index is > 60")
-    for bundleType in range(1,4):
-        if raw_data[raw_data['type']==bundleType].duplicated(subset=['item1', 'item2']).any():
-            print raw_data[raw_data['type']==bundleType].duplicated(subset=['item1', 'item2'])
-            raise ValueError('Custom error, ask CL : Some item value is duplicated')
-    
-    
-
-#%%==============import data from csv======================%%#
-raw_choice_dataset = pd.read_csv(csv_filepath, sep=',', header=0)
-
-valueDictionary={}
-for x in range(1,4):
-  #Create a dictionary/hashtable associating the unique ID assigned to each singleton or bundle to its modeled value
-    placeholderValueDictionary={}
-    for rows in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==x].iterrows():
-        #rows[1][6]=rows[1][2] # change this once modeling is done
-        placeholderValueDictionary[int(rows[1]['rank'])] =float(rows[1]['rank'])
-    valueDictionary[x]=placeholderValueDictionary
-    
-singletonLookup={}
-for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==1].iterrows():
-    singletonLookup[int(x[1]['rank'])]=int(x[1]['item1'])
-
-bundleLookup={}
-for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==2].iterrows():
- #create a dictionary/hastable that gives constituent item in homogeneous bundles
-    bundleLookup[int(x[1]['rank'])]=int(x[1]['item1'])
-    
-bundleLookup2={}
-for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==3].iterrows():
-    bundleLookup2[int(x[1]['rank'])]=(int(x[1]['item1']),int(x[1]['item2']))
-#%%===============initialize toolbox=======================%%#
-creator.create("FitnessMax", base.Fitness, weights=(1.0,))
-creator.create("Individual", list, typecode="d", fitness=creator.FitnessMax)
-
-stats = tools.Statistics(key=operator.attrgetter("fitness.values"))
-stats.register("max", np.max)
-stats.register("mean", np.mean)
-stats.register("min", np.min)
-
-toolbox = base.Toolbox()
-
-toolbox.register("HOF", custHallOfFame, maxaddsize=HOFsize)
-toolbox.register("create_individual", createIndividual)
-toolbox.register("individuals", tools.initRepeat, creator.Individual,
-                 toolbox.create_individual, n=1) 
-toolbox.register("population", tools.initRepeat, list, toolbox.individuals)
-
-toolbox.register("evaluate", evalFit)
-
-toolbox.register("mate", nonReplicatingCross)
-toolbox.register("mutate", nonReplicatingMutate, indpb=.1)
-toolbox.register("select", tools.selTournament, tournsize=2)
-
-
-#toolbox.register('map', futures.map)
-
-s= tools.Statistics()
-s.register("max", np.max)
-s.register("mean", np.mean)
-
-log=tools.Logbook()
-
-def main_program(pop):    
-    fitnesses = toolbox.map(toolbox.evaluate, pop) # eval. fitness of pop
-    for ind, fit in zip(pop, fitnesses):
-        ind.fitness.values = fit
-    
-    for g in range(ngen):  
-        if g%5==0:
-            print str(g) + ' of ' + str(ngen)       
-        offspring = toolbox.select(pop, len(pop)) #select which individuals to mate
-        offspring = map(toolbox.clone, offspring)
-        
-        for child1, child2 in zip(offspring[::2], offspring[1::2]): #determine whether to have a cross over
-            if random.random() < cxpb:
-                child1[0], child2[0] = toolbox.mate(child1[0], child2[0])
-                del child1.fitness.values, child2.fitness.values
-    
-        for mutant in offspring: #determine whether to mutate
-            if random.random() < mutpb:
-                mutant[0]=toolbox.mutate(mutant[0])
-                del mutant.fitness.values      
-        
-        invalids = [ind for ind in offspring if not ind.fitness.valid] #assign fitness scores to new offspring
-        fitnesses = toolbox.map(toolbox.evaluate, invalids)
-        for ind, fit in zip(invalids, fitnesses):
-            ind.fitness.values = fit  
-        
-        log.record(gen=g,**stats.compile(pop))
-        pop[:] = offspring #update population with offspring    
-    return tools.selBest(pop,k=1)[0][0]
-
-#%%======================main==============================%%#
-if __name__ == '__main__':  
-    print 'GA algorithm starting with the following settings:'
-    print 'nepochs = ' + str(nepochs) + ' ngen = ' + str(ngen) + ' npop = ' + str(npop)
-    print 'cxpb = ' + str(cxpb) + ' mutpb = ' + str(mutpb)
-    answer = input('Are the following settings okay? (0/1)  ')
-    if answer == 0:
-        raise ValueError('Custom Error: Please change settings in script file')    
-    
-    print 'initializing processing pool'
-    return_var= []
-    processes = []
-    pool = mp.Pool(processes = 8)
-    pop_pool = [toolbox.population(n=npop) for x in range(8)]
-    results = pool.map(main_program,pop_pool)
-    pool.close()
-    print 'pool finished, outputing to JSON'    
-    
-    results = [[np.sort(x[0]),np.sort(x[1]),np.sort(x[2])] for x in results]
-    
-    resultsFit = [evalFit([x]) for x in results]
-    maxIndex = np.argmax(resultsFit)
-    
-    bestIndividual = results[maxIndex]
-    
-    singletonTransed = [singletonLookup[item] for item in bestIndividual[0]]
-    median = singletonTransed[5]
-    medianUntransed = bestIndividual[0][5]
-    singletonTransed = np.delete(singletonTransed, 5).tolist()
-    homoTransed = [bundleLookup[item] for item in bestIndividual[1]]
-    heteroTransed = [bundleLookup2[item] for item in bestIndividual[2]]
-    
-    outputData = { 'singleton' : singletonTransed, 'homo' : homoTransed, 'hetero' : heteroTransed, 'median' : median }
-    outputData = json.dumps(outputData)
-    with open('jsonOut.txt', 'w') as outfile:
-        outfile.write(str(outputData))
-
-    extended = np.unique(np.hstack((np.ravel([bundleLookup[x] for x in bestIndividual[1]]), np.ravel([bundleLookup2[x] for x in bestIndividual[2]]), bestIndividual[0])))
-    outputDataFull = np.hstack((extended, bestIndividual[1],bestIndividual[2], medianUntransed))
-    outputDataFull = np.unique(outputDataFull)
-    outputDataFull = np.sort(outputDataFull)
-    transedFullData = []
-    for x in outputDataFull:
-        if x in singletonLookup.keys():
-            transedFullData.append(singletonLookup[x])
-        elif x in bundleLookup.keys():
-            transedFullData.append((bundleLookup[x],bundleLookup[x]))
-        elif x in bundleLookup2.keys():
-            transedFullData.append(bundleLookup2[x])
-        else:
-            raise ValueError('Custom error: item in outputData JSON was not in any value dictionary')
-    outputData = { 'options' : transedFullData}
-    outputData = json.dumps(outputData)
-    with open('jsonOutExtended.txt', 'w') as outfile:
-        outfile.write(str(outputData))
-        
+# -*- coding: utf-8 -*-
+"""
+Created on Thu Aug 13 13:01:21 2015
+@author: Calvin Leather
+
+This script uses the item rankings given by participants to determine a well balanced set of decision options.
+It takes as input the excel file used to record those rankings (rank<SID>.xls, with the SID read from options_to_edit.txt).
+"""
+
+#%%==========imports and constants=================%%#
+import numpy as np
+import pandas as pd
+from deap import base, creator, tools
+from scipy.stats import kstest, ks_2samp
+import random, operator
+import multiprocessing as mp
+import json
+import os
+import matplotlib.pyplot as plt
+import seaborn as sns
+
+# Build the name of the rank spreadsheet from the subject ID stored in options_to_edit.txt.
+# create_excel.py writes that spreadsheet with the columns rank, item1, item2, type (variable name kept from the csv version)
+try:
+    option_text = np.loadtxt('options_to_edit.txt')
+    inputSID = int(option_text)
+except Exception: #missing, empty or non-numeric file; KeyboardInterrupt/SystemExit are no longer swallowed
+    raise ValueError('Something is wrong w options_to_edit.txt. Please edit this file with the correct SID and rerun')
+csv_filepath=r'rank' + str(inputSID)+ '.xls'
+
+
+#%% Magic Numbers
+#nepochs - number of epochs, ngen - number of generations in an epoch, npop - population size
+#cxpb - probability of a crossover occurring in one chromosome of a mating pair
+#mutpb - probability of a mutation at each nucleotide
+#HOFsize (below) - number of individuals to put in the HOF in each epoch
+nepochs, ngen, npop, cxpb, mutpb =2,50,250, 0.1, 0.05
+n_proc = 2 #presumably the number of worker processes - its use is outside this view, confirm
+    
+HOFsize=1
+
+HallOfFame=[]
+
+n_single=20 #1 number of possibilities for singleton
+n_hetero=15 #2 number of possibilities for the heterogenous bundle
+n_homo=22 #3 number of possibilities for the homogeneous scaling
+n_genome=n_single+n_hetero+n_homo #total number of possibilities for all cases
+n_target=10 #Desired number in each chromosome
+#NOTE(review): create_excel.py's formula yields type 2 when item1 == item2 and type 3 otherwise - confirm the #2/#3 labels above
+
+chromosomeDict={0:n_single, 1:n_hetero, 2:n_homo}
+
+#Seeding of the random number generators for replication is currently disabled: both calls below are commented out
+#random.seed(1)
+#np.random.seed(1)
+
+#%%===========define fitness and functions=================%%#
+#uni=np.random.uniform(0,60,500)
+
+def evalFit(individual):
+    """Return the fitness of an individual as a 1-tuple; larger totals are better.
+    individual[0] holds three chromosomes (numeric sequences); each is sorted before scoring.
+    rangeCost   - 3 * summed range (max - min) of the chromosomes; it enters the total twice
+    diffCost    - penalty: 2 * variance of the three chromosome means
+    spacingCost - 5 * summed mean gap between neighbours, with 0 and 60 added as end points
+    varCost/adjCost - penalties: 10 * summed cubed gap variance; 15 per pair of values exactly 1 apart"""
+    chromos = [np.sort(individual[0][i]) for i in range(3)]
+    gaps = [np.diff(np.hstack((0, c, 60))) for c in chromos] #neighbour gaps, padded with 0 and 60
+    rangeCost = 3*(np.ptp(chromos[0])+np.ptp(chromos[1])+np.ptp(chromos[2]))
+    diffCost = -2*np.var((np.mean(chromos[0]), np.mean(chromos[1]), np.mean(chromos[2])))
+    spacingCost = 5*(np.mean(gaps[0])+np.mean(gaps[1])+np.mean(gaps[2]))
+    varCost = -10*(np.power(np.var(gaps[0]),3)+np.power(np.var(gaps[1]),3)+np.power(np.var(gaps[2]),3))
+    adjCost = -15*(np.sum(np.diff(chromos[0])==1)+np.sum(np.diff(chromos[1])==1)+np.sum(np.diff(chromos[2])==1))
+    #NOTE(review): rangeCost appears twice in this sum, which doubles its weight - confirm that is intended
+    total = rangeCost+spacingCost+varCost+rangeCost+diffCost+adjCost
+    return (total,)
+
+def getSims(individual): #prints two item-overlap counts between the singleton and the bundle chromosomes
+    singles = [singletonLookup[k] for k in individual[0][0]]
+    sharedWithType2 = np.sum(np.in1d(singles,[bundleLookup[k] for k in individual[0][1]]))
+    type3FromSingles = np.sum([np.sum(np.in1d(bundleLookup2[w],singles))>1 for w in individual[0][2]])
+    print(sharedWithType2, type3FromSingles, sep='\n')
+    
+
+# Creates the initial generation      
+def createIndividual():
+    """Creates a random individual: n_target+1 singleton ranks plus n_target ranks for each of bundle types 2 and 3"""
+    #list(...) because random.sample needs a sequence; passing dict keys raises TypeError on Python >= 3.11
+    sizes = {1:n_target+1, 2:n_target, 3:n_target}
+    return [random.sample(list(valueDictionary[t]),sizes[t]) for t in (1,2,3)]
+
+
+# Crossover algorithm          
+def nonReplicatingCross(ind1, ind2):
+    """Performs a single-point crossover in-place on one randomly chosen chromosome of ind1 and ind2, avoiding repeated genes; returns (ind1, ind2)"""
+    """Highly in need of new documentation"""
+    chromosomeNumber = random.randint(0,2) #pick one of the three chromosomes (randint is inclusive)
+    indLength = len(ind1[chromosomeNumber])
+    cxpoint = random.randint(1,indLength-1) #crossover point; the head keeps between 1 and indLength-1 genes
+    child1 = np.zeros(indLength) #children start as all zeros; 0 marks a slot still to be filled (NOTE(review): 0 also looks like a valid rank - confirm)
+    child2 = np.zeros(indLength)
+    child1[0:cxpoint]=ind1[chromosomeNumber][0:cxpoint] #each child keeps the head of its own parent
+    child2[0:cxpoint]=ind2[chromosomeNumber][0:cxpoint]
+    try: #fill the open slots of child1 with genes of ind2 that child1 does not hold yet
+        child1[child1==0]=[x for x in ind2[chromosomeNumber] if x not in child1][0:len(child1[child1==0])]
+    except ValueError: #presumably raised when there are fewer such genes than open slots; the slots then stay 0
+        pass
+    if (child1[child1==0]!=[]) or (child1[child1==0]==[0]): #NOTE(review): array-vs-list comparison, result depends on the NumPy version - confirm
+        child1[child1==0]=random.sample([x for x in valueDictionary[chromosomeNumber+1].keys() if x not in child1], np.sum(np.where(child1==0, 1, 0)))
+    try: #same two fill steps for child2, taking genes from ind1
+        child2[child2==0]=[x for x in ind1[chromosomeNumber] if x not in child2][0:len(child2[child2==0])]
+    except ValueError:
+        pass
+    if (child2[child2==0]!=[]) or (child2[child2==0]==[0]):
+        child2[child2==0]=random.sample([x for x in valueDictionary[chromosomeNumber+1].keys() if x not in child2], np.sum(np.where(child2==0, 1, 0)))
+    ind1[chromosomeNumber]=child1  #copy the child array onto the parent array (in place modification)
+    ind2[chromosomeNumber]=child2
+    
+    return ind1, ind2
+  
+#Mutation algorithm      
+def nonReplicatingMutate(ind,indpb):
+    """Mutates an individual in place and returns it: each nucleotide after the first of a
+    chromosome is replaced, with probability indpb, by a key not yet in that chromosome"""
+    #works on ind directly: np.asarray(ind) fails on NumPy >= 1.24 because the chromosomes differ in length
+    for chro in range(0,3):
+        for i in range(1,len(ind[chro])): #NOTE(review): position 0 is never mutated - confirm intended
+            if random.random() < indpb: #for each nucleotide, use roulette to see if there is a mutation
+                ind[chro][i]=(random.sample([x for x in valueDictionary[chro+1].keys() if x not in ind[chro]],1))[0]
+    return ind
+    
+#Maps genotype onto phenotype (item number onto value)    
+def genoToPheno(individual):
+    """Translates the genes of individual[0] into their valueDictionary values (one array per chromosome)"""
+    phenotype=[np.zeros(n_target+1), np.zeros(n_target), np.zeros(n_target)]
+    for chro, values in enumerate(phenotype):
+        for i, gene in enumerate(individual[0][chro]):
+            values[i]=valueDictionary[chro+1][int(gene)]
+    return phenotype
+
+def inputErrorCheck(raw_data): #checks for human error in value entry; raises ValueError on the first problem found
+    items = raw_data[['item1', 'item2']]
+    if not items.applymap(np.isreal).all().all():
+        raise ValueError('Custom error, ask CL : Some item value is not a number')
+    if (raw_data.index>=60).any():
+        raise ValueError("Custom error, ask CL : An item index is > 60")
+    if items.duplicated().any():
+        print(raw_data[items.duplicated()])
+        raise ValueError('Custom error, ask CL : Some item value is duplicated')
+    if items.applymap(lambda x: x>30).any().any():
+        raise ValueError('Item number is greater than 30')
+        
+def getRank(item):
+    """Looks up the rank of an (item1, item2) tuple in raw_choice_dataset; used as a sort key"""
+    if type(item)!=tuple:
+        raise ValueError('Custom error: Some item is not a tuple in rank ordering')
+    return raw_choice_dataset.loc[(raw_choice_dataset['item1']==item[0]) & (raw_choice_dataset['item2']==item[1]),'rank'].values[0]
+
+#%%==============import data from csv======================%%#
+raw_choice_dataset = pd.read_excel(csv_filepath, header=0) #read_excel has no 'sep' argument; passing it raises TypeError on pandas >= 1.0
+
+inputErrorCheck(raw_choice_dataset) #stop with a ValueError before any lookup is built from bad input
+
+valueDictionary={} #option type (1, 2, 3) -> {rank: value} for the rows of that type
+for x in range(1,4):
+  #Build the {rank: value} table for type x; the value stored is currently the rank itself, as a float
+    placeholderValueDictionary={}
+    for rows in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==x].iterrows():
+        #rows[1][6]=rows[1][2] # change this once modeling is done
+        placeholderValueDictionary[int(rows[1]['rank'])] =float(rows[1]['rank'])
+    valueDictionary[x]=placeholderValueDictionary
+    
+singletonLookup={} #rank -> item1 for the type 1 rows
+for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==1].iterrows():
+    singletonLookup[int(x[1]['rank'])]=int(x[1]['item1'])
+
+bundleLookup={} #rank -> item1 for the type 2 rows
+for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==2].iterrows():
+ #only item1 is stored for type 2 rows (described as homogeneous bundles, so presumably item2 repeats item1 - confirm)
+    bundleLookup[int(x[1]['rank'])]=int(x[1]['item1'])
+    
+bundleLookup2={} #rank -> (item1, item2) for the type 3 rows
+for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==3].iterrows():
+    bundleLookup2[int(x[1]['rank'])]=(int(x[1]['item1']),int(x[1]['item2']))
+#%%===============initialize toolbox=======================%%#
+creator.create("FitnessMax", base.Fitness, weights=(1.0,)) #single objective with positive weight, i.e. maximized
+creator.create("Individual", list, typecode="d", fitness=creator.FitnessMax)
+
+stats = tools.Statistics(key=operator.attrgetter("fitness.values")) #per-generation summary of the fitness values
+stats.register("max", np.max)
+stats.register("mean", np.mean)
+stats.register("min", np.min)
+
+toolbox = base.Toolbox()
+
+toolbox.register("HOF", tools.HallOfFame, maxsize = 5) #NOTE(review): toolbox.HOF is not called in the code below
+toolbox.register("create_individual", createIndividual)
+toolbox.register("individuals", tools.initRepeat, creator.Individual,
+                 toolbox.create_individual, n=1) #n=1: the three chromosomes sit together in element [0] of an Individual
+toolbox.register("population", tools.initRepeat, list, toolbox.individuals)
+
+toolbox.register("evaluate", evalFit)
+
+toolbox.register("mate", nonReplicatingCross)
+toolbox.register("mutate", nonReplicatingMutate, indpb=.1) #indpb: chance of changing each nucleotide of a mutated individual
+toolbox.register("select", tools.selTournament, tournsize=3)
+
+
+#toolbox.register('map', futures.map)
+
+s= tools.Statistics() #NOTE(review): s is not used in the code below
+s.register("max", np.max)
+s.register("mean", np.mean)
+
+log=tools.Logbook() #filled by main_program, one record per generation
+
+def main_program(pop): #runs ngen generations of the GA on pop; returns (chromosome list of the fittest individual, log, HOF)
+    HOF = [] #never filled in this function, so it is always returned empty
+    fitnesses = toolbox.map(toolbox.evaluate, pop) # eval. fitness of pop
+    for ind, fit in zip(pop, fitnesses):
+        ind.fitness.values = fit
+    
+    for g in range(ngen):  
+        if g%5==0: #progress message every fifth generation
+            print(str(g) + ' of ' + str(ngen))       
+        offspring = toolbox.select(pop, len(pop)) #select which individuals to mate
+        offspring = list(map(toolbox.clone, offspring)) #work on copies so the selected parents are not modified
+        
+        for child1, child2 in zip(offspring[::2], offspring[1::2]): #determine whether to have a cross over
+            if random.random() < cxpb:
+                toolbox.mate(child1[0], child2[0]) #return value ignored; relies on the in-place change of both chromosome lists
+                del child1.fitness.values, child2.fitness.values #marks both children for re-evaluation
+    
+        for mutant in offspring: #determine whether to mutate
+            if random.random() < mutpb:
+                toolbox.mutate(mutant[0]) #return value ignored; relies on the in-place change
+                del mutant.fitness.values      
+        
+        invalids = [ind for ind in offspring if not ind.fitness.valid] #assign fitness scores to new offspring
+        fitnesses = toolbox.map(toolbox.evaluate, invalids)
+        for ind, fit in zip(invalids, fitnesses):
+            ind.fitness.values = fit  
+        
+        pop[:] = offspring #update population with offspring
+        log.record(gen=g,**stats.compile(pop)) #max/mean/min fitness of the new population
+    return tools.selBest(pop,k=1)[0][0], log, HOF
+
+#%%======================main==============================%%#
+if __name__ == '__main__':  
+    print('GA algorithm starting with the following settings:')
+    print('nepochs = ' + str(nepochs) + ' ngen = ' + str(ngen) + ' npop = ' + str(npop))
+    print('cxpb = ' + str(cxpb) + ' mutpb = ' + str(mutpb) + ' SID = ' + str(inputSID))
+    answer = input('Are the following settings okay? (0/1)  ')
+    if str(answer).strip() == '0': #input() returns a string on Python 3, so the old comparison with the int 0 never matched
+        raise ValueError('Custom Error: Please change settings in script file')    
+    
+    print('initializing processing pool')
+    return_var= []
+    processes = []
+    pool = mp.Pool(processes = n_proc)
+    pop_pool = [toolbox.population(n=npop) for x in range(n_proc)] #one independent population per worker
+    results = pool.map(main_program,pop_pool) #each result is (best chromosome list, log, HOF)
+    pool.close()
+    print('pool finished, outputing to JSON')    
+    
+    best_inds = [x[0] for x in results]
+    stats = [x[1] for x in results] #from here on stats holds the per-worker logbooks, not the Statistics object
+    HOF_best = [x[2] for x in results]
+    #plt.plot([x['min'] for x in stats[0]])
+    results = best_inds
+    results = [[np.sort(x[0]),np.sort(x[1]),np.sort(x[2])] for x in results] #sort the ranks inside every chromosome
+    
+    resultsFit = [evalFit([x]) for x in results] #re-score each worker's winner; evalFit expects the chromosomes at index 0
+    maxIndex = np.argmax(resultsFit)
+    
+    bestIndividual = results[maxIndex]
+    
+    singletonTransed = [singletonLookup[item] for item in bestIndividual[0]] #ranks -> item numbers
+    median = singletonTransed[5] #sixth of the sorted singletons is split off as the 'median' item
+    medianUntransed = bestIndividual[0][5]
+    singletonTransed = np.delete(singletonTransed, 5).tolist()
+    homoTransed = [bundleLookup[item] for item in bestIndividual[1]]
+    heteroTransed = [bundleLookup2[item] for item in bestIndividual[2]]
+    
+    outputData = { 'singleton' : singletonTransed, 'homo' : homoTransed, 'hetero' : heteroTransed, 'median' : median }
+    outputData = json.dumps(outputData)
+    with open('jsonOut.txt', 'w') as outfile:
+        outfile.write(str(outputData))
+
+    extended = np.unique(np.hstack((np.ravel([bundleLookup[x] for x in bestIndividual[1]]), np.ravel([bundleLookup2[x] for x in bestIndividual[2]]), [singletonLookup[x] for x in bestIndividual[0]]))).tolist() #every distinct item number used by any selected option
+    homoTransed = [(x,x) for x in homoTransed] #as (item1, item2) tuples so getRank can look them up
+    extended= [(x,0) for x in extended] #single items are looked up with item2 == 0
+    outputDataFull  = extended+homoTransed+heteroTransed #median is in bestIndividual, so is included
+    outputDataFull=sorted(outputDataFull, key = getRank)
+    outputDataFull = [item[0] if item[1]==0 else item for item in outputDataFull] #single items back to bare item numbers
+    outputData = { 'options' : outputDataFull }
+    outputData = json.dumps(outputData)
+    with open('..\\BehavioralValueMeasurements\\jsonOutExtended.txt', 'w') as outfile:
+        outfile.write(str(outputData))
+    #outputDataFull=sorted(outputDataFull, key = getRank)
+    #outputDataFull=sorted(outputDataFull) 
+    #plt.hold(True)
+    #plt.title(csv_filepath)
+    #sns.set_context(rc={"figure.figsize": (8, 4)})
+    #plt.bar(np.asarray(bestIndividual[0]),np.ones((1,len(bestIndividual[0])))[0], color = 'blue')
+    #plt.bar(np.asarray(bestIndividual[1]),np.ones((1,len(bestIndividual[1])))[0], color = 'red')
+    #plt.bar(np.asarray(bestIndividual[2]),np.ones((1,len(bestIndividual[2])))[0], color = 'green')
+    #individual=[bestIndividual]
+    #similarityCost=np.sum(np.in1d([singletonLookup[k] for k in individual[0][0]],[ bundleLookup[k] for k in individual[0][1] ]))
+    #similarity2=np.sum([np.sum(c)>1 for c in [np.in1d(p,[singletonLookup[k] for k in individual[0][0]]) for p in [ bundleLookup2[w] for w in individual[0][2] ]]])
\ No newline at end of file
diff --git a/OptionSelect/graph.py b/OptionSelect/graph.py
new file mode 100644
index 0000000..4a257be
--- /dev/null
+++ b/OptionSelect/graph.py
@@ -0,0 +1,22 @@
+# -*- coding: utf-8 -*-
+"""
+Created on Thu Nov 05 18:42:47 2015
+
+@author: Calvin
+"""
+import numpy as np
+import pandas as pd
+from deap import base, creator, tools
+import matplotlib.pyplot as plt
+from scipy.stats import kstest, ks_2samp
+import random, operator, seaborn
+import multiprocessing as mp
+import json
+import os
+import seaborn as sns
+
+#NOTE(review): bestIndividual is not defined in this file - presumably run in a session where the GA script has finished
+sns.set_context(rc={"figure.figsize": (8, 4)}) #plt.hold(True) dropped: removed in matplotlib 3.0, overlaying is the default
+plt.bar(np.asarray(bestIndividual[0]),np.ones(len(bestIndividual[0])), color = 'blue')
+plt.bar(np.asarray(bestIndividual[1]),np.ones(len(bestIndividual[1])), color = 'red')
+plt.bar(np.asarray(bestIndividual[2]),np.ones(len(bestIndividual[2])), color = 'green')
diff --git a/OptionSelect/jsonOut.txt b/OptionSelect/jsonOut.txt
deleted file mode 100644
index 92b8e79..0000000
--- a/OptionSelect/jsonOut.txt
+++ /dev/null
@@ -1 +0,0 @@
-{"hetero": [[13, 24], [18, 26], [18, 30], [9, 16], [16, 30], [23, 21], [21, 26], [4, 8], [30, 21], [30, 12]], "singleton": [11, 18, 17, 16, 24, 13, 9, 26, 30, 21], "homo": [18, 24, 16, 23, 9, 26, 6, 4, 21, 5], "median": 23}
\ No newline at end of file
diff --git a/OptionSelect/jsonOutExtended.txt b/OptionSelect/jsonOutExtended.txt
deleted file mode 100644
index a3fbdab..0000000
--- a/OptionSelect/jsonOutExtended.txt
+++ /dev/null
@@ -1 +0,0 @@
-{"options": [[13, 24], [18, 18], [18, 26], [18, 30], 11, 18, [24, 24], 17, [9, 16], [13, 13], [16, 16], [23, 23], [8, 9], [16, 30], [10, 16], [9, 9], 16, 24, 23, 13, [23, 21], [21, 26], [26, 26], [8, 8], [4, 8], [6, 6], [4, 4], [30, 21], [30, 12], [21, 21], 9, 26, [5, 5], 30, 21]}
\ No newline at end of file
diff --git a/OptionSelect/options_to_edit.txt b/OptionSelect/options_to_edit.txt
new file mode 100644
index 0000000..e83e892
--- /dev/null
+++ b/OptionSelect/options_to_edit.txt
@@ -0,0 +1 @@
+9999
\ No newline at end of file
diff --git a/OptionSelect/rank9999.xls b/OptionSelect/rank9999.xls
new file mode 100644
index 0000000..4434331
Binary files /dev/null and b/OptionSelect/rank9999.xls differ
diff --git a/OptionSelect/stimulusSelection.py b/OptionSelect/stimulusSelection.py
deleted file mode 100644
index 88c7445..0000000
--- a/OptionSelect/stimulusSelection.py
+++ /dev/null
@@ -1,279 +0,0 @@
-# -*- coding: utf-8 -*-
-"""
-GA based stimulus selector
- 
-Created on Sat Feb 21 13:10:50 2015
-@author: Calvin Leather
-To do-
-Look into uniformity metric in evalFit()
-Explore different types of means
-"""
-#%%==========imports and constants=================%%#
-import numpy as np
-import pandas as pd
-from deap import base, creator, tools
-import matplotlib.pyplot as plt
-from scipy.stats import kstest, ks_2samp
-import random, operator, seaborn
-import multiprocessing as mp
-import json
-import os
-
-#os.chdir('C:\Users\Calvin\Documents\GitHub\Nypype_Workflows\MVPA')
-
-#%% Magic Numbers
-#nepochs-number of epochs, ngen-number of generations in an epoch
-#cxpb- probability of a cross over occuring in one chromosome of a mating pair
-#mutpb- probability of at each nucleotide of a mutation
-#number of individuals to put in HOF in each epoc
-nepochs, ngen, npop, cxpb, mutpb =2,50,1000, 0.1, 0.05
-    
-HOFsize=1
-
-HallOfFame=[]
-
-SID='a03'
-n_single=20 #1 number of possibilities for singleton
-n_hetero=15 #2 number of possibilities for the heterogenous bundle
-n_homo=22 #3 number of possibilities for the homogeneous scaling
-n_genome=n_single+n_hetero+n_homo #total number of possibilities for all cases
-n_target=10 #Desired number in each chromosome
-
-chromosomeDict={0:n_single, 1:n_hetero, 2:n_homo}
-
-#Define the seed for the random number generator for replication purposes
-random.seed(1)
-np.random.seed(1)
-
-#%%===========define fitness and functions=================%%#
-uni=np.random.uniform(0,60,500)
-
-def evalFit(individual): 
-    """ A weighted total of fitness scores to be maximized
-    RangeCost-maximum to minimum
-    SimilarityCost - number of items in both singleton and homogenous scaling
-    UniformCost- Uses KS divergence to indicate distance of distribution of values from uniform distribution
-    DistanceCost- Uses KS divergence to indicate differences between distributions
-    Cost currently is a simple weightable summation, might be changed to F score"""
-    indiv=genoToPheno(individual)
-    #####similarityCost=np.sum(np.in1d(individual[0][0],[ bundleLookup[k] for k in individual[0][1] ]))
-    similarityCost=np.sum(np.in1d([singletonLookup[k] for k in individual[0][0]],[ bundleLookup[k] for k in individual[0][1] ]))
-    similarity2=np.sum([np.sum(c)>1 for c in [np.in1d(p,[singletonLookup[k] for k in individual[0][0]]) for p in [ bundleLookup2[w] for w in individual[0][2] ]]])
-    #similarityCost=   np.sum([np.sum(c)>1 for c in [np.in1d(k,x) for k in y]])
-    #x is singelton, y is array of tuples of constituent items
-    ######similarity2=np.sum([np.sum(c)>1 for c in [np.in1d(p,individual[0][0]) for p in [ bundleLookup2[w] for w in individual[0][2] ]]])
-    rangeCost=(np.ptp(indiv[0])+np.ptp(indiv[1])+np.ptp(indiv[2]))/125
-    uniformCost=1/(kstest(indiv[0],'uniform')[0]+kstest(indiv[1],'uniform')[0]+kstest(indiv[2],'uniform')[0])
-    #uniformCost=(ks_2samp(indiv[0], uni)[1]+ks_2samp(indiv[1], uni)[1]+ks_2samp(indiv[2], uni)[1])    
-    distanceCost=(ks_2samp(indiv[0], indiv[1])[1]+ks_2samp(indiv[1], indiv[2])[1]+ks_2samp(indiv[2], indiv[0])[1])
-    cost=20*rangeCost+30*uniformCost+10*distanceCost+similarityCost+similarity2   
-    return (cost,)
-
-def getSims(individual):
-    similarityCost=np.sum(np.in1d([singletonLookup[k] for k in individual[0][0]],[ bundleLookup[k] for k in individual[0][1] ]))
-    similarity2=np.sum([np.sum(c)>1 for c in [np.in1d(p,[singletonLookup[k] for k in individual[0][0]]) for p in [ bundleLookup2[w] for w in individual[0][2] ]]])
-    print similarityCost
-    print similarity2
-    
-
-# Creates the initial generation      
-def createIndividual():
-    """Creates a random individual with 11 singleton, 10 het. bundle, 10 hom. scale"""    
-    return [random.sample(valueDictionary[1].keys(),n_target+1),
-               random.sample(valueDictionary[2].keys(),n_target),
-                random.sample(valueDictionary[3].keys(),n_target)]
-
-
-# Crossover algorithm          
-def nonReplicatingCross(ind1, ind2):
-    """Performs a crossover in-place"""
-    """Highly in need of new documentation"""
-    chromosomeNumber = random.randint(0,2)
-    indLength = len(ind1[chromosomeNumber])
-    cxpoint = random.randint(1,indLength-1)
-    child1 = np.zeros(indLength) #create a child array to use
-    child2 = np.zeros(indLength)
-    child1[0:cxpoint]=ind1[chromosomeNumber][0:cxpoint] #do the first half of the crossover
-    child2[0:cxpoint]=ind2[chromosomeNumber][0:cxpoint]
-    try:
-        child1[child1==0]=[x for x in ind2[chromosomeNumber] if x not in child1][0:len(child1[child1==0])]
-    except ValueError:
-        pass
-    if (child1[child1==0]!=[]) or (child1[child1==0]==[0]):
-        child1[child1==0]=random.sample([x for x in valueDictionary[chromosomeNumber+1].keys() if x not in child1], np.sum(np.where(child1==0, 1, 0)))
-    try:
-        child2[child2==0]=[x for x in ind1[chromosomeNumber] if x not in child2][0:len(child2[child2==0])]
-    except ValueError:
-        pass
-    if (child2[child2==0]!=[]) or (child2[child2==0]==[0]):
-        child2[child2==0]=random.sample([x for x in valueDictionary[chromosomeNumber+1].keys() if x not in child2], np.sum(np.where(child2==0, 1, 0)))
-    ind1[chromosomeNumber]=child1  #copy the child array onto the parent array (in place modification)
-    ind2[chromosomeNumber]=child2
-    
-    return ind1, ind2
-  
-#Mutation algorithm      
-def nonReplicatingMutate(ind,indpb):
-    """Mutates an individual in place"""
-    ind=np.asarray(ind) #copy indiviudal into numpy array
-    for chro in range(0,3):
-        for i in range(1,len(ind[chro])):
-                if random.random() < indpb: #for each nucleotide, use roulette to see if there is a mutation
-                            ind[chro][i]=(random.sample([x for x in valueDictionary[chro+1].keys() if x not in ind[chro]],1))[0]                                
-    return ind
-    del ind
-    
-#Maps genotype onto phenotype (item number onto value)    
-def genoToPheno(individual):
-    #print individual
-    indiv=[np.zeros(n_target+1), np.zeros(n_target), np.zeros(n_target)]
-    for chro in range(0,3):
-        for i in range(len(individual[0][chro])):
-            indiv[chro][i]=valueDictionary[chro+1][int(individual[0][chro][i])]
-    return indiv
-
-#stores top n individuals of an epoch in a list    
-def custHallOfFame(population,maxaddsize):
-    for i in tools.selBest(population, k=maxaddsize): 
-        HallOfFame.append(i)
-
-#checks for human error in value entry
-def inputErrorCheck(raw_data):
-    if not raw_data[['item1', 'item2']].applymap(np.isreal).all().all():
-        raise ValueError('Custom error, ask CL : Some item value is not a number')
-    for bundleType in range(1,4):
-        if raw_data[raw_data['type']==bundleType].duplicated(subset=['item1', 'item2']).any():
-            raise ValueError('Custom error, ask CL : Some item value is duplicated')
-    
-
-
-#%%===============initialize toolbox=======================%%#
-creator.create("FitnessMax", base.Fitness, weights=(1.0,))
-creator.create("Individual", list, typecode="d", fitness=creator.FitnessMax)
-
-stats = tools.Statistics(key=operator.attrgetter("fitness.values"))
-stats.register("max", np.max)
-stats.register("mean", np.mean)
-stats.register("min", np.min)
-
-toolbox = base.Toolbox()
-
-toolbox.register("HOF", custHallOfFame, maxaddsize=HOFsize)
-toolbox.register("create_individual", createIndividual)
-toolbox.register("individuals", tools.initRepeat, creator.Individual,
-                 toolbox.create_individual, n=1) 
-toolbox.register("population", tools.initRepeat, list, toolbox.individuals)
-
-toolbox.register("evaluate", evalFit)
-
-toolbox.register("mate", nonReplicatingCross)
-toolbox.register("mutate", nonReplicatingMutate, indpb=.1)
-toolbox.register("select", tools.selTournament, tournsize=2)
-
-
-#toolbox.register('map', futures.map)
-
-s= tools.Statistics()
-s.register("max", np.max)
-s.register("mean", np.mean)
-
-log=tools.Logbook()
-
-def main_program(pop):
-
-    fitnesses = toolbox.map(toolbox.evaluate, pop) # eval. fitness of pop
-    for ind, fit in zip(pop, fitnesses):
-        ind.fitness.values = fit
-    
-    for g in range(ngen):  
-        if g%5==0:
-            print str(g) + ' of ' + str(ngen)       
-        offspring = toolbox.select(pop, len(pop)) #select which individuals to mate
-        offspring = map(toolbox.clone, offspring)
-        
-        for child1, child2 in zip(offspring[::2], offspring[1::2]): #determine whether to have a cross over
-            if random.random() < cxpb:
-                child1[0], child2[0] = toolbox.mate(child1[0], child2[0])
-                del child1.fitness.values, child2.fitness.values
-    
-        for mutant in offspring: #determine whether to mutate
-            if random.random() < mutpb:
-                mutant[0]=toolbox.mutate(mutant[0])
-                del mutant.fitness.values      
-        
-        invalids = [ind for ind in offspring if not ind.fitness.valid] #assign fitness scores to new offspring
-        fitnesses = toolbox.map(toolbox.evaluate, invalids)
-        for ind, fit in zip(invalids, fitnesses):
-            ind.fitness.values = fit  
-        
-        log.record(gen=g,**stats.compile(pop))
-        pop[:] = offspring #update population with offspring    
-    return tools.selBest(pop,k=1)[0][0]
-
-#%%======================main==============================%%#
-if __name__ == '__main__':  
-    #%%==============import data from csv======================%%#
-    # Define the location of the csv file with modeled preferences, should make relative
-    # Three col CSV (Item-Code, Option-Type, Value)
-    SID = input('enter subject ID')    
-    csv_filepath='rank'+str(SID)+'.csv'
-
-    raw_choice_dataset = pd.read_csv(csv_filepath, sep=',', header=0)
-
-    valueDictionary={}
-    for x in range(1,4):
-      #Create a dictionary/hashtable associating the unique ID assigned to each singleton or bundle to its modeled value
-        placeholderValueDictionary={}
-        for rows in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==x].iterrows():
-            #rows[1][6]=rows[1][2] # change this once modeling is done
-            placeholderValueDictionary[int(rows[1]['rank'])] =float(rows[1]['rank'])
-        valueDictionary[x]=placeholderValueDictionary
-        
-    singletonLookup={}
-    for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==1].iterrows():
-        singletonLookup[int(x[1]['rank'])]=int(x[1]['item1'])
-
-    bundleLookup={}
-    for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==2].iterrows():
-     #create a dictionary/hastable that gives constituent item in homogeneous bundles
-        bundleLookup[int(x[1]['rank'])]=int(x[1]['item1'])
-        
-    bundleLookup2={}
-    for x in raw_choice_dataset[raw_choice_dataset['type'].astype(int)==3].iterrows():
-        bundleLookup2[int(x[1]['rank'])]=(int(x[1]['item1']),int(x[1]['item2']))
-
-
-    print 'GA algorithm starting with the following settings:'
-    print 'nepochs = ' + str(nepochs) + ' ngen = ' + str(ngen) + ' npop = ' + str(npop)
-    print 'cxpb = ' + str(cxpb) + ' mutpb = ' + str(mutpb)
-    answer = input('Are the following settings okay? (0/1)  ')
-    if answer == 0:
-        raise ValueError('Custom Error: Please change settings in script file')
-    
-    
-    print 'initializing processing pool'
-    return_var= []
-    processes = []
-    pool = mp.Pool(processes = 8)
-    pop_pool = [toolbox.population(n=npop) for x in range(8)]
-    results = pool.map(main_program,pop_pool)
-    pool.close()
-    print 'pool finished, outputing to JSON'    
-    
-    results = [[np.sort(x[0]),np.sort(x[1]),np.sort(x[2])] for x in results]
-    
-    resultsFit = [evalFit([x]) for x in results]
-    maxIndex = np.argmax(resultsFit)
-    
-    bestIndividual = results[maxIndex]
-    
-    singletonTransed = [singletonLookup[item] for item in bestIndividual[0]]
-    median = singletonTransed[5]
-    singletonTransed = np.delete(singletonTransed, 5).tolist()
-    homoTransed = [bundleLookup[item] for item in bestIndividual[1]]
-    heteroTransed = [bundleLookup2[item] for item in bestIndividual[2]]
-    
-    outputData = { 'singleton' : singletonTransed, 'homo' : homoTransed, 'hetero' : heteroTransed, 'median' : median }
-    outputData = json.dumps(outputData)
-    with open('jsonOut'+str(SID)+'.txt', 'w') as outfile:
-        outfile.write(str(outputData))
diff --git a/Procedure.txt b/Procedure.txt
new file mode 100644
index 0000000..a59173b
--- /dev/null
+++ b/Procedure.txt
@@ -0,0 +1 @@
+Change the SID stored in options_to_edit.txt to the correct subject ID.
\ No newline at end of file