Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
187 changes: 187 additions & 0 deletions basicParameterSweep.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,187 @@

#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License as
# published by the Free Software Foundation; either version 3, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; see the file COPYING. If not, write to
# the Free Software Foundation, Inc., 51 Franklin Street, Fifth
# Floor, Boston, MA 02110-1301, USA.
#
#

'''
*******************************************************************
* File: basicParameterSweep.py
* Description:
* Author: Upinder S. Bhalla
* E-mail: bhalla@ncbs.res.in
********************************************************************/

/**********************************************************************
** This program is part of 'FindSim', the
** Framework for Integrating Neuronal Data and SIgnaling Models
** copyright (C) 2003-2018 Upinder S. Bhalla. and NCBS
**********************************************************************/

This script does a basic parameter sweep on the model. It runs the findSim
program on all tsv files in the specified directory with modifications of
the selected parameters. It computes the mean score for each run and
presents the "best" (parameter, score) along with next-best flanking.
It can do this in parallel using Python's multiprocessing library.
'''

from __future__ import print_function
import numpy
import argparse
import os
import sys
import argparse
import findSim
from multiprocessing import Pool

# Multiplicative scale factors swept over each object.field parameter.
scaleFactors = [0.5, 0.6, 0.7, 0.8, 0.9, 0.95, 1, 1.05, 1.1, 1.2, 1.4, 1.6, 1.8, 2.0]

# Running count of completed worker jobs; bumped by reportReturn.
resultCount = 0

def reportReturn( result ):
    '''Pool.apply_async callback: emit one progress dot per finished job,
    and the running total after every 50th job.'''
    global resultCount
    sys.stdout.write( "." )
    sys.stdout.flush()
    resultCount += 1
    if not resultCount % 50:
        print( " {}".format( resultCount ) )

def enumerateFindSimFiles( location ):
    '''Return ( fnames, weights ) for the experiments found at *location*.

    If *location* is a directory, every ".tsv" file inside it is returned
    with weight 1.0.  If *location* is a file, each line is parsed as
    "<filename> <weight>"; blank lines, comment lines starting with '#',
    and lines with fewer than two fields are skipped.  Exits the program
    with an error message if *location* is neither.
    '''
    if os.path.isdir( location ):
        # os.path.join handles the presence/absence of a trailing slash.
        fnames = [ os.path.join( location, f )
                for f in os.listdir( location ) if f.endswith( ".tsv" ) ]
        return fnames, [1.0] * len( fnames )
    if os.path.isfile( location ):
        fnames = []
        weights = []
        with open( location, "r" ) as fp:
            for line in fp:
                fields = line.split()
                # Skip blanks, comments, and malformed (short) lines
                # instead of crashing on tuple unpacking.
                if len( fields ) < 2 or fields[0][0] == '#':
                    continue
                fnames.append( fields[0] )
                weights.append( float( fields[1] ) )
        return fnames, weights
    print( "Error: Unable to find file or directory at " + location )
    # sys.exit rather than quit(): quit() is a site-module convenience
    # that may be absent (e.g. under python -S).
    sys.exit( 1 )


def main():
    '''Parse command-line options, fan the parameter sweep out over a
    multiprocessing Pool of findSim runs, then collect and report scores.'''
    parser = argparse.ArgumentParser( description = 'Wrapper script to run a lot of FindSim evaluations in parallel.' )

    parser.add_argument( 'location', type = str, help='Required: Directory in which the scripts (in tsv format) are all located. OR: File in which each line is the filename of a scripts.tsv file, followed by weight to assign for that file.')
    parser.add_argument( '-n', '--numProcesses', type = int, help='Optional: Number of processes to spawn', default = 2 )
    parser.add_argument( '-m', '--model', type = str, help='Optional: Composite model definition file. First searched in directory "location", then in current directory.', default = "FindSim_compositeModel_1.g" )
    parser.add_argument( '-p', '--parameter_sweep', nargs='*', default=[], help='Does a parameter sweep in range 0.5-2x of each object.field pair.' )
    parser.add_argument( '-f', '--file', type = str, help='Optional: File name for output of parameter sweep', default = "" )
    args = parser.parse_args()
    location = args.location
    if location[-1] != '/':
        location += '/'
    # Search for the model file first inside 'location', then in the cwd.
    if os.path.isfile( location + args.model ):
        modelFile = location + args.model
    elif os.path.isfile( args.model ):
        modelFile = args.model
    else:
        print( "Error: Unable to find model file {}".format( args.model ) )
        quit()

    #fnames = [ (location + i) for i in os.listdir( args.location ) if i.endswith( ".tsv" )]
    fnames, weights = enumerateFindSimFiles( args.location )
    #print( fnames )
    #print( weights )
    pool = Pool( processes = args.numProcesses )
    #ret = findSim.innerMain(fnames[0], hidePlot=True)

    # Queue one async findSim run per (parameter, scale, experiment file).
    # reportReturn prints progress as each job completes.
    argDict = {}
    for i in args.parameter_sweep:
        print( "{}".format( i ) )
        scaleDict = {}
        # Each sweep entry must be an "object.field" pair.
        spl = i.split( '.' )
        assert( len(spl) == 2 )
        obj, field = spl
        for scale in scaleFactors:
            ret = []
            for k in fnames:
                ret.append( pool.apply_async( findSim.innerMain, (k,), dict(modelFile = modelFile, hidePlot=True, silent=True, scaleParam=[obj,field,str(scale)]), callback = reportReturn ) )
            scaleDict[scale] = ret
        argDict[i] = scaleDict

    # Block on every AsyncResult; .get() re-raises any worker exception.
    results = {}
    for i in argDict:
        scaleDict = argDict[i]
        temp = {}
        for j in scaleDict:
            temp[j] = [ k.get() for k in scaleDict[j] ]
        results[i] = temp
    print( "\n---------------- Completed ----------------- " )
    # Optionally dump per-scale scores to the file named by --file.
    dumpData = False
    fp = ""
    if len( args.file ) > 0:
        fp = open( args.file, "w" )
        dumpData = True
    for objfield in results:
        analyzeResults( fp, dumpData, objfield, results[objfield], weights )
    if dumpData:
        fp.close()

def analyzeResults( fp, dumpData, name, results, weights ):
    '''Summarize the sweep results for one object.field parameter.

    Arguments:
        fp: open output file, used only when dumpData is True.
        dumpData: if True, write the summary (and per-scale scores) to fp.
        name: the "object.field" label for this sweep.
        results: dict mapping scale factor -> list of per-experiment
            scores; a negative score marks a failed experiment.
        weights: per-experiment weights, parallel to each score list.

    Prints (and optionally writes) the best weighted-mean score, the scale
    at which it occurs, and Q = (worst - best) / |scale separation|.
    '''
    score = []
    scale = []
    numTotExpts = 0
    numGoodExpts = 0
    for res in results:
        assert( len( weights ) == len( results[res] ) )
        numTotExpts += len( results[res] )
        # Negative scores flag experiments that failed to run; drop them
        # and normalize by the weight of the surviving experiments only.
        goodRes = [ x * w for x, w in zip( results[res], weights ) if x >= 0.0 ]
        sumWts = sum( w for x, w in zip( results[res], weights ) if x >= 0.0 )
        numGoodExpts += len( goodRes )
        # Guard sumWts > 0 to avoid ZeroDivisionError when every
        # surviving experiment has weight zero.
        if len( goodRes ) > 0 and sumWts > 0.0:
            score.append( sum( goodRes ) / sumWts )
            scale.append( res )

    if len( score ) == 0:
        outputStr = "{}: score -1 at scale - with Q = 0 in 0/{} expts".format(name, numTotExpts )
        print( outputStr )
        if dumpData:
            # Bug fix: newline was missing here, unlike the normal path.
            fp.write( outputStr + '\n' )
        return
    bestScore = min( score )
    bestScoreIndex = score.index( bestScore )
    # We want best, the scale of the best, if it is an extrema, and Q
    # Q = slope = (max - min)/abs(scaleMax - scaleMin)
    if len( score ) == 1:
        Q = 0
    else:
        worstScore = max(score)
        worstScoreIndex = score.index( worstScore )
        Q = (worstScore - bestScore)/abs(scale[bestScoreIndex] - scale[worstScoreIndex])
    outputStr = "{}: score {:.3f} at scale {} with Q = {:.3f} in {}/{} expts".format(name, bestScore, scale[bestScoreIndex], Q, numGoodExpts, numTotExpts )
    print( outputStr )
    if dumpData:
        fp.write( outputStr + '\n' )
        for i, j in sorted( zip( scale, score ) ):
            fp.write( "{:.3f} {:.3f}\n".format( i, j ) )

# Run the 'main' if this script is executed standalone.
if __name__ == '__main__':
    main()
Loading