Timestamp: 12/08/20 08:45:53 (4 years ago)
Author: Mathieu Morlighem
Message: merged trunk-jpl and trunk for revision 25834
Location: issm/trunk
Files: 3 edited

  • issm/trunk

  • issm/trunk/src

  • issm/trunk/src/m/qmu/dakota_out_parse.py

    r24313 r25836  
    88from helpers import *
    99
    10 #Note: this may be re-written later to take advantage of Python's file i / o mechanics
    11 #    as it is written now it is often difficult to work with, but is analagous to
    12 #    the Matlab version of dakota_out_parse
     10# NOTE: May be rewritten later to take advantage of Python's file I/O
     11# mechanics. As it is written now, it is often difficult to work with, but is
 12# analogous to the MATLAB version of dakota_out_parse.
    1313
    1414
    1515def dakota_out_parse(filei):  # {{{
    16     '''
    17   read a Dakota .out or .dat output file and parse it.
    18 
    19   [method, dresp, scm, pcm, srcm, prcm] = dakota_out_parse(filei)
    20 
    21   where the required input is:
    22     filei         (character, name of .out file)
    23 
    24   the required output is:
    25     method        (character, dakota method name)
    26     dresp         (structure array, responses)
    27 
    28   and the optional output is:
    29     scm           (double array, simple correlation matrix)
    30     pcm           (double array, partial correlation matrix)
    31     srcm          (double array, simple rank correlation matrix)
    32     prcm          (double array, partial rank correlation matrix)
    33 
    34   the filei will be prompted if empty.  the fields of dresp
    35   are particular to the data contained within the file.  the
    36   scm, pcm, srcm, and prcm are output by dakota only for the
    37   sampling methods.
    38 
    39   this function reads a dakota .out output file and parses it
    40   into the matlab workspace.  it operates in a content - driven
    41   fashion, where it skips the intermediate data and then parses
    42   whatever output data it encounters in the order in which it
    43   exists in the file, rather than searching for data based on
    44   the particular method.  (this makes it independent of method.)
    45   it also can read and parse the .dat tabular_output file.
    46 
    47   this data would typically be used for plotting and other
    48   post - processing within matlab or excel.
    49 '''
     16    """DAKOTA_OUT_PARSE - read a Dakota .out or .dat output file and parse it.
     17
     18    Usage:
     19        [method, dresp, scm, pcm, srcm, prcm] = dakota_out_parse(filei)
     20
     21    where the required input is,
     22        filei         (character, name of .out file)
     23
     24    the required output is,
     25        method        (character, Dakota method name)
     26        dresp         (structure array, responses)
     27
     28    and the optional output is,
     29        scm           (double array, simple correlation matrix)
     30        pcm           (double array, partial correlation matrix)
     31        srcm          (double array, simple rank correlation matrix)
     32        prcm          (double array, partial rank correlation matrix)
     33
     34    The filei will be prompted for if empty. The fields of dresp are particular
     35    to the data contained within the file. The scm, pcm, srcm, and prcm are
     36    output by Dakota only for the sampling methods.
     37
     38    This function reads a Dakota .out output file and parses it into the Python
     39    runtime. It operates in a content-driven fashion, where it skips the
     40    intermediate data and then parses whatever output data it encounters in the
     41    order in which it exists in the file, rather than searching for data based
     42    on the particular method (this makes it independent of method). It also can
     43    read and parse the .dat tabular_output file.
     44
     45    This data would typically be used for plotting and other postprocessing
     46    within MATLAB or Excel.
     47
     48    TODO:
     49    - Figure out why output from Dakota is different under MATLAB and Python
     50    (is it the input file that we write?)
     51
     52    "Copyright 2009, by the California Institute of Technology. ALL RIGHTS
     53    RESERVED. United States Government Sponsorship acknowledged. Any commercial
     54    use must be negotiated with the Office of Technology Transfer at the
     55    California Institute of Technology. (NTR 47078)
     56
     57    This software may be subject to U.S. export control laws. By accepting this
     58    software, the user agrees to comply with all applicable U.S. export laws
     59    and regulations. User has the responsibility to obtain export licenses, or
     60    other export authority as may be required before exporting such information
     61    to foreign countries or providing access to foreign persons."
     62    """
     63
    5064    if filei is None:
    5165        help(dakota_out_parse)
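
As a quick orientation for the rewritten docstring above, here is a minimal usage sketch. The import path and the file name 'dakota_sampling.out' are illustrative assumptions, not taken from the changeset:

    from dakota_out_parse import dakota_out_parse  # assumed import path

    # Parse a Dakota .out file; scm/pcm/srcm/prcm are populated only for sampling methods
    [method, dresp, scm, pcm, srcm, prcm] = dakota_out_parse('dakota_sampling.out')  # hypothetical file name
    print(method)               # Dakota method name reported in the .out file
    print(dresp[0].descriptor)  # descriptor of the first response structure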
     
    5367
    5468    if not isfile(filei) or getsize(filei) == 0:
    55         filei = str(eval(input('Input file?  ')))
     69        filei = str(eval(input('Input file? ')))
    5670
    5771    #fidi = fopen(sprintf('%s', filei), 'r')
     
    6276        fline = fidi.readline()
    6377        if getsize(filei) == 0 or fline == '':
    64             raise RuntimeError('File ' + filei + ' is empty.')
    65 
    66         dresp = []  # of struct()
     78            raise RuntimeError('File ' + filei + ' is empty')
     79
     80        dresp = [] # of struct()
    6781        scm = struct()
    6882        pcm = struct()
     
    7791            fidi.seek(0, 0)
    7892
    79     # loop through the file to find the Dakota method name
     93        # loop through the file to find the Dakota method name
    8094        fline = findline(fidi, 'method', True)
    8195        if fline is None:
     
    87101                [ntokens, tokens] = fltokens(fline)
    88102                method = tokens[0].strip()
    89                 print('Dakota method =\'' + method + '\'.')
     103                print('Dakota method = \'' + method + '\'')
    90104            elif fline[6] in ['N', 'n']:
    91105                fline = findline(fidi, 'methodName = ')
    92106                [ntokens, tokens] = fltokens(fline)
    93107                method = tokens[2].strip()
    94                 print('Dakota methodName = "' + method + '".')
    95 
    96     # loop through the file to find the function evaluation summary
     108                print('Dakota methodName = \'' + method + '\'')
     109
     110        # loop through the file to find the function evaluation summary
    97111        counter = 0
    98112        fline = ''
    99113        nfeval = nfeval_read(fidi, fline)
    100114
    101         #  process each results section based on content of the file
     115        # process each results section based on content of the file
    102116        while counter < 10:
    103             # because python makes file i / o difficult
     117            # because python makes file I/O difficult
    104118            # if we see 10 + blank lines in a row then we have reached EOF
    105119            # (tests show actual maximum number of blank lines is around 5)
     
    108122            else:
    109123                counter = 0
    110     #    ipos = ftell(fidi)
     124            # ipos = ftell(fidi)
    111125            fline = fidi.readline()
    112126            if fline == '' or fline.isspace():
     
    147161                'Unexpected line: ' + str(fline)
    148162
    149     #    fidi.seek(ipos, 0)
    150 
    151     #  loop through the file to verify the end
     163            # fidi.seek(ipos, 0)
     164
     165    # loop through the file to verify the end
    152166
    153167    # fline = findline(fidi, '<<<<< Single Method Strategy completed')
     
    155169    #     return
    156170    #
    157         print('End of file successfully reached.')
     171        print('End of file successfully reached')
    158172    #close(fidi)
    159173    #except Exception as err:
    160174    #print "ERROR in dakota_out_parse: " + err
    161175    #raise err
    162     #raise RuntimeError(filei + ' could not be opened.')
     176    #raise RuntimeError(filei + ' could not be opened')
    163177
    164178    return [method, dresp, scm, pcm, srcm, prcm]
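
As its comments explain, the main loop of dakota_out_parse (shown in the hunks above) detects end of file by counting consecutive blank reads rather than testing for EOF directly. The following is a simplified sketch of that pattern, with a hypothetical function name, not the verbatim loop body:

    def skip_through_sections(fidi):
        """Sketch of the blank-line EOF heuristic; `fidi` is an open text file handle."""
        counter = 0
        while counter < 10:        # ten consecutive blank reads are treated as end of file
            fline = fidi.readline()
            if fline == '' or fline.isspace():
                counter += 1
                continue
            counter = 0            # any real content resets the blank-line counter
            # ... dispatch on the contents of fline to the appropriate section parser ...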
     
    167181
    168182def dak_tab_out(fidi, fline):  # {{{
    169     #  function to parse the dakota tabular output file
    170 
    171     print('Reading Dakota tabular output file.')
    172 
    173     #  process column headings of matrix (skipping eval_id)
     183    """DAK_TAB_OUT - function to parse the Dakota tabular output file
     184    """
     185
     186    print('Reading Dakota tabular output file')
     187
     188    # Process column headings of matrix (skipping eval_id)
    174189    [ntokens, tokens] = fltokens(fline)
    175190
    176     # New file DAKOTA versions > 6
    177     if strncmpi(fline, '%eval_id interface', 18):
     191    if strncmpi(fline, '%eval_id interface', 18): # Dakota versions >= 6
    178192        offset = 2
    179     else:  #DAKOTA versions < 6
     193    else:  # Dakota versions < 6
    180194        offset = 1
    181195
    182     desc = [['' for i in range(ntokens - offset)]]
     196    desc = ['' for i in range(ntokens - offset)]
    183197    data = np.zeros((1, ntokens - offset))
    184198
    185199    for i in range(ntokens - offset):
    186         desc[0][i] = str(tokens[i + offset])
    187 
    188     print("Number of columns (Dakota V + R)=" + str(ntokens - 2) + '.')
    189 
    190     #  process rows of matrix
     200        desc[i] = str(tokens[i + offset])
     201
     202    print('Number of columns (Dakota V + R) = {}'.format(ntokens - 2))
     203
     204    # Process rows of matrix
    191205    nrow = 0
    192206    while True:
    193 
    194207        fline = fidi.readline()
    195208
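
For reference, the header test in dak_tab_out above distinguishes the two tabular formats by the presence of the extra 'interface' column. The sketch below shows the column-offset logic with an illustrative header line, not one taken from an actual Dakota run:

    # Dakota >= 6 writes '%eval_id interface x1 ... response_fn_1' (offset = 2);
    # older versions write '%eval_id x1 ... response_fn_1' (offset = 1).
    header = '%eval_id interface x1 x2 response_fn_1'  # illustrative header line
    tokens = header.split()
    offset = 2 if header.lower().startswith('%eval_id interface') else 1
    desc = tokens[offset:]  # variable and response descriptors; bookkeeping columns skipped
    print(desc)             # ['x1', 'x2', 'response_fn_1']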
     
    202215        [ntokens, tokens] = fltokens(fline)
    203216
    204     #  add row values to matrix (skipping eval_id)
    205 
     217        # Add row values to matrix (skipping eval_id)
    206218        for i in range(ntokens - offset):
    207219            data[nrow, i] = tokens[i + offset]
     
    209221        nrow = nrow + 1
    210222
    211     print('Number of rows (Dakota func evals) = ' + str(nrow) + '.')
    212 
    213     #  calculate statistics
    214 
    215     #  since normfit doesn't have a dim argument, and matlab isvector is True
    216     #  for a 1xn matrix, handle the case of one row explicitly
    217 
    218     #  Update: normfit_issm.py does handle this case
     223    print('Number of rows (Dakota func evals) = ' + str(nrow))
     224
     225    # Calculate statistics
    219226    if (np.size(data, 0) > 1):
    220         #dmean  =mean   (data)
    221         #dstddev = std    (data, 0)
     227        #dmean = mean(data)
     228        #dstddev = std(data, 0)
    222229        [dmean, dstddev, dmeanci, dstddevci] = normfit_issm(data, 0.05)
    223230    else:
     
    229236            [dmean[0, i], dstddev[0, i], dmeanci[:, i], dstddevci[:, i]] = normfit_issm(data[:, i], 0.05)
    230237
    231     dmin = data.min(0)
     238    dmin = data.min(axis=0)
    232239    dquart1 = prctile_issm(data, 25, 0)
    233     dmedian = np.median(data, 0)
     240    dmedian = np.median(data, axis=0)
    234241    dquart3 = prctile_issm(data, 75, 0)
    235     dmax = data.max(0)
     242    dmax = data.max(axis=0)
    236243    dmin95 = prctile_issm(data, 5, 0)
    237244    dmax95 = prctile_issm(data, 95, 0)
    238245
    239     # Note: the following line may cause the following warning
    240     #    (should not crash or invalidate results) when one of
    241     #    the inputs does not change with respect to the
    242     #    other / s causing an internal divide-by - zero error
    243 
    244     # / usr / local / lib / python2.7 / dist - packages / numpy / lib / function_base.py:3163:
    245     #    RuntimeWarning: invalid value encountered in true_divide
    246     #    c / = stddev[:, None]
    247 
    248     #    (and / or the same but with "c / = stddev[None, :]")
    249 
     246    # NOTE: The following line may cause the following warning (should not
     247    # crash or invalidate results) when one of the inputs does not change with
     248    # respect to the other(s), causing an internal divide-by-zero error,
     249    #
     250    #       /usr/local/lib/python2.7/dist-packages/numpy/lib/function_base.py:3163:
     251    #       RuntimeWarning: invalid value encountered in true_divide
     252    #       c /= stddev[:, None]
     253    #
     254    # (and/or the same but with "c /= stddev[None, :]")
     255
     256    # Equivalent to Dakota scm, MATLAB corrcoef, and Excel correl
    250257    dcorrel = np.corrcoef(data.T)
    251258
    252     #  divide the data into structures for consistency
     259    # Divide the data into structures for consistency
    253260    dresp = []
    254 
    255261    for i in range(len(desc)):
    256262        dresp.append(struct())
    257         dresp[i].descriptor = str(desc[i])
     263        dresp[i].descriptor = desc[i]
    258264        dresp[i].sample = data[:, i]
    259265        dresp[i].mean = dmean[i]
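
The RuntimeWarning described in the NOTE above can be reproduced with a column that never changes; a minimal sketch with illustrative sample values:

    import numpy as np

    data = np.array([[1.0, 2.0],
                     [1.0, 3.0],
                     [1.0, 4.0]])  # first column is constant, so its standard deviation is zero
    dcorrel = np.corrcoef(data.T)  # emits the RuntimeWarning quoted in the NOTE
    print(dcorrel)                 # entries involving the constant column are nan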
     
    294300    [ntokens, tokens] = fltokens(fline)
    295301    nfeval = tokens[4]
    296     print('  Dakota function evaluations = ' + str(int(nfeval)) + '.')
     302    print('  Dakota function evaluations = ' + str(int(nfeval)))
    297303
    298304    return nfeval
     
    309315    [ntokens, tokens] = fltokens(fline)
    310316    nsamp = tokens[3]
    311     print('  Dakota samples = ' + str(int(nsamp)) + '.')
     317    print('  Dakota samples = ' + str(int(nsamp)))
    312318
    313319    return nsamp
     
    340346        dresp[-1].coefvar = tokens[12]
    341347
    342     print('  Number of Dakota response functions = ' + str(len(dresp)) + '.')
     348    print('  Number of Dakota response functions = ' + str(len(dresp)))
    343349
    344350    return dresp
     
    350356
    351357    if fline is None or fline == '' or fline.isspace():
    352         fline = findline(fidi, 'Moment - based statistics for each response function')
     358        fline = findline(fidi, 'Moment-based statistics for each response function')
    353359        return
    354360
    355     print('Reading moment - based statistics for response functions:')
     361    print('Reading moment-based statistics for response functions:')
    356362
    357363    #  skip column headings of moment - based statistics
     
    376382        dresp[-1].kurtosis = tokens[4]
    377383
    378     print('  Number of Dakota response functions = ' + str(len(dresp)) + '.')
     384    print('  Number of Dakota response functions = ' + str(len(dresp)))
    379385
    380386    return dresp
     
    433439            dresp[i].stddevci[1, 0] = tokens[4]
    434440
    435     print('  Number of Dakota response functions = ' + str(len(dresp)) + '.')
     441    print('  Number of Dakota response functions = ' + str(len(dresp)))
    436442
    437443    return dresp
     
    495501                fline = fidi.readline()
    496502
    497     print('  Number of Dakota response functions = ' + str(len(dresp)) + '.')
     503    print('  Number of Dakota response functions = ' + str(len(dresp)))
    498504
    499505    return dresp
     
    550556                fline = fidi.readline()
    551557
    552     print('  Number of Dakota response functions = ' + str(len(dresp)) + '.')
     558    print('  Number of Dakota response functions = ' + str(len(dresp)))
    553559
    554560    return dresp
     
    565571            return
    566572
    567     print('Reading ' + fline + '.')
     573    print('Reading ' + fline)
    568574
    569575    cmat.title = fline
     
    657663        #  if importance factors missing, skip to cdf
    658664        if not idvar:
    659             print('    Importance Factors not available.')
     665            print('    Importance Factors not available')
    660666            dresp[-1].var = []
    661667            dresp[-1].impfac = []
     
    716722        #  if cdf missing, skip to end of response function
    717723        if not icdf:
    718             print('    Cumulative Distribution Function not available.')
     724            print('    Cumulative Distribution Function not available')
    719725            dresp[ndresp].cdf = []
    720726            while (fline != '' and not fline.isspace()) and not strncmpi(fline, 'MV Statistics for ', 18) and not strncmp(fline, ' - ', 1):
    721727                fline = fidi.readline()
    722728
    723     print('  Number of Dakota response functions = ' + str(len(dresp)) + '.')
     729    print('  Number of Dakota response functions = ' + str(len(dresp)))
    724730
    725731    return dresp
     
    845851        dresp[-1].vum = []
    846852
    847     print('Reading measures for volumetric uniformity.')
     853    print('Reading measures for volumetric uniformity')
    848854    fline = fidi.readline()
    849855    fline = fidi.readline()
     
    881887    [ntokens, tokens] = fltokens(fline)
    882888    method = tokens[2]
    883     print('Dakota iterator \'' + str(method) + '\' completed.')
     889    print('Dakota iterator \'' + str(method) + '\' completed')
    884890
    885891    return method
     
    905911
    906912    #  issue warning and reset file position
    907     print('Warning: findline:str_not_found: String ' + str(string) + ' not found in file.')
     913    print('Warning: findline:str_not_found: String ' + str(string) + ' not found in file')
    908914    fidi.seek(ipos, 0)
    909915    return None
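
The fragment above is the tail of the findline helper used throughout this module. A hedged sketch of the contract it appears to implement follows; the real helper also takes an extra flag (visible in the call findline(fidi, 'method', True)) whose meaning is not shown in this changeset, so it is omitted here:

    def findline(fidi, string):
        """Sketch only: scan forward for a line containing `string`; on failure,
        warn, restore the original file position, and return None."""
        ipos = fidi.tell()
        while True:
            fline = fidi.readline()
            if fline == '':  # physical end of file reached without a match
                break
            if string in fline:
                return fline
        print('Warning: findline:str_not_found: String ' + str(string) + ' not found in file')
        fidi.seek(ipos, 0)
        return None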