casa / casa5 / 8d3ac223f77

Commits

Federico Montesino Pouzols authored 8d3ac223f77 11 Feb 2019

Python 3 compat and imports for Python 2/3 - CASA 5/6, CAS-12282

gcwrap/python/scripts/partitionhelper.py

Modified

-1
+import os
-2
+import sys
-3
+import shutil
-4
+import pprint as pp
-5
+import traceback
-6
+import time
--
+import commands
-7
+import numpy as np
--
+import matplotlib.pyplot as plt
--
+from __main__ import *
--
+from taskinit import *
-+
+from matplotlib import pyplot as plt
-+
-+
+try:
-+
+    # CASA 6
-+
+    from casatasks import casalog
-+
+    from casatools.platform import bytes2str
-+
+    from casatools import table, ms, msmetadata
-+
-+
+    import subprocess
-+
+    use_old_casa5_commands = False
-+
+except ImportError:
-+
+    # CASA 5
-+
+    from __main__ import *
-+
+    from taskinit import *
-+
-+
+    import commands
-+
+    use_old_casa5_commands = True
-25
-26
-27
+class convertToMMS():
-28
+    def __init__(self,\
-29
+                 inpdir=None, \
-30
+                 mmsdir=None, \
-31
+                 axis='auto', \
-32
+                 numsubms=4,
-33
+#                 createmslink=False, \
-34
+                 cleanup=False):
-117
+                sys.exit(2)
-118
-119
+            # Verify later if this is still needed
-120
+            time.sleep(10)
-121
-122
+            casalog.origin('convertToMMS')
-123
+            casalog.post('--------------- Successfully created MMS -----------------')
-124
-125
-126
+        # Copy non-MS files to MMS directory
--
+        for ff in nonmslist:
--
+            bfile = os.path.basename(ff)
-+
+        for nfile in nonmslist:
-+
+            bfile = os.path.basename(nfile)
-129
+            lfile = os.path.join(self.mmsdir, bfile)
-130
+            casalog.post('Copying non-MS file '+bfile)
-131
+#            os.symlink(file, lfile)
--
+#            shutil.copytree(ff, lfile, symlinks=False)
--
+            os.system("cp -RL "+ff+" "+lfile)
-+
+#            shutil.copytree(nfile, lfile, symlinks=False)
-+
+            os.system("cp -RL {0} {1}".format(nfile, lfile))
-134
-135
-136
+    def getMSlist(self, files):
-137
+        '''Get a list of MSs from a directory.
-138
+           files -> a tuple that is returned by the following call:
-139
+           files = os.walk(self.inpdir,followlinks=True).next()
-140
-141
+           It will test if a directory is an MS and will only return
-142
+           true MSs, that have Type:Measurement Set in table.info. It will skip
-143
+           directories that start with . and those that do not end with
-150
+        # Loop through list of directories
-151
+        for d in files[1]:
-152
+            # Skip . entries
-153
+            if d.startswith('.'):
-154
+                continue
-155
-156
+#            if not d.endswith('.ms'):
-157
+#                continue
-158
-159
+            # Full path for directory
--
+            dir = os.path.join(topdir,d)
-+
+            mydir = os.path.join(topdir,d)
-161
-162
+            # It is probably an MS
--
+            if self.isItMS(dir) == 1:
--
+                mslist.append(dir)
-+
+            if self.isItMS(mydir) == 1:
-+
+                mslist.append(mydir)
-165
-166
+        return mslist
-167
-168
+    def isItMS(self, mydir):
-169
+        '''Check the type of a directory.
-170
+           mydir  --> full path of a directory.
-171
+                Returns 1 for an MS, 2 for a cal table and 3 for a MMS.
-172
+                If 0 is returned, it means any other type or an error.'''
-173
-174
+        ret = 0
-175
-176
+        # Listing of this directory
-177
+        ldir = os.listdir(mydir)
-178
-179
+        if not ldir.__contains__('table.info'):
-180
+            return ret
-181
-182
+        cmd1 = 'grep Type '+mydir+'/table.info'
--
+        mytype = commands.getoutput(cmd1)
-183
+        cmd2 = 'grep SubType '+mydir+'/table.info'
--
+        stype = commands.getoutput(cmd2)
--
-+
+        if use_old_casa5_commands:
-+
+            mytype = commands.getoutput(cmd1)
-+
+            stype = commands.getoutput(cmd2)
-+
+        else:
-+
+            mytype = bytes2str(subprocess.check_output(cmd1)).rstrip("\n")
-+
+            stype = bytes2str(subprocess.check_output(cmd2)).rstrip("\n")
-+
-191
+        # It is a cal table
-192
+        if mytype.__contains__('Calibration'):
-193
+            ret = 2
-194
-195
+        elif mytype.__contains__('Measurement'):
-196
+            # It is a Multi-MS
-197
+            if stype.__contains__('CONCATENATED'):
-198
+                # Further check
-199
+                if ldir.__contains__('SUBMSS'):
-200
+                    ret = 3
-250
-251
-252
+    def runPartition(self, ms, mmsdir, axis, subms):
-253
+        '''Run partition with default values to create an MMS.
-254
+           ms         --> full pathname of the MS
-255
+           mmsdir     --> directory to save the MMS to
-256
+           axis      --> separationaxis to use (spw, scan, auto)
-257
+           subms  --> number of subMss to create
-258
-259
+        '''
--
+        from tasks import partition
--
+        from __main__ import default
-+
+        try:
-+
+            # CASA 6
-+
+            from casatasks import partition
-+
+        except ImportError:
-+
+            # CASA 5
-+
+            from tasks import partition
-266
-267
+        if not os.path.lexists(ms):
-268
+            return False
-269
-270
+        # Create MMS name
-271
+#        bname = os.path.basename(ms)
-272
+#        if bname.endswith('.ms'):
-273
+#            mmsname = bname.replace('.ms','.mms')
-274
+#        else:
-275
+#            mmsname = bname+'.mms'
-289
+#            return False
-290
-291
+        # Check for remainings of corrupted mms
-292
+#        corrupted = mms.replace('.mms','.data')
-293
+        corrupted = MMSFullName + '.data'
-294
+        if os.path.exists(corrupted):
-295
+            casalog.post('Cleaning up left overs','WARN')
-296
+            shutil.rmtree(corrupted)
-297
-298
+        # Run partition
--
+        default('partition')
-299
+        partition(vis=ms, outputvis=MMSFullName, createmms=True, datacolumn='all', flagbackup=False,
-300
+                  separationaxis=axis, numsubms=subms)
-301
+        casalog.origin('convertToMMS')
-302
-303
+        # Check if MMS was created
-304
+        if not os.path.exists(MMSFullName):
-305
+            casalog.post('Cannot create MMS ->'+MMSFullName, 'ERROR')
-306
+            return False
-307
-308
+        # If requested, create a link to this MMS with the original MS name
-312
+#            mmsname = os.path.basename(mms)
-313
+##            lms = mmsname.replace('.mms', '.ms')
-314
+#            casalog.post('Creating symbolic link to MMS')
-315
+##            os.symlink(mmsname, lms)
-316
+#            os.symlink(mmsname, bname)
-317
+#            os.chdir(here)
-318
-319
+        return True
-320
-321
+    def usage(self):
--
+        print '========================================================================='
--
+        print '          convertToMMS will create a directory with multi-MSs.'
--
+        print 'Usage:\n'
--
+        print '  import partitionhelper as ph'
--
+        print '  ph.convertToMMS(inpdir=\'dir\') \n'
--
+        print 'Options:'
--
+        print '   inpdir <dir>        directory with input MS.'
--
+        print '   mmsdir <dir>        directory to save output MMS. If not given, it will save '
--
+        print '                       the MMS in a directory called mmsdir in the current directory.'
--
+        print "   axis='auto'         separationaxis parameter of partition (spw,scan,auto)."
--
+        print "   numsubms=4         number of subMSs to create in output MMS"
--
+        print '   cleanup=False       if True it will remove the output directory before starting.\n'
-+
+        print('=========================================================================')
-+
+        print('          convertToMMS will create a directory with multi-MSs.')
-+
+        print('Usage:\n')
-+
+        print('  import partitionhelper as ph')
-+
+        print('  ph.convertToMMS(inpdir=\'dir\') \n')
-+
+        print('Options:')
-+
+        print('   inpdir <dir>        directory with input MS.')
-+
+        print('   mmsdir <dir>        directory to save output MMS. If not given, it will save ')
-+
+        print('                       the MMS in a directory called mmsdir in the current directory.')
-+
+        print("   axis='auto'         separationaxis parameter of partition (spw,scan,auto).")
-+
+        print("   numsubms=4         number of subMSs to create in output MMS")
-+
+        print('   cleanup=False       if True it will remove the output directory before starting.\n')
-334
--
+        print ' NOTE: this script will run using the default values of partition. It will try to '
--
+        print ' create an MMS for every MS in the input directory. It will skip non-MS directories '
--
+        print ' such as cal tables. If partition succeeds, the script will create a link to every '
--
+        print ' other directory or file in the output directory. '
--
+        print ' The script will not walk through sub-directories of inpdir. It will also skip '
--
+        print ' files or directories that start with a .'
--
+        print '=========================================================================='
-+
+        print(' NOTE: this script will run using the default values of partition. It will try to ')
-+
+        print(' create an MMS for every MS in the input directory. It will skip non-MS directories ')
-+
+        print(' such as cal tables. If partition succeeds, the script will create a link to every ')
-+
+        print(' other directory or file in the output directory. ')
-+
+        print(' The script will not walk through sub-directories of inpdir. It will also skip ')
-+
+        print(' files or directories that start with a .')
-+
+        print('==========================================================================')
-342
+        return
-343
-344
+#
-345
+# -------------- HELPER functions for dealing with an MMS --------------
-346
+#
-347
+#    getMMSScans        'Get the list of scans of an MMS dictionary'
-348
+#    getScanList        'Get the list of scans of an MS or MMS'
-349
+#    getScanNrows       'Get the number of rows of a scan in a MS. It will add the
-350
+#                         nrows of all sub-scans.'
-351
+#    getMMSScanNrows    'Get the number of rows of a scan in an MMS dictionary.'
-356
-357
+# def getNumberOf(msfile, item='row'):
-358
+#     '''Using the msmd tool, it gets the number of
-359
+#        scan, spw, antenna, baseline, field, state,
-360
+#        channel, row in a MS or MMS'''
-361
+#
-362
+#     md = msmdtool()
-363
+#     try:
-364
+#         md.open(msfile)
-365
+#     except:
--
+#         print 'Cannot open the msfile'
-+
+#         print('Cannot open the msfile')
-367
+#         return 0
-368
+#
-369
+#     if item == 'row':
-370
+#         numof = md.nrows()
-371
+#     elif item == 'scan':
-372
+#         numof = md.nscans()
-373
+#     elif item == 'spw':
-374
+#         numof = md.nspw()
-375
+#     elif item == 'antenna':
-376
+#         numof = md.nantennas()
-391
-392
+# NOTE
-393
+# There is a bug in ms.getscansummary() that does not give the scans for all
-394
+# observation Ids, but only for the last one. See CAS-4409
-395
+def getMMSScans(mmsdict):
-396
+    '''Get the list of scans of an MMS dictionary.
-397
+       mmsdict  --> output dictionary from listpartition(MMS,createdict=true)
-398
+       Return a list of the scans in this MMS. '''
-399
-400
+    if not isinstance(mmsdict, dict):
--
+        print 'ERROR: Input is not a dictionary'
-+
+        print('ERROR: Input is not a dictionary')
-402
+        return []
-403
-404
+    tkeys = mmsdict.keys()
-405
+    scanlist = []
-406
+    slist = set(scanlist)
-407
+    for k in tkeys:
-408
+        skeys = mmsdict[k]['scanId'].keys()
-409
+        for j in skeys:
-410
+            slist.add(j)
-411
-451
+    '''
-452
+    msTool=mstool()
-453
+    msTool.open(msfile)
-454
+    if isinstance(selection, dict) and selection != {}:
-455
+        msTool.msselect(items=selection)
-456
-457
+    scand = msTool.getscansummary()
-458
+    msTool.close()
-459
-460
+    Nrows = 0
--
+    if not scand.has_key(str(myscan)):
-+
+    if not str(myscan) in scand:
-462
+        return Nrows
-463
-464
+    subscans = scand[str(myscan)]
-465
+    for ii in subscans.keys():
-466
+        Nrows += scand[str(myscan)][ii]['nRow']
-467
-468
+    return Nrows
-469
-470
-471
def getMMSScanNrows(thisdict, myscan):
    '''Get the number of rows of a scan in an MMS dictionary.
       thisdict  --> output dictionary from listpartition(MMS,createdict=true)
       myscan    --> scan ID (int)
       Return the number of rows in the given scan, summed over every
       sub-MS entry of the dictionary. Returns 0 if no entry contains
       the scan and -1 if thisdict is not a dictionary. '''

    if not isinstance(thisdict, dict):
        print('ERROR: Input is not a dictionary')
        return -1

    scanrows = 0
    # Only the per-sub-MS records are needed, not their keys
    for subms in thisdict.values():
        scans = subms['scanId']
        # 'in' replaces dict.has_key(), which no longer exists in Python 3
        if myscan in scans:
            scanrows += scans[myscan]['nrows']

    return scanrows
-488
-489
-490
+def getSpwIds(msfile, myscan, selection={}):
-491
+    '''Get the Spw IDs of a scan.
-492
+       msfile     --> name of the MS or MMS
-493
+       myscan     --> scan Id (int)
-494
+       selection  --> dictionary with data selection
-501
+    msTool=mstool()
-502
+    msTool.open(msfile)
-503
+    if isinstance(selection, dict) and selection != {}:
-504
+        msTool.msselect(items=selection)
-505
-506
+    scand = msTool.getscansummary()
-507
+    msTool.close()
-508
-509
+    spwlist = []
-510
--
+    if not scand.has_key(str(myscan)):
-+
+    if not str(myscan) in scand:
-512
+        return spwlist
-513
-514
+    subscans = scand[str(myscan)]
-515
+    aspws = np.array([],dtype=int)
-516
-517
+    for ii in subscans.keys():
-518
+        sscanid = ii
-519
+        spwids = scand[str(myscan)][sscanid]['SpwIds']
-520
+        aspws = np.append(aspws,spwids)
-521
-569
+    for subms in mslist:
-570
+        try:
-571
+            mslocal1.open(subms)
-572
+            scans = mslocal1.getscansummary()
-573
+            msscanlist.append(scans)
-574
+            spws = mslocal1.getspectralwindowinfo()
-575
+            msspwlist.append(spws)
-576
+            mslocal1.close()
-577
+        except:
-578
+            mslocal1.close()
--
+            raise Exception, 'Cannot get scan/spw information from subMS'
-+
+            raise Exception('Cannot get scan/spw information from subMS')
-580
-581
+        # Get the data volume in bytes per sub-MS
-582
+        sizelist.append(getDiskUsage(subms))
-583
-584
+    # Get the information to list in output
-585
+    # Dictionary to return
-586
+    outdict = {}
-587
-588
+    for ims in range(mslist.__len__()):
-589
+        # Create temp dictionary for each sub-MS
-649
-650
-651
+def getMMSSpwIds(thisdict):
-652
+    '''Get the list of spws from an MMS dictionary.
-653
+       thisdict  --> output dictionary from listpartition(MMS,createdict=true)
-654
+       Return a list of the spw Ids in the dictionary. '''
-655
-656
+    import numpy as np
-657
-658
+    if not isinstance(thisdict, dict):
--
+        print 'ERROR: Input is not a dictionary'
-+
+        print('ERROR: Input is not a dictionary')
-660
+        return []
-661
-662
+    tkeys = thisdict.keys()
-663
-664
+    aspws = np.array([],dtype='int32')
-665
+    for k in tkeys:
-666
+        scanlist = thisdict[k]['scanId'].keys()
-667
+        for s in scanlist:
-668
+            spwids = thisdict[k]['scanId'][s]['spwIds']
-669
+            aspws = np.append(aspws, spwids)
-705
-706
+    Keyword arguments:
-707
+       msfile  --> name of the MS
-708
+       This function will return a value given by the command du -hs
-709
+    """
-710
-711
+    from subprocess import Popen, PIPE, STDOUT
-712
-713
+    # Command line to run
-714
+    ducmd = 'du -hs '+msfile
--
--
+    p = Popen(ducmd, shell=True, stdin=PIPE, stdout=PIPE, stderr=STDOUT, close_fds=True)
--
--
+    sizeline = p.stdout.read()
--
-+
-+
+    if use_old_casa5_commands:
-+
+        p = Popen(ducmd, shell=True, stdin=PIPE, stdout=PIPE, stderr=STDOUT, close_fds=True)
-+
+        sizeline = p.stdout.read()
-+
+        _out, _err = p.communicate()
-+
+    else:
-+
+        p = Popen(ducmd, shell=True, stdin=None, stdout=PIPE, stderr=STDOUT, close_fds=True)
-+
+        o, e = p.communicate()             ### previously 'sizeline = p.stdout.read()' here
-+
+                                           ### left process running...
-+
+        sizeline = bytes2str(o.split( )[0])
-+
-726
+    # Create a list of the output string, which looks like this:
-727
+    # ' 75M\tuidScan23.data/uidScan23.0000.ms\n'
-728
+    # This will create a list with [size,sub-ms]
-729
+    mssize = sizeline.split()
-730
-731
+    return mssize[0]
-732
-733
-734
+def getSubtables(vis):
-735
+    tbTool = tbtool()
-755
+        copysubtables    -- True will copy the sub-tables from the first subMS to the others in the
-756
+                            output MMS. Default to False.
-757
+        omitsubtables    -- List of sub-tables to omit when copying to output MMS. They will be linked instead
-758
+        parallelasxis    -- Optionally, set the value to be written to AxisType in table.info of the output MMS
-759
+                            Usually this value comes from the separationaxis keyword of partition or mstransform.
-760
-761
+          Be AWARE that this function will remove the tables listed in submslist.
-762
+    """
-763
-764
+    if os.path.exists(outputvis):
--
+        raise ValueError, "Output MS already exists"
-+
+        raise ValueError('Output MS already exists')
-766
-767
+    if len(submslist)==0:
--
+        raise ValueError, "No SubMSs given"
-+
+        raise ValueError('No SubMSs given')
-769
-770
+    ## make an MMS with all sub-MSs contained in a SUBMSS subdirectory
-771
+    origpath = os.getcwd()
-772
+    mymstool = mstool()
-773
+    mytbtool = tbtool()
-774
-775
+    try:
-776
+        try:
-777
+            mymstool.createmultims(outputvis,
-778
+                                   submslist,
-827
+                os.system('rm -rf '+s)
-828
+                os.symlink('../'+mastersubms+'/'+s, s)
-829
-830
+        # Write the AxisType info in the MMS
-831
+        if parallelaxis != '':
-832
+            setAxisType(outputvis, parallelaxis)
-833
-834
+    except:
-835
+        theproblem = str(sys.exc_info())
-836
+        os.chdir(origpath)
--
+        raise ValueError, "Problem in MMS creation: "+theproblem
-+
+        raise ValueError('Problem in MMS creation: {0}'.format(theproblem))
-838
-839
+    os.chdir(origpath)
-840
-841
+    return True
-842
-843
def axisType(mmsname):
    """Get the axisType information from a Multi-MS. The AxisType information
       is usually added for Multi-MS with the axis which data is parallelized across.

       Keyword arguments:
           mmsname    --    name of the Multi-MS

        It returns the value of AxisType or an empty string if it doesn't exist.
        Raises ValueError if the table cannot be opened.
    """
    tblocal = tbtool()

    try:
        tblocal.open(mmsname, nomodify=True)
    except Exception:
        # Exception (not a bare except) so that KeyboardInterrupt/SystemExit
        # are not converted into a ValueError
        raise ValueError('Unable to open table {0}'.format(mmsname))

    # Always release the table, even if reading the info record fails
    try:
        tbinfo = tblocal.info()
    finally:
        tblocal.close()

    axis = ''
    if 'readme' in tbinfo:
        for val in tbinfo['readme'].splitlines():
            if 'AxisType' in val:
                # Keep the text after the first '='; if several lines
                # mention AxisType the last one wins
                axis = val.partition('=')[2]

    return axis.strip()
-873
-874
+def setAxisType(mmsname, axis=''):
-875
+    """Set the AxisType keyword in a Multi-MS info. If AxisType already
-876
+       exists, it will be overwritten.
-877
-878
+    Keyword arguments:
-879
+        mmsname    --    name of the Multi-MS
-880
+        axis       --    parallel axis of the Multi-MS. Options: scan; spw or scan,spw
-881
-882
+        Return True on success, False otherwise.
-883
+    """
-884
-885
+    if axis == '':
--
+        raise ValueError, "Axis value cannot be empty"
-+
+        raise ValueError('Axis value cannot be empty')
-887
-888
+    tblocal = tbtool()
-889
+    try:
-890
+        tblocal.open(mmsname, nomodify=False)
-891
+    except:
--
+        raise ValueError, "Unable to open table %s" % mmsname
-+
+        raise ValueError('Unable to open table {0}'.format(mmsname))
-893
-894
+    import copy
-895
-896
+    tbinfo = tblocal.info()
-897
+    readme = ''
-898
+    # Save original readme
--
+    if tbinfo.has_key('readme'):
-+
+    if 'readme' in tbinfo:
-900
+        readme = tbinfo['readme']
-901
-902
+    # Check if AxisType already exist and remove it
-903
+    if axisType(mmsname) != '':
--
+        print 'WARN: Will overwrite the existing AxisType value'
-+
+        print('WARN: Will overwrite the existing AxisType value')
-905
+        readlist = readme.splitlines()
-906
+        newlist = copy.deepcopy(readlist)
-907
+        for val in newlist:
-908
+            if val.__contains__('AxisType'):
-909
+                readlist.remove(val)
-910
-911
+        # Recreate the string
-912
+        nr = ''
-913
+        for val in readlist:
-914
+            nr = nr + val + '\n'
-959
+        # Initialize scan sub-map
-960
+        scanDdiMap[scan] = {}
-961
+        # Iterate over timestamps for this scan
-962
+        for timestamp in scanSummary[scan]:
-963
+            # Get list of ddis for this timestamp
-964
+            DDIds = scanSummary[scan][timestamp]['DDIds']
-965
+            fieldId = str(scanSummary[scan][timestamp]['FieldId'])
-966
+            # Get number of rows per ddi (assume all DDIs have the same number of rows)
-967
+            # In ALMA data WVR DDI has only one row per antenna but it is separated from the other DDIs
-968
+            nrowsPerDDI = scanSummary[scan][timestamp]['nRow'] / len(DDIds)
--
+))
-969
+            # Iterate over DDIs for this timestamp
-970
+            for ddi in DDIds:
-971
+                # Convert to string to be used as a map key
-972
+                ddi = str(ddi)
-973
+                # Check if DDI entry is already present for this scan, otherwise initialize it
--
+                if not scanDdiMap[scan].has_key(ddi):
-+
+                if ddi not in scanDdiMap[scan]:
-975
+                    scanDdiMap[scan][ddi] = {}
-976
+                    scanDdiMap[scan][ddi]['nVis'] = 0
-977
+                    scanDdiMap[scan][ddi]['fieldId'] = fieldId
-978
+                    scanDdiMap[scan][ddi]['isWVR'] = ddIspectralWindowInfo[ddi]['isWVR']
-979
+                # Calculate number of visibilities
-980
+                nvis = nrowsPerDDI*ddIspectralWindowInfo[ddi]['NumChan']*ddIspectralWindowInfo[ddi]['NumCorr']
-981
+                # Add number of rows and vis from this timestamp
-982
+                scanDdiMap[scan][ddi]['nVis'] = scanDdiMap[scan][ddi]['nVis'] + nvis
-983
+                # Update ddi nvis
--
+                if not nVisPerDDI.has_key(ddi):
-+
+                if ddi not in nVisPerDDI:
-985
+                    nVisPerDDI[ddi] = nvis
-986
+                else:
-987
+                    nVisPerDDI[ddi] = nVisPerDDI[ddi] + nvis
-988
+                # Update scan nvis
--
+                if not nVisPerScan.has_key(scan):
-+
+                if scan not in nVisPerScan:
-990
+                    nVisPerScan[scan] = nvis
-991
+                else:
-992
+                    nVisPerScan[scan] = nVisPerScan[scan] + nvis
-993
+                # Update field nvis
--
+                if not nVisPerField.has_key(fieldId):
-+
+                if fieldId not in nVisPerField:
-995
+                    nVisPerField[fieldId] = nvis
-996
+                else:
-997
+                    nVisPerField[fieldId] = nVisPerField[fieldId] + nvis
-998
-999
+    return scanDdiMap, nVisPerDDI, nVisPerScan, nVisPerField
-1000
-1001
+def getPartitionMap(msfilename, nsubms, selection={}, axis=['field','spw','scan'],plotMode=0):
-1002
+    """Generates a partition scan/spw map to obtain optimal load balancing with the following criteria:
-1003
-1004
+st - Maximize the scan/spw/field distribution across sub-MSs
-1077
+    if nsubms > nScanDDIPairs:
-1078
+        casalog.post("Number of subMSs (%i) is greater than available scan,ddi pairs (%i), setting nsubms to %i"
-1079
+                     % (nsubms,nScanDDIPairs,nScanDDIPairs),"WARN","getPartitionMap")
-1080
+        nsubms = nScanDDIPairs
-1081
-1082
+    ddiArray = np.array(ddiList)
-1083
+    scanArray = np.array(scanList)
-1084
+    nVisArray = np.array(nVisList)
-1085
-1086
+    nVisSortIndex = np.lexsort((ddiArray, scanArray, nVisArray))
-+
+    # argsort/lexsort return indices by increasing value. This reverses the indices by
-+
+    # decreasing value
-1089
+    nVisSortIndex[:] = nVisSortIndex[::-1]
-1090
-1091
+    ddiArray = ddiArray[nVisSortIndex]
-1092
+    scanArray = scanArray[nVisSortIndex]
-1093
+    nVisArray = nVisArray[nVisSortIndex]
-1094
-1095
+    # Make a map for the contribution of each subMS to each scan
-1096
+    scanNvisDistributionPerSubMs = {}
-1097
+    for scan in scanSummary:
-1098
+        scanNvisDistributionPerSubMs[scan] = np.zeros(nsubms)
-1131
-1132
+        ddi = ddiArray[pair]
-1133
+        scan = scanArray[pair]
-1134
+        field = scanDdiMap[scan][ddi]['fieldId']
-1135
-1136
+        # Select the subMS that with bigger (scan/ddi/field gap)
-1137
+        # We use the average as a refLevel to include global structure information
-1138
+        # But we also take into account the actual max value in case we are distributing large uneven chunks
-1139
+        jointNvisGap = np.zeros(nsubms)
-1140
+        if 'scan' in axis:
--
+            refLevel = max(nVisPerScan[scan]/nsubms,scanNvisDistributionPerSubMs[scan].max())
-+
+            refLevel = max(nVisPerScan[scan] //
-+
+                           nsubms,scanNvisDistributionPerSubMs[scan].max())
-1143
+            jointNvisGap = jointNvisGap + refLevel - scanNvisDistributionPerSubMs[scan]
-1144
+        if 'spw' in axis:
--
+            refLevel = max(nVisPerDDI[ddi]/nsubms,ddiNvisDistributionPerSubMs[ddi].max())
-+
+            refLevel = max(nVisPerDDI[ddi] //
-+
+                           nsubms,ddiNvisDistributionPerSubMs[ddi].max())
-1147
+            jointNvisGap = jointNvisGap + refLevel - ddiNvisDistributionPerSubMs[ddi]
-1148
+        if 'field' in axis:
--
+            refLevel = max(nVisPerField[field]/nsubms,fieldNvisDistributionPerSubMs[field].max())
--
+            jointNvisGap = jointNvisGap + refLevel - fieldNvisDistributionPerSubMs[field]
-+
+            refLevel = max(nVisPerField[field] //
-+
+                           nsubms,fieldNvisDistributionPerSubMs[field].max())
-+
+            jointNvisGap = jointNvisGap + refLevel - fieldNvisDistributionPerSubMs[field]
-1152
-1153
+        optimalSubMs = np.where(jointNvisGap == jointNvisGap.max())
-1154
+        optimalSubMs = optimalSubMs[0] # np.where returns a tuple
-1155
-1156
+        # In case of multiple candidates select the subms with minum number of total visibilities
-1157
+        if len(optimalSubMs) > 1:
-1158
+            subIdx = np.argmin(nvisPerSubMs[optimalSubMs])
-1159
+            optimalSubMs = optimalSubMs[subIdx]
-1160
+        else:
-1161
+            optimalSubMs = optimalSubMs[0]

casa5

Commits

Jira Issues

Add shortcut