facetselfcal.py

#!/usr/bin/env python

# auto update channels out and fitspectralpol for high dynamic range
#h5_merger.merge_h5(h5_out=outparmdb,h5_tables=parmdb,add_directions=sourcedir_removed.tolist(),propagate_flags=False) Needs to be propagate_flags to be fully correct, this is a h5_merger issue
# check that MODEL_DATA_DD etc XY,YX are set to zero/or clean if wsclean predicts are used for Stokes I/dual 
# time, timefreq, freq med/avg steps (via losoto)
# BDA step DP3
# compression: blosc2
# useful? https://learning-python.com/thumbspage.html
# bdsf still steals the logger https://github.com/lofar-astron/PyBDSF/issues/176
# add html summary overview
# Stacking check that freq and time axes are identical
# Add multi-run stacking
# scalaraphasediff solve WEIGHT_SPECTRUM_PM should not be dysco compressed! Or not update weights there...
# BLsmooth cannot smooth more than bandwidth and time smearing allows, not checked now
# bug related to sources-pb.txt in facet imaging being empty if no -apply-beam is used
# fix RR-LL referencing for flaged solutions, check for possible superterp reference station
# put all fits images in images folder, all solutions in solutions folder? to reduce clutter
# phase detrending.
# log command into the FITS header
# BLsmooth constant smooth for gain solves
# stop selfcal  based on some metrics
# use scalarphasediff sols stats for solints? test amplitude stats as well
# parallel solving with DP3, given that DP3 often does not use all cores?
# uvmin, uvmax, uvminim, uvmaxim per ms per soltype

#antidx = 0
#pt.taql("select ANTENNA1,ANTENNA2,gntrue(FLAG)/(gntrue(FLAG)+gnfalse(FLAG)) as NFLAG from L656064_129_164MHz_uv_pre-cal.concat.ms WHERE (ANTENNA1=={:d} OR ANTENNA2=={:d}) AND ANTENNA1!=ANTENNA2".format(antidx, antidx)).getcol('NFLAG')

# example:
# python facetselfal.py -b box_18.reg --forwidefield --avgfreqstep=2 --avgtimestep=2 --smoothnessconstraint-list="[0.0,0.0,5.0]" --antennaconstraint-list="['core']" --solint-list=[1,20,120] --soltypecycles-list="[0,1,3]" --soltype-list="['tecandphase','tecandphase','scalarcomplexgain']" test.ms

# Standard library imports
import argparse
import ast
import configparser
import fnmatch
import glob
import logging
import multiprocessing
import os
import os.path
import pickle
import re
import subprocess
import sys
import time

from itertools import product
from itertools import groupby

# Third party imports
import astropy
import astropy.stats
import astropy.units as units
import bdsf
import casacore.tables as pt
import losoto
import losoto.lib_operations
import matplotlib
import matplotlib.pyplot as plt
import numpy as np
import pyregion
import tables
import scipy.special

from astropy.io import fits
from astropy.wcs import WCS
from astropy.io import ascii
from astropy.coordinates import AltAz, EarthLocation, ITRS, SkyCoord
#from astropy.coordinates import angular_separation
from astropy.time import Time
from astroquery.skyview import SkyView
from losoto import h5parm

logger = logging.getLogger(__name__)
logging.basicConfig(filename='selfcal.log',
                    format='%(levelname)s:%(asctime)s ---- %(message)s', datefmt='%m/%d/%Y %H:%M:%S')
logger.setLevel(logging.DEBUG)

try:
    import everybeam
except ImportError:
    logger.warning('Failed to import EveryBeam, functionality will not be available.')

matplotlib.use('Agg')
# For NFS mounted disks
os.environ["HDF5_USE_FILE_LOCKING"] = "FALSE"

# from astropy.utils.data import clear_download_cache
# clear_download_cache()

def fix_h5(h5_list):
    '''
    Fix for h5_merger that cannot handle multi-dir merges where both h5 with and without pol-axis are included
    '''
    import h5_merger
    for h5file in h5_list:
        outparmdb = h5file.replace('.h5', '.tmp.h5')
        if os.path.isfile(outparmdb):
            os.system('rm -f ' + outparmdb)
        # copy to get a clean h5 with standard dimensions
        h5_merger.merge_h5(h5_out=outparmdb,h5_tables=h5file,propagate_flags=True)

        # overwrite original 
        os.system('cp -f ' + outparmdb + ' ' + h5file )
        os.system('rm -f ' + outparmdb)
    return


def update_fitspectralpol(args):
    if args['update_fitspectralpol']:
         args['fitspectralpol'] = set_fitspectralpol(args['channelsout'])
    return args['fitspectralpol']

def update_channelsout(args, selfcalcycle, mslist):
   
    if args['update_channelsout']:
        t = pt.table(mslist[0] + '/OBSERVATION', ack=False)
        telescope = t.getcol('TELESCOPE_NAME')[0] 
        t.close()
        # set stackstr
        for msim_id, mslistim in enumerate(nested_mslistforimaging(mslist, stack=args['stack'])):
            if args['stack']:
                stackstr= '_stack' + str(msim_id).zfill(2)
            else:
                stackstr='' # empty string
  
        # set imagename
        if args['imager'] == 'WSCLEAN':
            if args['idg']:
              imagename  = args['imagename'] + str(selfcalcycle).zfill(3) + stackstr + '-MFS-image.fits'
            else:
              imagename  = args['imagename'] + str(selfcalcycle).zfill(3) + stackstr + '-MFS-image.fits'
        if args['imager'] == 'DDFACET':
            imagename  = args['imagename'] + str(selfcalcycle).zfill(3) + stackstr + '.app.restored.fits'
        if args['channelsout'] == 1: # strip MFS from name if no channels images present
            imagename = imagename.replace('-MFS', '').replace('-I','')

        dr = get_image_dynamicrange(imagename)
        
        if dr > 1500 and telescope == 'LOFAR':
          args['channelsout'] =  set_channelsout(mslist, factor=2) 
        if dr > 3000 and telescope == 'LOFAR':
          args['channelsout'] =  set_channelsout(mslist, factor=3) 
        if dr > 6000 and telescope == 'LOFAR':
          args['channelsout'] =  set_channelsout(mslist, factor=4) 

        if dr > 30000 and telescope == 'MeerKAT':
          args['channelsout'] =  set_channelsout(mslist, factor=1.5) 
        if dr > 60000 and telescope == 'MeerKAT':
          args['channelsout'] =  set_channelsout(mslist, factor=2) 
        if dr > 90000 and telescope == 'MeerKAT':
          args['channelsout'] =  set_channelsout(mslist, factor=3) 

    return args['channelsout']

def round_up_to_even(number):
    return int(np.ceil(number / 2.) * 2)

def set_channelsout(mslist, factor=1):
    t = pt.table(mslist[0] + '/OBSERVATION', ack=False)
    telescope = t.getcol('TELESCOPE_NAME')[0] 
    t.close()
    f_bw = get_fractional_bandwidth(mslist)

    if telescope == 'LOFAR':
        channelsout = round_up_to_even(f_bw*12*factor)
    elif telescope == 'MeerKAT':   
        channelsout = round_up_to_even(f_bw*16*factor)
    else:    
        channelsout = round_up_to_even(f_bw*12*factor)
    return channelsout
  
def set_fitspectralpol(channelsout):
    if channelsout == 1:
        fitspectralpol = 1  
    elif channelsout == 2:  
        fitspectralpol = 2 
    elif channelsout <= 6:  
        fitspectralpol = 3 
    elif channelsout <= 8:  
        fitspectralpol = 5 
    elif channelsout <= 12:  
        fitspectralpol = 7 
    elif channelsout > 12 :  
        fitspectralpol = 9 
    else:
       print('channelsout', channelsout)
       raise Exception('channelsout has an invalid value')  
    return fitspectralpol
  
def get_fractional_bandwidth(mslist):
    '''
    Compute fractional bandwidth of a list of MS
    input mslist: list of ms
    return fractional bandwidth
    '''
    freqaxis = [] 
    for ms in mslist:        
        t = pt.table(ms + '/SPECTRAL_WINDOW', readonly=True, ack=False)
        freq = t.getcol('CHAN_FREQ')[0]
        t.close()
        freqaxis.append(freq)
    freqaxis = np.hstack(freqaxis) 
    f_bw = (np.max(freqaxis) - np.min(freqaxis))/np.min(freqaxis)
    
    if f_bw == 0.0: # single channel data
       t = pt.table(mslist[0] + '/SPECTRAL_WINDOW', readonly=True, ack=False) # just take the first and assume this is ok
       f_bw =  t.getcol('TOTAL_BANDWIDTH')[0]/np.min(freqaxis)
       t.close()
    return f_bw
  

def MeerKAT_antconstraint(antfile='MeerKATlayout.csv', ctype='all'):
    if ctype not in ['core','remote','all']:
        print('Wrong input detected, ctype needs to be in core,remote,or all')
        sys.exit()

    data = ascii.read(antfile,delimiter=';',header_start=0) 
    distance = np.sqrt(data['East']**2+ data['North']**2 + data['Up']**2)
    #print(distance
    idx_core = np.where(distance <= 1000.)
    idx_rs   = np.where(distance > 1000.)
    if ctype == 'core':
        return data['Antenna'][idx_core].tolist()
    if ctype == 'remote':
        return data['Antenna'][idx_rs].tolist()
    if ctype == 'all':  
        return data['Antenna'].tolist()

def remove_column_ms(mslist, colname):
    '''
    Remove a column from a Measurement Sets
    mslist (str/list): input ms(list)
    colname: column that will be removed
    '''
    if type(mslist) == list:
        for ms in mslist:
            ts = pt.table(ms, readonly=False, ack=False)
            ts.removecols([colname])
            ts.close()
    else:
        ts = pt.table(mslist, readonly=False, ack=False)
        ts.removecols([colname])
        ts.close()
    return

def update_sourcedirname_h5_dde(h5, modeldatacolumns):
    '''
    Replace direction names in h5 with the modeldatacolumns names
    '''
    
    modeldatacolumns_outname = [] 
    for mm_id, mm in enumerate(modeldatacolumns):
       modeldatacolumns_outname.append('DIL' + str(mm_id).zfill(2))  # need a name that has only 5 characters because otherwise we cannot copy over the names 
    
    H = tables.open_file(h5,mode='a')
    for direction_id, direction in enumerate(modeldatacolumns):
       H.root.sol000.source[direction_id] = (modeldatacolumns[direction_id], H.root.sol000.source[direction_id]['dir'])
       print(H.root.sol000.source[direction_id]['name'], modeldatacolumns[direction_id])
       
    try:
       H.root.sol000.phase000.dir[:] = modeldatacolumns_outname
       print('Update direction names phase000',modeldatacolumns_outname)
    except:
       pass
    try:
       H.root.sol000.amplitude000.dir[:] = modeldatacolumns_outname
       print('Update direction names amplitude000',modeldatacolumns_outname)
    except:
       pass
    try:
       H.root.sol000.tec000.dir[:] = modeldatacolumns_outname
       print('Update direction names tec000',modeldatacolumns_outname)
    except:
       pass
    try:
       H.root.sol000.rotation000.dir[:] = modeldatacolumns_outname
       print('Update direction names rotation000',modeldatacolumns_outname)
    except:
       pass
                     
    H.close()
    print('Done fixing direction names')
    return


def merge_splitted_h5_ordered(modeldatacolumnsin, parmdb_out, clean_up=False):
   h5list_sols = []
   for colid, coln in enumerate(modeldatacolumnsin):
         h5list_sols.append('Dir' + str(colid).zfill(2) + '.h5')
   print('These are the h5 that need merging:', h5list_sols)
   if os.path.isfile(parmdb_out):
      os.system('rm -f ' + parmdb_out)  
   
   f = open('facetdirections.p', 'rb')
   sourcedir = pickle.load(f) # units are radian
   f.close()   
   parmdb_merge_list = []
   
   
   for direction in sourcedir:
      print(direction)
      c1 = SkyCoord(direction[0] * units.radian,  direction[1] * units.radian, frame='icrs')
      distance = 1e9
      #print(c1)
      for hsol in h5list_sols:
         H5 = tables.open_file(hsol, mode='r')
         dd = H5.root.sol000.source[:][0]
         H5.close()
         ra, dec = dd[1]
         c2 = SkyCoord(ra * units.radian,  dec * units.radian, frame='icrs')
         angsep = c1.separation(c2).to(units.degree)
         #print(c2)
      
         #print(hsol, angsep.value, '[degree]')
         if angsep.value < distance:
            distance = angsep.value
            matchging_h5 = hsol
      parmdb_merge_list.append(matchging_h5)
      print('separation direction entry and h5 entry is:', distance, matchging_h5)   
      assert abs(distance) < 0.00001 # there should always be a close to perfect match
      
   import h5_merger   
   h5_merger.merge_h5(h5_out=parmdb_out,h5_tables=parmdb_merge_list,propagate_flags=True)   
   
   if clean_up:
      for h5 in h5list_sols:
         os.system('rm -f ' + h5)
   return
   
def copy_over_solutions_from_skipped_directions(modeldatacolumnsin,id_kept):
   ''' 
   modeldatacolumnsin: all modeldatacolumns
   id_kept: indices of the modeldatacolumns kept in the solve id_kept
   '''
   h5list_sols = []
   h5list_empty = []
   for colid, coln in enumerate(modeldatacolumnsin):
      if colid >= len(id_kept):
         h5list_empty.append('Dir' + str(colid).zfill(2) + '.h5')
      else:
         h5list_sols.append('Dir' + str(colid).zfill(2) + '.h5')
   print('These h5 have solutions:', h5list_sols)
   print('These h5 are empty:',h5list_empty)

   # fill the empty directions (those that were removed and not solve) with the closest valid solutions
   for h5 in h5list_empty:
      hempty = tables.open_file(h5, mode='a')
      direction = hempty.root.sol000.source[:][0]
      ra, dec = direction[1]
      c1 = SkyCoord(ra * units.radian,  dec * units.radian, frame='icrs')
      #print(c1)
      
      distance = 1e9
      for h5sol in h5list_sols:
          hsol = tables.open_file(h5sol, mode='r')
          directionsol = hsol.root.sol000.source[:][0]
          rasol, decsol = directionsol[1]
          c2 = SkyCoord(rasol * units.radian,  decsol * units.radian, frame='icrs') 
          angsep = c1.separation(c2).to(units.degree)
          #print(h5, h5sol, angsep.value, '[degree]')
          if angsep.value < distance:
             distance = angsep.value
             matchging_h5 = h5sol
          hsol.close()
      print(h5 + ' needs solutions copied from ' +  matchging_h5, distance)
   
      # copy over the values
      hmatch = tables.open_file(matchging_h5, mode='r')
      
      try:
         hempty.root.sol000.phase000.val[:] = np.copy(hmatch.root.sol000.phase000.val[:])
         print('Copied over phase000')
      except:
        pass
      try:
         hempty.root.sol000.amplitude000.val[:] = np.copy(hmatch.root.sol000.amplitude000.val[:])
         print('Copied over amplitude000')
      except:
        pass
      try:
         hempty.root.sol000.tec000.val[:] = np.copy(hmatch.root.sol000.tec000.val[:])
         print('Copied over tec000')
      except:
        pass      
      try:
         hempty.root.sol000.rotation000.val[:] = np.copy(hmatch.root.sol000.rotation000.val[:])
         print('Copied over rotation000')
      except:
        pass

      hmatch.close()
      hempty.flush()
      hempty.close()
   return
 
 
def filter_baseline_str_removestations(stationlist):
  fbaseline = "'"
  for station_id, station in enumerate(stationlist):
    fbaseline = fbaseline +"!" +station + "&&*"
    if station_id+1 < len(stationlist):
       fbaseline = fbaseline + ";"
  return fbaseline + "'"
  

def return_antennas_highflaggingpercentage(ms, percentage=0.85):
   ### Find all antennas with more than 80% flagged data
   print('Finding stations with a flagging percentage above ' + str(100*percentage) + ' ....')
   from casacore.tables import taql
   t = taql(""" SELECT antname, gsum(numflagged) AS numflagged, gsum(numvis) AS numvis,
       gsum(numflagged)/gsum(numvis) as percflagged FROM [[ SELECT mscal.ant1name() AS antname, ntrue(FLAG) AS numflagged, count(FLAG) AS numvis FROM """ + ms + """ ],[ SELECT mscal.ant2name() AS antname, ntrue(FLAG) AS numflagged, count(FLAG) AS numvis FROM """ + ms + """ ] ] GROUP BY antname HAVING percflagged > """ + str(percentage) +  """ """)

   flaggedants = [ row["antname"] for row in t ]
   print('Found:', flaggedants)
   return flaggedants


def create_empty_fitsimage(ms, imsize, pixelsize, outfile):
    '''
    Create emtpy (zeros) FITS file with size imsize and pixelsize
    Image center coincides with the phase center of the provided ms
    '''
    data = np.zeros((imsize, imsize)) 

    w = WCS(naxis=2)
    # what is the center pixel of the XY grid.
    w.wcs.crpix = [imsize/2, imsize/2]

    # coordinate of the pixel.
    w.wcs.crval = grab_coord_MS(ms)

    # the pixel scale
    w.wcs.cdelt = np.array([pixelsize/3600., pixelsize/3600.])
    
    # projection
    w.wcs.ctype = ["RA---SIN", "DEC--SIN"]

    # write the HDU object WITH THE HEADER
    header = w.to_header()
    hdu = fits.PrimaryHDU(data, header=header)
    hdu.writeto(outfile, overwrite=True)
    return 

def copy_over_sourcedirection_h5(h5ref, h5):
    '''
    Replace source direction in h5 with the one in h5ref
    '''
    from overwrite_table import overwrite_table
    Href = tables.open_file(h5ref, mode='r')
    refsource = Href.root.sol000.source[:]
    Href.close()
    overwrite_table(h5, 'source', refsource)
    return


def set_DDE_predict_skymodel_solve(wscleanskymodel):
  if wscleanskymodel is not None:
     return 'WSCLEAN'
  else: 
     return 'DP3'

def getAntennas(ms):
   """
   Return a list of antenna names
   """
   t = pt.table(ms + "/ANTENNA", readonly=True, ack=False)
   antennas = t.getcol('NAME')
   t.close()
   return antennas


def grab_coord_MS(MS):
    """
    Read the coordinates of a field from one MS corresponding to the selection given in the parameters

    Parameters
    ----------
    MS : str
        Full name (with path) to one MS of the field

    Returns
    -------
    RA, Dec : "tuple"
        coordinates of the field (RA, Dec in deg , J2000)
    """

    # reading the coordinates ("position") from the MS
    # NB: they are given in rad,rad (J2000)
    [[[ra,dec]]] = pt.table(MS+'::FIELD', readonly=True, ack=False).getcol('PHASE_DIR')

    # RA is stocked in the MS in [-pi;pi]
    # => shift for the negative angles before the conversion to deg (so that RA in [0;2pi])
    if ra<0:
        ra=ra+2*np.pi

    # convert radians to degrees
    ra_deg =  ra/np.pi*180.
    dec_deg = dec/np.pi*180.

    # and sending the coordinates in deg
    return(ra_deg,dec_deg)


def getGSM(ms_input, SkymodelPath='gsm.skymodel', Radius="5.", DoDownload="Force", Source="GSM", targetname = "pointing", fluxlimit = None):
    """
    Download the skymodel for the target field

    Parameters
    ----------
    ms_input : str
        String from the list (map) of the target MSs
    SkymodelPath : str
        Full name (with path) to the skymodel; if YES is true, the skymodel will be downloaded here
    Radius : string with float (default = "5.")
        Radius for the TGSS/GSM cone search in degrees
    DoDownload : str ("Force" or "True" or "False")
        Download or not the TGSS skymodel or GSM.
        "Force": download skymodel from TGSS or GSM, delete existing skymodel if needed.
        "True" or "Yes": use existing skymodel file if it exists, download skymodel from
                         TGSS or GSM if it does not.
        "False" or "No": Do not download skymodel, raise an exception if skymodel
                         file does not exist.
    targetname : str
        Give the patch a certain name, default: "pointing"
    """
    import lsmtool
    FileExists = os.path.isfile(SkymodelPath)
    if (not FileExists and os.path.exists(SkymodelPath)):
        raise ValueError("download_tgss_skymodel_target: Path: \"%s\" exists but is not a file!"%(SkymodelPath))
    download_flag = False
    #if not os.path.exists(os.path.dirname(SkymodelPath)):
    #    os.makedirs(os.path.dirname(SkymodelPath))
    if DoDownload.upper() == "FORCE":
        if FileExists:
            os.remove(SkymodelPath)
        download_flag = True
    elif DoDownload.upper() == "TRUE" or DoDownload.upper() == "YES":
        if FileExists:
            print("USING the exising skymodel in "+ SkymodelPath)
            return(0)
        else:
            download_flag = True
    elif DoDownload.upper() == "FALSE" or DoDownload.upper() == "NO":
         if FileExists:
            print("USING the exising skymodel in "+ SkymodelPath)
            return(0)
         else:
            raise ValueError("download_tgss_skymodel_target: Path: \"%s\" does not exist and skymodel download is disabled!"%(SkymodelPath))

    # If we got here, then we are supposed to download the skymodel.
    assert download_flag is True # Jaja, belts and suspenders...
    print("DOWNLOADING skymodel for the target into "+ SkymodelPath)

    # Reading a MS to find the coordinate (pyrap)
    [RATar,DECTar]=grab_coord_MS(ms_input)

    # Downloading the skymodel, skip after five tries
    errorcode = 1
    tries     = 0
    while errorcode != 0 and tries < 5:
        if Source == 'TGSS':
            errorcode = os.system("wget -O "+SkymodelPath+ " \'http://tgssadr.strw.leidenuniv.nl/cgi-bin/gsmv5.cgi?coord="+str(RATar)+","+str(DECTar)+"&radius="+str(Radius)+"&unit=deg&deconv=y\' ")
        elif Source == 'GSM':
            errorcode = os.system("wget -O "+SkymodelPath+ " \'https://lcs165.lofar.eu/cgi-bin/gsmv1.cgi?coord="+str(RATar)+","+str(DECTar)+"&radius="+str(Radius)+"&unit=deg&deconv=y\' ")
        time.sleep(5)
        tries += 1

    if not os.path.isfile(SkymodelPath):
        raise IOError("download_tgss_skymodel_target: Path: \"%s\" does not exist after trying to download the skymodel."%(SkymodelPath))

    # Treat all sources as one group (direction)
    skymodel = lsmtool.load(SkymodelPath)
    if fluxlimit:
        skymodel.remove('I<' + str(fluxlimit))
    skymodel.group('single', root = targetname)
    skymodel.write(clobber=True)
    
    return SkymodelPath


def concat_ms_wsclean_facetimaging(mslist, h5list=None,concatms=True):

   import h5_merger
   keyfunct = lambda x: ' '.join(sorted(getAntennas(x)))

   MSs_list = sorted(mslist, key=keyfunct) # needs to be sorted

   groups = []
   for k, g in groupby(MSs_list, keyfunct):
      groups.append(list(g))
   print(f"Found {len(groups)} groups of datasets with same antennas.")

   for i, group in enumerate(groups, start=1):
      antennas = ', '.join(getAntennas(group[0]))
      print(f"WSClean MS group {i}: {group}")
      print(f"List of antennas: {antennas}")

   MSs_files_clean = []
   H5s_files_clean = []
   for g, group in enumerate(groups):
      if os.path.isdir(f'wsclean_concat_{g}.ms') and concatms:
         os.system(f'rm -rf wsclean_concat_{g}.ms')
      
      if h5list is not None:
         h5group = []
         for ms in group:
            h5group.append(time_match_mstoH5(h5list, ms))
         print('------------------------------')
         print('MS group and matched h5 group', group, h5group)
         print('------------------------------')
         if os.path.isfile(f'wsclean_concat_{g}.h5'):
            os.system(f'rm -rf wsclean_concat_{g}.h5')     
         h5_merger.merge_h5(h5_out=f'wsclean_concat_{g}.h5', h5_tables=h5group, \
                            propagate_flags=True, time_concat=True)
         H5s_files_clean.append(f'wsclean_concat_{g}.h5')
      if concatms:
         print(f'taql select from {group} giving wsclean_concat_{g}.ms as plain')
         run(f'taql select from {group} giving wsclean_concat_{g}.ms as plain')
      MSs_files_clean.append(f'wsclean_concat_{g}.ms')
    
   #MSs_files_clean = ' '.join(MSs_files_clean)

   #print('Use the following ms files as input in wsclean:')
   #print(MSs_files_clean)
   
   return MSs_files_clean, H5s_files_clean


def check_for_BDPbug_longsolint(mslist, facetdirections, args=None):
   #try:
   dirs, solints, soltypelist_includedir = parse_facetdirections(facetdirections, 1000, args=args)
   #except:
   #    try:
   #      f = open(facetdirections, 'rb')
   #      PatchPositions_array = pickle.load(f)
   #      f.close()
   #      solints = None
   #    except: 
   #      raise Exception('Trouble read file format:' + facetdirections) 
	   
   if solints is None:
      return  
   
   solint_reformat= np.array(solints)
   import math
   for ms in mslist:
      t = pt.table(ms, readonly=True, ack=False)
      time = np.unique(t.getcol('TIME'))
      t.close()
      print('------------' + ms)
      ms_ntimes = len(time)
      #print(ms, ms_ntimes)
      for solintcyle_id, tmpval in enumerate(solint_reformat[0]): 
         print(' --- ' + str('pertubation cycle=') + str(solintcyle_id) + '--- ')
         solints_cycle = solint_reformat[:,solintcyle_id]
         solints = [int(format_solint(x, ms)) for x in solints_cycle]
         print('Solint unmodified per direction', solints) 
         solints = tweak_solints(solints, ms_ntimes=ms_ntimes)
         print('Solint tweaked per direction   ', solints) 
         #print('Here')
         #sys.exit()
         lcm = math.lcm(*solints)
         divisors = [int(lcm/i) for i in solints]
         print('Solint passed to DP3 would be:', lcm, ' --Number of timeslots in MS:', ms_ntimes)
         if lcm > ms_ntimes:
            print('Bad divisor for solutions_per_direction DDE solve. DP3 Solint > number of timeslots in the MS')
            sys.exit() 
      print('------------')

   return

def selfcal_animatedgif(fitsstr, outname):
   limit_min = -250e-6
   limit_max = 2.5e-2
   cmd = 'ds9 ' + fitsstr + ' '
   cmd += '-single -view basic -frame first -geometry 800x800 -zoom to fit -sqrt -scale limits ' 
   cmd +=  str(limit_max)  + ' ' + str(limit_max) + ' '
   cmd += '-cmap ch05m151008 -colorbar lock yes -frame lock wcs '
   cmd += '-lock scalelimits yes -movie frame gif 10 '
   cmd += outname + ' -quit'
   run(cmd)
   return


def find_closest_ddsol(h5, ms): # 
   """
   find closest direction in multidir h5 files to the phasecenter of the ms
   """
   t2 = pt.table(ms + '::FIELD', ack=False)
   phasedir = t2.getcol('PHASE_DIR').squeeze()
   t2.close()
   c1 = SkyCoord(phasedir[0] * units.radian,  phasedir[1] * units.radian, frame='icrs')
   H5 = tables.open_file(h5)
   distance = 1e9 # just a big number
   for direction_id, direction in enumerate (H5.root.sol000.source[:]):
      ra, dec = direction[1]
      c2 = SkyCoord(ra * units.radian,  dec * units.radian, frame='icrs')
      angsep = c1.separation(c2).to(units.degree)
      print(direction[0], angsep.value, '[degree]')
      if angsep.value < distance:
        distance = angsep.value
        dirname = direction[0]
   H5.close()
   return dirname


def set_beamcor(ms, beamcor_var):
   """
   Determine whether to do beam correction or note
   """
   if beamcor_var == 'no':
      logger.info('Run DP3 applybeam: no')
      return False
   if beamcor_var == 'yes':
      logger.info('Run DP3 applybeam: yes')
      return True  

   t = pt.table(ms + '/OBSERVATION', ack=False)
   if t.getcol('TELESCOPE_NAME')[0] != 'LOFAR':
      t.close()
      logger.info('Run DP3 applybeam: no (because we are not using LOFAR observations)')
      return False
   t.close()

   # If we arrive here beamcor_var was set to auto and we are using a LOFAR observation   
   if not beamkeywords(ms):
      # we have old prefactor data in this case, no beam keywords available
      # assume beam was taken out in the field center only if user as set 'auto'
      logger.info('Run DP3 applybeam: yes')
      return True

   # now check if beam was taken out in the current phase center
   t = pt.table(ms, readonly=True, ack=False)
   beamdir = t.getcolkeyword('DATA', 'LOFAR_APPLIED_BEAM_DIR')
   
   t2 = pt.table(ms + '::FIELD', ack=False)
   phasedir = t2.getcol('PHASE_DIR').squeeze()
   t.close()
   t2.close()
   
   c1 = SkyCoord(beamdir['m0']['value']* units.radian, beamdir['m1']['value'] * units.radian, frame='icrs')
   c2 = SkyCoord(phasedir[0] * units.radian,  phasedir[1] * units.radian, frame='icrs')
   angsep = c1.separation(c2).to(units.arcsec)
   
   # angular_separation is recent astropy functionality, do not use, instead use the older SkyCoord.seperation
   #angsep = 3600.*180.*astropy.coordinates.angular_separation(phasedir[0], phasedir[1], beamdir['m0']['value'], beamdir['m1']['value'])/np.pi
   
   print('Angular separation between phase center and applied beam direction is', angsep.value, '[arcsec]')
   logger.info('Angular separation between phase center and applied beam direction is:' + str(angsep.value) + ' [arcsec]')
   
   # of less than 10 arcsec than do beam correction
   if angsep.value < 10.0: 
      logger.info('Run DP3 applybeam: no')
      return False
   else:
      logger.info('Run DP3 applybeam: yes')
      return True

def isfloat(num):
    """
    Check if value is a float
    """
    try:
        float(num)
        return True
    except ValueError:
        return False

def parse_history(ms, hist_item):
    """
    Grep specific history item from MS
    :param ms: measurement set
    :param hist_item: history item
    :return: parsed string
    """
    hist = os.popen('taql "SELECT * FROM '+ms+'::HISTORY" | grep '+hist_item).read().split(' ')
    for item in hist:
        if hist_item in item and len(hist_item)<=len(item):
            return item
    print('WARNING:' + hist_item + ' not found')
    return None


def find_prime_factors(n):
  factorlist = []
  num = n
  while (n % 2 == 0):
    factorlist.append(2)
    n = n/2

  for i in range(3,int(num/2)+1,2):
    while (n % i == 0):
      factorlist.append(i)
      n = n/i
    if (n==1):
      break
  return(factorlist)

def tweak_solintsold(solints, solval=20):
    solints_return = []
    for sol in solints:
        soltmp = sol
        if soltmp > solval:
           soltmp += (int)(soltmp & 1) # round up to even
        solints_return.append((soltmp)) 
    return solints_return

def tweak_solints(solints, solvalthresh=11, ms_ntimes=None):
    """
    Returns modified solints that can be factorized by 2 or 3 if input contains number >= solvalthresh
    """
    solints_return = []
    if np.max(solints) < solvalthresh:
        return solints  
    possible_solints = listof2and3prime(startval=2, stopval=10000)
    if ms_ntimes is not None:
       possible_solints= remove_bad_endrounding(possible_solints,ms_ntimes)

    for sol in solints:
        solints_return.append(find_nearest(possible_solints, sol)) 
    return solints_return

def tweak_solints_single(solint, ms_ntimes, solvalthresh=11, ):
    """
    Returns modified solint that avoids a short number of left over timeslots near the end of the ms
    """
    if np.max(solint) < solvalthresh:
        return solint  
   
    possible_solints = np.arange(1,2*solint)
    possible_solints= remove_bad_endrounding(possible_solints,ms_ntimes)

    return find_nearest(possible_solints, solint)


def remove_bad_endrounding(solints, ms_ntimes, ignorelessthan=11):
   '''
   list of possible solints to start with
   ms_ntimes: number of timeslots in the MS
   if ignorelessthan then do not use this extra option
   '''
   solints_out = []
   for solint in solints:
      if (float(ms_ntimes)/float(solint)) - (np.floor(float(ms_ntimes)/float(solint))) > 0.5 or solint<ignorelessthan:
         solints_out.append(solint)
   return solints_out
 
def listof2and3prime(startval=2, stopval=10000):
   solint=[1]
   for i in np.arange(startval,stopval):
     factors = find_prime_factors(i)
     if len(factors) > 0:
        if factors[-1] == 2 or factors[-1] == 3 :
          solint.append(i)
   return solint

def find_nearest(array, value):
    array = np.asarray(array)
    idx = (np.abs(array - value)).argmin()
    return array[idx]

def get_time_preavg_factor_LTAdata(ms):
    """
    Get time pre-averaging factor (given by demixer.timestep)
    :param ms: measurement set
    :return: averaging integer
    """
    parse_str = "demixer.timestep="
    parsed_history = parse_history(ms, parse_str)
    avg_num = re.findall(r'\d+', parsed_history.replace(parse_str, ''))[0]
    if avg_num.isdigit():
        factor = int(float(avg_num))
        if factor!=1:
            print("WARNING: " + ms + " time has been pre-averaged with factor "+str(factor)+". This might cause time smearing effects.")
        return factor
    elif isfloat(avg_num):
        factor = float(avg_num)
        print("WARNING: parsed factor in " + ms + " is not a digit but a float")
        return factor
    else:
        print("WARNING: parsed factor in " + ms + " is not a float or digit")
        return None
      
def add_dummyms(msfiles):
    '''
    Add dummy ms to create a regular freuqency grid when doing a concat with DPPP
    '''
    if len(msfiles) == 1:
      return msfiles
    keyname = 'REF_FREQUENCY'
    freqaxis = []
    newmslist  = []

    # Check for wrong REF_FREQUENCY which happens after a DPPP split in frequency
    for ms in msfiles:        
        t = pt.table(ms + '/SPECTRAL_WINDOW', readonly=True)
        freq = t.getcol('REF_FREQUENCY')[0]
        t.close()
        freqaxis.append(freq)
    freqaxis = np.sort( np.array(freqaxis))
    minfreqspacing = np.min(np.diff(freqaxis))
    if minfreqspacing == 0.0:
       keyname = 'CHAN_FREQ' 
    
    
    freqaxis = [] 
    for ms in msfiles:        
        t = pt.table(ms + '/SPECTRAL_WINDOW', readonly=True)
        if keyname == 'CHAN_FREQ':
          freq = t.getcol(keyname)[0][0]
        else:
          freq = t.getcol(keyname)[0]  
        t.close()
        freqaxis.append(freq)
    
    # put everything in order of increasing frequency
    freqaxis = np.array(freqaxis)
    idx = np.argsort(freqaxis)
    
    freqaxis = freqaxis[np.array(tuple(idx))]
    sortedmslist = list( msfiles[i] for i in idx )
    freqspacing = np.diff(freqaxis)
    minfreqspacing = np.min(np.diff(freqaxis))
 
    # insert dummies in the ms list if needed
    count = 0
    newmslist.append(sortedmslist[0]) # always start with the first ms the list
    for msnumber, ms in enumerate(sortedmslist[1::]): 
      if int(round(freqspacing[msnumber]/minfreqspacing)) > 1:
        ndummy = int(round(freqspacing[msnumber]/minfreqspacing)) - 1
 
        for dummy in range(ndummy):
          newmslist.append('dummy' + str(count) + '.ms')
          print('Added dummy:', 'dummy' + str(count) + '.ms') 
          count = count + 1
      newmslist.append(ms)
       
    print('Updated ms list with dummies inserted to create a regular frequency grid')
    print(newmslist) 
    return newmslist

def number_of_unique_obsids(msfiles):
    '''
    Basic function to get numbers of observations based on first part of ms name
    (assumes one uses "_" here)

     Args:
         command (list): the list of ms
     Returns:
         reval (int): number of observations
  
    '''
    obsids = []
    for ms in msfiles:
       obsids.append(os.path.basename(ms).split('_')[0])
       print('Using these observations ', np.unique(obsids))
    return len(np.unique(obsids))

def getobsmslist(msfiles, observationnumber):
    '''
    make a list of ms beloning to the same observation
    '''
    obsids = []    
    for ms in msfiles:
      obsids.append(os.path.basename(ms).split('_')[0])
    obsidsextract = np.unique(obsids)[observationnumber]
    mslist = []
    for ms in msfiles:
      if (os.path.basename(ms).split('_')[0]) == obsidsextract:
        mslist.append(ms)
    return mslist 

def mscolexist(ms, colname):
    """ Check if a colname exists in the measurement set ms, returns either True or False """
    if os.path.isdir(ms):
      t = pt.table(ms,readonly=True, ack=False)
      colnames =t.colnames()
      if colname in colnames: # check if the column is in the list
         exist = True
      else:
        exist = False  
      t.close()
    else:
      exist = False # ms does not exist  
    return exist

 
def concat_ms_from_same_obs(mslist, outnamebase, colname='DATA', dysco=True):
   for observation in range(number_of_unique_obsids(mslist)):
      # insert dummies for completely missing blocks to create a regular freuqency grid for DPPP
      obs_mslist = getobsmslist(mslist, observation)
      obs_mslist    = add_dummyms(obs_mslist)   

      msoutconcat = outnamebase + '_' + str(observation) + '.ms'
      msfilesconcat = []

      #remove ms from the list where column DATA_SUB does not exist (to prevent NDPPP crash)
      for msnumber, ms in enumerate(obs_mslist):
         if os.path.isdir(ms):
            if mscolexist(ms,colname):
                msfilesconcat.append(ms)
            else:
                msfilesconcat.append('missing' + str(msnumber))
         else:  
            msfilesconcat.append('missing' + str(msnumber))    
     
         #  CONCAT
         cmd =  'DP3 msin="' + str(msfilesconcat) + '" msin.orderms=False '
         cmd += 'steps=[] '
         cmd += 'msin.datacolumn=%s msin.missingdata=True '%colname
         cmd += 'msin.weightcolumn=WEIGHT_SPECTRUM ' 
         if dysco:
            cmd += 'msout.storagemanager=dysco '
            cmd += 'msout.storagemanager.weightbitrate=16 '
         cmd += 'msout=' + msoutconcat + ' '
         if os.path.isdir(msoutconcat):
            os.system('rm -rf ' + msoutconcat)
      run(cmd, log=False)
   return   

def fix_equidistant_times(mslist, dryrun, dysco=True): 
    t = pt.table(mslist[0] + '/OBSERVATION', ack=False)
    telescope = t.getcol('TELESCOPE_NAME')[0] 
    t.close()
    mslist_return = []
    if telescope != 'LOFAR':
        import split_irregular_timeaxis  
    for ms in mslist:
        if telescope != 'LOFAR':
           if check_equidistant_times([ms], stop=False, return_result=True):
              print(ms + ' has a regular time axis')
              mslist_return.append(ms)
           else:
              ms_path = split_irregular_timeaxis.regularize_ms(ms, overwrite=True, dryrun=dryrun)
              # Do the splitting
              mslist_return = mslist_return + split_irregular_timeaxis.split_ms(ms_path, overwrite=True, prefix=ms_path, return_mslist=True, dryrun=dryrun, dysco=dysco)
        else:
           mslist_return.append(ms)
    return sorted(mslist_return)       
 
 
def check_equidistant_times(mslist, stop=True, return_result=False):
    ''' Check if times in mslist are equidistant

    Args:
        command (list): the list of ms
    Returns:
        reval (int): the returncode of the command.
    '''
    for ms in mslist:
        t = pt.table(ms, ack=False)
        times = np.unique(t.getcol('TIME'))
        t.close()
        if len(times) == 1: # single timestep data
            return  
        diff_times = np.abs(np.diff(times))[:-1] # take out the last one because this one can be special  due to rounding at the end....
        diff_times_medsub = np.abs(diff_times - np.median(diff_times))
        idx_deviating, = np.where(diff_times_medsub > 0.2*np.median(diff_times)) # 20% tolerance
        #print(len(idx_deviating))
        #print(idx_deviating)
        #sys.exit()
        if len(idx_deviating) > 0:
            print(diff_times)
            print('These time slots numbers are deviating', idx_deviating)
            print(diff_times[idx_deviating])
            print(ms, 'Time axis is not equidistant, this might cause DP3 errors and segmentation faults (check how your data was averaged')
            #raise Exception(ms +': Time axis is not equidistant')
            print('Avoid averaging your data with CASA or CARACal, instead average with DP3, this usually solves the issue')
            
            # comment line out below if you are willing to take the risk
            if stop:
                print('If you want to take the risk comment out the sys.exit() in the Python code')
                sys.exit()
        t.close()
    if return_result:
        if len(idx_deviating) > 0:
            return False # so irregular time axis
        else:
            return True # so normal time axis
    return
 
def check_equidistant_freqs(mslist):
    ''' Check if freuqencies in mslist are equidistant

    Args:
        command (list): the list of ms
    Returns:
        reval (int): the returncode of the command.
    '''
    for ms in mslist:
        t = pt.table(ms + '/SPECTRAL_WINDOW', ack=False)
        chan_freqs = t.getcol('CHAN_FREQ')[0]
        if len(chan_freqs) == 1: # single channel data
            return  
        diff_freqs = np.diff(chan_freqs)
        t.close()
        if len(np.unique(diff_freqs)) != 1:
            print(np.unique(diff_freqs))
            print(ms, 'Frequency channels are not equidistant, made a mistake in DP3 concat?')
            raise Exception(ms +': Freqeuency channels are no equidistant, made a mistake in DP3 concat?')
        t.close()
    return

def run(command, log=False):
    ''' Execute a shell command through subprocess

    Args:
        command (str): the command to execute.
    Returns:
        None
    '''
    if log:
        print(command)
        logger.info(command)  
    retval = subprocess.call(command, shell=True)
    if retval != 0:
        print('FAILED to run ' + command + ': return value is ' + str(retval))
        raise Exception(command)
    return retval


def fix_bad_weightspectrum(mslist, clipvalue):
    ''' Sets bad values in WEIGHT_SPECTRUM that affect imaging and subsequent self-calibration to 0.0.

    Args:
        mslist (list): a list of Measurement Sets to iterate over and fix outlier values of.
        clipvalue (float): value above which WEIGHT_SPECTRUM will be set to 0.
    Returns:
        None
    '''
    for ms in mslist:
        print('Clipping WEIGHT_SPECTRUM manually', ms, clipvalue)
        t = pt.table(ms, readonly=False)
        ws = t.getcol('WEIGHT_SPECTRUM')
        idx = np.where(ws > clipvalue)
        ws[idx] = 0.0
        t.putcol('WEIGHT_SPECTRUM', ws)
        t.close()
    return


def format_solint(solint, ms, return_ntimes=False):
    ''' Format the solution interval for DP3 calls.

    Args:
        solint (int or str): input solution interval.
        ms (str): measurement set to extract the integration time from.
    Returns:
        solintout (str): processed solution interval.
    '''
    if str(solint).isdigit():
        if return_ntimes:
            t = pt.table(ms, readonly=True, ack=False)
            time = np.unique(t.getcol('TIME'))
            t.close()
            return str(solint), len(time)
        else:
            return str(solint)
    else:
        t = pt.table(ms, readonly=True, ack=False)
        time = np.unique(t.getcol('TIME'))
        tint = np.abs(time[1] - time[0])
        t.close()
        if 's' in solint:
            solintout = int(np.rint(float(re.findall(r'[+-]?\d+(?:\.\d+)?', solint)[0]) / tint))
        if 'm' in solint:
            solintout = int(np.rint(60. * float(re.findall(r'[+-]?\d+(?:\.\d+)?', solint)[0]) / tint))
        if 'h' in solint:
            solintout = int(np.rint(3600. * float(re.findall(r'[+-]?\d+(?:\.\d+)?', solint)[0]) / tint))
        if solintout < 1:
            solintout = 1
        if return_ntimes:
            return str(solintout), len(time)
        else:
            return str(solintout)


def format_nchan(nchan, ms):
    ''' Format the solution interval for DP3 calls.

    Args:
        nchan (int or str): input solution interval along the frequency axis.
        ms (str): measurement set to extract the frequnecy resolution from.
    Returns:
        solintout (str): processed frequency solution interval.
    '''
    if str(nchan).isdigit():
        return str(nchan)
    else:
        t = pt.table(ms + '/SPECTRAL_WINDOW', ack=False)
        chanw = np.median(t.getcol('CHAN_WIDTH'))
        t.close()
        if 'Hz' in nchan:
            nchanout = int(np.rint(float(re.findall(r'[+-]?\d+(?:\.\d+)?', nchan)[0]) / chanw))
        if 'kHz' in nchan:
            nchanout = int(np.rint(1e3 * float(re.findall(r'[+-]?\d+(?:\.\d+)?', nchan)[0]) / chanw))
        if 'MHz' in nchan:
            nchanout = int(np.rint(1e6 * float(re.findall(r'[+-]?\d+(?:\.\d+)?', nchan)[0]) / chanw))
        if nchanout < 1:
            nchanout = 1
        return str(nchanout)

def make_utf8(inp):
    """
    Convert input to utf8 instead of bytes
    :param inp: string input
    :return: input in utf-8 format
    """

    try:
        inp = inp.decode('utf8')
        return inp
    except (UnicodeDecodeError, AttributeError):
        return inp


def FFTdelayfinder(h5, refant):
    from scipy.fftpack import fft, fftfreq
    H = tables.open_file(h5)
    upsample_factor = 10

    # reference to refant
    refant_idx = np.where(H.root.sol000.phase000.ant[:] == refant)
    phase = H.root.sol000.phase000.val[:]
    phasen = phase - phase[:, :, refant_idx[0], :]

    phasecomplex = np.exp(phasen * 1j)
    freq = H.root.sol000.phase000.freq[:]
    timeaxis = H.root.sol000.phase000.time[:]
    timeaxis = timeaxis - np.min(timeaxis)

    delayaxis = fftfreq(upsample_factor * freq.size,
                        d=np.abs(freq[1] - freq[0]) / float(upsample_factor))

    for ant_id, ant in enumerate(H.root.sol000.phase000.ant[:]):
        delay = 0.0 * H.root.sol000.phase000.time[:]
        print('FFT delay finding for:', ant)
        for time_id, time in enumerate(H.root.sol000.phase000.time[:]):
            delay[time_id] = delayaxis[np.argmax(np.abs(fft(phasecomplex[time_id, :, ant_id, 0], n=upsample_factor * len(freq))))]
        plt.plot(timeaxis/3600., delay*1e9)
    plt.ylim(-2e-6 * 1e9, 2e-6 * 1e9)
    plt.ylabel('Delay [ns]')
    plt.xlabel('Time [hr]')
    # plt.title(ant)
    plt.show()
    H.close()
    return


def check_strlist_or_intlist(argin):
    ''' Check if the argument is a list of integers or a list of strings with correct formatting.

    Args:
        argin (str): input string to check.
    Returns:
        arg (list): properly formatted list extracted from the output.
    '''

    # check if input is a list and make proper list format
    arg = ast.literal_eval(argin)
    if type(arg) is not list:
        raise argparse.ArgumentTypeError("Argument \"%s\" is not a list" % (argin))

    # check for integer list
    if all([isinstance(item, int) for item in arg]):
        if np.min(arg) < 1:
            raise argparse.ArgumentTypeError("solint_list cannot contain values smaller than 1")
        else:
            return arg
    # so not an integer list, so now check for string list
    if all([isinstance(item, str) for item in arg]):
        # check if string contains numbers
        for item2 in arg:
            # print(item2)
            if not any([ch.isdigit() for ch in item2]):
                raise argparse.ArgumentTypeError("solint_list needs to contain some number characters, not only units")
            # check in the number in there is smaller than 1
            # print(re.findall(r'[+-]?\d+(?:\.\d+)?',item2)[0])
            if float(re.findall(r'[+-]?\d+(?:\.\d+)?', item2)[0]) <= 0.0:
                raise argparse.ArgumentTypeError("numbers in solint_list cannot be smaller than zero")
            # check if string contains proper time formatting
            if ('hr' in item2) or ('min' in item2) or ('sec' in item2) or ('h' in item2) or ('m' in item2) or ('s' in item2) or ('hour' in item2) or ('minute' in item2) or ('second' in item2):
                pass
            else:
                raise argparse.ArgumentTypeError("solint_list needs to have proper time formatting (h(r), m(in), s(ec))")
        return arg
    else:
        raise argparse.ArgumentTypeError("solint_list must be a list of positive integers or a list of properly formatted strings")


def compute_distance_to_pointingcenter(msname, HBAorLBA='HBA', warn=False, returnval=False, dologging=True):
    ''' Compute distance to the pointing center. This is mainly useful for international baseline observation to check of the delay calibrator is not too far away.

    Args:
        msname (str): path to the measurement set to check.
        HBAorLBA (str): whether the data is HBA or LBA data. Can be 'HBA' or 'LBA'.
    Returns:
        None
    '''
    if HBAorLBA == 'HBA':
        warn_distance = 1.25
    if HBAorLBA == 'LBA':
        warn_distance = 3.0
    if HBAorLBA == 'other':
        warn_distance = 3.0

    field_table = pt.table(msname + '::FIELD', ack=False)
    direction = field_table.getcol('PHASE_DIR').squeeze()
    ref_direction = field_table.getcol('REFERENCE_DIR').squeeze()
    field_table.close()
    c1 = SkyCoord(direction[0] * units.radian, direction[1] * units.radian, frame='icrs')
    c2 = SkyCoord(ref_direction[0] * units.radian, ref_direction[1] * units.radian, frame='icrs')
    seperation = c1.separation(c2).to(units.deg)
    print('Distance to pointing center', seperation)
    if dologging:
       logger.info('Distance to pointing center:' + str(seperation))
    if (seperation.value > warn_distance) and warn:
        print('Warning: you are trying to selfcal a source far from the pointing, this is probably going to produce bad results')
        logger.warning('Warning: you are trying to selfcal a source far from the pointing, this is probably going to produce bad results')
    if returnval:
       return seperation.value  
    return


def remove_flagged_data_startend(mslist):
    ''' Trim flagged data at the start and end of the observation.

    Args:
        mslist (list): list of measurement sets to iterate over.
    Returns:
        mslistout (list): list of measurement sets with flagged data trimmed.
    '''

    taql = 'taql'
    mslistout = []

    for ms in mslist:
        t = pt.table(ms, readonly=True, ack=False)
        alltimes = t.getcol('TIME')
        alltimes = np.unique(alltimes)

        newt = pt.taql('select TIME from $t where FLAG[0,0]=False')
        time = newt.getcol('TIME')
        time = np.unique(time)

        print('There are', len(alltimes), 'times')
        print('There are', len(time), 'unique unflagged times')

        print('First unflagged time', np.min(time))
        print('Last unflagged time', np.max(time))

        goodstartid = np.where(alltimes == np.min(time))[0][0]
        goodendid = np.where(alltimes == np.max(time))[0][0] + 1

        print(goodstartid, goodendid)
        t.close()

        if (goodstartid != 0) or (goodendid != len(alltimes)):
            msout = ms + '.cut'
            if os.path.isdir(msout):
                os.system('rm -rf ' + msout)

            cmd = taql + " ' select from " + ms + " where TIME in (select distinct TIME from " + ms
            cmd += " offset " + str(goodstartid)
            cmd += " limit " + str((goodendid - goodstartid)) + ") giving "
            cmd += msout + " as plain'"
            print(cmd)
            run(cmd)
            mslistout.append(msout)
        else:
            mslistout.append(ms)
    return mslistout


def check_code_is_uptodate():
    ''' Check if the code is at its latest version.
    
    From https://jckantor.github.io/cbe61622/A.02-Downloading_Python_source_files_from_github.html
    '''
    import filecmp
    url = "https://raw.githubusercontent.com/jurjen93/lofar_helpers/master/h5_merger.py"

    try:
        result = subprocess.run(["wget", "--no-cache", "--backups=1", url, "--output-document=tmpfile"], stderr=subprocess.PIPE, stdout=subprocess.PIPE)
        print(result.stderr.decode("utf-8"))
    except:  # for Python versions 3.5 and lower
        os.system("wget --no-cache --backups=1 " + url + " --output-document=tmpfile")

    if not filecmp.cmp('h5_merger.py', 'tmpfile'):
        print('Warning, you are using an old version of h5_merger.py')
        print('Download the latest version from https://github.com/jurjen93/lofar_helpers')
        logger.warning('Using an old h5_merger.py version, download the latest one from https://github.com/jurjen93/lofar_helpers')
        time.sleep(1)

    with open('h5_merger.py') as f:
        if 'propagate_flags' not in f.read():
            print("Update h5_merger, this version misses the propagate_flags option")
            raise Exception("Update h5_merger, this version misses the propagate_flags option")
    return


def force_close(h5):
    ''' Close indivdual HDF5 file by force.

    Args:
        h5 (str): name of the h5parm to close.
    Returns:
        None
    '''
    h5s = list(tables.file._open_files._handlers)
    for h in h5s:
        if h.filename == h5:
            logger.warning('force_close: Closed --> ' + h5 + '\n')
            print('Forced (!) closing', h5)
            h.close()
            return
    # sys.stderr.write(h5 + ' not found\n')
    return


def create_mergeparmdbname(mslist, selfcalcycle):
    ''' Merges the h5parms for a given list of measurement sets and selfcal cycle.

    Args:
        mslist (list): list of measurement sets to iterate over.
        selfcalcycle (int): the selfcal cycle for which to merge h5parms.
    Returns:
        parmdblist (list): list of names of the merged h5parms.
    '''
    parmdblist = mslist[:]
    for ms_id, ms in enumerate(mslist):
        parmdblist[ms_id] = 'merged_selfcalcyle' + str(selfcalcycle).zfill(3) + '_' + ms + '.avg.h5'
    print('Created parmdblist', parmdblist)
    return parmdblist


def preapplydelay(H5filelist, mslist, applydelaytype, dysco=True):
    ''' Pre-apply a given list of h5parms to a measurement set, specifically intended for post-delay calibration sources.

    Args:
        H5filelist (list): list of h5parms to apply.
        mslist (list): list of measurement set to apply corrections to.
        applydelaytype (str): 'linear' or 'circular' to indicate the polarisation type of the solutions.
        dysco (bool): dysco compress the circular data column or not.
    Returns:
        None
    '''
    for ms in mslist:
        parmdb = time_match_mstoH5(H5filelist, ms)
        # from LINEAR to CIRCULAR
        if applydelaytype == 'circular':
            scriptn = 'python lin2circ.py'
            cmdlin2circ = scriptn + ' -i ' + ms + ' --column=DATA --outcol=DATA_CIRC'
            if not dysco:
                cmdlin2circ += ' --nodysco'
            run(cmdlin2circ)
            # APPLY solutions
            applycal(ms, parmdb, msincol='DATA_CIRC', msoutcol='CORRECTED_DATA', dysco=dysco)
        else:
            applycal(ms, parmdb, msincol='DATA', msoutcol='CORRECTED_DATA', dysco=dysco)
        # from CIRCULAR to LINEAR
        if applydelaytype == 'circular':
            cmdlin2circ = scriptn + ' -i ' + ms + ' --column=CORRECTED_DATA --lincol=DATA --back'
            if not dysco:
                cmdlin2circ += ' --nodysco'
            run(cmdlin2circ)
        else:
            run("taql 'update " + ms + " set DATA=CORRECTED_DATA'")
    return


def preapply(H5filelist, mslist, updateDATA=True, dysco=True):
    ''' Pre-apply a given set of corrections to a list of measurement sets.

    Args:
        H5filelist (list): list of h5parms to apply.
        mslist (list): list of measurement set to apply corrections to.
        updateDATA (bool): overwrite DATA with CORRECTED_DATA after solutions have been applied.
        dysco (bool): dysco compress the CORRECTED_DATA column or not.
    Returns:
        None
    '''
    for ms in mslist:
        parmdb = time_match_mstoH5(H5filelist, ms)
        applycal(ms, parmdb, msincol='DATA', msoutcol='CORRECTED_DATA', dysco=dysco)
        if updateDATA:
            run("taql 'update " + ms + " set DATA=CORRECTED_DATA'")
    return


def time_match_mstoH5(H5filelist, ms):
    ''' Find the h5parms, from a given list, that overlap in time with the specified Measurement Set.

    Args:
        H5filelist (list): list of h5parms to apply.
        ms (str): Measurement Set to match h5parms to.
    Returns:
        H5filematch (list): list of h5parms matching the measurement set.
    '''
    t = pt.table(ms)
    timesms = np.unique(t.getcol('TIME'))
    t.close()
    H5filematch = None

    for H5file in H5filelist:
        H = tables.open_file(H5file, mode='r')    
        try:
            times = H.root.sol000.amplitude000.time[:]
        except:
            pass
        try:
            times = H.root.sol000.rotation000.time[:]
        except:
            pass 
        try:
            times = H.root.sol000.phase000.time[:]
        except:
            pass      
        try:
            times = H.root.sol000.tec000.time[:]
        except:
            pass
        if np.median(times) >= np.min(timesms) and np.median(times) <= np.max(timesms):
            print(H5file, 'overlaps in time with', ms)
            H5filematch = H5file
        H.close()

    if H5filematch is None:
        print('Cannot find matching H5file and ms')
        raise Exception('Cannot find matching H5file and ms')

    return H5filematch


def logbasicinfo(args, fitsmask, mslist, version, inputsysargs):
    ''' Prints basic information to the screen.

    Args:
        args (iterable): list of input arguments.
        fitsmask (str): name of the user-provided FITS mask.
        mslist (list): list of input measurement sets.
    '''
    logger.info(' '.join(map(str,inputsysargs)))

    logger.info('Version:                   ' + str(version))
    logger.info('Imsize:                    ' + str(args['imsize']))
    logger.info('Pixelscale:                ' + str(args['pixelscale']))
    logger.info('Niter:                     ' + str(args['niter']))
    logger.info('Uvmin:                     ' + str(args['uvmin']  ))
    logger.info('Multiscale:                ' + str(args['multiscale']))
    logger.info('Beam correction:           ' + str(args['beamcor']))
    logger.info('IDG:                       ' + str(args['idg']))
    logger.info('Widefield:                 ' + str(args['forwidefield']))
    logger.info('Flagslowamprms:            ' + str(args['flagslowamprms']))
    logger.info('flagslowphaserms:          ' + str(args['flagslowphaserms']))
    logger.info('Do linear:                 ' + str(args['dolinear']))
    logger.info('Do circular:               ' + str(args['docircular']))
    if args['boxfile'] is not None:
        logger.info('Bobxfile:                  ' + args['boxfile'])
    logger.info('Mslist:                    ' + ' '.join(map(str,mslist)))
    logger.info('User specified clean mask: ' + str(fitsmask))
    logger.info('Threshold for MakeMask:    ' + str(args['maskthreshold']))
    logger.info('Briggs robust:             ' + str(args['robust']))
    return


def max_area_of_island(grid):
    ''' Calculate the area of an island.

    Args:
        grid (ndarray): input image.
    Returns:
        None
    '''
    rlen, clen = len(grid), len(grid[0])

    def neighbors(r, c):
        ''' Generate the neighbor coordinates of the given row and column that are within the bounds of the grid.

        Args:
            r (int): row coordinate.
            c (int): column coordinate.
        '''
        for dr, dc in [(-1, 0), (1, 0), (0, -1), (0, 1)]:
            if (0 <= r + dr < rlen) and (0 <= c + dc < clen):
                yield r + dr, c + dc

    visited = [[False] * clen for _ in range(rlen)]

    def island_size(r, c):
        ''' Find the area of the land connected to the given coordinate.

        Return 0 if the coordinate is water or if it has already been explored in a previous call to island_size().

        Args:
            r (int): row coordinate.
            c (int): column coordinate.
        '''
        if grid[r][c] == 0 or visited[r][c]:
            return 0
        area = 1
        stack = [(r, c)]
        visited[r][c] = True
        while stack:
            for r, c in neighbors(*stack.pop()):
                if grid[r][c] and not visited[r][c]:
                    stack.append((r, c))
                    visited[r][c] = True
                    area += 1
        return area
    return max(island_size(r, c) for r, c in product(range(rlen), range(clen)))


def getlargestislandsize(fitsmask):
    ''' Find the largest island in a given FITS mask.

    Args:
        fitsmask (str): path to the FITS file.
    Returns:
        max_area (float): area of the largest island.
    '''
    hdulist = fits.open(fitsmask)
    data = hdulist[0].data
    max_area = max_area_of_island(data[0, 0, :, :])
    hdulist.close()
    return max_area


def create_phase_slope(inmslist, incol='DATA', outcol='DATA_PHASE_SLOPE', \
                       ampnorm=False, dysco=False, testscfactor=1., crosshandtozero=True):
    ''' Creates a new column to solve for a phase slope from.

    Args:
        inmslist (list): list of input measurement sets.
        incol (str): name of the input column to copy (meta)data from.
        outcol (str): name of the output column that will be created.
        ampnorm (bool): If True, only takes phases from the input visibilities and sets their amplitude to 1.
        dysco (bool): dysco compress the output column.
    Returns:
        None
    '''
    if not isinstance(inmslist, list):
        inmslist = [inmslist]
    for ms in inmslist:
        t = pt.table(ms, readonly=False, ack=True)
        if outcol not in t.colnames():
            print('Adding', outcol, 'to', ms)
            desc = t.getcoldesc(incol)
            newdesc = pt.makecoldesc(outcol, desc)
            newdmi = t.getdminfo(incol)
            if dysco:
                newdmi['NAME'] = 'Dysco' + outcol
            else:
                newdmi['NAME'] = outcol
            t.addcols(newdesc, newdmi)
        data = t.getcol(incol)
        dataslope = np.copy(data)
        for ff in range(data.shape[1] - 1):
            if ampnorm:
                dataslope[:, ff, 0] = np.copy(np.exp(1j*testscfactor*(np.angle(data[:, ff, 0]) - np.angle(data[:, ff + 1, 0]))))
                dataslope[:, ff, 3] = np.copy(np.exp(1j*testscfactor*(np.angle(data[:, ff, 3]) - np.angle(data[:, ff + 1, 3]))))
                if crosshandtozero:
                   dataslope[:, ff, 1] = 0.*np.exp(1j*0)
                   dataslope[:, ff, 2] = 0.*np.exp(1j*0)
            else:
                dataslope[:, ff, 0] = np.copy(np.abs(data[:, ff, 0]) * np.exp(1j * testscfactor*(np.angle(data[:, ff, 0]) - np.angle(data[:, ff + 1, 0]))))
                dataslope[:, ff, 3] = np.copy(np.abs(data[:, ff, 3]) * np.exp(1j * testscfactor*(np.angle(data[:, ff, 3]) - np.angle(data[:, ff + 1, 3]))))
                if crosshandtozero:
                   dataslope[:, ff, 1] = 0.*np.exp(1j*0)
                   dataslope[:, ff, 2] = 0.*np.exp(1j*0)

        # last freq set to second to last freq because difference reduces length of freq axis with one
        dataslope[:, -1, :] = np.copy(dataslope[:, -2, :])
        t.putcol(outcol, dataslope)
        t.close()
        # print( np.nanmedian(np.abs(data)))
        # print( np.nanmedian(np.abs(dataslope)))
        del data, dataslope
    return

def stackwrapper(inmslist: list, msout: str = 'stack.MS', column_to_normalise: str = 'DATA') -> None:
    ''' Wraps the stack
    Arguments
    ---------
    inmslist : list
        List of input MSes to stack
    '''
    if type(inmslist) is not list:
        raise TypeError('Incorrect input type for inmslist')
    print('Adding weight spectrum to stack')
    #create_weight_spectrum(inmslist, 'WEIGHT_SPECTRUM_PM', updateweights=True,\
    create_weight_spectrum(inmslist, 'WEIGHT_SPECTRUM_PM', updateweights=True,\
                            updateweights_from_thiscolumn='MODEL_DATA')
    print('Attempting to normalise data to point source')
    normalize_data_bymodel(inmslist, outcol='DATA_NORM', incol=column_to_normalise, \
                          modelcol='MODEL_DATA')
    print('Stacking datasets')
    import time
    start = time.time()
    stackMS_taql(inmslist, outputms=msout, incol='DATA_NORM', outcol='DATA', weightref='WEIGHT_SPECTRUM_PM')
    #stackMS(inmslist, outputms='stack.MS', incol='DATA_NORM', outcol='DATA', weightref='WEIGHT_SPECTRUM_PM')
    now = time.time()
    print(f'Stacking took {now - start} seconds')

def create_weight_spectrum_modelratio(inmslist, outweightcol, updateweights=False,\
                            originalmodel='MODEL_DATA',newmodel='MODEL_DATA_PHASE_SLOPE', backup=True):
   if not isinstance(inmslist, list):
        inmslist = [inmslist]
   stepsize = 1000000
   for ms in inmslist:
      t = pt.table(ms, readonly=False, ack=True)
      weightref = 'WEIGHT_SPECTRUM'
      if 'WEIGHT_SPECTRUM_SOLVE' in t.colnames():
         weightref = 'WEIGHT_SPECTRUM_SOLVE' # for LoTSS-DR2 datasets 
      if backup and ('WEIGHT_SPECTRUM_BACKUP' not in t.colnames()):
         desc = t.getcoldesc(weightref)
         desc['name'] = 'WEIGHT_SPECTRUM_BACKUP'
         t.addcols(desc)
        
      if outweightcol not in t.colnames():
         print('Adding', outweightcol, 'to', ms, 'based on', weightref)
         desc = t.getcoldesc(weightref)
         desc['name'] = outweightcol
         t.addcols(desc)
      #os.system('DP3 msin={ms} msin.datacolumn={weightref} msout=. msout.datacolumn={outweightcol} steps=[]')
      for row in range(0,t.nrows(),stepsize):   
         print("Doing {} out of {}, (step: {})".format(row, t.nrows(), stepsize))
         weight = t.getcol(weightref,startrow=row,nrow=stepsize,rowincr=1).astype(np.float64)
         if updateweights and originalmodel in t.colnames() and newmodel in t.colnames():
            model_orig = t.getcol(originalmodel,startrow=row,nrow=stepsize,rowincr=1).astype(np.complex256)
            model_new = t.getcol(newmodel,startrow=row,nrow=stepsize,rowincr=1).astype(np.complex256)
            
            model_orig[:,:,1] = model_orig[:,:,0] # make everything XX/RR
            model_orig[:,:,2] = model_orig[:,:,0] # make everything XX/RR
            model_orig[:,:,3] = model_orig[:,:,0] # make everything XX/RR
            model_new[:,:,1] = model_new[:,:,0] # make everything XX/RR
            model_new[:,:,2] = model_new[:,:,0] # make everything XX/RR
            model_new[:,:,3] = model_new[:,:,0] # make everything XX/RR
         else: 
            model_orig = 1.
            model_new = 1.
         print('Mean weights input',np.nanmean(weight))
         print('Mean weights change factor',np.nanmean((np.abs(model_orig))**2))
         t.putcol(outweightcol, (weight*(np.abs(model_orig/model_new))**2).astype(np.float64), startrow=row, nrow=stepsize, rowincr=1)
         #print(weight.shape, model_orig.shape)
      t.close()
      print()
      del weight, model_orig, model_new


def create_weight_spectrum(inmslist, outweightcol, updateweights=False,\
                            updateweights_from_thiscolumn='MODEL_DATA', backup=True):
   if not isinstance(inmslist, list):
        inmslist = [inmslist]
   stepsize = 1000000
   for ms in inmslist:
      t = pt.table(ms, readonly=False, ack=True)
      weightref = 'WEIGHT_SPECTRUM'
      if 'WEIGHT_SPECTRUM_SOLVE' in t.colnames():
         weightref = 'WEIGHT_SPECTRUM_SOLVE' # for LoTSS-DR2 datasets 
      if backup and ('WEIGHT_SPECTRUM_BACKUP' not in t.colnames()):
         desc = t.getcoldesc(weightref)
         desc['name'] = 'WEIGHT_SPECTRUM_BACKUP'
         t.addcols(desc)
        
      if outweightcol not in t.colnames():
         print('Adding', outweightcol, 'to', ms, 'based on', weightref)
         desc = t.getcoldesc(weightref)
         desc['name'] = outweightcol
         t.addcols(desc)
      #os.system('DP3 msin={ms} msin.datacolumn={weightref} msout=. msout.datacolumn={outweightcol} steps=[]')
      for row in range(0,t.nrows(),stepsize):   
         print("Doing {} out of {}, (step: {})".format(row, t.nrows(), stepsize))
         weight = t.getcol(weightref,startrow=row,nrow=stepsize,rowincr=1).astype(np.float64)
         if updateweights and updateweights_from_thiscolumn in t.colnames():
            model = t.getcol(updateweights_from_thiscolumn,startrow=row,nrow=stepsize,rowincr=1).astype(np.complex256)
            model[:,:,1] = model[:,:,0] # make everything XX/RR
            model[:,:,2] = model[:,:,0] # make everything XX/RR
            model[:,:,3] = model[:,:,0] # make everything XX/RR
         else: 
            model = 1.
         print('Mean weights input',np.nanmean(weight))
         print('Mean weights change factor',np.nanmean((np.abs(model))**2))
         t.putcol(outweightcol, (weight*(np.abs(model))**2).astype(np.float64), startrow=row, nrow=stepsize, rowincr=1)
         #print(weight.shape, model.shape)
      t.close()
      print()
      del weight, model

def create_weight_spectrum_taql(inmslist, outweightcol, updateweights=False,\
                            updateweights_from_thiscolumn='MODEL_DATA'):
   if not isinstance(inmslist, list):
        inmslist = [inmslist]
   for ms in inmslist:
      t = pt.table(ms, readonly=False, ack=True)
      weightref = 'WEIGHT_SPECTRUM'
      if 'WEIGHT_SPECTRUM_SOLVE' in t.colnames():
         weightref = 'WEIGHT_SPECTRUM_SOLVE' # for LoTSS-DR2 datasets 
      if outweightcol not in t.colnames():
         print('Adding', outweightcol, 'to', ms, 'based on', weightref)
         desc = t.getcoldesc(weightref)
         desc['name'] = outweightcol
         t.addcols(desc)
      pt.taql(f'UPDATE {ms} SET {updateweights_from_thiscolumn}[,1] = {updateweights_from_thiscolumn}[,0]')
      pt.taql(f'UPDATE {ms} SET {updateweights_from_thiscolumn}[,2] = {updateweights_from_thiscolumn}[,0]')
      pt.taql(f'UPDATE {ms} SET {updateweights_from_thiscolumn}[,3] = {updateweights_from_thiscolumn}[,0]')
      pt.taql(f'UPDATE {ms} SET {outweightcol} = {weightref} * abs({updateweights_from_thiscolumn})**2')
      weightmean = pt.taql('SELECT gmean(WEIGHT_SPECTRUM_PM) AS MEAN FROM ms1_nodysco_pointsource.ms').getcol('MEAN')
      change_factor = pt.taql('SELECT gmean(abs(MODEL_DATA)**2) AS MEAN FROM ms1_nodysco_pointsource.ms').getcol('MEAN')
      print('Mean weights input', weightmean)
      print('Mean weights change factor', change_factor)
      print()

def normalize_data_bymodel(inmslist, outcol='DATA_NORM', incol='DATA', \
                           modelcol='MODEL_DATA', stepsize=1000000):
   """
    Normalize visibility data by model data.

    Args:
        inmslist (str or list of str): List of input Measurement Set(s).
        outcol (str, optional): Name of the output column for normalized data. Default is 'DATA_NORM'.
        incol (str, optional): Name of the input column containing original data. Default is 'DATA'.
        modelcol (str, optional): Name of the model column. Default is 'MODEL_DATA'.
        stepsize (int, optional): Step size for processing rows. Default is 1000000.

    Returns:
        None

   """
   if not isinstance(inmslist, list):
        inmslist = [inmslist]
   for ms in inmslist:
      t = pt.table(ms, readonly=False, ack=True)
      if outcol not in t.colnames():
         print('Adding', outcol, 'to', ms, 'based on', incol)
         desc = t.getcoldesc(incol)
         desc['name'] = outcol
         t.addcols(desc)
      for row in range(0,t.nrows(),stepsize):   
         data = t.getcol(incol, startrow=row, nrow=stepsize, rowincr=1)
         if modelcol in t.colnames():
            model = t.getcol(modelcol, startrow=row, nrow=stepsize, rowincr=1)
            print("Doing {} out of {}, (step: {})".format(row, t.nrows(), stepsize))
            #print(np.max(abs(model)))
            #print(np.min(abs(model)))
            np.divide(data, model, out=data, where=np.abs(model)>0)
            t.putcol(outcol,data,startrow=row,nrow=stepsize,rowincr=1)
         else:
            t.putcol(outcol, data, startrow=row, nrow=stepsize, rowincr=1)
      t.close()

def stackMS(inmslist, outputms='stack.MS', incol='DATA_NORM', outcol='DATA', weightref='WEIGHT_SPECTRUM_PM', outcol_weight='WEIGHT_SPECTRUM', stepsize=1000000):
    """ Stack a list of MSes.
    
    Arguments
    ---------
    inmslist : list
        
    """
    print(f'Using input column {incol}')
    print(f'Writing to {outputms}')
    if not isinstance(inmslist, list):
        os.system('cp -r {} {}'.format(inmslist, outputms))
        print("WARNING: Stacking was performed on only one MS, so not really a meaningful stack")
        return True
    if os.path.isdir(outputms): # delete MS if it exists
        os.system('rm -rf ' +  outputms)
    os.system('cp -r {} {}'.format(inmslist[0], outputms))
    pt.taql('UPDATE stack.MS SET DATA=DATA_NORM*WEIGHT_SPECTRUM_PM')
    t_main = pt.table(outputms, readonly=False, ack=True)
    for ms in inmslist[1:]:
        t = pt.table(ms, readonly=True, ack=True)        
        for row in range(0, t.nrows(), stepsize):
            print("Doing {} out of {}, (step: {})".format(row, t.nrows(), stepsize))
            weight_main = t_main.getcol(outcol_weight, startrow=row, nrow=stepsize, rowincr=1)
            visibi_main = t_main.getcol(outcol, startrow=row, nrow=stepsize, rowincr=1)
            
            weight = t.getcol(weightref, startrow=row, nrow=stepsize, rowincr=1)
            visibi = t.getcol(incol, startrow=row, nrow=stepsize, rowincr=1)
            
            stacked_vis = visibi_main + (visibi * weight)

            average_wgt = weight + weight_main
            print(f'Writing stacked data to outputcolumn {outcol}')
            t_main.putcol(outcol, stacked_vis, startrow=row, nrow=stepsize, rowincr=1)
            print(f'Writing stacked weights to outputcolumn {outcol_weight}')
            t_main.putcol(outcol_weight, average_wgt, startrow=row, nrow=stepsize, rowincr=1)
        t.close()
    t_main.close()
    # This is probably wrong / not needed.
    pt.taql('UPDATE stack.MS SET DATA=DATA/WEIGHT_SPECTRUM')

def stackMS_taql(inmslist: list, outputms: str ='stack.MS', incol: str ='DATA_NORM', outcol: str ='DATA', weightref: str = 'WEIGHT_SPECTRUM_PM', outcol_weight: str = 'WEIGHT_SPECTRUM'):
    """ Stack a list of MSes.
    
    Arguments
    ---------
    inmslist : list
        List of input Measurement Sets to stack.
    outputms : str
        Name of the output MS.
    incol : str
        Column to stack from the individual MSes.
    outcol : str
        Name of the stacked data column in the output MS.
    weightref : str
        Name of the weight column to stack from the individual files.
    outcol_weight : str
        Name of the stacked weight column in the output MS.
    """
    print(f'Using input column {incol}')
    print(f'Writing to {outputms}')
    if not isinstance(inmslist, list):
        os.system('cp -r {} {}'.format(inmslist, outputms))
        print("WARNING: Stacking was performed on only one MS, so not really a meaningful stack")
        return True
    if os.path.isdir(outputms): # delete MS if it exists
        os.system('rm -rf ' +  outputms)
    os.system('cp -r {} {}'.format(inmslist[0], outputms))

    TAQLSTR = f'UPDATE {outputms} SET DATA = ('
    sum_clause = ' + '.join([f'ms{idx:02d}.DATA_NORM * ms{idx:02d}.WEIGHT_SPECTRUM_PM' for idx in range(1, len(inmslist)+1)])
    sum_weight_clause = ' + '.join([f'ms{idx:02d}.WEIGHT_SPECTRUM_PM' for idx in range(1, len(inmslist)+1)])
    from_clause = ', '.join([f'{ms} AS ms{idx:02d}' for idx,ms in enumerate(inmslist, start=1)])

    taql_query = f'{TAQLSTR} {sum_clause}) / ({sum_weight_clause}) FROM {from_clause}'


    print('Stacking DATA')
    print(taql_query)
    pt.taql(taql_query)

    print('Stacking WEIGHT_SPECTRUM')
    print(f'UPDATE {outputms} SET {outcol_weight} = ({sum_weight_clause}) FROM {from_clause}')
    pt.taql(f'UPDATE {outputms} SET {outcol_weight} = ({sum_weight_clause}) FROM {from_clause}')


def create_phasediff_column(inmslist, incol='DATA', outcol='DATA_CIRCULAR_PHASEDIFF', \
                            dysco=True, stepsize = 1000000):
    ''' Creates a new column for the phase difference solve.

    Args:
        inmslist (list): list of input Measurement Sets.
        incol (str): name of the input column to copy (meta)data from.
        outcol (str): name of the output column that will be created.
        dysco (bool): dysco compress the output column.
        stepsize (int): step size for row looping in casacore tables getcol/putcol 
    '''
    

    if not isinstance(inmslist, list):
        inmslist = [inmslist]
    for ms in inmslist:
        t = pt.table(ms, readonly=False, ack=True)
        if outcol not in t.colnames():
            print('Adding', outcol, 'to', ms)
            desc = t.getcoldesc(incol)
            newdesc = pt.makecoldesc(outcol, desc)
            newdmi = t.getdminfo(incol)
            if dysco:
                newdmi['NAME'] = 'Dysco' + outcol
            else:
                newdmi['NAME'] = outcol
            t.addcols(newdesc, newdmi)


        for row in range(0,t.nrows(),stepsize):
            print("Doing {} out of {}, (step: {})".format(row, t.nrows(), stepsize))
            data = t.getcol(incol,startrow=row,nrow=stepsize,rowincr=1)
            phasediff =  np.copy(np.angle(data[:, :, 0]) - np.angle(data[:, :, 3]))  #RR - LL
            data[:, :, 0] = 0.5 * np.exp(1j * phasediff)  # because I = RR+LL/2 (this is tricky because we work with phase diff)
            data[:, :, 3] = data[:, :, 0]
            t.putcol(outcol, data, startrow=row, nrow=stepsize, rowincr=1)
            del data
            del phasediff
        t.close()
        

    if False:
        # data = t.getcol(incol)
        # t.putcol(outcol, data)
        # t.close()

        time.sleep(2)
        cmd = "taql 'update " + ms + " set "
        cmd += outcol + "[,0]=0.5*EXP(1.0i*(PHASE(" + incol + "[,0])-PHASE(" + incol + "[,3])))'"
        # cmd += outcol + "[,3]=" + outcol + "[,0],"
        # cmd += outcol + "[,1]=0+0i,"
        # cmd += outcol + "[,2]=0+0i'"
        print(cmd)
        run(cmd)
        cmd = "taql 'update " + ms + " set "
        # cmd += outcol + "[,0]=0.5*EXP(1.0i*(PHASE(" + incol + "[,0])-PHASE(" + incol + "[,3]))),"
        cmd += outcol + "[,3]=" + outcol + "[,0]'"
        # cmd += outcol + "[,1]=0+0i,"
        # cmd += outcol + "[,2]=0+0i'"
        print(cmd)
        run(cmd)
    return


def create_phase_column(inmslist, incol='DATA', outcol='DATA_PHASEONLY', dysco=True):
    ''' Creates a new column containging visibilities with their original phase, but unity amplitude.

    Args:
        inmslist (list): list of input Measurement Sets.
        incol (str): name of the input column to copy (meta)data from.
        outcol (str): name of the output column that will be created.
        dysco (bool): dysco compress the output column.
    '''
    if not isinstance(inmslist, list):
        inmslist = [inmslist]
    for ms in inmslist:
        t = pt.table(ms, readonly=False, ack=True)
        if outcol not in t.colnames():
            print('Adding', outcol, 'to', ms)
            desc = t.getcoldesc(incol)
            newdesc = pt.makecoldesc(outcol, desc)
            newdmi = t.getdminfo(incol)
            if dysco:
                newdmi['NAME'] = 'Dysco' + outcol
            else:
                newdmi['NAME'] = outcol
            t.addcols(newdesc, newdmi)
        data = t.getcol(incol)
        data[:, :, 0] = np.copy(np.exp(1j * np.angle(data[:, :, 0])))  # because I = xx+yy/2
        data[:, :, 3] = np.copy(np.exp(1j * np.angle(data[:, :, 3])))  # because I = xx+yy/2
        t.putcol(outcol, data)
        t.close()
        del data
    return


def create_MODEL_DATA_PDIFF(inmslist):
    ''' Creates the MODEL_DATA_PDIFF column.

    Args:
      inmslist (list): list of input Measurement Sets.
    '''
    if not isinstance(inmslist, list):
        inmslist = [inmslist] 
    for ms in inmslist:
        run('DP3 msin=' + ms + ' msout=. msout.datacolumn=MODEL_DATA_PDIFF steps=[]')
        run("taql" + " 'update " + ms + " set MODEL_DATA_PDIFF[,0]=(0.5+0i)'")  # because I = RR+LL/2 (this is tricky because we work with phase diff)
        run("taql" + " 'update " + ms + " set MODEL_DATA_PDIFF[,3]=(0.5+0i)'")  # because I = RR+LL/2 (this is tricky because we work with phase diff)
        run("taql" + " 'update " + ms + " set MODEL_DATA_PDIFF[,1]=(0+0i)'")
        run("taql" + " 'update " + ms + " set MODEL_DATA_PDIFF[,2]=(0+0i)'")


def fulljonesparmdb(h5):
    ''' Checks if a given h5parm has a fulljones solution table as sol000.

    Args:
        h5 (str): path to the h5parm.
    Returns:
        fulljones (bool): whether the sol000 contains fulljones solutions.
    '''
    H=tables.open_file(h5) 
    try:
        pol_p = H.root.sol000.phase000.pol[:]
        pol_a = H.root.sol000.amplitude000.pol[:]
        if len(pol_p) == 4 and len(pol_a) == 4:
            fulljones = True
        else:
            fulljones = False
    except:
        fulljones = False
    H.close()
    return fulljones

def fix_weights_rotationh5(h5parm):
     '''
     DP3 bug causing weird weight values in rotation000, fix these
     https://github.com/lofar-astron/DP3/issues/327
     '''
     H = tables.open_file(h5parm, mode='a')
     weights = H.root.sol000.rotation000.weight[:]
     weights[(weights > 0.0) & (weights < 1.0)] = 1.0
     H.root.sol000.rotation000.weight[:] = np.copy(weights)
     H.flush()
     H.close()
     
     try:
         H = tables.open_file(h5parm, mode='a')
         weights = H.root.sol000.phase000.weight[:]
         weights[(weights > 0.0) & (weights < 1.0)] = 1.0
         H.root.sol000.phase000.weight[:] = np.copy(weights)
         H.flush()
         H.close()
     except:
         pass

     try:
         H.close()  
     except:
         pass
      
     try:
         H = tables.open_file(h5parm, mode='a')
         weights = H.root.sol000.amplitude000.weight[:]
         weights[(weights > 0.0) & (weights < 1.0)] = 1.0
         H.root.sol000.amplitude000.weight[:] = np.copy(weights)
         H.flush()
         H.close()
     except:
         pass

     try:
         H.close()  
     except:
         pass

     return


def h5_has_dir(h5):
   H=tables.open_file(h5)
   try:
       if 'dir' in H.root.sol000.phase000.val.attrs['AXES'].decode().split(','):
           H.close()
           return True
   except:
       pass  
   try:
       if 'dir' in H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(','):
           H.close()
           return True
   except:
       pass  
   try:
       if 'dir' in H.root.sol000.tec000.val.attrs['AXES'].decode().split(','):
           H.close()
           return True
   except:
       pass  
   try:
       if 'dir' in H.root.sol000.rotation000.val.attrs['AXES'].decode().split(','):
           H.close()
           return True
   except:
       pass  
   try:
       if 'dir' in H.root.sol000.rotationmeasure000.val.attrs['AXES'].decode().split(','):
           H.close()
           return True
   except:
       pass  
        
   H.close()
   return False

def reset_gains_noncore(h5parm, keepanntennastr='CS'):
    ''' Resets the gain of non-CS stations to unity amplitude and zero phase.

    Args:
        h5parm (str): path to the H5parm to reset gains of.
        keepantennastr (str): string containing antennas to keep.
    Returns:
      None
    '''
    fulljones = fulljonesparmdb(h5parm)  # True/False
    hasphase = True
    hasamps = True
    hasrotation = True
    hastec = True

    H = tables.open_file(h5parm, mode='a')
    # Figure out if we have phase and/or amplitude solutions.
    try:
        antennas = H.root.sol000.amplitude000.ant[:]
        axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
    except: 
        hasamps = False
    try:
        antennas = H.root.sol000.phase000.ant[:]
        axisn = H.root.sol000.phase000.val.attrs['AXES'].decode().split(',')
    except:
        hasphase = False
    try:
        antennas = H.root.sol000.tec000.ant[:]
        axisn = H.root.sol000.tec000.val.attrs['AXES'].decode().split(',')
    except:
        hastec = False
    try:
        antennas = H.root.sol000.rotation000.ant[:]
        axisn = H.root.sol000.rotation000.val.attrs['AXES'].decode().split(',')
    except:
        hasrotation = False     

    if hasphase:
        phase = H.root.sol000.phase000.val[:]
    if hasamps:  
        amp = H.root.sol000.amplitude000.val[:]
    if hastec:
        tec = H.root.sol000.tec000.val[:]
    if hasrotation:
        rotation = H.root.sol000.rotation000.val[:]

    for antennaid, antenna in enumerate(antennas):
        if antenna[0:2] != keepanntennastr:
            if hasphase:
                antennaxis = axisn.index('ant')  
                axisn = H.root.sol000.phase000.val.attrs['AXES'].decode().split(',')
                print('Resetting phase', antenna, 'Axis entry number', axisn.index('ant'))
                # print(phase[:,:,antennaid,...])
                if antennaxis == 0:
                    phase[antennaid, ...] = 0.0
                if antennaxis == 1:
                    phase[:, antennaid, ...] = 0.0
                if antennaxis == 2:
                    phase[:, :, antennaid, ...] = 0.0
                if antennaxis == 3:
                    phase[:, :, :, antennaid, ...] = 0.0  
                if antennaxis == 4:
                    phase[:, :, :, :, antennaid, ...] = 0.0
                # print(phase[:,:,antennaid,...])  
            if hasamps:
                antennaxis = axisn.index('ant')  
                axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
                print('Resetting amplitude', antenna, 'Axis entry number', axisn.index('ant'))
                if antennaxis == 0:
                    amp[antennaid, ...] = 1.0
                if antennaxis == 1:
                    amp[:, antennaid, ...] = 1.0
                if antennaxis == 2:
                    amp[:, :, antennaid, ...] = 1.0
                if antennaxis == 3:
                    amp[:, :, :, antennaid, ...] = 1.0  
                if antennaxis == 4:
                    amp[:, :, :, :, antennaid, ...] = 1.0
                if fulljones:  
                    amp[..., 1] = 0.0  # XY, assume pol is last axis
                    amp[..., 2] = 0.0  # YX, assume pol is last axis

            if hastec:
                antennaxis = axisn.index('ant')  
                axisn = H.root.sol000.tec000.val.attrs['AXES'].decode().split(',')
                print('Resetting TEC', antenna, 'Axis entry number', axisn.index('ant'))
                if antennaxis == 0:
                    tec[antennaid, ...] = 0.0
                if antennaxis == 1:
                    tec[:, antennaid, ...] = 0.0
                if antennaxis == 2:
                    tec[:, :, antennaid, ...] = 0.0
                if antennaxis == 3:
                    tec[:, :, :, antennaid, ...] = 0.0
                if antennaxis == 4:
                    tec[:, :, :, :, antennaid, ...] = 0.0

            if hasrotation:
                antennaxis = axisn.index('ant')  
                axisn = H.root.sol000.rotation000.val.attrs['AXES'].decode().split(',')
                print('Resetting rotation', antenna, 'Axis entry number', axisn.index('ant'))
                if antennaxis == 0:
                    rotation[antennaid, ...] = 0.0
                if antennaxis == 1:
                    rotation[:, antennaid, ...] = 0.0
                if antennaxis == 2:
                    rotation[:, :, antennaid, ...] = 0.0
                if antennaxis == 3:
                    rotation[:, :, :, antennaid, ...] = 0.0  
                if antennaxis == 4:
                    rotation[:, :, :, :, antennaid, ...] = 0.0     

    # fill values back in
    if hasphase:
        H.root.sol000.phase000.val[:] = np.copy(phase)
    if hasamps:  
        H.root.sol000.amplitude000.val[:] = np.copy(amp)
    if hastec:
        H.root.sol000.tec000.val[:] = np.copy(tec) 
    if hasrotation:
        H.root.sol000.rotation000.val[:] = np.copy(rotation)

    H.flush()
    H.close()
    return

# reset_gains_noncore('merged_selfcalcyle11_testquick260.ms.avg.h5')
# sys.exit()


def phaseup(msinlist, datacolumn='DATA', superstation='core', start=0, dysco=True):
    ''' Phase up stations into a superstation.

    Args:
        msinlist (list): list of input Measurement Sets to iterate over.
        datacolumn (str): the input data column to phase up data from.
        superstation (str): stations to phase up. Can be 'core' or 'superterp'.
        start (int): selfcal cylce that is being started from. Phaseup will only occur if start == 0.
        dysco (bool): dysco compress the output dataset.
    Returns:
        msoutlist (list): list of output Measurement Sets.
    '''
    msoutlist = []
    for ms in msinlist:
        msout = ms + '.phaseup'
        msoutlist.append(msout)

        cmd = "DP3 msin=" + ms + " steps=[add,filter] "
        cmd += "msout=" + msout + " msin.datacolumn=" + datacolumn + " "
        cmd += "filter.type=filter filter.remove=True "
        if dysco:
            cmd += "msout.storagemanager=dysco "
            cmd += 'msout.storagemanager.weightbitrate=16 '
        cmd += "add.type=stationadder "
        if superstation == 'core':
            cmd += "add.stations={ST001:'CS*'} filter.baseline='!CS*&&*' "
        if superstation == 'superterp':
            cmd += "add.stations={ST001:'CS00[2-7]*'} filter.baseline='!CS00[2-7]*&&*' "

        if start == 0:  # only phaseup if start selfcal from cycle 0, so skip for a restart
            if os.path.isdir(msout):
                os.system('rm -rf ' + msout)
            print(cmd)
            run(cmd)
    return msoutlist


def findfreqavg(ms, imsize, bwsmearlimit=1.0):
    ''' Find the frequency averaging factor for a Measurement Set given a bandwidth smearing constraint.

    Args:
        ms (str): path to the Measurement Set.
        imsize (float): size of the image in pixels.
        bwsmearlimit (float): the fractional acceptable bandwidth smearing.
    Returns:
        avgfactor (int): the frequency averaging factor for the Measurement Set.
    '''
    t = pt.table(ms + '/SPECTRAL_WINDOW',ack=False)
    bwsmear = bandwidthsmearing(np.median(t.getcol('CHAN_WIDTH')), np.min(t.getcol('CHAN_FREQ')[0]), float(imsize), verbose=False)
    nfreq = len(t.getcol('CHAN_FREQ')[0])
    t.close()
    avgfactor = 0

    for count in range(2, 21):  # try average values between 2 to 20
        if bwsmear < (bwsmearlimit / float(count)):  # factor X avg
            if nfreq % count == 0:
                avgfactor = count
    return avgfactor


def compute_markersize(H5file):
    ''' Computes matplotlib markersize for an H5parm.

    Args:
        H5file (str): path to an H5parm.
    Returns:
        markersize (int): marker size.
    '''
    ntimes = ntimesH5(H5file)
    markersize = 2
    if ntimes < 450:
        markersize = 4
    if ntimes < 100:
        markersize = 10
    if ntimes < 50:
        markersize = 15      
    return markersize


def ntimesH5(H5file):
    ''' Returns the number of timeslots in an H5parm.

    Args:
        H5file (str): path to H5parm.
    Returns:
        times (int): length of the time axis.
    '''
    H = tables.open_file(H5file, mode='r')
    try:
        times = H.root.sol000.amplitude000.time[:]
    except: # apparently no slow amps available
        try:
            times = H.root.sol000.phase000.time[:]
        except:
            try:  
                times = H.root.sol000.tec000.time[:]    
            except:  
                try:
                    times = H.root.sol000.rotationmeasure000.time[:]    
                except:
                    try:
                        times = H.root.sol000.rotation000.time[:]
                    except:    
                        print('No amplitude000,phase000, tec000, rotation000, or rotationmeasure000 solutions found')  
                        raise Exception('No amplitude000,phase000, tec000, rotation000, or rotationmeasure000 solutions found')
    H.close()
    return len(times)


def create_backup_flag_col(ms, flagcolname='FLAG_BACKUP'):
    ''' Creates a backup of the FLAG column.

    Args:
        ms (str): path to the Measurement Set.
        flagcolname (str): name of the output column.
    Returns:
        None
    '''
    cname = 'FLAG'
    flags = []
    t = pt.table(ms, readonly=False, ack=True)
    if flagcolname not in t.colnames():
        flags = t.getcol('FLAG')
        print('Adding flagging column', flagcolname, 'to', ms)
        desc = t.getcoldesc(cname)
        newdesc = pt.makecoldesc(flagcolname, desc)
        newdmi = t.getdminfo(cname)
        newdmi['NAME'] = flagcolname
        t.addcols(newdesc, newdmi)
        t.putcol(flagcolname, flags)
    t.close()
    del flags
    return


def check_phaseup_station(ms):
    ''' Check if the Measurement Set contains a superstation.

    Args:
        ms (str): path to the Measurement Set.
    Returns:
        None
    '''
    t = pt.table(ms + '/ANTENNA', ack=False)
    antennasms = list(t.getcol('NAME'))
    t.close()
    substr = 'ST'  # to check if a a superstation is present, assume this 'ST' string, usually ST001
    hassuperstation = any(substr in mystring for mystring in antennasms)
    print('Contains superstation?', hassuperstation)
    return hassuperstation

def checklongbaseline(ms):
    ''' Check if the Measurement Set contains international stations.

    Args:
        ms (str): path to the Measurement Set.
    Returns:
        None
    '''
    t = pt.table(ms + '/ANTENNA', ack=False)
    antennasms = list(t.getcol('NAME'))
    t.close()
    substr = 'DE'  # to check if a German station is present, if yes assume this is long baseline data
    haslongbaselines = any(substr in mystring for mystring in antennasms)
    print('Contains long baselines?', haslongbaselines)
    return haslongbaselines


def average(mslist, freqstep, timestep=None, start=0, msinnchan=None, msinstartchan=0., \
            phaseshiftbox=None, msinntimes=None, makecopy=False, \
            makesubtract=False, delaycal=False, freqresolution='195.3125kHz',\
            dysco=True, cmakephasediffstat=False, dataincolumn='DATA', \
            removeinternational=False, removemostlyflaggedstations=False):
    ''' Average and/or phase-shift a list of Measurement Sets.

    Args:
        mslist (list): list of Measurement Sets to iterate over.
        freqstep (int): the number of frequency slots to average.
        timestep (int): the number of time slots to average.
        start (int): selfcal cycle that is being started from.
        msinnchan (int): number of channels to take from the input Measurement Set.
        msinstartchan (int): start chanel for msinnchan
        phaseshiftbox (str): path to a DS9 region file to phaseshift to.
        msinntimes (int): number of timeslots to take from the input Measurement Set.
        makecopy (bool): appends '.copy' when making a copy of a Measurement Set.
        dysco (bool): Dysco compress the output Measurement Set.
    Returns:
        outmslist (list): list of output Measurement Sets.
    '''
    # sanity check
    if len(mslist) != len(freqstep):
        print('Hmm, made a mistake with freqstep?')
        raise Exception('len(mslist) != len(freqstep)')

    outmslist = []
    for ms_id, ms in enumerate(mslist):
        if (int(''.join([i for i in str(freqstep[ms_id]) if i.isdigit()])) > 0) or (timestep is not None) or (
                msinnchan is not None) or \
                (phaseshiftbox is not None) or (msinntimes is not None) \
                or removeinternational or removemostlyflaggedstations:  # if this is True then average
            
            # set this first, change name if needed below
            msout = ms + '.avg'
            if makecopy:
                msout = ms + '.copy'
            if makesubtract:
                msout = ms + '.subtracted'
            if cmakephasediffstat:
                msout =  ms + '.avgphasediffstat'
            
            msout = os.path.basename(msout)
            cmd = 'DP3 msin=' + ms + ' av.type=averager '
            cmd += 'msout=' + msout + ' msin.weightcolumn=WEIGHT_SPECTRUM '
            cmd += 'msin.datacolumn=' + dataincolumn + ' '
            if dysco:
                cmd += 'msout.storagemanager=dysco '
                cmd += 'msout.storagemanager.weightbitrate=16 '
            if phaseshiftbox is not None:
                if removeinternational:
                    cmd += ' steps=[f,shift,av] '
                    cmd += " f.type=filter f.baseline='[CR]S*&' f.remove=True "
                else:
                    cmd += ' steps=[shift,av] '
                cmd += ' shift.type=phaseshifter '
                cmd += ' shift.phasecenter=\[' + getregionboxcenter(phaseshiftbox) + '\] '
            else:
                if removeinternational:
                    cmd += ' steps=[f,av] '
                    cmd += " f.type=filter f.baseline='[CR]S*&' f.remove=True "
                else:
                    cmd += ' steps=[av] '
            if removemostlyflaggedstations: 
                flagstationlist = return_antennas_highflaggingpercentage(ms)
                if len(flagstationlist) > 0:
                    baselinestr = filter_baseline_str_removestations(flagstationlist)
                    cmd += 'fs.type=filter fs.baseline=' + baselinestr + ' fs.remove=True '
                    cmd = cmd.replace('steps=[', 'steps=[fs,')          

            # freqavg
            if freqstep[ms_id] is not None:
                if str(freqstep[ms_id]).isdigit():
                    cmd += 'av.freqstep=' + str(freqstep[ms_id]) + ' '
                else:
                    freqstepstr = ''.join([i for i in freqstep[ms_id] if not i.isalpha()])
                    freqstepstrnot = ''.join([i for i in freqstep[ms_id] if i.isalpha()])
                    if freqstepstrnot != 'Hz' and freqstepstrnot != 'kHz' and freqstepstrnot != 'MHz':
                        print('For frequency averaging only units of (k/M)Hz are allowed, used:', freqstepstrnot)
                        raise Exception('For frequency averaging only units of " (k/M)Hz" are allowed')
                    cmd += 'av.freqresolution=' + str(freqstep[ms_id]) + ' '

                    # timeavg
            if timestep is not None:
                if str(timestep).isdigit():
                    cmd += 'av.timestep=' + str(int(timestep)) + ' '
                else:
                    timestepstr = ''.join([i for i in timestep if not i.isalpha()])
                    timestepstrnot = ''.join([i for i in timestep if i.isalpha()])
                    if timestepstrnot != 's' and timestepstrnot != 'sec':
                        print('For time averaging only units of s(ec) are allowed, used:', timestepstrnot)
                        raise Exception('For time averaging only units of "s(ec)" are allowed')
                    cmd += 'av.timeresolution=' + str(timestepstr) + ' '

            if msinnchan is not None:
                cmd += 'msin.nchan=' + str(msinnchan) + ' '
                cmd += 'msin.startchan=' + str(msinstartchan) + ' '
            if msinntimes is not None:
                cmd += 'msin.ntimes=' + str(msinntimes) + ' '
            if start == 0:
                print('Average with default WEIGHT_SPECTRUM:', cmd)
                if os.path.isdir(msout):
                    os.system('rm -rf ' + msout)
                run(cmd)

            msouttmp = ms + '.avgtmp'
            msouttmp = os.path.basename(msouttmp)
            cmd = 'DP3 msin=' + ms + ' av.type=averager '
            if removeinternational:
                cmd += ' steps=[f,av] '
                cmd += " f.type=filter f.baseline='[CR]S*&' f.remove=True "
            else:
                cmd += ' steps=[av] ' 
            if dysco:
                cmd += ' msout.storagemanager=dysco '
                cmd += 'msout.storagemanager.weightbitrate=16 '
            cmd += 'msout=' + msouttmp + ' msin.weightcolumn=WEIGHT_SPECTRUM_SOLVE '
            if removemostlyflaggedstations: 
                # step below can be skipped since flagstationlist was already made/defined
                #flagstationlist = return_antennas_highflaggingpercentage(ms)
                if len(flagstationlist) > 0:
                    baselinestr = filter_baseline_str_removestations(flagstationlist)
                    cmd += 'fs.type=filter fs.baseline=' + baselinestr + ' fs.remove=True '
                    cmd = cmd.replace('steps=[', 'steps=[fs,')
            
            # freqavg
            if freqstep[ms_id] is not None:
                if str(freqstep[ms_id]).isdigit():
                    cmd += 'av.freqstep=' + str(freqstep[ms_id]) + ' '
                else:
                    freqstepstr = ''.join([i for i in freqstep[ms_id] if not i.isalpha()])
                    freqstepstrnot = ''.join([i for i in freqstep[ms_id] if i.isalpha()])
                    if freqstepstrnot != 'Hz' and freqstepstrnot != 'kHz' and freqstepstrnot != 'MHz':
                        print('For frequency averaging only units of (k/M)Hz are allowed, used:', freqstepstrnot)
                        raise Exception('For frequency averaging only units of " (k/M)Hz" are allowed')
                    cmd += 'av.freqresolution=' + str(freqstep[ms_id]) + ' '

                    # timeavg
            if timestep is not None:
                if str(timestep).isdigit():
                    cmd += 'av.timestep=' + str(int(timestep)) + ' '
                else:
                    timestepstr = ''.join([i for i in timestep if not i.isalpha()])
                    timestepstrnot = ''.join([i for i in timestep if i.isalpha()])
                    if timestepstrnot != 's' and timestepstrnot != 'sec':
                        print('For time averaging only units of s(ec) are allowed, used:', timestepstrnot)
                        raise Exception('For time averaging only units of "s(ec)" are allowed')
                    cmd += 'av.timeresolution=' + str(timestepstr) + ' '
            if msinnchan is not None:
                cmd += 'msin.nchan=' + str(msinnchan) + ' '
                cmd += 'msin.startchan=' + str(msinstartchan) + ' '
            if msinntimes is not None:
                cmd += 'msin.ntimes=' + str(msinntimes) + ' '

            if start == 0:
                t = pt.table(ms)
                if 'WEIGHT_SPECTRUM_SOLVE' in t.colnames():  # check if present otherwise this is not needed
                    t.close()
                    print('Average with default WEIGHT_SPECTRUM_SOLVE:', cmd)
                    if os.path.isdir(msouttmp):
                        os.system('rm -rf ' + msouttmp)
                    run(cmd)

                    # Make a WEIGHT_SPECTRUM from WEIGHT_SPECTRUM_SOLVE
                    t = pt.table(msout, readonly=False)
                    print('Adding WEIGHT_SPECTRUM_SOLVE')
                    desc = t.getcoldesc('WEIGHT_SPECTRUM')
                    desc['name'] = 'WEIGHT_SPECTRUM_SOLVE'
                    t.addcols(desc)

                    t2 = pt.table(msouttmp, readonly=True)
                    imweights = t2.getcol('WEIGHT_SPECTRUM')
                    t.putcol('WEIGHT_SPECTRUM_SOLVE', imweights)

                    # Fill WEIGHT_SPECTRUM with WEIGHT_SPECTRUM from second ms
                    t2.close()
                    t.close()

                    # clean up
                    os.system('rm -rf ' + msouttmp)
                else:
                    t.close()
        
            outmslist.append(msout)
        else:
            outmslist.append(ms)  # so no averaging happened

    return outmslist

def uvmaxflag(msin, uvmax):
  cmd = 'DP3 msin=' + msin  + ' msout=. steps=[f] f.type=uvwflag f.uvlambdamax=' + str(uvmax)
  print(cmd)
  run(cmd)
  return


def tecandphaseplotter(h5, ms, outplotname='plot.png'):
    ''' Make TEC and phase plots.

    Args:
        h5 (str): path to the H5parm to plot.
        ms (str): path to th ecorresponding Measurement Set.
        outplotname (str): name of the output plot.
    Returns:
        None
    '''
    if not os.path.isdir('plotlosoto%s' % os.path.basename(ms)):  # needed because if this is the first plot this directory does not yet exist
        os.system('mkdir plotlosoto%s' % os.path.basename(ms))
    cmd = 'python plot_tecandphase.py  '
    cmd += '--H5file=' + h5 + ' --outfile=plotlosoto%s/%s_nolosoto.png' % (os.path.basename(ms), outplotname)
    print(cmd)
    run(cmd)
    return


def runaoflagger(mslist, strategy=None):
    ''' Run aoglagger on a Measurement Set.

    Args:
        mslist (list): list of Measurement Sets to iterate over.
    Returns:
        None
    '''
    for ms in mslist:
        if strategy is not None:
           cmd = 'aoflagger -strategy ' + strategy + ' ' + ms
        else:
           cmd = 'aoflagger ' + ms
        print(cmd)
        run(cmd)
    return

def build_applycal_dde_cmd(inparmdblist):
   if not isinstance(inparmdblist, list):
      inparmdblist = [inparmdblist]
   cmd = ''  # empy string to start with
   count = 0
   for parmdb in inparmdblist:
      H=tables.open_file(parmdb)
      try:
         tmp = H.root.sol000.phase000.val[:]
         cmd += 'ddecal.applycal.ac' + str(count) + '.parmdb=' + parmdb + ' '
         #cmd += 'ddecal.applycal.ac' + str(count) + '.type=applycal '  
         cmd += 'ddecal.applycal.ac' + str(count) + '.correction=phase000 '
         count = count + 1        
      except:
         pass
      try:
         tmp = H.root.sol000.amplitude000.val[:]
         cmd += 'ddecal.applycal.ac' + str(count) + '.parmdb=' + parmdb + ' '
         #cmd += 'ddecal.applycal.ac' + str(count) + '.type=applycal '  
         cmd += 'ddecal.applycal.ac' + str(count) + '.correction=amplitude000 '
         count = count + 1        
      except:
         pass

      H.close()

   if count < 1:
        print('Something went wrong, cannot build the applycal command. H5 file is valid?')
        raise Exception('Something went wrong, cannot build the applycal command. H5 file is valid?')  
   
   cmd += 'ddecal.applycal.steps=['
   for i in range(count):
     cmd += 'ac' + str(i)
     if i < count - 1:  # to avoid last comma in the steps list
       cmd += ','
   cmd += ']'
    
   return cmd

def corrupt_modelcolumns(ms, h5parm, modeldatacolumns):
    ''' Ccorrupt a list of model data columns with H5parm solutions

    Args:
        ms (str): path to a Measurement Set to apply solutions to.
        h5parm (list/str): H5parms to apply.
        modeldatacolumns (list): Model data columns list, there should be more than one, also these columns should alread exist. Note that input column will be overwritten.
    Returns:
        None
    '''
    
    # check for special case where direction (.dir) names contain DIL.
    special_DIL = False
    H = tables.open_file(h5parm,mode='r')
    try:
        dirnames = H.root.sol000.phase000.dir[:]
    except:
        pass
    try:
        dirnames = H.root.sol000.amplitude000.dir[:]
    except:
        pass
    try:
        dirnames = H.root.sol000.tec000.dir[:]
    except:
        pass      
    try:
        dirnames = H.root.sol000.rotation000.dir[:]
    except:
        pass      
    H.close()
    
    dirnames = dirnames.tolist()
    if 'DIL' in dirnames[0].decode("utf-8"):
        special_DIL = True
        
    for m_id, modelcolumn in enumerate(modeldatacolumns):
        if special_DIL:
          applycal(ms, h5parm, msincol=modelcolumn, msoutcol=modelcolumn, \
                 dysco=False, invert=False, direction=dirnames[m_id].decode("utf-8"))
        else:  
           applycal(ms, h5parm, msincol=modelcolumn, msoutcol=modelcolumn, \
                 dysco=False, invert=False, direction=modelcolumn)
    return    

def applycal(ms, inparmdblist, msincol='DATA',msoutcol='CORRECTED_DATA', \
             msout='.', dysco=True, modeldatacolumns=[], invert=True, direction=None, find_closestdir=False):
    ''' Apply an H5parm to a Measurement Set.

    Args:
        ms (str): path to a Measurement Set to apply solutions to.
        inparmdblist (list): list of H5parms to apply.
        msincol (str): input column to apply solutions to.
        msoutcol (str): output column to store corrected data in.
        msout (str): name of the output Measurement Set.
        dysco (bool): Dysco compress the output Measurement Set.
        modeldatacolumns (list): Model data columns list, if len(modeldatacolumns) > 1 we have a DDE solve
    Returns:
        None
    '''
    if find_closestdir and direction is not None:
       print('Wrong input, you cannot use find_closestdir and set a direction')
       raise Exception('Wrong input, you cannot use find_closestdir and set a direction')
    
    
    if len(modeldatacolumns) > 1:      
        return  
    # to allow both a list or a single file (string)
    if not isinstance(inparmdblist, list):
        inparmdblist = [inparmdblist]

    cmd = 'DP3 numthreads=' + str(np.min([multiprocessing.cpu_count(),8])) + ' msin=' + ms
    cmd += ' msout=' + msout + ' '
    cmd += 'msin.datacolumn=' + msincol + ' '
    if msout == '.':
        cmd += 'msout.datacolumn=' + msoutcol + ' '
    if dysco:
        cmd += 'msout.storagemanager=dysco '
        cmd += 'msout.storagemanager.weightbitrate=16 '
    count = 0
    for parmdb in inparmdblist:
        if find_closestdir:
           direction = make_utf8(find_closest_ddsol(parmdb,ms))
           print('Applying direction:', direction)
        if fulljonesparmdb(parmdb):
            cmd += 'ac' + str(count) + '.parmdb=' + parmdb + ' '
            cmd += 'ac' + str(count) + '.type=applycal '
            cmd += 'ac' + str(count) + '.correction=fulljones '
            cmd += 'ac' + str(count) + '.soltab=[amplitude000,phase000] '
            if not invert:
                cmd += 'ac' + str(count) + '.invert=False '  
            if direction is not None:
                if direction.startswith('MODEL_DATA'): # because then the direction name in the h5 contains bracket strings
                   cmd += 'ac' + str(count) + '.direction=[' + direction + '] '
                else:
                   cmd += 'ac' + str(count) + '.direction=' + direction + ' ' 
            count = count + 1
        else:  
            H=tables.open_file(parmdb) 

            if not invert: # so corrupt, rotation comes first in a rotation+diagonal apply
                try:
                    phase = H.root.sol000.rotation000.val[:]  # note that rotation comes before amplitude&phase for a corrupt (important if the solve was a rotation+diagonal one)
                    cmd += 'ac' + str(count) + '.parmdb=' + parmdb + ' '
                    cmd += 'ac' + str(count) + '.type=applycal '  
                    cmd += 'ac' + str(count) + '.correction=rotation000 '
                    cmd += 'ac' + str(count) + '.invert=False '                 
                    if direction is not None:
                        if direction.startswith('MODEL_DATA'): # because then the direction name in the h5 contains bracket strings
                           cmd += 'ac' + str(count) + '.direction=[' + direction + '] '
                        else:
                           cmd += 'ac' + str(count) + '.direction=' + direction + ' '
                    count = count + 1        
                except:
                    pass

            try:
                phase = H.root.sol000.phase000.val[:]
                cmd += 'ac' + str(count) + '.parmdb=' + parmdb + ' '
                cmd += 'ac' + str(count) + '.type=applycal '
                cmd += 'ac' + str(count) + '.correction=phase000 '
                if not invert:
                    cmd += 'ac' + str(count) + '.invert=False '                 
                if direction is not None:
                    if direction.startswith('MODEL_DATA'): # because then the direction name in the h5 contains bracket strings
                       cmd += 'ac' + str(count) + '.direction=[' + direction + '] '
                    else:
                       cmd += 'ac' + str(count) + '.direction=' + direction + ' '
                count = count + 1    
            except:
                pass

            try:
                phase = H.root.sol000.amplitude000.val[:]
                cmd += 'ac' + str(count) + '.parmdb=' + parmdb + ' '
                cmd += 'ac' + str(count) + '.type=applycal '  
                cmd += 'ac' + str(count) + '.correction=amplitude000 '
                if not invert:
                    cmd += 'ac' + str(count) + '.invert=False '                 
                if direction is not None:
                    if direction.startswith('MODEL_DATA'): # because then the direction name in the h5 contains bracket strings
                       cmd += 'ac' + str(count) + '.direction=[' + direction + '] '
                    else:
                       cmd += 'ac' + str(count) + '.direction=' + direction + ' '
                count = count + 1        
            except:
                pass


            try:
                phase = H.root.sol000.tec000.val[:]
                cmd += 'ac' + str(count) + '.parmdb=' + parmdb + ' '
                cmd += 'ac' + str(count) + '.type=applycal '
                cmd += 'ac' + str(count) + '.correction=tec000 '
                if not invert:
                    cmd += 'ac' + str(count) + '.invert=False '                 
                if direction is not None:
                    if direction.startswith('MODEL_DATA'): # because then the direction name in the h5 contains bracket strings
                       cmd += 'ac' + str(count) + '.direction=[' + direction + '] '
                    else:
                       cmd += 'ac' + str(count) + '.direction=' + direction + ' '                                     
                count = count + 1
            except:
                pass

            if invert: # so applycal, rotation comes last in a rotation+diagonal apply
                try:
                    phase = H.root.sol000.rotation000.val[:]  # note that rotation comes after amplitude&phase for an applycal (important if the solve was a rotation+diagonal one)
                    cmd += 'ac' + str(count) + '.parmdb=' + parmdb + ' '
                    cmd += 'ac' + str(count) + '.type=applycal '  
                    cmd += 'ac' + str(count) + '.correction=rotation000 '
                    cmd += 'ac' + str(count) + '.invert=True '   # by default True but set here as a reminder because order matters for rotation+diagonal in this DP3 step depending on invert=True/False              
                    if direction is not None:
                        if direction.startswith('MODEL_DATA'): # because then the direction name in the h5 contains bracket strings
                           cmd += 'ac' + str(count) + '.direction=[' + direction + '] '
                        else:
                           cmd += 'ac' + str(count) + '.direction=' + direction + ' '
                    count = count + 1        
                except:
                    pass

            H.close()

    if count < 1:
        print('Something went wrong, cannot build the applycal command. H5 file is valid?')
        raise Exception('Something went wrong, cannot build the applycal command. H5 file is valid?')
    # build the steps command
    cmd += 'steps=['
    for i in range(count):
        cmd += 'ac' + str(i)
        if i < count - 1:  # to avoid last comma in the steps list
            cmd += ','
    cmd += ']'

    print('DP3 applycal:', cmd)
    run(cmd,log=True)
    return


def inputchecker(args, mslist):
    ''' Check input validity.
    Args:
        args (dict): argparse inputs.
    '''
    #if args['BLsmooth']:
    #    if True in args['BLsmooth_list']:
    #        print('--BLsmooth cannot be used together with --BLsmooth-list')
    #        raise Exception('--BLsmooth cannot be used together with --BLsmooth-list') 

    # set telescope
    t = pt.table(mslist[0] + '/OBSERVATION', ack=False)
    telescope = t.getcol('TELESCOPE_NAME')[0] 
    t.close()
    #if telescope != 'LOFAR':
    #    check_equidistant_times(mslist)  

    if True in args['BLsmooth_list']:
        if len(args['soltypecycles_list']) != len(args['BLsmooth_list']):
            print('--BLsmooth-list length does not match the length of --soltype-list')
            raise Exception('--BLsmooth-list length does not match the length of --soltype-list') 
    
    for tmp in args['BLsmooth_list']:
       #print(args['BLsmooth_list'])
       if not (isinstance(tmp, bool)):
          print(args['BLsmooth_list'])
          print('--BLsmooth-list is not a list of booleans')
          raise Exception('--BLsmooth-list is not a list of booleans')
    
    if args['stack']: # avoid options that cannot be used when --stack is set
        if args['DDE']:
            print('--dde cannot be used with --stack')
            raise Exception('--dde cannot be used with --stack') 
        if args['compute_phasediffstat']:
            print('--compute-phasediffstat cannot be used with --stack')
            raise Exception('--compute-phasediffstat cannot be used with --stack') 
        if args['fitsmask'] is not None:
            print('--fitsmask cannot be used with --stack')
            raise Exception('--fitsmask cannot be used with --stack')
        if args['update_uvmin']:
            print('--update-uvmin cannot be used with --stack')
            raise Exception('--update-uvmin cannot be used with --stack') 
        if args['update_multiscale']:
            print('--update-multiscale cannot be used with --stack')
            raise Exception('--update-multiscale cannot be used with --stack') 
        if args['remove_outside_center']:
            print('--remove-outside-center cannot be used with --stack')
            raise Exception('--remove-outside-center cannot be used with --stack') 
        if args['auto']:
            print('--auto cannot be used with --stack')
            raise Exception('--auto cannot be used with --stack') 
        if args['tgssfitsimage'] is not None:
            print('--tgssfitsimage cannot be used with --stack')
            raise Exception('--tgssfitsimage cannot be used with --stack')  
        if args['QualityBasedWeights']:
            print('--QualityBasedWeights cannot be used with --stack')
            raise Exception('--QualityBasedWeights cannot be used with --stack')  

    if not args['stack']:
        if type(args['skymodel']) is list:
            print('Skymodel cannot be a list if --stack is not set')
            raise Exception('Skymodel cannot be a list if --stack is not set')  

    if args['DDE'] and args['preapplyH5_list'][0] is not None:
        print('--DDE and --preapplyH5-list cannot be used together')
        raise Exception('--DDE and --preapplyH5_list cannot be used together')

    if args['DDE']:
        for ms in mslist:
             t = pt.table(ms, readonly=True, ack=False) 
             if 'CORRECTED_DATA' in t.colnames(): # not allowed for DDE runs (because solving from DATA and imaging from DATA with an h5)
                 print(ms, 'contains a CORRECTED_DATA column, this is not allowed when using --DDE')
                 raise Exception('CORRECTED_DATA should not be present when using option --DDE')
             t.close()  

    if args['DDE'] and not args['forwidefield']:    
        print('--forwidefield needs to be set in DDE mode')
        raise Exception('--forwidefield needs to be set in DDE mode')

    if args['DDE'] and args['idg']:    
        print('Option --idg cannot be used with option --DDE')
        raise Exception('Option --idg cannot be used with option --DDE')

    if not args['stack']:
        if type(args['skymodelpointsource']) is list:
            print('skymodelpointsource cannot be a list if --stack is not set')
            raise Exception('skymodelpointsource cannot be a list if --stack is not set')  

    if not args['stack']:
        if type(args['wscleanskymodel']) is list:
            print('wscleanskymodel cannot be a list if --stack is not set')
            raise Exception('wscleanskymodel cannot be a list if --stack is not set')  

    # sanity check for resetdir_list input
    if type(args['resetdir_list']) is not list:
        print('--resetdir-list needs to be of type list')
        raise Exception('--resetdir-list needs to be of type list') 
    for resetdir in args['resetdir_list']: # check if it contains None or a integer list-type
        if resetdir is not None:
            if type(resetdir) is not list:
                print('--resetdir-list needs to None list-items, or contain a list of directions_id')
                raise Exception('--resetdir-list needs to None list-items, or contain a list of directions_id')         
            else:
                for dir_id in resetdir:
                    if type(dir_id) is not int:
                        print('--resetdir-list, direction IDs provided need to be integers')
                        raise Exception('--resetdir-list, direction IDs provided need to be integers')                             
                    if dir_id < 0: # if we get here we have an integer
                        print('--resetdir-list, direction IDs provided need to be integers >= 0')
                        raise Exception('--resetdir-list, direction IDs provided need to be integers >= 0')
                    data = ascii.read(args['facetdirections'])
                    if dir_id+1 > len(data): 
                        print('--direction IDs provided for reset is too high for the number of directions provided by ' + args['facetdirections'])
                        raise Exception('--direction IDs provided for reset is too high for the number of directions provided by ' + args['facetdirections'])
                    
    if args['groupms_h5facetspeedup']:
        if not args['DDE']:
            print('--groupms-h5facetspeedup can only be used with --DDE')
            raise Exception('--groupms-h5facetspeedup can only be used with --DDE')
    if args['DDE_predict'] == 'DP3':
        if type(args['fitspectralpol']) is not str:
          if args['fitspectralpol'] < 1:  
            print('--fitspectralpol needs to be turned on, otherwise no skymodel is produced by WSClean and we cannot predict these components with DP3. Put --DDE-predict=WSCLEAN or fitspectralpol>0')
            raise Exception('--Invalid combination of --fitspectralpol and --DDE-predict') 

    if args['uvmin'] is not None and type(args['uvmin']) is not list:
        if args['uvmin'] < 0.0:
            print('--uvmin needs to be positive')
            raise Exception('--uvmin needs to be positive')    
    if args['uvminim'] is not None and type(args['uvminim']) is not list:
       if args['uvminim'] < 0.0:
            print('--uvminim needs to be positive')
            raise Exception('--uvminim needs to be positive')
    if args['uvmaxim'] is not None and args['uvminim'] is not None and type(args['uvmaxim']) is not list and type(args['uvminim']) is not list:
        if args['uvmaxim'] <= args['uvminim']:
            print('--uvmaxim needs to be larger than --uvminim')
            raise Exception('--uvmaxim needs to be larger than --uvminim')
    if args['uvmax'] is not None and args['uvmin'] is not None and type(args['uvmax']) is not list  and type(args['uvmin']) is not list:
        if args['uvmax'] <= args['uvmin']:
            print('--uvmax needs to be larger than --uvmin')
            raise Exception('--uvmaxim needs to be larger than --uvmin')          
    #print(args['uvmax'], args['uvmin'], args['uvminim'],args['uvmaxim'])

    if 'fulljones' in args['soltype_list'] and args['doflagging'] and not args['forwidefield']:
        print('--doflagging is True, cannot be combined with fulljones solve, set it to False or use --forwidefield')
        raise Exception('--doflagging is True, cannot be combined with fulljones solve')

    if args['iontimefactor'] <= 0.0:
        print('BLsmooth iontimefactor needs to be positive')
        raise Exception('BLsmooth iontimefactor needs to be positive')
    if args['iontimefactor'] > 10.0:
        print('BLsmooth iontimefactor is way too high')
        raise Exception('BLsmooth iontimefactor is way too high')

    if args['ionfreqfactor'] <= 0.0:
        print('BLsmooth tecfactor needs to be positive')
        raise Exception('BLsmooth tecfactor needs to be positive')
    if args['ionfreqfactor'] > 10000.0:
        print('BLsmooth tecfactor is way too high')
        raise Exception('BLsmooth tecfactor is way too high')

    if args['aoflagger_strategy'] is not None and not os.path.isfile(args['aoflagger_strategy']):
        print('Cannot find aoflagger-strategy ' + args['aoflagger_strategy'] + ', file does not exist')
        raise Exception('Cannot find aoflagger-strategy, file does not exist')
       
    if not os.path.isfile('lib_multiproc.py'):
        print('Cannot find lib_multiproc.py, file does not exist, use --helperscriptspath')
        raise Exception('Cannot find lib_multiproc.py, file does not exist, use --helperscriptspath')
    if not os.path.isfile('h5_merger.py'):
        print('Cannot find h5_merger.py, file does not exist, use --helperscriptspath or --helperscriptspathh5merge')
        raise Exception(
            'Cannot find h5_merger.py, file does not exist, use --helperscriptspath or --helperscriptspathh5merge')
    if not os.path.isfile('plot_tecandphase.py'):
        print('Cannot find plot_tecandphase.py, file does not exist, use --helperscriptspath')
        raise Exception('Cannot find plot_tecandphase.py, file does not exist, use --helperscriptspath')
    if not os.path.isfile('lin2circ.py'):
        print('Cannot find lin2circ.py, file does not exist, use --helperscriptspath')
        raise Exception('Cannot find lin2circ.py, file does not exist, use --helperscriptspath')
    if not os.path.isfile('BLsmooth.py'):
        print('Cannot find BLsmooth.py, file does not exist, use --helperscriptspath')
        raise Exception('Cannot find BLsmooth.py, file does not exist, use --helperscriptspath')
    if not os.path.isfile('polconv.py'):
        print('Cannot find polconv.py, file does not exist, use --helperscriptspath')
        raise Exception('Cannot find polconv.py, file does not exist, use --helperscriptspath')
    if not os.path.isfile('vlass_search.py'):
        print('Cannot find vlass_search.py, file does not exist, use --helperscriptspath')
        raise Exception('Cannot find vlass_search.py, file does not exist, use --helperscriptspath')
    if not os.path.isfile('VLASS_dyn_summary.php'):
        print('Cannot find VLASS_dyn_summary.php, file does not exist, use --helperscriptspath')
        raise Exception('Cannot find VLASS_dyn_summary.php, file does not exist, use --helperscriptspath')      
    if not os.path.isfile('overwrite_table.py'):
        print('Cannot find overwrite_table.py, file does not exist, use --helperscriptspath or --helperscriptspathh5merge')
        raise Exception('Cannot find overwrite_table.py, file does not exist, use --helperscriptspath or --helperscriptspathh5merge') 

    if args['phaseshiftbox'] is not None:
        if not os.path.isfile(args['phaseshiftbox']):
            print('Cannot find:', args['phaseshiftbox'])
            raise Exception('Cannot find:' + args['phaseshiftbox'])

    if args['beamcor'] not in ['auto','yes','no']:
        print('beamcor is not auto, yes, or no')
        raise Exception('Invalid input, beamcor is not auto, yes, or no')

    if args['DDE_predict'] not in ['DP3', 'WSCLEAN']:
        print('DDE-predict is not DP3 or WSCLEAN')
        raise Exception('DDE-predict is not DP3 or WSCLEAN')

    for nrtmp in args['normamps_list']:
        if nrtmp not in ['normamps_per_ant', 'normslope', 'normamps','normslope+normamps','normslope+normamps_per_ant'] and nrtmp is not None:
            print('Invalid input: --normamps_list can only contain "normamps", "normslope", "normamps_per_ant", "normslope+normamps", "normslope+normamps_per_ant" or None')
            raise Exception('Invalid input: --normamps_list can only contain "normamps", "normslope", "normamps_per_ant", "normslope+normamps", "normslope+normamps_per_ant" or None')  

    for antennaconstraint in args['antennaconstraint_list']:
        if antennaconstraint not in ['superterp', 'coreandfirstremotes', 'core', 'remote', \
                                     'all', 'international', 'alldutch', 'core-remote',
                                     'coreandallbutmostdistantremotes', 'alldutchbutnoST001',\
                                      'distantremote','alldutchandclosegerman'] \
                and antennaconstraint is not None:
            print(
                'Invalid input, antennaconstraint can only be core, superterp, coreandfirstremotes, remote, alldutch, international, alldutchandclosegerman, or all')
            raise Exception(
                'Invalid input, antennaconstraint can only be core, superterp, coreandfirstremotes, remote, alldutch, international, alldutchandclosegerman, or all')

    for resetsols in args['resetsols_list']:
        if resetsols not in ['superterp', 'coreandfirstremotes', 'core', 'remote', \
                             'all', 'international', 'alldutch', 'core-remote', 'coreandallbutmostdistantremotes',
                             'alldutchbutnoST001','distantremote','alldutchandclosegerman'] \
                and resetsols is not None:
            print(
                'Invalid input, resetsols can only be core, superterp, coreandfirstremotes, remote, alldutch, international, distantremote, alldutchandclosegerman, or all')
            raise Exception(
                'Invalid input, resetsols can only be core, superterp, coreandfirstremotes, remote, alldutch, international, distantremote, alldutchandclosegerman, or all')

    #if args['DDE']:
    #   for soltype in args['soltype_list']:
    #    if soltype in ['scalarphasediff', 'scalarphasediffFR']:
    #        print('Invalid soltype input in combination with DDE type solve')
    #        raise Exception('Invalid soltype input in combination with DDE type solve') 

    for soltype in args['soltype_list']:
        if soltype not in ['complexgain', 'scalarcomplexgain', 'scalaramplitude', \
                           'amplitudeonly', 'phaseonly', 'fulljones', 'rotation', \
                           'rotation+diagonal', 'rotation+diagonalphase', \
                           'rotation+diagonalamplitude', 'rotation+scalar', \
                           'rotation+scalaramplitude','rotation+scalarphase','tec', \
                           'tecandphase', 'scalarphase', \
                           'scalarphasediff', 'scalarphasediffFR', 'phaseonly_phmin', \
                           'rotation_phmin', 'tec_phmin', \
                           'tecandphase_phmin', 'scalarphase_phmin', 'scalarphase_slope', 'phaseonly_slope']:
            print('Invalid soltype input')
            raise Exception('Invalid soltype input')

    # check that there is only on scalarphasediff solve and it the first entry
    if 'scalarphasediff' in args['soltype_list'] or 'scalarphasediffFR' in args['soltype_list']:
       if (args['soltype_list'][0] != 'scalarphasediff') and \
          (args['soltype_list'][0] != 'scalarphasediffFR'):
          print('scalarphasediff/scalarphasediffFR need to be to first solves in the list')
          raise Exception('scalarphasediff/scalarphasediffFR need to be to first solves in the list') 
       sccount = 0
       for soltype in args['soltype_list']:
          if soltype == 'scalarphasediff' or soltype == 'scalarphasediffFR':
             sccount = sccount + 1
       if sccount > 1:
          print('only one scalarphasediff/scalarphasediffFR solve allowed')
          raise Exception('only one scalarphasediff/scalarphasediffFR solve allowed') 
       
    if args['facetdirections'] is not None:
       if not os.path.isfile(args['facetdirections']):
          print('--facetdirections file does not exist')
          raise Exception('--facetdirections file does not exist')      
       check_for_BDPbug_longsolint(mslist, args['facetdirections'], args=args)
    

    if args['DDE']:
       if 'fulljones' in  args['soltype_list']:
          print('Invalid soltype input in combination with --DDE')
          raise Exception('Invalid soltype input in combination with --DDE')  
       if 'rotation' in  args['soltype_list']:
          print('Invalid soltype input in combination with --DDE')
          raise Exception('Invalid soltype input in combination with --DDE')  
       if 'rotation+diagonal' in  args['soltype_list']:
          print('Invalid soltype input in combination with --DDE')
          raise Exception('Invalid soltype input in combination with --DDE') 
       if 'rotation+diagonalamplitude' in  args['soltype_list']:
          print('Invalid soltype input in combination with --DDE')
          raise Exception('Invalid soltype input in combination with --DDE') 
       if 'rotation+diagonalphase' in  args['soltype_list']:
          print('Invalid soltype input in combination with --DDE')
          raise Exception('Invalid soltype input in combination with --DDE') 
       if 'rotation+scalar' in  args['soltype_list']:
          print('Invalid soltype input in combination with --DDE')
          raise Exception('Invalid soltype input in combination with --DDE') 
       if 'rotation+scalarphase' in  args['soltype_list']:
          print('Invalid soltype input in combination with --DDE')
          raise Exception('Invalid soltype input in combination with --DDE') 
       if 'rotation+scalaramplitude' in  args['soltype_list']:
          print('Invalid soltype input in combination with --DDE')
          raise Exception('Invalid soltype input in combination with --DDE') 
       if args['wscleanskymodel'] is not None and args['facetdirections'] is None:
          print('If --DDE and --wscleanskymodel are set provide a direction file via --facetdirections')
          raise Exception('DDE with a wscleanskymodel requires a user-specified facetdirections')
       if args['wscleanskymodel'] is not None and args['Nfacets'] > 0:
          print('If --DDE and --wscleanskymodel are set you cannot use Nfacets')
          raise Exception('If --DDE and --wscleanskymodel are set you cannot use Nfacets')
       #if (args['wscleanskymodel'] is not None) and (not args['disable_primary_beam')] \
       #     and (telescope == 'LOFAR'):
          #nonpblist = glob.glob(args['wscleanskymodel'] + '-????-model.fits')
          #pblist = glob.glob(args['wscleanskymodel'] + '-????-model-pb.fits')
          
          #if len(pblist) != len(nonpblist)
          #    print('Number of model-pb.fits and  model.fits images are not the same')
          #    raise Exception('Number of model-pb.fits and  model.fits images are not the same')
          #check number of model-pb images matches channelsout
          #if not args['disable_primary_beam'] and telescope == 'LOFAR':
          #   if len(pblist) != args['channelsout']:
          #       print('Number of model-pb.fits images does not match channelsout')
          #       raise Exception('Number of model-pb.fits images does not match channelsout')
         

    for ms in mslist:
        if not check_phaseup_station(ms):  
            for soltype_id, soltype in enumerate(args['soltype_list']):
                if soltype in ['scalarphasediff','scalarphasediff']:  
                    if args['antennaconstraint_list'][soltype_id] not in ['superterp', 'coreandfirstremotes', 'core', 'remote', 'distantremote', \
                             'all', 'international', 'alldutch', 'core-remote', 'coreandallbutmostdistantremotes',
                             'alldutchbutnoST001','alldutchandclosegerman'] and args['phaseupstations'] is None:
                        print('scalarphasediff/scalarphasediff type solves require a antennaconstraint, for example "core", or phased-up data')
                        raise Exception('scalarphasediff/scalarphasediff type solves require a antennaconstraint, or phased-up data')  

    if args['boxfile'] is not None:
        if not (os.path.isfile(args['boxfile'])):
            print('Cannot find boxfile, file does not exist')
            raise Exception('Cannot find boxfile, file does not exist')

    if args['fitsmask'] is not None and args['fitsmask'] != 'nofitsmask':
        if not (os.path.isfile(args['fitsmask'])):
            print('Cannot find fitsmask, file does not exist')
            raise Exception('Cannot find fitsmask, file does not exist')

    if args['skymodel'] is not None:
        if type(args['skymodel']) is str:
            #print(type(args['skymodel']), args['skymodel'][0])
            if not (os.path.isfile(args['skymodel'])) and not (os.path.isdir(args['skymodel'])):
                print('Cannot find skymodel, file does not exist', args['skymodel'])
                raise Exception('Cannot find skymodel, file does not exist')
        if type(args['skymodel']) is list:
            for skym in args['skymodel']:
                if not os.path.isfile(skym) and not os.path.isdir(skym):
                    print('Cannot find skymodel, file does not exist', skym)
                    raise Exception('Cannot find skymodel, file does not exist')
            
    if args['docircular'] and args['dolinear']:
        print('Conflicting input, docircular and dolinear used')
        raise Exception('Conflicting input, docircular and dolinear used')

    if which('DP3') is None:
        print('Cannot find DP3, forgot to source lofarinit.[c]sh?')
        raise Exception('Cannot find DP3, forgot to source lofarinit.[c]sh?')

    if which('wsclean') is None:
        print('Cannot find WSclean, forgot to source lofarinit.[c]sh?')
        raise Exception('Cannot find WSClean, forgot to source lofarinit.[c]sh?')

    if which('MakeMask.py') is None:
        print('Cannot find MakeMask.py, forgot to install it?')
        raise Exception('Cannot find MakeMask.py, forgot to install it?')

    if which('taql') is None:
        print('Cannot find taql, forgot to install it?')
        raise Exception('Cannot find taql, forgot to install it?')

    # Check boxfile and imsize settings
    if args['boxfile'] is None and args['imsize'] is None:
        if not checklongbaseline(sorted(args['ms'])[0]):
            print('Incomplete input detected, either boxfile or imsize is required')
            raise Exception('Incomplete input detected, either boxfile or imsize is required')

    if args['boxfile'] is not None and args['imsize'] is not None:
        print('Wrong input detected, both boxfile and imsize are set')
        raise Exception('Wrong input detected, both boxfile and imsize are set')

    if args['imager'] not in ['DDFACET', 'WSCLEAN']:
        print('Wrong input detected for option --imager, should be DDFACET or WSCLEAN')
        raise Exception('Wrong input detected for option --imager, should be DDFACET or WSCLEAN')

    if args['phaseupstations'] is not None:
        if args['phaseupstations'] not in ['core', 'superterp']:
            print('Wrong input detected for option --phaseupstations, should be core or superterp')
            raise Exception('Wrong input detected for option --phaseupstations, should be core or superterp')
    if args['phaseupstations'] is not None:
        if args['phaseupstations'] in args['antennaconstraint_list']:
            print('Wrong input detected for option --antennaconstraint-list, --phaseupstations is set and phased-up stations are not available anymore for --antennaconstraint-list')
            raise Exception('Wrong input detected for option --antennaconstraint-list, --phaseupstations is set and phased-up stations are not available anymore for --antennaconstraint-list')

    if args['soltypecycles_list'][0] != 0:
        print('Wrong input detected for option --soltypecycles-list should always start with 0')
        raise Exception('Wrong input detected for option --soltypecycles-list should always start with 0')

    if len(args['soltypecycles_list']) != len(args['soltype_list']):
        print('Wrong input detected, length soltypecycles-list does not match that of soltype-list')
        raise Exception('Wrong input detected, length soltypecycles-list does not match that of soltype-list')

    for soltype_id, soltype in enumerate(args['soltype_list']):
        wronginput = False
        if soltype in ['tecandphase', 'tec', 'tec_phmin', 'tecandphase_phmin']:
            try:  # in smoothnessconstraint_list is not filled by the user
                if args['smoothnessconstraint_list'][soltype_id] > 0.0:
                    print('smoothnessconstraint should be 0.0 for a tec-like solve')
                    wronginput = True
            except:
                pass
            if wronginput:
                raise Exception('smoothnessconstraint should be 0.0 for a tec-like solve')

    for smoothnessconstraint in args['smoothnessconstraint_list']:
        if smoothnessconstraint < 0.0:
            print('Smoothnessconstraint must be equal or larger than 0.0')
            raise Exception('Smoothnessconstraint must be equal or larger than 0.0')
    for smoothnessreffrequency in args['smoothnessreffrequency_list']:
        if smoothnessreffrequency < 0.0:
            print('Smoothnessreffrequency must be equal or larger than 0.0')
            raise Exception('Smoothnessreffrequency must be equal or larger than 0.0')

    if (args['skymodel'] is not None) and (args['skymodelpointsource']) is not None:
        print('Wrong input, you cannot use a separate skymodel file and then also set skymodelpointsource')
        raise Exception('Wrong input, you cannot use a separate skymodel file and then also set skymodelpointsource')
    if (args['skymodelpointsource'] is not None and type(args['skymodelpointsource']) is not list):
        if args['skymodelpointsource'] <= 0.0:
            print('Wrong input, flux density provided for skymodelpointsource is <= 0.0')
            raise Exception('Wrong input, flux density provided for skymodelpointsource is <= 0.0')
    if type(args['skymodelpointsource']) is list:
        for skymp in args['skymodelpointsource']:
            if float(skymp) <= 0.0:
                print('Wrong input, flux density provided for skymodelpointsource is <= 0.0')
                raise Exception('Wrong input, flux density provided for skymodelpointsource is <= 0.0')             

    if (args['msinstartchan'] < 0):
        print('Wrong input for msinstartchan, must be larger than zero')
        raise Exception('Wrong input for msinstartchan, must be larger than zero')
          
    if (args['msinnchan'] is not None):
        if (args['msinnchan'] <= 0):
            print('Wrong input for msinnchan, must be larger than zero')
            raise Exception('Wrong input for msinnchan, must be larger than zero')
    if (args['msinntimes'] is not None):
        if (args['msinntimes'] <= 1):
            print('Wrong input for msinntimes, must be larger than 1')
            raise Exception('Wrong input for msinntimes, must be larger than 1')

    if (args['skymodelpointsource'] is not None) and (args['predictskywithbeam']):
        print('Combination of skymodelpointsource and predictskywithbeam not supported')
        print('Provide a skymodel file to predict the sky with the beam')
        raise Exception('Combination of skymodelpointsource and predictskywithbeam not supported')

    if (args['wscleanskymodel'] is not None) and (args['skymodelpointsource']) is not None:
        print('Wrong input, you cannot use a wscleanskymodel and then also set skymodelpointsource')
        raise Exception('Wrong input, you cannot use a wscleanskymodel and then also set skymodelpointsource')

    if (args['wscleanskymodel'] is not None) and (args['skymodel']) is not None:
        print('Wrong input, you cannot use a wscleanskymodel and then also set skymodel')
        raise Exception('Wrong input, you cannot use a wscleanskymodel and then also set skymodel')

    if (args['wscleanskymodel'] is not None) and (args['predictskywithbeam']):
        print('Combination of wscleanskymodel and predictskywithbeam not supported')
        print('Provide a skymodel component file to predict the sky with the beam')
        raise Exception('Combination of wscleanskymodel and predictskywithbeam not supported')

    if (args['wscleanskymodel'] is not None) and (args['imager'] == 'DDFACET'):
        print('Combination of wscleanskymodel and DDFACET as an imager is not supported')
        raise Exception('Combination of wscleanskymodel and DDFACET as an imager is not supported')
    if (args['wscleanskymodel'] is not None):
        if len(glob.glob(args['wscleanskymodel'] + '-????-model.fits')) < 2:
            print('Not enough WSClean channel model images found')
            print(glob.glob(args['wscleanskymodel'] + '-????-model.fits'))
            raise Exception('Not enough WSClean channel model images found')
        #if len(glob.glob(args['wscleanskymodel'] + '-????-model.fits')) != args['channelsout']:
        #    print('Number of model images provided needs to match channelsout')
        #    raise Exception('Number of model images provided needs to match channelsout')
        if (args['wscleanskymodel'].find('/') != -1):
            print('wscleanskymodel contains a slash, not allowed, needs to be in pwd')
            raise Exception('wscleanskymodel contains a slash, not allowed, needs to be in pwd')
        if (args['wscleanskymodel'].find('..') != -1):
            print('wscleanskymodel contains .., not allowed, needs to be in pwd')
            raise Exception('wscleanskymodel contains .., not allowed, needs to be in pwd')
    return


def get_resolution(ms):
   uvmax = get_uvwmax(ms)
   t = pt.table(ms + '/SPECTRAL_WINDOW', ack=False)
   freq = np.median(t.getcol('CHAN_FREQ'))
   print('Central freq [MHz]', freq/1e6, 'Longest baselines [km]', uvmax/1e3)
   t.close()
   res = 1.22*3600.*180.*((299792458./freq )/uvmax)/np.pi
   return res

  
def get_uvwmax(ms):
    ''' Find the maximum squared sum of UVW coordinates.
    
    Args:
        ms (str): path to a Measurement Set.
    Returns:
        None
    '''
    t = pt.table(ms, ack=False)
    uvw = t.getcol('UVW')
    ssq = np.sqrt(np.sum(uvw**2, axis=1))
    print(uvw.shape)
    t.close()
    return np.max(ssq)

def makeBBSmodelforVLASS(filename, extrastrname=''):
    img = bdsf.process_image(filename,mean_map='zero', rms_map=True, rms_box = (100,10))#, \
                            # frequency=150e6, beam=(25./3600,25./3600,0.0) )
    img.write_catalog(format='bbs', bbs_patches='source', \
                      outfile='vlass' + extrastrname + '.skymodel'  , clobber=True)
    #bbsmodel = 'bla.skymodel'
    del img
    return 'vlass' + extrastrname + '.skymodel'  
    

def makeBBSmodelforTGSS(boxfile=None, fitsimage=None, pixelscale=None, imsize=None, \
                        ms=None, extrastrname=''):
    ''' Creates a TGSS skymodel in DP3-readable format.
    
    Args:
        boxfile (str): path to the DS9 region to create a model for.
        fitsimage (str): name of the FITS image the model will be created from.
        pixelscale (float): number of arcsec per pixel.
        imsize (int): image size in pixels.
        ms (str): if no box file is given, use this Measurement Set to determine the sky area to make a model of.
    Returns:
        tgss.skymodel: name of the output skymodel (always tgss[#nr].skymodel).
    '''
    tgsspixsize = 6.2    
    if boxfile is None and imsize is None:
        print('Wring input detected, boxfile or imsize needs to be set')
        raise Exception('Wring input detected, boxfile or imsize needs to be set')
    if boxfile is not None:
       r = pyregion.open(boxfile)
       if len(r[:]) > 1:
          print('Composite region file, not allowed')
          raise Exception('Composite region file, not allowed')
       phasecenter = getregionboxcenter(boxfile)
       phasecenterc = phasecenter.replace('deg','')
       xs = np.ceil((r[0].coord_list[2]) * 3600./tgsspixsize)
       ys = np.ceil((r[0].coord_list[3]) * 3600./tgsspixsize)
    else:
       t2 = pt.table(ms + '::FIELD')
       phasedir = t2.getcol('PHASE_DIR').squeeze()
       t2.close()
       phasecenterc =  ('{:12.8f}'.format(180. * np.mod(phasedir[0], 2. * np.pi) / np.pi) + ',' + '{:12.8f}'.format(180. * phasedir[1] / np.pi)).replace(' ','')
       
       # phasecenterc = str() + ', ' + str()
       xs = np.ceil(imsize * pixelscale / tgsspixsize)
       ys = np.ceil(imsize * pixelscale / tgsspixsize)
    
    print('TGSS imsize:', xs)
    print('TGSS image center:', phasecenterc)
    logger.info('TGSS imsize:' + str(xs))
    logger.info('TGSS image center:' + str(phasecenterc))
    
    # sys.exit()
 
    if fitsimage is None:
        filename = SkyView.get_image_list(position=phasecenterc, survey='TGSS ADR1', pixels=int(xs), cache=False)
        print(filename)
        if os.path.isfile(filename[0].split('/')[-1]):
            os.system('rm -f ' + filename[0].split('/')[-1])
        time.sleep(10)
        os.system('wget ' + filename[0])
        filename = filename[0].split('/')[-1]
        print(filename)
    else:
        filename = fitsimage

    img = bdsf.process_image(filename,mean_map='zero', rms_map=True, rms_box = (100,10), \
                             frequency=150e6, beam=(25./3600,25./3600,0.0) )
    img.write_catalog(format='bbs', bbs_patches='source', \
                      outfile='tgss' + extrastrname + '.skymodel', clobber=True)
    # bbsmodel = 'bla.skymodel'
    del img
    print(filename)
    return 'tgss' + extrastrname + '.skymodel', filename

def getregionboxcenter(regionfile, standardbox=True):
    ''' Extract box center of a DS9 box region.

    Args:
        regionfile (str): path to the region file.
        standardbox (bool): only allow square, non-rotated boxes.
    Returns:
        regioncenter (str): DP3 compatible string for phasecenter shifting.
    '''
    r = pyregion.open(regionfile)

    if len(r[:]) > 1:
        print('Only one region can be specified, your file contains', len(r[:]))
        raise Exception('Only one region can be specified, your file contains')

    if r[0].name != 'box':
        print('Only box region supported')
        raise Exception('Only box region supported')

    ra  = r[0].coord_list[0]
    dec = r[0].coord_list[1]
    boxsizex = r[0].coord_list[2]
    boxsizey = r[0].coord_list[3]
    angle = r[0].coord_list[4]

    if standardbox:
        if boxsizex != boxsizey:
            print('Only a square box region supported, you have these sizes:', boxsizex, boxsizey)
            raise Exception('Only a square box region supported')
        if np.abs(angle) > 1:
            print('Only normally oriented sqaure boxes are supported, your region is oriented under angle:', angle)
            raise Exception('Only normally oriented sqaure boxes are supported, your region is oriented under angle')
    
    regioncenter =  ('{:12.8f}'.format(ra) + 'deg,' + '{:12.8f}'.format(dec) + 'deg').replace(' ', '')
    return regioncenter


def bandwidthsmearing(chanw, freq, imsize, verbose=True):
    ''' Calculate the fractional intensity loss due to bandwidth smearing.
    
    Args:
        chanw (float): bandwidth.
        freq (float): observing frequency.
        imsize (int): image size in pixels.
        verbose (bool): print information to the screen.
    Returns:
        R (float): fractional intensity loss.
    '''
    R = (chanw / freq) * (imsize / 6.)  # asume we have used 3 pixels per beam
    if verbose:
        print('R value for bandwidth smearing is:', R)
        logger.info('R value for bandwidth smearing is: ' + str(R))
        if R > 1.:
            print('Warning, try to increase your frequency resolution, or lower imsize, to reduce the R value below 1')
            logger.warning('Warning, try to increase your frequency resolution, or lower imsize, to reduce the R value below 1')
    return R

def number_freqchan_h5(h5parmin):
    ''' Function to get the number of freqcencies in H5 solution file.

    Args:
        h5parmin (str): input H5parm.
    Returns:
        freqs (int): number of freqcencies in the H5 file.
    '''
    H=tables.open_file(h5parmin)

    try:
        freq = H.root.sol000.phase000.freq[:]
        # print('You solutions do not contain phase values')
    except:    
        pass

    try:
        freq = H.root.sol000.amplitude000.freq[:]  # apparently we only have amplitudes
    except:
        pass

    try:
        freq = H.root.sol000.rotation000.freq[:]  # apparently we only have rotatioon
    except:
        pass

    try:
        freq = H.root.sol000.tec000.freq[:]  # apparently we only have rotatioon
    except:
        pass

    H.close()
    print('Number of frequency channels in this solutions file is:', len(freq))
    return len(freq)


def calculate_restoringbeam(mslist, LBA):
    ''' Returns the restoring beam.

    Args:
        mslist (list): currently unused.
        LBA (bool): if data is LBA or not.
    Returns:
        restoringbeam (float): the restoring beam in arcsec.
    '''
    if LBA: # so we have LBA
      restoringbeam = 15.
    else : # so we have HBA
      restoringbeam = 6.

    return restoringbeam


def print_title(version):
    print("""
              __        ______    _______    ___      .______      
             |  |      /  __  \  |   ____|  /   \     |   _  \     
             |  |     |  |  |  | |  |__    /  ^  \    |  |_)  |    
             |  |     |  |  |  | |   __|  /  /_\  \   |      /     
             |  `----.|  `--'  | |  |    /  _____  \  |  |\  \----.
             |_______| \______/  |__|   /__/     \__\ | _| `._____|
                                                                   
               _______    ___       ______  _______ .___________.
              |   ____|  /   \     /      ||   ____||           |
              |  |__    /  ^  \   |  ,----'|  |__   `---|  |----`
              |   __|  /  /_\  \  |  |     |   __|      |  |     
              |  |    /  _____  \ |  `----.|  |____     |  |     
              |__|   /__/     \__\ \______||_______|    |__|     
                                                                 
         _______. _______  __       _______   ______      ___       __      
        /       ||   ____||  |     |   ____| /      |    /   \     |  |     
       |   (----`|  |__   |  |     |  |__   |  ,----'   /  ^  \    |  |     
        \   \    |   __|  |  |     |   __|  |  |       /  /_\  \   |  |     
    .----)   |   |  |____ |  `----.|  |     |  `----. /  _____  \  |  `----.
    |_______/    |_______||_______||__|      \______|/__/     \__\ |_______|
                                                                              
    
                      Reinout van Weeren (2021, A&A, 651, 115)

                              Starting.........
          """)

    print('\n\nVERSION: ' + version + '\n\n')
    logger.info('VERSION: ' + version)
    return

def makemslist(mslist):
    ''' Create the input list for e.g. ddf-pipeline.
    
    Args:
        mslist (list): list of input Measurement Sets
    Returns:
        None
    '''
    os.system('rm -rf mslist.txt')
    f=open('mslist.txt', 'w')
    for ms in mslist:
        f.write(str(ms)+'\n')
    f.close()
    return

def antennaconstraintstr(ctype, antennasms, HBAorLBA, useforresetsols=False, telescope='LOFAR'):
    ''' Formats an anntena constraint string in a DP3-suitable format.

    Args:
        ctype (str): constraint type. Can be superterp, core, coreandfirstremotes, remote, alldutch, all, international, core-remote, coreandallbutmostdistantremotes, alldutchandclosegerman or alldutchbutnoST001.
        antennasms (list): antennas present in the Measurement Set.
        HBAorLBA (str): indicate HBA or LBA data. Can be HBA or LBA.
        useforresetsols (bool): whether it will be used with reset solution. Removes antennas that are not in antennasms.
        telescope (str): telescope name, used to check if MeerKAT data is used
    Returns:
        antstr (str): antenna constraint string for DP3.
    '''
    antennasms = list(antennasms)
    # print(antennasms)
    if ctype != 'superterp' and ctype != 'core' and ctype != 'coreandfirstremotes' and \
       ctype != 'remote' and ctype != 'alldutch' and ctype != 'all' and \
       ctype != 'international' and ctype != 'core-remote' and ctype != 'coreandallbutmostdistantremotes' and ctype != 'alldutchandclosegerman' and \
       ctype != 'alldutchbutnoST001' and ctype != 'distantremote':
        print('Invalid input, ctype can only be "superterp" or "core"')
        raise Exception('Invalid input, ctype can only be "superterp" or "core"')
    if HBAorLBA == 'LBA':  
        if ctype == 'superterp':  
            antstr=['CS002LBA', 'CS003LBA', 'CS004LBA', 'CS005LBA', 'CS006LBA', 'CS007LBA', 'ST001']
        if ctype == 'core':
            antstr=['CS001LBA', 'CS002LBA', 'CS003LBA', 'CS004LBA', 'CS005LBA', 'CS006LBA', 'CS007LBA',  \
                    'CS011LBA', 'CS013LBA', 'CS017LBA', 'CS021LBA', 'CS024LBA', 'CS026LBA', 'CS028LBA',  \
                    'CS030LBA', 'CS031LBA', 'CS032LBA', 'CS101LBA', 'CS103LBA', 'CS201LBA', 'CS301LBA',  \
                    'CS302LBA', 'CS401LBA', 'CS501LBA', 'ST001']
        if ctype == 'coreandfirstremotes':
            antstr=['CS001LBA', 'CS002LBA', 'CS003LBA', 'CS004LBA', 'CS005LBA', 'CS006LBA', 'CS007LBA',  \
                    'CS011LBA', 'CS013LBA', 'CS017LBA', 'CS021LBA', 'CS024LBA', 'CS026LBA', 'CS028LBA',  \
                    'CS030LBA', 'CS031LBA', 'CS032LBA', 'CS101LBA', 'CS103LBA', 'CS201LBA', 'CS301LBA',  \
                    'CS302LBA', 'CS401LBA', 'CS501LBA', 'RS503LBA', 'RS305LBA', 'RS205LBA', 'RS306LBA',  \
                    'RS106LBA', 'ST001']
        if ctype == 'coreandallbutmostdistantremotes':
            antstr=['CS001LBA', 'CS002LBA', 'CS003LBA', 'CS004LBA', 'CS005LBA', 'CS006LBA', 'CS007LBA',  \
                    'CS011LBA', 'CS013LBA', 'CS017LBA', 'CS021LBA', 'CS024LBA', 'CS026LBA', 'CS028LBA',  \
                    'CS030LBA', 'CS031LBA', 'CS032LBA', 'CS101LBA', 'CS103LBA', 'CS201LBA', 'CS301LBA',  \
                    'CS302LBA', 'CS401LBA', 'CS501LBA', 'RS503LBA', 'RS305LBA', 'RS205LBA', 'RS306LBA',  \
                    'RS106LBA', 'RS307LBA', 'RS406LBA', 'RS407LBA', 'ST001']
        if ctype == 'remote':
            antstr=['RS503LBA', 'RS305LBA', 'RS205LBA', 'RS306LBA',  'RS310LBA', 'RS406LBA', 'RS407LBA', \
                    'RS106LBA', 'RS307LBA', 'RS208LBA', 'RS210LBA',  'RS409LBA', 'RS508LBA', 'RS509LBA']
        if ctype == 'distantremote':
            antstr=['RS310LBA', 'RS407LBA','RS208LBA', 'RS210LBA',  'RS409LBA', 'RS508LBA', 'RS509LBA']
        if ctype == 'alldutch':
            antstr=['CS001LBA', 'CS002LBA', 'CS003LBA', 'CS004LBA', 'CS005LBA', 'CS006LBA', 'CS007LBA',  \
                    'CS011LBA', 'CS013LBA', 'CS017LBA', 'CS021LBA', 'CS024LBA', 'CS026LBA', 'CS028LBA',  \
                    'CS030LBA', 'CS031LBA', 'CS032LBA', 'CS101LBA', 'CS103LBA', 'CS201LBA', 'CS301LBA',  \
                    'CS302LBA', 'CS401LBA', 'CS501LBA', 'RS503LBA', 'RS305LBA', 'RS205LBA', 'RS306LBA',  \
                    'RS310LBA', 'RS406LBA', 'RS407LBA', 'RS106LBA', 'RS307LBA', 'RS208LBA', 'RS210LBA',  \
                    'RS409LBA', 'RS508LBA', 'RS509LBA',  'ST001']
        if ctype == 'alldutchbutnoST001':
            antstr=['CS001LBA', 'CS002LBA', 'CS003LBA', 'CS004LBA', 'CS005LBA', 'CS006LBA', 'CS007LBA',  \
                    'CS011LBA', 'CS013LBA', 'CS017LBA', 'CS021LBA', 'CS024LBA', 'CS026LBA', 'CS028LBA',  \
                    'CS030LBA', 'CS031LBA', 'CS032LBA', 'CS101LBA', 'CS103LBA', 'CS201LBA', 'CS301LBA',  \
                    'CS302LBA', 'CS401LBA', 'CS501LBA', 'RS503LBA', 'RS305LBA', 'RS205LBA', 'RS306LBA',  \
                    'RS310LBA', 'RS406LBA', 'RS407LBA', 'RS106LBA', 'RS307LBA', 'RS208LBA', 'RS210LBA',  \
                    'RS409LBA', 'RS508LBA', 'RS509LBA']

        if ctype == 'all':
            antstr=['CS001LBA', 'CS002LBA', 'CS003LBA', 'CS004LBA', 'CS005LBA', 'CS006LBA', 'CS007LBA',  \
                    'CS011LBA', 'CS013LBA', 'CS017LBA', 'CS021LBA', 'CS024LBA', 'CS026LBA', 'CS028LBA',  \
                    'CS030LBA', 'CS031LBA', 'CS032LBA', 'CS101LBA', 'CS103LBA', 'CS201LBA', 'CS301LBA',  \
                    'CS302LBA', 'CS401LBA', 'CS501LBA', 'RS503LBA', 'RS305LBA', 'RS205LBA', 'RS306LBA',  \
                    'RS310LBA', 'RS406LBA', 'RS407LBA', 'RS106LBA', 'RS307LBA', 'RS208LBA', 'RS210LBA',  \
                    'RS409LBA', 'RS508LBA', 'RS509LBA',  \
                    'DE601LBA', 'DE602LBA', 'DE603LBA', 'DE604LBA',  'DE605LBA', 'DE609LBA', 'FR606LBA',  \
                    'SE607LBA', 'UK608LBA', 'PL610LBA', 'PL611LBA',  'PL612LBA', 'IE613LBA', 'LV614LBA', 'ST001']          
        if ctype == 'international':
            antstr=['DE601LBA', 'DE602LBA', 'DE603LBA', 'DE604LBA', 'DE605LBA', 'DE609LBA', 'FR606LBA',  \
                    'SE607LBA', 'UK608LBA', 'PL610LBA', 'PL611LBA', 'PL612LBA', 'IE613LBA', 'LV614LBA']    
        if ctype == 'core-remote':
            antstr1=['CS001LBA', 'CS002LBA', 'CS003LBA', 'CS004LBA', 'CS005LBA', 'CS006LBA', 'CS007LBA',  \
                    'CS011LBA', 'CS013LBA', 'CS017LBA', 'CS021LBA', 'CS024LBA', 'CS026LBA', 'CS028LBA',  \
                    'CS030LBA', 'CS031LBA', 'CS032LBA', 'CS101LBA', 'CS103LBA', 'CS201LBA', 'CS301LBA',  \
                    'CS302LBA', 'CS401LBA', 'CS501LBA', 'ST001']
            antstr2=['RS503LBA', 'RS305LBA', 'RS205LBA', 'RS306LBA',  'RS310LBA', 'RS406LBA', 'RS407LBA', \
                    'RS106LBA', 'RS307LBA', 'RS208LBA', 'RS210LBA',  'RS409LBA', 'RS508LBA', 'RS509LBA']
        if ctype == 'alldutchandclosegerman':  
            antstr=['CS001LBA', 'CS002LBA', 'CS003LBA', 'CS004LBA', 'CS005LBA', 'CS006LBA', 'CS007LBA',  \
                    'CS011LBA', 'CS013LBA', 'CS017LBA', 'CS021LBA', 'CS024LBA', 'CS026LBA', 'CS028LBA',  \
                    'CS030LBA', 'CS031LBA', 'CS032LBA', 'CS101LBA', 'CS103LBA', 'CS201LBA', 'CS301LBA',  \
                    'CS302LBA', 'CS401LBA', 'CS501LBA', 'RS503LBA', 'RS305LBA', 'RS205LBA', 'RS306LBA',  \
                    'RS310LBA', 'RS406LBA', 'RS407LBA', 'RS106LBA', 'RS307LBA', 'RS208LBA', 'RS210LBA',  \
                    'RS409LBA', 'RS508LBA', 'RS509LBA',  'ST001', 'DE601LBA', 'DE605LBA']

    if HBAorLBA == 'HBA':    
        if ctype == 'superterp': 
            antstr=['CS002HBA0', 'CS003HBA0', 'CS004HBA0', 'CS005HBA0', 'CS006HBA0', 'CS007HBA0',  \
                    'CS002HBA1', 'CS003HBA1', 'CS004HBA1', 'CS005HBA1', 'CS006HBA1', 'CS007HBA1', 'ST001']
        if ctype == 'remote':
            antstr=['RS503HBA', 'RS305HBA', 'RS205HBA', 'RS306HBA', 'RS310HBA', 'RS406HBA', 'RS407HBA',  \
                    'RS106HBA', 'RS307HBA', 'RS208HBA', 'RS210HBA', 'RS409HBA', 'RS508HBA', 'RS509HBA']
        if ctype == 'distantremote':
            antstr=['RS310HBA', 'RS407HBA','RS208HBA', 'RS210HBA',  'RS409HBA', 'RS508HBA', 'RS509HBA']            
        if ctype == 'core':
            antstr=['CS001HBA0', 'CS002HBA0', 'CS003HBA0', 'CS004HBA0', 'CS005HBA0', 'CS006HBA0', 'CS007HBA0',  \
                    'CS011HBA0', 'CS013HBA0', 'CS017HBA0', 'CS021HBA0', 'CS024HBA0', 'CS026HBA0', 'CS028HBA0',  \
                    'CS030HBA0', 'CS031HBA0', 'CS032HBA0', 'CS101HBA0', 'CS103HBA0', 'CS201HBA0', 'CS301HBA0',  \
                    'CS302HBA0', 'CS401HBA0', 'CS501HBA0', \
                    'CS001HBA1', 'CS002HBA1', 'CS003HBA1', 'CS004HBA1', 'CS005HBA1', 'CS006HBA1', 'CS007HBA1',  \
                    'CS011HBA1', 'CS013HBA1', 'CS017HBA1', 'CS021HBA1', 'CS024HBA1', 'CS026HBA1', 'CS028HBA1',  \
                    'CS030HBA1', 'CS031HBA1', 'CS032HBA1', 'CS101HBA1', 'CS103HBA1', 'CS201HBA1', 'CS301HBA1',  \
                    'CS302HBA1', 'CS401HBA1', 'CS501HBA1', 'ST001']
        if ctype == 'coreandfirstremotes':
            antstr=['CS001HBA0', 'CS002HBA0', 'CS003HBA0', 'CS004HBA0', 'CS005HBA0', 'CS006HBA0', 'CS007HBA0',  \
                    'CS011HBA0', 'CS013HBA0', 'CS017HBA0', 'CS021HBA0', 'CS024HBA0', 'CS026HBA0', 'CS028HBA0',  \
                    'CS030HBA0', 'CS031HBA0', 'CS032HBA0', 'CS101HBA0', 'CS103HBA0', 'CS201HBA0', 'CS301HBA0',  \
                    'CS302HBA0', 'CS401HBA0', 'CS501HBA0', \
                    'CS001HBA1', 'CS002HBA1', 'CS003HBA1', 'CS004HBA1', 'CS005HBA1', 'CS006HBA1', 'CS007HBA1',  \
                    'CS011HBA1', 'CS013HBA1', 'CS017HBA1', 'CS021HBA1', 'CS024HBA1', 'CS026HBA1', 'CS028HBA1',  \
                    'CS030HBA1', 'CS031HBA1', 'CS032HBA1', 'CS101HBA1', 'CS103HBA1', 'CS201HBA1', 'CS301HBA1',  \
                    'CS302HBA1', 'CS401HBA1', 'CS501HBA1', 'RS503HBA' , 'RS305HBA' , 'RS205HBA' , 'RS306HBA',   \
                    'RS106HBA', 'ST001']
        if ctype == 'coreandallbutmostdistantremotes':
            antstr=['CS001HBA0', 'CS002HBA0', 'CS003HBA0', 'CS004HBA0', 'CS005HBA0', 'CS006HBA0', 'CS007HBA0',  \
                    'CS011HBA0', 'CS013HBA0', 'CS017HBA0', 'CS021HBA0', 'CS024HBA0', 'CS026HBA0', 'CS028HBA0',  \
                    'CS030HBA0', 'CS031HBA0', 'CS032HBA0', 'CS101HBA0', 'CS103HBA0', 'CS201HBA0', 'CS301HBA0',  \
                    'CS302HBA0', 'CS401HBA0', 'CS501HBA0', \
                    'CS001HBA1', 'CS002HBA1', 'CS003HBA1', 'CS004HBA1', 'CS005HBA1', 'CS006HBA1', 'CS007HBA1',  \
                    'CS011HBA1', 'CS013HBA1', 'CS017HBA1', 'CS021HBA1', 'CS024HBA1', 'CS026HBA1', 'CS028HBA1',  \
                    'CS030HBA1', 'CS031HBA1', 'CS032HBA1', 'CS101HBA1', 'CS103HBA1', 'CS201HBA1', 'CS301HBA1',  \
                    'CS302HBA1', 'CS401HBA1', 'CS501HBA1', 'RS503HBA' , 'RS305HBA' , 'RS205HBA' , 'RS306HBA',   \
                    'RS106HBA', 'RS307HBA', 'RS406HBA', 'RS407HBA', 'ST001']
        if ctype == 'alldutch':
            antstr=['CS001HBA0', 'CS002HBA0', 'CS003HBA0', 'CS004HBA0', 'CS005HBA0', 'CS006HBA0', 'CS007HBA0',  \
                    'CS011HBA0', 'CS013HBA0', 'CS017HBA0', 'CS021HBA0', 'CS024HBA0', 'CS026HBA0', 'CS028HBA0',  \
                    'CS030HBA0', 'CS031HBA0', 'CS032HBA0', 'CS101HBA0', 'CS103HBA0', 'CS201HBA0', 'CS301HBA0',  \
                    'CS302HBA0', 'CS401HBA0', 'CS501HBA0', \
                    'CS001HBA1', 'CS002HBA1', 'CS003HBA1', 'CS004HBA1', 'CS005HBA1', 'CS006HBA1', 'CS007HBA1',  \
                    'CS011HBA1', 'CS013HBA1', 'CS017HBA1', 'CS021HBA1', 'CS024HBA1', 'CS026HBA1', 'CS028HBA1',  \
                    'CS030HBA1', 'CS031HBA1', 'CS032HBA1', 'CS101HBA1', 'CS103HBA1', 'CS201HBA1', 'CS301HBA1',  \
                    'CS302HBA1', 'CS401HBA1', 'CS501HBA1',  \
                    'RS503HBA', 'RS305HBA', 'RS205HBA', 'RS306HBA',  'RS310HBA', 'RS406HBA', 'RS407HBA',  \
                    'RS106HBA', 'RS307HBA', 'RS208HBA', 'RS210HBA',  'RS409HBA', 'RS508HBA', 'RS509HBA', 'ST001']
        if ctype == 'alldutchandclosegerman':
            antstr=['CS001HBA0', 'CS002HBA0', 'CS003HBA0', 'CS004HBA0', 'CS005HBA0', 'CS006HBA0', 'CS007HBA0',  \
                    'CS011HBA0', 'CS013HBA0', 'CS017HBA0', 'CS021HBA0', 'CS024HBA0', 'CS026HBA0', 'CS028HBA0',  \
                    'CS030HBA0', 'CS031HBA0', 'CS032HBA0', 'CS101HBA0', 'CS103HBA0', 'CS201HBA0', 'CS301HBA0',  \
                    'CS302HBA0', 'CS401HBA0', 'CS501HBA0', \
                    'CS001HBA1', 'CS002HBA1', 'CS003HBA1', 'CS004HBA1', 'CS005HBA1', 'CS006HBA1', 'CS007HBA1',  \
                    'CS011HBA1', 'CS013HBA1', 'CS017HBA1', 'CS021HBA1', 'CS024HBA1', 'CS026HBA1', 'CS028HBA1',  \
                    'CS030HBA1', 'CS031HBA1', 'CS032HBA1', 'CS101HBA1', 'CS103HBA1', 'CS201HBA1', 'CS301HBA1',  \
                    'CS302HBA1', 'CS401HBA1', 'CS501HBA1',  \
                    'RS503HBA', 'RS305HBA', 'RS205HBA', 'RS306HBA',  'RS310HBA', 'RS406HBA', 'RS407HBA',  \
                    'RS106HBA', 'RS307HBA', 'RS208HBA', 'RS210HBA',  'RS409HBA', 'RS508HBA', 'RS509HBA', 'ST001','DE601HBA','DE605HBA']          
          
        if ctype == 'alldutchbutnoST001':
            antstr=['CS001HBA0', 'CS002HBA0', 'CS003HBA0', 'CS004HBA0', 'CS005HBA0', 'CS006HBA0', 'CS007HBA0',  \
                    'CS011HBA0', 'CS013HBA0', 'CS017HBA0', 'CS021HBA0', 'CS024HBA0', 'CS026HBA0', 'CS028HBA0',  \
                    'CS030HBA0', 'CS031HBA0', 'CS032HBA0', 'CS101HBA0', 'CS103HBA0', 'CS201HBA0', 'CS301HBA0',  \
                    'CS302HBA0', 'CS401HBA0', 'CS501HBA0', \
                    'CS001HBA1', 'CS002HBA1', 'CS003HBA1', 'CS004HBA1', 'CS005HBA1', 'CS006HBA1', 'CS007HBA1',  \
                    'CS011HBA1', 'CS013HBA1', 'CS017HBA1', 'CS021HBA1', 'CS024HBA1', 'CS026HBA1', 'CS028HBA1',  \
                    'CS030HBA1', 'CS031HBA1', 'CS032HBA1', 'CS101HBA1', 'CS103HBA1', 'CS201HBA1', 'CS301HBA1',  \
                    'CS302HBA1', 'CS401HBA1', 'CS501HBA1',  \
                    'RS503HBA', 'RS305HBA', 'RS205HBA', 'RS306HBA', 'RS310HBA', 'RS406HBA', 'RS407HBA',  \
                    'RS106HBA', 'RS307HBA', 'RS208HBA', 'RS210HBA', 'RS409HBA', 'RS508HBA', 'RS509HBA']
        if ctype == 'all':
            antstr=['CS001HBA0', 'CS002HBA0', 'CS003HBA0', 'CS004HBA0', 'CS005HBA0', 'CS006HBA0', 'CS007HBA0',  \
                    'CS011HBA0', 'CS013HBA0', 'CS017HBA0', 'CS021HBA0', 'CS024HBA0', 'CS026HBA0', 'CS028HBA0',  \
                    'CS030HBA0', 'CS031HBA0', 'CS032HBA0', 'CS101HBA0', 'CS103HBA0', 'CS201HBA0', 'CS301HBA0',  \
                    'CS302HBA0', 'CS401HBA0', 'CS501HBA0', \
                    'CS001HBA1', 'CS002HBA1', 'CS003HBA1', 'CS004HBA1', 'CS005HBA1', 'CS006HBA1', 'CS007HBA1',  \
                    'CS011HBA1', 'CS013HBA1', 'CS017HBA1', 'CS021HBA1', 'CS024HBA1', 'CS026HBA1', 'CS028HBA1',  \
                    'CS030HBA1', 'CS031HBA1', 'CS032HBA1', 'CS101HBA1', 'CS103HBA1', 'CS201HBA1', 'CS301HBA1',  \
                    'CS302HBA1', 'CS401HBA1', 'CS501HBA1',  \
                    'RS503HBA', 'RS305HBA', 'RS205HBA', 'RS306HBA', 'RS310HBA', 'RS406HBA', 'RS407HBA',  \
                    'RS106HBA', 'RS307HBA', 'RS208HBA', 'RS210HBA', 'RS409HBA', 'RS508HBA', 'RS509HBA',  \
                    'DE601HBA', 'DE602HBA', 'DE603HBA', 'DE604HBA', 'DE605HBA', 'DE609HBA', 'FR606HBA',  \
                    'SE607HBA', 'UK608HBA', 'PL610HBA', 'PL611HBA', 'PL612HBA', 'IE613HBA', 'LV614HBA', 'ST001']
        if ctype == 'international':
            antstr=['DE601HBA', 'DE602HBA', 'DE603HBA', 'DE604HBA',  'DE605HBA', 'DE609HBA', 'FR606HBA',  \
                    'SE607HBA', 'UK608HBA', 'PL610HBA', 'PL611HBA',  'PL612HBA', 'IE613HBA', 'LV614HBA']
        if ctype == 'core-remote':
            antstr1=['CS001HBA0', 'CS002HBA0', 'CS003HBA0', 'CS004HBA0', 'CS005HBA0', 'CS006HBA0', 'CS007HBA0',  \
                    'CS011HBA0', 'CS013HBA0', 'CS017HBA0', 'CS021HBA0', 'CS024HBA0', 'CS026HBA0', 'CS028HBA0',  \
                    'CS030HBA0', 'CS031HBA0', 'CS032HBA0', 'CS101HBA0', 'CS103HBA0', 'CS201HBA0', 'CS301HBA0',  \
                    'CS302HBA0', 'CS401HBA0', 'CS501HBA0', \
                    'CS001HBA1', 'CS002HBA1', 'CS003HBA1', 'CS004HBA1', 'CS005HBA1', 'CS006HBA1', 'CS007HBA1',  \
                    'CS011HBA1', 'CS013HBA1', 'CS017HBA1', 'CS021HBA1', 'CS024HBA1', 'CS026HBA1', 'CS028HBA1',  \
                    'CS030HBA1', 'CS031HBA1', 'CS032HBA1', 'CS101HBA1', 'CS103HBA1', 'CS201HBA1', 'CS301HBA1',  \
                    'CS302HBA1', 'CS401HBA1', 'CS501HBA1', 'ST001']
            antstr2=['RS503HBA', 'RS305HBA', 'RS205HBA', 'RS306HBA', 'RS310HBA', 'RS406HBA', 'RS407HBA',  \
                    'RS106HBA', 'RS307HBA', 'RS208HBA', 'RS210HBA', 'RS409HBA', 'RS508HBA', 'RS509HBA']

    if telescope == 'MeerKAT':    
        if ctype == 'core': 
            antstr = MeerKAT_antconstraint(ctype='core')
        if ctype == 'remote':
            antstr = MeerKAT_antconstraint(ctype='remote')
        if ctype == 'all':
            antstr = MeerKAT_antconstraint(ctype='all')

    if useforresetsols:
        antstrtmp = list(antstr)
        for ant in antstr:
            if ant not in antennasms:
                antstrtmp.remove(ant)
        return antstrtmp

    if ctype != 'core-remote':
        antstrtmp = list(antstr) # important to use list here, otherwise it's not a copy(!!) and antstrtmp refers to antstr
        for ant in antstr:
            if ant not in antennasms:
                antstrtmp.remove(ant)
        antstr = ','.join(map(str, antstrtmp))
        antstr = '[[' + antstr + ']]'
    else:
        antstrtmp1 = list(antstr1)
        for ant in antstr1:
            if ant not in antennasms:
                antstrtmp1.remove(ant)
        antstr1 = ','.join(map(str, antstrtmp1))

        antstrtmp2 = list(antstr2)
        for ant in antstr2:
            if ant not in antennasms:
                antstrtmp2.remove(ant)
        antstr2 = ','.join(map(str, antstrtmp2))

        antstr =  '[[' + antstr1 + '],[' + antstr2 + ']]'

    return antstr


def makephasediffh5(phaseh5, refant): 
    # note for scalarphase/phaseonly solve, does not work for tecandphase as freq axis is missing there for phase000
    H5pol = tables.open_file(phaseh5,mode='a')

    phase_pol = H5pol.root.sol000.phase000.val[:] # time, freq, ant, dir, pol
    phase_pol_tmp = np.copy(phase_pol)
    # antenna   = H5pol.root.sol000.phase000.ant[:]
    print('Shape to make phase diff array', phase_pol.shape)
    print('Using refant:', refant)
    logger.info('Refant for XX/YY or RR/LL phase-referencing' + refant)
   
    #Reference phases so that we correct the phase difference with respect to a reference station
    refant_idx = np.where(H5pol.root.sol000.phase000.ant[:].astype(str) == refant)
    phase_pol_tmp_ref = phase_pol_tmp - phase_pol_tmp[:,:,refant_idx[0],:,:]

    phase_pol[:, :, :, :,0]  = phase_pol_tmp_ref[:, :, :, :,0] # XX
    phase_pol[:, :, :, :,-1] = 0.0*phase_pol_tmp_ref[:, :, :, :,0] # YY


    H5pol.root.sol000.phase000.val[:] = phase_pol
    H5pol.flush()
    H5pol.close()
    return
    
def makephaseCDFh5(phaseh5, backup=True, testscfactor=1.): 
    # note for scalarphase/phaseonly solve, does not work for tecandphase as freq axis is missing there for phase000
    if backup:
       if os.path.isfile(phaseh5 + '.psbackup'):
         os.system('rm -f ' + phaseh5 + '.psbackup')
       os.system('cp ' + phaseh5 + ' ' + phaseh5 + '.psbackup')
       
    H5 = tables.open_file(phaseh5,mode='a')

    phaseCDF = H5.root.sol000.phase000.val[:] # time, freq, ant, dir, pol
    print('Shape to make phase CDF array', phaseCDF.shape)
    nfreq = len(H5.root.sol000.phase000.freq[:])
    for ff in range(nfreq-1):
      # reverse order so phase increase towards lower frequnecies
      phaseCDF[:,nfreq-ff-2, ...]  = np.copy(phaseCDF[:,nfreq-ff-2, ...] + (testscfactor*phaseCDF[:, nfreq-ff-1, ...]))

    print(phaseCDF.shape)
    H5.root.sol000.phase000.val[:] = phaseCDF
    H5.flush()
    H5.close()
    return

def makephaseCDFh5_h5merger(phaseh5, ms, modeldatacolumns, backup=True, testscfactor=1.): 
    # note for scalarphase/phaseonly solve, does not work for tecandphase as freq axis is missing there for phase000
    #if soltypein == 'scalarphase_slope':
    #   single_pol_merge = True
    #if soltypein == 'phaseonly_slope':
    #   single_pol = False
    #if soltypein not in ['scalarphase_slope','phaseonly_slope']:
    #   print('Wrong input in makephaseCDFh5_h5merger')
    #   sys.exit()

    if len(modeldatacolumns) > 1:
       merge_all_in_one = False
    else:
       merge_all_in_one = True
       
      
    if backup:
       if os.path.isfile(phaseh5 + '.psbackup'):
         os.system('rm -f ' + phaseh5 + '.psbackup')
       os.system('cp ' + phaseh5 + ' ' + phaseh5 + '.psbackup')
    # going to overwrite phaseh5, first move to new file
    if os.path.isfile(phaseh5 + '.in'):
       os.system('rm -f ' + phaseh5 + '.in')
    os.system('mv ' + phaseh5 + ' ' + phaseh5 + '.in')

    h5_merger.merge_h5(h5_out=phaseh5,h5_tables=phaseh5+'.in',ms_files=ms,\
                          merge_all_in_one=merge_all_in_one, \
                          propagate_flags=True)       
    H5 = tables.open_file(phaseh5,mode='a')

    phaseCDF = H5.root.sol000.phase000.val[:] # time, freq, ant, dir, pol
    phaseCDF_tmp = np.copy(phaseCDF)
    print('Shape to make phase CDF array', phaseCDF.shape)
    nfreq = len(H5.root.sol000.phase000.freq[:])
    for ff in range(nfreq-1):
      # reverse order so phase increase towards lower frequnecies
      phaseCDF[:,nfreq-ff-2, ...]  = np.copy(phaseCDF[:,nfreq-ff-2, ...] + (testscfactor*phaseCDF[:, nfreq-ff-1, ...]))

    print(phaseCDF.shape)
    H5.root.sol000.phase000.val[:] = phaseCDF
    H5.flush()
    H5.close()
    return  
  

def copyoverscalarphase(scalarh5, phasexxyyh5): 
    # note for scalarphase/phaseonly solve, does not work for tecandphase as freq axis is missing there for phase000
    H5    = tables.open_file(scalarh5, mode='r')
    H5pol = tables.open_file(phasexxyyh5,mode='a')

    phase     = H5.root.sol000.phase000.val[:] # time, freq, ant, dir
    phase_pol = H5pol.root.sol000.phase000.val[:] # time, freq, ant, dir, pol
    antenna   = H5.root.sol000.phase000.ant[:]
    print('Shapes for pol copy', phase.shape, phase_pol.shape)

    for ant in range(len(antenna)):
      phase_pol[:, :, ant, :,0] = phase[:, :, ant, :] # XX
      phase_pol[:, :, ant, :,-1] = phase[:, :, ant, :] # YY

    H5pol.root.sol000.phase000.val[:] = phase_pol[:,:,:]
    H5pol.flush()


    H5.close()
    H5pol.close()
    return

def copyovergain(gaininh5,gainouth5, soltype):
    H5in    = tables.open_file(gaininh5, mode='r')
    H5out   = tables.open_file(gainouth5,mode='a')
    antenna   = H5in.root.sol000.amplitude000.ant[:]

    h5 = h5parm.h5parm(gaininh5)
    ss = h5.getSolset('sol000')
    st = ss.getSoltab('amplitude000')
    axesnames = st.getAxesNames()
    h5.close()

    if 'pol' in axesnames:

        if soltype != 'scalaramplitude' and soltype != 'amplitudeonly':
            phase     = H5in.root.sol000.phase000.val[:]
            H5out.root.sol000.phase000.val[:] = phase
        else:
            H5out.root.sol000.phase000.val[:] = 0.0

        amplitude = H5in.root.sol000.amplitude000.val[:]
        print('Shapes for gain copy with polarizations', amplitude.shape)
        H5out.root.sol000.amplitude000.val[:] = amplitude

    else:
        if soltype != 'scalaramplitude' and soltype != 'amplitudeonly':
            phase     = H5in.root.sol000.phase000.val[:]
            phase_pol = H5out.root.sol000.phase000.val[:] # time, freq, ant, dir, pol

        amplitude = H5in.root.sol000.amplitude000.val[:]
        amplitude_pol   = H5out.root.sol000.amplitude000.val[:] # time, freq, ant, dir, pol
        print('Shapes for gain copy 1 pol', amplitude.shape)

        for ant in range(len(antenna)):
            if soltype != 'scalaramplitude' and soltype != 'amplitudeonly':
                phase_pol[:, :, ant, :,0] = phase[:, :, ant, :] # XX
                phase_pol[:, :, ant, :,-1] = phase[:, :, ant, :] # YY
            amplitude_pol[:, :, ant, :,0] = amplitude[:, :, ant, :] # XX
            amplitude_pol[:, :, ant, :,-1] = amplitude[:, :, ant, :] # YY
        if soltype != 'scalaramplitude' and soltype != 'amplitudeonly':
            H5out.root.sol000.phase000.val[:] = phase_pol[:,:,:]
        else:
            H5out.root.sol000.phase000.val[:] = 0.0
        H5out.root.sol000.amplitude000.val[:] = amplitude_pol[:,:,:]

    H5out.flush()
    H5in.close()
    H5out.close()
    return

def resetgains(parmdb):
    H5 = tables.open_file(parmdb, mode='a')
    H5.root.sol000.phase000.val[:] = 0.0
    H5.root.sol000.amplitude000.val[:] = 1.0
    H5.flush()
    H5.close()
    return


def fix_tecreference(h5parm, refant):
    ''' Tec reference values with respect to a reference station
    Args:
      h5parm: h5parm file
      refant: reference antenna
    '''
    
    H=tables.open_file(h5parm, mode='a')

    axisn = H.root.sol000.tec000.val.attrs['AXES'].decode().split(',')
    
    tec = H.root.sol000.tec000.val[:]
    refant_idx = np.where(H.root.sol000.tec000.ant[:].astype(str) == refant) # to deal with byte strings
    print(refant_idx, refant)
    antennaxis = axisn.index('ant')
    
    print('Referencing tec to ', refant, 'Axis entry number', axisn.index('ant'))
    if antennaxis == 0:
       tecn = tec - tec[refant_idx[0],...]
    if antennaxis == 1:
       tecn = tec - tec[:,refant_idx[0],...]
    if antennaxis == 2:
       tecn = tec - tec[:,:,refant_idx[0],...]
    if antennaxis == 3:
       tecn = tec - tec[:,:,:,refant_idx[0],...]
    if antennaxis == 4:
       tecn = tec - tec[:,:,:,:,refant_idx[0],...]
    tec = np.copy(tecn)

    # fill values back in
    H.root.sol000.tec000.val[:] = np.copy(tec)

    H.flush()
    H.close()
    return


def fix_phasereference(h5parm, refant):
    ''' Phase reference values with respect to a reference station
    Args:
      h5parm: h5parm file
      refant: reference antenna
    '''
    
    H=tables.open_file(h5parm, mode='a')

    axisn = H.root.sol000.phase000.val.attrs['AXES'].decode().split(',')
    
    phase = H.root.sol000.phase000.val[:]
    refant_idx = np.where(H.root.sol000.phase000.ant[:].astype(str) == refant) # to deal with byte strings
    print(refant_idx, refant)
    antennaxis = axisn.index('ant')
    
    print('Referencing phase to ', refant, 'Axis entry number', axisn.index('ant'))
    if antennaxis == 0:
       phasen = phase - phase[refant_idx[0],...]
    if antennaxis == 1:
       phasen = phase - phase[:,refant_idx[0],...]
    if antennaxis == 2:
       phasen = phase - phase[:,:,refant_idx[0],...]
    if antennaxis == 3:
       phasen = phase - phase[:,:,:,refant_idx[0],...]
    if antennaxis == 4:
       phasen = phase - phase[:,:,:,:,refant_idx[0],...]
    phase = np.copy(phasen)

    # fill values back in
    H.root.sol000.phase000.val[:] = np.copy(phase)

    H.flush()
    H.close()
    return


def fix_rotationreference(h5parm, refant):
    ''' Phase reference rotation values with respect to a reference station
    Args:
      h5parm: h5parm file
      refant: reference antenna
    '''
    
    H=tables.open_file(h5parm, mode='a')

    axisn = H.root.sol000.rotation000.val.attrs['AXES'].decode().split(',')
    
    rotation = H.root.sol000.rotation000.val[:]
    refant_idx = np.where(H.root.sol000.rotation000.ant[:].astype(str) == refant) # to deal with byte strings
    print(refant_idx, refant)
    antennaxis = axisn.index('ant')
    
    print('Referencing rotation to ', refant, 'Axis entry number', axisn.index('ant'))
    if antennaxis == 0:
       rotationn = rotation - rotation[refant_idx[0],...]
    if antennaxis == 1:
       rotationn = rotation - rotation[:,refant_idx[0],...]
    if antennaxis == 2:
       rotationn = rotation - rotation[:,:,refant_idx[0],...]
    if antennaxis == 3:
       rotationn = rotation - rotation[:,:,:,refant_idx[0],...]
    if antennaxis == 4:
       rotationn = rotation - rotation[:,:,:,:,refant_idx[0],...]
    rotation = np.copy(rotationn)

    # fill values back in
    H.root.sol000.rotation000.val[:] = np.copy(rotation)

    H.flush()
    H.close()
    return


def resetsolsforstations(h5parm, stationlist, refant=None):
    ''' Reset solutions for stations

    Args:
      h5parm: h5parm file
      stationlist: station name list
      refant: reference antenna
    '''
    print(h5parm, stationlist)
    fulljones = fulljonesparmdb(h5parm) # True/False
    hasphase = True
    hasamps  = True
    hasrotation = True
    hastec = True

    H=tables.open_file(h5parm)

    # figure of we have phase and/or amplitude solutions
    try:
     antennas = H.root.sol000.amplitude000.ant[:]
     axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
    except:
      hasamps = False
    try:
     antennas = H.root.sol000.phase000.ant[:]
     axisn = H.root.sol000.phase000.val.attrs['AXES'].decode().split(',')
    except:
     hasphase = False
    try:
     antennas = H.root.sol000.tec000.ant[:]
     axisn = H.root.sol000.tec000.val.attrs['AXES'].decode().split(',')
    except:
     hastec = False
    try:
     antennas = H.root.sol000.rotation000.ant[:]
     axisn = H.root.sol000.rotation000.val.attrs['AXES'].decode().split(',')
    except:
     hasrotation = False
    H.close()

    # in case refant is None but h5 still has phase
    # this can happen with a scalaramplitude and soltypelist_includedir is used
    # in this case we have pertubative direction
    # in this case h5_merger has already been run which created a phase000 entry
    if refant is None and hasphase: 
       refant=findrefant_core(h5parm)
       force_close(h5parm)

    # should not be needed as h5_merger does not create rotation000
    # keep this code in case of future h5_merger updates so we are safe
    if refant is None and hasrotation: 
       refant=findrefant_core(h5parm)
       force_close(h5parm)

    # should not be needed as h5_merger does not create tec000
    # keep this code in case of future h5_merger updates so we are safe
    if refant is None and hastec:
       refant=findrefant_core(h5parm)
       force_close(h5parm)       
  
    
    H=tables.open_file(h5parm, mode='a')
    if hasamps:
     amp = H.root.sol000.amplitude000.val[:]
    if hasphase: # also phasereference
     phase = H.root.sol000.phase000.val[:]
     refant_idx = np.where(H.root.sol000.phase000.ant[:].astype(str) == refant) # to deal with byte strings
     print(refant_idx, refant)
     antennaxis = axisn.index('ant')
     axisn = H.root.sol000.phase000.val.attrs['AXES'].decode().split(',')
     print('Referencing phase to ', refant, 'Axis entry number', axisn.index('ant'))
     if antennaxis == 0:
        phasen = phase - phase[refant_idx[0],...]
     if antennaxis == 1:
        phasen = phase - phase[:,refant_idx[0],...]
     if antennaxis == 2:
        phasen = phase - phase[:,:,refant_idx[0],...]
     if antennaxis == 3:
        phasen = phase - phase[:,:,:,refant_idx[0],...]
     if antennaxis == 4:
        phasen = phase - phase[:,:,:,:,refant_idx[0],...]
     phase = np.copy(phasen)


    if hastec:
     tec = H.root.sol000.tec000.val[:]
     refant_idx = np.where(H.root.sol000.tec000.ant[:].astype(str) == refant) # to deal with byte strings
     print(refant_idx, refant)
     antennaxis = axisn.index('ant')
     axisn = H.root.sol000.tec000.val.attrs['AXES'].decode().split(',')
     print('Referencing tec to ', refant, 'Axis entry number', axisn.index('ant'))
     if antennaxis == 0:
        tecn = tec - tec[refant_idx[0],...]
     if antennaxis == 1:
        tecn = tec - tec[:,refant_idx[0],...]
     if antennaxis == 2:
        tecn = tec - tec[:,:,refant_idx[0],...]
     if antennaxis == 3:
        tecn = tec - tec[:,:,:,refant_idx[0],...]
     if antennaxis == 4:
        tecn = tec - tec[:,:,:,:,refant_idx[0],...]
     tec = np.copy(tecn)

    if hasrotation:
     rotation = H.root.sol000.rotation000.val[:]
     refant_idx = np.where(H.root.sol000.rotation000.ant[:].astype(str) == refant) # to deal with byte strings
     print(refant_idx, refant)
     antennaxis = axisn.index('ant')
     axisn = H.root.sol000.rotation000.val.attrs['AXES'].decode().split(',')
     print('Referencing rotation to ', refant, 'Axis entry number', axisn.index('ant'))
     if antennaxis == 0:
        rotationn = rotation - rotation[refant_idx[0],...]
     if antennaxis == 1:
        rotationn = rotation - rotation[:,refant_idx[0],...]
     if antennaxis == 2:
        rotationn = rotation - rotation[:,:,refant_idx[0],...]
     if antennaxis == 3:
        rotationn = rotation - rotation[:,:,:,refant_idx[0],...]
     if antennaxis == 4:
        rotationn = rotation - rotation[:,:,:,:,refant_idx[0],...]
     rotation = np.copy(rotationn)


    for antennaid,antenna in enumerate(antennas.astype(str)): # to deal with byte formatted array
     # if not isinstance(antenna, str):
     #  antenna_str = antenna.decode() # to deal with byte formatted antenna names
     # else:
     #  antenna_str = antenna # already str type

     print(antenna, hasphase, hasamps, hastec, hasrotation)
     if antenna in stationlist: # in this case reset value to 0.0 (or 1.0)
       if hasphase:
         antennaxis = axisn.index('ant')
         axisn = H.root.sol000.phase000.val.attrs['AXES'].decode().split(',')
         print('Resetting phase', antenna, 'Axis entry number', axisn.index('ant'))
         # print(phase[:,:,antennaid,...])
         if antennaxis == 0:
           phase[antennaid,...] = 0.0
         if antennaxis == 1:
           phase[:,antennaid,...] = 0.0
         if antennaxis == 2:
           phase[:,:,antennaid,...] = 0.0
         if antennaxis == 3:
           phase[:,:,:,antennaid,...] = 0.0
         if antennaxis == 4:
           phase[:,:,:,:,antennaid,...] = 0.0
         # print(phase[:,:,antennaid,...])
       if hasamps:
         antennaxis = axisn.index('ant')
         axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
         print('Resetting amplitude', antenna, 'Axis entry number', axisn.index('ant'))
         if antennaxis == 0:
           amp[antennaid,...] = 1.0
         if antennaxis == 1:
           amp[:,antennaid,...] = 1.0
         if antennaxis == 2:
           amp[:,:,antennaid,...] = 1.0
         if antennaxis == 3:
           amp[:,:,:,antennaid,...] = 1.0
         if antennaxis == 4:
           amp[:,:,:,:,antennaid,...] = 1.0
         if fulljones:
           print('pol entry axis:', axisn.index('pol'))
           if len(axisn) != axisn.index('pol')+1:
              print('Pol-axis not the last enrty, cannot handle this')
              sys.exit()
           # hardcoded, assumes pol-axis is last
           if antennaxis == 0:
             amp[antennaid,...,1] = 0.
             amp[antennaid,...,2] = 0.
           if antennaxis == 1:
             amp[:,antennaid,...,1] = 0.
             amp[:,antennaid,...,2] = 0.
           if antennaxis == 2:
             amp[:,:,antennaid,...,1] = 0.
             amp[:,:,antennaid,...,2] = 0.
           if antennaxis == 3:
             amp[:,:,:,antennaid,...,1] = 0.
             amp[:,:,:,antennaid,...,2] = 0.
           if antennaxis == 4:
             amp[:,:,:,:,antennaid,...,1] = 0.
             amp[:,:,:,:,antennaid,...,2] = 0.
           
           #k = axisn.index('pol')
           #amp[tuple(slice(None) if j != k else antennaid for j in range(arr.ndim))] 
           #amp[...,1] = 0.0 # XY, assumpe pol is last axis
           #amp[...,2] = 0.0 # YX, assume pol is last axis

       if hastec:
         antennaxis = axisn.index('ant')
         axisn = H.root.sol000.tec000.val.attrs['AXES'].decode().split(',')
         print('Resetting TEC', antenna, 'Axis entry number', axisn.index('ant'))
         if antennaxis == 0:
           tec[antennaid,...] = 0.0
         if antennaxis == 1:
           tec[:,antennaid,...] = 0.0
         if antennaxis == 2:
           tec[:,:,antennaid,...] = 0.0
         if antennaxis == 3:
           tec[:,:,:,antennaid,...] = 0.0
         if antennaxis == 4:
           tec[:,:,:,:,antennaid,...] = 0.0
       if hasrotation:
         antennaxis = axisn.index('ant')
         axisn = H.root.sol000.rotation000.val.attrs['AXES'].decode().split(',')
         print('Resetting rotation', antenna, 'Axis entry number', axisn.index('ant'))
         if antennaxis == 0:
           rotation[antennaid,...] = 0.0
         if antennaxis == 1:
           rotation[:,antennaid,...] = 0.0
         if antennaxis == 2:
           rotation[:,:,antennaid,...] = 0.0
         if antennaxis == 3:
           rotation[:,:,:,antennaid,...] = 0.0
         if antennaxis == 4:
           rotation[:,:,:,:,antennaid,...] = 0.0
    # fill values back in
    if hasphase:
     H.root.sol000.phase000.val[:] = np.copy(phase)
    if hasamps:
     H.root.sol000.amplitude000.val[:] = np.copy(amp)
    if hastec:
     H.root.sol000.tec000.val[:] = np.copy(tec)
    if hasrotation:
     H.root.sol000.rotation000.val[:] = np.copy(rotation)

    H.flush()
    H.close()
    return

def resetsolsfordir(h5parm, dirlist, refant=None):
    ''' Reset solutions for directions (DDE solves only)

    Args:
      h5parm: h5parm file
      dirlist: list of direction_id to reset
      refant: reference antenna
    '''
    print(h5parm, dirlist)
    fulljones = fulljonesparmdb(h5parm) # True/False
    hasphase = True
    hasamps  = True
    hasrotation = True
    hastec = True

    H=tables.open_file(h5parm)

    # figure of we have phase and/or amplitude solutions
    try:
     directions = H.root.sol000.amplitude000.dir[:]
     axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
    except:
      hasamps = False
    try:
     directions = H.root.sol000.phase000.dir[:]
     axisn = H.root.sol000.phase000.val.attrs['AXES'].decode().split(',')
    except:
     hasphase = False
    try:
     directions = H.root.sol000.tec000.dir[:]
     axisn = H.root.sol000.tec000.val.attrs['AXES'].decode().split(',')
    except:
     hastec = False
    try:
     directions = H.root.sol000.rotation000.dir[:]
     axisn = H.root.sol000.rotation000.val.attrs['AXES'].decode().split(',')
    except:
     hasrotation = False
    H.close()

    # in case refant is None but h5 still has phase
    # this can happen with a scalaramplitude and soltypelist_includedir is used
    # in this case we have pertubative direction
    # in this case h5_merger has already been run which created a phase000 entry
    if refant is None and hasphase: 
       refant=findrefant_core(h5parm)
       force_close(h5parm)

    # should not be needed as h5_merger does not create rotation000
    # keep this code in case of future h5_merger updates so we are safe
    if refant is None and hasrotation: 
       refant=findrefant_core(h5parm)
       force_close(h5parm)

    # should not be needed as h5_merger does not create tec000
    # keep this code in case of future h5_merger updates so we are safe
    if refant is None and hastec:
       refant=findrefant_core(h5parm)
       force_close(h5parm)       

    H=tables.open_file(h5parm, mode='a')
    if hasamps:
     amp = H.root.sol000.amplitude000.val[:]
    if hasphase: # also phasereference
     phase = H.root.sol000.phase000.val[:]
     refant_idx = np.where(H.root.sol000.phase000.ant[:].astype(str) == refant) # to deal with byte strings
     print(refant_idx, refant)
     antennaxis = axisn.index('ant')
     axisn = H.root.sol000.phase000.val.attrs['AXES'].decode().split(',')
     print('Referencing phase to ', refant, 'Axis entry number', axisn.index('ant'))
     if antennaxis == 0:
        phasen = phase - phase[refant_idx[0],...]
     if antennaxis == 1:
        phasen = phase - phase[:,refant_idx[0],...]
     if antennaxis == 2:
        phasen = phase - phase[:,:,refant_idx[0],...]
     if antennaxis == 3:
        phasen = phase - phase[:,:,:,refant_idx[0],...]
     if antennaxis == 4:
        phasen = phase - phase[:,:,:,:,refant_idx[0],...]
     phase = np.copy(phasen)


    if hastec:
     tec = H.root.sol000.tec000.val[:]
     refant_idx = np.where(H.root.sol000.tec000.ant[:].astype(str) == refant) # to deal with byte strings
     print(refant_idx, refant)
     antennaxis = axisn.index('ant')
     axisn = H.root.sol000.tec000.val.attrs['AXES'].decode().split(',')
     print('Referencing tec to ', refant, 'Axis entry number', axisn.index('ant'))
     if antennaxis == 0:
        tecn = tec - tec[refant_idx[0],...]
     if antennaxis == 1:
        tecn = tec - tec[:,refant_idx[0],...]
     if antennaxis == 2:
        tecn = tec - tec[:,:,refant_idx[0],...]
     if antennaxis == 3:
        tecn = tec - tec[:,:,:,refant_idx[0],...]
     if antennaxis == 4:
        tecn = tec - tec[:,:,:,:,refant_idx[0],...]
     tec = np.copy(tecn)

    if hasrotation:
     rotation = H.root.sol000.rotation000.val[:]
     refant_idx = np.where(H.root.sol000.rotation000.ant[:].astype(str) == refant) # to deal with byte strings
     print(refant_idx, refant)
     antennaxis = axisn.index('ant')
     axisn = H.root.sol000.rotation000.val.attrs['AXES'].decode().split(',')
     print('Referencing rotation to ', refant, 'Axis entry number', axisn.index('ant'))
     if antennaxis == 0:
        rotationn = rotation - rotation[refant_idx[0],...]
     if antennaxis == 1:
        rotationn = rotation - rotation[:,refant_idx[0],...]
     if antennaxis == 2:
        rotationn = rotation - rotation[:,:,refant_idx[0],...]
     if antennaxis == 3:
        rotationn = rotation - rotation[:,:,:,refant_idx[0],...]
     if antennaxis == 4:
        rotationn = rotation - rotation[:,:,:,:,refant_idx[0],...]
     rotation = np.copy(rotationn)


    for directionid,direction in enumerate(directions.astype(str)): # to deal with byte formatted array
     # if not isinstance(antenna, str):
     #  antenna_str = antenna.decode() # to deal with byte formatted antenna names
     # else:
     #  antenna_str = antenna # already str type

     print(directionid,direction, hasphase, hasamps, hastec, hasrotation)
     if directionid in dirlist: # in this case reset value to 0.0 (or 1.0)
       if hasphase:
         diraxis = axisn.index('dir')
         axisn = H.root.sol000.phase000.val.attrs['AXES'].decode().split(',')
         print('Resetting phase direction ID', directionid, 'Axis entry number', axisn.index('dir'))
         # print(phase[:,:,directionid,...])
         if diraxis == 0:
           phase[directionid,...] = 0.0
         if diraxis == 1:
           phase[:,directionid,...] = 0.0
         if diraxis == 2:
           phase[:,:,directionid,...] = 0.0
         if diraxis == 3:
           phase[:,:,:,directionid,...] = 0.0
         if diraxis == 4:
           phase[:,:,:,:,directionid,...] = 0.0
         # print(phase[:,:,directionid,...])
       if hasamps:
         diraxis = axisn.index('dir')
         axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
         print('Resetting amplitude direction ID', directionid, 'Axis entry number', axisn.index('dir'))
         if diraxis == 0:
           amp[directionid,...] = 1.0
         if diraxis == 1:
           amp[:,directionid,...] = 1.0
         if diraxis == 2:
           amp[:,:,directionid,...] = 1.0
         if diraxis == 3:
           amp[:,:,:,directionid,...] = 1.0
         if diraxis == 4:
           amp[:,:,:,:,directionid,...] = 1.0
         if fulljones:
           print('pol entry axis:', axisn.index('pol'))
           if len(axisn) != axisn.index('pol')+1:
              print('Pol-axis not the last enrty, cannot handle this')
              sys.exit()
           # hardcoded, assumes pol-axis is last
           if diraxis == 0:
             amp[directionid,...,1] = 0.
             amp[directionid,...,2] = 0.
           if diraxis == 1:
             amp[:,directionid,...,1] = 0.
             amp[:,directionid,...,2] = 0.
           if diraxis == 2:
             amp[:,:,directionid,...,1] = 0.
             amp[:,:,directionid,...,2] = 0.
           if diraxis == 3:
             amp[:,:,:,directionid,...,1] = 0.
             amp[:,:,:,directionid,...,2] = 0.
           if diraxis == 4:
             amp[:,:,:,:,directionid,...,1] = 0.
             amp[:,:,:,:,directionid,...,2] = 0.
           
           #amp[...,1] = 0.0 # XY, assumpe pol is last axis
           #amp[...,2] = 0.0 # YX, assume pol is last axis

       if hastec:
         diraxis = axisn.index('dir')
         axisn = H.root.sol000.tec000.val.attrs['AXES'].decode().split(',')
         print('Resetting TEC direction ID', directionid, 'Axis entry number', axisn.index('dir'))
         if diraxis == 0:
           tec[directionid,...] = 0.0
         if diraxis == 1:
           tec[:,directionid,...] = 0.0
         if diraxis == 2:
           tec[:,:,directionid,...] = 0.0
         if diraxis == 3:
           tec[:,:,:,directionid,...] = 0.0
         if diraxis == 4:
           tec[:,:,:,:,directionid,...] = 0.0
       if hasrotation:
         diraxis = axisn.index('dir')
         axisn = H.root.sol000.rotation000.val.attrs['AXES'].decode().split(',')
         print('Resetting rotation direction ID', directionid, 'Axis entry number', axisn.index('dir'))
         if diraxis == 0:
           rotation[directionid,...] = 0.0
         if diraxis == 1:
           rotation[:,directionid,...] = 0.0
         if diraxis == 2:
           rotation[:,:,directionid,...] = 0.0
         if diraxis == 3:
           rotation[:,:,:,directionid,...] = 0.0
         if diraxis == 4:
           rotation[:,:,:,:,directionid,...] = 0.0
    # fill values back in
    if hasphase:
     H.root.sol000.phase000.val[:] = np.copy(phase)
    if hasamps:
     H.root.sol000.amplitude000.val[:] = np.copy(amp)
    if hastec:
     H.root.sol000.tec000.val[:] = np.copy(tec)
    if hasrotation:
     H.root.sol000.rotation000.val[:] = np.copy(rotation)

    H.flush()
    H.close()
    return


def str_or_int(arg):
    try:
        return int(arg)  # try convert to int
    except ValueError:
        pass
    if isinstance(arg, str):
        return arg
    raise argparse.ArgumentTypeError("Input must be an int or string")

def str_or_float(arg):
    try:
        return float(arg)  # try convert to int
    except ValueError:
        pass
    if isinstance(arg, str):
        return arg
    raise argparse.ArgumentTypeError("Input must be an int or string")


def floatlist_or_float(argin):
    if argin is None:
      return argin
    try:
        return float(argin)  # try convert to float
    except ValueError:
        pass
    
    arg = ast.literal_eval(argin)

    if type(arg) is not list:
        raise argparse.ArgumentTypeError("Argument \"%s\" is not a list" % (argin))

    # check for float list
    if all([(isinstance(item, float) or isinstance(item, int)) for item in arg]):
        return arg  
    else:
      raise argparse.ArgumentTypeError("This needs to be a float or list of floats")


def removenans(parmdb, soltab):
    ''' Remove nan values in h5parm

    Args:
      parmdb: h5parm file
      soltab: solution table name (amplitude000, phase000, rotation000, ...)
    '''
    H5 = h5parm.h5parm(parmdb, readonly=False)
    vals =H5.getSolset('sol000').getSoltab(soltab).getValues()[0]
    weights = H5.getSolset('sol000').getSoltab(soltab).getValues(weight=True)[0]

    idxnan  = np.where((~np.isfinite(vals)))

    # print(idxnan)
    # print('Found some NaNs', vals[idxnan])
    print('Found some NaNs, flagging them....')

    if H5.getSolset('sol000').getSoltab(soltab).getType() == 'phase':
       vals[idxnan] = 0.0
    if H5.getSolset('sol000').getSoltab(soltab).getType() == 'amplitude':
       vals[idxnan] = 1.0
    if H5.getSolset('sol000').getSoltab(soltab).getType() == 'rotation':
       vals[idxnan] = 0.0

    weights[idxnan] = 0.0

    H5.getSolset('sol000').getSoltab(soltab).setValues(weights,weight=True)
    H5.getSolset('sol000').getSoltab(soltab).setValues(vals)
    H5.close()
    return

def removenans_fulljones(parmdb):
    ''' Remove nan values in full jones h5parm

    Args:
      parmdb: h5parm file
    '''
    H=tables.open_file(parmdb, mode='a')
    amplitude = H.root.sol000.amplitude000.val[:]
    weights   = H.root.sol000.amplitude000.weight[:]
    phase = H.root.sol000.phase000.val[:]
    weights_p = H.root.sol000.phase000.weight[:]

    # XX
    amps_xx = amplitude[...,0]
    weights_xx = weights[...,0]
    idx = np.where((~np.isfinite(amps_xx)))
    amps_xx[idx] = 1.0
    weights_xx[idx] =  0.0
    phase_xx = phase[...,0]
    weights_p_xx = weights_p[...,0]
    phase_xx[idx] = 0.0 
    weights_p_xx[idx] = 0.0

    # XY
    amps_xy = amplitude[...,1]
    weights_xy = weights[...,1]
    idx = np.where((~np.isfinite(amps_xy)))
    amps_xy[idx] = 0.0
    weights_xy[idx] =  0.0
    phase_xy = phase[...,1]
    weights_p_xy = weights_p[...,1]
    phase_xy[idx] = 0.0 
    weights_p_xy[idx] = 0.0

    # XY
    amps_yx = amplitude[...,2]
    weights_yx = weights[...,2]
    idx = np.where((~np.isfinite(amps_yx)))
    amps_yx[idx] = 0.0
    weights_yx[idx] =  0.0
    phase_yx = phase[...,2]
    weights_p_yx = weights_p[...,2]
    phase_yx[idx] = 0.0 
    weights_p_yx[idx] = 0.0

    # YY
    amps_yy = amplitude[...,3]
    weights_yy = weights[...,3]
    idx = np.where((~np.isfinite(amps_yy)))
    amps_yy[idx] = 1.0
    weights_yy[idx] =  0.0
    phase_yy = phase[...,3]
    weights_p_yy = weights_p[...,3]
    phase_yy[idx] = 0.0 
    weights_p_yy[idx] = 0.0
       
    amplitude[...,0] = amps_xx
    amplitude[...,1] = amps_xy
    amplitude[...,2] = amps_yx
    amplitude[...,3] = amps_yy
  
    weights[...,0] = weights_yy
    weights[...,1] = weights_xy
    weights[...,2] = weights_yx
    weights[...,3] = weights_yy
    H.root.sol000.amplitude000.val[:] = amplitude
    H.root.sol000.amplitude000.weight[:] = weights 
  
    phase[...,0] = phase_xx
    phase[...,1] = phase_xy
    phase[...,2] = phase_yx
    phase[...,3] = phase_yy
  
    weights_p[...,0] = weights_p_yy
    weights_p[...,1] = weights_p_xy
    weights_p[...,2] = weights_p_yx
    weights_p[...,3] = weights_p_yy
    H.root.sol000.phase000.val[:] = phase
    H.root.sol000.phase000.weight[:] = weights_p 
    H.close()
    return


def radec_to_xyz(ra, dec, time):
    ''' Convert ra and dec coordinates to ITRS coordinates for LOFAR observations.

    Args:
        ra (astropy Quantity): right ascension
        dec (astropy Quantity): declination
        time (float): MJD time in seconds
    Returns:
        pointing_xyz (ndarray): NumPy array containing the X, Y and Z coordinates
    '''
    obstime = Time(time/3600/24, scale='utc', format='mjd')
    loc_LOFAR = EarthLocation(lon=0.11990128407256424, lat=0.9203091252660295, height=6364618.852935438*units.m)

    dir_pointing = SkyCoord(ra, dec)
    dir_pointing_altaz = dir_pointing.transform_to(AltAz(obstime=obstime, location=loc_LOFAR))
    dir_pointing_xyz = dir_pointing_altaz.transform_to(ITRS)

    pointing_xyz = np.asarray([dir_pointing_xyz.x, dir_pointing_xyz.y, dir_pointing_xyz.z])
    return pointing_xyz

def losotolofarbeam(parmdb, soltabname, ms, inverse=False, useElementResponse=True, useArrayFactor=True, useChanFreq=True, beamlib='stationresponse'):
    """
    Do the beam correction via this imported losoto operation

    Args:
        parmdb (str): path to the h5parm corrections will be stored in.
        soltabname (str): name of the soltab corrections will be stored in.
        ms (str): path to the MS (used to determine the stations present).
        inverse (bool): calculate the inverse beam correction (i.e. undo the beam).
        useElementResponse (bool): correct for the "element beam" (distance to the tile beam centre).
        useArrayFactor (bool): correct for the "array factor" (sensitivity loss as function of distance to the pointing centre).
        useChanFreq (bool): calculate a beam correction for every channel.
        beamlib (str): beam calculation mode. Can be 'stationresponse' to use the LOFARBeam library (deprecated) or everybeam to use the EveryBeam library.
    """

    H5 = h5parm.h5parm(parmdb, readonly=False)
    soltab = H5.getSolset('sol000').getSoltab(soltabname)
    times = soltab.getAxisValues('time')
    numants = pt.taql('select gcount(*) as numants from '+ms+'::ANTENNA').getcol('numants')[0]
    H5ants = len(soltab.getAxisValues('ant'))
    if numants != H5ants:
        H5.close()
        raise ValueError('Number of antennas in Measurement Set does not match number of antennas in H5parm.')

    if (beamlib.lower() == 'stationresponse') or (beamlib.lower() == 'lofarbeam'):
        from lofar.stationresponse import stationresponse
        sr = stationresponse(ms, inverse, useElementResponse, useArrayFactor, useChanFreq)

        for vals, coord, selection in soltab.getValuesIter(returnAxes=['ant','time','pol','freq'], weight=False):
            vals = losoto.lib_operations.reorderAxes( vals, soltab.getAxesNames(), ['ant','time','freq','pol'] )

            for stationnum in range(numants):
                logger.debug('Working on station number %i' % stationnum)
                for itime, time in enumerate(times):
                    beam = sr.evaluateStation(time=time, station=stationnum)
                    # Reshape from [nfreq, 2, 2] to [nfreq, 4]
                    beam = beam.reshape(beam.shape[0], 4)

                    if soltab.getAxisLen('pol') == 2:
                        beam = beam[:,[0,3]] # get only XX and YY

                    if soltab.getType() == 'amplitude':
                        vals[stationnum, itime, :, :] = np.abs(beam)
                    elif soltab.getType() == 'phase':
                        vals[stationnum, itime, :, :] = np.angle(beam)
                    else:
                        logger.error('Beam prediction works only for amplitude/phase solution tables.')
                        return 1

            vals = losoto.lib_operations.reorderAxes( vals, ['ant','time','freq','pol'], [ax for ax in soltab.getAxesNames() if ax in ['ant','time','freq','pol']] )
            soltab.setValues(vals, selection)
    elif beamlib.lower() == 'everybeam':
        from tqdm import tqdm
        from joblib import Parallel, delayed, parallel_backend
        import dill as pickle
        import psutil
        freqs = soltab.getAxisValues('freq')

        # Obtain direction to calculate beam for.
        dirs = pt.taql('SELECT REFERENCE_DIR,PHASE_DIR FROM {ms:s}::FIELD'.format(ms=ms))
        ra_ref, dec_ref = dirs.getcol('REFERENCE_DIR').squeeze()
        ra, dec = dirs.getcol('PHASE_DIR').squeeze()
        reference_xyz = list(zip(*radec_to_xyz(ra_ref * units.rad, dec_ref * units.rad, times)))
        phase_xyz = list(zip(*radec_to_xyz(ra * units.rad, dec * units.rad, times)))


        for vals, coord, selection in soltab.getValuesIter(returnAxes=['ant','time','pol','freq'], weight=False):
            vals = losoto.lib_operations.reorderAxes( vals, soltab.getAxesNames(), ['ant','time','freq','pol'] )
            stationloop = tqdm(range(numants))
            stationloop.set_description('Stations processed: ')
            for stationnum in range(numants):
                stationloop.update()
                logger.debug('Working on station number %i' % stationnum)
                # Parallelise over channels to speed things along.
                with parallel_backend('loky', n_jobs=len(psutil.Process().cpu_affinity())):
                    results = Parallel()(delayed(process_channel_everybeam)(f, stationnum=stationnum, useElementResponse=useElementResponse, useArrayFactor=useArrayFactor, useChanFreq=useChanFreq, ms=ms, freqs=freqs, times=times, ra=ra, dec=dec, ra_ref=ra_ref, dec_ref=dec_ref, reference_xyz=reference_xyz, phase_xyz=phase_xyz) for f in range(len(freqs)))
                    for freqslot in results:
                        ifreq, beam = freqslot
                        if soltab.getAxisLen('pol') == 2:
                            beam = beam.reshape((beam.shape[0], 4))[:, [0, 3]] # get only XX and YY
                        if soltab.getType() == 'amplitude':
                            vals[stationnum, :, ifreq, :] = np.abs(beam)
                        elif soltab.getType() == 'phase':
                            vals[stationnum, :, ifreq, :] = np.angle(beam)
                        else:
                            logger.error('Beam prediction works only for amplitude/phase solution tables.')
                            return 1
            vals = losoto.lib_operations.reorderAxes( vals, ['ant','time','freq','pol'], [ax for ax in soltab.getAxesNames() if ax in ['ant','time','freq','pol']] )
            soltab.setValues(vals, selection)

    else:
        H5.close()
        raise ValueError('Unsupported beam library specified')

    H5.close()
    return

def process_channel_everybeam(ifreq, stationnum, useElementResponse, useArrayFactor, useChanFreq, ms, freqs, times, ra, dec, ra_ref, dec_ref, reference_xyz, phase_xyz):
    if useElementResponse and useArrayFactor:
        #print('Full (element+array_factor) beam correction requested. Using use_differential_beam=False.')
        obs = everybeam.load_telescope(ms, use_differential_beam=False, use_channel_frequency=useChanFreq)
    elif not useElementResponse and useArrayFactor:
        #print('Array factor beam correction requested. Using use_differential_beam=True.')
        obs = everybeam.load_telescope(ms, use_differential_beam=True, use_channel_frequency=useChanFreq)
    elif useElementResponse and not useArrayFactor:
        #print('Element beam correction requested.')
        # Not sure how to do this with EveryBeam.
        raise NotImplementedError('Element beam only correction is not implemented in facetselfcal.')

    #print(f'Processing channel {ifreq}')
    freq = freqs[ifreq]
    timeslices = np.empty((len(times), 2, 2), dtype=np.complex128)
    for itime, time in enumerate(times):
        #timeloop.update()
        if not useElementResponse and useArrayFactor:
            # Array-factor-only correction.
            beam = obs.array_factor(times[itime], stationnum, freq, phase_xyz[itime], reference_xyz[itime])
        else:
            beam = obs.station_response(time=time, station_idx=stationnum, freq=freq, ra=ra, dec=dec)
        #beam = beam.reshape(4)
        timeslices[itime] = beam
    return ifreq, timeslices

# losotolofarbeam('P214+55_PSZ2G098.44+56.59.dysco.sub.shift.avg.weights.ms.archive_templatejones.h5', 'amplitude000', 'P214+55_PSZ2G098.44+56.59.dysco.sub.shift.avg.weights.ms.archive', inverse=False, useElementResponse=False, useArrayFactor=True, useChanFreq=True)


def cleanup(mslist):
    ''' Clean up directory

    Args:
        mslist: list with MS files
    '''
    for ms in mslist:
        os.system('rm -rf ' + ms)

    os.system('rm -f *first-residual.fits')
    os.system('rm -f *psf.fits')
    os.system('rm -f *-00*-*.fits')
    os.system('rm -f *dirty.fits')
    os.system('rm -f solintimage*model.fits')
    os.system('rm -f solintimage*residual.fits')
    os.system('rm -f *pybdsf.log')
    return


def flagms_startend(ms, tecsolsfile, tecsolint):
    '''

    Args:
        ms: measurement set
        tecsolsfile: solution file with TEC
        tecsolint:
        example of taql command: taql ' select from test.ms where TIME in (select distinct TIME from test.ms offset 0 limit 1798) giving test.ms.cut as plain'
    '''

    taql = 'taql'

    msout = ms + '.cut'

    H5 =h5parm.h5parm(tecsolsfile)
    tec = H5.getSolset('sol000').getSoltab('tec000').getValues()
    tecvals = tec[0]

    axis_names = H5.getSolset('sol000').getSoltab('tec000').getAxesNames()
    time_ind = axis_names.index('time')
    ant_ind = axis_names.index('ant')
    
    # ['time', 'ant', 'dir', 'freq']
    reftec = tecvals[:,0,0,0] 
    
    # print np.shape( tecvals[:,:,0,0]), np.shape( reftec[:,None]), 
    tecvals = tecvals[:,:,0,0] - reftec[:,None] # reference to zero

    times   = tec[1]['time']
    
    # print tecvals[:,0]
    
    goodtimesvec = []

    for timeid, time in enumerate(times):

      tecvals[timeid,:]
      
      # print timeid, np.count_nonzero( tecvals[timeid,:])
      goodtimesvec.append(np.count_nonzero( tecvals[timeid,:]))


    goodstartid = np.argmax (np.array(goodtimesvec) > 0)
    goodendid   = len(goodtimesvec) - np.argmax (np.array(goodtimesvec[::-1]) > 0)

    print('First good solutionslot,', goodstartid, ' out of', len(goodtimesvec))
    print('Last good solutionslot,', goodendid, ' out of', len(goodtimesvec))
    H5.close()

    if (goodstartid != 0) or (goodendid != len(goodtimesvec)): # only do if needed to save some time
        cmd = taql + " ' select from " + ms + " where TIME in (select distinct TIME from " + ms
        cmd+= " offset " + str(goodstartid*int(tecsolint))
        cmd+= " limit " + str((goodendid-goodstartid)*int(tecsolint)) +") giving "
        cmd+= msout + " as plain'"

        print(cmd)
        run(cmd)

        os.system('rm -rf ' + ms)
        os.system('mv ' + msout + ' ' + ms)
    return


# flagms_startend('P215+50_PSZ2G089.52+62.34.dysco.sub.shift.avg.weights.ms.archive','phaseonlyP215+50_PSZ2G089.52+62.34.dysco.sub.shift.avg.weights.ms.archivesolsgrid_9.h5', 2)


def removestartendms(ms, starttime=None, endtime=None, dysco=True):

    # chdeck if output is already there and remove
    if os.path.isdir(ms + '.cut'):
          os.system('rm -rf ' + ms + '.cut')
    if os.path.isdir(ms + '.cuttmp'):
          os.system('rm -rf ' + ms + '.cuttmp')

    cmd = 'DP3 msin=' + ms + ' ' + 'msout=' + ms + '.cut '
    if dysco:
      cmd+= 'msout.storagemanager=dysco '
      cmd += 'msout.storagemanager.weightbitrate=16 '
    cmd+=  'msin.weightcolumn=WEIGHT_SPECTRUM steps=[] '
    if starttime is not None:
      cmd+= 'msin.starttime=' + starttime + ' '
    if endtime is not None:
      cmd+= 'msin.endtime=' + endtime   + ' '
    print(cmd)
    run(cmd)

    cmd = 'DP3 msin=' + ms + ' ' + 'msout=' + ms + '.cuttmp '
    if dysco:
      cmd+= 'msout.storagemanager=dysco '
      cmd += 'msout.storagemanager.weightbitrate=16 '
    cmd+= 'msin.weightcolumn=WEIGHT_SPECTRUM_SOLVE steps=[] '
    if starttime is not None:
      cmd+= 'msin.starttime=' + starttime + ' '
    if endtime is not None:
      cmd+= 'msin.endtime=' + endtime   + ' '
    print(cmd)
    run(cmd)

    # Make a WEIGHT_SPECTRUM from WEIGHT_SPECTRUM_SOLVE
    t  = pt.table(ms + '.cut' , readonly=False)

    print('Adding WEIGHT_SPECTRUM_SOLVE')
    desc = t.getcoldesc('WEIGHT_SPECTRUM')
    desc['name']='WEIGHT_SPECTRUM_SOLVE'
    t.addcols(desc)

    t2 = pt.table(ms + '.cuttmp' , readonly=True)
    imweights = t2.getcol('WEIGHT_SPECTRUM')
    t.putcol('WEIGHT_SPECTRUM_SOLVE', imweights)

    # Fill WEIGHT_SPECTRUM with WEIGHT_SPECTRUM from second ms
    t2.close()
    t.close()

    # clean up
    os.system('rm -rf ' + ms + '.cuttmp')

    return

# removestartendms('P219+50_PSZ2G084.10+58.72.dysco.sub.shift.avg.weights.ms.archive',endtime='16-Apr-2015/02:14:47.0')
# removestartendms('P223+50_PSZ2G084.10+58.72.dysco.sub.shift.avg.weights.ms.archive',starttime='24-Feb-2015/22:16:00.0')
# removestartendms('P223+52_PSZ2G088.98+55.07.dysco.sub.shift.avg.weights.ms.archive',starttime='19-Feb-2015/22:40:00.0')
# removestartendms('P223+55_PSZ2G096.14+56.24.dysco.sub.shift.avg.weights.ms.archive',starttime='31-Mar-2015/20:11:00.0')
# removestartendms('P227+53_PSZ2G088.98+55.07.dysco.sub.shift.avg.weights.ms.archive',starttime='19-Feb-2015/22:40:00.0')

def which(file_name):
    for path in os.environ["PATH"].split(os.pathsep):
        full_path = os.path.join(path, file_name)
        if os.path.exists(full_path) and os.access(full_path, os.X_OK):
            return full_path
    return None

def _add_astropy_beam(fitsname):
    ''' Add beam from astropy

    Args:
        fitsname: name of fits file
    Returns:
        ellipse
    '''

    head = fits.getheader(fitsname)
    bmaj = head['BMAJ']
    bmin = head['BMIN']
    bpa  = head['BPA']
    cdelt = head['CDELT2']
    bmajpix = bmaj/cdelt
    bminpix = bmin/cdelt
    ellipse = matplotlib.patches.Ellipse((20,20), bmajpix,bminpix,bpa)
    return ellipse

def plotimage_astropy(fitsimagename, outplotname, mask=None, rmsnoiseimage=None):
  # image noise for plotting
  if rmsnoiseimage is None:
    hdulist = fits.open(fitsimagename)
  else:
    hdulist = fits.open(rmsnoiseimage)
  imagenoise = findrms(np.ndarray.flatten(hdulist[0].data))
  hdulist.close()

  # image noise info
  hdulist = fits.open(fitsimagename) 
  imagenoiseinfo = findrms(np.ndarray.flatten(hdulist[0].data))
  logger.info(fitsimagename + ' Max image: ' + str(np.max(np.ndarray.flatten(hdulist[0].data))))
  logger.info(fitsimagename + ' Min image: ' + str(np.min(np.ndarray.flatten(hdulist[0].data))))
  hdulist.close()

  data = fits.getdata(fitsimagename)
  head = fits.getheader(fitsimagename)
  f = plt.figure()
  ax = f.add_subplot(111,projection=WCS(head),slices=('x','y',0,0))
  img = ax.imshow(data[0,0,:,:],cmap='bone',vmax=16*imagenoise, vmin=-6*imagenoise)
  ax.set_title(fitsimagename+' (noise = {} mJy/beam)'.format(round(imagenoiseinfo*1e3, 3)))
  ax.grid(True)
  ax.set_xlabel('Right Ascension (J2000)')
  ax.set_ylabel('Declination (J2000)')
  cbar = plt.colorbar(img)
  cbar.set_label('Flux (Jy beam$^{-1}$)')
  ax.add_artist(_add_astropy_beam(fitsimagename))

  if mask is not None:
    maskdata = fits.getdata(mask)[0,0,:,:]
    ax.contour(maskdata, colors='red', levels=[0.1*imagenoise],filled=False, smooth=1, alpha=0.6, linewidths=1)

  if os.path.isfile(outplotname + '.png'):
      os.system('rm -f ' + outplotname + '.png')
  plt.savefig(outplotname, dpi=450, format='png')
  logger.info(fitsimagename + ' RMS noise: ' + str(imagenoiseinfo))
  return

def plotimage_aplpy(fitsimagename, outplotname, mask=None, rmsnoiseimage=None):
  import aplpy
  # image noise for plotting
  if rmsnoiseimage is None:
    hdulist = fits.open(fitsimagename)
  else:
    hdulist = fits.open(rmsnoiseimage)
  imagenoise = findrms(np.ndarray.flatten(hdulist[0].data))
  hdulist.close() 
  
  # image noise info
  hdulist = fits.open(fitsimagename) 
  imagenoiseinfo = findrms(np.ndarray.flatten(hdulist[0].data))
  logger.info(fitsimagename + ' Max image: ' + str(np.max(np.ndarray.flatten(hdulist[0].data))))
  logger.info(fitsimagename + ' Min image: ' + str(np.min(np.ndarray.flatten(hdulist[0].data))))
  hdulist.close()

  f = aplpy.FITSFigure(fitsimagename, slices=[0, 0])
  f.show_colorscale(vmax=16*imagenoise, vmin=-6*imagenoise, cmap='bone')
  f.set_title(fitsimagename+' (noise = {} mJy/beam)'.format(round(imagenoiseinfo*1e3, 3)))
  try: # to work around an aplpy error
    f.add_beam()
    f.beam.set_frame(True)
    f.beam.set_color('white')
    f.beam.set_edgecolor('black')
    f.beam.set_linewidth(1.)
  except:
    pass

  f.add_grid()
  f.grid.set_color('white')
  f.grid.set_alpha(0.5)
  f.grid.set_linewidth(0.2)
  f.add_colorbar()
  f.colorbar.set_axis_label_text('Flux (Jy beam$^{-1}$)')
  if mask is not None:
    try:
      f.show_contour(mask, colors='red', levels=[0.1*imagenoise], filled=False, smooth=1, alpha=0.6, linewidths=1)
    except:
      pass
  if os.path.isfile(outplotname + '.png'):
      os.system('rm -f ' + outplotname + '.png')
  f.save(outplotname, dpi=120, format='png')
  logger.info(fitsimagename + ' RMS noise: ' + str(imagenoiseinfo))
  return


def plotimage(fitsimagename,outplotname,mask=None,rmsnoiseimage=None):
  # This code tries astropy first, switches to aplpy afterwards.
  try:
      plotimage_astropy(fitsimagename,outplotname,mask,rmsnoiseimage)
  except:
      plotimage_aplpy(fitsimagename,outplotname,mask,rmsnoiseimage)


def archive(mslist, outtarname, regionfile, fitsmask, imagename, dysco=True, mergedh5_i=None, facetregionfile=None):
  path = '/disks/ftphome/pub/vanweeren'
  for ms in mslist:
    msout = ms + '.calibrated'
    if os.path.isdir(msout):
      os.system('rm -rf ' + msout)
    cmd  ='DP3 numthreads='+ str(multiprocessing.cpu_count()) +' msin=' + ms + ' msout=' + msout + ' '
    cmd +='msin.datacolumn=CORRECTED_DATA steps=[] '
    if dysco:
      cmd += 'msout.storagemanager=dysco '
      cmd += 'msout.storagemanager.weightbitrate=16 '
    run(cmd)


  msliststring = ' '.join(map(str, glob.glob('*.calibrated') ))
  cmd = 'tar -zcf ' + outtarname + ' ' + msliststring + ' selfcal.log ' +  imagename + ' '

  if fitsmask is not None:  # add fitsmask to tar if it exists
    if os.path.isfile(fitsmask):
      cmd +=  fitsmask + ' '

  if regionfile is not None:  # add box regionfile to tar if it exists
    if os.path.isfile(regionfile):
      cmd +=  regionfile + ' '

  if mergedh5_i is not None:
    mergedh5_i_string = ' '.join(map(str, mergedh5_i ))
    cmd += mergedh5_i_string + ' '

  if facetregionfile is not None:  # add facet region file to tar if it exists
    if os.path.isfile(facetregionfile):
      cmd +=  facetregionfile + ' '	

	
  if os.path.isfile(outtarname):
      os.system('rm -f ' + outtarname)
  logger.info('Creating archived calibrated tarball: ' + outtarname)
  run(cmd)

  for ms in mslist:
    msout = ms + '.calibrated'
    os.system('rm -rf ' + msout)
  return


def setinitial_solint(mslist, longbaseline, LBA, options):
   """
   take user input solutions,nchan,smoothnessconstraint,antennaconstraint and expand them to all ms
   these list can then be updated later with values from auto_determinesolints for example
   """

   nchan_list  = [] # list with len(options.soltype_list)
   solint_list = [] # list with len(options.soltype_list)
   smoothnessconstraint_list = [] # nested list with len(options.soltype_list), inner list is for ms
   smoothnessreffrequency_list = [] # nested list with len(options.soltype_list), inner list is for ms
   smoothnessspectralexponent_list = [] # nest list with len(options.soltype_list), inner list is for ms
   smoothnessrefdistance_list = [] #  # nest list with len(options.soltype_list), inner list is for ms
   antennaconstraint_list = [] # nested list with len(options.soltype_list), inner list is for ms
   resetsols_list = [] # nested list with len(options.soltype_list), inner list is for ms
   resetdir_list = [] # nested list with len(options.soltype_list), inner list is for ms
   normamps_list = [] #  # nested list with len(options.soltype_list), inner list is for ms
   soltypecycles_list = []  # nested list with len(options.soltype_list), inner list is for ms
   uvmin_list = []  # nested list with len(options.soltype_list), inner list is for ms
   uvmax_list = []  # nested list with len(options.soltype_list), inner list is for ms
   uvminim_list = []  # nested list with len(options.soltype_list), inner list is for ms
   uvmaxim_list = []  # nested list with len(options.soltype_list), inner list is for ms
   BLsmooth_list = []  # nested list with len(options.soltype_list), inner list is for ms
   
   # make here uvminim_list and uvmaxim_list, because the have just the length of mslist
   for ms_id, ms in enumerate(mslist):
      try:
         uvminim = options.uvminim[ms_id]
      except:
         uvminim = options.uvminim # apparently we just have a float and not a list
      uvminim_list.append(uvminim)
   for ms_id, ms in enumerate(mslist):
      try:
         uvmaxim = options.uvmaxim[ms_id]
      except:
         uvmaxim = options.uvmaxim # apparently we just have a float and not a list
      uvmaxim_list.append(uvmaxim)


   for soltype_id, soltype in enumerate(options.soltype_list):
     nchan_ms   = [] # list with len(mslist)
     solint_ms  = [] # list with len(mslist)
     antennaconstraint_list_ms   = [] # list with len(mslist)
     resetsols_list_ms = [] # list with len(mslist)
     resetdir_list_ms = [] # list with len(mslist)
     normamps_list_ms = [] # list with len(mslist)
     smoothnessconstraint_list_ms  = [] # list with len(mslist)
     smoothnessreffrequency_list_ms  = [] # list with len(mslist)
     smoothnessspectralexponent_list_ms = [] # list with len(mslist)
     smoothnessrefdistance_list_ms = [] # list with len(mslist)
     BLsmooth_list_ms = [] # list with len(mslist)
     soltypecycles_list_ms = [] # list with len(mslist)
     uvmin_list_ms = []  # list with len(mslist)
     uvmax_list_ms = []  # list with len(mslist)
     #uvminim_list_ms = []  # list with len(mslist)
     #uvmaxim_list_ms = []  # list with len(mslist)
   
     for ms in mslist:
       # use try statement in case the user did not provide all the info for certain soltypes
          
       # solint 
       try:
         solint = options.solint_list[soltype_id]
       except:
         solint = 1

       # nchan
       try:
         nchan = options.nchan_list[soltype_id]
       except:
         nchan = 1 # if nothing is set use 1

       # smoothnessconstraint
       try:
         smoothnessconstraint = options.smoothnessconstraint_list[soltype_id]
       except:
         smoothnessconstraint = 0.0

       # BLsmooth
       try:
         BLsmooth = options.BLsmooth_list[soltype_id]  
       except:
         BLsmooth = False
         
       # smoothnessreffrequency
       try:
         smoothnessreffrequency = options.smoothnessreffrequency_list[soltype_id]
       except:
         smoothnessreffrequency = 0.0

       # smoothnessspectralexponent
       try:
         smoothnessspectralexponent = options.smoothnessspectralexponent_list[soltype_id]
       except:
         smoothnessspectralexponent = -1.0

       # smoothnessrefdistance
       try:
         smoothnessrefdistance = options.smoothnessrefdistance_list[soltype_id]
       except:
         smoothnessrefdistance = 0.0

       # antennaconstraint
       try:
         antennaconstraint = options.antennaconstraint_list[soltype_id]
       except:
         antennaconstraint = None

       # resetsols
       try:
         resetsols = options.resetsols_list[soltype_id]
       except:
         resetsols = None

       # resetdir
       try:
         resetdir = options.resetdir_list[soltype_id]
       except:
         resetdir = None

       # normamps
       try:
         normamps = options.normamps_list[soltype_id]
       except:
         normamps = 'normamps'


       # uvmin
       try:
         uvmin = options.uvmin[soltype_id]
       except:
         uvmin = None

       # uvmax
       try:
         uvmax = options.uvmax[soltype_id]
       except:
         uvmax = None

       # uvminim
       #try:
       #  uvminim = options.uvminim[soltype_id]
       #except:
       #  uvminim = 80.

       # uvmaxim
       #try:
       #  uvmaxim = options.uvmaxim[soltype_id]
       #except:
       #  uvmaxim = None

       # soltypecycles
       soltypecycles = options.soltypecycles_list[soltype_id]

       # force nchan 1 for tec(andphase) solve and in case smoothnessconstraint is invoked
       #if soltype == 'tec' or  soltype == 'tecandphase' or smoothnessconstraint > 0.0:
       if soltype == 'tec' or  soltype == 'tecandphase':
         nchan  = 1


       nchan_ms.append(nchan)
       solint_ms.append(solint)
       smoothnessconstraint_list_ms.append(smoothnessconstraint)
       BLsmooth_list_ms.append(BLsmooth)
       smoothnessreffrequency_list_ms.append(smoothnessreffrequency)
       smoothnessspectralexponent_list_ms.append(smoothnessspectralexponent)
       smoothnessrefdistance_list_ms.append(smoothnessrefdistance)
       antennaconstraint_list_ms.append(antennaconstraint)
       resetsols_list_ms.append(resetsols)
       resetdir_list_ms.append(resetdir)
       normamps_list_ms.append(normamps)
       
       soltypecycles_list_ms.append(soltypecycles)
       uvmin_list_ms.append(uvmin)
       uvmax_list_ms.append(uvmax)
       #uvminim_list_ms.append(uvminim)
       #uvmaxim_list_ms.append(uvmaxim)


     nchan_list.append(nchan_ms)   # list of lists
     solint_list.append(solint_ms) # list of lists
     antennaconstraint_list.append(antennaconstraint_list_ms)   # list of lists
     resetsols_list.append(resetsols_list_ms) # list of lists
     resetdir_list.append(resetdir_list_ms) # list of lists
     normamps_list.append(normamps_list_ms) # list of lists
     BLsmooth_list.append(BLsmooth_list_ms) # list of lists
     smoothnessconstraint_list.append(smoothnessconstraint_list_ms) # list of lists
     smoothnessreffrequency_list.append(smoothnessreffrequency_list_ms) # list of lists
     smoothnessspectralexponent_list.append(smoothnessspectralexponent_list_ms) # list of lists
     smoothnessrefdistance_list.append(smoothnessrefdistance_list_ms)
     uvmin_list.append(uvmin_list_ms) # list of lists
     uvmax_list.append(uvmax_list_ms) # list of lists
     #uvminim_list.append(uvminim_list_ms) # list of lists
     #uvmaxim_list.append(uvmaxim_list_ms)      # list of lists

     soltypecycles_list.append(soltypecycles_list_ms)

    
   print('soltype:',options.soltype_list, mslist)
   print('nchan:',nchan_list)
   print('solint:',solint_list)
   print('BLsmooth:',BLsmooth_list)
   print('smoothnessconstraint:',smoothnessconstraint_list)
   print('smoothnessreffrequency:',smoothnessreffrequency_list)
   print('smoothnessspectralexponent:',smoothnessspectralexponent_list)
   print('smoothnessrefdistance:',smoothnessrefdistance_list)
   print('antennaconstraint:',antennaconstraint_list)
   print('resetsols:',resetsols_list)
   print('resetdir:', resetdir_list)
   print('normamps:', normamps_list)
   print('soltypecycles:',soltypecycles_list)
   print('uvmin:',uvmin_list)
   print('uvmax:',uvmax_list)
   print('uvminim:',uvminim_list)
   print('uvmaxim:',uvmaxim_list)

   logger.info('soltype: '+ str(options.soltype_list) + ' ' + str(mslist))
   logger.info('nchan: ' + str(options.nchan_list))
   logger.info('solint: ' + str(options.solint_list))
   logger.info('BLsmooth: ' + str(options.BLsmooth_list))
   logger.info('smoothnessconstraint: ' + str(options.smoothnessconstraint_list))
   logger.info('smoothnessreffrequency: ' + str(options.smoothnessreffrequency_list))
   logger.info('smoothnessspectralexponent: ' + str(options.smoothnessspectralexponent_list))
   logger.info('smoothnessrefdistance: ' + str(options.smoothnessrefdistance_list))
   logger.info('antennaconstraint: ' + str(options.antennaconstraint_list))
   logger.info('resetsols: ' + str(options.resetsols_list))
   logger.info('resetdir: ' + str(options.resetdir_list))
   logger.info('normamps: ' + str(options.normamps_list))
   logger.info('soltypecycles: ' + str(options.soltypecycles_list))
   logger.info('uvmin: ' + str(options.uvmin))
   logger.info('uvmax: ' + str(options.uvmax))
   logger.info('uvminim: ' + str(options.uvminim))
   logger.info('uvmaxim: ' + str(options.uvmaxim))


   return nchan_list, solint_list, BLsmooth_list, smoothnessconstraint_list, smoothnessreffrequency_list, smoothnessspectralexponent_list, smoothnessrefdistance_list, antennaconstraint_list, resetsols_list, resetdir_list, soltypecycles_list, uvmin_list, uvmax_list, uvminim_list, uvmaxim_list, normamps_list

def getms_amp_stats(ms, datacolumn='DATA',uvcutfraction=0.666, robustsigma=True):
   uvdismod = get_uvwmax(ms)*uvcutfraction  
   t = pt.taql('SELECT ' + datacolumn + ',UVW,TIME,FLAG FROM ' + ms + ' WHERE SQRT(SUMSQR(UVW[:2])) > '+ str(uvdismod) )
   flags = t.getcol('FLAG')
   data  = t.getcol(datacolumn)
   data = np.ma.masked_array(data, flags)
   t.close()
  
   amps_rr = np.abs(data[:,:,0])
   amps_ll = np.abs(data[:,:,3])
   
   # remove zeros from LL
   idx = np.where(amps_ll != 0.0)
   amps_ll = amps_ll[idx]
   amps_rr = amps_rr[idx]

   # remove zeros from RR
   idx = np.where(amps_rr != 0.0)
   amps_ll = amps_ll[idx]
   amps_rr = amps_rr[idx]

   amplogratio = np.log10(amps_rr/amps_ll) # we assume Stokes V = 0, so RR = LL
   if robustsigma:
      logampnoise = astropy.stats.sigma_clipping.sigma_clipped_stats(amplogratio)[2]
   else:
      logampnoise = np.std(amplogratio)
   print(ms, logampnoise, np.mean(amplogratio))
   return logampnoise


def getms_phase_stats(ms, datacolumn='DATA',uvcutfraction=0.666):
   import scipy.stats 
   uvdismod = get_uvwmax(ms)*uvcutfraction  
   t = pt.taql('SELECT ' + datacolumn + ',UVW,TIME,FLAG FROM ' + ms + ' WHERE SQRT(SUMSQR(UVW[:2])) > '+ str(uvdismod) )
   flags = t.getcol('FLAG')
   data  = t.getcol(datacolumn)
   data = np.ma.masked_array(data, flags)
   t.close()
  
   phase_rr = np.angle(data[:,:,0])
   phase_ll = np.angle(data[:,:,3])
   
   # remove zeros from LL (flagged data)
   idx = np.where(phase_ll != 0.0)
   phase_ll = phase_ll[idx]
   phase_rr = phase_rr[idx]

   # remove zeros from RR (flagged data)
   idx = np.where(phase_rr != 0.0)
   phase_ll = phase_ll[idx]
   phase_rr = phase_rr[idx]

   phasediff =  np.mod(phase_rr-phase_ll, 2.*np.pi)
   phasenoise = scipy.stats.circstd(phasediff, nan_policy='omit')

   print(ms, phasenoise, scipy.stats.circmean(phasediff,  nan_policy='omit'))
   return phasenoise


def getmsmodelinfo(ms, modelcolumn, fastrms=False, uvcutfraction=0.333):
   t = pt.table(ms + '/SPECTRAL_WINDOW', ack=False)
   chanw = np.median(t.getcol('CHAN_WIDTH'))
   freq = np.median(t.getcol('CHAN_FREQ'))
   nfreq = len(t.getcol('CHAN_FREQ')[0])
   t.close()
   uvdismod = get_uvwmax(ms)*uvcutfraction # take range [uvcutfraction*uvmax - 1.0uvmax]

   HBA_upfreqsel = 0.75 # select only freqcencies above 75% of the available bandwidth
   freqct = 1000e6
   # the idea is that for HBA if you are far out in the beam the noise gets up much more at the higher freqs and the model flux goes down due to the spectral index. In this way we get more conservative solints


   t = pt.taql('SELECT ' + modelcolumn + ',DATA,UVW,TIME,FLAG FROM ' + ms + ' WHERE SQRT(SUMSQR(UVW[:2])) > '+ str(uvdismod) )
   model = np.abs(t.getcol(modelcolumn))
   flags = t.getcol('FLAG')
   data  = t.getcol('DATA')
   print('Compute visibility noise of the dataset with robust sigma clipping', ms)
   logger.info('Compute visibility noise of the dataset with robust sigma clipping: ' + ms)
   if fastrms:    # take only every fifth element of the array to speed up the computation
     if freq > freqct: # HBA
        noise = astropy.stats.sigma_clipping.sigma_clipped_stats(data[0:data.shape[0]:5,int(np.floor(float(nfreq)*HBA_upfreqsel)):-1,1:3],\
        mask=flags[0:data.shape[0]:5,int(np.floor(float(nfreq)*HBA_upfreqsel)):-1,1:3])[2] # use XY and YX
     else:
        noise = astropy.stats.sigma_clipping.sigma_clipped_stats(data[0:data.shape[0]:5,:,1:3],\
        mask=flags[0:data.shape[0]:5,:,1:3])[2] # use XY and YX
   else:
     if freq > freqct: # HBA
        noise = astropy.stats.sigma_clipping.sigma_clipped_stats(data[:,int(np.floor(float(nfreq)*HBA_upfreqsel)):-1,1:3],\
        mask=flags[:,int(np.floor(float(nfreq)*HBA_upfreqsel)):-1,1:3])[2] # use XY and YX
     else:
        noise = astropy.stats.sigma_clipping.sigma_clipped_stats(data[:,:,1:3],\
        mask=flags[:,:,1:3])[2] # use XY and YX

   model = np.ma.masked_array(model, flags)
   if freq > freqct: # HBA:
      flux  = np.ma.mean((model[:,int(np.floor(float(nfreq)*HBA_upfreqsel)):-1,0] + model[:,int(np.floor(float(nfreq)*HBA_upfreqsel)):-1,3])*0.5) # average XX and YY (ignore XY and YX, they are zero, or nan, in other words this is Stokes I)
   else:
      flux  = np.ma.mean((model[:,:,0] + model[:,:,3])*0.5) # average XX and YY (ignore XY and YX, they are zero, or nan)
   time  = np.unique(t.getcol('TIME'))
   tint  = np.abs(time[1]-time[0])
   print('Integration time visibilities', tint)
   logger.info('Integration time visibilities: ' + str(tint))
   t.close()

   del data, flags, model
   print('Noise visibilities:', noise, 'Jy')
   print('Flux in model:', flux, 'Jy')
   print('UV-selection to compute model flux:', str(uvdismod/1e3), 'km')
   logger.info('Noise visibilities: ' + str(noise) + 'Jy')
   logger.info('Flux in model: ' + str(flux) + 'Jy')
   logger.info('UV-selection to compute model flux: ' + str(uvdismod/1e3) + 'km')


   return noise, flux, tint, chanw

def return_soltype_index(soltype_list, soltype, occurence=1, onetectypeoccurence=False):

   if onetectypeoccurence:
     if soltype == 'tecandphase' or soltype == 'tec':
       soltype_list = [sol.replace('tecandphase', 'tec') for sol in soltype_list]
       soltype = 'tec'

   sol_index = None
   count = 0
   for sol_id, sol in enumerate(soltype_list):
     if sol == soltype:
       sol_index = sol_id
       count = count + 1
       if occurence == count:
         return sol_index
       else:
         sol_index = None
   return sol_index

def auto_determinesolints(mslist, soltype_list, longbaseline, LBA,\
                          innchan_list=None, insolint_list=None,\
                          uvdismod=None, modelcolumn='MODEL_DATA', redo=False,\
                          inBLsmooth_list=None,\
                          insmoothnessconstraint_list=None, insmoothnessreffrequency_list=None, \
                          insmoothnessspectralexponent_list=None,\
                          insmoothnessrefdistance_list=None,\
                          inantennaconstraint_list=None, inresetsols_list=None, inresetdir_list=None, innormamps_list=None,\
                          insoltypecycles_list=None, tecfactorsolint=1.0, gainfactorsolint=1.0,\
                          phasefactorsolint=1.0, delaycal=False):
   """
   determine the solution time and frequency intervals based on the amount of compact source flux and noise
   """
   # 1 find the first tec/tecandphase in the soltype_list
   # set the solints there based on this code
   # update antennaconstraint if needed

   # find the first (scalar)complexgain
   # compute solints

   # based on scalarcomplexgain determine what to do
   # proceed normally, as is now
   # do an 'all' constrained solve
   # no complexgain solves at all, how to do this? update soltype_list here, or set

   # soltype_list == 'tec'

   for ms_id, ms in enumerate(mslist):
      if longbaseline:
         noise, flux, tint, chanw = getmsmodelinfo(ms, modelcolumn, uvcutfraction=0.075)
      else:
         noise, flux, tint, chanw = getmsmodelinfo(ms, modelcolumn)
      for soltype_id, soltype in enumerate(soltype_list):

          ######## TEC or TECANDPHASE ######
          ######## for first occurence of tec(andphase) #######
          if soltype in ['tec', 'tecandphase'] and \
              ((soltype_id == return_soltype_index(soltype_list, 'tec', occurence=1, onetectypeoccurence=True)) or \
              (soltype_id == return_soltype_index(soltype_list, 'tecandphase', occurence=1, onetectypeoccurence=True))) :

             if LBA:
               if longbaseline:
                 solint_sf = 3.0e-3*tecfactorsolint # untested
               else: #for -- LBA dutch --
                 solint_sf = 4.0e-2*tecfactorsolint #0.5e-3 # for tecandphase and coreconstraint

             else: # for -- HBA --
               if longbaseline:
                 solint_sf = 0.5e-2*tecfactorsolint # for tecandphase, no coreconstraint
               else: #for -- HBA dutch --
                 solint_sf = 4.0e-2*tecfactorsolint # for tecandphase, no coreconstraint

             if soltype == 'tec':
               solint_sf = solint_sf/np.sqrt(2.) # tec and coreconstraint


             # trigger antennaconstraint_phase core if solint > tint
             if not longbaseline and (tint*solint_sf* ((noise/flux)**2) * (chanw/390.625e3) > tint):
               print(tint*solint_sf* ((noise/flux)**2) * (chanw/390.625e3))
               solint_sf = solint_sf/30.
               print('Trigger_antennaconstraint core:', soltype, ms)
               logger.info('Trigger_antennaconstraint core: '+ soltype + ' ' + ms)
               inantennaconstraint_list[soltype_id][ms_id] = 'core'
               # do another pertubation, a slow solve of the core stations
               # if (tint*solint_sf* ((noise/flux)**2) * (chanw/390.625e3) < 360.0): # less than 6 min now, also doing constraint remote
               if (tint*solint_sf* ((noise/flux)**2) * (chanw/390.625e3) < 720.0): # less than 12 min now, also doing
                 inantennaconstraint_list[soltype_id+1][ms_id] = 'remote' # or copy over input ??
                 insoltypecycles_list[soltype_id+1][ms_id] = insoltypecycles_list[soltype_id][ms_id] # do + 1 here??
                 insolint_list[soltype_id+1][ms_id] = int(np.rint(10.*solint_sf* ((noise/flux)**2) * (chanw/390.625e3) ))
                 if insolint_list[soltype_id+1][ms_id] < 1:
                   insolint_list[soltype_id+1][ms_id] = 1
               else:
                 insoltypecycles_list[soltype_id+1][ms_id] = 999

             else:
               if inantennaconstraint_list[soltype_id][ms_id] != 'alldutch':
                 inantennaconstraint_list[soltype_id][ms_id] = None # or copy over input

             # round to nearest integer
             solint = np.rint(solint_sf* ((noise/flux)**2) * (chanw/390.625e3) )
             # frequency scaling is need because if we avearge in freqeuncy the solint should not change for a tec(andphase) solve

             if (longbaseline) and (not LBA) and (soltype == 'tec') \
                and (soltype_list[1] == 'tecandphase'):
                if solint < 0.5 and (solint*tint < 16.): # so less then 16 sec
                   print('Longbaselines bright source detected: changing from tec to tecandphase solve')
                   insoltypecycles_list[soltype_id][ms_id] = 999
                   insoltypecycles_list[1][ms_id] = 0

             if solint < 1:
                solint = 1
             if (float(solint)*tint/3600.) > 0.5: # so check if larger than 30 min
               print('Warning, it seems there is not enough flux density on the longer baselines for solving')
               logger.warning('Warning, it seems there is not enough flux density on the longer baselines for solving')
               solint = np.rint(0.5*3600./tint) # max is 30 min

             print(solint_sf*((noise/flux)**2)*(chanw/390.625e3), 'Using tec(andphase) solint:', solint)
             logger.info(str(solint_sf*((noise/flux)**2)*(chanw/390.625e3)) + '-- Using tec(andphase) solint:' + str(solint))
             print('Using tec(andphase) solint [s]:', float(solint)*tint)
             logger.info('Using tec(andphase) solint [s]: ' + str(float(solint)*tint))

             insolint_list[soltype_id][ms_id] = int(solint)
             innchan_list[soltype_id][ms_id] = 1

          ######## SCALARPHASE or PHASEONLY ######
          ######## for first occurence of tec(andphase) #######
          if soltype in ['scalarphase', 'phaseonly'] and \
              (insmoothnessconstraint_list[soltype_id][ms_id] > 0.0) and \
              ((soltype_id == return_soltype_index(soltype_list, 'scalarphase', occurence=1, onetectypeoccurence=True)) or \
              (soltype_id == return_soltype_index(soltype_list, 'phaseonly', occurence=1, onetectypeoccurence=True))) :

             if LBA:
               if longbaseline:
                 solint_sf = 3.0e-3*phasefactorsolint # untested
               else: #for -- LBA dutch --
                 solint_sf = 4.0e-2*phasefactorsolint #0.5e-3 # for tecandphase and coreconstraint

             else: # for -- HBA --
               if longbaseline:
                 solint_sf = 0.5e-2*phasefactorsolint # for tecandphase, no coreconstraint
               else: #for -- HBA dutch --
                 solint_sf = 4.0e-2*phasefactorsolint # for tecandphase, no coreconstraint

             if soltype == 'scalarphase':
               solint_sf = solint_sf/np.sqrt(2.) # decrease solint if scalarphase


             # trigger antennaconstraint_phase core if solint > tint
             # needs checking, this might be wrong, this assumes we use [scalarphase/phaseonly,scalarphase/phaseonly, (scalar)complexgain] so 3 steps.....
             if not longbaseline and (tint*solint_sf* ((noise/flux)**2) * (chanw/390.625e3) > tint):
               print(tint*solint_sf* ((noise/flux)**2) * (chanw/390.625e3))
               solint_sf = solint_sf/30.
               print('Trigger_antennaconstraint core:', soltype, ms)
               logger.info('Trigger_antennaconstraint core: '+ soltype + ' ' + ms)
               inantennaconstraint_list[soltype_id][ms_id] = 'core'
               # do another pertubation, a slow solve of the core stations
               # if (tint*solint_sf* ((noise/flux)**2) * (chanw/390.625e3) < 360.0): # less than 6 min now, also doing constraint remote
               if (tint*solint_sf* ((noise/flux)**2) * (chanw/390.625e3) < 720.0): # less than 12 min now, also doing
                 inantennaconstraint_list[soltype_id+1][ms_id] = 'remote' # or copy over input ??
                 insoltypecycles_list[soltype_id+1][ms_id] = insoltypecycles_list[soltype_id][ms_id] # do + 1 here??
                 insolint_list[soltype_id+1][ms_id] = int(np.rint(10.*solint_sf* ((noise/flux)**2) * (chanw/390.625e3) ))
                 if insolint_list[soltype_id+1][ms_id] < 1:
                   insolint_list[soltype_id+1][ms_id] = 1
               else:
                 insoltypecycles_list[soltype_id+1][ms_id] = 999

             else:
               if inantennaconstraint_list[soltype_id][ms_id] != 'alldutch':
                  inantennaconstraint_list[soltype_id][ms_id] = None # or copy over input

             # round to nearest integer
             solint = np.rint(solint_sf* ((noise/flux)**2) * (chanw/390.625e3) )
             # frequency scaling is needed because if we avearge in freqeuncy the solint should not change for a (scalar)phase solve with smoothnessconstraint
             
             # if (longbaseline) and (not LBA) and (soltype == 'tec') \
             #   and (soltype_list[1] == 'tecandphase'):
             #   if solint < 0.5 and (solint*tint < 16.): # so less then 16 sec
             #      print('Longbaselines bright source detected: changing from tec to tecandphase solve')
             #      insoltypecycles_list[soltype_id][ms_id] = 999
             #      insoltypecycles_list[1][ms_id] = 0

             if solint < 1:
                solint = 1
             if (float(solint)*tint/3600.) > 0.5: # so check if larger than 30 min
               print('Warning, it seems there is not enough flux density on the longer baselines for solving')
               logger.warning('Warning, it seems there is not enough flux density on the longer baselines for solving')
               solint = np.rint(0.5*3600./tint) # max is 30 min

             print(solint_sf*((noise/flux)**2)*(chanw/390.625e3), 'Using (scalar)phase solint:', solint)
             logger.info(str(solint_sf*((noise/flux)**2)*(chanw/390.625e3)) + '-- Using (scalar)phase solint:' + str(solint))
             print('Using (scalar)phase solint [s]:', float(solint)*tint)
             logger.info('Using (scalar)phase solint [s]: ' + str(float(solint)*tint))

             insolint_list[soltype_id][ms_id] = int(solint)
             innchan_list[soltype_id][ms_id] = 1 # because we use smoothnessconstraint


          ######## COMPLEXGAIN or SCALARCOMPLEXGAIN or AMPLITUDEONLY or SCALARAMPLITUDE ######
          # requires smoothnessconstraint
          # for first occurence of (scalar)complexgain 
          if soltype in ['complexgain', 'scalarcomplexgain'] and (insmoothnessconstraint_list[soltype_id][ms_id] > 0.0) and \
              ((soltype_id == return_soltype_index(soltype_list, 'complexgain', occurence=1)) or \
              (soltype_id == return_soltype_index(soltype_list, 'scalarcomplexgain', occurence=1))):

             if longbaseline:
                thr_disable_gain = 24. # 32. #  72.
             else:
                thr_disable_gain = 64. # 32. #  72.
             
             thr_SM15Mhz = 1.5
             thr_gain_trigger_allantenna =  32. # 16. # 8.

             tgain_max = 4. # do not allow ap solves that are more than 4 hrs
             tgain_min = 0.3333  # check if less than 20 min, min solint is 20 min

             innchan_list[soltype_id][ms_id] = 1

             if LBA:
               if longbaseline:
                 solint_sf = 0.4*gainfactorsolint # untested
               else: #for -- LBA dutch --
                 solint_sf = 10.0*gainfactorsolint

             else: # for -- HBA --
               if longbaseline:
                 solint_sf = 0.8*gainfactorsolint #
               else: #for -- HBA dutch --
                 solint_sf = 0.8*gainfactorsolint #

             solint = np.rint(solint_sf*((noise/flux)**2)*(chanw/390.625e3))
             print(solint_sf*((noise/flux)**2)*(chanw/390.625e3), 'Computes gain solint:', solint, ' ')
             logger.info(str(solint_sf*((noise/flux)**2)*(chanw/390.625e3)) + ' Computes gain solint: ' + str(solint))
             print('Computes gain solint [hr]:', float(solint)*tint/3600.)
             logger.info('Computes gain solint [hr]: ' + str(float(solint)*tint/3600.))

             # do not allow very short ap solves
             if ((solint_sf*((noise/flux)**2)*(chanw/390.625e3))*tint/3600.) < tgain_min: #  check if less than tgain_min (20 min)
               solint = np.rint(tgain_min*3600./tint) # minimum tgain_min is 20 min
               print('Setting gain solint to 20 min (the min value allowed):', float(solint)*tint/3600.)
               logger.info('Setting gain solint to 20 min (the min value allowed): ' + str(float(solint)*tint/3600.))

             # do not allow ap solves that are more than tgain_max (4) hrs
             if ((solint_sf*((noise/flux)**2)*(chanw/390.625e3))*tint/3600.) > tgain_max: # so check if larger than 4 hrs
               print('Warning, it seems there is not enough flux density for gain solving')
               logger.warning('Warning, it seems there is not enough flux density for gain solving')
               solint = np.rint(tgain_max*3600./tint) # max is tgain_max (4) hrs

             # trigger 15 MHz smoothnessconstraint 
             # print('TEST:', ((solint_sf*((noise/flux)**2)*(chanw/390.625e3))*tint/3600.))
             if ((solint_sf*((noise/flux)**2)*(chanw/390.625e3))*tint/3600.) < thr_SM15Mhz: # so check if smaller than 2 hr
               insmoothnessconstraint_list[soltype_id][ms_id] = 5.0
             else:
               print('Increasing smoothnessconstraint to 15 MHz')
               logger.info('Increasing smoothnessconstraint to 15 MHz')
               insmoothnessconstraint_list[soltype_id][ms_id] = 15.0

             # trigger nchan=0 solve because not enough S/N
             if not longbaseline and (((solint_sf*((noise/flux)**2)*(chanw/390.625e3))*tint/3600.) > thr_gain_trigger_allantenna):
               inantennaconstraint_list[soltype_id][ms_id] = 'all'
               solint = np.rint(2.0*3600./tint) # 2 hrs nchan=0 solve (do not do bandpass because slope can diverge)
               innchan_list[soltype_id][ms_id] = 0 # no frequency dependence, smoothnessconstraint will be turned of in runDPPPbase
               print('Triggering antennaconstraint all:', soltype, ms)
               logger.info('Triggering antennaconstraint all: ' + soltype + ' ' + ms)
             else:
               if inantennaconstraint_list[soltype_id][ms_id] != 'alldutch':
                 inantennaconstraint_list[soltype_id][ms_id] = None

             # completely disable slow solve if the solints get too long, target is too faint
             if (((solint_sf*((noise/flux)**2)*(chanw/390.625e3))*tint/3600.) > thr_disable_gain):
               insoltypecycles_list[soltype_id][ms_id] = 999
               print('Disabling solve:', soltype, ms)
               logger.info('Disabling solve: ' + soltype + ' '+ ms)
             else:
               insoltypecycles_list[soltype_id][ms_id] = 3 # set to user input value? problem because not retained now

             insolint_list[soltype_id][ms_id] = int(solint)

             # --------------- NCHAN ------------- NOT BEING USED, keep code in case we need it later

             if insmoothnessconstraint_list[soltype_id][ms_id] == 0.0 and innchan_list[soltype_id][ms_id] != 0: # DOES NOT GET HERE BECAUSE smoothnessconstraint > 0 test above

                if LBA:
                  if longbaseline:
                    print('Long baselines LBA not supported with --auto')
                    raise Exception('Long baselines LBA not supported with --auto')
                  else: #for -- LBA dutch, untested --
                    nchan_sf = 0.75 # for tecandphase and coreconstraint

                else: # for -- HBA --
                  if longbaseline:
                    nchan_sf = 0.0075 #
                  else: #for -- HBA dutch --
                    nchan_sf = 0.75 #

                nchan = np.rint(nchan_sf*(noise/flux)**2)

                # do not allow very low nchan solves
                if (float(nchan)*chanw/1e6) < 2.0: #  check if less than 2 MHz
                  nchan = np.rint(2.0*1e6/chanw) # 2 MHz

                # do not allow nchan solves that are more than 15 MHz
                if (float(nchan)*chanw/1e6) > 15.0:
                  print('Warning, it seems there is not enough flux density on the longer baselines for solving')
                  nchan = np.rint(15*1e6/chanw) # 15 MHz

                print(nchan_sf*(noise/flux)**2, 'Using gain nchan:', nchan)
                print('Using gain nchan [MHz]:', float(nchan)*chanw/1e6)

                innchan_list[soltype_id][ms_id] = int(nchan)


   print('soltype:',soltype_list, mslist)
   print('nchan:',innchan_list)
   print('solint:',insolint_list)
   print('BLsmooth:', inBLsmooth_list)
   print('smoothnessconstraint:',insmoothnessconstraint_list)
   print('smoothnessreffrequency:',insmoothnessreffrequency_list)
   print('smoothnessspectralexponent_list:',insmoothnessspectralexponent_list)
   print('smoothnessrefdistance_list:',insmoothnessrefdistance_list)
   print('antennaconstraint:',inantennaconstraint_list)
   print('resetsols:',inresetsols_list)
   print('resetdir:',inresetdir_list)
   print('normamps:',innormamps_list)
   print('soltypecycles:',insoltypecycles_list)

   logger.info('soltype: '+ str(soltype_list) + ' ' + str(mslist))
   logger.info('nchan: ' + str(innchan_list))
   logger.info('solint: ' + str(insolint_list))
   logger.info('BLsmooth: ' + str(inBLsmooth_list))
   logger.info('smoothnessconstraint: ' + str(insmoothnessconstraint_list))
   logger.info('smoothnessreffrequency: ' + str(insmoothnessreffrequency_list))
   logger.info('smoothnessspectralexponent: ' + str(insmoothnessspectralexponent_list))
   logger.info('smoothnessrefdistance: ' + str(insmoothnessrefdistance_list))
   logger.info('antennaconstraint: ' + str(inantennaconstraint_list))
   logger.info('resetsols: ' + str(inresetsols_list))
   logger.info('resetdir: ' + str(inresetdir_list))
   logger.info('normamps: ' + str(innormamps_list))
   logger.info('soltypecycles: ' + str(insoltypecycles_list))


   return innchan_list, insolint_list, inBLsmooth_list, insmoothnessconstraint_list, insmoothnessreffrequency_list, insmoothnessspectralexponent_list, insmoothnessrefdistance_list, inantennaconstraint_list, inresetsols_list, inresetdir_list, insoltypecycles_list, innormamps_list


def create_beamcortemplate(ms):
  """
  create a DPPP gain H5 template solutution file that can be filled with losoto
  """
  H5name = ms + '_templatejones.h5'

  cmd = "DP3 numthreads="+str(np.min([multiprocessing.cpu_count(),24]))+ " msin=" + ms + " msin.datacolumn=DATA msout=. "
  #cmd += 'msin.modelcolumn=DATA '
  cmd += "steps=[ddecal] ddecal.type=ddecal "
  cmd += "ddecal.maxiter=1 ddecal.nchan=1 "
  cmd += "ddecal.modeldatacolumns='[DATA]' "
  cmd += "ddecal.mode=complexgain ddecal.h5parm=" + H5name  + " "
  cmd += "ddecal.solint=10 ddecal.solveralgorithm=directioniterative "
  cmd += "ddecal.datause=dual" # extra speedup
  #cmd += "ddecal.usedualvisibilities=True" # extra speedup
  print(cmd)
  run(cmd)

  return H5name

def create_losoto_beamcorparset(ms, refant='CS003HBA0'):
    """
    Create a losoto parset to fill the beam correction values'.
    """
    parset = 'losotobeam.parset'
    os.system('rm -f ' + parset)
    f=open(parset, 'w')

    f.write('pol = [XX,YY]\n')
    f.write('soltab = [sol000/*]\n\n\n')

    f.write('[plotphase]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = [sol000/phase000]\n')
    f.write('axesInPlot = [time,freq]\n')
    f.write('axisInTable = ant\n')
    f.write('minmax = [-0.5,0.5]\n')
    f.write('prefix = plotlosoto%s/phases_beam\n' % os.path.basename(ms))
    f.write('refAnt = %s\n\n\n' % refant)

    f.write('[plotamp]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = [sol000/amplitude000]\n')
    f.write('axesInPlot = [time,freq]\n')
    f.write('axisInTable = ant\n')
    f.write('minmax = [0.2,1]\n')
    f.write('prefix = plotlosoto%s/amplitudes_beam\n' % os.path.basename(ms))

    f.close()
    return parset

def create_losoto_tecandphaseparset(ms, refant='CS003HBA0', outplotname='fasttecandphase', markersize=2):
    parset = 'losoto_plotfasttecandphase.parset'
    os.system('rm -f ' + parset)
    f=open(parset, 'w')

    f.write('pol = []\n')
    f.write('Ncpu = 0\n\n\n')

    f.write('[plottecandphase]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = [sol000/phase000]\n')
    f.write('axesInPlot = [time]\n')
    f.write('axisInTable = ant\n')
    f.write('minmax = [-3.14,3.14]\n')
    f.write('soltabToAdd = tec000\n')
    f.write('figSize=[120,20]\n')
    f.write('markerSize=%s\n' % int(markersize))
    f.write('prefix = plotlosoto%s/fasttecandphase\n' % os.path.basename(ms))
    f.write('refAnt = %s\n' % refant)

    f.close()
    return parset

def create_losoto_tecparset(ms, refant='CS003HBA0', outplotname='fasttec', markersize=2):
    parset = 'losoto_plotfasttec.parset'
    os.system('rm -f ' + parset)
    f=open(parset, 'w')

    f.write('pol = []\n')
    f.write('Ncpu = 0\n\n\n')

    f.write('[plottec]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = [sol000/tec000]\n')
    f.write('axesInPlot = [time]\n')
    f.write('axisInTable = ant\n')
    f.write('minmax = [-0.2,0.2]\n')
    f.write('figSize=[120,20]\n')
    f.write('markerSize=%s\n' % int(markersize))
    f.write('prefix = plotlosoto%s/%s\n' % (ms,outplotname))
    f.write('refAnt = %s\n' % refant)

    f.close()
    return parset


def create_losoto_rotationparset(ms, refant='CS003HBA0', onechannel=False, \
                                 outplotname='rotation', markersize=2):
    parset = 'losoto_plotrotation.parset'
    os.system('rm -f ' + parset)
    f=open(parset, 'w')

    f.write('pol = [XX,YY]\n')
    f.write('soltab = [sol000/*]\n')
    f.write('Ncpu = 0\n\n\n')

    f.write('[plotrotation]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = [sol000/rotation000]\n')
    f.write('markerSize=%s\n' % int(markersize))
    if onechannel:
      f.write('axesInPlot = [time]\n')
    else:
      f.write('axesInPlot = [time,freq]\n')
    f.write('axisInTable = ant\n')
    f.write('minmax = [-1.57,1.57]\n') # rotation needs to be plotted from -pi/2 to pi/2
    f.write('figSize=[120,20]\n')
    f.write('prefix = plotlosoto%s/%s\n' % (ms,outplotname))
    f.write('refAnt = %s\n' % refant)
    f.close()
    return parset


def create_losoto_fastphaseparset(ms, refant='CS003HBA0', onechannel=False, onepol=False, outplotname='fastphase'):
    parset = 'losoto_plotfastphase.parset'
    os.system('rm -f ' + parset)
    f=open(parset, 'w')

    f.write('pol = [XX,YY]\n')
    f.write('soltab = [sol000/*]\n')
    f.write('Ncpu = 0\n\n\n')

    f.write('[plotphase]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = [sol000/phase000]\n')
    if onechannel:
      f.write('axesInPlot = [time]\n')
      if not onepol:
        f.write('axisInCol = pol\n')

    else:
      f.write('axesInPlot = [time,freq]\n')
    f.write('axisInTable = ant\n')
    f.write('minmax = [-3.14,3.14]\n')
    f.write('figSize=[120,20]\n')
    f.write('prefix = plotlosoto%s/%s\n' % (ms,outplotname))
    f.write('refAnt = %s\n' % refant)

    if not onepol:
      f.write('[plotphasediff]\n')
      f.write('operation = PLOT\n')
      f.write('soltab = [sol000/phase000]\n')
      if onechannel:
        f.write('axesInPlot = [time]\n')
      else:
        f.write('axesInPlot = [time,freq]\n')
      f.write('axisInTable = ant\n')
      f.write('minmax = [-3.14,3.14]\n')
      f.write('figSize=[120,20]\n')
      f.write('prefix = plotlosoto%s/%spoldiff\n' % (ms,outplotname))
      f.write('refAnt = %s\n' % refant)
      f.write('axisDiff=pol\n')


    f.close()
    return parset


def create_losoto_flag_apgridparset(ms, flagging=True, maxrms=7.0, maxrmsphase=7.0, includesphase=True, \
                                    refant='CS003HBA0', onechannel=False, medamp=2.5, flagphases=True, \
                                    onepol=False, outplotname='slowamp', fulljones=False):

    parset= 'losoto_flag_apgrid.parset'
    os.system('rm -f ' + parset)
    f=open(parset, 'w')

    # f.write('pol = []\n')
    f.write('soltab = [sol000/*]\n')
    f.write('Ncpu = 0\n\n\n')

    f.write('[plotamp]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = [sol000/amplitude000]\n')
    if onechannel:
      f.write('axesInPlot = [time]\n')
      if not onepol:
        f.write('axisInCol = pol\n')
    else:
      f.write('axesInPlot = [time,freq]\n')
    f.write('axisInTable = ant\n')
    # if longbaseline:
    #  f.write('minmax = [0,2.5]\n')        
    # else:    
    f.write('minmax = [%s,%s]\n' % (str(medamp/4.0), str(medamp*2.5)))
    # f.write('minmax = [0,2.5]\n')
    f.write('prefix = plotlosoto%s/%samp\n\n\n' % (ms,outplotname))

    if fulljones:
       f.write('[plotampXYYX]\n')
       f.write('operation = PLOT\n')
       f.write('soltab = [sol000/amplitude000]\n')
       f.write('pol = [XY, YX]\n')
       if onechannel:
         f.write('axesInPlot = [time]\n')
       else:
         f.write('axesInPlot = [time,freq]\n')
       f.write('axisInTable = ant\n')
       f.write('minmax = [%s,%s]\n' % (str(0.0), str(0.5)))
       f.write('prefix = plotlosoto%s/%sampXYYX\n\n\n' % (ms,outplotname))


    if includesphase:
        f.write('[plotphase]\n')
        f.write('operation = PLOT\n')
        f.write('soltab = [sol000/phase000]\n')
        if onechannel:
          f.write('axesInPlot = [time]\n')
          if not onepol:
            f.write('axisInCol = pol\n')
        else:
           f.write('axesInPlot = [time,freq]\n')
        f.write('axisInTable = ant\n')
        f.write('minmax = [-3.14,3.14]\n')
        f.write('prefix = plotlosoto%s/%sphase\n' % (ms,outplotname))
        f.write('refAnt = %s\n\n\n' % refant)

        if not onepol and not fulljones:
          f.write('[plotphasediff]\n')
          f.write('operation = PLOT\n')
          f.write('soltab = [sol000/phase000]\n')
          if onechannel:
            f.write('axesInPlot = [time]\n')
          else:
            f.write('axesInPlot = [time,freq]\n')
          f.write('axisInTable = ant\n')
          f.write('minmax = [-3.14,3.14]\n')
          f.write('figSize=[120,20]\n')
          f.write('prefix = plotlosoto%s/%spoldiff\n' % (ms,outplotname))
          f.write('refAnt = %s\n' % refant)
          f.write('axisDiff=pol\n\n\n')


    if flagging:
        f.write('[flagamp]\n')
        f.write('soltab = [sol000/amplitude000]\n')
        f.write('operation = FLAG\n')
        if onechannel:
          f.write('axesToFlag = [time]\n')
        else:
          f.write('axesToFlag = [time,freq]\n')
        f.write('mode = smooth\n')
        f.write('maxCycles = 3\n')
        f.write('windowNoise = 7\n')
        f.write('maxRms = %s\n' % str(maxrms))
        if onechannel:
          f.write('order  = [5]\n\n\n')
        else:
          f.write('order  = [5,5]\n\n\n')

        if includesphase and flagphases:
            f.write('[flagphase]\n')
            f.write('soltab = [sol000/phase000]\n')
            f.write('operation = FLAG\n')
            if onechannel:
              f.write('axesToFlag = [time]\n')
            else:
              f.write('axesToFlag = [time,freq]\n')
            f.write('mode = smooth\n')
            f.write('maxCycles = 3\n')
            f.write('windowNoise = 7\n')
            f.write('maxRms = %s\n' % str(maxrmsphase))
            if onechannel:
              f.write('order  = [5]\n\n\n')
            else:
              f.write('order  = [5,5]\n\n\n')

        f.write('[plotampafter]\n')
        f.write('operation = PLOT\n')
        f.write('soltab = [sol000/amplitude000]\n')
        if onechannel:
          f.write('axesInPlot = [time]\n')
          if not onepol:
            f.write('axisInCol = pol\n')
        else:
          f.write('axesInPlot = [time,freq]\n')
        f.write('axisInTable = ant\n')
        # f.write('minmax = [0,2.5]\n')
        f.write('minmax = [%s,%s]\n' % (str(medamp/4.0), str(medamp*2.5)))
        f.write('prefix = plotlosoto%s/%sampfl\n\n\n' % (ms,outplotname))

        if includesphase and flagphases:
            f.write('[plotphase_after]\n')
            f.write('operation = PLOT\n')
            f.write('soltab = [sol000/phase000]\n')
            if onechannel:
              f.write('axesInPlot = [time]\n')
              if not onepol:
                f.write('axisInCol = pol\n')
            else:
              f.write('axesInPlot = [time,freq]\n')
            f.write('axisInTable = ant\n')
            f.write('minmax = [-3.14,3.14]\n')
            f.write('prefix = plotlosoto%s/%sphasefl\n' % (ms,outplotname))
            f.write('refAnt = %s\n' % refant)


    f.close()
    return parset

def create_losoto_mediumsmoothparset(ms, boxsize, longbaseline, includesphase=True, refant='CS003HBA0',\
                                     onechannel=False, outplotname='runningmedian'):
    parset= 'losoto_mediansmooth.parset'
    os.system('rm -f ' + parset)
    f=open(parset, 'w')

    f.write('pol = []\n')
    f.write('soltab = [sol000/*]\n')
    f.write('Ncpu = 0\n\n\n')

    if includesphase:
        f.write('[smoothphase]\n')
        f.write('soltab = [sol000/phase000]\n')
        f.write('operation= SMOOTH\n')
        if onechannel:
          f.write('axesToSmooth = [time]\n')
          f.write('size = [%s]\n' % (boxsize))
        else:
          f.write('axesToSmooth = [freq,time]\n')
          f.write('size = [%s,%s]\n' % (boxsize, boxsize))
        f.write('mode = runningmedian\n\n\n')

    f.write('[smoothamp]\n')
    f.write('soltab = [sol000/amplitude000]\n')
    f.write('operation= SMOOTH\n')
    if onechannel:
      f.write('axesToSmooth = [time]\n')
      f.write('size = [%s]\n' % (boxsize))
    else:
      f.write('axesToSmooth = [freq,time]\n')
      f.write('size = [%s,%s]\n' % (boxsize, boxsize))
    f.write('mode = runningmedian\n\n\n')

    f.write('[plotamp_after]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = [sol000/amplitude000]\n')
    if onechannel:
      f.write('axesInPlot = [time]\n')
    else:
      f.write('axesInPlot = [time,freq]\n')
    f.write('axisInTable = ant\n')
    if longbaseline:
      f.write('minmax = [0,2.5]\n')
    else:
      f.write('minmax = [0,2.5]\n')
    f.write('prefix = plotlosoto%s/amps_smoothed\n\n\n' % os.path.basename(ms))

    if includesphase:
        f.write('[plotphase_after]\n')
        f.write('operation = PLOT\n')
        f.write('soltab = [sol000/phase000]\n')
        if onechannel:
          f.write('axesInPlot = [time]\n')
        else:
          f.write('axesInPlot = [time,freq]\n')
        f.write('axisInTable = ant\n')
        f.write('minmax = [-3.14,3.14]\n')
        f.write('prefix = plotlosoto%s/phases_smoothed\n\n\n' % os.path.basename(ms))
        f.write('refAnt = %s\n' % refant)


        f.write('[plotphase_after1rad]\n')
        f.write('operation = PLOT\n')
        f.write('soltab = [sol000/phase000]\n')
        if onechannel:
          f.write('axesInPlot = [time]\n')
        else:
          f.write('axesInPlot = [time,freq]\n')
        f.write('axisInTable = ant\n')
        f.write('minmax = [-1,1]\n')
        f.write('prefix = plotlosoto%s/phases_smoothed1rad\n' % os.path.basename(ms))
        f.write('refAnt = %s\n' % refant)

    f.close()
    return parset

def check_phaseup(H5name):
    H5 =  tables.open_file(H5name, mode='r')
    try:
      ants   = H5.root.sol000.phase000.ant[:]
    except:
      pass

    try:
      ants   = H5.root.sol000.amplitude000.ant[:]
    except:
      pass

    try:
      ants   = H5.root.sol000.rotation000.ant[:]
    except:
      pass

    try:
      ants   = H5.root.sol000.tec000.ant[:]
    except:
      pass
  
    # H5 = h5parm.h5parm(H5name, readonly=False)
    # ants = H5.getSolset('sol000').getAnt().keys()
    H5.close()
    if 'ST001' in ants:
        return True
    else:
        return False

def fixbeam_ST001(H5name):

   H5 = h5parm.h5parm(H5name, readonly=False)

   ants = H5.getSolset('sol000').getAnt().keys()
   antsrs = fnmatch.filter(ants,'RS*')
   ST001 = False

   if 'ST001' in ants:
     ST001 = True
     amps    = H5.getSolset('sol000').getSoltab('amplitude000').getValues()
     ampvals = H5.getSolset('sol000').getSoltab('amplitude000').getValues()[0]
     phasevals = H5.getSolset('sol000').getSoltab('phase000').getValues()[0]

     idx = np.where(amps[1]['ant'] == 'ST001')[0][0]
     idxrs = np.where(amps[1]['ant'] == antsrs[0])[0][0]
     # idx106 = np.where(amps[1]['ant'] == 'RS106HBA')[0][0]
     # idx305 = np.where(amps[1]['ant'] == 'RS305HBA')[0][0]
     # idx508 = np.where(amps[1]['ant'] == 'RS508HBA')[0][0]
     # idx406 = np.where(amps[1]['ant'] == 'RS406HBA')[0][0]
     # idxnonecheck = np.where(amps[1]['ant'] == 'blaHBA')[0][0]

     # ampvals[:,:, idx, 0,:] = 1.0  # set amplitude to 1.
     # phasevals[:,:, idx, 0,:] = 0.0 # set phase to 0.

     ampvals[:,:, idx, 0,:] = ampvals[:,:, idxrs, 0,:]
     phasevals[:,:, idx, 0,:] = 0.0

     H5.getSolset('sol000').getSoltab('amplitude000').setValues(ampvals)
     H5.getSolset('sol000').getSoltab('phase000').setValues(phasevals)

   H5.close()

   return ST001

def circular(ms, linear=False, dysco=True):
    """
    convert to circular correlations
    """
    taql = 'taql'
    scriptn = 'python lin2circ.py'
    if linear:
      cmdlin2circ = scriptn + ' -i ' + ms + ' --column=DATA --lincol=CORRECTED_DATA --back'
    else:
      cmdlin2circ = scriptn + ' -i ' + ms + ' --column=DATA --outcol=CORRECTED_DATA'
    if not dysco:
      cmdlin2circ += ' --nodysco'
    print(cmdlin2circ)
    run(cmdlin2circ)
    run(taql + " 'update " + ms + " set DATA=CORRECTED_DATA'")
    return


def beamcor_and_lin2circ(ms, msout='.', dysco=True, beam=True, lin2circ=False, \
                         circ2lin=False, losotobeamlib='stationresponse', update_poltable=True, idg=False):
    """
    correct a ms for the beam in the phase center (array_factor only)
    """

    # check if there are applybeam corrections in the header
    # should be there unless a very old DP3 version has been used
    usedppp = beamkeywords(ms)

    losoto = 'losoto'
    #taql = 'taql'
    H5name  = create_beamcortemplate(ms)
    phasedup = check_phaseup(H5name) # in case no beamcor is done we still need this

    if (lin2circ or circ2lin):
       tp = pt.table(ms+'/POLARIZATION',ack=False)
       polinfo = tp.getcol('CORR_TYPE')
       if lin2circ: # so in this case input must be linear
          if not np.array_equal(np.array([[9,10,11,12]]), polinfo):
             print(polinfo)
             raise Exception('Input data is not linear, cannot convert to circular')
       if circ2lin:  # so in this case input must be circular
          if not np.array_equal(np.array([[5,6,7,8]]), polinfo):
             print(polinfo)
             raise Exception('Input data is not circular, cannot convert to linear')  
       tp.close()

    if beam:
       tp = pt.table(ms+'/POLARIZATION',ack=False)
       polinfo = tp.getcol('CORR_TYPE')
       tp.close()
       if np.array_equal(np.array([[5,6,7,8]]), polinfo): # so we have circular data
          raise Exception('Cannot do DP3 beam correction on input data that is circular')

    if lin2circ and circ2lin:
       print('Wrong input in function, both lin2circ and circ2lin are True')
       raise Exception('Wrong input in function, both lin2circ and circ2lin are True')

    if beam:
       losotolofarbeam(H5name, 'phase000', ms, useElementResponse=False, useArrayFactor=True, useChanFreq=True, beamlib=losotobeamlib)
       losotolofarbeam(H5name, 'amplitude000', ms, useElementResponse=False, useArrayFactor=True, useChanFreq=True, beamlib=losotobeamlib)

       phasedup = fixbeam_ST001(H5name)
       parset = create_losoto_beamcorparset(ms, refant=findrefant_core(H5name))
       force_close(H5name)
    
       #print('Phase up dataset, cannot use DPPP beam, do manual correction')
       cmdlosoto = losoto + ' ' + H5name + ' ' + parset
       print(cmdlosoto)
       logger.info(cmdlosoto)
       run(cmdlosoto)

    if usedppp and not phasedup :
        cmddppp = 'DP3 numthreads='+str(multiprocessing.cpu_count())+ ' msin=' + ms + ' msin.datacolumn=DATA '
        cmddppp += 'msout=' + msout + ' '
        cmddppp += 'msin.weightcolumn=WEIGHT_SPECTRUM '
        if msout == '.':
          cmddppp += 'msout.datacolumn=CORRECTED_DATA '
        if (lin2circ or circ2lin) and beam:
          cmddppp += 'steps=[beam,pystep] '
          if idg:
            cmddppp += 'beam.type=applybeam beam.updateweights=False ' # weights
          else:
            cmddppp += 'beam.type=applybeam beam.updateweights=True ' # weights
          cmddppp += 'beam.direction=[] ' # correction for the current phase center
          # cmddppp += 'beam.beammode= ' default is full, will undo element as well(!)
          
          cmddppp += 'pystep.python.module=polconv '
          cmddppp += 'pystep.python.class=PolConv '
          cmddppp += 'pystep.type=PythonDPPP '
          if lin2circ:
             cmddppp += 'pystep.lin2circ=1 '
          if circ2lin:
             cmddppp += 'pystep.circ2lin=1 '

        if beam and not (lin2circ or circ2lin):
          cmddppp += 'steps=[beam] '
          if idg:
            cmddppp += 'beam.type=applybeam beam.updateweights=False ' # weights
          else:
            cmddppp += 'beam.type=applybeam beam.updateweights=True ' # weights                    
          cmddppp += 'beam.direction=[] ' # correction for the current phase center
          # cmddppp += 'beam.beammode= ' default is full, will undo element as well(!)
          
        if (lin2circ or circ2lin) and not beam:
          cmddppp += 'steps=[pystep] '
          cmddppp += 'pystep.python.module=polconv '
          cmddppp += 'pystep.python.class=PolConv '
          cmddppp += 'pystep.type=PythonDPPP '
          if lin2circ:
             cmddppp += 'pystep.lin2circ=1 '
          if circ2lin:
             cmddppp += 'pystep.circ2lin=1 '

        if dysco:
          cmddppp += 'msout.storagemanager=dysco '
          cmddppp += 'msout.storagemanager.weightbitrate=16 '

        print('DP3 applybeam/polconv:', cmddppp)
        run(cmddppp)
        if msout == '.':
          #run(taql + " 'update " + ms + " set DATA=CORRECTED_DATA'")
          run("DP3 msin=" + ms + " msout=. msin.datacolumn=CORRECTED_DATA msout.datacolumn=DATA steps=[]", log=True)
    else:
        cmd = 'DP3 numthreads='+str(multiprocessing.cpu_count())+ ' msin=' + ms + ' msin.datacolumn=DATA '
        cmd += 'msout=' + msout + ' '
        cmd += 'msin.weightcolumn=WEIGHT_SPECTRUM '
        if msout == '.':
          cmd += 'msout.datacolumn=CORRECTED_DATA '

        if (lin2circ or circ2lin) and beam:
          cmd += 'steps=[ac1,ac2,pystep] '
          cmd += 'pystep.python.module=polconv '
          cmd += 'pystep.python.class=PolConv '
          cmd += 'pystep.type=PythonDPPP '
          if lin2circ:
             cmd += 'pystep.lin2circ=1 '
          if circ2lin:
             cmd += 'pystep.circ2lin=1 '

          cmd += 'ac1.parmdb='+H5name + ' ac2.parmdb='+H5name + ' '
          cmd += 'ac1.type=applycal ac2.type=applycal '
          cmd += 'ac1.correction=phase000 ac2.correction=amplitude000 '
          if idg:
            cmd += 'ac2.updateweights=False '  
          else:
            cmd += 'ac2.updateweights=True '
        if beam and not (lin2circ or circ2lin):
          cmd += 'steps=[ac1,ac2] '
          cmd += 'ac1.parmdb='+H5name + ' ac2.parmdb='+H5name + ' '
          cmd += 'ac1.type=applycal ac2.type=applycal '
          cmd += 'ac1.correction=phase000 ac2.correction=amplitude000 '
          if idg:
            cmd += 'ac2.updateweights=False '  
          else:
            cmd += 'ac2.updateweights=True '
        if (lin2circ or circ2lin) and not beam:
          cmd += 'steps=[pystep] '
          cmd += 'pystep.python.module=polconv '
          cmd += 'pystep.python.class=PolConv '
          cmd += 'pystep.type=PythonDPPP '
          if lin2circ:
             cmd += 'pystep.lin2circ=1 '
          if circ2lin:
             cmd += 'pystep.circ2lin=1 '


        if dysco:
          cmd += 'msout.storagemanager=dysco '
          cmd += 'msout.storagemanager.weightbitrate=16 '
        print('DP3 applycal/polconv:', cmd)
        run(cmd, log=True)
        if msout == '.':
          #run(taql + " 'update " + ms + " set DATA=CORRECTED_DATA'")
          run("DP3 msin=" + ms + " msout=. msin.datacolumn=CORRECTED_DATA msout.datacolumn=DATA steps=[]", log=True)

    # update ms POLTABLE 
    if (lin2circ or circ2lin) and update_poltable:
       tp = pt.table(ms+'/POLARIZATION',readonly=False,ack=True)
       if lin2circ:
          tp.putcol('CORR_TYPE',np.array([[5,6,7,8]],dtype=np.int32)) # FROM LIN-->CIRC
       if circ2lin:  
          tp.putcol('CORR_TYPE',np.array([[9,10,11,12]],dtype=np.int32)) # FROM CIRC-->LIN
       tp.close()

    return


def beamkeywords(ms):
    t = pt.table(ms, readonly=True, ack=False)
    applybeam_info = False
    try:
       beammode = t.getcolkeyword('DATA', 'LOFAR_APPLIED_BEAM_MODE')
       applybeam_info = True
       print('DP3 applybeam was used')
    except:
       print('No applybeam beam keywords were found, very old DP3 version was used in prefactor?')
    t.close()
    return applybeam_info

def beamcormodel(ms, dysco=True):
    """
    create MODEL_DATA_BEAMCOR where we store beam corrupted model data
    """
    H5name = ms + '_templatejones.h5'

    cmd = 'DP3 numthreads='+str(multiprocessing.cpu_count())+' msin=' + ms + ' msin.datacolumn=MODEL_DATA msout=. '
    cmd += 'msout.datacolumn=MODEL_DATA_BEAMCOR steps=[ac1,ac2] '
    if dysco:
      cmd +=  'msout.storagemanager=dysco '
      cmd += 'msout.storagemanager.weightbitrate=16 '
    cmd += 'ac1.parmdb='+H5name + ' ac2.parmdb='+H5name + ' '
    cmd += 'ac1.type=applycal ac2.type=applycal '
    cmd += 'ac1.correction=phase000 ac2.correction=amplitude000 ac2.updateweights=False '
    cmd += 'ac1.invert=False ac2.invert=False ' # Here we corrupt with the beam !
    print('DP3 applycal:', cmd)
    run(cmd, log=True)

    return

def findrms(mIn,maskSup=1e-7):
    """
    find the rms of an array, from Cycil Tasse/kMS
    """
    m=mIn[np.abs(mIn)>maskSup]
    rmsold=np.std(m)
    diff=1e-1
    cut=3.
    med=np.median(m)
    for i in range(10):
        ind=np.where(np.abs(m-med)<rmsold*cut)[0]
        rms=np.std(m[ind])
        if np.abs((rms-rmsold)/rmsold)<diff: break
        rmsold=rms
    return rms

def write_RMsynthesis_weights(fitslist, outfile):
   rmslist = np.zeros(len(fitslist))
   
   for fits_id, fitsfile in enumerate(fitslist):
      hdu = flatten(fits.open(fitsfile,  ignore_missing_end=True))
      rmslist[fits_id] = findrms(hdu.data)
      
   print(rmslist*1e6)
   rmslist = 1/rmslist**2 # 1/variance
   rmslist = rmslist/np.max(rmslist) # normalize to max 1
   
   f=open(outfile, 'w')
   for rms in rmslist:
     f.write(str(rms) + '\n')
   f.close()
   return

def findamplitudenoise(parmdb):
      """
      find the 'amplitude noise' in a parmdb, return non-clipped rms value
      """
      H5 = h5parm.h5parm(parmdb, readonly=True)
      amps =H5.getSolset('sol000').getSoltab('amplitude000').getValues()[0]
      weights = H5.getSolset('sol000').getSoltab('amplitude000').getValues(weight=True)[0]
      H5.close()

      idx = np.where(weights != 0.0)

      amps = amps[idx]
      amps = amps[np.isfinite(amps)]
      amps = np.log10(np.ndarray.flatten(amps))


      noise = findrms(amps)

      logger.info('Noise and clipped noise' + str(parmdb) + ' ' + str(np.std(amps)) + ' ' + str(noise))

      # do not return clipped noise, we are intersted in finding data with high outliers
      return np.std(amps)


def getimsize(boxfile, cellsize=1.5, increasefactor=1.2, DDE=None):
   """
   find imsize need to image a DS9 boxfile region
   """
   r = pyregion.open(boxfile)

   xs = np.ceil((r[0].coord_list[2])*increasefactor*3600./cellsize)
   ys = np.ceil((r[0].coord_list[3])*increasefactor*3600./cellsize)

   imsize = np.ceil(xs) # // Round up decimals to an integer
   if(imsize % 2 == 1):
       imsize = imsize + 1
   
   # if int(imsize) < 512:
   #    imsize = 512
   return int(imsize)


def smoothsols(parmdb, ms, longbaseline, includesphase=True):

    losoto = 'losoto'

    cmdlosoto = losoto + ' ' + parmdb + ' '
    noise = findamplitudenoise(parmdb)
    smooth = False
    if noise >= 0.1:
      cmdlosoto += create_losoto_mediumsmoothparset(ms, '9', longbaseline, includesphase=includesphase)
      smooth = True
    if noise < 0.1 and noise >= 0.08:
      cmdlosoto += create_losoto_mediumsmoothparset(ms, '7', longbaseline, includesphase=includesphase)
      smooth = True
    if noise < 0.08 and noise >= 0.07:
      cmdlosoto += create_losoto_mediumsmoothparset(ms, '5', longbaseline, includesphase=includesphase)
      smooth = True
    if noise < 0.07 and noise >= 0.04:
      cmdlosoto += create_losoto_mediumsmoothparset(ms, '3', longbaseline, includesphase=includesphase)
      smooth = True
    if smooth:
       print(cmdlosoto)
       logger.info(cmdlosoto)
       run(cmdlosoto)
    return


def change_refant(parmdb, soltab):
    '''
    Changes the reference antenna, if needed, for phase
    '''
    H5     = h5parm.h5parm(parmdb, readonly=False)
    phases = H5.getSolset('sol000').getSoltab(soltab).getValues()[0]
    weights= H5.getSolset('sol000').getSoltab(soltab).getValues(weight=True)[0]
    axesnames = H5.getSolset('sol000').getSoltab(soltab).getAxesNames()
    print('axesname', axesnames)
    # print 'SHAPE', np.shape(weights)#, np.size(weights[:,:,0,:,:])


    antennas = list(H5.getSolset('sol000').getSoltab(soltab).getValues()[1]['ant'])
    # print antennas
    
    if 'pol' in axesnames:
      idx0    = np.where((weights[:,:,0,:,:] == 0.0))[0]
      idxnan  = np.where((~np.isfinite(phases[:,:,0,:,:])))[0]

      refant = ' '
      tmpvar = float(np.size(weights[:,:,0,:,:]))
    else:
      idx0    = np.where((weights[:,0,:,:] == 0.0))[0]
      idxnan  = np.where((~np.isfinite(phases[:,0,:,:])))[0]

      refant = ' '
      tmpvar = float(np.size(weights[:,0,:,:]))

    if ((float(len(idx0))/tmpvar) > 0.5) or ((float(len(idxnan))/tmpvar) > 0.5):
      logger.info('Trying to changing reference anntena')


      for antennaid,antenna in enumerate(antennas[1::]):
            print(antenna)
            if 'pol' in axesnames:
              idx0    = np.where((weights[:,:,antennaid+1,:,:] == 0.0))[0]
              idxnan  = np.where((~np.isfinite(phases[:,:,antennaid+1,:,:])))[0]
              tmpvar = float(np.size(weights[:,:,antennaid+1,:,:]))
            else:
              idx0    = np.where((weights[:,antennaid+1,:,:] == 0.0))[0]
              idxnan  = np.where((~np.isfinite(phases[:,antennaid+1,:,:])))[0]
              tmpvar = float(np.size(weights[:,antennaid+1,:,:]))

            print(idx0, idxnan, ((float(len(idx0))/tmpvar)))
            if  ((float(len(idx0))/tmpvar) < 0.5) and ((float(len(idxnan))/tmpvar) < 0.5):
              logger.info('Found new reference anntena,' + str(antenna))
              refant = antenna
              break


    if refant != ' ':
        for antennaid,antenna in enumerate(antennas):
            if 'pol' in axesnames:
              phases[:,:,antennaid,:,:] = phases[:,:,antennaid,:,:] - phases[:,:,antennas.index(refant),:,:]
            else:
              # phases[:,antennaid,:,:] = phases[:,antennaid,:,:] - phases[:,antennas.index(refant),:,:]
              phases[:,:,antennaid,:] = phases[:,:,antennaid,:] - phases[:,:,antennas.index(refant),:]   
        H5.getSolset('sol000').getSoltab(soltab).setValues(phases)     

    H5.close()
    return


def calculate_solintnchan(compactflux):

    if compactflux >= 3.5:
        nchan = 5.
        solint_phase = 1.

    if compactflux <= 3.5:
        nchan = 5.
        solint_phase = 1.

    if compactflux <= 1.0:
        nchan= 10.
        solint_phase = 2

    if compactflux <= 0.75:
        nchan= 15.
        solint_phase = 3.
 
    # solint_ap = 100. / np.sqrt(compactflux)
    solint_ap = 120. /(compactflux**(1./3.)) # do third power-scaling
    # print solint_ap
    if solint_ap < 60.:
        solint_ap = 60.  # shortest solint_ap allowed
    if solint_ap > 180.:
        solint_ap = 180.  # longest solint_ap allowed

    if compactflux <= 0.4:
        nchan= 15.
        solint_ap = 180.

    return int(nchan), int(solint_phase), int(solint_ap)


def determine_compactsource_flux(fitsimage):
    '''
    return total flux in compect sources in the fitsimage
    input: a fits image
    output: flux density in Jy
    '''
    hdul = fits.open(fitsimage)
    bmaj = hdul[0].header['BMAJ']
    bmin = hdul[0].header['BMIN']
    avgbeam = 3600.*0.5*(bmaj + bmin)
    pixsize = 3600.*(hdul[0].header['CDELT2'])
    rmsbox1 = int(7.*avgbeam/pixsize)
    rmsbox2 = int((rmsbox1/10.) + 1.)

    img = bdsf.process_image(fitsimage,mean_map='zero', rms_map=True, rms_box = (rmsbox1,rmsbox2))
    total_flux_gaus = np.copy(img.total_flux_gaus)
    hdul.close()
    # trying to reset.....
    del img

    return total_flux_gaus


def getdeclinationms(ms):
    '''
    return approximate declination of pointing center of the ms
    input: a ms
    output: declination in degrees
    '''
    t = pt.table(ms +'/FIELD', readonly=True, ack=False)
    direction = np.squeeze ( t.getcol('PHASE_DIR') )
    t.close()
    return 360.*direction[1]/(2.*np.pi)

# print getdeclinationms('1E216.dysco.sub.shift.avg.weights.set0.ms')

def declination_sensivity_factor(declination):
    '''
    compute sensitivy factor lofar data, reduced by delclination, eq. from G. Heald.
    input declination is units of degrees
    '''
    factor = 1./(np.cos(2.*np.pi*(declination - 52.9)/360.)**2)

    return factor


def flaglowamps_fulljones(parmdb, lowampval=0.1, flagging=True, setweightsphases=True):
    '''
    flag bad amplitudes in H5 parmdb, those with values < lowampval
    assume pol-axis is present (can handle length 2 (diagonal), or 4 (fulljones))
    '''
    H5 = h5parm.h5parm(parmdb, readonly=False)
    amps =H5.getSolset('sol000').getSoltab('amplitude000').getValues()[0]
    weights = H5.getSolset('sol000').getSoltab('amplitude000').getValues(weight=True)[0]

    amps_xx = amps[...,0]
    amps_yy = amps[...,-1] # so this also works for pol axis length 1
    weights_xx = weights[...,0]
    weights_yy =weights[...,-1]
    idx_xx = np.where(amps_xx < lowampval)
    idx_yy = np.where(amps_yy < lowampval)

    if flagging: # no flagging
      weights_xx[idx_xx] = 0.0
      weights_yy[idx_yy] = 0.0
      print('Settting some weights to zero in flaglowamps_fulljones')

    amps_xx[idx_xx] = 1.0
    amps_yy[idx_yy] = 1.0

    weights[...,0] = weights_xx
    weights[...,-1] = weights_yy
    amps[...,0] = amps_xx
    amps[...,-1] = amps_yy

    H5.getSolset('sol000').getSoltab('amplitude000').setValues(weights,weight=True)
    H5.getSolset('sol000').getSoltab('amplitude000').setValues(amps)

    # also put phases weights and phases to zero
    if setweightsphases:
        phases = H5.getSolset('sol000').getSoltab('phase000').getValues()[0]
        weights_p = H5.getSolset('sol000').getSoltab('phase000').getValues(weight=True)[0]
        phases_xx = phases[...,0]
        phases_yy = phases[...,-1]
        weights_p_xx = weights_p[...,0]
        weights_p_yy = weights_p[...,-1]

        if flagging: # no flagging
            weights_p_xx[idx_xx] = 0.0
            weights_p_yy[idx_yy] = 0.0
            phases_xx[idx_xx] = 0.0
            phases_yy[idx_yy] = 0.0

            weights_p[...,0] = weights_p_xx
            weights_p[...,-1] = weights_p_yy
            phases[...,0] = phases_xx
            phases[...,-1] = phases_yy

            H5.getSolset('sol000').getSoltab('phase000').setValues(weights_p,weight=True)
            H5.getSolset('sol000').getSoltab('phase000').setValues(phases)
    H5.close()
    return

def flaglowamps(parmdb, lowampval=0.1,flagging=True, setweightsphases=True):
    '''
    flag bad amplitudes in H5 parmdb, those with values < lowampval
    '''
    H5 = h5parm.h5parm(parmdb, readonly=False)
    amps =H5.getSolset('sol000').getSoltab('amplitude000').getValues()[0]
    idx = np.where(amps < lowampval)
    weights = H5.getSolset('sol000').getSoltab('amplitude000').getValues(weight=True)[0]


    if flagging:
      weights[idx] = 0.0
      print('Settting some weights to zero in flaglowamps')
    amps[idx] = 1.0
    H5.getSolset('sol000').getSoltab('amplitude000').setValues(weights,weight=True)
    H5.getSolset('sol000').getSoltab('amplitude000').setValues(amps)

    # also put phases weights and phases to zero
    if setweightsphases:
        phases =H5.getSolset('sol000').getSoltab('phase000').getValues()[0]
        weights_p = H5.getSolset('sol000').getSoltab('phase000').getValues(weight=True)[0]
        if flagging:
            weights_p[idx] = 0.0
            phases[idx] = 0.0
            # print(idx)
            H5.getSolset('sol000').getSoltab('phase000').setValues(weights_p,weight=True)
            H5.getSolset('sol000').getSoltab('phase000').setValues(phases)
    
    # H5.getSolset('sol000').getSoltab('phase000').flush()
    # H5.getSolset('sol000').getSoltab('amplitude000').flush()
    H5.close()
    return


def flaghighamps(parmdb, highampval=10.,flagging=True, setweightsphases=True):
    '''
    flag bad amplitudes in H5 parmdb, those with values > highampval
    '''
    H5 = h5parm.h5parm(parmdb, readonly=False)
    amps =H5.getSolset('sol000').getSoltab('amplitude000').getValues()[0]
    idx = np.where(amps > highampval)
    weights = H5.getSolset('sol000').getSoltab('amplitude000').getValues(weight=True)[0]


    if flagging:
      weights[idx] = 0.0
      print('Settting some weights to zero in flaghighamps')
    amps[idx] = 1.0
    H5.getSolset('sol000').getSoltab('amplitude000').setValues(weights,weight=True)
    H5.getSolset('sol000').getSoltab('amplitude000').setValues(amps)

    # also put phases weights and phases to zero
    if setweightsphases:
        phases =H5.getSolset('sol000').getSoltab('phase000').getValues()[0]
        weights_p = H5.getSolset('sol000').getSoltab('phase000').getValues(weight=True)[0]
        if flagging:
            weights_p[idx] = 0.0
            phases[idx] = 0.0
            # print(idx)
            H5.getSolset('sol000').getSoltab('phase000').setValues(weights_p,weight=True)
            H5.getSolset('sol000').getSoltab('phase000').setValues(phases)
    
    # H5.getSolset('sol000').getSoltab('phase000').flush()
    # H5.getSolset('sol000').getSoltab('amplitude000').flush()
    H5.close()
    return

def flaghighamps_fulljones(parmdb, highampval=10.,flagging=True, setweightsphases=True):
    '''
    flag bad amplitudes in H5 parmdb, those with values > highampval
    assume pol-axis is present (can handle 2 (diagonal), or 4 (fulljones))
    '''
    H5 = h5parm.h5parm(parmdb, readonly=False)
    amps =H5.getSolset('sol000').getSoltab('amplitude000').getValues()[0]
    weights = H5.getSolset('sol000').getSoltab('amplitude000').getValues(weight=True)[0]

    amps_xx = amps[...,0]
    amps_yy = amps[...,-1] # so this also works for pol axis length 1
    weights_xx = weights[...,0]
    weights_yy =weights[...,-1]
    idx_xx = np.where(amps_xx > highampval)
    idx_yy = np.where(amps_yy > highampval)

    if flagging: # no flagging
      weights_xx[idx_xx] = 0.0
      weights_yy[idx_yy] = 0.0
      print('Settting some weights to zero in flaghighamps_fulljones')

    amps_xx[idx_xx] = 1.0
    amps_yy[idx_yy] = 1.0

    weights[...,0] = weights_xx
    weights[...,-1] = weights_yy
    amps[...,0] = amps_xx
    amps[...,-1] = amps_yy

    H5.getSolset('sol000').getSoltab('amplitude000').setValues(weights,weight=True)
    H5.getSolset('sol000').getSoltab('amplitude000').setValues(amps)

    # also put phases weights and phases to zero
    if setweightsphases:
        phases = H5.getSolset('sol000').getSoltab('phase000').getValues()[0]
        weights_p = H5.getSolset('sol000').getSoltab('phase000').getValues(weight=True)[0]
        phases_xx = phases[...,0]
        phases_yy = phases[...,-1]
        weights_p_xx = weights_p[...,0]
        weights_p_yy = weights_p[...,-1]

        if flagging: # no flagging
            weights_p_xx[idx_xx] = 0.0
            weights_p_yy[idx_yy] = 0.0
            phases_xx[idx_xx] = 0.0
            phases_yy[idx_yy] = 0.0

            weights_p[...,0] = weights_p_xx
            weights_p[...,-1] = weights_p_yy
            phases[...,0] = phases_xx
            phases[...,-1] = phases_yy

            H5.getSolset('sol000').getSoltab('phase000').setValues(weights_p,weight=True)
            H5.getSolset('sol000').getSoltab('phase000').setValues(phases)
    H5.close()
    return


def flagbadamps(parmdb, setweightsphases=True, flagamp1=True, flagampxyzero=True):
    '''
    flag bad amplitudes in H5 parmdb, those with amplitude==1.0
    '''
    # check if full jones
    H=tables.open_file(parmdb, mode='a')
    amplitude = H.root.sol000.amplitude000.val[:]
    weights   = H.root.sol000.amplitude000.weight[:]
    if amplitude.shape[-1] == 4:
      fulljones = True
    else:
      fulljones = False
 
    if not fulljones:
       idx = np.where(amplitude <= 0.0)      
       amplitude[idx] = 1.0
       if flagamp1:
          idx = np.where(amplitude == 1.0)
          weights[idx] = 0.0
       
       H.root.sol000.amplitude000.val[:] = amplitude
       H.root.sol000.amplitude000.weight[:] = weights 
       # also put phases weights and phases to zero
       if setweightsphases:
          phase = H.root.sol000.phase000.val[:]
          weights_p = H.root.sol000.phase000.weight[:]
          phase[idx] = 0.0
          weights_p[idx] = 0.0
          H.root.sol000.phase000.val[:] = phase
          H.root.sol000.phase000.weight[:] = weights_p 
       H.close()


    if fulljones:
       if setweightsphases:
          phase = H.root.sol000.phase000.val[:]
          weights_p = H.root.sol000.phase000.weight[:]

       # XX
       amps_xx = amplitude[...,0]
       weights_xx = weights[...,0]
       idx = np.where(amps_xx <= 0.0)
       amps_xx[idx] = 1.0
       if flagamp1:
          idx = np.where(amps_xx == 1.0)
          weights_xx[idx] =  0.0
       if setweightsphases:
          phase_xx = phase[...,0]
          weights_p_xx = weights_p[...,0]
          phase_xx[idx] = 0.0 
          weights_p_xx[idx] = 0.0

       # XY
       amps_xy = amplitude[...,1]
       weights_xy = weights[...,1]
       idx = np.where(amps_xy == 1.0)
       amps_xy[idx] = 0.0
       if flagampxyzero:
          idx = np.where(amps_xy == 0.0) # we do not want this if we resetsols
          weights_xy[idx] =  0.0
       if setweightsphases:
          phase_xy = phase[...,1]
          weights_p_xy = weights_p[...,1]
          phase_xy[idx] = 0.0 
          weights_p_xy[idx] = 0.0

       # YX
       amps_yx = amplitude[...,2]
       weights_yx = weights[...,2]
       idx = np.where(amps_yx == 1.0)
       amps_yx[idx] = 0.0
       if flagampxyzero:
          idx = np.where(amps_yx == 0.0)
          weights_yx[idx] =  0.0
       if setweightsphases:
          phase_yx = phase[...,2]
          weights_p_yx = weights_p[...,2]
          phase_yx[idx] = 0.0 
          weights_p_yx[idx] = 0.0

       # YY
       amps_yy = amplitude[...,3]
       weights_yy = weights[...,3]
       idx = np.where(amps_yy <= 0.0)
       amps_yy[idx] = 1.0
       if flagamp1:
          idx = np.where(amps_yy == 1.0)
          weights_yy[idx] =  0.0
       if setweightsphases:
          phase_yy = phase[...,3]
          weights_p_yy = weights_p[...,3]
          phase_yy[idx] = 0.0 
          weights_p_yy[idx] = 0.0
       
       amplitude[...,0] = amps_xx
       amplitude[...,1] = amps_xy
       amplitude[...,2] = amps_yx
       amplitude[...,3] = amps_yy
  
       weights[...,0] = weights_yy
       weights[...,1] = weights_xy
       weights[...,2] = weights_yx
       weights[...,3] = weights_yy
       H.root.sol000.amplitude000.val[:] = amplitude
       H.root.sol000.amplitude000.weight[:] = weights 
  
       if setweightsphases:
          phase[...,0] = phase_xx
          phase[...,1] = phase_xy
          phase[...,2] = phase_yx
          phase[...,3] = phase_yy
  
          weights_p[...,0] = weights_p_yy
          weights_p[...,1] = weights_p_xy
          weights_p[...,2] = weights_p_yx
          weights_p[...,3] = weights_p_yy
          H.root.sol000.phase000.val[:] = phase
          H.root.sol000.phase000.weight[:] = weights_p 
       H.close()
    return


def medianamp(h5):
    # assume pol-axis is present (can handle length, 1 (scalar), 2 (diagonal), or 4 (fulljones))
    H=tables.open_file(h5)
    amplitude = H.root.sol000.amplitude000.val[:]
    weights   = H.root.sol000.amplitude000.weight[:]
    if amplitude.shape[-1] == 4:
      fulljones = True
    else:
      fulljones = False
    H.close()

    print('Amplitude and Weights shape:', weights.shape, amplitude.shape)
    amps_xx = amplitude[...,0]
    amps_yy = amplitude[...,-1] # so this also works for pol axis length 1
    weights_xx = weights[...,0]
    weights_yy = weights[...,-1]

    idx_xx = np.where(weights_xx != 0.0) 
    idx_yy = np.where(weights_yy != 0.0) 
    amps_xx_tmp = amps_xx[idx_xx]
    amps_yy_tmp = amps_yy[idx_yy]
    
    idx_xx = np.where(amps_xx_tmp != 1.0) # remove 1.0, these can be "resetsols" values
    idx_yy = np.where(amps_yy_tmp != 1.0) # remove 1.0, these can be "resetsols" values
    if any(map(len, idx_xx)) and any(map(len, idx_yy)):
       medamps = 0.5*(10**(np.nanmedian(np.log10(amps_xx_tmp[idx_xx]))) + 10**(np.nanmedian(np.log10(amps_yy_tmp[idx_yy]))))
    else:
       medamps = 1.
    print('Median  Stokes I amplitude of ', h5, ':', medamps)

    if fulljones:
       amps_xy = amplitude[...,1]
       amps_yx = amplitude[...,2]
       weights_xy = weights[...,1]
       weights_yx = weights[...,2]
       idx_xy = np.where(weights_xy != 0.0)
       idx_yx = np.where(weights_yx != 0.0)
       
       amps_xy_tmp = amps_xy[idx_xy]
       amps_yx_tmp = amps_yx[idx_yx]
       
       idx_xy = np.where(amps_xy_tmp > 0.0)
       idx_yx = np.where(amps_yx_tmp > 0.0)
       
       medamps_cross = 0.5*(10**(np.nanmedian(np.log10(amps_xy_tmp[idx_xy]))) + 10**(np.nanmedian(np.log10(amps_yx_tmp[idx_yx]))))
       print('Median amplitude of XY+YX ', h5, ':', medamps_cross)

    logger.info('Median Stokes I amplitude of ' + h5 + ': ' + str(medamps))
    return medamps

def get_double_slice(values, idx: list = None, axes: list = None):
    """
    Get double slices
    
    :param values: numpy array
    :param idx: list of indices
    :param axes: list of axes corresponding to indices
    
    return slice
    """
    
    ax1, ax2 = axes
    id1, id2 = idx
    l = list([slice(None)] * ax1 + [id1] + [slice(None)] * (len(values.shape) - ax1 - 1))
    l[ax2] = id2
    return tuple(l)


def get_double_slice_len(values, idx: list = None, axes: list = None):
    """
    Get double slices
    
    :param values: numpy array
    :param idx: list of indices
    :param axes: list of axes corresponding to indices
    
    return slice
    """
    
    ax1, ax2 = axes
    id1, id2 = idx
    l = list([slice(None)] * ax1 + [id1] + [slice(None)] * (len(values) - ax1 - 1))
    l[ax2] = id2
    return tuple(l)


def getallantennafromh5list(h5list):
    '''
    get all unique antenna names in a list of h5 files
    '''
    hasphase = True
    hasamps = True
    hasrotation = True
    hastec = True

    H = tables.open_file(h5list[0], mode='a')
    # Figure out if we what solutions there are
    
    try:
        antennas = H.root.sol000.amplitude000.ant[:]
    except: 
        hasamps = False
    try:
        antennas = H.root.sol000.phase000.ant[:]
    except:
        hasphase = False
    try:
        antennas = H.root.sol000.tec000.ant[:]
    except:
        hastec = False
    try:
        antennas = H.root.sol000.rotation000.ant[:]
    except:
        hasrotation = False     
    print('Reading:', h5list[0], ' -- Number of anntena:', len(antennas))
    H.close()

    if len(h5list) > 0: # if there is only 1 we are already done given the code above
        for h5 in h5list[1::]:
            H = tables.open_file(h5, mode='a')
            if hasphase:
                ants = H.root.sol000.phase000.ant[:]
            elif hasamps:  
                ants = H.root.sol000.amplitude000.ant[:]
            elif hastec:
                ants = H.root.sol000.tec000.ant[:]
            elif hasrotation:
                ants = H.root.sol000.rotation000.ant[:]
            print('Reading:', h5, ' -- Number of anntena:', len(ants))
            H.close()    
            antennas = np.concatenate((antennas, np.ndarray.flatten(ants)),axis=0)
    return np.unique(antennas)


def get_matrix_forslopenorm(parmdblist):
    assert type(parmdblist) == list, 'input is not list' # use only lists as input
    #allantenna =  getallantennafromh5list(parmdblist)
    H = tables.open_file(parmdblist[0])
    directions = H.root.sol000.amplitude000.dir[:] # should be the same for all parmdblist in the list
    H.close()

    N_h5  = len(parmdblist)
    #N_ant = len(allantenna)
    N_direction = len(directions)
    
    
    #matrix_amps = np.zeros((N_h5,N_direction)) # sum of log10 of amps
    matrix_weights = np.zeros((N_h5,N_direction)) # number if input values
    matrix_slope = np.zeros((N_h5,N_direction)) # of mean slope log10 amps
    
    for h5_id, h5 in enumerate(parmdblist):
        H = tables.open_file(h5)
        ampsfull =H.root.sol000.amplitude000.val[:]
        #weightsfull = H.root.sol000.amplitude000.weight[:]
        ants_inh5 = H.root.sol000.amplitude000.ant[:]
        axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
        diraxis = axisn.index('dir')
        freqaxis = axisn.index('freq')
        H.close()

        for dir_id, direction in enumerate(directions):
            slice_obj = [slice(None)] * diraxis + [dir_id] + [slice(None)] * (ampsfull.ndim - diraxis - 1)
            amps = ampsfull[tuple(slice_obj)]
            #weights = weightsfull[tuple(slice_obj)]
    
            matrix_slope[h5_id,dir_id] = np.mean(np.diff(np.log10(amps),axis=freqaxis))
            matrix_weights[h5_id,dir_id] = amps.size/N_direction
            print('Direction:', dir_id, 'Slope:', matrix_slope[h5_id,dir_id])
    return matrix_slope, matrix_weights


def normslope_withmatrix(parmdblist):
    '''
    Global slope normalization per direction
    input: list of h5 solution files
    '''
    assert type(parmdblist) == list, 'input is not list' # use only lists as input
    H = tables.open_file(parmdblist[0])
    directions = H.root.sol000.amplitude000.dir[:] # should be the same for all parmdb in the list
    H.close()

    #allantenna =  getallantennafromh5list(parmdblist)
    matrix_slope, matrix_weights = get_matrix_forslopenorm(parmdblist)
    #print(matrix_slope.shape)
    
    #create norm factors
    norm_array = np.zeros((matrix_slope.shape[1]))
    #matrix_weights[h5_id,ant_id,dir_id]
    for dir_id, direction in enumerate(directions):
        norm_array[dir_id] = np.average(matrix_slope[:,dir_id], weights=matrix_weights[:,dir_id])
   
    # write result
    for h5_id, h5 in enumerate(parmdblist):
        H = tables.open_file(h5, mode='a')
        ampsfull =H.root.sol000.amplitude000.val[:]
        weightsfull = H.root.sol000.amplitude000.weight[:]
        ants_inh5 = H.root.sol000.amplitude000.ant[:]
        axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
        diraxis = axisn.index('dir')
        freqaxis = axisn.index('freq')
        frequencies = H.root.sol000.amplitude000.freq[:]
 
        for dir_id, direction in enumerate(directions):
          print(h5, dir_id, norm_array[dir_id])
          for freq_id, frequency in enumerate(frequencies):    
            slice_obj = get_double_slice(ampsfull, [freq_id, dir_id], [freqaxis, diraxis])
          
            amps = ampsfull[slice_obj]
            ampsfull[slice_obj] = 10**( np.log10(amps) - (norm_array[dir_id]*float(freq_id)))
            
      
        H.root.sol000.amplitude000.val[:] = ampsfull
        H.flush()
        H.close()
    return  


def get_matrix_forampnorm(parmdblist):
    assert type(parmdblist) == list, 'input is not list' # use only lists as input
    allantenna =  getallantennafromh5list(parmdblist)
    H = tables.open_file(parmdblist[0])
    directions = H.root.sol000.amplitude000.dir[:] # should be the same for all parmdblist in the list
    H.close()


    N_h5  = len(parmdblist)
    N_ant = len(allantenna)
    N_direction = len(directions)
    
    
    matrix_amps = np.zeros((N_h5,N_ant,N_direction)) # sum of log10 of amps
    matrix_weights = np.zeros((N_h5,N_ant,N_direction)) # number if input values
    #matrix_slope = np.zeros((N_h5,N_ant,N_direction)) # of mean slope log10 amps
    
    for h5_id, h5 in enumerate(parmdblist):
        H = tables.open_file(h5)
        amps =H.root.sol000.amplitude000.val[:]
        weights = H.root.sol000.amplitude000.weight[:]
        ants_inh5 = H.root.sol000.amplitude000.ant[:]
        axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
        diraxis = axisn.index('dir')
        antaxis = axisn.index('ant')
        H.close()

        for antenna in allantenna:
            ant_id = np.where(ants_inh5 == antenna)[0]
            print(h5, antenna)
            if len(ant_id) > 0:
                ant_id = ant_id[0]
                for dir_id, direction in enumerate(directions):
                    #print(str(antenna) + ' ' +'Normalizing direction', direction)
                    slice_obj = get_double_slice(amps, [ant_id, dir_id], [antaxis, diraxis])
                    amps_sel = amps[slice_obj]
                    weights_sel = weights[slice_obj]
                    idx = np.where(weights_sel != 0.0)
                    weights_sel[idx] = 1.0
                    
                    matrix_amps[h5_id,ant_id,dir_id] = np.sum(np.log10(amps_sel[idx]))
                    matrix_weights[h5_id,ant_id,dir_id] = np.sum(weights_sel[idx])
                    #print(np.sum(weights_sel[idx]))
                    #matrix_slope[h5_id,ant_id,dir_id] = np.mean(np.diff(np.log10(amps_sel[idx])))
    return matrix_amps, matrix_weights

def normamplitudes_withmatrix(parmdblist):
    '''
    Normalize global amplitues per direction and per antenna
    '''
    H = tables.open_file(parmdblist[0])
    directions = H.root.sol000.amplitude000.dir[:] # should be the same for all parmdb in the list
    H.close()

    allantenna =  getallantennafromh5list(parmdblist)
    matrix_amps, matrix_weights = get_matrix_forampnorm(parmdblist)
    print(matrix_amps.shape)
    #sys.exit()
    #create norm factors
    norm_array = np.zeros((matrix_amps.shape[1],matrix_amps.shape[2]))
    #matrix_weights[h5_id,ant_id,dir_id]
    for ant_id, antenna in enumerate(allantenna):
         for dir_id, direction in enumerate(directions):
             norm_array[ant_id,dir_id] = np.sum(matrix_amps[:,ant_id,dir_id])/np.sum(matrix_weights[:,ant_id,dir_id])
    
   
    # write result
    for h5_id, h5 in enumerate(parmdblist):
        H = tables.open_file(h5, mode='a')
        amps =H.root.sol000.amplitude000.val[:]
        weights = H.root.sol000.amplitude000.weight[:]
        ants_inh5 = H.root.sol000.amplitude000.ant[:]
        axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
        diraxis = axisn.index('dir')
        antaxis = axisn.index('ant')
 
        #matrix_weights[h5_id,ant_id,dir_id]
        for antenna in allantenna:
            ant_id = np.where(ants_inh5 == antenna)[0]
            print(h5, antenna)
            if len(ant_id) > 0:
                ant_id = ant_id[0]
                for dir_id, direction in enumerate(directions):
                    print(ant_id, dir_id,  norm_array[ant_id,dir_id])
                    slice_obj = get_double_slice(amps, [ant_id, dir_id], [antaxis, diraxis])
                    amps[slice_obj] = 10**(np.log10(amps[slice_obj]) - norm_array[ant_id,dir_id])
        H.root.sol000.amplitude000.val[:] = amps
        H.flush()
        H.close()
    return        
     

def normamplitudes(parmdb, norm_per_ms=False, norm_per_ant=False):
    """
    Normalize H5 amplitudes
  
    :param paramdb: list of h5 files
    :param norm_per_ms : boolean 
    :param norm_per_ant : boolean
    
    return None
    """
    has_dir = h5_has_dir(parmdb[0])
    H = tables.open_file(parmdb[0])
    axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
    if has_dir:
        directions = H.root.sol000.amplitude000.dir[:] # should be the same for all parmdb in the list
    H.close()
   
   
    # ---------------------- THIS IS FOR norm_per_ant=False ----------
    # ----------------------------------------------------------------
    # ----------------------------------------------------------------
    if norm_per_ms and not norm_per_ant:
        for parmdbi in parmdb:
            H = tables.open_file(parmdbi,mode='a')
            if not has_dir:        
                amps =H.root.sol000.amplitude000.val[:]
                weights = H.root.sol000.amplitude000.weight[:]
                idx = np.where(weights != 0.0)
                amps = np.log10(amps)
                logger.info(parmdbi + ' Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
                amps = amps - (np.nanmean(amps[idx]))
                logger.info(parmdbi + ' Mean amplitudes after normalization: ' + str(10**(np.nanmean(amps[idx]))))
                amps = 10**(amps)
                H.root.sol000.amplitude000.val[:] = amps
                H.flush()
                H.close()
            else:    
                axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
                diraxis = axisn.index('dir')
                ampsfull =H.root.sol000.amplitude000.val[:]
                weightsfull = H.root.sol000.amplitude000.weight[:]
                for dir_id, direction in enumerate(directions):
                    print('Normalizing direction', direction, 'Axis entry number', axisn.index('dir'))
                    slice_obj = [slice(None)] * diraxis + [dir_id] + [slice(None)] * (ampsfull.ndim - diraxis - 1)
                    amps = ampsfull[tuple(slice_obj)]
                    weights = weightsfull[tuple(slice_obj)]
    
                    idx = np.where(weights != 0.0)
                    amps = np.log10(amps)
                    logger.info('Direction:' + str(dir_id) + '  ' + parmdbi + ' Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
                    print('Direction:' + str(dir_id) + '  ' + parmdbi + ' Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
                    amps = amps - (np.nanmean(amps[idx]))
                    logger.info('Direction:' + str(dir_id) + '  ' + parmdbi + ' Mean amplitudes after normalization: ' + str(10**(np.nanmean(amps[idx]))))
                    amps = 10**(amps)    
                    # put back vales in ampsfull
                    ampsfull[tuple(slice_obj)] = amps
                    
                H.root.sol000.amplitude000.val[:] = ampsfull
                H.flush()
                H.close()        
        print('Return with norm_per_ant=False')
        return  # norm_per_ms

    if not has_dir and not norm_per_ant:      
        for i, parmdbi in enumerate(parmdb):
            H = tables.open_file(parmdbi,mode='r')
            ampsfull = H.root.sol000.amplitude000.val[:]
            weightsfull = H.root.sol000.amplitude000.weight[:]
            idx = np.where(weightsfull != 0.0)
            logger.info(parmdbi + '  Normfactor: '+ str(10**(np.nanmean(np.log10(ampsfull[idx])))))
            if i == 0:
                amps = np.ndarray.flatten(ampsfull[idx])
            else:
                amps = np.concatenate((amps, np.ndarray.flatten(ampsfull[idx])),axis=0)

            H.close()
        normmin = (np.nanmean(np.log10(amps)))
        logger.info('Global normfactor: ' + str(10**normmin))
        # now write the new H5 files
        for parmdbi in parmdb:
            H = tables.open_file(parmdbi,mode='a')
            ampsfull = H.root.sol000.amplitude000.val[:]
            ampsfull = (np.log10(ampsfull)) - normmin
            ampsfull = 10**ampsfull
            H.root.sol000.amplitude000.val[:] = ampsfull
            H.flush()
            H.close()
    elif not norm_per_ant:    
        for dir_id, direction in enumerate(directions):  
            for i, parmdbi in enumerate(parmdb):
                H = tables.open_file(parmdbi,mode='r')
                axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
                ampsfull = H.root.sol000.amplitude000.val[:]
                weightsfull = H.root.sol000.amplitude000.weight[:]
                diraxis = axisn.index('dir')  
                H.close() 
                
                slice_obj = [slice(None)] * diraxis + [dir_id] + [slice(None)] * (ampsfull.ndim - diraxis - 1)
                ampsi = ampsfull[tuple(slice_obj)]
                weights = weightsfull[tuple(slice_obj)]
                
                idx = np.where(weights != 0.0)
                if i == 0:
                    amps = np.ndarray.flatten(ampsi[idx])
                else:
                    amps = np.concatenate((amps, np.ndarray.flatten(ampsi[idx])),axis=0)
            normmin = (np.nanmean(np.log10(amps)))
            logger.info('Global normfactor directon:' +  str(dir_id) + ' ' + str(10**normmin))
            print('Global normfactor directon:' +  str(dir_id) + ' ' + str(10**normmin))
            for parmdbi in parmdb:
                H = tables.open_file(parmdbi,mode='a')
                axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
                ampsfull = H.root.sol000.amplitude000.val[:]
                diraxis = axisn.index('dir')
                # put back vales in ampsfull
                slices = tuple(slice(None) if i != diraxis else dir_id for i in range(diraxis + 1))
                ampsfull[slices] = np.log10(ampsfull[slices]) - normmin
                ampsfull[slices] = 10**ampsfull[slices]
                H.root.sol000.amplitude000.val[:] = ampsfull
                H.flush()
                H.close()
        print('Return with norm_per_ant=False')
        return # return because we do not need to go to the norm_per_an=True part


    # ---------------------- THIS IS FOR norm_per_ant=True ----------
    # ----------------------------------------------------------------
    # ----------------------------------------------------------------
    allantenna =  getallantennafromh5list(parmdb)

    if norm_per_ms and norm_per_ant:
        for parmdbi in parmdb:
            H = tables.open_file(parmdbi,mode='a')
            ants_inh5 = H.root.sol000.amplitude000.ant[:]
            antaxis = axisn.index('ant')
            if not has_dir:        
                ampsfull =H.root.sol000.amplitude000.val[:]
                weightsfull = H.root.sol000.amplitude000.weight[:]
                
                for antenna in allantenna:
                    ant_id = np.where(ants_inh5 == antenna)[0]
                    if len(ant_id) > 0:
                        ant_id = ant_id[0]
                        print('Doing:',antenna) 
                        print('antenna index: ', )
                        slice_obj = [slice(None)] * antaxis + [ant_id] + [slice(None)] * (ampsfull.ndim - diraxis - 1)
                        amps = ampsfull[tuple(slice_obj)]
                        weights = weightsfull[tuple(slice_obj)] 
                
                        idx = np.where(weights != 0.0)
                        amps = np.log10(amps)
                        logger.info(str(antenna) + ' ' + parmdbi + ' Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
                        amps = amps - (np.nanmean(amps[idx]))
                        logger.info(str(antenna) + ' ' + parmdbi + ' Mean amplitudes after normalization: ' + str(10**(np.nanmean(amps[idx]))))
                        amps = 10**(amps)
          
                        ampsfull[tuple(slice_obj)] = amps
                    else:
                        print('Skipping this antenna as it is not present in the h5', antenna)
                 
                H.root.sol000.amplitude000.val[:] = ampsfull
                H.flush()
                H.close()
            else:    
                axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
                diraxis = axisn.index('dir')
                antaxis = axisn.index('ant')
                ampsfull =H.root.sol000.amplitude000.val[:]
                weightsfull = H.root.sol000.amplitude000.weight[:]
                
                for antenna in allantenna:
                    ant_id = np.where(ants_inh5 == antenna)[0]
                    if len(ant_id) > 0:
                        for dir_id, direction in enumerate(directions):
                            print(str(antenna) + ' ' +'Normalizing direction', direction)
                            
                            slice_obj = get_double_slice(ampsfull, [ant_id, dir_id], [antaxis, diraxis])
                           
                            amps = ampsfull[slice_obj]
                            weights = weightsfull[slice_obj]
            
                            idx = np.where(weights != 0.0)
                            amps = np.log10(amps)
                            logger.info(str(antenna) + ' ' +'Direction:' + str(dir_id) + '  ' + parmdbi + ' Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
                            print('Direction:' + str(dir_id) + '  ' + parmdbi + ' Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
                            amps = amps - (np.nanmean(amps[idx]))
                            logger.info(str(antenna) + ' ' +'Direction:' + str(dir_id) + '  ' + parmdbi + ' Mean amplitudes after normalization: ' + str(10**(np.nanmean(amps[idx]))))
                            amps = 10**(amps)    
                            # put back vales in ampsfull
                            ampsfull[slice_obj] = amps
                    else:
                        print('Skipping this antenna as it is not present in the h5', antenna)
                
                H.root.sol000.amplitude000.val[:] = ampsfull
                H.flush()
                H.close()        
        print('Return with norm_per_ant=True')
        return  # norm_per_ms

    if not has_dir and norm_per_ant:      
        print('Not implemented  "if not has_dir and norm_per_ant" ')
        sys.exit()

    elif norm_per_ant:    
        for antenna in allantenna:        
                for dir_id, direction in enumerate(directions):  
                    try:
                        del(amps) # delete variable at the start
                    except:
                        pass
                    for i, parmdbi in enumerate(parmdb):
                        H = tables.open_file(parmdbi,mode='r')
                        ants_inh5 = H.root.sol000.amplitude000.ant[:]
                        axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
                        #ampsfull = H.root.sol000.amplitude000.val[:]
                        #weightsfull = H.root.sol000.amplitude000.weight[:]
                        diraxis = axisn.index('dir')  
                        antaxis = axisn.index('ant')  
                        
                        
                        ant_id = np.where(ants_inh5 == antenna)[0]
                        if len(ant_id) > 0:
                            slice_obj = get_double_slice_len(axisn, [ant_id, dir_id], [antaxis, diraxis])
                            ampsi = H.root.sol000.amplitude000.val[slice_obj]
                            weights = H.root.sol000.amplitude000.weight[slice_obj]
                        
                            idx = np.where(weights != 0.0)
                            if 'amps' in locals(): # in this case amps was already made
                                amps = np.concatenate((amps, np.ndarray.flatten(ampsi[idx])),axis=0)
                            else: # create amps
                                amps = np.ndarray.flatten(ampsi[idx])
                        H.close() 
                        
                    normmin = (np.nanmean(np.log10(amps)))
                    
                    logger.info(str(antenna) + ' Global normfactor directon:' +  str(dir_id) + ' ' + str(10**normmin))
                    print(str(antenna) + ' Global normfactor directon:' +  str(dir_id) + ' ' + str(10**normmin))
                    for parmdbi in parmdb:
                        print('Write to:', parmdbi)
                        H = tables.open_file(parmdbi,mode='a')
                        ants_inh5 = H.root.sol000.amplitude000.ant[:]
                        axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
                        #ampsfull = H.root.sol000.amplitude000.val[:]
                        diraxis = axisn.index('dir')
                        antaxis = axisn.index('ant')
                        
                        # put back vales in ampsfull
                        ant_id = np.where(ants_inh5 == antenna)[0]
                        if len(ant_id) > 0:
                            slice_obj = get_double_slice_len(axisn, [ant_id, dir_id], [antaxis, diraxis])
                            ampsfull = H.root.sol000.amplitude000.val[slice_obj]
                        
                            ampsfull = 10**(np.log10(ampsfull) - normmin)
                            #ampsfull = 10**ampsfull
                            H.root.sol000.amplitude000.val[slice_obj] = ampsfull
                        H.flush()
                        H.close()
            #else:
            #    print('Skipping this antenna as it is not present in the h5', antenna)
    
    print('Return with norm_per_ant=True')
    return           


def normamplitudes_old2(parmdb, norm_per_ms=False, norm_per_ant=False):
    has_dir = h5_has_dir(parmdb[0])
    H = tables.open_file(parmdb[0])
    axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
    if has_dir:
        directions = H.root.sol000.amplitude000.dir[:] # should be the same for all parmdb in the list
    H.close()

    if norm_per_ms:
        for parmdbi in parmdb:
            H = tables.open_file(parmdbi,mode='a')
            if not has_dir:        
                amps =H.root.sol000.amplitude000.val[:]
                weights = H.root.sol000.amplitude000.weight[:]
                idx = np.where(weights != 0.0)
                amps = np.log10(amps)
                logger.info(parmdbi + ' Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
                amps = amps - (np.nanmean(amps[idx]))
                logger.info(parmdbi + ' Mean amplitudes after normalization: ' + str(10**(np.nanmean(amps[idx]))))
                amps = 10**(amps)
                H.root.sol000.amplitude000.val[:] = amps
                H.flush()
                H.close()
            else:    
                axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
                diraxis = axisn.index('dir')
                ampsfull =H.root.sol000.amplitude000.val[:]
                weightsfull = H.root.sol000.amplitude000.weight[:]
                for dir_id, direction in enumerate(directions):
                    print('Normalizing direction', direction, 'Axis entry number', axisn.index('dir'))
                    if diraxis == 0:
                        amps = ampsfull[dir_id, ...]
                        weights = weightsfull[dir_id, ...]
                    if diraxis == 1:
                        amps = ampsfull[:, dir_id, ...]
                        weights = weightsfull[:, dir_id, ...]
                    if diraxis == 2:
                        amps = ampsfull[:, :, dir_id, ...]
                        weights = weightsfull[:, :, dir_id, ...]
                    if diraxis == 3:
                        amps = ampsfull[:, :, :, dir_id, ...]
                        weights = weightsfull[:, :, :, dir_id, ...]
                    if diraxis == 4:
                        amps = ampsfull[:, :, :, :, dir_id, ...]
                        weights = weightsfull[:, :, :, :, dir_id, ...]
                   
                   
                    #amp[get_double_slice(amp, [antennaid, dirid], [antennaxis, diraxis])
                   
                    idx = np.where(weights != 0.0)
                    amps = np.log10(amps)
                    logger.info('Direction:' + str(dir_id) + '  ' + parmdbi + ' Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
                    print('Direction:' + str(dir_id) + '  ' + parmdbi + ' Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
                    amps = amps - (np.nanmean(amps[idx]))
                    logger.info('Direction:' + str(dir_id) + '  ' + parmdbi + ' Mean amplitudes after normalization: ' + str(10**(np.nanmean(amps[idx]))))
                    amps = 10**(amps)    

                    # put back vales in ampsfull
                    if diraxis == 0:
                        ampsfull[dir_id, ...] = amps
                    if diraxis == 1:
                        ampsfull[:, dir_id, ...] = amps
                    if diraxis == 2:
                        ampsfull[:, :, dir_id, ...] = amps
                    if diraxis == 3:
                        ampsfull[:, :, :, dir_id, ...] = amps
                    if diraxis == 4:
                        ampsfull[:, :, :, :, dir_id, ...] = amps
                H.root.sol000.amplitude000.val[:] = ampsfull
                H.flush()
                H.close()        
        return  # norm_per_ms

    if not has_dir:      
        for i, parmdbi in enumerate(parmdb):
            H = tables.open_file(parmdbi,mode='r')
            ampsfull = H.root.sol000.amplitude000.val[:]
            weightsfull = H.root.sol000.amplitude000.weight[:]
            idx = np.where(weightsfull != 0.0)
            logger.info(parmdbi + '  Normfactor: '+ str(10**(np.nanmean(np.log10(ampsfull[idx])))))
            if i == 0:
                amps = np.ndarray.flatten(ampsfull[idx])
            else:
                amps = np.concatenate((amps, np.ndarray.flatten(ampsfull[idx])),axis=0)

            H.close()
        normmin = (np.nanmean(np.log10(amps)))
        logger.info('Global normfactor: ' + str(10**normmin))
        # now write the new H5 files
        for parmdbi in parmdb:
            H = tables.open_file(parmdbi,mode='a')
            ampsfull = H.root.sol000.amplitude000.val[:]
            ampsfull = (np.log10(ampsfull)) - normmin
            ampsfull = 10**ampsfull
            H.root.sol000.amplitude000.val[:] = ampsfull
            H.flush()
            H.close()
    else:    
        for dir_id, direction in enumerate(directions):  
            for i, parmdbi in enumerate(parmdb):
                H = tables.open_file(parmdbi,mode='r')
                axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
                ampsfull = H.root.sol000.amplitude000.val[:]
                weightsfull = H.root.sol000.amplitude000.weight[:]
                diraxis = axisn.index('dir')  
                H.close() 
                if diraxis == 0:
                    ampsi = ampsfull[dir_id, ...]
                    weights = weightsfull[dir_id, ...]
                if diraxis == 1:
                    ampsi = ampsfull[:, dir_id, ...]
                    weights = weightsfull[:, dir_id, ...]
                if diraxis == 2:
                    ampsi = ampsfull[:, :, dir_id, ...]
                    weights = weightsfull[:, :, dir_id, ...]
                if diraxis == 3:
                    ampsi = ampsfull[:, :, :, dir_id, ...]
                    weights = weightsfull[:, :, :, dir_id, ...]
                if diraxis == 4:
                    ampsi = ampsfull[:, :, :, :, dir_id, ...]
                    weights = weightsfull[:, :, :, :, dir_id, ...]
                idx = np.where(weights != 0.0)
                if i == 0:
                    amps = np.ndarray.flatten(ampsi[idx])
                else:
                    amps = np.concatenate((amps, np.ndarray.flatten(ampsi[idx])),axis=0)
            normmin = (np.nanmean(np.log10(amps)))
            logger.info('Global normfactor directon:' +  str(dir_id) + ' ' + str(10**normmin))
            print('Global normfactor directon:' +  str(dir_id) + ' ' + str(10**normmin))
            for parmdbi in parmdb:
                H = tables.open_file(parmdbi,mode='a')
                axisn = H.root.sol000.amplitude000.val.attrs['AXES'].decode().split(',')
                ampsfull = H.root.sol000.amplitude000.val[:]
                diraxis = axisn.index('dir')
                # put back vales in ampsfull
                if diraxis == 0:
                    ampsfull[dir_id, ...] = (np.log10(ampsfull[dir_id, ...])) - normmin
                    ampsfull[dir_id, ...] = 10**ampsfull[dir_id, ...]
                if diraxis == 1:
                    ampsfull[:, dir_id, ...] = (np.log10(ampsfull[:, dir_id, ...])) - normmin
                    ampsfull[:, dir_id, ...] = 10**ampsfull[:, dir_id, ...]
                if diraxis == 2:
                    ampsfull[:, :, dir_id, ...] = (np.log10(ampsfull[:, :, dir_id, ...])) - normmin
                    ampsfull[:, :, dir_id, ...] = 10**ampsfull[:, :, dir_id, ...]
                if diraxis == 3:
                    ampsfull[:, :, :, dir_id, ...] = (np.log10(ampsfull[:, :, :, dir_id, ...])) - normmin
                    ampsfull[:, :, :, dir_id, ...] = 10**ampsfull[:, :, :, dir_id, ...]
                if diraxis == 4:
                    ampsfull[:, :, :, :, dir_id, ...] = (np.log10(ampsfull[:, :, :, :, dir_id, ...])) - normmin
                    ampsfull[:, :, :, :, dir_id, ...] = 10**ampsfull[:, :, :, :, dir_id, ...]
                H.root.sol000.amplitude000.val[:] = ampsfull
                H.flush()
                H.close()
    return           


def normamplitudes_old(parmdb, norm_per_ms=False):
    '''
    normalize amplitude solutions to one
    '''
    if norm_per_ms:
      for parmdbi in parmdb:
        H5 = h5parm.h5parm(parmdbi, readonly=False)
        amps =H5.getSolset('sol000').getSoltab('amplitude000').getValues()[0]
        weights = H5.getSolset('sol000').getSoltab('amplitude000').getValues(weight=True)[0]
        idx = np.where(weights != 0.0)

        amps = np.log10(amps)
        logger.info(parmdbi + ' Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
        amps = amps - (np.nanmean(amps[idx]))
        logger.info(parmdbi + ' Mean amplitudes after normalization: ' + str(10**(np.nanmean(amps[idx]))))
        amps = 10**(amps)

        H5.getSolset('sol000').getSoltab('amplitude000').setValues(amps)
        H5.close()
      return    

    if len(parmdb) == 1:
      H5 = h5parm.h5parm(parmdb[0], readonly=False)
      amps =H5.getSolset('sol000').getSoltab('amplitude000').getValues()[0]
      weights = H5.getSolset('sol000').getSoltab('amplitude000').getValues(weight=True)[0]
      idx = np.where(weights != 0.0)

      amps = np.log10(amps)
      logger.info('Mean amplitudes before normalization: ' + str(10**(np.nanmean(amps[idx]))))
      amps = amps - (np.nanmean(amps[idx]))
      logger.info('Mean amplitudes after normalization: ' + str(10**(np.nanmean(amps[idx]))))
      amps = 10**(amps)

      H5.getSolset('sol000').getSoltab('amplitude000').setValues(amps)
      H5.close()

    else:
      # amps = []  
      for i, parmdbi in enumerate(parmdb):
          H5 = h5parm.h5parm(parmdbi, readonly=True)
          ampsi = np.copy(H5.getSolset('sol000').getSoltab('amplitude000').getValues()[0])
          weights = H5.getSolset('sol000').getSoltab('amplitude000').getValues(weight=True)[0]
          idx = np.where(weights != 0.0)
          logger.info(parmdbi + '  Normfactor: '+ str(10**(np.nanmean(np.log10(ampsi[idx])))))
          if i == 0:
            amps = np.ndarray.flatten(ampsi[idx])
          else:
            amps = np.concatenate((amps, np.ndarray.flatten(ampsi[idx])),axis=0)

          # print np.shape(amps), parmdbi
          H5.close()
      normmin = (np.nanmean(np.log10(amps)))
      logger.info('Global normfactor: ' + str(10**normmin))
      # now write the new H5 files
      for parmdbi in parmdb:
         H5   = h5parm.h5parm(parmdbi, readonly=False)
         ampsi = np.copy(H5.getSolset('sol000').getSoltab('amplitude000').getValues()[0])
         ampsi = (np.log10(ampsi)) - normmin
         ampsi = 10**ampsi
         H5.getSolset('sol000').getSoltab('amplitude000').setValues(ampsi)
         H5.close()
    return


def checkforzerocleancomponents(imagenames):
    """ Check if something was cleaned, if not stop de script to avoid more obscure errors later

    Args:
        imagenames (list): List of model images to check for clean components.

    Returns:
        True if all model images are zero, False otherwise.
    """
    n_images = len(imagenames)
    n_zeros = 0
    for image_id, image in enumerate(imagenames):
        print("Check if there are non-zero pixels: ", image)
        hdul = fits.open(image)
        data = hdul[0].data
        if not np.any(data):  # this checks if all elements are 0.0
            print("Model image:", image, "contains only zeros.")
            n_zeros = n_zeros + 1
        hdul.close()
    if n_zeros == n_images:
        return True
    else:
        return False


def get_image_dynamicrange(image):
    '''
    get dynamic range of an image (peak over rms)
    '''
    print('Compute image dynamic range (peak over rms): ', image)
    hdul = fits.open(image)
    image_rms = findrms(np.ndarray.flatten(hdul[0].data))
    DR = np.nanmax(np.ndarray.flatten(hdul[0].data))/image_rms
    hdul.close()
    return DR


def removeneNaNfrommodel(imagenames):
    '''
    replace NaN/inf pixels values in WSCLEAN model images with zeros
    '''
    for image_id, image in enumerate(imagenames):
        print('remove NaN/Inf values from model: ', image)
        hdul = fits.open(image)
        data = hdul[0].data
        data[np.where(~np.isfinite(data))] = 0.0
        hdul[0].data = data
        hdul.writeto(image, overwrite=True)
        hdul.close()
    return


def removenegativefrommodel(imagenames):
    '''
    replace negative pixel values in WSCLEAN model images with zeros
    '''
    perseus = False
    A1795   = False
    A1795imlist = sorted(glob.glob('/net/nieuwerijn/data2/rtimmerman/A1795_HBA/A1795/selfcal/selfcal_pix0.15_wide-????-model.fits'))

    for image_id, image in enumerate(imagenames):
        print('remove negatives from model: ', image)
        hdul = fits.open(image)
        data = hdul[0].data

        data[np.where(data < 0.0)] = 0.0
        hdul[0].data = data
        hdul.writeto(image, overwrite=True)
        hdul.close()

        if perseus:
          run('python /net/rijn/data2/rvweeren/LoTSS_ClusterCAL/editmodel.py {} /net/ouderijn/data2/rvweeren/PerseusHBA/inner_ring_j2000.reg /net/ouderijn/data2/rvweeren/PerseusHBA/outer_ring_j2000.reg'.format(image))
         # run('python /net/rijn/data2/rvweeren/LoTSS_ClusterCAL/editmodel.py ' + image)
        if A1795: 
          cmdA1795 = 'python /net/rijn/data2/rvweeren/LoTSS_ClusterCAL/insert_highres.py '
          cmdA1795 +=  image + ' '
          cmdA1795 +=  A1795imlist[image_id] + ' '
          cmdA1795 += '/net/rijn/data2/rvweeren/LoTSS_ClusterCAL/A1795core.reg '
          print(cmdA1795)
          run(cmdA1795)

    return

def parse_facetdirections(facetdirections,selfcalcycle, args=None):
    '''
       parse the facetdirections.txt file and return a list of facet directions
       for the given selfcalcycle. In the future, this function should also return a 
       list of solints, nchans and other things 
    '''
    data = ascii.read(facetdirections, format='commented_header', comment="\s*#")
    ra,dec = data['RA'],data['DEC']
    try:
      start = data['start']
    except KeyError:
      start = np.zeros(len(ra))
    try:
      solints = data['solints']
    except KeyError:
      solints = None
    try:
      soltypelist_includedir = data['soltypelist_includedir']
    except KeyError:
      soltypelist_includedir = None
      
    # Only select ra/dec which are if they are in the selfcalcycle range
    a = np.where((start <= selfcalcycle))[0]
    rasel = ra[a]
    decsel = dec[a]

    if soltypelist_includedir is not None and args is not None:
        soltypelist_includedir_sel_tmp = soltypelist_includedir[a]
        
    
        # create 2D array booleans
        soltypelist_includedir_sel = np.zeros((len(rasel),len(args['soltype_list'])), dtype=bool)
        for dir_id in range(len(rasel)):
            #print(dir_id, soltypelist_includedir_sel_tmp[dir_id])
            soltypelist_includedir_sel[dir_id,:] = ast.literal_eval(soltypelist_includedir_sel_tmp[dir_id])
    
    PatchPositions_array = np.zeros((len(rasel),2))
    PatchPositions_array[:,0] = (rasel*units.deg).to(units.rad).value
    PatchPositions_array[:,1] = (decsel*units.deg).to(units.rad).value

    if solints is not None:
      solintsel = solints[a]
      if soltypelist_includedir is not None:
        return PatchPositions_array,[ast.literal_eval(solint) for solint in solintsel], soltypelist_includedir_sel
      else:  
        return PatchPositions_array,[ast.literal_eval(solint) for solint in solintsel], None
    else:
      if soltypelist_includedir is not None:
        return PatchPositions_array, None, soltypelist_includedir_sel
      else:
        return PatchPositions_array, None, None

def prepare_DDE(imagebasename, selfcalcycle, mslist, imsize, pixelscale, \
                channelsout, args, numClusters=0, facetdirections=None, \
                DDE_predict='DP3', restart=False, disable_IDG_DDE_predict=True, \
                telescope='LOFAR', dde_skymodel=None, targetFlux=2.0,skyview=None, \
                fitspectralpol=3,disable_primary_beam=False, wscleanskymodel=None, \
                skymodel=None):

   if telescope == 'LOFAR' and not disable_IDG_DDE_predict:
      idg = True # predict WSCLEAN with beam using IDG (wsclean facet mode with h5 is not efficient here)
   else:
      idg = False

   solints, soltypelist_includedir = create_facet_directions(imagebasename,selfcalcycle,\
                                     targetFlux=targetFlux, ms=mslist[0], imsize=imsize, \
                                     pixelscale=pixelscale, numClusters=numClusters,\
                                     facetdirections=facetdirections, restart=restart, args=args)  

   # --- start CREATE facets.fits -----
   # remove previous facets.fits if needed
   if os.path.isfile('facets.fits'):
     os.system ('rm -f facets.fits')  
   if skyview==None:
     if not restart and wscleanskymodel is None and skymodel is None:
        os.system('cp ' + imagebasename + str(selfcalcycle).zfill(3) +'-MFS-image.fits' + ' facets.fits')   
     if not restart and wscleanskymodel is not None:
        #os.system('cp ' + glob.glob(wscleanskymodel + '-????-*model*.fits')[0] + ' facets.fits')
        create_empty_fitsimage(mslist[0], int(imsize), float(pixelscale), 'facets.fits')
     if not restart and skymodel is not None: 
        create_empty_fitsimage(mslist[0], int(imsize), float(pixelscale), 'facets.fits')
   else:
     os.system('cp ' + skyview + ' facets.fits')   

   if restart: # in that case we also have a previous image avaialble
      os.system('cp ' + imagebasename + str(selfcalcycle-1).zfill(3) +'-MFS-image.fits' + ' facets.fits')   
   #else:
   #   if selfcalcycle == 0 and wscleanskymodel is not None: 
   #     os.system('cp ' + glob.glob(wscleanskymodel + '-????-*model*.fits')[0] + ' facets.fits')
        
      #else:
      #  os.system('cp ' + imagebasename + str(selfcalcycle).zfill(3) +'-MFS-image.fits' + ' facets.fits')   
   # --- end CREATE facets.fits -----


   # FILL in facets.fits with values, every facets get a constant value, for lsmtool
   hdu=fits.open('facets.fits')
   hduflat = flatten(hdu)
   region = pyregion.open('facets.reg')
   for facet_id, facet in enumerate(region):
       region[facet_id:facet_id+1].write('facet' + str(facet_id) + '.reg') # split facet from region file
       r = pyregion.open('facet' + str(facet_id) + '.reg')
       manualmask = r.get_mask(hdu=hduflat)
       if len(hdu[0].data.shape) == 4:
          hdu[0].data[0][0][np.where(manualmask == True)] = facet_id
       else:
          hdu[0].data[np.where(manualmask == True)] = facet_id
   hdu.writeto('facets.fits',overwrite=True)


   if restart: 
      # restart with DDE_predict=DP3 because then only the variable modeldatacolumns is made
      # So the wsclean predict step is skipped in makeimage but modeldatacolumns is created
      modeldatacolumns = makeimage(mslist, imagebasename + str(selfcalcycle).zfill(3), \
                                pixelscale, imsize, channelsout, predict=True, \
                                onlypredict=True, facetregionfile='facets.reg', \
                                DDE_predict='DP3',\
                                disable_primarybeam_image=disable_primary_beam, \
                                disable_primarybeam_predict=disable_primary_beam,\
                                fulljones_h5_facetbeam=not args['single_dual_speedup'])
      # selfcalcycle-1 because makeimage has not yet produced an image at this point
      if fitspectralpol > 0 and DDE_predict == 'DP3':
         dde_skymodel = groupskymodel(imagebasename + str(selfcalcycle-1).zfill(3) + \
                                   '-sources.txt', 'facets.fits') 
      else: 
         dde_skymodel = 'dummy.skymodel' # no model exists if spectralpol is turned off
   elif skyview is not None:
      modeldatacolumns = makeimage(mslist, imagebasename + str(selfcalcycle).zfill(3), \
                              pixelscale, imsize, channelsout, predict=True, \
                              onlypredict=True, facetregionfile='facets.reg', \
                              DDE_predict=DDE_predict,\
                              disable_primarybeam_image=disable_primary_beam, \
                              disable_primarybeam_predict=disable_primary_beam,\
                              fulljones_h5_facetbeam=not args['single_dual_speedup'])
      if fitspectralpol > 0:
         dde_skymodel = groupskymodel(imagebasename, 'facets.fits')  # imagebasename
      else: 
         dde_skymodel = 'dummy.skymodel' # no model exists if spectralpol is turned off
   
   elif wscleanskymodel is not None: # DDE wscleanskymodel solve at the start
      
      nonpblist = glob.glob(wscleanskymodel + '-????-model.fits')
      pblist = glob.glob(wscleanskymodel + '-????-model-pb.fits')
      
      if len(pblist) > 0 :
        channelsout_forpredict = len(pblist)
      else:   
        channelsout_forpredict = len(nonpblist)
        
      modeldatacolumns = makeimage(mslist, wscleanskymodel, \
                                pixelscale, imsize, channelsout_forpredict, predict=True, \
                                onlypredict=True, facetregionfile='facets.reg', \
                                DDE_predict='WSCLEAN', idg=idg, \
                                disable_primarybeam_image=disable_primary_beam, \
                                disable_primarybeam_predict=disable_primary_beam, \
                                fulljones_h5_facetbeam=not args['single_dual_speedup'])
      # assume there is no model for DDE wscleanskymodel solve at the start
      # since we are making image000 afterwards anyway setting a dummy now is ok
      dde_skymodel = 'dummy.skymodel' 
      print(modeldatacolumns)
   else: 
      modeldatacolumns = makeimage(mslist, imagebasename + str(selfcalcycle).zfill(3), \
                                pixelscale, imsize, channelsout, predict=True, \
                                onlypredict=True, facetregionfile='facets.reg', \
                                DDE_predict=DDE_predict, idg=idg, \
                                disable_primarybeam_image=disable_primary_beam, \
                                disable_primarybeam_predict=disable_primary_beam, \
                                fulljones_h5_facetbeam=not args['single_dual_speedup'])
      if fitspectralpol > 0 and DDE_predict == 'DP3':
         dde_skymodel = groupskymodel(imagebasename + str(selfcalcycle).zfill(3)  + \
                                   '-sources.txt', 'facets.fits')
      else:
         dde_skymodel = 'dummy.skymodel' # no model exists if spectralpol is turned off
   # check if -pb version of source list exists
   # needed because image000 does not have a pb version as no facet imaging is used, however, if IDG is used it does exist and hence the following does also handfle that
   if telescope == 'LOFAR' and wscleanskymodel is None: # not for MeerKAT because WSCclean still has a bug if no primary beam is used, for now assume we do not use a primary beam for MeerKAT
      if os.path.isfile(imagebasename + str(selfcalcycle).zfill(3)  + \
                        '-sources-pb.txt'):
         if fitspectralpol > 0:
            dde_skymodel = groupskymodel(imagebasename + str(selfcalcycle).zfill(3)  + \
                                      '-sources-pb.txt', 'facets.fits')
         else:
            dde_skymodel = 'dummy.skymodel' # no model exists if spectralpol is turned off
   
   return modeldatacolumns, dde_skymodel, solints, soltypelist_includedir
   
def groupskymodel(skymodelin, facetfitsfile, skymodelout=None):   
   import lsmtool
   print('Loading:', skymodelin)
   LSM = lsmtool.load(skymodelin)
   LSM.group(algorithm='facet', facet=facetfitsfile)
   if skymodelout is not None: 
      LSM.write(skymodelout, clobber=True)
      return skymodelout
   else:
      LSM.write('grouped_' + skymodelin, clobber=True)
      return 'grouped_' + skymodelin


def create_facet_directions(imagename, selfcalcycle, targetFlux=1.0, ms=None, imsize=None, \
                            pixelscale=None, numClusters=0, weightBySize=False, \
                            facetdirections=None, imsizemargin=100, restart=False, \
                            args=None):
   '''
   create a facet region file based on an input image or file provided by the user
   if there is an image use lsmtool tessellation algorithm 

   This function also returns the solints obtained out of the facetdirections file (if avail). It is up to 
   the function that calls this to do something with it or not.
   ''' 
   # groupalgorithm =
   solints = None # initialize, if not filled then this is not used here and the settings are taken from facetselfcal argsparse
   soltypelist_includedir = None  # initialize
   if facetdirections is not None:
     try:
       PatchPositions_array,solints, soltypelist_includedir = parse_facetdirections(facetdirections,selfcalcycle,args=args)
     except:
       try:
         f = open(facetdirections, 'rb')
         PatchPositions_array = pickle.load(f)
         f.close()
       except: 
         raise Exception('Trouble read file format:' + facetdirections) 
     print(PatchPositions_array)

     # write new facetdirections.p file
     if os.path.isfile('facetdirections.p'):
         os.system('rm -f facetdirections.p')  
     f = open('facetdirections.p', 'wb')
     pickle.dump(PatchPositions_array,f)
     f.close()
     
     # generate polygon composite regions file for WSClean imaging
     # in case of a restart this is not done, and the old facets.reg is kept
     # using the old facets.reg is important in case we change the number of facet directions, so the that first image after the restart is done with the old directions (and the h5file used was made using that)
     if ms is not None and imsize is not None and pixelscale is not None and not restart:
         cmd = 'python ds9facetgenerator.py '
         cmd += '--ms=' + ms + ' '
         cmd += '--h5=facetdirections.p --imsize=' + str(imsize+imsizemargin) +' --pixelscale=' + str(pixelscale)
         run(cmd)
     return solints, soltypelist_includedir
   elif selfcalcycle==0:
     # Only run this if selfcalcycle==0 [elif]
     # Try to load previous facetdirections.skymodel
     import lsmtool  
     if 'skymodel' not in imagename:
      img = bdsf.process_image(imagename + str(selfcalcycle).zfill(3) +'-MFS-image.fits',mean_map='zero', rms_map=True, rms_box = (160,40))  
      img.write_catalog(format='bbs', bbs_patches=None, outfile='facetdirections.skymodel', clobber=True)
     else:
      os.system('cp -r {} facetdirections.skymodel'.format(imagename))
     LSM = lsmtool.load('facetdirections.skymodel')
     
     if numClusters > 0:
        LSM.group(algorithm='cluster',numClusters=numClusters)
     else:
        LSM.group(algorithm='tessellate', targetFlux=str(targetFlux) +' Jy',weightBySize=weightBySize)
     
     print('Number of directions', len(LSM.getPatchPositions()))
     PatchPositions = LSM.getPatchPositions()
   
     PatchPositions_array = np.zeros( (len(LSM.getPatchPositions()),2) )
   
     for patch_id, patch in enumerate(PatchPositions.keys()):
       PatchPositions_array[patch_id,0] = PatchPositions[patch][0].to(units.rad).value # RA
       PatchPositions_array[patch_id,1] = PatchPositions[patch][1].to(units.rad).value # Dec
     # else: PatchPostioins=LSM.load('facetdirections.skymodel').getPatchPositions)  
     # Run code below for if and elif
     if os.path.isfile('facetdirections.p'):
         os.system('rm -f facetdirections.p')  
     f = open('facetdirections.p', 'wb')
     pickle.dump(PatchPositions_array,f)
     f.close()
     
    # generate polygon composite regions file for WSClean imaging 
     if ms is not None and imsize is not None and pixelscale is not None:
         cmd = 'python ds9facetgenerator.py '
         cmd += '--ms=' + ms + ' '
         cmd += '--h5=facetdirections.p --imsize=' + str(imsize+imsizemargin) +' --pixelscale=' + str(pixelscale)
         run(cmd)
     return solints, soltypelist_includedir
   else:
    return solints, soltypelist_includedir

def split_facetdirections(facetregionfile):
   '''
   split composite facet region file into individual polygon region files 
   ''' 
   r = pyregion.open(facetregionfile)   
   for facet_id, facet in enumerate(r):
     r[facet_id:facet_id+1].write('facet' + str(facet_id) + '.reg')  
   return  


def mask_region_inv(infilename,ds9region,outfilename):

    hdu=fits.open(infilename)
    hduflat = flatten(hdu)
    map=hdu[0].data

    r = pyregion.open(ds9region)
    manualmask = r.get_mask(hdu=hduflat)
    hdu[0].data[0][0][np.where(manualmask == False)] = 0.0
    hdu.writeto(outfilename,overwrite=True)
    return

def mask_region(infilename,ds9region,outfilename):

    hdu=fits.open(infilename)
    hduflat = flatten(hdu)
    map=hdu[0].data

    r = pyregion.open(ds9region)
    manualmask = r.get_mask(hdu=hduflat)
    hdu[0].data[0][0][np.where(manualmask == True)] = 0.0
    hdu.writeto(outfilename,overwrite=True)
    return


def flatten(f):
    """ Flatten a fits file so that it becomes a 2D image. Return new header and data """

    naxis=f[0].header['NAXIS']
    if naxis==2:
        return fits.PrimaryHDU(header=f[0].header,data=f[0].data)

    w = WCS(f[0].header)
    wn=WCS(naxis=2)
    
    wn.wcs.crpix[0]=w.wcs.crpix[0]
    wn.wcs.crpix[1]=w.wcs.crpix[1]
    wn.wcs.cdelt=w.wcs.cdelt[0:2]
    wn.wcs.crval=w.wcs.crval[0:2]
    wn.wcs.ctype[0]=w.wcs.ctype[0]
    wn.wcs.ctype[1]=w.wcs.ctype[1]
    
    header = wn.to_header()
    header["NAXIS"]=2
    copy=('EQUINOX','EPOCH','BMAJ', 'BMIN', 'BPA', 'RESTFRQ', 'TELESCOP', 'OBSERVER')
    for k in copy:
        r=f[0].header.get(k)
        if r is not None:
            header[k]=r

    slice=[]
    for i in range(naxis,0,-1):
        if i<=2:
            slice.append(np.s_[:],)
        else:
            slice.append(0)
        
    hdu = fits.PrimaryHDU(header=header,data=f[0].data[tuple(slice)])
    return hdu


def remove_outside_box(mslist, imagebasename,  pixsize, imsize, \
                       channelsout, single_dual_speedup=True, \
                       outcol='SUBTRACTED_DATA', dysco=True, userbox=None, \
                       idg=False, h5list=[], facetregionfile=None, \
                       disable_primary_beam=False):
   # get imageheader to check frequency
   hdul = fits.open(imagebasename + '-MFS-image.fits')
   header = hdul[0].header

   if len(h5list) != 0:
      datacolumn = 'DATA' # for DDE
   else:
      datacolumn = 'CORRECTED_DATA'
   
   if (header['CRVAL3'] < 500e6): # means we have LOFAR?, just a random value here
      boxsize = 1.5 # degr   
   if (header['CRVAL3'] > 500e6) and (header['CRVAL3'] < 1.0e9): # UHF-band
      boxsize = 3.0 # degr   
   if (header['CRVAL3'] >= 1.0e9) and (header['CRVAL3'] < 1.7e9): # L-band
      boxsize = 2.0 # degr
   if (header['CRVAL3'] >= 1.7e9) and (header['CRVAL3'] < 4.0e9): # S-band
      boxsize = 1.5 # degr  
  
  
   # create square box file templatebox.reg
   region_string = """
   # Region file format: DS9 version 4.1
   global color=green dashlist=8 3 width=1 font="helvetica 10 normal roman" select=1
   fk5
   box(137.2868914,-9.6412498,7200.000",7200.000",0)
   """
   r = pyregion.parse(region_string)
   r.write('templatebox.reg')
   r = pyregion.open('templatebox.reg')
   r[0].coord_list[0] = header['CRVAL1'] # units degr
   r[0].coord_list[1] = header['CRVAL2'] # units degr
   r[0].coord_list[2] = boxsize # units degr
   r[0].coord_list[3] = boxsize # units degr
   r.write('templatebox.reg')
   
   # predict the model non-DDE case
   if len(h5list) == 0:
      if userbox is None:
         makeimage(mslist, imagebasename, pixsize, imsize, \
                   channelsout, onlypredict=True, squarebox='templatebox.reg', \
                   idg=idg, disable_primarybeam_predict=disable_primary_beam,\
                   fulljones_h5_facetbeam=not single_dual_speedup)
         phaseshiftbox = 'templatebox.reg'
      else:
         if userbox != 'keepall':
            makeimage(mslist, imagebasename, pixsize, imsize, \
                      channelsout, onlypredict=True, squarebox=userbox, \
                      idg=idg,  disable_primarybeam_predict=disable_primary_beam, \
                      fulljones_h5_facetbeam=not single_dual_speedup) 
            phaseshiftbox = userbox
         else:  
            phaseshiftbox = None # so option keepall was set by the user
   else: # so this we are in DDE mode as h5list is not empty
      if userbox is None:
         makeimage(mslist, imagebasename, pixsize, imsize, \
                   channelsout, onlypredict=True, squarebox='templatebox.reg', \
                   idg=idg, h5list=h5list, facetregionfile=facetregionfile, \
                    disable_primarybeam_predict=disable_primary_beam, \
                    fulljones_h5_facetbeam=not single_dual_speedup)
         phaseshiftbox = 'templatebox.reg'
      else:
         if userbox != 'keepall':
            makeimage(mslist, imagebasename, pixsize, imsize, \
                      channelsout, onlypredict=True, squarebox=userbox, \
                      idg=idg, h5list=h5list, facetregionfile=facetregionfile, \
                       disable_primarybeam_predict=disable_primary_beam, \
                       fulljones_h5_facetbeam=not single_dual_speedup) 
            phaseshiftbox = userbox
         else:  
            phaseshiftbox = None # so option keepall was set by the user
   # write new data column (if keepall was not set) where rest of the field outside the box is removed
   if phaseshiftbox is not None:
      stepsize = 100000
      for ms in mslist:
         # check if outcol exists, if not create it with DP3 
         t = pt.table(ms)
         colnames = t.colnames()
         t.close()
         if outcol not in colnames:
            cmd = 'DP3 msin=' + ms + ' msout=. steps=[] msout.datacolumn=' + outcol + ' '
            cmd += 'msin.datacolumn='+ datacolumn + ' '
            if dysco:
               cmd += 'msout.storagemanager=dysco'
               cmd += 'msout.storagemanager.weightbitrate=16 '
            print(cmd)
            run(cmd)
         t = pt.table(ms, readonly=False)
         for row in range(0,t.nrows(),stepsize):
            print("Doing {} out of {}, (step: {})".format(row, t.nrows(), stepsize))
            data = t.getcol(datacolumn,startrow=row,nrow=stepsize,rowincr=1)
            model = t.getcol('MODEL_DATA', startrow=row,nrow=stepsize,rowincr=1)
            t.putcol(outcol, data-model, startrow=row,nrow=stepsize,rowincr=1)
         t.close()
      average(mslist, freqstep=[1]*len(mslist), timestep=1, \
              phaseshiftbox=phaseshiftbox, dysco=dysco,makesubtract=True,\
              dataincolumn=outcol)
   else: # so have have "keepall", no subtract, just a copy
      average(mslist, freqstep=[1]*len(mslist), timestep=1, \
              phaseshiftbox=phaseshiftbox, dysco=dysco,makesubtract=True,\
              dataincolumn=datacolumn)     

   return  

def is_scallar_array_forwsclean(h5list):
  is_scalar = True # set to True as a start, this also catches cases where last pol. dimension is missing
  for h5 in h5list:
     H5 = tables.open_file(h5,mode='r')
     try:
        phase = H5.root.sol000.phase000.val[:] # time, freq, ant, dir, pol
        if not np.array_equal(phase[:,:,:,:,0],phase[:,:,:,:,-1]):
           is_scalar = False
     except:
        pass
     try:
        amplitude = H5.root.sol000.amplitude000.val[:] # time, freq, ant, dir, pol
        if not np.array_equal(amplitude[:,:,:,:,0],amplitude[:,:,:,:,-1]):
           is_scalar = False
     except:
        pass
     H5.close()
  return is_scalar

def makeimage(mslist, imageout, pixsize, imsize, channelsout, niter=100000, robust=-0.5, \
              uvtaper=None, multiscale=False, predict=True, onlypredict=False, fitsmask=None, \
              idg=False, uvminim=80, fitspectralpol=3, \
              imager='WSCLEAN', restoringbeam=15, automask=2.5, \
              removenegativecc=True, usewgridder=True, paralleldeconvolution=0, \
              deconvolutionchannels=0, parallelgridding=1, multiscalescalebias=0.8, \
              fullpol=False, taperinnertukey=None, gapchanneldivision=False, \
              uvmaxim=None, h5list=[], facetregionfile=None, squarebox=None, \
              DDE_predict='WSCLEAN', localrmswindow=0, DDEimaging=False, \
              wgridderaccuracy=1e-4, nosmallinversion=False, multiscalemaxscales=0, \
              stack=False, disable_primarybeam_predict=False, disable_primarybeam_image=False, \
              facet_beam_update_time=120, groupms_h5facetspeedup=False, \
              singlefacetpredictspeedup=True, forceimagingwithfacets=True, ddpsfgrid=None, \
              fulljones_h5_facetbeam=False):
    '''
    forceimagingwithfacets (bool): force imaging with facetregionfile (facets.reg) even if len(h5list)==0, in this way we can still get a primary beam correction per facet and this image can be use for a DDE predict with the same type of beam correction (this is useful for making image000 when there are no DDE h5 corrections yet and we do not want to use IDG)
    '''
    if '-model-column' in subprocess.check_output(['wsclean'], text=True):    
      predict_inmodelcol = True
    else:
      predict_inmodelcol = False

    
    fitspectrallogpol = False # for testing Perseus
    msliststring = ' '.join(map(str, mslist))
    if idg:
      parallelgridding=1
    t = pt.table(mslist[0] + '/OBSERVATION', ack=False)
    telescope = t.getcol('TELESCOPE_NAME')[0] 
    t.close()

    if telescope != 'LOFAR' and not onlypredict and facetregionfile is not None:
      nosmallinversion = True

    #  --- DI predict only without facets ---
    # for example to subtract region of sky for the --remove-outside-center option
    if onlypredict and facetregionfile is None:
      if predict:
        if squarebox is not None:
           for model in sorted(glob.glob(imageout + '-????-*model*.fits')):
              print (model, 'box_' + model)
              mask_region(model,squarebox,'box_' + model)  
        
        cmd = 'wsclean -predict '
        #if not usewgridder and not idg:
        #  cmd += '-padding 1.8 '
        if channelsout > 1:
          cmd += '-channels-out ' + str(channelsout) + ' '
          if gapchanneldivision:
            cmd += '-gap-channel-division '
        if idg:
          cmd += '-gridder idg -idg-mode cpu '
          if not disable_primarybeam_predict:
            if telescope == 'LOFAR':
              cmd += '-grid-with-beam -use-differential-lofar-beam '
              cmd += '-beam-aterm-update ' + str(facet_beam_update_time) + ' '
          #cmd += '-pol iquv '
          cmd += '-pol i '
          cmd += '-padding 1.8 '
        else:
          if usewgridder:
            cmd += '-gridder wgridder '
            cmd += '-wgridder-accuracy ' + str(wgridderaccuracy) + ' '
            if nosmallinversion:
              cmd += '-no-min-grid-resolution ' #'-no-small-inversion '  
          if parallelgridding > 1:
            cmd += '-parallel-gridding ' + str(parallelgridding) + ' '
        
        if squarebox is None:
           cmd += '-name ' + imageout + ' ' + msliststring
        else:
           cmd += '-name ' + 'box_' + imageout + ' ' + msliststring
        print('PREDICT STEP: ', cmd)
        run(cmd)
      return
    #  --- end predict only ---


    #  --- DDE-NO-FACET-LOOP CORRUPT-predict, so everything ends up in MODEL_DATA and is corrupted
    # for example for --remove-outside-center option with --DDE
    if onlypredict and facetregionfile is not None and predict and squarebox is not None:
        # do the masking
        for model in sorted(glob.glob(imageout + '-????-*model*.fits')):
          print (squarebox, model, 'box_' + model)
          mask_region(model,squarebox,'box_' + model)  
              
        # predict with wsclean
        cmd = 'wsclean -predict '
        #if not usewgridder and not idg:
        #  cmd += '-padding 1.8 '
        if channelsout > 1:
          cmd += '-channels-out ' + str(channelsout) + ' '
          if gapchanneldivision:
            cmd += '-gap-channel-division '
        if idg:
          cmd += '-gridder idg -idg-mode cpu '
          if not disable_primarybeam_predict:
            if telescope == 'LOFAR':        
              cmd += '-grid-with-beam -use-differential-lofar-beam '
              cmd += '-beam-aterm-update ' + str(facet_beam_update_time) + ' '
          #cmd += '-pol iquv '
          cmd += '-pol i '
          cmd += '-padding 1.8 '
        else:
          if usewgridder:
            cmd += '-gridder wgridder '
            cmd += '-wgridder-accuracy ' + str(wgridderaccuracy) + ' '
            if nosmallinversion:
              cmd += '-no-min-grid-resolution '  # '-no-small-inversion ' 
          if parallelgridding > 1:
            cmd += '-parallel-gridding ' + str(parallelgridding) + ' '
      
        cmd += '-facet-regions ' + facetregionfile  + ' '
        cmd += '-apply-facet-solutions ' + ','.join(map(str, h5list)) + ' amplitude000,phase000 '
        
        if not fulljones_h5_facetbeam:
          if not is_scallar_array_forwsclean(h5list):
            cmd += '-diagonal-visibilities ' # different XX and YY solutions
          else:    
            cmd += '-scalar-visibilities ' # scalar solutions
            
        if telescope == 'LOFAR':
          if not disable_primarybeam_predict:
            cmd += '-apply-facet-beam -facet-beam-update ' + str(facet_beam_update_time) + ' '
            cmd += '-use-differential-lofar-beam '
      
        cmd += '-name box_' + imageout + ' ' + msliststring
        if DDE_predict == 'WSCLEAN':
          print('DDE PREDICT STEP: ', cmd)
          run(cmd)
        return 
    #  --- NO-FACET-LOOP end DDE CORRUPT-predict only ---


    #  --- DDE-FACET-LOOP predict, so all facets are predicted  ---
    #  --- each facet gets its own model column ---
    if onlypredict and facetregionfile is not None and predict:
      # step 1 open facetregionfile
      modeldatacolumns_list=[]
      r = pyregion.open(facetregionfile)   
      for facet_id, facet in enumerate(r):
        r[facet_id:facet_id+1].write('facet' + str(facet_id) + '.reg') # split facet from region file
     
        # step 2 mask outside of region file
        if not singlefacetpredictspeedup: # not needed, because WSClean will do the facet cutting
          for model in sorted(glob.glob(imageout + '-????-*model*.fits')):
            modelout = 'facet_' + model
            if DDE_predict == 'WSCLEAN':
              print (model, modelout)
              mask_region_inv(model,'facet' + str(facet_id) + '.reg',modelout)
        
        # step 3 predict with wsclean
        cmd = 'wsclean -predict '
        if predict_inmodelcol: # directly predict the right column name
          cmd += '-model-column MODEL_DATA_DD' + str(facet_id) + ' '
        #if not usewgridder and not idg:
        #  cmd += '-padding 1.8 '
        if channelsout > 1:
          cmd += '-channels-out ' + str(channelsout) + ' '
          if gapchanneldivision:
            cmd += '-gap-channel-division '
        if idg:
          cmd += '-gridder idg -idg-mode cpu '
          if not disable_primarybeam_predict:
            if telescope == 'LOFAR':        
              cmd += '-grid-with-beam -use-differential-lofar-beam '
              cmd += '-beam-aterm-update ' + str(facet_beam_update_time) + ' '
          #cmd += '-pol iquv '
          cmd += '-pol i '
          cmd += '-padding 1.8 '
        else:
          if usewgridder:
            cmd += '-gridder wgridder '
            cmd += '-wgridder-accuracy ' + str(wgridderaccuracy) + ' '
            if nosmallinversion:
              cmd += '-no-min-grid-resolution ' # '-no-small-inversion ' 
          if parallelgridding > 1:
            cmd += '-parallel-gridding ' + str(parallelgridding) + ' '
        
        # NEW CODE FOR SPEEDUP
        if singlefacetpredictspeedup:
          cmd += '-facet-regions ' + 'facet' + str(facet_id) + '.reg'  + ' '
          if telescope == 'LOFAR':
            if not disable_primarybeam_predict:
              cmd += '-apply-facet-beam -facet-beam-update ' +str(facet_beam_update_time)  + ' '
              cmd += '-use-differential-lofar-beam '
              if not fulljones_h5_facetbeam:
                 #cmd += '-diagonal-visibilities ' # different XX and YY solutions
                 cmd += '-scalar-visibilities ' # scalar solutions
                  
          cmd += '-name ' + imageout + ' ' + msliststring
        else:
          cmd += '-name facet_' + imageout + ' ' + msliststring
        
        
        if DDE_predict == 'WSCLEAN':
          print('DDE PREDICT STEP: ', cmd)
          run(cmd)
       
        # step 4 copy over to MODEL_DATA_DDX
        for ms in mslist:
          cmddppp = 'DP3 msin=' + ms + ' msin.datacolumn=MODEL_DATA msout=. steps=[] '
          cmddppp += 'msout.datacolumn=MODEL_DATA_DD' +str(facet_id)  
          if DDE_predict == 'WSCLEAN' and not predict_inmodelcol:
            run(cmddppp)
        modeldatacolumns_list.append('MODEL_DATA_DD' +str(facet_id))
      
      return modeldatacolumns_list
    #  --- end DDE predict only ---


    # ----- MAIN IMAGING PART ------
    os.system('rm -f ' + imageout + '-*.fits')
    imcol = 'CORRECTED_DATA'
    # check for all ms in mslist
    # situation can be that only some ms have CORRECTED_DATA based on what happens in the beamcor
    # so some ms can have a beam correction and others not
    # for example because of different directions where the beam was applied
    for ms in mslist:
      t = pt.table(ms,readonly=True, ack=False) 
      colnames =t.colnames()
      if 'CORRECTED_DATA' not in colnames: # for first imaging run
         imcol = 'DATA'
      t.close()
    
    baselineav = str (1.5e3*60000.*2.*np.pi *1.5/(24.*60.*60*float(imsize)) )

    if imager == 'WSCLEAN':
      cmd = 'wsclean '
      cmd += '-no-update-model-required ' 
      cmd += '-minuv-l ' + str(uvminim) + ' '
      if uvmaxim is not None:
         cmd += '-maxuv-l ' + str(uvmaxim) + ' '  
      cmd += '-size ' + str(int(imsize)) + ' ' + str(int(imsize)) + ' -reorder '
      if type(robust) is not str:
         cmd += '-weight briggs ' + str(robust) 
      else:
         cmd += '-weight ' + str(robust)
      #cmd += ' -clean-border 1 ' # not needed anymore for WSCleand
      cmd += ' -parallel-reordering 4 '
      # -weighting-rank-filter 3 -fit-beam
      cmd += '-mgain 0.8 -data-column ' + imcol + ' '
      #if not usewgridder and not idg:
      #  cmd += '-padding 1.4 '
      if channelsout > 1:
        cmd += ' -join-channels -channels-out ' + str(channelsout) + ' '
        if gapchanneldivision:
          cmd += '-gap-channel-division '
      if paralleldeconvolution > 0:
        cmd += '-parallel-deconvolution ' +  str(paralleldeconvolution) + ' '
      if parallelgridding > 1:
        cmd += '-parallel-gridding ' + str(parallelgridding) + ' '
      if deconvolutionchannels > 0 and channelsout > 1:
        cmd += '-deconvolution-channels ' +  str(deconvolutionchannels) + ' '
      if automask > 0.5:
        cmd += '-auto-mask '+ str(automask)  + ' -auto-threshold 0.5 ' # to avoid automask 0
      if localrmswindow > 0:
        cmd += '-local-rms-window ' + str(localrmswindow) + ' '

      if ddpsfgrid is not None:
        cmd += '-dd-psf-grid ' + str(ddpsfgrid) + ' ' +  str(ddpsfgrid) + ' '

      if multiscale:
         # cmd += '-multiscale '+' -multiscale-scales 0,4,8,16,32,64 -multiscale-scale-bias 0.6 '
         # cmd += '-multiscale '+' -multiscale-scales 0,6,12,16,24,32,42,64,72,128,180,256,380,512,650 '
         cmd += '-multiscale '
         cmd += '-multiscale-scale-bias ' + str(multiscalescalebias) + ' '
         if multiscalemaxscales == 0:
           cmd += '-multiscale-max-scales ' + str(int(np.rint(np.log2(float(imsize)) -3))) + ' '
         else: # use value set by user
           cmd += '-multiscale-max-scales ' + str(int(multiscalemaxscales)) + ' '
      if fitsmask is not None and fitsmask != 'nofitsmask':
        if os.path.isfile(fitsmask):
          cmd += '-fits-mask '+ fitsmask + ' '
        else:
          print('fitsmask: ', fitsmask, 'does not exist')
          raise Exception('fitsmask does not exist')
      if uvtaper is not None:
         cmd += '-taper-gaussian ' + uvtaper + ' '
      if taperinnertukey is not None:
         cmd += '-taper-inner-tukey ' + str(taperinnertukey) + ' '

      if (fitspectralpol > 0) and not (fullpol):
         cmd += '-save-source-list '

      if (fitspectralpol > 0) and (channelsout > 1) and not (fullpol):
        if fitspectrallogpol:
          cmd += '-fit-spectral-log-pol ' + str(fitspectralpol) + ' '
        else:
          cmd += '-fit-spectral-pol ' + str(fitspectralpol) + ' '
      if idg:
        cmd += '-gridder idg -idg-mode cpu '
        if not disable_primarybeam_image:
          if telescope == 'LOFAR':
            cmd += '-grid-with-beam -use-differential-lofar-beam '
            cmd += '-beam-aterm-update ' + str(facet_beam_update_time) + ' '
        #cmd += '-pol iquv -link-polarizations i '
        cmd += '-pol i '
        cmd += '-padding 1.4 '
      else:
        if fullpol:
          cmd += '-pol iquv -join-polarizations '
        else:
          cmd += '-pol i '
        if len(h5list) == 0 and facetregionfile is None: # only use baseline-averaging without facets
          #if not forceimagingwithfacets:
          cmd += '-baseline-averaging ' + baselineav + ' '
        if usewgridder:
          cmd += '-gridder wgridder '
          cmd += '-wgridder-accuracy ' + str(wgridderaccuracy) + ' '
          if nosmallinversion:
            cmd += '-no-min-grid-resolution ' #'-no-small-inversion ' 

      if len(h5list) > 0:
         cmd += '-facet-regions ' + facetregionfile  + ' '
         if groupms_h5facetspeedup and len(mslist) > 1:
            mslist_concat, h5list_concat = concat_ms_wsclean_facetimaging(mslist, h5list=h5list, concatms=False)
            cmd += '-apply-facet-solutions ' + ','.join(map(str, h5list_concat)) + ' '
            cmd += ' amplitude000,phase000 '
         else:
            cmd += '-apply-facet-solutions ' + ','.join(map(str, h5list)) + ' amplitude000,phase000 '
            
         if not fulljones_h5_facetbeam:
           if not is_scallar_array_forwsclean(h5list):
             cmd += '-diagonal-visibilities ' # different XX and YY solutions
           else:    
             cmd += '-scalar-visibilities ' # scalar solutions
                  
         if telescope == 'LOFAR':
            if not disable_primarybeam_image:
               cmd += '-apply-facet-beam -facet-beam-update ' + str(facet_beam_update_time) + ' '
               cmd += '-use-differential-lofar-beam '
      elif forceimagingwithfacets and facetregionfile is not None: # so h5list is zero, but we still want facet imaging
         cmd += '-facet-regions ' + facetregionfile  + ' '
         if telescope == 'LOFAR' and not disable_primarybeam_image:
            cmd += '-apply-facet-beam -facet-beam-update ' + str(facet_beam_update_time) + ' '
            cmd += '-use-differential-lofar-beam '
            if not fulljones_h5_facetbeam:
              #cmd += '-diagonal-visibilities ' # different XX and YY solutions
              cmd += '-scalar-visibilities ' # scalar solutions
      else:
         if telescope == 'LOFAR' and not check_phaseup_station(mslist[0]) and not idg:
            if not disable_primarybeam_image:
               cmd += '-apply-primary-beam -use-differential-lofar-beam '
               cmd += '-facet-beam-update ' + str(facet_beam_update_time) + ' '

      cmd += '-name ' + imageout + ' -scale ' + str(pixsize) + 'arcsec ' 
      if len(h5list) > 0 and groupms_h5facetspeedup and len(mslist) > 1:
         msliststring_concat = ' '.join(map(str, mslist_concat))
         print('WSCLEAN: ', cmd + '-nmiter 12 -niter ' + str(niter) + ' ' + msliststring_concat)
         logger.info(cmd + ' -niter ' + str(niter) + ' ' + msliststring_concat)
         run(cmd + '-nmiter 12 -niter ' + str(niter) + ' ' + msliststring_concat)
      else:
         print('WSCLEAN: ', cmd + '-nmiter 12 -niter ' + str(niter) + ' ' + msliststring)
         logger.info(cmd + ' -niter ' + str(niter) + ' ' + msliststring)
         run(cmd + '-nmiter 12 -niter ' + str(niter) + ' ' + msliststring)


      # REMOVE nagetive model components, these are artifacts (only for Stokes I)
      if removenegativecc:
        if idg:
            removenegativefrommodel(sorted(glob.glob(imageout +'-????-*model*.fits')))  # only Stokes I
        else:
            removenegativefrommodel(sorted(glob.glob(imageout + '-????-*model*.fits')))

      # Remove NaNs from array (can happen if certain channels from channels-out are flagged, or from -apply-facet-beam far into the sidelobes)
      if idg:
        removeneNaNfrommodel(glob.glob(imageout +'-????-*model*.fits'))  # only Stokes I
      else:
        removeneNaNfrommodel(glob.glob(imageout + '-????-*model*.fits'))

      # Check is anything was cleaned. If not, stop the selfcal to avoid obscure errors later
      if channelsout > 1: 
        model_allzero = checkforzerocleancomponents(glob.glob(imageout +'-????-*model*.fits'))  # only Stokes I
      else:
        model_allzero = checkforzerocleancomponents(glob.glob(imageout + '-*model*.fits'))
      if model_allzero:
          logger.error("All channel maps models were zero: Stopping the selfcal")
          print("All channel maps models were zero: Stopping the selfcal")
          sys.exit(0)

      if predict and len(h5list) == 0 and not DDEimaging: 
        # we check for DDEimaging to avoid a predict for image000 in a --DDE run
        # because at that moment there is no h5list yet and this avoids an unnecessary DI-type predict 
        cmd = 'wsclean -predict ' #-size '
        #cmd += str(int(imsize)) + ' ' + str(int(imsize)) +  ' -predict '
        #if not usewgridder and not idg:
        #   cmd += '-padding 1.8 ' 
        if channelsout > 1:
          cmd += '-channels-out ' + str(channelsout) + ' '
          if gapchanneldivision:
            cmd += '-gap-channel-division '
        if idg:
          cmd += '-gridder idg -idg-mode cpu '
          if telescope == 'LOFAR':
            if not disable_primarybeam_predict:
              cmd += '-grid-with-beam -use-differential-lofar-beam '
              cmd += '-beam-aterm-update ' + str(facet_beam_update_time) + ' '
          #cmd += '-pol iquv '
          cmd += '-pol i '
          cmd += '-padding 1.8 ' 
        else:
          if usewgridder:
            cmd += '-gridder wgridder '  
            cmd += '-wgridder-accuracy ' + str(wgridderaccuracy) + ' '
            if nosmallinversion:
              cmd += '-no-min-grid-resolution ' # '-no-small-inversion ' 
          if parallelgridding > 1:
            cmd += '-parallel-gridding ' + str(parallelgridding) + ' '

        # needs multi-col predict
        #if h5 is not None:
        #   cmd += '-facet-regions ' + facetregionfile  + ' '
        #   cmd += '-apply-facet-solutions ' + h5 + ' amplitude000,phase000 '
        #   if telescope == 'LOFAR':
        #      cmd += '-apply-facet-beam -facet-beam-update 600 -use-differential-lofar-beam '
        #      cmd += '-diagonal-solutions '
        
        cmd += '-name ' + imageout + ' -scale ' + str(pixsize) + 'arcsec ' + msliststring
        print('PREDICT STEP: ', cmd)
        run(cmd)


    if imager == 'DDFACET':
        makemslist(mslist)
        # restoringbeam = '15'
        cmd = 'DDF.py --Data-MS=mslist.txt --Deconv-PeakFactor=0.001 --Data-ColName=' + imcol + ' ' + \
              '--Parallel-NCPU=32 --Output-Mode=Clean --Deconv-CycleFactor=0 ' + \
              '--Deconv-MaxMinorIter=' + str(niter) + ' --Deconv-MaxMajorIter=5 ' + \
              '--Deconv-Mode=SSD --Weight-Robust=' + str(robust) + ' --Image-NPix=' + str(int(imsize)) + ' ' + \
              '--CF-wmax=50000 --CF-Nw=100 --Beam-Model=None --Beam-LOFARBeamMode=A --Beam-NBand=1 ' + \
              '--Output-Also=onNeds --Image-Cell=' + str(pixsize) + ' --Facets-NFacets=1 --Freq-NDegridBand=1 ' + \
              '--Deconv-RMSFactor=3.0 --Deconv-FluxThreshold=0.0 --Data-Sort=1 --Cache-Dir=. --Freq-NBand=2 ' + \
              '--GAClean-MinSizeInit=10 --Facets-DiamMax=1.5 --Facets-DiamMin=0.1 ' + \
              '--Cache-Dirty=auto --Weight-ColName=WEIGHT_SPECTRUM --Output-Name=' + imageout + ' ' + \
              '--Comp-BDAMode=1 --DDESolutions-DDModeGrid=AP --DDESolutions-DDModeDeGrid=AP --Cache-Reset=1 ' + \
              '--RIME-ForwardMode=BDA-degrid --Predict-ColName=MODEL_DATA --Selection-UVRange=[0.1,2000.] ' + \
              '--Output-RestoringBeam=' + str(restoringbeam) + ' --Mask-SigTh=5.0 '
        if fitsmask is not None and fitsmask != 'nofitsmask':
           cmd += '--Mask-External=' + fitsmask + ' --Mask-Auto=0 '
        else:
           cmd += '--Mask-Auto=1 '

        print(cmd)
        run(cmd)


def smearing_bandwidth(r, th, nu, dnu):
    ''' Returns the left over intensity I/I0 after bandwidth smearing.
    Args:
        r (float or Astropy Quantity): distance from the phase center in arcsec.
        th (float or Astropy Quantity): angular resolution in arcsec.
        nu (float): observing frequency.
        dnu (float): averaging frequency.
    '''
    r = r + 1e-9 # Add a tiny offset to prevent division by zero.
    I = (np.sqrt(np.pi) / (2 * np.sqrt(np.log(2)))) * ((th * nu) / (r * dnu)) * scipy.special.erf(np.sqrt(np.log(2)) * ((r * dnu) / (th * nu)))
    return I

def smearing_time(r, th, t):
    ''' Returns the left over intensity I/I0 after time smearing.
    Args:
        r (float or Astropy Quantity): distance from the phase center in arcsec.
        th (float or Astropy Quantity): angular resolution in arcsec.
        t (float): averaging time in seconds.
    '''
    r = r + 1e-9 # Add a tiny offset to prevent division by zero.
    
    I = 1 - 1.22e-9 * (r / th) ** 2 * t ** 2
    return I

def smearing_time_ms(msin, t):
    res = get_resolution(msin)
    r_dis = 3600.*compute_distance_to_pointingcenter(msin, returnval=True, dologging=False)
    return smearing_time(r_dis, res, t)
    
def flag_smeared_data(msin):
   Ismear = smearing_time_ms(msin, get_time_preavg_factor_LTAdata(msin))  
   if Ismear < 0.5:
     print('Smeared', Ismear)
     #uvmaxflag(msin, uvmax)
   
   #uvmax = get_uvwmax(ms)
   t = pt.table(msin + '/SPECTRAL_WINDOW', ack=False)
   freq = np.median(t.getcol('CHAN_FREQ'))
   #print('Central freq [MHz]', freq/1e6, 'Longest baselines [km]', uvmax/1e3)
   t.close()
   
   
   t = get_time_preavg_factor_LTAdata(msin)
   r_dis = 3600.*compute_distance_to_pointingcenter(msin, returnval=True, dologging=False)
   
   flagval = None
   for uvrange in list(np.arange(100e3,5000e3, 10e3)):
      res = 1.22*3600.*180.*((299792458./freq )/uvrange)/np.pi
      Ismear = smearing_time(r_dis, res, t)
      if Ismear > 0.968:
        flagval = uvrange  
      #print(uvrange,Ismear)
   print('Data above', flagval/1e3,  'klambda is affected by time smearing')
   if flagval/1e3 < 650:
      print('Flagging data above uvmin value of [klambda]', msin, flagval/1e3)
      uvmaxflag(msin, flagval)  
   return


# this version corrupts the MODEL_DATA column
def calibrateandapplycal(mslist, selfcalcycle, args, solint_list, nchan_list, \
              soltype_list, soltypecycles_list, smoothnessconstraint_list, \
              smoothnessreffrequency_list, smoothnessspectralexponent_list, \
              smoothnessrefdistance_list, \
              antennaconstraint_list, resetsols_list, resetdir_list, normamps_list, \
              BLsmooth_list, uvmin=0, \
              normamps=False, normamps_per_ms=False, skymodel=None, \
              predictskywithbeam=False, restoreflags=False, flagging=False, \
              longbaseline=False, flagslowphases=True, \
              flagslowamprms=7.0, flagslowphaserms=7.0, skymodelsource=None, \
              skymodelpointsource=None, wscleanskymodel=None, iontimefactor=0.01, \
              ionfreqfactor=1.0, blscalefactor=1.0, dejumpFR=False, uvminscalarphasediff=0, \
              docircular=False, mslist_beforephaseup=None, dysco=True, blsmooth_chunking_size=8, \
              gapchanneldivision=False, modeldatacolumns=[], dde_skymodel=None, \
              DDE_predict='WSCLEAN', QualityBasedWeights=False, QualityBasedWeights_start=5, \
              QualityBasedWeights_dtime=10.,QualityBasedWeights_dfreq=5., telescope='LOFAR',\
              ncpu_max=24, mslist_beforeremoveinternational=None, soltypelist_includedir=None):

   ## --- start STACK code ---
   if args['stack']:
     # create MODEL_DATA because in case it does not exist, happens under these conditions
     # only for first (=0) selfcalcycle cycle and if user provides a model
     if ((skymodel is not None) or (skymodelpointsource is not None) \
         or (wscleanskymodel is not None)) and selfcalcycle == 0:
       for ms_id, ms in enumerate(mslist): # do the predicts (only used for stacking)   
         print('Doing sky predict for stacking...') 
         if skymodel is not None and type(skymodel) is str:
           predictsky(ms, skymodel, modeldata='MODEL_DATA', predictskywithbeam=predictskywithbeam, sources=skymodelsource)
         if skymodel is not None and type(skymodel) is list:
           predictsky(ms, skymodel[ms_id], modeldata='MODEL_DATA', predictskywithbeam=predictskywithbeam, sources=skymodelsource)
         if wscleanskymodel is not None and type(wscleanskymodel) is str:
           makeimage([ms], wscleanskymodel, 1., 1., \
                     len(glob.glob(wscleanskymodel + '-????-model.fits')),\
                     0, 0.0, onlypredict=True, idg=False, \
                     gapchanneldivision=gapchanneldivision, \
                     fulljones_h5_facetbeam=not args['single_dual_speedup'])
         if wscleanskymodel is not None and type(wscleanskymodel) is list:
           makeimage([ms], wscleanskymodel[ms_id], 1., 1., \
                     len(glob.glob(wscleanskymodel[ms_id] + '-????-model.fits')),\
                     0, 0.0, onlypredict=True, idg=False, \
                     gapchanneldivision=gapchanneldivision,\
                     fulljones_h5_facetbeam=not args['single_dual_speedup'])   

         if skymodelpointsource is not None and type(skymodelpointsource) is float :
           # create MODEL_DATA (no dysco!)
           run('DP3 msin=' + ms + ' msout=. msout.datacolumn=MODEL_DATA steps=[]',log=True)
           # do the predict with taql
           run("taql" + " 'update " + ms + " set MODEL_DATA[,0]=(" + str(skymodelpointsource)+ "+0i)'",log=True)
           run("taql" + " 'update " + ms + " set MODEL_DATA[,3]=(" + str(skymodelpointsource)+ "+0i)'",log=True)
           run("taql" + " 'update " + ms + " set MODEL_DATA[,1]=(0+0i)'",log=True)
           run("taql" + " 'update " + ms + " set MODEL_DATA[,2]=(0+0i)'",log=True)

         if skymodelpointsource is not None and type(skymodelpointsource) is list :
           # create MODEL_DATA (no dysco!)
           run('DP3 msin=' + ms + ' msout=. msout.datacolumn=MODEL_DATA steps=[]',log=True)
           # do the predict with taql
           run("taql" + " 'update " + ms + " set MODEL_DATA[,0]=(" + str(skymodelpointsource[ms_id])+ "+0i)'",log=True)
           run("taql" + " 'update " + ms + " set MODEL_DATA[,3]=(" + str(skymodelpointsource[ms_id])+ "+0i)'",log=True)
           run("taql" + " 'update " + ms + " set MODEL_DATA[,1]=(0+0i)'",log=True)
           run("taql" + " 'update " + ms + " set MODEL_DATA[,2]=(0+0i)'",log=True)


     # do the stack and normalization
     stackwrapper(mslist, msout='stack.MS', column_to_normalise='DATA')
     mslist_orig = mslist[:] # so we can use it for the applycal
     mslist = ['stack.MS']
     
     # set MODEL_DATA to point source in stack
     t = pt.table('stack.MS', ack=False)
     if 'MODEL_DATA' not in t.colnames():
       t.close()
       run('DP3 msin=stack.MS msout=. msout.datacolumn=MODEL_DATA steps=[]', log=True)
     else:
       t.close()
     print('Predict point source for stack.MS')
     # do the predict with taql
     run("taql" + " 'update stack.MS set MODEL_DATA[,0]=(1.0+ +0i)'", log=True)
     run("taql" + " 'update stack.MS set MODEL_DATA[,3]=(1.0+ +0i)'", log=True)
     run("taql" + " 'update stack.MS set MODEL_DATA[,1]=(0+0i)'", log=True)
     run("taql" + " 'update stack.MS set MODEL_DATA[,2]=(0+0i)'", log=True)
     
     print(mslist, mslist_orig)
     
     # set all these to None to avoid skymodel predicts in runDPPPbase()
     skymodelpointsource = None
     wscleanskymodel = None
     skymodel = None
   ## --- end STACK code ---     
    

   if len(modeldatacolumns) > 1:
     merge_all_in_one = False
   else:
     merge_all_in_one = True

   single_pol_merge = False

   soltypecycles_list_array = np.array(soltypecycles_list) # needed to slice (slicing does not work in nested l
   pertubation = [] # len(mslist)
   for ms in mslist:
     pertubation.append(False)

   parmdbmergelist =  [[] for x in range(len(mslist))]   #  [[],[],[],[]] nested list length mslist used for Jurjen's h5_merge
   # LOOP OVER THE ENTIRE SOLTYPE LIST (so includes pertubations via a pre-applycal)
   for soltypenumber, soltype in enumerate(soltype_list):
     # SOLVE LOOP OVER MS
     parmdbmslist = []
     for msnumber, ms in enumerate(mslist):
       # check we are above far enough in the selfcal to solve for the extra pertubation
       if selfcalcycle >= soltypecycles_list[soltypenumber][msnumber]:
         print('selfcalcycle, soltypenumber',selfcalcycle, soltypenumber)
         if (soltypenumber < len(soltype_list)-1):

           print(selfcalcycle,soltypecycles_list[soltypenumber+1][msnumber])
           print('_______________________')
           print(soltypecycles_list_array,soltypenumber,len(soltypecycles_list_array))
           print('Array soltypecycles_list ahead',soltypecycles_list_array[soltypenumber+1:len(soltypecycles_list_array[:,0]),msnumber])
           # if (selfcalcycle >= soltypecycles_list[soltypenumber+1][msnumber]): # this looks one soltype ahead...hmmm, not good 
           if selfcalcycle >= np.min(soltypecycles_list_array[soltypenumber+1:len(soltypecycles_list_array[:,0]),msnumber]): # this looks all soltype ahead   
             pertubation[msnumber] = True
           else:
             pertubation[msnumber] = False
         else:
           pertubation[msnumber] = False

         if ((skymodel is not None) or (skymodelpointsource is not None) or (wscleanskymodel is not None)) and selfcalcycle == 0:
           parmdb = soltype + str(soltypenumber) + '_skyselfcalcyle' + str(selfcalcycle).zfill(3) + '_' + os.path.basename(ms) + '.h5'
         else:
           parmdb = soltype + str(soltypenumber) + '_selfcalcyle' + str(selfcalcycle).zfill(3) + '_' + os.path.basename(ms) + '.h5'

         # set create_modeldata to False it was already prediceted before
         create_modeldata = True 
         if soltypenumber >= 1:
            create_modeldata = False  
            
            #for tmpsoltype in ['complexgain', 'scalarcomplexgain', 'scalaramplitude',\
            #                   'amplitudeonly', 'phaseonly', \
            #                   'fulljones', 'rotation', 'rotation+diagonal', 'tec', 'tecandphase', 'scalarphase', \
            #                   'phaseonly_phmin', 'rotation_phmin', 'tec_phmin', \
            #                   'tecandphase_phmin', 'scalarphase_phmin', 'scalarphase_slope', 'phaseonly_slope']:
            #   if tmpsoltype in soltype_list[0:soltypenumber]:
            #      print('Previous solve already predicted MODEL_DATA, will skip that step', soltype, soltypenumber)
            #      create_modeldata = False  
         print(ms)
         print(solint_list)
         print(soltypenumber)
         print(msnumber)
         print(modeldatacolumns)
         runDPPPbase(ms, solint_list[soltypenumber][msnumber], nchan_list[soltypenumber][msnumber], parmdb, soltype, \
                     uvmin=uvmin, \
                     SMconstraint=smoothnessconstraint_list[soltypenumber][msnumber], \
                     SMconstraintreffreq=smoothnessreffrequency_list[soltypenumber][msnumber],\
                     SMconstraintspectralexponent=smoothnessspectralexponent_list[soltypenumber][msnumber],\
                     SMconstraintrefdistance=smoothnessrefdistance_list[soltypenumber][msnumber],\
                     antennaconstraint=antennaconstraint_list[soltypenumber][msnumber], \
                     resetsols=resetsols_list[soltypenumber][msnumber], \
                     resetsols_list = resetsols_list, \
                     resetdir=resetdir_list[soltypenumber][msnumber], \
                     restoreflags=restoreflags, flagging=flagging, skymodel=skymodel, \
                     flagslowphases=flagslowphases, flagslowamprms=flagslowamprms, \
                     flagslowphaserms=flagslowphaserms, \
                     predictskywithbeam=predictskywithbeam, BLsmooth=BLsmooth_list[soltypenumber][msnumber], skymodelsource=skymodelsource, \
                     skymodelpointsource=skymodelpointsource, wscleanskymodel=wscleanskymodel,\
                     iontimefactor=iontimefactor, ionfreqfactor=ionfreqfactor, blscalefactor=blscalefactor, dejumpFR=dejumpFR, uvminscalarphasediff=uvminscalarphasediff, create_modeldata=create_modeldata, \
                     selfcalcycle=selfcalcycle, dysco=dysco, blsmooth_chunking_size=blsmooth_chunking_size, gapchanneldivision=gapchanneldivision, soltypenumber=soltypenumber,\
                     clipsolutions=args['clipsolutions'], clipsolhigh=args['clipsolhigh'],\
                     clipsollow=args['clipsollow'], uvmax=args['uvmax'],modeldatacolumns=modeldatacolumns, preapplyH5_dde=parmdbmergelist[msnumber], dde_skymodel=dde_skymodel, DDE_predict=DDE_predict, telescope=telescope, ncpu_max=ncpu_max, soltype_list=soltype_list, DP3_dual_single=args['single_dual_speedup'], soltypelist_includedir=soltypelist_includedir, normamps=normamps)

         parmdbmslist.append(parmdb)
         parmdbmergelist[msnumber].append(parmdb) # for h5_merge

     # NORMALIZE amplitudes
     if normamps and (soltype in ['complexgain','scalarcomplexgain','rotation+diagonal',\
                                  'rotation+diagonalamplitude','rotation+scalar',\
                                  'rotation+scalaramplitude','amplitudeonly','scalaramplitude']) and len(parmdbmslist) > 0:
       print('Doing global amplitude-type normalization')
       
       #[soltypenumber][msnumber] msnumber=0 is ok because we  do all ms at once
       if normamps_list[soltypenumber][0] == 'normamps':  # 
          print('Performing global amplitude normalization')
          normamplitudes(parmdbmslist, norm_per_ms=normamps_per_ms) # list of h5 for different ms, all same soltype

       if normamps_list[soltypenumber][0] == 'normamps_per_ant':
          print('Performing global amplitude normalization per antenna')
          normamplitudes_withmatrix(parmdbmslist)
     
       if normamps_list[soltypenumber][0] == 'normslope':
          print('Performing global slope normalization')
          normslope_withmatrix(parmdbmslist)
          
       if normamps_list[soltypenumber][0] == 'normslope+normamps':
          print('Performing global slope normalization')
          normslope_withmatrix(parmdbmslist) # first do the slope
          normamplitudes(parmdbmslist, norm_per_ms=normamps_per_ms)
          
       if normamps_list[soltypenumber][0] == 'normslope+normamps_per_ant':
          print('Performing global slope normalization')
          normslope_withmatrix(parmdbmslist) # first do the slope
          normamplitudes_withmatrix(parmdbmslist)        
        
         
     # APPLYCAL or PRE-APPLYCAL or CORRUPT
     count = 0
     for msnumber, ms in enumerate(mslist):
       if selfcalcycle >= soltypecycles_list[soltypenumber][msnumber]: #
         print(pertubation[msnumber], parmdbmslist[count], msnumber, count)
         if pertubation[msnumber]: # so another solve follows after this
           if soltypenumber == 0:
             if len(modeldatacolumns) > 1:
               if DDE_predict == 'WSCLEAN':
                 corrupt_modelcolumns(ms, parmdbmslist[count], modeldatacolumns) # for DDE
             else:  
               corrupt_modelcolumns(ms, parmdbmslist[count], ['MODEL_DATA']) # saves disk space
           else:
             if len(modeldatacolumns) > 1:
               if DDE_predict == 'WSCLEAN':
                 corrupt_modelcolumns(ms, parmdbmslist[count], modeldatacolumns) # for DDE
             else:
               corrupt_modelcolumns(ms, parmdbmslist[count], ['MODEL_DATA']) # saves disk space
         else: # so this is the last solve, no other pertubation
           # note we reverse ([::-1]) the solution tables here because we switch from a corrupt approach to a correct. This is important as fulljones and diagonal solutions do not commute
           applycal(ms, parmdbmergelist[msnumber][::-1], msincol='DATA', msoutcol='CORRECTED_DATA',\
                    dysco=dysco, modeldatacolumns=modeldatacolumns) # saves disks space
         count = count + 1 # extra counter because parmdbmslist can have less length than mslist as soltypecycles_list goes per ms

   wsclean_h5list = []

   # merge all solutions 
   if True:
     # import h5_merger
     for msnumber, ms in enumerate(mslist):
       if ((skymodel is not None) or (skymodelpointsource is not None) or (wscleanskymodel is not None)) and selfcalcycle == 0:
         parmdbmergename = 'merged_skyselfcalcyle' + str(selfcalcycle).zfill(3) + '_' + os.path.basename(ms) + '.h5'
         parmdbmergename_pc = 'merged_skyselfcalcyle' + str(selfcalcycle).zfill(3) + '_linearfulljones_' + os.path.basename(ms) + '.h5'
       else:
         parmdbmergename = 'merged_selfcalcyle' + str(selfcalcycle).zfill(3) + '_' + os.path.basename(ms) + '.h5'
         parmdbmergename_pc = 'merged_selfcalcyle' + str(selfcalcycle).zfill(3) + '_linearfulljones_' + os.path.basename(ms) + '.h5' 
       if os.path.isfile(parmdbmergename):
         os.system('rm -f ' + parmdbmergename)
       if os.path.isfile(parmdbmergename_pc):
         os.system('rm -f ' + parmdbmergename_pc)
       wsclean_h5list.append(parmdbmergename)  

       # add extra from preapplyH5_list
       if args['preapplyH5_list'][0] is not None:
         preapplyh5parm = time_match_mstoH5(args['preapplyH5_list'], ms)
         # replace the source direction coordinates so that the merge goes correctly
         copy_over_sourcedirection_h5(parmdbmergelist[msnumber][0], preapplyh5parm)
         parmdbmergelist[msnumber].append(preapplyh5parm)
        

       if is_scallar_array_forwsclean(parmdbmergelist[msnumber]):
         single_pol_merge = True
       else:  
         single_pol_merge = False
       
       # remove this once h5 merger is fixed
       if not merge_all_in_one: # so only for a DDE solve
          fix_h5(parmdbmergelist[msnumber])
       
       print(parmdbmergename,parmdbmergelist[msnumber],ms)
       h5_merger.merge_h5(h5_out=parmdbmergename,h5_tables=parmdbmergelist[msnumber][::-1],ms_files=ms,\
                          convert_tec=True, merge_all_in_one=merge_all_in_one, \
                          propagate_flags=True, single_pol=single_pol_merge)
       # add CS stations back for superstation
       if mslist_beforephaseup is not None:
         print('mslist_beforephaseup: ' + mslist_beforephaseup[msnumber])
         if is_scallar_array_forwsclean([parmdbmergename]):
           single_pol_merge = True 
         else:
           single_pol_merge = False 
         h5_merger.merge_h5(h5_out=parmdbmergename.replace("selfcalcyle",\
                            "addCS_selfcalcyle"),h5_tables=parmdbmergename, \
                            ms_files=mslist_beforephaseup[msnumber], convert_tec=True, merge_all_in_one=merge_all_in_one, single_pol=single_pol_merge, \
                            propagate_flags=True, add_cs=True)

       # make LINEAR solutions from CIRCULAR (never do a single_pol merge here!)
       if ('scalarphasediff' in soltype_list) or ('scalarphasediffFR' in soltype_list) or docircular:
         h5_merger.merge_h5(h5_out=parmdbmergename_pc, h5_tables=parmdbmergename, circ2lin=True, propagate_flags=True)
         # add CS stations back for superstation
         if mslist_beforephaseup is not None:
           h5_merger.merge_h5(h5_out=parmdbmergename_pc.replace("selfcalcyle",\
                              "addCS_selfcalcyle"),h5_tables=parmdbmergename_pc, \
                              ms_files=mslist_beforephaseup[msnumber], convert_tec=True, merge_all_in_one=merge_all_in_one, \
                              propagate_flags=True, add_cs=True)


       if False:
         # testing only to check if merged H5 file is correct and makes a good image
         applycal(ms, parmdbmergename, msincol='DATA',msoutcol='CORRECTED_DATA', dysco=dysco)

       # plot merged solution file
       losotoparset = create_losoto_flag_apgridparset(ms, flagging=False, \
                            medamp=medianamp(parmdbmergename), \
                            outplotname=parmdbmergename.split('_' + os.path.basename(ms) + '.h5')[0], \
                            refant=findrefant_core(parmdbmergename),\
                            fulljones=fulljonesparmdb(parmdbmergename), onepol=single_pol_merge)
       run('losoto ' + parmdbmergename + ' ' + losotoparset)
       force_close(parmdbmergename)
   
   if QualityBasedWeights and selfcalcycle >= QualityBasedWeights_start:
     for ms in mslist:       
       run('python3 NeReVar.py --filename=' + ms +\
           ' --dt=' + str(QualityBasedWeights_dtime) + ' --dnu=' + str(QualityBasedWeights_dfreq) +\
            ' --DiagDir=plotlosoto' + ms + '/NeReVar/ --basename=_selfcalcycle' + str(selfcalcycle).zfill(3) + ' --modelcol=MODEL_DATA')

   ## --- start STACK code ---
   if args['stack']:
     for ms in mslist_orig:
       applycal(ms, parmdbmergename, msincol='DATA',msoutcol='CORRECTED_DATA', dysco=dysco)
       # note parmdbmergename should alwats be correct since we only had one MS (stack.MS) and so it does only "loop" over one MS. 
   ## --- end STACK code ---
   
   if len(modeldatacolumns) > 0:
      np.save('wsclean_h5list.npy', wsclean_h5list)
      return wsclean_h5list
   else:
      return []


def is_binary(file_name):
    ''' Check if a file contains text (and thus is a skymodel file, for example).
    Example from https://stackoverflow.com/questions/2472221/how-to-check-if-a-file-contains-plain-text
    Args:
        file_name (str): path to the file to determine the binary nature of.
    Returns:
        result (bool): returns whether the file is binary (True) or not (False).
    '''
    try:
      import magic
    except:
      return False # if magic is not installed just assume this is not a binary
    f = magic.Magic(mime=True)
    mime = f.from_file(file_name)
    if 'text' in mime:
        return False
    else:
        return True


def predictsky_wscleanfits(ms, imagebasename, usewgridder=True, \
                           wgridderaccuracy=1e-4, nosmallinversion=False):
    '''
    Predict the sky from model channels fits images (from a previous run, so frequencies need to overlap)
    '''
    channelsout = len(glob.glob(imagebasename + '-????-model.fits'))
    cmd = 'wsclean -channels-out '+ str(channelsout)+ ' -pol i '
    if usewgridder:
       cmd += '-gridder wgridder '
       cmd += '-wgridder-accuracy ' + str(wgridderaccuracy) + ' '
       if nosmallinversion:
          cmd += '-no-min-grid-resolution ' #'-no-small-inversion ' 
    else:
       cmd += '-padding 1.8 ' 
    cmd+= '-name ' + imagebasename + ' -predict ' + ms
    print(cmd)
    run(cmd)
    time.sleep(1)
    return


def predictsky(ms, skymodel, modeldata='MODEL_DATA', predictskywithbeam=False, sources=None,beamproximitylimit=240.0):

   cmd = 'DP3 numthreads='+str(multiprocessing.cpu_count())+ ' msin=' + ms + ' msout=. '
   cmd += 'p.sourcedb=' + skymodel + ' steps=[p] p.type=predict msout.datacolumn=' + modeldata + ' '
   if sources is not None:
      cmd += 'p.sources=[' + str(sources) + '] '
   if predictskywithbeam:
      cmd += 'p.usebeammodel=True p.usechannelfreq=True p.beammode=array_factor '
      cmd += 'p.beamproximitylimit=' + str(beamproximitylimit) + ' '

   print(cmd)
   run(cmd)

def updatemodelcols_includedir(modeldatacolumns, soltypenumber, soltypelist_includedir, ms, dryrun=False):
   modeldatacolumns_solve = []
   modeldatacolumns_notselected = []
   id_kept = []
   id_removed = []
   
   f = open('facetdirections.p', 'rb')
   sourcedir = pickle.load(f) # units are radian
   f.close()
   assert sourcedir.shape[0] == len(modeldatacolumns)
   assert soltypenumber < soltypelist_includedir.shape[1] 
   assert len(modeldatacolumns) == soltypelist_includedir.shape[0] 

   soltypelist_includedir_sel = soltypelist_includedir[:,soltypenumber] # select the correct soltype pertubation
   assert soltypelist_includedir_sel.sum() > 0 # some element must be True

   if soltypelist_includedir_sel.sum() == len(modeldatacolumns): # all are True, trivial case
      return modeldatacolumns, sourcedir, id_kept
    
   # step 1 remove columns from list that should not be solved
   for modelcolumn_id, modelcolumn in enumerate(modeldatacolumns):
      if soltypelist_includedir_sel[modelcolumn_id]:
         modeldatacolumns_solve.append(modelcolumn)
         id_kept.append(modelcolumn_id)
      else:
         modeldatacolumns_notselected.append(modelcolumn)
         id_removed.append(modelcolumn_id)
   
   modeldatacolumns_solve_newnames = modeldatacolumns_solve[:]
   print('soltypelist_includedir_sel for this pertubation', soltypelist_includedir_sel)
   #print(modeldatacolumns_solve)
   #print('Not selected', modeldatacolumns_notselected)
   #print(id_kept)
   #print(id_removed)
   print('Removed these directions coordinates')
   print(sourcedir[id_removed][:])
   #print(sourcedir)
   #print(sourcedir[id_kept][:])
   #print(sourcedir.shape)
   #sourcedir_kept = sourcedir[id_kept][:]
   #sourcedir_removed = sourcedir[id_removed][:]
   #sys.exit()
 
   for removed_id in id_removed:  
      c1 = SkyCoord(sourcedir[removed_id,0]*units.radian, sourcedir[removed_id,1]* units.radian, frame='icrs') # removed source
      distance = 1e9 # just a big number, larger than 180 degr
      for kept_id in id_kept:
         c2 = SkyCoord(sourcedir[kept_id,0]*units.radian, sourcedir[kept_id,1]*units.radian, frame='icrs') # kept source, looping over to find the closest
         angsep = c1.separation(c2).to(units.degree)
         #print(kept_id, angsep.value, '[degree]')
         if angsep.value < distance:
           distance = angsep.value
           closest_kept_modelcol = modeldatacolumns[kept_id]
      print('Removed', modeldatacolumns[removed_id] ,'Closest kept is:', closest_kept_modelcol)    
      
      modeldatacolumns_solve_newnames[modeldatacolumns_solve.index(closest_kept_modelcol)] = modeldatacolumns_solve_newnames[modeldatacolumns_solve.index(closest_kept_modelcol)] + '+' + modeldatacolumns[removed_id].split('MODEL_DATA_DD')[1]
  
   
   #print(modeldatacolumns_solve_newnames)
   # DP3 to create the missing columns
   for modelcol in modeldatacolumns_solve_newnames:
      t = pt.table(ms, ack=False)
      colnames = t.colnames()
      t.close()
      if modelcol not in colnames:
         cmddppp = 'DP3 msin=' + ms + ' msin.datacolumn=MODEL_DATA_DD0 msout=. steps=[] ' # pick MODEL_DATA_DD0 because it always exists (note MODEL_DATA is not there anymore as a template with the new WSClean -model-column option
         cmddppp += 'msout.datacolumn=' + modelcol + ' '  
         print(cmddppp)
         if not dryrun:
           run(cmddppp)
   
   # taql to fill the missing columns
   for modelcol in modeldatacolumns_solve_newnames:  
      modeldatacolumns_taql_tmp =list(modelcol.split('+'))
      modeldatacolumns_taql = modeldatacolumns_taql_tmp[:]
      for mm_id, mm in enumerate(modeldatacolumns_taql_tmp):
        if mm_id > 0:
          modeldatacolumns_taql[mm_id] = 'MODEL_DATA_DD' + mm
      #print(modeldatacolumns_taql)
      colstr ='(' + '+'.join(map(str, modeldatacolumns_taql)) + ')'
      #print(colstr)
      
      if '+' in modelcol: # we have a composite column
         taqlcmd =  "taql" + " 'update " + ms + " set " + modelcol.replace("+", "\\+") + "=" + colstr + "'"
         print(taqlcmd)
         if not dryrun:
           run(taqlcmd)
   

   # create new column name MODEL_DATA_DDX+Y+Z with DP3
   # fill this column with taql
   
   # create modeldatacolumns_solve
   
   # return modeldatacolumns_solve
   
   
   return modeldatacolumns_solve_newnames, sourcedir[id_removed][:],id_kept

def runDPPPbase(ms, solint, nchan, parmdb, soltype, uvmin=1, \
                SMconstraint=0.0, SMconstraintreffreq=0.0, \
                SMconstraintspectralexponent=-1.0, SMconstraintrefdistance=0.0, antennaconstraint=None, \
                resetsols=None, resetsols_list=[None], resetdir=None, \
                resetdir_list=[None], restoreflags=False, \
                maxiter=100, tolerance=1e-4, flagging=False, skymodel=None, flagslowphases=True, \
                flagslowamprms=7.0, flagslowphaserms=7.0, incol='DATA', \
                predictskywithbeam=False, BLsmooth=False, skymodelsource=None, \
                skymodelpointsource=None, wscleanskymodel=None, iontimefactor=0.01, ionfreqfactor=1.0,\
                blscalefactor=1.0, dejumpFR=False, uvminscalarphasediff=0,selfcalcycle=0, dysco=True, blsmooth_chunking_size=8, gapchanneldivision=False, soltypenumber=0, create_modeldata=True, \
                clipsolutions=False, clipsolhigh=1.5, clipsollow=0.667, \
                ampresetvalfactor=10., uvmax=None, \
                modeldatacolumns=[], solveralgorithm='directioniterative', solveralgorithm_dde='directioniterative', preapplyH5_dde=[], \
                dde_skymodel=None, DDE_predict='WSCLEAN',telescope='LOFAR', beamproximitylimit=240.,\
                ncpu_max=24, bdaaverager=False, DP3_dual_single=True, soltype_list=None, soltypelist_includedir=None, normamps=True):

    soltypein = soltype # save the input soltype is as soltype could be modified (for example by scalarphasediff)

    modeldata = 'MODEL_DATA' # the default, update if needed for scalarphasediff and phmin solves
    if BLsmooth:
      t = pt.table(ms, ack=False)
      colnames = t.colnames()
      t.close()
      if 'SMOOTHED_DATA' not in colnames:
        print('python BLsmooth.py -n 8 -c '+ str(blsmooth_chunking_size) + ' -i '+ incol + ' -o SMOOTHED_DATA -f ' + str(iontimefactor) + \
                   ' -s ' + str(blscalefactor) + ' -u ' + str(ionfreqfactor) + ' ' + ms)
        run('python BLsmooth.py -n 8 -c '+ str(blsmooth_chunking_size) + ' -i '+ incol + ' -o SMOOTHED_DATA -f ' + str(iontimefactor) + \
                ' -s ' + str(blscalefactor) + ' -u ' + str(ionfreqfactor) + ' ' + ms)
      incol = 'SMOOTHED_DATA'


    if skymodel is not None and create_modeldata and selfcalcycle == 0 and len(modeldatacolumns) == 0:
        predictsky(ms, skymodel, modeldata='MODEL_DATA', predictskywithbeam=predictskywithbeam, sources=skymodelsource)

    #if wscleanskymodel is not None and soltypein != 'scalarphasediff' and soltypein != 'scalarphasediffFR' and create_modeldata:
    if wscleanskymodel is not None and create_modeldata and len(modeldatacolumns) == 0:
        makeimage([ms], wscleanskymodel, 1., 1., len(glob.glob(wscleanskymodel + '-????-model.fits')),\
        0, 0.0, onlypredict=True, idg=False, \
        gapchanneldivision=gapchanneldivision)


    #if skymodelpointsource is not None and soltypein != 'scalarphasediff' and soltypein != 'scalarphasediffFR' and create_modeldata:
    if skymodelpointsource is not None and create_modeldata:
        # create MODEL_DATA (no dysco!)
        run('DP3 msin=' + ms + ' msout=. msout.datacolumn=MODEL_DATA steps=[]')
        # do the predict with taql
        run("taql" + " 'update " + ms + " set MODEL_DATA[,0]=(" + str(skymodelpointsource)+ "+0i)'")
        run("taql" + " 'update " + ms + " set MODEL_DATA[,3]=(" + str(skymodelpointsource)+ "+0i)'")
        run("taql" + " 'update " + ms + " set MODEL_DATA[,1]=(0+0i)'")
        run("taql" + " 'update " + ms + " set MODEL_DATA[,2]=(0+0i)'")

    if soltype == 'scalarphasediff' or soltype == 'scalarphasediffFR':
      # PM means point source model adjusted weights
      create_weight_spectrum(ms, 'WEIGHT_SPECTRUM_PM', updateweights_from_thiscolumn='MODEL_DATA', updateweights=False) # always do to re-initialize WEIGHT_SPECTRUM_PM (because stack.MS is re-created each selfcalcycle, also MODEL_DATA changes
      # for now use updateweights=False, seems to give better results for scalarphasediff type solves
      # updateweights means WEIGHT_SPECTRUM_PM is updated based on MODEL_DATA**2, however so far this does not seem to give better results
      # update July 2024, tested on Perseus LBA with updateweights True and False, again difference is small
            
      # check if colnames are there each time because of stack.MS
      t = pt.table(ms, ack=False)
      colnames = t.colnames()
      t.close() # needs a close here because below were are writing columns potentially
      if 'DATA_CIRCULAR_PHASEDIFF' not in colnames:
        create_phasediff_column(ms, incol=incol, dysco=dysco)
      if 'MODEL_DATA_PDIFF' not in colnames:
        create_MODEL_DATA_PDIFF(ms) # make a point source
      soltype = 'phaseonly' # do this type of solve, maybe scalarphase is fine? 'scalarphase' #
      incol='DATA_CIRCULAR_PHASEDIFF'      
      modeldata = 'MODEL_DATA_PDIFF'

    if soltype in ['phaseonly_phmin', 'rotation_phmin', 'tec_phmin', 'tecandphase_phmin','scalarphase_phmin']:
      create_phase_column(ms, incol=incol, outcol='DATA_PHASEONLY', dysco=dysco)
      create_phase_column(ms, incol='MODEL_DATA', outcol='MODEL_DATA_PHASEONLY', dysco=dysco)
      soltype = soltype.split('_phmin')[0]
      incol = 'DATA_PHASEONLY'
      modeldata = 'MODEL_DATA_PHASEONLY'

    if soltype in ['phaseonly_slope', 'scalarphase_slope']:
      create_phase_slope(ms, incol=incol, outcol='DATA_PHASE_SLOPE', ampnorm=True, dysco=dysco)
      create_phase_slope(ms, incol='MODEL_DATA', outcol='MODEL_DATA_PHASE_SLOPE', ampnorm=True, dysco=dysco)
      soltype = soltype.split('_slope')[0]
      incol = 'DATA_PHASE_SLOPE'
      modeldata = 'MODEL_DATA_PHASE_SLOPE'
      # udpate weights according to weights * (MODEL_DATA/MODEL_DATA_PHASE_SLOPE)**2
      create_weight_spectrum_modelratio(ms, 'WEIGHT_SPECTRUM_PM', \
                                        updateweights=True, originalmodel='MODEL_DATA',\
                                        newmodel='MODEL_DATA_PHASE_SLOPE', backup=True)

    #if soltype in ['fulljones']:
    #  print('Setting XY and YX to 0+0i')
    #  if len(modeldatacolumns) > 1:
    #    if DDE_predict == 'WSCLEAN':
    #      for mcol in modeldatacolumns:
    #        run("taql" + " 'update " + ms + " set " + mcol + "[,1]=(0+0i)'")
    #        run("taql" + " 'update " + ms + " set " + mcol + "[,2]=(0+0i)'")
    #  else:
    #    run("taql" + " 'update " + ms + " set MODEL_DATA[,1]=(0+0i)'")
    #    run("taql" + " 'update " + ms + " set MODEL_DATA[,2]=(0+0i)'")

    if soltype in ['phaseonly','complexgain','fulljones','rotation+diagonal',\
                   'amplitudeonly','rotation+diagonalamplitude',\
                   'rotation+diagonalphase']: # for 1D plotting
      onepol = False
    if soltype in ['scalarphase','tecandphase','tec','scalaramplitude',\
                   'scalarcomplexgain','rotation','rotation+scalar',\
                   'rotation+scalarphase','rotation+scalaramplitude']:
      onepol = True

    if restoreflags:
      cmdtaql = "'update " + ms + " set FLAG=FLAG_BACKUP'"
      print("Restore flagging column: " + "taql " + cmdtaql)
      run("taql " + cmdtaql)


    t = pt.table(ms + '/SPECTRAL_WINDOW',ack=False)
    freq = np.median(t.getcol('CHAN_FREQ')[0])
    t.close()

    t = pt.table(ms + '/ANTENNA',ack=False)
    antennasms = t.getcol('NAME')
    t.close()

    t = pt.table(ms, readonly=True, ack=False)
    ms_ntimes = len(np.unique(t.getcol('TIME')))
    t.close()
    
    
    if telescope == 'LOFAR':
      if freq > 100e6:
        HBAorLBA = 'HBA'
      else:
        HBAorLBA = 'LBA'
      print('This is', HBAorLBA, 'data')
    else:
        HBAorLBA = 'other'
    print('This ms contains', antennasms)

    # determine if phases needs to be included, important if slowgains do not contain phase solutions
    includesphase = True
    if soltype == 'scalaramplitude' or soltype == 'amplitudeonly' \
       or soltype == 'rotation+diagonalphase' or soltype == 'rotation+scalarphase':
      includesphase = False

    # figure out which weight_spectrum column to use
    if soltypein == 'scalarphasediff' or soltypein == 'scalarphasediffFR' or \
           soltypein == 'phaseonly_slope' or soltypein == 'scalarphase_slope' :
       weight_spectrum = 'WEIGHT_SPECTRUM_PM'
    else:
      # check for WEIGHT_SPECTRUM_SOLVE from DR2 products
      t = pt.table(ms, ack=False)
      if 'WEIGHT_SPECTRUM_SOLVE' in t.colnames():
         weight_spectrum =  'WEIGHT_SPECTRUM_SOLVE'
      else:
         weight_spectrum =  'WEIGHT_SPECTRUM'
      t.close()  
 
   # check for previous old parmdb and remove them
    if os.path.isfile(parmdb):
      print('H5 file exists  ', parmdb)
      os.system('rm -f ' + parmdb)

    cmd = 'DP3 numthreads='+str(np.min([multiprocessing.cpu_count(),ncpu_max])) + \
          ' msin=' + ms + ' msout=. '

    if soltype == 'rotation+diagonal':
       cmd += 'ddecal.rotationdiagonalmode=diagonal ' 
    if soltype == 'rotation+diagonalamplitude':
       cmd += 'ddecal.rotationdiagonalmode=diagonalamplitude ' 
    if soltype == 'rotation+diagonalphase':
       cmd += 'ddecal.rotationdiagonalmode=diagonalphase ' 
    if soltype == 'rotation+scalar': # =scalarcomplexgain
       cmd += 'ddecal.rotationdiagonalmode=scalar ' 
    if soltype == 'rotation+scalaramplitude':
       cmd += 'ddecal.rotationdiagonalmode=scalaramplitude ' 
    if soltype == 'rotation+scalarphase':
       cmd += 'ddecal.rotationdiagonalmode=scalarphase '        
    
    # deal with the special cases because DP3 only knows soltype rotation+diagonal (it uses rotationdiagonalmode)
    if soltype in ['rotation+diagonalamplitude','rotation+diagonalphase',\
                   'rotation+scalar','rotation+scalaramplitude','rotation+scalarphase']:
       cmd += 'ddecal.mode=rotation+diagonal '
       #cmd += 'ddecal.rotationreference=True '
    else:
       cmd += 'ddecal.mode=' + soltype + ' '

    # note there are two things to check before we can use ddecal.datause=single/dual
    # 1 current solve needs to be of the correct type
    # 2 previous solves should not violate the assumptions of the current single/dual solve
    if soltype_list is not None:
      print(f"soltype_list slice: {soltype_list[0:soltypenumber]}")
      print(soltype, soltype_list)
      if DP3_dual_single:
        if soltype in ['complexgain', 'amplitudeonly', 'phaseonly'] \
          and 'fulljones' not in soltype_list[0:soltypenumber] \
          and 'rotation' not in soltype_list[0:soltypenumber] \
          and 'rotation+diagonalphase' not in soltype_list[0:soltypenumber] \
          and 'rotation+diagonalamplitude' not in soltype_list[0:soltypenumber] \
          and 'rotation+scalar' not in soltype_list[0:soltypenumber] \
          and 'rotation+scalaramplitude' not in soltype_list[0:soltypenumber] \
          and 'rotation+scalarphase' not in soltype_list[0:soltypenumber] \
          and 'rotation+diagonal' not in soltype_list[0:soltypenumber]:
            cmd += 'ddecal.datause=dual '
        if soltype in ['scalarcomplexgain', 'scalaramplitude', \
                     'tec', 'tecandphase', 'scalarphase'] \
          and 'fulljones' not in soltype_list[0:soltypenumber] \
          and 'rotation' not in soltype_list[0:soltypenumber] \
          and 'rotation+diagonalphase' not in soltype_list[0:soltypenumber] \
          and 'rotation+diagonalamplitude' not in soltype_list[0:soltypenumber] \
          and 'rotation+scalar' not in soltype_list[0:soltypenumber] \
          and 'rotation+scalaramplitude' not in soltype_list[0:soltypenumber] \
          and 'rotation+scalarphase' not in soltype_list[0:soltypenumber] \
          and 'rotation+diagonal' not in soltype_list[0:soltypenumber] \
          and 'complexgain' not in soltype_list[0:soltypenumber] \
          and 'amplitudeonly' not in soltype_list[0:soltypenumber] \
          and 'phaseonly' not in soltype_list[0:soltypenumber]: \
            cmd += 'ddecal.datause=single '

    cmd += 'msin.weightcolumn=' + weight_spectrum + ' '
    if bdaaverager:
      cmd += 'steps=[bda,ddecal] ddecal.type=ddecal bda.type=bdaaverager '
    else:
      cmd += 'steps=[ddecal] ddecal.type=ddecal ' 
    if dysco:
      cmd += 'msout.storagemanager=dysco '
      cmd += 'msout.storagemanager.weightbitrate=16 '
    
    if bdaaverager:
      cmd += 'bda.frequencybase= ' + 'bda.minchannels=' + format_nchan(nchan, ms) + ' ' 
      if type(solint) == list:
        cmd += 'bda.timebase= ' + 'bda.maxinterval=' + int(lcm/np.max(divisors)) + ' ' #TODO: Comment from Jurjen: lcm and divisors are non-existing variables --> need fix
      else:
        cmd += 'bda.timebase= ' + 'bda.maxinterval=' + format_solint(solint, ms) + ' ' 

    modeldatacolumns_solve = [] # empty, will be filled below if applicable
    dir_id_kept = [] # empty, will be filled below if applicable
    if len(modeldatacolumns) > 0:
      if DDE_predict == 'DP3' and soltypelist_includedir is not None:
         print('DDE_predict with soltypelist_includedir is not supported')
         raise Exception('DDE_predict with soltypelist_includedir is not supported')
      
      if soltypelist_includedir is not None:
          modeldatacolumns_solve, sourcedir_removed, dir_id_kept = updatemodelcols_includedir(modeldatacolumns, soltypenumber, soltypelist_includedir, ms) 
      
      if DDE_predict == 'DP3':
         cmd += 'ddecal.sourcedb=' + dde_skymodel + ' '
         if telescope == 'LOFAR': # predict with array factor for LOFAR data
           cmd += 'ddecal.usebeammodel=True '
           cmd += 'ddecal.usechannelfreq=True ddecal.beammode=array_factor '
           cmd += 'ddecal.beamproximitylimit=' + str(beamproximitylimit) + ' '
      else:
         if len(modeldatacolumns_solve) >0: # >0 (and not > 1 because we can have 1 direction left)
           cmd += "ddecal.modeldatacolumns='[" + ','.join(map(str, modeldatacolumns_solve)) + "]' " 
         else:
           cmd += "ddecal.modeldatacolumns='[" + ','.join(map(str, modeldatacolumns)) + "]' "
      if len(modeldatacolumns) > 1: # so we are doing a dde solve
        cmd += 'ddecal.solveralgorithm=' + solveralgorithm_dde + ' '
      else: # in case the list still has length 1
        cmd += 'ddecal.solveralgorithm=' + solveralgorithm + ' '
    else:
      cmd += "ddecal.modeldatacolumns='[" + modeldata + "]' " 
      cmd += 'ddecal.solveralgorithm=' + solveralgorithm + ' '


    cmd += 'ddecal.maxiter='+str(int(maxiter)) + ' ddecal.propagatesolutions=True '    
    # Do list comprehension if solint is a list
    if type(solint) == list:
       if len(dir_id_kept) > 0:
         print(solint)
         print(dir_id_kept)
         solint = [solint[i] for i in dir_id_kept] # overwrite solint, selecting on the directions kept
       solints = [int(format_solint(x, ms)) for x in solint]
       solints = tweak_solints(solints, ms_ntimes=ms_ntimes)
       import math
       lcm = math.lcm(*solints)
       divisors = [int(lcm/i) for i in solints]
       cmd += 'ddecal.solint=' + str(lcm) + ' '
       cmd += 'ddecal.solutions_per_direction=' + "'"+str(divisors).replace(' ','') + "' "
    else:
       solint_integer = format_solint(solint, ms) # create the integer number for DP3
       cmd += 'ddecal.solint=' + str(tweak_solints_single(int(solint_integer), ms_ntimes)) + ' '
    cmd += 'ddecal.nchan=' + format_nchan(nchan, ms) + ' '
    cmd += 'ddecal.h5parm=' + parmdb + ' '


    # preapply H5 from previous pertubation for DDE solves with DP3
    if (len(modeldatacolumns) > 1) and (len(preapplyH5_dde) > 0):
      if DDE_predict == 'DP3':
        cmd += build_applycal_dde_cmd(preapplyH5_dde) + ' '
      else:
        cmd += 'msin.datacolumn=DATA ' # to prevent solving out of CORRECTED_PREAPPLY$N
    else:
      cmd += 'msin.datacolumn=' + incol + ' '


    # SET UVMIN
    if soltypein == 'scalarphasediff' or soltypein == 'scalarphasediffFR':
       if uvminscalarphasediff is not None:
         cmd += 'ddecal.uvlambdamin=' + str(uvminscalarphasediff) + ' '
       else:
         if uvmin != 0:
           cmd += 'ddecal.uvlambdamin=' + str(uvmin) + ' '
    else:
       if uvmin != 0:
         cmd += 'ddecal.uvlambdamin=' + str(uvmin) + ' '
       if uvmax is not None: # no need to see uvlambdamax for scalarphasediff solves since there we always solve against a point source
         cmd += 'ddecal.uvlambdamax=' + str(uvmax) + ' '

    if antennaconstraint is not None:
        cmd += 'ddecal.antennaconstraint=' + antennaconstraintstr(antennaconstraint, antennasms, HBAorLBA, telescope=telescope) + ' '
    if SMconstraint > 0.0 and nchan != 0:
        cmd += 'ddecal.smoothnessconstraint=' + str(SMconstraint*1e6) + ' '
        cmd += 'ddecal.smoothnessreffrequency=' + str(SMconstraintreffreq*1e6) + ' '
        cmd += 'ddecal.smoothnessspectralexponent=' + str(SMconstraintspectralexponent) + ' '
        cmd += 'ddecal.smoothnessrefdistance=' + str(SMconstraintrefdistance*1e3) + ' ' # input units in km

    if soltype in ['phaseonly','scalarphase','tecandphase','tec','rotation',\
                   'rotation+scalarphase','rotation+diagonalphase']:
       cmd += 'ddecal.tolerance=' + str(tolerance) + ' '
       if soltype in ['tecandphase','tec']:
          cmd += 'ddecal.approximatetec=True '
          cmd += 'ddecal.stepsize=0.2 '
          cmd += 'ddecal.maxapproxiter=45 '
          cmd += 'ddecal.approxtolerance=6e-3 '
    if soltype in ['complexgain','scalarcomplexgain','scalaramplitude','amplitudeonly',\
                   'rotation+diagonal','fulljones','rotation+scalar',\
                   'rotation+diagonalamplitude','rotation+scalaramplitude']:
       cmd += 'ddecal.tolerance=' + str(tolerance) + ' ' # for now the same as phase soltypes
    #cmd += 'ddecal.detectstalling=False '

    print('DP3 solve:', cmd)
    logger.info('DP3 solve: ' + cmd)
    
    # START prepare to remove this at some point
    run(cmd)
    
    #if soltype == 'fulljones':
    #   sys.exit()
    #sys.exit()
    
    if False: 
        if selfcalcycle > 0 and (soltypein=="scalarphasediffFR" or soltypein=="scalarphasediff"):
            h5_tocopy = soltypein + str(soltypenumber)+"_selfcalcyle000_" + os.path.basename(ms)+".h5.scbackup"
            print("COPYING PREVIOUS SCALARPHASEDIFF SOLUTION")
            print('cp -r ' + h5_tocopy + ' ' + parmdb)
            os.system('cp -r ' + h5_tocopy + ' ' + parmdb)
        else:
            run(cmd)
    if selfcalcycle==0 and (soltypein=="scalarphasediffFR" or soltypein=="scalarphasediff"):
        os.system("cp -r " + parmdb + " " + parmdb + ".scbackup")
    # END prepare to remove this at some point

    if (len(modeldatacolumns_solve) >0) and (len(modeldatacolumns) != len(modeldatacolumns_solve)):
       # fix coordinates otherwise h5merge will merge all directions into one when add_directions is done (as all coordinates are the same up to this point)
       update_sourcedir_h5_dde(parmdb, 'facetdirections.p', dir_id_kept=dir_id_kept)

       # we need to add back the extra direction into the h5 file  
       import h5_merger
       import split_h5
       outparmdb = 'adddirback' + parmdb
       if os.path.isfile(outparmdb):
          os.system('rm -f ' + outparmdb)
       h5_merger.merge_h5(h5_out=outparmdb,h5_tables=parmdb,add_directions=sourcedir_removed.tolist(),propagate_flags=False)

       # now we split them all into separate h5 per direction so we can reorder and fill them
       print('Splitting directions into separate h5')
       split_h5.split_multidir(outparmdb)
       
       #fill the added emtpy directions with the closest ones that were solved for
       print('Copy over solutions from skipped directions')
       copy_over_solutions_from_skipped_directions(modeldatacolumns,dir_id_kept)
   
       # create backup of parmdb and remove orginal and cleanup
       os.system('cp ' + parmdb + ' ' + parmdb + '.backup')
       os.system('rm -f ' + parmdb)
       os.system('rm -f ' + outparmdb)
    
       # merge h5 files in order of the directions in facetdirections.p and recreate parmdb
       # clean up previously splitted directions inside this function
       print('Merge h5 files in correct order and recreate parmdb')
       merge_splitted_h5_ordered(modeldatacolumns, parmdb, clean_up=True)
       
       # fix direction names
       update_sourcedirname_h5_dde(parmdb, modeldatacolumns)
       #sys.exit()

    if len(modeldatacolumns) > 1: # and DDE_predict == 'WSCLEAN':
       update_sourcedir_h5_dde(parmdb, 'facetdirections.p')

    if has0coordinates(parmdb):
       logger.warning('Direction coordinates are zero in: ' + parmdb)

    # Roation checking
    if soltype in ['rotation','rotation+diagonal','rotation+diagonalphase','rotation+diagonalamplitude',\
                   'rotation+scalar','rotation+scalaramplitude','rotation+scalarphase']:
      removenans(parmdb, 'rotation000')
      fix_weights_rotationh5(parmdb)
      refant=findrefant_core(parmdb)
      force_close(parmdb)
      fix_rotationreference(parmdb, refant)

    # tec checking
    if soltype in ['tec','tecandphase']:
       removenans(parmdb, 'tec000')
       refant=findrefant_core(parmdb)
       fix_tecreference(parmdb, refant)
       force_close(parmdb)

    # phase checking
    if soltype in ['rotation+diagonal','rotation+diagonalphase',\
                   'rotation+scalar','rotation+scalarphase',\
                   'scalarcomplexgain','complexgain','scalarphase',\
                   'phaseonly']:
       removenans(parmdb, 'phase000')
       refant=findrefant_core(parmdb)
       fix_phasereference(parmdb, refant)
       force_close(parmdb)
         
    if int(maxiter) == 1: # this is a template solve only
      print('Template solve, not going to make plots or do solution flagging')
      return

    outplotname = parmdb.split('_' + os.path.basename(ms) + '.h5')[0]

    if incol == 'DATA_CIRCULAR_PHASEDIFF':
      print('Manually updating H5 to get the phase difference correct')
      refant=findrefant_core(parmdb) # phase matrix plot
      force_close(parmdb)
      makephasediffh5(parmdb, refant)
    if incol == 'DATA_CIRCULAR_PHASEDIFF' and soltypein == 'scalarphasediffFR':
      print('Fiting for Faraday Rotation with losoto on the phase differences')
      # work with copies H5 because losoto changes the format splitting off the length 1 direction axis creating issues with H5merge (also add additional solution talbes which we do not want)
      os.system('cp -f ' + parmdb + ' ' + 'FRcopy' + parmdb)
      losoto_parsetFR = create_losoto_FRparset(ms, refant=findrefant_core(parmdb), outplotname=outplotname,dejump=dejumpFR)
      run('losoto ' + 'FRcopy' + parmdb + ' ' + losoto_parsetFR)
      rotationmeasure_to_phase('FRcopy' + parmdb, parmdb, dejump=dejumpFR)
      run('losoto ' + parmdb + ' ' + create_losoto_FRparsetplotfit(ms, refant=findrefant_core(parmdb), outplotname=outplotname))
      force_close(parmdb)


    if incol == 'DATA_PHASE_SLOPE':
      print('Manually updating H5 to get the cumulative phase')
      #makephaseCDFh5(parmdb)
      makephaseCDFh5_h5merger(parmdb, ms, modeldatacolumns)

    if resetsols is not None:
      if soltype in ['phaseonly','scalarphase','tecandphase','tec','rotation','fulljones',\
                     'complexgain','scalarcomplexgain','rotation+diagonal',\
                     'rotation+diagonalamplitude','rotation+diagonalphase',\
                     'rotation+scalar','rotation+scalarphase','rotation+scalaramplitude']:
         refant=findrefant_core(parmdb)
         force_close(parmdb)
      else:
         refant = None
      resetsolsforstations(parmdb, antennaconstraintstr(resetsols, antennasms, HBAorLBA, useforresetsols=True, telescope=telescope), refant=refant)

    if resetdir is not None:
      if soltype in ['phaseonly','scalarphase','tecandphase','tec','rotation','fulljones',\
                     'complexgain','scalarcomplexgain','rotation+diagonal',\
                      'rotation+diagonalamplitude','rotation+diagonalphase',\
                      'rotation+scalar','rotation+scalarphase','rotation+scalaramplitude']:
         refant=findrefant_core(parmdb)
         force_close(parmdb)
      else:
         refant = None
      
      resetsolsfordir(parmdb, resetdir, refant=refant)


    if number_freqchan_h5(parmdb) > 1:
      onechannel = False
    else:
      onechannel = True


    # Check for bad values (amplitudes/fulljones)
    if soltype in ['scalarcomplexgain','complexgain','amplitudeonly','scalaramplitude',\
                   'fulljones','rotation+diagonal','rotation+diagonalamplitude',\
                   'rotation+scalar','rotation+scalaramplitude']:
      if resetdir is not None or resetsols is not None:
         flagbadamps(parmdb, setweightsphases=includesphase, flagamp1=False, flagampxyzero=False) # otherwise it flags the solutions which where reset
      else:
         flagbadamps(parmdb, setweightsphases=includesphase)
      if soltype == 'fulljones':
         removenans_fulljones(parmdb)
      else:  
         removenans(parmdb, 'amplitude000')
      medamp = medianamp(parmdb)


      if soltype != 'amplitudeonly' and soltype != 'scalaramplitude' \
             and soltype != 'rotation+diagonalamplitude' \
             and soltype != 'rotation+scalaramplitude':
         #try:
         #  change_refant(parmdb,'phase000')
         #except:
         #  pass
         removenans(parmdb, 'phase000')
      
      if soltype == 'fulljones':
         #if normamps: #and all(rsl is None for rsl in resetsols_list) and all(rdl is None for rdl in resetdir_list):
             # otherwise you get too much setting to 1 due to large amp deviations, in particular fullones on raw data which has very high correlator amps (with different ILT vals), also resets in that case cause issues (resets are ok if the amplitudes are close to 1). Hence using the normamps test seems the most logical choice
             flaglowamps_fulljones(parmdb, lowampval=medamp/ampresetvalfactor, flagging=flagging, setweightsphases=includesphase)
             flaghighamps_fulljones(parmdb, highampval=medamp*ampresetvalfactor, flagging=flagging, setweightsphases=includesphase)
      else:
         #if normamps: #and all(rsl is None for rsl in resetsols_list) and all(rdl is None for rdl in resetdir_list): 
            # otherwise you get too much setting to 1 due to large amp deviations, in particular fullones on raw data which has very high correlator amps (with different ILT vals), also resets in that case cause issues (resets are ok if the amplitudes are close to 1).  Hence using the normamps test seems the most logical choice
            flaglowamps(parmdb, lowampval=medamp/ampresetvalfactor, flagging=flagging, setweightsphases=includesphase)
            flaghighamps(parmdb, highampval=medamp*ampresetvalfactor, flagging=flagging, setweightsphases=includesphase)

      if soltype == 'fulljones' and clipsolutions:
        print('Fulljones and solution clipping not supported')
        raise Exception('Fulljones and clipsolutions not implemtened')
      if clipsolutions:
        flaglowamps(parmdb, lowampval=clipsollow, flagging=True, setweightsphases=True)
        flaghighamps(parmdb, highampval=clipsolhigh, flagging=True, setweightsphases=True)

    # ---------------------------------
    # ---------------------------------
    # makes plots and do LOSOTO flagging
    if soltype in ['rotation','rotation+diagonal','rotation+diagonalamplitude',\
                   'rotation+scalar','rotation+scalaramplitude',\
                   'rotation+scalarphase','rotation+diagonalphase']:

      losotoparset_rotation = create_losoto_rotationparset(ms, onechannel=onechannel, outplotname=outplotname + 'ROT', refant=findrefant_core(parmdb)) # phase matrix plot
      force_close(parmdb)
      cmdlosoto = 'losoto ' + parmdb + ' ' + losotoparset_rotation
      print(cmdlosoto)
      logger.info(cmdlosoto)
      run(cmdlosoto)
      
      
      if soltype in ['rotation+scalarphase','rotation+diagonalphase']:
         losotoparset_phase = create_losoto_fastphaseparset(ms, onechannel=onechannel, onepol=onepol, outplotname=outplotname, refant=findrefant_core(parmdb)) # phase matrix plot
         cmdlosoto = 'losoto ' + parmdb + ' ' + losotoparset_phase
         force_close(parmdb)
         print(cmdlosoto)
         logger.info(cmdlosoto)
         run(cmdlosoto)


    if soltype in ['phaseonly','scalarphase']:
      losotoparset_phase = create_losoto_fastphaseparset(ms, onechannel=onechannel, onepol=onepol, outplotname=outplotname, refant=findrefant_core(parmdb)) # phase matrix plot
      cmdlosoto = 'losoto ' + parmdb + ' ' + losotoparset_phase
      force_close(parmdb)
      print(cmdlosoto)
      logger.info(cmdlosoto)
      run(cmdlosoto)


    if soltype in ['tecandphase', 'tec']:
       tecandphaseplotter(parmdb, ms, outplotname=outplotname) # use own plotter because losoto cannot add tec and phase

    if soltype in ['tec']:
       losotoparset_tec = create_losoto_tecparset(ms, outplotname=outplotname,\
                             refant=findrefant_core(parmdb), markersize=compute_markersize(parmdb))
       cmdlosoto = 'losoto ' + parmdb + ' ' + losotoparset_tec
       print(cmdlosoto)
       logger.info(cmdlosoto)
       run(cmdlosoto)
       force_close(parmdb)


    if soltype in ['scalarcomplexgain','complexgain','amplitudeonly','scalaramplitude', \
                   'fulljones','rotation+diagonal','rotation+diagonalamplitude',\
                   'rotation+scalar','rotation+scalaramplitude'] and (ntimesH5(parmdb) > 1): # plotting/flagging fails if only 1 timeslot
       print('Do flagging?:', flagging)
       if flagging and not onechannel:
          if soltype == 'fulljones':
            print('Fulljones and flagging not implemtened')
            raise Exception('Fulljones and flagging not implemtened')
          else:
            losotoparset = create_losoto_flag_apgridparset(ms, flagging=True, maxrms=flagslowamprms, \
                                                           maxrmsphase=flagslowphaserms, \
                                                           includesphase=includesphase, onechannel=onechannel, \
                                                           medamp=medamp, flagphases=flagslowphases, onepol=onepol,\
                                                           outplotname=outplotname, refant=findrefant_core(parmdb))
            force_close(parmdb)
       else:
          losotoparset = create_losoto_flag_apgridparset(ms, flagging=False, includesphase=includesphase, \
                         onechannel=onechannel, medamp=medamp, onepol=onepol, outplotname=outplotname,\
                         refant=findrefant_core(parmdb), fulljones=fulljonesparmdb(parmdb))
          force_close(parmdb)

       # MAKE losoto command
       if flagging:
         os.system('cp -f ' + parmdb + ' ' + parmdb + '.backup')
       cmdlosoto = 'losoto ' + parmdb + ' ' + losotoparset
       print(cmdlosoto)
       logger.info(cmdlosoto)
       run(cmdlosoto)
    if len(tables.file._open_files.filenames) >= 1: # for debugging
      print('End runDPPPbase, some HDF5 files are not closed:', tables.file._open_files.filenames)
      force_close(parmdb)
    return

def rotationmeasure_to_phase(H5filein, H5fileout, dejump=False): 
    # note for scalarphase/phaseonly solve, does not work for tecandphase as freq axis is missing there for phase000
    H5in = tables.open_file(H5filein,mode='r')
    H5out = tables.open_file(H5fileout,mode='a')
    c = 2.99792458e8

    if dejump:
       rotationmeasure = H5in.root.sol000.rotationmeasure001.val[:]
    else:
       rotationmeasure = H5in.root.sol000.rotationmeasure000.val[:]
    phase = H5in.root.sol000.phase000.val[:] # time, freq, ant, dir, pol
    freq  =  H5in.root.sol000.phase000.freq[:]
    wav = c/freq

    print('FR step: Shape rotationmeasure000/1', rotationmeasure.shape)
    print('FR step: Shape phase000', phase.shape)

    for antenna_id,antennatmp in enumerate(H5in.root.sol000.phase000.ant[:]):
       for freq_id, freqtmp in enumerate(freq):
          phase[:, freq_id, antenna_id, 0, 0]  = \
              2.*rotationmeasure[antenna_id,:]*(wav[freq_id])**2  # notice the factor of 2 because of RR-LL
    # note slice over time-axis
    phase[..., -1] = 0.0 # assume last axis is pol-axis, set YY to zero because losoto residual computation changes this froom 0.0 (it divides the poll diff over the XX and YY phases and does not put it all in XX)

    H5out.root.sol000.phase000.val[:] = phase
    H5out.flush()
    H5out.close()
    H5in.close()
    return

def update_sourcedir_h5_dde(h5, sourcedirpickle, dir_id_kept=None):
    f = open(sourcedirpickle, 'rb')
    sourcedir = pickle.load(f)
    f.close()
    
    if dir_id_kept is not None:
       print('Before directions')
       print(sourcedir)
       sourcedir =  np.copy(sourcedir[dir_id_kept][:])
       print('After directions')
       print(sourcedir)
    
    H = tables.open_file(h5,mode='a')
    for direction_id, direction in enumerate(np.copy(H.root.sol000.source[:])):
       H.root.sol000.source[direction_id] =  (direction['name'], [sourcedir[direction_id,0], sourcedir[direction_id,1]])
    H.close()
    
    return

def has0coordinates(h5):
    """
    Check if the coordinates in the directions are 0, avoids being hit by this rare DP3 bug
    """
    h5 = tables.open_file(h5)
    for c in h5.root.sol000.source[:]:
        x, y = c[1]
        if x==0. and y==0.:
            h5.close()
            return True
    h5.close()
    return False

def findrefant_core(H5file):
    """
    Basically like the other one, but now it actually uses losoto
    """
    H = h5parm.h5parm(H5file)
    solset = H.getSolset('sol000')
    soltabs = solset.getSoltabNames()
    for st in soltabs:
        # Find a reasonable soltab to use
        if 'phase000' in st or 'rotation000' in st or 'tec000' in st:
            break
    soltab = solset.getSoltab(st)

    # Find core stations
    ants = soltab.getValues()[1]['ant']
    if 'ST001' in ants:
        H.close()
        return 'ST001'
    cs_indices = np.where(['CS' in ant for ant in ants])[0]

    # temporary MeerKAT fix
    if 'm013' in ants:
        H.close()
        return 'm013'
    if 'm012' in ants:
        H.close()
        return 'm012'
    if 'm011' in ants:
        H.close()
        return 'm011'
    if 'm010' in ants:
        H.close()
        return 'm010'
    if 'm009' in ants:
        H.close()
        return 'm009'      
    if 'm002' in ants:
        H.close()
        return 'm002'    
    if 'm001' in ants:
        H.close()
        return 'm001'          


    if len(cs_indices) == 0: # in case there are no CS stations try with RS
       cs_indices = np.where(['RS' in ant for ant in ants])[0]

    # Find the antennas and which dimension that corresponds to
    ant_index = np.where(np.array(soltab.getAxesNames())=='ant')[0][0]

    # Find the antenna with the least flagged datapoint
    weightsum = []
    ndims = soltab.getValues()[0].ndim
    for cs in cs_indices:
        slc = [slice(None)]*ndims
        slc[ant_index] = cs
        weightsum.append(np.nansum(soltab.getValues(weight=True)[0][tuple(slc)]))
    maxant = np.argmax(weightsum)
    H.close()
    # force_close(H5file) this does not work for some reasons, because it is inside a function that's called in a function call ass argument?
    return ants[maxant]

def create_losoto_FRparsetplotfit(ms, refant='CS001LBA', outplotname='FR'):
    """
    Create a losoto parset to fit Faraday Rotation on the phase difference'.
    """
    parset = 'losotoFR_plotresult.parset'
    os.system('rm -f ' + parset)
    f=open(parset, 'w')

    f.write('[plotFRresult]\n')
    f.write('pol = [XX,YY]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = [sol000/phase000]\n')
    f.write('axesInPlot = [time,freq]\n')
    f.write('axisInTable = ant\n')
    f.write('minmax = [-3.14,3.14]\n')
    f.write('prefix = plotlosoto%s/%s\n' % (ms,outplotname + 'phases_fitFR'))
    f.write('refAnt = %s\n\n\n' % refant)
    f.close()
    return parset

def create_losoto_FRparset(ms, refant='CS001LBA', freqminfitFR=20e6, outplotname='FR', onlyplotFRfit=False, dejump=False):
    """
    Create a losoto parset to fit Faraday Rotation on the phase difference'.
    """
    parset = 'losotoFR.parset'
    os.system('rm -f ' + parset)
    f=open(parset, 'w')

    f.write('[duplicate]\n')
    f.write('operation = DUPLICATE\n')
    f.write('soltab = sol000/phase000\n')
    f.write('soltabOut = phaseOrig000\n\n\n')

    # should not be needed as already done but just in case....
    f.write('[reset]\n')
    f.write('operation = RESET\n')
    f.write('soltab = sol000/phase000\n')
    f.write('pol = YY\n')
    f.write('dataVal = 0.0\n\n\n')

    f.write('[plotphase]\n')
    f.write('pol = [XX,YY]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = [sol000/phase000]\n')
    f.write('axesInPlot = [time,freq]\n')
    f.write('axisInTable = ant\n')
    f.write('minmax = [-3.14,3.14]\n')
    f.write('prefix = plotlosoto%s/%s\n' % (ms,outplotname + 'phases_beforeFR'))
    f.write('refAnt = %s\n\n\n' % refant)

    f.write('[faraday]\n')
    f.write('operation = FARADAY\n')
    f.write('soltab = sol000/phase000\n')
    f.write('refAnt = %s\n' % refant)
    f.write('maxResidual = 2\n')
    f.write('freq.minmaxstep = [%s,1e9]\n' % str(freqminfitFR))
    f.write('soltabOut = rotationmeasure000\n\n\n')

    f.write('[plotFR]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = sol000/rotationmeasure000\n')
    f.write('axesInPlot = [time]\n')
    f.write('axisInTable = ant\n')
    f.write('prefix = plotlosoto%s/%s\n\n\n' % (ms,outplotname + 'FR'))

    if dejump:
       f.write('[frdejump]\n')
       f.write('operation = FRJUMP\n')
       f.write('soltab = sol000/rotationmeasure000\n')
       f.write('soltabOut = rotationmeasure001\n')
       f.write('clipping = [%s,1e9]\n\n\n' % str(freqminfitFR))

       f.write('[plotFR_dejump]\n')
       f.write('operation = PLOT\n')
       f.write('soltab = sol000/rotationmeasure001\n')
       f.write('axesInPlot = [time]\n')
       f.write('axisInTable = ant\n')
       f.write('prefix = plotlosoto%s/%s\n\n\n' % (ms,outplotname + 'FRdejumped'))


    f.write('[residuals]\n')
    f.write('operation = RESIDUALS\n')
    f.write('soltab = sol000/phase000\n')
    if dejump:
       f.write('soltabsToSub = rotationmeasure001\n\n\n')
    else:
       f.write('soltabsToSub = rotationmeasure000\n\n\n')

    f.write('[plotRES]\n')
    f.write('operation = PLOT\n')
    f.write('soltab = sol000/phase000\n')
    f.write('axesInPlot = [time,freq]\n')
    f.write('AxisInTable = ant\n')
    f.write('AxisDiff = pol\n')
    f.write('plotFlag = True\n')
    f.write('prefix = plotlosoto%s/%s\n' % (ms,outplotname + 'residualphases_afterFR'))
    f.write('refAnt = %s\n' % refant)
    f.write('minmax = [-3.14,3.14]\n\n\n')

    f.close()
    return parset


# to remove H5/h5 and other files out of a wildcard selection if needed
def removenonms(mslist):
    """ Remove files that are not MS (ending on wrong extension)

    Args:
        mslist: measurement set list

    Returns:
        New list
    """
    newmslist = []
    for ms in mslist:
        if ms.lower().endswith(('.h5', '.png', '.parset', '.fits', '.backup', '.obj', '.log', '.reg', '.gz', '.tar', '.tmp', '.ddfcache')) or \
        ms.lower().startswith(('plotlosoto','solintimage')):
            print('WARNING, removing ', ms, 'not a ms-type? Removed it!')
        else:
            newmslist.append(ms)
    return newmslist

# check is there are enough timesteps in the ms
# for example this will remove an observations of length 600s
# in that case a lot of assumptions break, for example amplitude flagging in losoto
# also if a "ms" does not open iwht pt.table it means wrong input was provided 
def check_valid_ms(mslist):
  for ms in mslist:
    if not os.path.isdir(ms):
      print(ms, ' does not exist')
      raise Exception('ms does not exist')
    if ms.startswith("."):
      print(ms, ' This ms starts with a "." character, this is not allowed')
      raise Exception('Invalid ms name, do not use relative paths')
      
  for ms in mslist:
    t = pt.table(ms, ack=False)
    times = np.unique(t.getcol('TIME'))

    if len(times) <= 20:
      print('---------------------------------------------------------------------------')
      print('ERROR, ', ms, 'not enough timesteps in ms/too short observation')
      print('---------------------------------------------------------------------------')
      raise Exception('You are providing a MS with less than 20 timeslots, that is not enough to self-calibrate on')
    t.close()
  return 

def arg_as_list(s):
    v = ast.literal_eval(s)
    if type(v) is not list:
        raise argparse.ArgumentTypeError("Argument \"%s\" is not a list" % (s))
    return v

def arg_as_str_or_list(s):
    if "[" not in s and "]" not in s:
        #print('Return str')
        return str(s)
    v = ast.literal_eval(s)
    if type(v) is list:
        #print('Skymodel is a list')
        return v
    raise argparse.ArgumentTypeError("Argument \"%s\" is not a string or list" % (s))


def arg_as_float_or_list(s):
    try:
        return float(s)
    except:
        pass
    v = ast.literal_eval(s)
    if type(v) is list:
        #print('Skymodel is a list')
        return v
    raise argparse.ArgumentTypeError("Argument \"%s\" is not a float or list" % (s))


def makemaskthresholdlist(maskthresholdlist, stop):
   maskthresholdselfcalcycle = []
   for mm in range(stop):
      try:
        maskthresholdselfcalcycle.append(maskthresholdlist[mm])
      except:
        maskthresholdselfcalcycle.append(maskthresholdlist[-1]) # add last value
   return maskthresholdselfcalcycle

def niter_from_imsize(imsize):
   if imsize is None:
     print('imsize not set')
     raise Exception('imsize not set')
   if imsize < 1024:
     niter = 15000 # minimum  value
   else:
     niter = 15000*int((float(imsize)/1024.))

   return niter

def basicsetup(mslist, args):
   longbaseline =  checklongbaseline(mslist[0])
   if args['removeinternational']:
      print('Forcing longbaseline to False as --removeinternational has been specified')  
      longbaseline = False  
   # Determine HBA or LBA
   t    = pt.table(mslist[0] + '/SPECTRAL_WINDOW',ack=False)
   freq = np.median(t.getcol('CHAN_FREQ')[0])
   t.close()
   # set telescope
   t = pt.table(mslist[0] + '/OBSERVATION', ack=False)
   telescope = t.getcol('TELESCOPE_NAME')[0] 
   t.close()

   if telescope == 'LOFAR':
     if freq < 100e6:
       LBA = True
       HBAorLBA = 'HBA'
     else:
       LBA = False
       HBAorLBA = 'LBA'
   else: 
     HBAorLBA = 'other'
     LBA = False
     HBA = False

   # set some default values if not provided
   if args['uvmin'] is None:
     if longbaseline:
        args['uvmin'] = 20000.
     else:  
        if LBA:
            if freq >= 40e6:
              args['uvmin'] = 80.
            if freq < 40e6:
              args['uvmin'] = 60.
        else:
            args['uvmin'] = 350.

   if type(args['uvminim']) is not list: 
      if args['uvminim'] is None:
         if telescope == 'LOFAR':
            args['uvminim'] = 80.  
         else:
            args['uvminim'] = 10. # MeerKAt for example 

   if args['pixelscale'] is None and telescope != 'MeerKAT':
     if LBA:
       if longbaseline:
         args['pixelscale'] = 0.08
       else:
         args['pixelscale'] = np.rint(3.0*54e6/freq)
     else:
       if longbaseline:
         args['pixelscale'] = 0.04
       else:
         args['pixelscale'] = 1.5
   elif telescope == 'MeerKAT':
      if freq < 1e9: # UHF-band
         args['pixelscale'] = pixelscale = 1.8  
      elif freq < 2e9: # L-band
         args['pixelscale'] = pixelscale = 1.
      elif freq < 4e9: # S-band   
         args['pixelscale'] = pixelscale = 0.5
 
   if (args['delaycal'] or args['auto']) and  longbaseline and not LBA:
     if args['imsize'] is None:
       args['imsize'] = 2048

   if args['boxfile'] is not None:
     if args['DDE']:
        args['imsize']   = getimsize(args['boxfile'], args['pixelscale'], increasefactor=1.025)
     else:
        args['imsize']   = getimsize(args['boxfile'], args['pixelscale'])
   if args['niter'] is None:
     args['niter'] = niter_from_imsize(args['imsize'])

   if args['auto'] and not longbaseline:
     args['update_uvmin'] = True
     args['usemodeldataforsolints'] = True
     args['forwidefield'] = True
     args['autofrequencyaverage'] = True
     if LBA:
       args['BLsmooth_list'] = [True]*len(args['soltype_list'])
     else:
       args['update_multiscale'] = True # HBA only
       if args['autofrequencyaverage_calspeedup']:
           args['soltypecycles_list'] = [0,999,2]
           args['stop'] = 8

   if args['auto'] and  longbaseline and not args['delaycal']:
     args['update_uvmin'] = False
     args['usemodeldataforsolints'] = True
     args['forwidefield'] = True
     args['autofrequencyaverage'] = True
     args['update_multiscale'] = True

     args['soltypecycles_list'] = [0,3]
     args['soltype_list'] = [args['targetcalILT'],'scalarcomplexgain']
     if args['targetcalILT'] == 'tec' or args['targetcalILT'] == 'tecandphase':
        args['smoothnessconstraint_list'] = [0.0, 5.0]
     else:
        args['smoothnessconstraint_list'] = [10.0, 5.0]
        args['smoothnessreffrequency_list'] = [120.0, 0.0]
        args['smoothnessspectralexponent_list'] = [-1.0, -1.0]
        args['smoothnessrefdistance_list'] = [0.0,0.0]
     args['uvmin'] =  20000
     
     if args['imsize'] > 1600:
        args['paralleldeconvolution'] = np.min([2600,int(args['imsize']/2)])
     
     if LBA:
       args['BLsmooth_list'] = [True]*len(args['soltype_list'])

   if args['delaycal'] and LBA:
       print('Option automated delaycal can only be used for HBA')
       raise Exception('Option automated delaycal can only be used for HBA')
   if args['delaycal'] and not longbaseline:
       print('Option automated delaycal can only be used for longbaseline data')
       raise Exception('Option automated delaycal can only be used for longbaseline data')

   if args['delaycal'] and longbaseline and not LBA:
     args['update_uvmin'] = False
     # args['usemodeldataforsolints'] = True # NEEDS SPECIAL SETTINGS to be implemented
     args['solint_list']="['5min','32sec','1hr']" 
     args['forwidefield'] = True
     args['autofrequencyaverage'] = True
     args['update_multiscale'] = True

     args['soltypecycles_list'] = [0,0,3]
     args['soltype_list'] = ['scalarphasediff','scalarphase','scalarcomplexgain']
     args['smoothnessconstraint_list'] = [8.0,2.0,15.0]
     args['smoothnessreffrequency_list'] = [120.,144.,0.0]
     args['smoothnessspectralexponent_list'] = [-2.0,-1.0,-1.0]
     args['smoothnessrefdistance_list'] = [0.0,0.0,0.0]
     args['antennaconstraint_list'] = ['alldutch',None,None]
     args['nchan_list'] = [1,1,1]
     args['uvmin'] =  40000
     args['stop'] = 8
     args['maskthreshold'] = [5]
     args['docircular'] = True


   # reset tecandphase -> tec for LBA
   if LBA and args['usemodeldataforsolints']:
     args['soltype_list'][1] = 'tec'  
     # args['soltype_list'][0] = 'tec'  

     if freq < 30e6:
       # args['soltype_list'] = ['tecandphase','tec']    # no scalarcomplexgain in the list, do not use "tec" that gives rings around sources for some reason
       args['soltype_list'] = ['tecandphase','tecandphase']    # no scalarcomplexgain in the list

   if args['forwidefield']:
      args['doflagging'] = False
      args['clipsolutions'] = False

   automask = 2.5
   if args['maskthreshold'][-1] < automask:
     automask = args['maskthreshold'][-1] # in case we use a low value for maskthreshold, like Herc A

   args['imagename']  = args['imagename'] + '_'
   if args['fitsmask'] is not None:
     fitsmask = args['fitsmask']
   else:
     fitsmask = None

   if args['boxfile'] is not None:
     outtarname = (args['boxfile'].split('/')[-1]).split('.reg')[0] + '.tar.gz'
   else:
     outtarname = 'calibrateddata' + '.tar.gz'

   maskthreshold_selfcalcycle = makemaskthresholdlist(args['maskthreshold'], args['stop'])

   # set telescope
   t = pt.table(mslist[0] + '/OBSERVATION', ack=False)
   telescope = t.getcol('TELESCOPE_NAME')[0] 
   t.close()
   #idgin = args['idg'] # store here as we update args['idg'] at some point to made image000 for selfcalcycle 0 in when --DDE is enabled

   if type(args['channelsout']) is str:
     if args['channelsout'] == 'auto':
        args['channelsout'] = set_channelsout(mslist)
     else: 
        raise Exception("channelsout needs to be an integer or 'auto'") 
   else:
     if args['channelsout'] < 1:
        print('channelsout',  args['channelsout'])
        raise Exception("channelsout needs to be a positive integer") 
   
   if type(args['fitspectralpol']) is str:
     if args['fitspectralpol'] == 'auto':
        args['fitspectralpol'] = set_fitspectralpol(args['channelsout'])
     else: 
        raise Exception("channelsout needs to be an integer or 'auto'") 
        
        
   return longbaseline, LBA, HBAorLBA, freq, automask, fitsmask, \
          maskthreshold_selfcalcycle, outtarname, telescope, args


def get_phasediff_score(h5, station=False):
        """
        Calculate score for phasediff

        :return: circular standard deviation score
        """
        from scipy.stats import circstd
        H = tables.open_file(h5)

        stations = [make_utf8(s) for s in list(H.root.sol000.antenna[:]['name'])]

        if not station:
            stations_idx = [stations.index(stion) for stion in stations if
                            ('RS' not in stion) &
                            ('ST' not in stion) &
                            ('CS' not in stion) &
                            ('DE' not in stion)]
        else:
            stations_idx = [stations.index(station)]

        axes = str(H.root.sol000.phase000.val.attrs["AXES"]).replace("b'", '').replace("'", '').split(',')
        axes_idx = sorted({ax: axes.index(ax) for ax in axes}.items(), key=lambda x: x[1], reverse=True)

        phase = H.root.sol000.phase000.val[:] * H.root.sol000.phase000.weight[:]
        H.close()

        phasemod = phase % (2 * np.pi)

        for ax in axes_idx:
            if ax[0] == 'pol':  # YX should be zero
                phasemod = phasemod.take(indices=0, axis=ax[1])
            elif ax[0] == 'dir':  # there should just be one direction
                if phasemod.shape[ax[1]] == 1:
                    phasemod = phasemod.take(indices=0, axis=ax[1])
                else:
                    sys.exit('ERROR: This solution file should only contain one direction, but it has ' +
                             str(phasemod.shape[ax[1]]) + ' directions')
            elif ax[0] == 'freq':  # faraday corrected
                phasemod = np.diff(phasemod, axis=ax[1])
            elif ax[0] == 'ant':  # take only international stations
                phasemod = phasemod.take(indices=stations_idx, axis=ax[1])

        phasemod[phasemod == 0] = np.nan

        return circstd(phasemod, nan_policy='omit')


def compute_phasediffstat(mslist, args, nchan='1953.125kHz', solint='10min'):
    """
    Compute phasediff statistics using circular standard deviations on the solutions of a scalarphasediff solve for
    international stations.

    The procedure and rational is described in Section 3.3 of de Jong et al. (2024)

    :param mslist: list of measurement sets
    :param args: input arguments
    :param nchan: n channels
    :param solint: solution interval
    """

    from source_selection.phasediff_output import GetSolint
   
    mslist_input = mslist[:] # make a copy

    # Verify if we are in circular pol basis and do beam correction
    for ms in mslist:
        beamcor_and_lin2circ(ms, dysco=args['dysco'], \
                           beam=set_beamcor(ms, args['beamcor']), \
                           lin2circ=True,
                           losotobeamlib=args['losotobeamcor_beamlib'])

    # Phaseup if needed
    if args['phaseupstations']:
        mslist = phaseup(mslist,datacolumn='DATA',superstation=args['phaseupstations'], \
                       dysco=args['dysco'])
   
    # Solve and get best solution interval
    for ms_id, ms in enumerate(mslist):
        scorelist = []
        parmdb = 'phasediffstat' + '_' + os.path.basename(ms) + '.h5'
        runDPPPbase(ms, str(solint) + 'min', nchan, parmdb, 'scalarphasediff', uvminscalarphasediff=0.0,\
                   dysco=args['dysco'])

        # Get the statistic
        score = get_phasediff_score(parmdb)
        scorelist.append(score)
        print('phasediff score', score, ms)
        logger.info('phasediff score: ' +str(score) + '   ' +  ms)

        # Reference solution interval
        ref_solint = solint

        # Write to STAT SCORE to original MS DATA-col header mslist_input
        t = pt.table(mslist_input[ms_id],  readonly=False)
        t.putcolkeyword('DATA', 'SCALARPHASEDIFF_STAT', score)
        t.close()

        print(scorelist)

        # Set optimal std score
        optimal_score = 1.75

        if type(ref_solint) == str:
            if 'min' in ref_solint:
                ref_solint = float(re.findall(r'-?\d+', ref_solint)[0])
            elif ref_solint[-1]=='s' or ref_solint[-1]=='sec':
                ref_solint = float(re.findall(r'-?\d+', ref_solint)[0])//60
            else:
                sys.exit("ERROR: ref_solint needs to be a float with solution interval in minutes "
                         "or string ending on min (minutes) or s/sec (seconds)")

        S = GetSolint(parmdb, optimal_score=optimal_score, ref_solint=ref_solint)

        print(solint, S.best_solint, S.ref_solint, S.optimal_score)

        S.plot_C("T=" + str(round(S.best_solint, 2)) + " min",  ms + '_phasediffscore.png')
   
    return

def multiscale_trigger(fitsmask, args):
   # update multiscale cleaning setting if allowed/requested
   multiscale = args['multiscale']
   if args['update_multiscale'] and fitsmask is not None:
      print('Size largest island [pixels]:', getlargestislandsize(fitsmask))
      logger.info('Size largest island [pixels]:' + str(getlargestislandsize(fitsmask)))
      if getlargestislandsize(fitsmask) > 1000:
         logger.info('Triggering multiscale clean')
         multiscale = True
   return multiscale

def update_uvmin(fitsmask, longbaseline, args, LBA):
   # update uvmin if allowed/requested
   if args['stack']:
      return args['uvmin']  
   uvmin = args['uvmin']
   if not longbaseline and args['update_uvmin'] and fitsmask is not None:
      if getlargestislandsize(fitsmask) > 1000:
         print('Size of largest island [pixels]:', getlargestislandsize(fitsmask))
         logger.info('Size of largest island [pixels]:' + str(getlargestislandsize(fitsmask)))
         if not LBA:
            print('Extended emission found, setting uvmin to 750 klambda')
            logger.info('Extended emission found, setting uvmin to 750 klambda')
            args['uvmin'] = 750
         else:
            print('Extended emission found, setting uvmin to 250 klambda')
            logger.info('Extended emission found, setting uvmin to 250 klambda')
            args['uvmin'] = 250
   return uvmin  

def update_fitsmask(fitsmask, maskthreshold_selfcalcycle, selfcalcycle, args, mslist):
   # MAKE MASK IF REQUESTED
   fitsmask_list = []
   for msim_id, mslistim in enumerate(nested_mslistforimaging(mslist, stack=args['stack'])):
      if args['stack']:
         stackstr= '_stack' + str(msim_id).zfill(2)
      else:
         stackstr='' # empty string
   
      # set imagename
      if args['imager'] == 'WSCLEAN':
          if args['idg']:
            imagename  = args['imagename'] + str(selfcalcycle).zfill(3) + stackstr + '-MFS-image.fits'
          else:
            imagename  = args['imagename'] + str(selfcalcycle).zfill(3) + stackstr + '-MFS-image.fits'
      if args['imager'] == 'DDFACET':
          imagename  = args['imagename'] + str(selfcalcycle).zfill(3) + stackstr + '.app.restored.fits'
      if args['channelsout'] == 1: # strip MFS from name if no channels images present
          imagename = imagename.replace('-MFS', '').replace('-I','')

      # check if we need/can do masking & mask
      if args['fitsmask'] is None:     
          if maskthreshold_selfcalcycle[selfcalcycle] > 0.0:
            cmdm  = 'MakeMask.py --Th='+ str(maskthreshold_selfcalcycle[selfcalcycle]) + \
                    ' --RestoredIm=' + imagename
            if fitsmask is not None:
                if os.path.isfile(imagename + '.mask.fits'):
                  os.system('rm -f ' + imagename + '.mask.fits')
            run(cmdm)
            fitsmask = imagename + '.mask.fits'
            fitsmask_list.append(fitsmask)
          else:
            fitsmask = None # no masking requested as args['maskthreshold'] less/equal 0
            fitsmask_list.append(fitsmask)
      else:
        fitsmask_list.append(fitsmask)  
   return fitsmask, fitsmask_list, imagename

def set_fitsmask_restart(args, i, mslist):
   fitsmask_list = []
   for msim_id, mslistim in enumerate(nested_mslistforimaging(mslist, stack=args['stack'])):
      if args['stack']:
         stackstr= '_stack' + str(msim_id).zfill(2)
      else:
         stackstr='' # empty string
   
      if args['idg']:
        if os.path.isfile(args['imagename'] + str(i-1).zfill(3) + stackstr + '-MFS-image.fits.mask.fits'):
          fitsmask = args['imagename'] + str(i-1).zfill(3)+ stackstr + '-MFS-image.fits.mask.fits'
      else:
        if args['imager'] == 'WSCLEAN':
          if os.path.isfile(args['imagename'] + str(i-1).zfill(3) + stackstr + '-MFS-image.fits.mask.fits'):
            fitsmask = args['imagename'] + str(i-1).zfill(3)+ stackstr + '-MFS-image.fits.mask.fits'
        if args['imager'] == 'DDFACET':
          if os.path.isfile(args['imagename'] + str(i-1).zfill(3) + stackstr + '.app.restored.fits'):
            fitsmask = args['imagename'] + str(i-1).zfill(3) + stackstr + '.app.restored.fits.mask.fits'
      if args['channelsout'] == 1:
        if args['imager'] == 'WSCLEAN':
            fitsmask = args['imagename'] + str(i-1).zfill(3)+ stackstr + '-MFS-image.fits.mask.fits'
        if args['imager'] == 'DDFACET':
            fitsmask = args['imagename'] + str(i-1).zfill(3) + stackstr + '.app.restored.fits.mask.fits'
        fitsmask = fitsmask.replace('-MFS', '').replace('-I','')
      
      fitsmask_list.append(fitsmask)
   return fitsmask, fitsmask_list

def create_Ateam_seperation_plots(mslist, start=0):
   '''
   Create Ateam and Sun, Moon, Jupiter seperation plots
   input: mslist (list), list of MS
   '''
   if start != 0:
      return  
   for ms in mslist:
      outputname = 'Ateam_' + ms + '.png'
      run('check_Ateam_separation.py --outputimage=' + outputname + ' ' + ms)
   return
   
   
def nested_mslistforimaging(mslist, stack=False):
   if not stack:
      return [mslist] # has format [[ms1.ms,ms2.ms,....]]
   else:
      mslistreturn = []
      for ms in mslist:
         mslistreturn.append([ms])
      return mslistreturn # has format [[ms1.ms],[ms2.ms],[...]] 

def mslist_return_stack(mslist, stack):
   if stack:
      return mslist
   else:
      return [mslist[0]] # just the first one

def set_skymodels_external_surveys(args, mslist):
   # Make starting skymodel from TGSS, VLASS, or LOFAR/LINC GSM if requested
   skymodel_list = []
   tgssfitsfile = None
   # --- TGSS ---
   for mstmp_id, mstmp in enumerate(mslist_return_stack(mslist, args['stack'])):
     if args['startfromtgss'] and args['start'] == 0:
       if args['skymodel'] is None:
         tmpskymodel, tgssfitsfile = makeBBSmodelforTGSS(args['boxfile'],\
                                         fitsimage = args['tgssfitsimage'], \
                                         pixelscale=args['pixelscale'], \
                                         imsize=args['imsize'], ms=mstmp, extrastrname=str(mstmp_id))
         skymodel_list.append(tmpskymodel)
       else:
         print('You cannot provide a skymodel/skymodelpointsource file manually while using --startfromtgss')
         raise Exception('You cannot provide a skymodel/skymodelpointsource manually while using --startfromtgss')

   # --- VLASS ---
   for mstmp_id, mstmp in enumerate(mslist_return_stack(mslist, args['stack'])):
     if args['startfromvlass'] and args['start'] == 0:
       if args['skymodel'] is None and args['skymodelpointsource'] is None:
         run('python vlass_search.py '+ mstmp)
         skymodel_list.append(makeBBSmodelforVLASS('vlass_poststamp.fits', extrastrname=str(mstmp_id)))
       else:
         print('You cannot provide a skymodel/skymodelpointsource manually while using --startfromvlass')
         raise Exception('You cannot provide a skymodel/skymodelpointsource manually while using --startfromvlass')

   # --- GSM ---
   for mstmp_id, mstmp in enumerate(mslist_return_stack(mslist, args['stack'])):
     if args['startfromgsm'] and args['start'] == 0:
       if args['skymodel'] is None and args['skymodelpointsource'] is None:
         skymodel_list.append(getGSM(mstmp, SkymodelPath='gsm'+str(mstmp_id)+'.skymodel', Radius=str(args['pixelscale']*args['imsize']/3600.)))
       else:
         print('You cannot provide a skymodel/skymodelpointsource manually while using --startfromgsm')
         raise Exception('You cannot provide a skymodel/skymodelpointsource manually while using --startfromgsm')

   # note if skymodel_list is not set (len==0), args['skymodel'] keeps it value from argparse
   if len(skymodel_list) > 1: # so startfromtgss or startfromvlass was done and --stack was true
      args['skymodel'] = skymodel_list
   if len(skymodel_list) == 1:  # so startfromtgss or startfromvlass was done
      args['skymodel'] = skymodel_list[0] # make string again, not a list type
   print(args['skymodel'])

   return args, tgssfitsfile   


###############################
############## MAIN ###########
###############################

def main():
   
   # flagms_startend('P217+57_object.dysco.sub.shift.avg.weights.ms.archive0','tecandphase0_selfcalcyle1_P217+57_object.dysco.sub.shift.avg.weights.ms.archive0.h5',1)
   # sys.exit()

   parser = argparse.ArgumentParser(description='Self-Calibrate a facet from a LOFAR observation')

   imagingparser = parser.add_argument_group("-------------------------Imaging Settings-------------------------")
   # Imaging settings
   imagingparser.add_argument('--imager', help="Imager to use WSClean or DDFACET. The default is WSCLEAN.", default='WSCLEAN', type=str)
   imagingparser.add_argument('-i','--imagename', help='Prefix name for image. This is by default "image".', default='image', type=str)
   imagingparser.add_argument('--imsize', help='Image size, required if boxfile is not used. The default is None.', type=int)
   imagingparser.add_argument('-n', '--niter', help='Number of iterations. This is computed automatically if None.', default=None, type=int)
   imagingparser.add_argument('--maskthreshold', help="Mask noise thresholds used from image 1 to 10 made by MakeMask.py. This is by default [5.0,4.5,4.5,4.5,4.0].", default=[5.0,4.5,4.5,4.5,4.0], type=arg_as_list)
   imagingparser.add_argument('--localrmswindow', help="local-rms-window parameter for automasking in WSClean (in units of psfs), default=0 (0 means it is not used; suggested value 50)", default=0, type=int)
   imagingparser.add_argument('--removenegativefrommodel', help="Remove negative clean components in model predict. This is by default turned off at selfcalcycle 2. See also option autoupdate-removenegativefrommodel.", type=ast.literal_eval, default=True)
   imagingparser.add_argument('--autoupdate-removenegativefrommodel', help="Turn off removing negative clean components at selfcalcycle 2 (for high dynamic range imaging it is better to keep all clean components). The default is True.", type=ast.literal_eval, default=True)
   imagingparser.add_argument('--fitsmask', help='Fits mask for deconvolution (needs to match image size). If this is not provided automasking is used in combination with MakeMask.py. If set to "nofitsmask" then only WSCLean auto-masking is used', type=str)
   imagingparser.add_argument('--robust', help='Briggs robust parameter for imagaging. The default is -0.5. Also allowed are the strings uniform or naturual which will override Briggs weighting.', default=-0.5, type=str_or_float)
   imagingparser.add_argument('--multiscale-start', help='Start multiscale deconvolution at this selfcal cycle. This is by default 1.', default=1, type=int)

   imagingparser.add_argument('--uvminim', help='Inner uv-cut for imaging in lambda. The default is 80 for LOFAR and 10 for all other', type=floatlist_or_float)
   imagingparser.add_argument('--uvmaxim', help='Outer uv-cut for imaging in lambda. The default is None', default=None, type=floatlist_or_float)
   imagingparser.add_argument('--pixelscale','--pixelsize', help='Pixels size in arcsec. Typically, 3.0 for LBA and 1.5 for HBA for the Dutch stations (these are also the default values). For MeerKAT the defaults are 1.8, 1.0, 0.5 for UHF-, L-, and S-band, repspectively.', type=float)
   imagingparser.add_argument('--channelsout', help='Number of channelsout during imaging (see WSClean documentation). The default is to set it automatically.', default='auto', type=str_or_int)
   imagingparser.add_argument('--multiscale', help='Use multiscale deconvolution (see WSClean documentation).', action='store_true')
   imagingparser.add_argument('--multiscalescalebias', help='Multiscalescale bias scale parameter for WSClean (see WSClean documentation). This is by default 0.75.', default=0.75, type=float)
   imagingparser.add_argument('--multiscalemaxscales', help='Multiscalescale max scale parameter for WSClean (see WSClean documentation). Default 0 (means set automatically).', default=0, type=int)

   imagingparser.add_argument("--update-channelsout", help='Change --channelsout automatically if there is high peak flux.', action='store_true')
   imagingparser.add_argument("--update-fitspectralpol", help='Change --fitspectralpol automatically if there is high peak flux.', action='store_true')
   
   imagingparser.add_argument('--paralleldeconvolution', help="Parallel-deconvolution size for WSCLean (see WSClean documentation). This is by default 0 (no parallel deconvolution). Suggested value for very large images is about 2000.", default=0, type=int)
   imagingparser.add_argument('--parallelgridding', help="Parallel-gridding for WSClean (see WSClean documentation). This is by default 1.", default=1, type=int)
   imagingparser.add_argument('--deconvolutionchannels', help="Deconvolution channels value for WSClean (see WSClean documentation). This is by default 0 (means deconvolution-channels equals channels-out).", default=0, type=int)
   imagingparser.add_argument('--idg', help="Use the Image Domain gridder (see WSClean documentation).", action='store_true')
   imagingparser.add_argument('--fitspectralpol', help="Use fit-spectral-pol in WSClean (see WSClean documentation) with this order. The default is to set it automatically. fit-spectral-pol can be disabled by setting it to a value less than 1", default='auto', type=str_or_int)
   imagingparser.add_argument('--ddpsfgrid', help="Value for option -dd-psf-grid with WSClean (integer, by default this value is not set and the option is not used", type=int)
   

   imagingparser.add_argument("--gapchanneldivision", help='Use the -gap-channel-division option in wsclean imaging and predicts (default is not to use it)', action='store_true')
   imagingparser.add_argument('--taperinnertukey', help="Value for taper-inner-tukey in WSClean (see WSClean documentation), useful to supress negative bowls when using --uvminim. Typically values between 1.5 and 4.0 give good results. The default is None.", default=None, type=float)
   imagingparser.add_argument('--makeimage-ILTlowres-HBA', help='Make 1.2 arcsec tapered image as quality check of ILT 1 arcsec imaging.', action='store_true')
   imagingparser.add_argument('--makeimage-fullpol', help='Make Stokes IQUV version for quality checking.', action='store_true')
   imagingparser.add_argument('--groupms-h5facetspeedup', help='Speed up DDE imaging with h5s', action='store_true')
   

   calibrationparser = parser.add_argument_group("-------------------------Calibration Settings-------------------------")
   # Calibration options
   calibrationparser.add_argument('--avgfreqstep', help="Extra DP3 frequency averaging to speed up a solve. This is done before any other correction and could be useful for long baseline infield calibrators. Allowed are integer values or for example '195.3125kHz'; options for units: 'Hz', 'kHz', or 'MHz'. The default is None.", type=str_or_int, default=None)
   calibrationparser.add_argument('--avgtimestep', help="Extra DP3 time averaging to speed up a solve. This is done before any other correction and could be useful for long baseline infield calibrators. Allowed are integer values or for example '16.1s'; options for units: 's' or 'sec'. The default is None.", type=str_or_int, default=None)
   calibrationparser.add_argument('--msinnchan', help="Before averaging, only take this number of input channels. The default is None.", type=int, default=None)
   calibrationparser.add_argument('--msinstartchan', help="Before averaging, start channel for --msinnchan. The default is 0. ", type=int, default=0)
   calibrationparser.add_argument('--msinntimes', help="DP3 msin.ntimes setting. This is mainly used for testing purposes. The default is None.", type=int, default=None)
   calibrationparser.add_argument('--autofrequencyaverage-calspeedup', help="Update April 24: Avoid usage because of corrupt vs correct. Try extra averaging during some selfcalcycles to speed up calibration.", action='store_true')
   calibrationparser.add_argument('--autofrequencyaverage', help='Try frequency averaging if it does not result in bandwidth smearing',  action='store_true')

   calibrationparser.add_argument('--phaseupstations', help="Phase up to a superstation. Possible input: 'core' or 'superterp'. The default is None.", default=None, type=str)
   calibrationparser.add_argument('--phaseshiftbox', help="DS9 region file to shift the phasecenter to. This is by default None.", default=None, type=str)
   calibrationparser.add_argument('--weightspectrum-clipvalue', help="Extra option to clip WEIGHT_SPECTRUM values above the provided number. Use with care and test first manually to see what is a fitting value. The default is None.", type=float, default=None)
   calibrationparser.add_argument('-u', '--uvmin', help="Inner uv-cut for calibration in lambda. The default is 80 for LBA and 350 for HBA.", type=floatlist_or_float, default=None)
   calibrationparser.add_argument('--uvmax', help="Outer uv-cut for calibration in lambda. The default is None", type=floatlist_or_float, default=None)   
   calibrationparser.add_argument('--uvminscalarphasediff', help='Inner uv-cut for scalarphasediff calibration in lambda. The default is equal to input for --uvmin.', type=float, default=None)
   calibrationparser.add_argument("--update-uvmin", help='Update uvmin automatically for the Dutch array.', action='store_true')
   calibrationparser.add_argument("--update-multiscale", help='Switch to multiscale automatically if large islands of emission are present.', action='store_true')
   calibrationparser.add_argument("--soltype-list", type=arg_as_list, default=['tecandphase','tecandphase','scalarcomplexgain'], help="List with solution types. Possible input: 'complexgain', 'scalarcomplexgain', 'scalaramplitude', 'amplitudeonly', 'phaseonly', 'fulljones', 'rotation', 'rotation+diagonal', 'rotation+diagonalphase','rotation+diagonalamplitude',                   'rotation+scalar','rotation+scalaramplitude','rotation+scalarphase', 'tec', 'tecandphase', 'scalarphase', 'scalarphasediff', 'scalarphasediffFR', 'phaseonly_phmin', 'rotation_phmin', 'tec_phmin', 'tecandphase_phmin', 'scalarphase_phmin', 'scalarphase_slope', 'phaseonly_slope'. The default is [tecandphase,tecandphase,scalarcomplexgain].")
   calibrationparser.add_argument("--solint-list", type=check_strlist_or_intlist, default=[1,1,120], help="Solution interval corresponding to solution types (in same order as soltype-list input). The default is [1,1,120].")
   calibrationparser.add_argument("--nchan-list", type=arg_as_list, default=[1,1,10], help="Number of channels corresponding to solution types (in same order as soltype-list input). The default is [1,1,10].")
   calibrationparser.add_argument("--smoothnessconstraint-list", type=arg_as_list, default=[0.,0.,5.], help="List with frequency smoothness values (in same order as soltype-list input). The default is [0.,0.,5.].")
   calibrationparser.add_argument("--smoothnessreffrequency-list", type=arg_as_list, default=[0.,0.,0.], help="List with optional reference frequencies (in MHz) for the smoothness constraint (in same order as soltype-list input). When unequal to 0, the size of the smoothing kernel will vary over frequency by a factor of smoothnessreffrequency*(frequency^smoothnessspectralexponent). The default is [0.,0.,0.].")
   calibrationparser.add_argument("--smoothnessspectralexponent-list", type=arg_as_list, default=[-1.,-1.,-1.], help="If smoothnessreffrequency is not equal to zero then this parameter determines the frequency scaling law. It is typically useful to take -2 for scalarphasediff, otherwise -1 (1/nu). The default is [-1.,-1.,-1.].")
   calibrationparser.add_argument("--smoothnessrefdistance-list", type=arg_as_list, default=[0.,0.,0.], help="If smoothnessrefdistance is not equal to zero then this parameter determines the freqeuency smoothness reference distance in units of km, with the smoothness scaling with distance. See DP3 documentation. The default is [0.,0.,0.].")
   calibrationparser.add_argument("--antennaconstraint-list", type=arg_as_list, default=[None,None,None], help="List with constraints on the antennas used (in same order as soltype-list input). Possible input: 'superterp', 'coreandfirstremotes', 'core', 'remote', 'distantremote', 'all', 'international', 'alldutch', 'core-remote', 'coreandallbutmostdistantremotes, alldutchandclosegerman', 'alldutchbutnoST001'. The default is [None,None,None].")
   calibrationparser.add_argument("--resetsols-list", type=arg_as_list, default=[None,None,None], help="Values of these stations will be rest to 0.0 (phases), or 1.0 (amplitudes), default None, possible settings are the same as for antennaconstraint-list (alldutch, core, etc)). The default is [None,None,None].")
   calibrationparser.add_argument("--resetdir-list", type=arg_as_list, default=[None,None,None], help="Values of these directions will be rest to 0.0 (phases), or 1.0 (amplitudes) for DDE solves. The default is [None,None,None]. It requires --facetdirections being set a user defined direction list so the directions are known. An example would be '[None,[1,4],None]', meaning that directions 1 and 4 are being reset, counting starts at zero in the second solve in the pertubation list.")
   calibrationparser.add_argument("--soltypecycles-list", type=arg_as_list, default=[0,999,3], help="Selfcalcycle where step from soltype-list starts. The default is [0,999,3].")

   calibrationparser.add_argument("--BLsmooth-list", type=arg_as_list, default=[False,False,False], help="Employ BLsmooth, this is a list of length soltype-list. For example --BLsmooth-list='[True, False,True]'. Default is all False.")
   calibrationparser.add_argument('--dejumpFR', help='Dejump Faraday solutions when using scalarphasediffFR.', action='store_true')
   calibrationparser.add_argument('--usemodeldataforsolints', help='Determine solints from MODEL_DATA.', action='store_true')
   calibrationparser.add_argument("--preapplyH5-list", type=arg_as_list, default=[None], help="Update April 2024: Avoid usage because of corrupt vs correct. List of H5 files to preapply (one for each MS). The default is [None].")
   calibrationparser.add_argument('--normamps', help='Normalize global amplitudes to 1.0. The default is True (False if fulljones is used). Note that if set to False --normamps-list is ignored.', type=ast.literal_eval, default=True)
   calibrationparser.add_argument('--normampsskymodel', help='Normalize global amplitudes to 1.0 when solving against an external skymodel. The default is False (turned off if fulljones is used). Note that this parameter is False (the default) --normamps-list is ignored for the solve against the skymodel', type=ast.literal_eval, default=False)
   #calibrationparser.add_argument('--normamps-per-ms', help='Normalize amplitudes to 1.0 for each MS separately, by default this is not done', action='store_true')

   calibrationparser.add_argument("--normamps-list", type=arg_as_list, default=['normamps','normamps','normamps'], help="List with amplitude normalization options. Possible input: 'normamps', 'normslope', 'normamps_per_ant, 'normslope+normamps', 'normslope+normamps_per_ant', or None. The default is [normamps,normamps,normamps,etc]. Only has an effect if the corresponding soltype outputs and amplitude000 table (and is not fulljones).")
   
   # calibrationparser.add_argument("--applydelaycalH5-list", type=arg_as_list, default=[None], help="List of H5 files from the delay calibrator, one per ms")
   # calibrationparser.add_argument("--applydelaytype", type=str, default='circular', help="Options: circular or linear. If --docircular was used for finding the delay solutions use circular (the default)")
   # Expert settings
   calibrationparser.add_argument('--tecfactorsolint', help='Experts only.', type=float, default=1.0)
   calibrationparser.add_argument('--gainfactorsolint', help='Experts only.', type=float, default=1.0)
   calibrationparser.add_argument('--phasefactorsolint', help='Experts only.', type=float, default=1.0)
   calibrationparser.add_argument('--compute-phasediffstat', help='Experts only: Get phasediff statistics for long-baseline calibrator dataset (see de Jong et al. 2024)',  action='store_true')
   calibrationparser.add_argument('--get-diagnostics', help='Experts only: With this functionality you can get a prediction which selfcal cycle gives the highest quality output (works only when >5 selfcal cycle)', action='store_true')
   calibrationparser.add_argument('--QualityBasedWeights', help='Experts only.',  action='store_true')
   calibrationparser.add_argument('--QualityBasedWeights-start', help='Experts only.',  type=int, default=5)
   calibrationparser.add_argument('--QualityBasedWeights-dtime', help='QualityBasedWeights timestep in units of minutes (default 5)',  type=float, default=5.0)
   calibrationparser.add_argument('--QualityBasedWeights-dfreq', help='QualityBasedWeights frequency in units of MHz (default 5)',  type=float, default=5.0)
   calibrationparser.add_argument('--ncpu-max-DP3solve', help='Maximum number of threads for DP3 solves, default=64 (too high value can result in BLAS errors)', type=int, default=64)
   calibrationparser.add_argument('--DDE', help='Experts only.',  action='store_true')
   calibrationparser.add_argument('--Nfacets', help='Number of directions to solve into when --DDE is used. Directions are found automatically. Only used if --facetdirections is not set. Keep to default (=0) if you want to use --targetFlux instead', type=int, default=0)
   calibrationparser.add_argument('--targetFlux', help='targetFlux in Jy for groupalgorithm to create facet directions when --DDE is set (default = 2.0). Directions are found automatically. Only used if --facetdirections is not set. Ignored when --NFacets is set to > 0', type=float, default=2.0)
   calibrationparser.add_argument('--facetdirections', help='Experts only. ASCII csv file containing facet directions. File needs two columns with decimal degree RA and Dec. Default is None.', type=str, default=None)
   calibrationparser.add_argument('--DDE-predict', help='Type of DDE predict to use. Options: DP3 or WSCLEAN, default=WSCLEAN (note: option WSCLEAN will use a lot of disk space as there is one MODEL column per direction written to the MS)', type=str, default='WSCLEAN')
   #calibrationparser.add_argument('--disable-IDG-DDE-predict', help='Normally, if LOFAR data is detected the WSCLean predict of the facets will use IDG, setting this option turns it off and predicts the apparent model with wridding (facet mode is never used here in these predicts). For non-LOFAR data the predicts uses the apparent model with wridding. Note: if the primary beam is not time varying and scalar then using the apparent model is fully accurate.', action='store_true')
   calibrationparser.add_argument('--disable-primary-beam', help='For WSCLEAN imaging and predicts disable the primary beam corrections (so run with "apparent" images only)', action='store_true')
   

   blsmoothparser = parser.add_argument_group("-------------------------BLSmooth Settings-------------------------")
   # BLsmooth settings
   blsmoothparser.add_argument("--iontimefactor", help='BLsmooth ionfactor. The default is 0.01. Larger is more smoothing (see BLsmooth documentation).', type=float, default=0.01)
   blsmoothparser.add_argument("--ionfreqfactor", help='BLsmooth tecfactor. The default is 1.0. Larger is more smoothing (see BLsmooth documentation).', type=float, default=1.0)
   blsmoothparser.add_argument("--blscalefactor", help='BLsmooth blscalefactor. The default is 1.0 (see BLsmooth documentation).', type=float, default=1.0)
   blsmoothparser.add_argument('--blsmooth_chunking_size', type=int, help='Chunking size for blsmooth. Larger values are slower but save on memory, lower values are faster. The default is 8.',default=8)

   flaggingparser = parser.add_argument_group("-------------------------Flagging Settings-------------------------")
   # Flagging options
   flaggingparser.add_argument('--doflagging', help='Flag on complexgain solutions via rms outlier detection (True/False, default=True). The default is True (will be set to False if --forwidefield is set).', type=ast.literal_eval, default=True)
   flaggingparser.add_argument('--clipsolutions', help='Flag amplitude solutions above --clipsolhigh and below  --clipsollow (will be set to False if --forwidefield is set).', action='store_true')
   flaggingparser.add_argument('--clipsolhigh', help='Flag amplitude solutions above this value, only done if --clipsolutions is set.', default=1.5, type=float)
   flaggingparser.add_argument('--clipsollow', help='Flag amplitude solutions below this value, only done if --clipsolutions is set.', default=0.667, type=float)
   flaggingparser.add_argument('--restoreflags', help='Restore flagging column after each selfcal cycle, only relevant if --doflagging=True.', action='store_true')
   flaggingparser.add_argument('--remove-flagged-from-startend', help='Remove flagged time slots at the start and end of an observations. Do not use if you want to combine DD solutions later for widefield imaging.', action='store_true')
   flaggingparser.add_argument('--flagslowamprms', help='RMS outlier value to flag on slow amplitudes. The default is 7.0.', default=7.0, type=float)
   flaggingparser.add_argument('--flagslowphaserms', help='RMS outlier value to flag on slow phases. The default 7.0.', default=7.0, type=float)
   flaggingparser.add_argument('--doflagslowphases', help='If solution flagging is done also flag outliers phases in the slow phase solutions. The default is True.', type=ast.literal_eval, default=True)
   flaggingparser.add_argument('--useaoflagger', help='Run AOflagger on input data.', action='store_true')
   flaggingparser.add_argument('--aoflagger-strategy', help='Use this strategy for AOflagger (options are: "default_StokesV.lua", "LBAdefaultwideband.lua")', default=None, type=str)
   flaggingparser.add_argument('--useaoflaggerbeforeavg', help='Flag with AOflagger before (True) or after averaging (False). The default is True.', type=ast.literal_eval, default=True)
   flaggingparser.add_argument('--flagtimesmeared', help='Flag data that is severely time smeared. Warning: expert only', action='store_true')
   flaggingparser.add_argument('--removeinternational', help='Remove the international stations if present', action='store_true')
   flaggingparser.add_argument('--removemostlyflaggedstations', help='Remove the staions that have a flaging percentage above 85 percent', action='store_true')
      
   startmodelparser = parser.add_argument_group("-------------------------Starting model Settings-------------------------")
   # Startmodel
   startmodelparser.add_argument('--skymodel', help='Skymodel for first selfcalcycle. The default is None.', type=arg_as_str_or_list)
   startmodelparser.add_argument('--skymodelsource', help='Source name in skymodel. The default is None (means the skymodel only contains one source/patch).', type=str)
   startmodelparser.add_argument('--skymodelpointsource', help='If set, start from a point source in the phase center with the flux density given by this parameter. The default is None (means do not use this option).', type=arg_as_float_or_list, default=None)
   startmodelparser.add_argument('--wscleanskymodel', help='WSclean basename for model images (for a WSClean predict). The default is None.', type=arg_as_str_or_list, default=None)   
   startmodelparser.add_argument('--predictskywithbeam', help='Predict the skymodel with the beam array factor.', action='store_true')
   startmodelparser.add_argument('--startfromtgss', help='Start from TGSS skymodel for positions (boxfile required).', action='store_true')
   startmodelparser.add_argument('--startfromvlass', help='Start from VLASS skymodel for ILT phase-up core data.', action='store_true')
   startmodelparser.add_argument('--startfromgsm', help='Start from LINC GSM skymodel.', action='store_true')
   startmodelparser.add_argument('--tgssfitsimage', help='Start TGSS fits image for model (if not provided use SkyView). The default is None.', type=str)

   # General options
   parser.add_argument('-b','--boxfile', help='DS9 box file. You need to provide a boxfile to use --startfromtgss. The default is None.', type=str)
   parser.add_argument('--beamcor', help='Correct the visibilities for beam in the phase center, options: yes, no, auto (default is auto, auto means beam is taken out in the curent phase center, tolerance for that is 10 arcsec)', type=str, default='auto')
   parser.add_argument('--losotobeamcor-beamlib', help="Beam library to use when not using DP3 for the beam correction. Possible input: 'stationresponse', 'lofarbeam' (identical and deprecated). The default is 'stationresponse'.", type=str, default='stationresponse')
   parser.add_argument('--docircular', help='Convert linear to circular correlations.', action='store_true')
   parser.add_argument('--dolinear', help='Convert circular to linear correlations.', action='store_true')
   parser.add_argument('--forwidefield', help='Keep solutions such that they can be used for widefield imaging/screens.', action='store_true')
   parser.add_argument('--remove-outside-center', help='Subtract sources that are outside the central parts of the FoV, square box is used with sizes of 3.0, 2.0, 1.5 degr for MeerKAT UHF, L, and S-band, repspectively. In case you want something else set --remove-outside-center-box', action='store_true')
   parser.add_argument('--remove-outside-center-box', help='User defined box to subtract sources that are outside this part of the image. If not set boxsize is set automatically. If "keepall" is set then no subtract is done and everything is kept, this is mainly useful if you are already working on box-extracted data', type=str, default=None)
   parser.add_argument('--single-dual-speedup', help='Speed up calibration and imaging if possible using datause=single/dual in DP3 and -scalar/diagonal-visibilities in WSClean. Requires a recent (mid July 2024) DP3 and WSClean versions. Default is True. Set to --single-dual-speedup=False to disable to speed-up', type=ast.literal_eval, default=True)
   parser.add_argument('--dysco', help='Use Dysco compression. The default is True.', type=ast.literal_eval, default=True)
   parser.add_argument('--resetweights', help='If you want to ignore weight_spectrum_solve.', action='store_true')
   parser.add_argument('--start', help='Start selfcal cycle at this iteration number. The default is 0.', default=0, type=int)
   parser.add_argument('--stop', help='Stop selfcal cycle at this iteration number. The default is 10.', default=10, type=int)
   parser.add_argument('--stopafterskysolve', help='Stop calibration after solving against external skymodel.', action='store_true')
   parser.add_argument('--stopafterpreapply', help='Stop after preapply of solutions', action='store_true')
   parser.add_argument('--noarchive', help='Do not archive the data.', action='store_true')
   parser.add_argument('--skipbackup', help='Leave the original MS intact and work always work on a DP3 copied dataset.', action='store_true')
   parser.add_argument('--phasediff_only', help='For finding only the phase difference, we want to stop after calibrating and before imaging', action='store_true')
   parser.add_argument('--helperscriptspath', help='Path to file location pulled from https://github.com/rvweeren/lofar_facet_selfcal.', default='/net/rijn/data2/rvweeren/LoTSS_ClusterCAL/', type=str)
   parser.add_argument('--helperscriptspathh5merge', help='Path to file location pulled from https://github.com/jurjen93/lofar_helpers.', default=None, type=str)
   parser.add_argument('--configpath', help = 'Path to user config file which will overwrite command line arguments', default = 'facetselfcal_config.txt', type = str)
   parser.add_argument('--auto', help='Trigger fully automated processing (HBA only for now).', action='store_true')
   parser.add_argument('--delaycal', help='Trigger settings suitable for ILT delay calibration, HBA-ILT only - still under construction.', action='store_true')
   parser.add_argument('--targetcalILT', help="Type of automated target calibration for HBA international baseline data when --auto is used. Options are: 'tec', 'tecandphase', 'scalarphase'. The default is 'scalarphase'.", default='scalarphase', type=str)
   parser.add_argument('--stack', help='Stacking of visibility data for multiple sources to increase S/N - still under construction.', action='store_true')


   parser.add_argument('ms', nargs='+', help='msfile(s)')

   options = parser.parse_args()

   # If a config file exists, then read the information. Priotise specified config over default.
   if os.path.isfile(options.configpath):
       config = options.configpath
   else:
       config = "facetselfcal_config.txt"

   if os.path.isfile(config):
       print("A config file (%s) exists, using it. This contains:" % config)
       parser = configparser.ConfigParser()
       # Preserve upper case in options
       parser.optionxform = str
       with open(config) as f:
           parser.read_string("[DEFAULT]\n" + f.read())
       for k, v in parser["DEFAULT"].items():
           print(f"{k} = {v}")
           if k not in vars(options).keys():
               raise KeyError(
                   "Encountered invalid option {:s} in config file {:s}.".format(
                       k, os.path.abspath(config)
                   )
               )
           if os.path.exists(os.path.expanduser(v)):
               setattr(options, k, v)
           else:
               setattr(options, k, ast.literal_eval(v))
   args = vars(options)
   
   if args['stack']:
      args['dysco'] = False # no dysco compression allowed as this the various steps violate the assumptions that need to be valud for proper dysco compression    
      args['noarchive'] = True

   version = '11.3.0'
   print_title(version)

   os.system('cp ' + args['helperscriptspath'] + '/lib_multiproc.py .')
   if args['helperscriptspathh5merge'] is not None:
     os.system('cp ' + args['helperscriptspathh5merge'] + '/h5_merger.py .')
     os.system('cp ' + args['helperscriptspathh5merge'] + '/h5_helpers/overwrite_table.py .')
     os.system('cp ' + args['helperscriptspathh5merge'] + '/h5_helpers/split_h5.py .')
     os.system('mkdir h5_helpers && cp ' + args['helperscriptspathh5merge'] + '/h5_helpers/make_template_h5.py  h5_helpers/')
     sys.path.append(os.path.abspath(args['helperscriptspathh5merge']))
   else:
     os.system('cp ' + args['helperscriptspath'] + '/h5_merger.py .')
     os.system('cp ' + args['helperscriptspath'] + '/overwrite_table.py .')
     os.system('cp ' + args['helperscriptspath'] + '/split_h5.py .')
     os.system('mkdir h5_helpers && cp ' + args['helperscriptspath'] + '/make_template_h5.py h5_helpers/')
     

   global h5_merger
   import h5_merger
   os.system('cp ' + args['helperscriptspath'] + '/plot_tecandphase.py .')
   os.system('cp ' + args['helperscriptspath'] + '/lin2circ.py .')
   os.system('cp ' + args['helperscriptspath'] + '/split_irregular_timeaxis.py .')
   os.system('cp ' + args['helperscriptspath'] + '/BLsmooth.py .')
   os.system('cp ' + args['helperscriptspath'] + '/polconv.py .')
   os.system('cp ' + args['helperscriptspath'] + '/vlass_search.py .')
   os.system('cp ' + args['helperscriptspath'] + '/VLASS_dyn_summary.php .')
   os.system('cp ' + args['helperscriptspath'] + '/ds9facetgenerator.py .')
   os.system('cp ' + args['helperscriptspath'] + '/default_StokesV.lua .')
   os.system('cp ' + args['helperscriptspath'] + '/LBAdefaultwideband.lua .')
   os.system('cp ' + args['helperscriptspath'] + '/MeerKATlayout.csv .')
   
   if args['helperscriptspathh5merge'] is None:  
      check_code_is_uptodate()

   # copy h5s locally
   for h5parm_id, h5parmdb in enumerate(args['preapplyH5_list']):
     if h5parmdb is not None:
       os.system('cp ' + h5parmdb +  ' .') # make them local because source direction will ne updated for merging
       args['preapplyH5_list'][h5parm_id] = h5parmdb.split('/')[-1] # update input list to local location

   # reorder lists based on sorted(args['ms'])    
   if type(args['skymodel']) is list: 
      args['skymodel'] = [x for _, x in sorted(zip(args['ms'],args['skymodel']))]
   if type(args['wscleanskymodel']) is list: 
      args['wscleanskymodel'] = [x for _, x in sorted(zip(args['ms'],args['wscleanskymodel']))]
   if type(args['skymodelpointsource']) is list: 
      args['skymodelpointsource'] = [x for _, x in sorted(zip(args['ms'],args['skymodelpointsource']))]
   mslist = sorted(args['ms'])


   # remove non-ms that ended up in mslist
   # mslist = removenonms(mslist)

   # remove trailing slashes
   mslist_tmp = []
   for ms in mslist:
     mslist_tmp.append(ms.rstrip('/'))
   mslist = mslist_tmp[:] #.copy()

   # remove ms which are too short (to catch Elais-N1 case of 600s of data)
   check_valid_ms(mslist)

   # check if ms channels are equidistant in freuqency (to confirm DP3 concat was used properly)
   check_equidistant_freqs(mslist)
   
   # do some input checking 
   inputchecker(args, mslist)
   
   # TEST ONLY REMOVE
   if False:
     modeldatacolumnsin = ['MODEL_DATA_DD0','MODEL_DATA_DD1','MODEL_DATA_DD2','MODEL_DATA_DD3','MODEL_DATA_DD4']
     soltypenumber = 0
     dirs, solints, soltypelist_includedir = parse_facetdirections(args['facetdirections'],0, args=args)
     modeldatacolumns, sourcedir_removed, id_kept = updatemodelcols_includedir(modeldatacolumnsin, soltypenumber, soltypelist_includedir, mslist[0], dryrun=True)
     #print(len(sourcedir_removed))
     #for ddir in sourcedir_removed:
     sourcedir_removed = sourcedir_removed.tolist()
     print(sourcedir_removed[0])
     print(modeldatacolumns)
     
     copy_over_solutions_from_skipped_directions(modeldatacolumnsin,id_kept)
     merge_splitted_h5_ordered(modeldatacolumnsin, 'test.h5', clean_up=False)
     sys.exit()


   # cut ms if there are flagged times at the start or end of the ms
   if args['remove_flagged_from_startend']:
      mslist = sorted(remove_flagged_data_startend(mslist))

   if not args['skipbackup']: # work on copy of input data as a backup
      print('Creating a copy of the data and work on that....')
      mslist = average(mslist, freqstep=[0]*len(mslist), timestep=1, start=args['start'], \
                       makecopy=True, dysco=args['dysco'])

   # take out bad WEIGHT_SPECTRUM values if weightspectrum_clipvalue is set
   if args['weightspectrum_clipvalue'] is not None:
      fix_bad_weightspectrum(mslist, clipvalue=args['weightspectrum_clipvalue'])

   # extra flagging if requested
   if args['start'] == 0 and args['useaoflagger'] and args['useaoflaggerbeforeavg']:
     runaoflagger(mslist, strategy=args['aoflagger_strategy'])

   # create Ateam plots
   create_Ateam_seperation_plots(mslist, start=args['start'])

   # fix irregular time axes if needed (do this after flaging)
   mslist =fix_equidistant_times(mslist, args['start']!=0, dysco=args['dysco'])
   
   # reset weights if requested
   if args['resetweights']:
     for ms in mslist:
       cmd = "'update " + ms + " set WEIGHT_SPECTRUM=WEIGHT_SPECTRUM_SOLVE'"
       run("taql " + cmd)

   # SETUP VARIOUS PARAMETERS
   longbaseline, LBA, HBAorLBA, freq, automask, fitsmask, maskthreshold_selfcalcycle, \
       outtarname, telescope, args = basicsetup(mslist, args)
 
   # PRE-APPLY SOLUTIONS (from a nearby direction for example)
   # if (args['applydelaycalH5_list'][0]) is not None and  args['start'] == 0:
   #      preapplydelay(args['applydelaycalH5_list'], mslist, args['applydelaytype'], dysco=args['dysco'])

   # check if we could average more
   avgfreqstep = []  # vector of len(mslist) with average values, 0 means no averaging
   for ms in mslist:
      if args['avgfreqstep'] is None and args['autofrequencyaverage'] and not LBA \
        and not args['autofrequencyaverage_calspeedup']: # autoaverage
        avgfreqstep.append(findfreqavg(ms,float(args['imsize'])))
      else:
        if args['avgfreqstep'] is not None:
           avgfreqstep.append(args['avgfreqstep']) # take over handpicked average value
        else:
           avgfreqstep.append(0) # put to zero, zero means no average


   # COMPUTE PHASE-DIFF statistic
   if args['compute_phasediffstat']:
      if longbaseline:
          compute_phasediffstat(mslist, args)
      else:
          logger.info("--compute-phasediffstat requested but no long-baselines in dataset.")

   # set once here, preserve original mslist in case --removeinternational was set
   if args['removeinternational'] is not None:
      # used for h5_merge add_ms_stations option
      mslist_beforeremoveinternational = mslist[:]  #copy by slicing otherwise list refers to original
   else:
      mslist_beforeremoveinternational = None

   # AVERAGE if requested/possible
   mslist = average(mslist, freqstep=avgfreqstep, timestep=args['avgtimestep'], \
                    start=args['start'], msinnchan=args['msinnchan'], msinstartchan=['msinstartchan'],\
                    phaseshiftbox=args['phaseshiftbox'], msinntimes=args['msinntimes'],\
                    dysco=args['dysco'],removeinternational=args['removeinternational'],\
                    removemostlyflaggedstations=args['removemostlyflaggedstations'])


   for ms in mslist:
     compute_distance_to_pointingcenter(ms, HBAorLBA=HBAorLBA, warn=longbaseline, returnval=False)

   # extra flagging if requested
   if args['start'] == 0 and args['useaoflagger'] and not args['useaoflaggerbeforeavg']:
     runaoflagger(mslist, strategy=args['aoflagger_strategy'])

   # compute bandwidth smearing
   t = pt.table(mslist[0] + '/SPECTRAL_WINDOW',ack=False)
   bwsmear = bandwidthsmearing(np.median(t.getcol('CHAN_WIDTH')), np.min(t.getcol('CHAN_FREQ')[0]), float(args['imsize']))
   t.close()


   # backup flagging column for option --restoreflags if needed
   if args['restoreflags']:
     for ms in mslist:
       create_backup_flag_col(ms)

   # LOG INPUT SETTINGS
   logbasicinfo(args, fitsmask, mslist, version, sys.argv)

   # Make starting skymodel from TGSS or VLASS survey if requested
   args, tgssfitsfile = set_skymodels_external_surveys(args, mslist)
   
   nchan_list, solint_list, BLsmooth_list, smoothnessconstraint_list, smoothnessreffrequency_list, \
   smoothnessspectralexponent_list, smoothnessrefdistance_list, \
   antennaconstraint_list, resetsols_list, resetdir_list, soltypecycles_list, \
   uvmin_list, uvmax_list, uvminim_list, uvmaxim_list, normamps_list  = \
                                              setinitial_solint(mslist, longbaseline, LBA, options)


   # Get restoring beam for DDFACET in case it is needed
   restoringbeam = calculate_restoringbeam(mslist, LBA)

   # set once here, will be updated in the loop below if phaseup is requested
   if args['phaseupstations'] is not None:
      # used for h5_merge add_CS option
      mslist_beforephaseup = mslist[:]  # note copy by slicing otherwise list refers to original
   else:
      mslist_beforephaseup = None

   # extra smearing flagging
   if args['flagtimesmeared'] and args['start'] == 0:
      for ms in mslist:  
         flag_smeared_data(ms)
         

   wsclean_h5list = []
   facetregionfile = None
   soltypelist_includedir = None
   modeldatacolumns = []
   if args['stack']:
      fitsmask_list = [None]*len(mslist)
   else:   
      fitsmask_list = [fitsmask] # *len(mslist) last part not needed because of the enumerate(nested_mslistforimaging(mslist, stack=args['stack']))

   if args['groupms_h5facetspeedup'] and args['start'] == 0 and len(mslist) > 1: 
      concat_ms_wsclean_facetimaging(mslist)

   # create facets.reg so we have it avaialble for image000 
   # so that we can use WSClean facet mode, but without having h5 DDE solutions
   if args['facetdirections'] is not None and  args['start'] == 0:
      create_facet_directions(None,0, ms=mslist[0], imsize=args['imsize'], \
	              pixelscale=args['pixelscale'],facetdirections=args['facetdirections'], \
                  args=args)
      facetregionfile = 'facets.reg' # so when making image000 we can use it without having h5 DDE solutions
      
   # ----- START SELFCAL LOOP -----
   for i in range(args['start'],args['stop']):

     # update removenegativefrommodel setting, for high dynamic range it is better to keep negative clean components (based on very clear 3C84 test case)
     if args['autoupdate_removenegativefrommodel'] and i > 1 and not args['DDE']:
        args['removenegativefrommodel'] = False
     if args['autoupdate_removenegativefrommodel'] and args['DDE']: # never remove negative clean components for a DDE solve
        args['removenegativefrommodel'] = False
        
     # AUTOMATICALLY PICKUP PREVIOUS MASK (in case of a restart) and trigger multiscale
     if (i > 0) and (args['fitsmask'] is None):
       fitsmask, fitsmask_list = set_fitsmask_restart(args, i, mslist)
       # update to multiscale cleaning if large island is present
       args['multiscale'] = multiscale_trigger(fitsmask, args)
       # update uvmin if allowed/requested
       args['uvmin'] = update_uvmin(fitsmask, longbaseline, args, LBA)
       # update channelsout
       args['channelsout'] = update_channelsout(args, i-1, mslist)
       # update fitspectralpol
       args['fitspectralpol'] = update_fitspectralpol(args)
       
       
     # BEAM CORRECTION AND/OR CONVERT TO CIRCULAR/LINEAR CORRELATIONS
     for ms in mslist:
       if ((args['docircular'] or args['dolinear']) or (set_beamcor(ms, args['beamcor']))) and (i == 0):
         beamcor_and_lin2circ(ms, dysco=args['dysco'], \
                              beam=set_beamcor(ms, args['beamcor']), \
                              lin2circ=args['docircular'], \
                              circ2lin=args['dolinear'], \
                              losotobeamlib=args['losotobeamcor_beamlib'], idg=args['idg'])


     # TMP AVERAGE TO SPEED UP CALIBRATION
     if args['autofrequencyaverage_calspeedup'] and i == 0:
         avgfreqstep = []
         mslist_backup = mslist[:] # make a backup list, note copy by slicing otherwise list refers to original
         for ms in mslist:
            avgfreqstep.append(findfreqavg(ms,float(args['imsize']),bwsmearlimit=3.5))
         mslist = average(mslist, freqstep=avgfreqstep, timestep=4, dysco=args['dysco'])
     if args['autofrequencyaverage_calspeedup'] and i == args['stop'] - 3:
         mslist = mslist_backup[:]  # reset back, note copy by slicing otherwise list refers to original
         preapply(create_mergeparmdbname(mslist, i-1), mslist, updateDATA=False, dysco=args['dysco']) # do not overwrite DATA column

     # PHASE-UP if requested
     if args['phaseupstations'] is not None:
         if (i == 0) or (i == args['start']):
             mslist = phaseup(mslist,datacolumn='DATA',superstation=args['phaseupstations'], \
                              start=i, dysco=args['dysco'])
     # PRE-APPLY SOLUTIONS (from a nearby direction for example)
     if (args['preapplyH5_list'][0]) is not None and i == 0:
         preapply(args['preapplyH5_list'], mslist, dysco=args['dysco'])

     if args['stopafterpreapply']:
       print('Stopping as requested via --stopafterpreapply')
       return

     # CALIBRATE AGAINST THE INITAL SKYMODEL (selfcalcycle 0) IF REQUESTED
     if (args['skymodel'] is not None or args['skymodelpointsource'] is not None \
         or args['wscleanskymodel'] is not None) and (i ==0):
         # Function that 
         # add patches for DDE predict
         # also do prepare_DDE
        if args['DDE']:
           modeldatacolumns, dde_skymodel, candidate_solints, soltypelist_includedir = prepare_DDE(args['skymodel'], i, \
                   mslist, args['imsize'], args['pixelscale'], \
                   args['channelsout'], args, numClusters=args['Nfacets'], \
                   facetdirections=args['facetdirections'], \
                   DDE_predict='DP3', restart=False,skyview=tgssfitsfile,\
                   targetFlux=args['targetFlux'], fitspectralpol=args['fitspectralpol'],\
                   disable_primary_beam=args['disable_primary_beam'], \
                   wscleanskymodel=args['wscleanskymodel'], skymodel=args['skymodel'])
           
           if candidate_solints is not None:
             candidate_solints = np.swapaxes(np.array([candidate_solints]*len(mslist)),1,0).T.tolist()
             solint_list = candidate_solints
        else:
           dde_skymodel = None  
        wsclean_h5list = calibrateandapplycal(mslist, i, args, solint_list, nchan_list, args['soltype_list'], \
                             soltypecycles_list, smoothnessconstraint_list, smoothnessreffrequency_list, \
                             smoothnessspectralexponent_list, smoothnessrefdistance_list, \
                             antennaconstraint_list, resetsols_list, resetdir_list, \
                             normamps_list, BLsmooth_list,\
                             uvmin=args['uvmin'], normamps=args['normampsskymodel'], \
                             skymodel=args['skymodel'], \
                             predictskywithbeam=args['predictskywithbeam'], \
                             restoreflags=args['restoreflags'], flagging=args['doflagging'], \
                             longbaseline=longbaseline, \
                             flagslowphases=args['doflagslowphases'], \
                             flagslowamprms=args['flagslowamprms'], flagslowphaserms=args['flagslowphaserms'],\
                             skymodelsource=args['skymodelsource'], skymodelpointsource=args['skymodelpointsource'],\
                             wscleanskymodel=args['wscleanskymodel'], iontimefactor=args['iontimefactor'], \
                             ionfreqfactor=args['ionfreqfactor'], \
                             blscalefactor=args['blscalefactor'], dejumpFR=args['dejumpFR'],\
                             uvminscalarphasediff=args['uvminscalarphasediff'], \
                             docircular=args['docircular'], mslist_beforephaseup=mslist_beforephaseup, dysco=args['dysco'], telescope=telescope, \
                             blsmooth_chunking_size=args['blsmooth_chunking_size'], \
                             gapchanneldivision=args['gapchanneldivision'],modeldatacolumns=modeldatacolumns, dde_skymodel=dde_skymodel,\
                             DDE_predict=set_DDE_predict_skymodel_solve(args['wscleanskymodel']),\
                             QualityBasedWeights=args['QualityBasedWeights'], QualityBasedWeights_start=args['QualityBasedWeights_start'], \
                             QualityBasedWeights_dtime=args['QualityBasedWeights_dtime'],\
                             QualityBasedWeights_dfreq=args['QualityBasedWeights_dfreq'],\
                             ncpu_max=args['ncpu_max_DP3solve'],\
                             mslist_beforeremoveinternational=mslist_beforeremoveinternational,\
                             soltypelist_includedir=soltypelist_includedir)
        
     if args['phasediff_only']:
       return
     
     # SET MULTISCALE
     if args['multiscale'] and i >= args['multiscale_start']:
       multiscale = True
     else:
       multiscale = False

     # RESTART FOR A DDE RUN, set modeldatacolumns and dde_skymodel
     if args['DDE'] and args['start'] != 0 and i == args['start']: 
        modeldatacolumns, dde_skymodel, candidate_solints, soltypelist_includedir = prepare_DDE(args['imagename'], i, \
                   mslist, args['imsize'], args['pixelscale'], \
                   args['channelsout'], args, numClusters=args['Nfacets'], \
                   facetdirections=args['facetdirections'], \
                   DDE_predict=args['DDE_predict'], restart=True, \
                   telescope=telescope, \
                   targetFlux=args['targetFlux'], fitspectralpol=args['fitspectralpol'],\
                   disable_primary_beam=args['disable_primary_beam'])
        wsclean_h5list = list(np.load('wsclean_h5list.npy'))
     
     
     #  --- start imaging part ---
     for msim_id, mslistim in enumerate(nested_mslistforimaging(mslist, stack=args['stack'])):
        if args['stack']:
          stackstr= '_stack' + str(msim_id).zfill(2)
        else:
          stackstr='' # empty string
        if len(modeldatacolumns) > 1:
          facetregionfile = 'facets.reg'
        #else:
          #if args['DDE'] and i == 0: # we are making image000 without having DDE solutions yet
            #if telescope == 'LOFAR' and not args['disable_IDG_DDE_predict']: # so image000 has model-pb
            #    args['idg'] = True
        makeimage(mslistim, args['imagename'] + str(i).zfill(3) + stackstr, \
                  args['pixelscale'], args['imsize'], \
                  args['channelsout'], args['niter'], args['robust'], \
                  multiscale=multiscale, idg=args['idg'], fitsmask=fitsmask_list[msim_id], \
                  uvminim=args['uvminim'], predict=not args['stopafterskysolve'],\
                  fitspectralpol=args['fitspectralpol'], uvmaxim=args['uvmaxim'], \
                  imager=args['imager'], restoringbeam=restoringbeam, automask=automask, \
                  removenegativecc=args['removenegativefrommodel'],\
                  paralleldeconvolution=args['paralleldeconvolution'],\
                  deconvolutionchannels=args['deconvolutionchannels'], \
                  parallelgridding=args['parallelgridding'], multiscalescalebias=args['multiscalescalebias'],\
                  taperinnertukey=args['taperinnertukey'], gapchanneldivision=args['gapchanneldivision'], h5list=wsclean_h5list, localrmswindow=args['localrmswindow'], \
                  facetregionfile=facetregionfile, DDEimaging=args['DDE'], \
                  multiscalemaxscales=args['multiscalemaxscales'],stack=args['stack'],\
                  disable_primarybeam_image=args['disable_primary_beam'], \
                  disable_primarybeam_predict=args['disable_primary_beam'], groupms_h5facetspeedup=args['groupms_h5facetspeedup'], ddpsfgrid=args['ddpsfgrid'],fulljones_h5_facetbeam=not args['single_dual_speedup'])
        #args['idg'] = idgin # set back
        if args['makeimage_ILTlowres_HBA']:
          if args['phaseupstations'] is None:
              briggslowres = -1.5
          else:
              briggslowres = -0.5
          makeimage(mslistim, args['imagename'] +'1.2arcsectaper' + str(i).zfill(3) + stackstr, \
                  args['pixelscale'], args['imsize'], \
                  args['channelsout'], args['niter'],briggslowres, uvtaper='1.2arcsec', \
                  multiscale=multiscale, idg=args['idg'], fitsmask=fitsmask_list[msim_id], \
                  uvminim=args['uvminim'], uvmaxim=args['uvmaxim'], fitspectralpol=args['fitspectralpol'], \
                  automask=automask, removenegativecc=False, \
                  predict=False, \
                  paralleldeconvolution=args['paralleldeconvolution'],\
                  deconvolutionchannels=args['deconvolutionchannels'], \
                  parallelgridding=args['parallelgridding'], multiscalescalebias=args['multiscalescalebias'],\
                  taperinnertukey=args['taperinnertukey'], gapchanneldivision=args['gapchanneldivision'], h5list=wsclean_h5list, multiscalemaxscales=args['multiscalemaxscales'], stack=args['stack'],\
                  disable_primarybeam_image=args['disable_primary_beam'], \
                  disable_primarybeam_predict=args['disable_primary_beam'],\
                  groupms_h5facetspeedup=args['groupms_h5facetspeedup'], \
                  ddpsfgrid=args['ddpsfgrid'], \
                  fulljones_h5_facetbeam=not args['single_dual_speedup'])
        if args['makeimage_fullpol']:
          makeimage(mslistim, args['imagename'] +'fullpol' + str(i).zfill(3) + stackstr, \
                  args['pixelscale'], args['imsize'], \
                  args['channelsout'], args['niter'], args['robust'], \
                  multiscale=multiscale, idg=args['idg'], fitsmask=fitsmask_list[msim_id], \
                  uvminim=args['uvminim'], uvmaxim=args['uvmaxim'], fitspectralpol=0, \
                  automask=automask, removenegativecc=False, predict=False, \
                  paralleldeconvolution=args['paralleldeconvolution'],\
                  deconvolutionchannels=args['deconvolutionchannels'], \
                  parallelgridding=args['parallelgridding'],\
                  multiscalescalebias=args['multiscalescalebias'], fullpol=True,\
                  taperinnertukey=args['taperinnertukey'], gapchanneldivision=args['gapchanneldivision'], facetregionfile=facetregionfile, localrmswindow=args['localrmswindow'], multiscalemaxscales=args['multiscalemaxscales'], stack=args['stack'],\
                  disable_primarybeam_image=args['disable_primary_beam'], \
                  disable_primarybeam_predict=args['disable_primary_beam'], \
                  groupms_h5facetspeedup=args['groupms_h5facetspeedup'], ddpsfgrid=args['ddpsfgrid'],\
                  fulljones_h5_facetbeam=not args['single_dual_speedup'])

        # make figure
        if args['imager'] == 'WSCLEAN':
          if args['idg']:
            plotpngimage = args['imagename'] + str(i).zfill(3) + stackstr + '.png'
            plotfitsimage= args['imagename'] + str(i).zfill(3) + stackstr +'-MFS-image.fits'
          else:
            plotpngimage = args['imagename'] + str(i).zfill(3) + stackstr + '.png'
            plotfitsimage= args['imagename'] + str(i).zfill(3) + stackstr +'-MFS-image.fits'
        if args['imager'] == 'DDFACET':
          plotpngimage = args['imagename'] + str(i) + '.png'   
          plotfitsimage = args['imagename'] + str(i).zfill(3) + stackstr +'.app.restored.fits'
          
        if args['channelsout'] == 1:
          plotpngimage = plotpngimage.replace('-MFS', '').replace('-I','')
          plotfitsimage = plotfitsimage.replace('-MFS', '').replace('-I','')
        plotimage(plotfitsimage, plotpngimage, mask=fitsmask_list[msim_id], rmsnoiseimage=plotfitsimage)
        
     #  --- end imaging part ---

     modeldatacolumns = [] 
     if args['DDE']:
        modeldatacolumns, dde_skymodel, candidate_solints, soltypelist_includedir = prepare_DDE(args['imagename'], i, \
                   mslist, args['imsize'], args['pixelscale'], \
                   args['channelsout'], args, numClusters=args['Nfacets'], \
                   facetdirections=args['facetdirections'], DDE_predict=args['DDE_predict'], \
                   telescope=telescope, \
                   targetFlux=args['targetFlux'], fitspectralpol=args['fitspectralpol'],\
                   disable_primary_beam=args['disable_primary_beam'])
        if candidate_solints is not None:
          candidate_solints = np.swapaxes(np.array([candidate_solints]*len(mslist)),1,0).T.tolist()
          solint_list = candidate_solints
     else:
        dde_skymodel = None  


     if args['stopafterskysolve']:
       print('Stopping as requested via --stopafterskysolve')
       if args['DDE']:
         print('Clean up MODEL_DATA_DD columns')  
         t = pt.table(mslist[0])
         colnames = t.colnames()
         t.close()
         collist_del = [xdel for xdel in colnames if re.match('MODEL_DATA*', xdel)]
         for colname_remove in collist_del:
           remove_column_ms(mslist, colname_remove)
       return

     # REDETERMINE SOLINTS IF REQUESTED
     if (i >= 0) and (args['usemodeldataforsolints']):
       print('Recomputing solints .... ')
       nchan_list, solint_list, BLsmooth_list, smoothnessconstraint_list,smoothnessreffrequency_list,\
                              smoothnessspectralexponent_list, smoothnessrefdistance_list, \
                              antennaconstraint_list, resetsols_list, resetdir_list, \
                              soltypecycles_list, normamps_list  = \
                              auto_determinesolints(mslist, args['soltype_list'], \
                              longbaseline, LBA, \
                              innchan_list=nchan_list, insolint_list=solint_list, \
                              insmoothnessconstraint_list=smoothnessconstraint_list, \
                              insmoothnessreffrequency_list=smoothnessreffrequency_list,\
                              insmoothnessspectralexponent_list=smoothnessspectralexponent_list,\
                              insmoothnessrefdistance_list=smoothnessrefdistance_list,\
                              inantennaconstraint_list=antennaconstraint_list, \
                              inresetsols_list=resetsols_list, \
                              inresetdir_list=resetdir_list,\
                              innormamps_list=normamps_list,\
                              inBLsmooth_list=BLsmooth_list,\
                              insoltypecycles_list=soltypecycles_list, redo=True, \
                              tecfactorsolint=args['tecfactorsolint'], \
                              gainfactorsolint=args['gainfactorsolint'], \
                              phasefactorsolint=args['phasefactorsolint'], \
                              delaycal=args['delaycal'])

     # CALIBRATE AND APPLYCAL
     wsclean_h5list = calibrateandapplycal(mslist, i, args, solint_list, nchan_list, args['soltype_list'], soltypecycles_list,\
                           smoothnessconstraint_list, smoothnessreffrequency_list,\
                           smoothnessspectralexponent_list, smoothnessrefdistance_list,\
                           antennaconstraint_list, resetsols_list, resetdir_list, \
                           normamps_list, BLsmooth_list, uvmin=args['uvmin'], \
                           normamps=args['normamps'], \
                           restoreflags=args['restoreflags'], \
                           flagging=args['doflagging'], longbaseline=longbaseline, \
                           flagslowphases=args['doflagslowphases'], \
                           flagslowamprms=args['flagslowamprms'], flagslowphaserms=args['flagslowphaserms'],\
                           iontimefactor=args['iontimefactor'], ionfreqfactor=args['ionfreqfactor'], blscalefactor=args['blscalefactor'],\
                           dejumpFR=args['dejumpFR'], uvminscalarphasediff=args['uvminscalarphasediff'],\
                           docircular=args['docircular'], mslist_beforephaseup=mslist_beforephaseup, dysco=args['dysco'],\
                           blsmooth_chunking_size=args['blsmooth_chunking_size'], \
                           gapchanneldivision=args['gapchanneldivision'],modeldatacolumns=modeldatacolumns, dde_skymodel=dde_skymodel,DDE_predict=args['DDE_predict'], QualityBasedWeights=args['QualityBasedWeights'], QualityBasedWeights_start=args['QualityBasedWeights_start'], QualityBasedWeights_dtime=args['QualityBasedWeights_dtime'],QualityBasedWeights_dfreq=args['QualityBasedWeights_dfreq'], telescope=telescope, ncpu_max=args['ncpu_max_DP3solve'],mslist_beforeremoveinternational=mslist_beforeremoveinternational, soltypelist_includedir=soltypelist_includedir)

     # update uvmin if allowed/requested
     args['uvmin'] = update_uvmin(fitsmask, longbaseline, args, LBA)

     # update fitsmake if allowed/requested 
     fitsmask, fitsmask_list, imagename = update_fitsmask(fitsmask, maskthreshold_selfcalcycle, i, args, mslist)
  
     # update to multiscale cleaning if large island is present
     args['multiscale'] = multiscale_trigger(fitsmask, args)

     # update channelsout
     args['channelsout'] = update_channelsout(args, i, mslist)

     # update fitspectralpol
     args['fitspectralpol'] = update_fitspectralpol(args)

     # CUT FLAGGED DATA FROM MS AT START&END to win some compute time if possible
     # if TEC and not args['forwidefield']: # does not work for phaseonly sols
     #  if (i == 0) or (i == args['phasecycles']) or (i == args['phasecycles'] + 1) or (i == args['phasecycles'] + 2) \
     #    or (i == args['phasecycles'] + 3) or (i == args['phasecycles'] + 4):
     #     for msnumber, ms in enumerate(mslist):
     #         flagms_startend(ms, 'phaseonly' + ms + parmdb + str(i) + '.h5', int(solint_phase[msnumber]))

   # remove sources outside central region after selfcal (to prepare for DDE solves)
   if args['remove_outside_center']:
      # make image after calibration so the calibration and images match 
      # normally we would finish with calirbation and not have the subsequent image, make this i+1 image here
      makeimage(mslistim, args['imagename'] + str(i+1).zfill(3), \
                  args['pixelscale'], args['imsize'], \
                  args['channelsout'], args['niter'], args['robust'], \
                  multiscale=multiscale, idg=args['idg'], fitsmask=fitsmask, \
                  uvminim=args['uvminim'], predict=False,\
                  fitspectralpol=args['fitspectralpol'], uvmaxim=args['uvmaxim'], \
                  imager=args['imager'], restoringbeam=restoringbeam, automask=automask, \
                  removenegativecc=args['removenegativefrommodel'],\
                  paralleldeconvolution=args['paralleldeconvolution'],\
                  deconvolutionchannels=args['deconvolutionchannels'], \
                  parallelgridding=args['parallelgridding'], multiscalescalebias=args['multiscalescalebias'],\
                  taperinnertukey=args['taperinnertukey'], gapchanneldivision=args['gapchanneldivision'], h5list=wsclean_h5list, localrmswindow=args['localrmswindow'], \
                  facetregionfile=facetregionfile, DDEimaging=args['DDE'], \
                  multiscalemaxscales=args['multiscalemaxscales'],\
                  disable_primarybeam_image=args['disable_primary_beam'], \
                  disable_primarybeam_predict=args['disable_primary_beam'], groupms_h5facetspeedup=args['groupms_h5facetspeedup'], \
                  ddpsfgrid=args['ddpsfgrid'], fulljones_h5_facetbeam=not args['single_dual_speedup'])


      remove_outside_box(mslist, args['imagename'] + str(i+1).zfill(3), args['pixelscale'], \
                         args['imsize'],args['channelsout'], single_dual_speedup= args['single_dual_speedup'], dysco=args['dysco'],\
                         userbox=args['remove_outside_center_box'], idg=args['idg'],\
                         h5list=wsclean_h5list, facetregionfile=facetregionfile, \
                         disable_primary_beam=args['disable_primary_beam'])
               
   # ARCHIVE DATA AFTER SELFCAL if requested
   if not longbaseline and not args['noarchive'] :
     if not LBA:
       if args['DDE']:
         mergedh5_i = glob.glob('merged_selfcalcyle' + str(i).zfill(3) + '*.h5')
         archive(mslist, outtarname, args['boxfile'], fitsmask, imagename, \
                 dysco=args['dysco'], mergedh5_i=mergedh5_i, facetregionfile=facetregionfile)
       else:
          archive(mslist, outtarname, args['boxfile'], fitsmask, imagename, dysco=args['dysco'])
       cleanup(mslist)

   # Get additional diagnostics about the selfcal quality --> in particular useful for calibrator selection
   if args['get_diagnostics']:
       from source_selection.selfcal_selection import main as quality_check
       if abs(args['stop']-args['start'])>5:
           mergedh5 = sorted([h5 for h5 in glob.glob('merged_selfcal*.h5') if 'linearfulljones' not in h5])
           if len(mergedh5)>0:
               if longbaseline:
                   station = 'international'
               else:
                   station = 'alldutch'
               images = glob.glob("*MFS-I-image.fits")
               if len(images)==0:
                   images = glob.glob("*MFS-image.fits")
               # Remove 1.2arcsectaper
               images = sorted([im for im in images if 'arcsectaper' not in im])
               quality_check(mergedh5, images, station)
           else:
               logger.info("Cannot find merged_selfcal*.h5, so cannot perform --get-diagnostics.")
       else:
           logger.info("Need at least 5 selfcal cycles for getting diagnostics")


if __name__ == "__main__":
   main()