submit.py

###!/usr/bin/python

import optparse
import configparser
import os
import sys
import shutil
import subprocess
import platform
import tarfile
import warnings
import git
from process_pickler import pickler

import yaml

def parse_yaml(filename):
    with open(filename, 'r') as stream:
        cfgfile = yaml.load(stream, Loader=yaml.FullLoader)
    return cfgfile


class SandboxTarball(object):
    def __init__(self, name=None, mode='w:xz', params=None):
        self.params = params
        self.tarfile = tarfile.open(name=name, mode=mode, dereference=True)
        self.checksum = None
        self.content = None

    def addFiles(self, cfgOutputName=None):
        """
        Add the necessary files to the tarball
        """
        directories = ['python', 'cfipython', 'lib', 'biglib', 'module', 'bin']
        # Note that dataDirs are only looked-for and added under the src/ folder.
        # /data/ subdirs contain data files needed by the code
        # /interface/ subdirs contain C++ header files needed e.g. by ROOT6
        dataDirs = ['data', 'interface', 'python']

        # Tar up whole directories
        for directory in directories:
            fullPath = os.path.join(self.params['TEMPL_CMSSWBASE'], directory)
            print(("Checking directory %s" % fullPath))
            if os.path.exists(fullPath):
                print(("Adding directory %s to tarball" % fullPath))
                self.checkdirectory(fullPath)
                self.tarfile.add(fullPath, directory, recursive=True)

        # Search for and tar up "data" directories in src/
        srcPath = os.path.join(self.params['TEMPL_CMSSWBASE'], 'src')
        for root, _, _ in os.walk(srcPath):
            if os.path.basename(root) in dataDirs:
                directory = root.replace(srcPath, 'src')
                print(("Adding data directory %s to tarball" % root))
                self.checkdirectory(root)
                self.tarfile.add(root, directory, recursive=True)


    def writeContent(self):
        """Save the content of the tarball"""
        self.content = [(int(x.size), x.name) for x in self.tarfile.getmembers()]


    def close(self):
        """
        Calculate the checkum and close
        """
        self.writeContent()
        return self.tarfile.close()

    def printSortedContent(self):
        """
	To be used for diagnostic printouts
        returns a string containing tarball content as a list of files sorted by size
        already formatted for use in a print statement
        """
        sortedContent = sorted(self.content, reverse=True)
        biggestFileSize = sortedContent[0][0]
        ndigits = int(math.ceil(math.log(biggestFileSize+1, 10)))
        contentList = "\nsandbox content sorted by size[Bytes]:"
        for (size, name) in sortedContent:
            contentList += ("\n%" + str(ndigits) + "s\t%s") % (size, name)
        return contentList


    def checkdirectory(self, dir_):
        #checking for infinite symbolic link loop
        try:
            for root, _, files in os.walk(dir_, followlinks=True):
                for file_ in files:
                    os.stat(os.path.join(root, file_))
        except OSError as msg:
            err = '%sError%s: Infinite directory loop found in: %s \nStderr: %s' % \
                    (colors.RED, colors.NORMAL, dir_, msg)
            raise EnvironmentException(err)


class TaskConfig:
    def __init__(self, taskName, cfgfile):
        # print('Task: {}'.format(taskName))
        common_config = cfgfile['Common']
        task_config = cfgfile[taskName]

        self.task_name = taskName
        self.version = common_config['version']
        self.cmssw_configs = cfgfile['Configuration']
        

        for key, value in list(task_config.items()):
            setattr(self, key, value)

        self.task_base_dir = '{}/{}/'.format(
            common_config['name'],
            common_config['version'])
        self.task_dir = '{}/{}/{}'.format(
            common_config['name'],
            common_config['version'],
            taskName)
        if 'output_dir_base' in common_config.keys():
            self.output_dir_base = common_config['output_dir_base']
            self.output_dir = '{}/{}/{}/{}'.format(
                common_config['output_dir_base'],
                self.task_name,
                common_config['mode'],
                self.version)
        else:
            self.output_dir_base = None
            self.output_dir = '{}/{}/{}/{}'.format(
                'userOutput',
                self.task_base_dir,
                common_config['mode'],
                self.version)
        self.ncpu = common_config['ncpu']
        if 'max_memory' in common_config.keys():
            self.max_memory = common_config['max_memory']
        else:
            self.max_memory = 3000
        self.output_file_name = common_config['output_file_name']
        if 'storage_site' in common_config.keys():
            self.storage_site = common_config['storage_site']
        else:
            self.storage_site = 'T2_CH_CERN'

    def __str__(self):
        return 'task-name {}: version {}'.format(self.task_name, self.version)


def check_substitution_complete(template):
    if('TEMPL_' in template):
        for line in template.split('\n'):
            if 'TEMPL_' in line:
                raise RuntimeError(
                    'Templated argument below not addressed!\n{0}'.format(line))

def getLSs(file_name):
    from subprocess import Popen, PIPE
    lumis = []
    p = Popen('edmFileUtil --eventsInLumis {}'.format(file_name),
              stdout=PIPE,
              shell=True)
    pipe = p.stdout.read()
    lines = pipe.split('\n')
    for line in lines[4:-2]:
        lumis.append(line.split()[1])
    return lumis


def splitFiles(files, splitting_mode, splitting_granularity, max_events=None):
    split_files = []
    split_logic = []
    if splitting_mode == 'file_based':
        size = int(splitting_granularity)
        split_files = [files[i:i+size] for i in range(0, len(files), size)]
    elif splitting_mode == 'lumi_based':
        for file_name in files:
            # print file_name
            file_lss = getLSs(file_name)
            for ls in file_lss:
                split_files.append([file_name])
                logic = '1:{}-1:{}'.format(ls, ls)
                split_logic.append(logic)
    elif splitting_mode == 'event_ranges':
        njobs = int(max_events/splitting_granularity)
        for ij in range(0, njobs):
            split_files.append(files)
            split_logic.append(ij*int(splitting_granularity))
    
    # elif splitting_mode == 'EventAwareLumiBased' or splitting_mode == 'Automatic':
    #     pass
    else:
        print('[submission] Splitting-Mode: {} is not implemented! Exiting...'.format(splitting_mode))
        sys.exit(6)
    return split_files, split_logic


def getFilesForDataset(dataset, site=None):
    import time
    from subprocess import Popen, PIPE
    options = ''
    eC = 5
    count = 0
    site_query = ''
    if site is not None:
        site_query = ' and site={}'.format(site)
    query = 'dasgoclient {} --query "file dataset={} {}"'.format(options, dataset, site_query)

    # print query
    while (eC != 0 and count < 3):
        if count != 0:
            print('Sleeping, then retrying DAS')
            time.sleep(100)
        p = Popen(query,
                  stdout=PIPE,
                  universal_newlines=True,
                  shell=True)
        pipe = p.stdout.read()
        tupleP = os.waitpid(p.pid, 0)
        eC = tupleP[1]
        count = count+1
        if eC == 0:
            print("DAS succeeded after", count, "attempts", eC)
            return [filename for filename in pipe.split('\n') if '.root' in filename]
        else:
            print("DAS failed 3 times- I give up")
            return []


def getJobParams(mode, task_conf):
    params = {}
    # if mode in ['NTP', 'L1IN', 'SIMDIGI', 'INFP', 'FP', 'GENSIM']:
    if True:
        input_files = []
        if not task_conf.crab:
            if hasattr(task_conf, 'input_directory'):
                print(('Reading input files from directory: {}'.format(task_conf.input_directory)))
                input_files = ['root://eoscms.cern.ch/'+os.path.join(task_conf.input_directory, file_name) for file_name in os.listdir(task_conf.input_directory) if file_name.endswith('.root')]
            elif hasattr(task_conf, 'input_dataset'):
                print(('Reading input files from dataset: {}'.format(task_conf.input_dataset)))
                input_files = getFilesForDataset(task_conf.input_dataset, site='T2_CH_CERN')
            elif hasattr(task_conf, 'input_files'):
                print(('Reading input files : {}'.format(task_conf.input_files)))
                input_files = task_conf.input_files
            else:
                print(('ERROR: no input specified for task: {}'.format(task_conf.task_name)))
                sys.exit(1)
        # print input_files

        max_events = -1
        # NOTE: this is not considered when submitting tasks without crab...unless the splitting is event_ranges
        if(hasattr(task_conf, 'max_events')):
            max_events = task_conf.max_events

        if not task_conf.crab:
            split_files, split_logic = splitFiles(
                input_files, 
                task_conf.splitting_mode, 
                task_conf.splitting_granularity, 
                max_events)
            n_jobs_max = len(split_files)
            n_jobs = n_jobs_max
            if(hasattr(task_conf, 'max_njobs')):
                n_jobs = min(n_jobs_max, task_conf.max_njobs)

            print('preparing batch submission:')
            print('  # of files: {}'.format(len(input_files)))
            print('  # of jobs: {}'.format(n_jobs))
            params['NJOBS'] = n_jobs
            params['TEMPL_JOBFLAVOR'] = task_conf.job_flavor
            params['INFILES'] = split_files
            params['SEEDS'] = list(range(1, n_jobs+1))
            params['SPLIT'] = split_logic
            if task_conf.splitting_mode == 'event_ranges':
                params['TEMPL_NEVENTS'] = task_conf.splitting_granularity
            else:
                params['TEMPL_NEVENTS'] = -1

        else:
            print('preparing crab submission')
            params['TEMPL_NEVENTS'] = max_events

        split_pu_files = []
        if(hasattr(task_conf, 'pu_dataset')):
            pu_files = getFilesForDataset(dataset=task_conf.pu_dataset, site=None)
            pu_splitting_granularity = min(100,  int(len(pu_files)/n_jobs))
            print("# of PU files: {}".format(len(pu_files)))
            print("# PU file per job: {}".format(pu_splitting_granularity))
            split_pu_files, split_pu_logic = splitFiles(files=pu_files,
                                                        splitting_mode='file_based',
                                                        splitting_granularity=pu_splitting_granularity)
            print(len(split_pu_files))
        # the first 2 are compulsory for all modes
        params['PUFILES'] = split_pu_files
        
        params['TEMPL_TASKBASEDIR'] = task_conf.task_base_dir
        params['TEMPL_ABSTASKBASEDIR'] = os.path.join(os.environ["PWD"], task_conf.task_base_dir)
        params['TEMPL_TASKDIR'] = task_conf.task_dir
        params['TEMPL_TASKCONFDIR'] = '{}/conf'.format(task_conf.task_dir)
        params['TEMPL_ABSTASKCONFDIR'] = os.path.join(os.environ["PWD"], params['TEMPL_TASKCONFDIR'])
        params['TEMPL_ABSTASKLOGDIR'] = os.path.join(os.environ["PWD"], params['TEMPL_TASKDIR'], 'logs')
        params['TEMPL_OUTFILE'] = task_conf.output_file_name
        params['TEMPL_OUTDIR'] = task_conf.output_dir
        params['TEMPL_NCPU'] = task_conf.ncpu

        params['TEMPL_MEMORY'] = task_conf.max_memory
        params['TEMPL_SPLITGRANULARITY'] = task_conf.splitting_granularity
        params['TEMPL_SPLITTINGMODE'] = task_conf.splitting_mode
        params['TEMPL_REQUESTNAME'] = task_conf.task_name
        if hasattr(task_conf, 'input_dataset'):
            params['TEMPL_INPUTDATASET'] = task_conf.input_dataset
        params['TEMPL_DATASETTAG'] = '{}_{}'.format(task_conf.task_name, task_conf.version)
        if task_conf.output_dir_base is not None:
            if task_conf.output_dir_base.startswith('/eos/cms'):
                params['TEMPL_CRABOUTDIR'] = task_conf.output_dir_base.split('/eos/cms')[1].replace('/cmst3/', '/group/cmst3/')
            else:
                warnings.warn('For crab submissions, setting the "output_dir_base" defines LFNDirBase which might be wrong!'
                              ' Make sure that the LFNDirBase looks reasonable. Default implementation for "/eos/cms"'
                              ' is defined.')
                params['TEMPL_CRABOUTDIR'] = task_conf.output_dir_base
        if hasattr(task_conf, 'inline_customize'):
            params['TEMPL_CUSTOMIZE'] = '\n'.join(task_conf.inline_customize)
        if hasattr(task_conf, 'storage_site'):
            params['TEMPL_STORAGE'] = task_conf.storage_site

        def get_from_env(variable):
            if variable in os.environ:
                return os.environ[variable]
            else:
                print(("ERROR: {} not found in shell enviroment!".format(variable)))
                sys.exit(11)

        if not task_conf.crab:
            params['TEMPL_SCRAMARCH'] = get_from_env('SCRAM_ARCH')
            params['TEMPL_CMSSWBASE'] = get_from_env('CMSSW_BASE')
            params['TEMPL_CMSSWVERSION'] = get_from_env('CMSSW_VERSION')


    else:
        print('Mode: {} is not implemented! Exiting...'.format(mode))
        sys.exit(4)
    return params


def formatFileList(input_files):
    input_file_names = ['\'{}\''.format(file_name) for file_name in input_files]
    return ',\n'.join(input_file_names)


def createJobSandbox(params):
    sb_tar_name = os.path.join(params['TEMPL_TASKBASEDIR'], 'sandbox.tgz')
    if not os.path.isfile(sb_tar_name):
        print(('--- Creating sandbox tar: {}'.format(sb_tar_name)))
        sb_tar = SandboxTarball(name=sb_tar_name, params=params)
        sb_tar.addFiles()
        sb_tar.close()
    else:
        print(('NOTE: Sandbox tar: {} already exists, reusing it!'.format(sb_tar_name)))

def createJobConfig(mode, params, step_name=None, in_file=None, out_file=None):
    step_name_str = ''
    if step_name:
        step_name_str = f'_{step_name}'
    custom_template_filename = 'templates/jobCustomization_{}_cfg.py'.format(mode)
    default_template_filename = 'templates/jobCustomization_{}_cfg.py'.format('DEFAULT')
    if not os.path.isfile(custom_template_filename):
        custom_template_filename = default_template_filename
    for job_idx in range(0, params['NJOBS']):
        custom_template_file = open(custom_template_filename)
        custom_template = custom_template_file.read()
        custom_template_file.close()
        # root cfg
        
        custom_template = custom_template.replace('TEMPL_ROOTCFG', f'input{step_name_str}_cfg')
        # input files
        file_list = formatFileList(params['INFILES'][job_idx])
        # we override the input file list for steps which are not the first one
        if in_file:
            file_list = formatFileList([in_file])
        custom_template = custom_template.replace('TEMPL_INFILES', file_list)
        if out_file:
            custom_template = custom_template.replace('TEMPL_OUTFILE', out_file)

        # pu files
        if len(params['PUFILES']) != 0:
            pu_file_list = formatFileList(params['PUFILES'][job_idx])
            custom_template = custom_template.replace('TEMPL_PUFILELIST', pu_file_list)

        if params['TEMPL_SPLITTINGMODE'] == 'lumi_based':
            if len(params['SPLIT']) != 0:
                job_logic = params['SPLIT'][job_idx]
                custom_template += 'process.source.lumisToProcess = cms.untracked.VLuminosityBlockRange("{}")\n'.format(job_logic)
        elif params['TEMPL_SPLITTINGMODE'] == 'event_ranges':
            params['TEMPL_FIRSTLUMI'] = 1000+job_idx
            params['TEMPL_SKIPENVETS'] = params['SPLIT'][job_idx]


        custom_template = custom_template.replace('TEMPL_SEED', str(params['SEEDS'][job_idx]*100))

        templs_keys = [key for key in list(params.keys()) if 'TEMPL_' in key]
        for key in templs_keys:
            custom_template = custom_template.replace(key, str(params[key]))

        # we now check that all templated arguments have been addressed
        if('TEMPL_') in custom_template:
            print("*** ERROR: not all the templated arguments of file {} have been addressed!".format(custom_template_filename))
            for line in custom_template.split('\n'):
                if 'TEMPL_' in line:
                    print(line)
            sys.exit(20)

        job_config_file = open(os.path.join(params['TEMPL_TASKCONFDIR'], f'job_config{step_name_str}_{job_idx}.py'), 'w')
        job_config_file.write(custom_template)
        job_config_file.close()


def createCondorConfig(mode, params):
    condor_template_name = 'templates/condorSubmit_{}.sub'.format(mode)
    default_template_name = 'templates/condorSubmit_{}.sub'.format('DEFAULT')
    if not os.path.isfile(condor_template_name):
        condor_template_name = default_template_name
    condor_template_file = open(condor_template_name)
    condor_template = condor_template_file.read()
    condor_template_file.close()
    condor_template = condor_template.replace('TEMPL_NJOBS', str(params['NJOBS']))
    templs_keys = [key for key in list(params.keys()) if 'TEMPL_' in key]
    for key in templs_keys:
        condor_template = condor_template.replace(key, str(params[key]))

    check_substitution_complete(condor_template)
    condor_file = open(os.path.join(params['TEMPL_TASKCONFDIR'], 'condorSubmit.sub'), 'w')
    condor_file.write(condor_template)
    condor_file.close()


def createJobExecutable(mode, params):
    run_template_name = 'templates/run_{}.sh'.format(mode)
    default_template_name = 'templates/run_{}.sh'.format('DEFAULT')
    if not os.path.isfile(run_template_name):
        run_template_name = default_template_name
    shutil.copy(run_template_name, '{}/run.sh'.format(params['TEMPL_TASKCONFDIR']))
    shutil.copy('templates/copy_files.sh', '{}/copy_files.sh'.format(params['TEMPL_TASKDIR']))
    os.chmod(os.path.join(params['TEMPL_TASKDIR'], 'copy_files.sh'),  0o754)
    shutil.copy('templates/cmssw_setup.sh', '{}/cmssw_setup.sh'.format(params['TEMPL_TASKBASEDIR']))
    os.chmod(os.path.join(params['TEMPL_TASKBASEDIR'], 'cmssw_setup.sh'),  0o754)
    params_file = open(os.path.join(params['TEMPL_TASKCONFDIR'], 'params.sh'), 'w')
    templs_keys = [key for key in list(params.keys()) if 'TEMPL_' in key]
    for key in templs_keys:
        # print(key)
        # print(str(params[key]))
        # print(str(params[key]).encode("unicode_escape").decode())
        if(key != 'TEMPL_CUSTOMIZE'):
            params_file.write('{}={}\n'.format(key.split('_')[1], str(params[key]).encode("unicode_escape").decode()))
    
    params_file.close()


def createCrabConfig(mode, params):
    crab_template_name = 'templates/crab_{}.py'.format(mode)
    default_template_name = 'templates/crab_{}.py'.format('DEFAULT')
    if not os.path.isfile(crab_template_name):
        crab_template_name = default_template_name
    crab_template_file = open(crab_template_name)
    crab_template = crab_template_file.read()
    crab_template_file.close()
    templs_keys = [key for key in list(params.keys()) if 'TEMPL_' in key]
    for key in templs_keys:
        crab_template = crab_template.replace(key, str(params[key]))

    if 'TEMPL_CRABOUTDIR' not in templs_keys:
        crab_template_lines = crab_template.split('\n')
        crab_template_lines = [line for line in crab_template_lines if 'outLFNDirBase' not in line]
        crab_template = '\n'.join(crab_template_lines)

    check_substitution_complete(crab_template)
    crab_file = open(os.path.join(params['TEMPL_TASKCONFDIR'], 'crab.py'), 'w')
    crab_file.write(crab_template)
    crab_file.close()


def createTaskSetup(task_config, config_file):
    mode = config_file['Common']['mode']
    pwd = os.environ["PWD"]
    if not os.path.exists(task_config.task_dir):
        print("   creating task directory {}".format(task_config.task_dir))
        os.makedirs(task_config.task_dir)
        os.mkdir(task_config.task_dir+'/conf/')
        os.mkdir(task_config.task_dir+'/logs/')

    if not os.path.exists(task_config.output_dir):
        try:
            os.makedirs(task_config.output_dir)
        except:
            print('   ERROR: output dir {} doesn\'t exist: please create it first!'.format(task_config.output_dir))
            print("Unexpected error:", sys.exc_info()[0])
            print(sys.exit(2))

    # shutil.copy(task_config.cmssw_config, '{}/conf/input_cfg.py'.format(task_config.task_dir))
    

    params = getJobParams(mode, task_config)
    if not task_config.crab:
        # pickler(task_config.cmssw_config, 'input_cfg.py')
        # shutil.move("input_cfg.py", '{}/conf/input_cfg.py'.format(task_config.task_dir))
        # shutil.move("input_cfg.pkl", '{}/conf/input_cfg.pkl'.format(task_config.task_dir))
        previous_step_out_file = None
        out_file = None
        for ic,config in enumerate(task_config.cmssw_configs):
            lastc = (ic == len(task_config.cmssw_configs) - 1)
            step_name = None
            step_name_str_ = ''

            if len(task_config.cmssw_configs) > 1:
                step_name = f'step{ic+1}'
                step_name_str_ = f'_{step_name}'
            
            if not lastc:
                out_file = f'out{step_name_str_}.root'
            else:
                out_file = None

            shutil.copy(config['cmssw_config'], f'{task_config.task_dir}/conf/input{step_name_str_}_cfg.py')
            createJobConfig(config['mode'], params, step_name, previous_step_out_file, out_file)
            previous_step_out_file = f'file:{out_file}'

        createJobSandbox(params)
        createCondorConfig(mode, params)
        createJobExecutable(mode, params)
    else:
        # FIXME: should throw an error if more than 1 step used with crab
        shutil.copy(task_config.cmssw_configs[0]['cmssw_config'], '{}/conf/input_cfg.py'.format(task_config.task_dir))
        createCrabConfig(mode, params)
    return


def submitTask(sub_name, task_config):
    submit_cmd = 'condor_submit {}/conf/condorSubmit.sub -batch-name {}_{}_{}'.format(task_config.task_dir, sub_name, task_config.version, task_config.task_name)
    if task_config.crab:
        submit_cmd = 'crab submit {}/conf/crab.py'.format(task_config.task_dir)
    try:
        output = subprocess.check_output(submit_cmd, shell=True).splitlines()
    except subprocess.CalledProcessError as e:
        print('Command: {} FAILED!'.format(submit_cmd))
        output = e.output.splitlines()
    for line in output:
        print(line.decode('UTF-8'))


def getCondorCluster(task_config):
    # clusterId = 529700
    condorLogs = [x for x in os.listdir(os.path.join(task_config.task_dir, 'logs')) if x.endswith('.log')]
    condorLogs.sort()
    clusterId = condorLogs[-1].split('.')[1]
    # print condorLogs
    return clusterId


def printStatus(clusterId):
    condor_cmd = 'condor_q {}'.format(clusterId)
    try:
        print(subprocess.check_output(condor_cmd, shell=True))
    except subprocess.CalledProcessError as e:
        print('Command: {} FAILED!'.format(condor_cmd))
        print(e.output)

def printWait(task_conf, clusterId):
    condor_cmd = 'condor_wait -wait 30 -status {}/logs/condor.{}.log'.format(task_conf.task_dir, clusterId)
    try:
        print(subprocess.check_output(condor_cmd, shell=True))
    except subprocess.CalledProcessError as e:
        print('Command: {} FAILED!'.format(condor_cmd))
        print(e.output)


def printDoc(task_configs):
    cmssw_src = os.path.join(os.environ['CMSSW_BASE'], 'src')

    cmssw_repo = git.Repo(cmssw_src)
  
    
    print('\n\n\n')
    print(f'## {task_configs[0].version}')

    print(f'   * directory: `{os.environ["PWD"]}`')
    print(f'   * CMSSW version: `{os.environ["CMSSW_VERSION"]}`')
    print(f'   * CMSSW git branch: `{cmssw_repo.active_branch.name}`')


    for pkg in ['Phase2EGTriggerAnalysis', 'FastPUPPI']:
        ntp_src = os.path.join(cmssw_src, pkg)
        if(os.path.exists(ntp_src)):
            ntp_repo = git.Repo(ntp_src)
            print(f'   * `{pkg}` git branch: `{ntp_repo.active_branch.name}`')

    if len(task_configs[0].cmssw_configs) > 1:
        print(f'   * config files:')
        
        for ic,conf in enumerate(task_configs[0].cmssw_configs):
            print(f'       - step{ic}: `{conf["cmssw_config"]}`, mode: `{conf["mode"]}`')
    else:
        print(f'   * config file: `{task_configs[0].cmssw_configs[0]["cmssw_config"]}` mode: `{task_configs[0].cmssw_configs[0]["mode"]}`')


    print(f'   * tasks:')
    for task in task_configs:
        print(f'      * `{task.task_name}`')
        if hasattr(task, 'input_dataset'):
            print(f'          * dataset: `{task.input_dataset}`')
        if hasattr(task, 'input_directory'):
            print(f'          * dataset: `{task.input_directory}`')

import multiprocessing
import time
import glob

class TaskManager:
    def __init__(self, sub_name, tasks, num_processes, local_dir_base):
        self.tasks = tasks
        self.num_processes = num_processes
        self.sub_name = sub_name
        self.local_dir_base = local_dir_base

    def configure(self, task_config, cluster, job_id):
        # Simulate configuration step
        print(f"Configuring task {task_config}")
        job_dir = os.path.join(self.local_dir_base, f'{self.sub_name}_{task_config.version}_{task_config.task_name}_{cluster}_{job_id}')
        os.mkdir(job_dir)
        shutil.copy(f'{task_config.task_base_dir}/sandbox.tgz' , job_dir)
        shutil.copy(f'{task_config.task_base_dir}/cmssw_setup.sh' , job_dir)
        shutil.copy(f'{task_config.task_dir}/copy_files.sh' , job_dir)
        shutil.copy(f'{task_config.task_dir}/conf/params.sh' , job_dir)
        shutil.copy(f'{task_config.task_dir}/conf/run.sh' , job_dir)
        shutil.copy(f'{task_config.task_dir}/conf/input_cfg.py' , job_dir)
        shutil.copy(f'{task_config.task_dir}/conf/job_config_{job_id}.py' , job_dir)
        return job_dir

    def execute(self, task):
        def execute_script_in_dir(directory, command, stdout_file, stderr_file):
            print(f'dir: {directory}')
            print(f'command: {command}')
            print(f'std out: {stdout_file}')
            print(f'std err: {stderr_file}')
            # Execute the script
            with open(stdout_file, "a") as stdout_f:
                with open(stderr_file, "a") as stderr_f:
                    # Execute the script in the subprocess
                    proc = subprocess.Popen(command, cwd=directory, stdout=stdout_f, stderr=stderr_f, env={})
                    proc.wait()
            print(f'process return code: {proc.returncode}')
            return proc.returncode

        # execute_script_in_dir(job_dir, 'cmssw_setup.sh')
        print (task)
        task_config = task[0]
        cluster = task[1]
        job = task[2]
        # Simulate execution step
        print(f"Executing task {task_config}, cluster: {cluster}, job: {job}")
        job_dir = self.configure(task_config, cluster, job)
        stdout_file = f'{job_dir}/local_{cluster}_{job}.out'
        stderr_file = f'{job_dir}/local_{cluster}_{job}.err'
        cmsRunRet = 1
        copyRet = 1
        cmsRunRet = execute_script_in_dir(job_dir, ['sh', 'run.sh', str(cluster), str(job)], stdout_file, stderr_file)
        if cmsRunRet == 0:
            copyRet = execute_script_in_dir(job_dir, ['./copy_files.sh'], stdout_file, stderr_file)
        shutil.copy(stdout_file , f'{task_config.task_dir}/logs/')
        shutil.copy(stderr_file , f'{task_config.task_dir}/logs/')
        if copyRet == 0:
            shutil.rmtree(job_dir)


    def count_exec_files(self, task_config):
        file_pattern = "job_config_*.py"
        # Use glob to find files matching the pattern
        matching_files = glob.glob(f'{task_config.task_dir}/conf/job_config_*.py')
        return len(matching_files)

    def run(self):
        with multiprocessing.Pool(processes=self.num_processes) as pool:
            args_list = []
            for task in self.tasks:
                n_jobs = self.count_exec_files(task)
                # n_jobs = 2
                print(f"task: {task} # of jobs: {n_jobs}")
                for job in range(0, n_jobs):
                    args_list.append((task, 0, job))
                    # self.execute((task, 0, job))
            pool.map(self.execute, args_list)

def main():
    usage = ('usage: %prog [options]\n'
             + '%prog -h for help')
    parser = optparse.OptionParser(usage)
    parser.add_option('-f', '--file', dest='CONFIGFILE', help='specify the yaml configuration file')
    parser.add_option("--create", action="store_true", dest="CREATE", default=False, help="create the job configuration")
    parser.add_option("--submit", action="store_true", dest="SUBMIT", default=False, help="submit the jobs to condor")
    parser.add_option("--status", action="store_true", dest="STATUS", default=False, help="check the status of the condor tasks")
    parser.add_option("--run-local", action="store_true", dest="RUN", default=False, help="run the tasks on the local host")
    parser.add_option("--doc", action="store_true", dest="DOC", default=False, help="print setup for documentation")
    parser.add_option('-j', '--jobs', dest='NJOBS', help='specify the # of parallel jobs for local processing', default=4)
    parser.add_option('-d', '--dir', dest='LOCALDIR', help='specify the top local directory for local jobs')

    global opt, args
    (opt, args) = parser.parse_args()

    # cfgfile = ConfigParser.ConfigParser()
    # cfgfile.optionxform = str
    # 
    # cfgfile.read(opt.CONFIGFILE)
    
    
    cfgfile = {}
    cfgfile.update(parse_yaml(opt.CONFIGFILE))
    
    sub_name = cfgfile['Common']['name']
    tasks = cfgfile['Common']['tasks']
    task_configs = []
    print(tasks)
    for task in tasks:
        task_configs.append(TaskConfig(task, cfgfile))

    for task_conf in task_configs:
        print(task_conf)

    if opt.CREATE:
        for task_conf in task_configs:
            print('-- Creating task {}'.format(task_conf.task_name))
            # 1 create local dir
            createTaskSetup(task_conf, cfgfile)
    elif opt.SUBMIT:
        for task_conf in task_configs:
            print('-- Submitting task {}'.format(task_conf.task_name))
            # 1 create local dir
            submitTask(sub_name, task_conf)
    elif opt.RUN:
        if not opt.LOCALDIR:
            print("Error: LOCALDIR not specified. Please use the -d option to specify the top local directory for local jobs.")
            parser.print_help()
            exit(1)
        tm = TaskManager(sub_name, task_configs, int(opt.NJOBS), opt.LOCALDIR)
        tm.run()
    elif opt.STATUS:
        for task_conf in task_configs:
            print('-- Status of task {}'.format(task_conf.task_name))
            clusterId = getCondorCluster(task_conf)
            printStatus(clusterId)
            printWait(task_conf, clusterId)
            print('   out dir: {}'.format(task_conf.output_dir))
    elif opt.DOC:
        printDoc(task_configs)

if __name__ == "__main__":
    main()