Python RLFSMの例、dynamo.fileop.rlfsm.RLFSM Pythonの例

コード例 #1

0

ファイルを表示

ファイル: rates.py プロジェクト: ellenlee1/dynamo

class CurrentFileTransfers(WebModule):
    """
    Web module that lists the rows of `transfer_tasks` together with the
    transfer status reported for each task's batch.
    """

    def __init__(self, config):
        """
        Initialize the base web module and attach an RLFSM set to read-only.

        :param config: Passed through to WebModule.__init__.
        """
        WebModule.__init__(self, config)

        self.rlfsm = RLFSM()
        self.rlfsm.set_read_only(True)

    def run(self, caller, request, inventory):
        """
        Build one dictionary per transfer task, in the order returned by the
        query (ORDER BY q.`id`).

        Each dictionary has the keys id, from, to, lfn, size, status, start
        and finish. Tasks without a reported transfer get status 'unknown'
        and empty start / finish strings.

        :returns: List of dictionaries as described above.
        :rtype: list
        """
        def timestamp_text(epoch):
            # Missing timestamps become an empty string; others are rendered in UTC.
            if epoch is None:
                return ''
            return time.strftime('%Y-%m-%d %H:%M:%S', time.gmtime(epoch))

        sql = (
            'SELECT q.`id`, q.`batch_id`, ss.`name`, sd.`name`, f.`name`, f.`size` FROM `transfer_tasks` AS q'
            ' INNER JOIN `file_subscriptions` AS u ON u.`id` = q.`subscription_id`'
            ' INNER JOIN `sites` AS ss ON ss.`id` = q.`source_id`'
            ' INNER JOIN `sites` AS sd ON sd.`id` = u.`site_id`'
            ' INNER JOIN `files` AS f ON f.`id` = u.`file_id`'
            ' ORDER BY q.`id`'
        )

        task_rows = self.rlfsm.db.query(sql)

        # One status query per distinct batch. The first element of each
        # returned entry is used as the task id, the rest as its details.
        details_by_task = {}
        for batch in set(row[1] for row in task_rows):
            for entry in self.rlfsm.transfer_query.get_transfer_status(batch):
                details_by_task[entry[0]] = entry[1:]

        listing = []
        for task_id, _, source, destination, lfn, size in task_rows:
            details = details_by_task.get(task_id)

            if details is None:
                status, start, finish = 'unknown', '', ''
            else:
                status = FileQuery.status_name(details[0])
                start = timestamp_text(details[2])
                finish = timestamp_text(details[3])

            listing.append({
                'id': task_id,
                'from': source,
                'to': destination,
                'lfn': lfn,
                'size': size,
                'status': status,
                'start': start,
                'finish': finish
            })

        return listing

コード例 #2

0

ファイルを表示

ファイル: rlfsmphedexcopy.py プロジェクト: SmartDataProjects/dynamo-cms

class RLFSMPhEDExReserveCopyInterface(CopyInterface):
    """
    CopyInterface using the Dynamo RLFSM.

    Besides subscribing the missing files through the RLFSM, scheduled copies
    are recorded in the `phedex_transfer_reservations` table unless the
    interface is read-only.
    """

    def __init__(self, config = None):
        """
        :param config: Configuration object. Its 'rlfsm' entry is handed to RLFSM
                       and its reserve_db_params attribute to MySQL.
        """
        # NOTE(review): config is dereferenced unconditionally below, so the
        # None default cannot actually be used - confirm whether it is needed.
        CopyInterface.__init__(self, config)
        self.rlfsm = RLFSM(config.get('rlfsm', None))
        self.mysql = MySQL(config.reserve_db_params)

    def set_read_only(self, value = True): #override
        """
        Set the read-only flag on this interface and on the underlying RLFSM.
        """
        self._read_only = value
        self.rlfsm.set_read_only(value)

    def schedule_copies(self, replica_list, operation_id, comments = ''): #override
        """
        Subscribe the missing files of every block replica and return clones.

        :param replica_list: Dataset replicas to copy; all must be at the same site.
        :param operation_id: Operation id, logged and stored with each reservation.
        :param comments: Unused in this implementation.
        :returns: List of cloned dataset replicas, one per entry of replica_list.
        :raises OperationalError: If the replicas do not all belong to exactly one site.
        """
        sites = set(r.site for r in replica_list)
        if len(sites) != 1:
            raise OperationalError('schedule_copies should be called with a list of replicas at a single site.')

        LOG.info('Scheduling copy of %d replicas to %s using RLFSM (operation %d)', len(replica_list), list(sites)[0], operation_id)

        result = []

        for replica in replica_list:
            # Function spec is to return clones (so that if specific block fails to copy, we can return a dataset replica without the block)
            clone_replica = DatasetReplica(replica.dataset, replica.site)
            clone_replica.copy(replica)
            result.append(clone_replica)

            for block_replica in replica.block_replicas:
                LOG.debug('Subscribing files for %s', str(block_replica))

                if block_replica.file_ids is None:
                    LOG.debug('No file to subscribe for %s', str(block_replica))
                    # Skip only this block. A bare return here used to abort the
                    # whole call and hand None back to the caller, dropping the
                    # remaining replicas and all reservations.
                    # NOTE(review): the block is left out of the clone, as in the
                    # original early exit - confirm whether it should be included.
                    continue

                all_files = block_replica.block.files
                missing_files = all_files - block_replica.files()

                for lfile in missing_files:
                    self.rlfsm.subscribe_file(block_replica.site, lfile)

                clone_block_replica = BlockReplica(block_replica.block, block_replica.site, block_replica.group)
                clone_block_replica.copy(block_replica)
                clone_block_replica.last_update = int(time.time())
                clone_replica.block_replicas.add(clone_block_replica)

        if not self._read_only:
            insert_sql = 'INSERT INTO `phedex_transfer_reservations` (`operation_id`, `item`, `site`, `group`) VALUES (%s, %s, %s, %s)'

            for clone_replica in result:
                if clone_replica.growing:
                    # Growing replicas are reserved once, at dataset level.
                    self.mysql.query(insert_sql, operation_id, clone_replica.dataset.name, clone_replica.site.name, clone_replica.group.name)
                else:
                    # Otherwise one reservation per cloned block.
                    for block_replica in clone_replica.block_replicas:
                        self.mysql.query(insert_sql, operation_id, block_replica.block.full_name(), clone_replica.site.name, block_replica.group.name)

        # no external dependency - everything is a success
        return result

コード例 #3

0

ファイルを表示

ファイル: current.py プロジェクト: SmartDataProjects/dynamo

class CurrentFileTransfers(WebModule):
    """
    Web module reporting every entry of `transfer_tasks` along with the
    status returned by the transfer query for its batch.
    """

    def __init__(self, config):
        """
        Set up the base web module and keep a read-only RLFSM handle.

        :param config: Passed through to WebModule.__init__.
        """
        WebModule.__init__(self, config)

        self.rlfsm = RLFSM()
        self.rlfsm.set_read_only(True)

    def run(self, caller, request, inventory):
        """
        Return a list with one dictionary per transfer task, in query order
        (ORDER BY q.`id`).

        Keys of each dictionary: id, from, to, lfn, size, status, start,
        finish. A task with no reported transfer is given status 'unknown'
        with empty start and finish.

        :rtype: list
        """
        def as_utc_string(epoch):
            # None means the timestamp is not available; report it as ''.
            if epoch is None:
                return ''
            return time.strftime('%Y-%m-%d %H:%M:%S', time.gmtime(epoch))

        sql = (
            'SELECT q.`id`, q.`batch_id`, ss.`name`, sd.`name`, f.`name`, f.`size` FROM `transfer_tasks` AS q'
            ' INNER JOIN `file_subscriptions` AS u ON u.`id` = q.`subscription_id`'
            ' INNER JOIN `sites` AS ss ON ss.`id` = q.`source_id`'
            ' INNER JOIN `sites` AS sd ON sd.`id` = u.`site_id`'
            ' INNER JOIN `files` AS f ON f.`id` = u.`file_id`'
            ' ORDER BY q.`id`'
        )

        tasks = self.rlfsm.db.query(sql)

        # Query the status once per distinct batch id and index the entries
        # by their first element, which is matched against the task id below.
        transfer_info = {}
        for batch in set(task[1] for task in tasks):
            for record in self.rlfsm.transfer_query.get_transfer_status(batch):
                transfer_info[record[0]] = record[1:]

        output = []
        for task_id, _, source, destination, lfn, size in tasks:
            info = transfer_info.get(task_id)

            if info is None:
                status, start, finish = 'unknown', '', ''
            else:
                status = FileQuery.status_name(info[0])
                start = as_utc_string(info[2])
                finish = as_utc_string(info[3])

            output.append({
                'id': task_id,
                'from': source,
                'to': destination,
                'lfn': lfn,
                'size': size,
                'status': status,
                'start': start,
                'finish': finish
            })

        return output

コード例 #4

0

ファイルを表示

ファイル: rlfsmdeletion.py プロジェクト: SmartDataProjects/dynamo

class RLFSMDeletionInterface(DeletionInterface):
    """
    DeletionInterface using the Dynamo RLFSM.
    """

    def __init__(self, config = None):
        """
        :param config: Configuration object; its 'rlfsm' entry is handed to RLFSM.
        """
        # NOTE(review): config.get is called unconditionally, so the None
        # default cannot actually be used - confirm whether it is needed.
        DeletionInterface.__init__(self, config)
        self.rlfsm = RLFSM(config.get('rlfsm', None))

    def set_read_only(self, value = True): #override
        """
        Set the read-only flag on this interface and on the underlying RLFSM.
        """
        self._read_only = value
        self.rlfsm.set_read_only(value)

    def schedule_deletions(self, replica_list, operation_id, comments = ''): #override
        """
        Desubscribe all files of the given replicas and return clones of them.

        :param replica_list: List of (dataset replica, block replicas) pairs. When
                             the second element is None, all block replicas of the
                             dataset replica are deleted.
        :param operation_id: Operation id; only used for logging here.
        :param comments: Unused in this implementation.
        :returns: List of (cloned dataset replica, cloned block replicas or None),
                  parallel to replica_list.
        :raises OperationalError: If the replicas do not all belong to exactly one site.
        """
        sites = set(r.site for r, _ in replica_list)
        if len(sites) != 1:
            # The message used to name schedule_copies (copied from the copy interface).
            raise OperationalError('schedule_deletions should be called with a list of replicas at a single site.')

        site = list(sites)[0]

        LOG.info('Scheduling deletion of %d replicas from %s using RLFSM (operation %d)', len(replica_list), site.name, operation_id)

        clones = []

        for dataset_replica, block_replicas in replica_list:
            if block_replicas is None:
                to_delete = dataset_replica.block_replicas
            else:
                to_delete = block_replicas

            for block_replica in to_delete:
                for lfile in block_replica.files():
                    self.rlfsm.desubscribe_file(block_replica.site, lfile)

            # No external dependency -> all operations are successful

            clone_replica = DatasetReplica(dataset_replica.dataset, dataset_replica.site)
            clone_replica.copy(dataset_replica)

            if block_replicas is None:
                clones.append((clone_replica, None))
            else:
                clone_blocks = []
                for block_replica in block_replicas:
                    clone_block_replica = BlockReplica(block_replica.block, block_replica.site)
                    clone_block_replica.copy(block_replica)
                    clone_block_replica.last_update = int(time.time())
                    clone_blocks.append(clone_block_replica)

                clones.append((clone_replica, clone_blocks))

        return clones

    def deletion_status(self, operation_id): #override
        """
        Not available for this interface; always raises NotImplementedError.
        """
        raise NotImplementedError('deletion_status')

コード例 #5

0

ファイルを表示

def transfer(site, files):
    """
    Requests a transfer for files from other sites
    :param str site: The target site for the transfer
    :param list files: List of file LFNs to transfer
    :returns: Two lists of files.
              The first list is of files that were not on another disk.
              The second list is of files that were also not on tape.
              Entries are the elements of ``files`` exactly as given (not stripped).
    :rtype: list, list
    """

    rlfsm = RLFSM()

    no_disk = []
    unrecoverable = []

    # Close the RLFSM database handle even when a lookup or subscription fails.
    try:
        siteobj = inventory.sites[site]

        for line in files:

            path = line.strip()
            # NOTE(review): the result of find_file is used without a check -
            # confirm how it behaves for an unknown LFN.
            fileobj = inventory.find_file(path)

            ondisk = False
            ontape = False

            for repl in fileobj.block.replicas:
                # Only replicas at other sites that actually hold the file count as sources.
                if repl.site == siteobj:
                    continue

                if not repl.has_file(fileobj):
                    continue

                if repl.site.storage_type == Site.TYPE_DISK:
                    ondisk = True
                elif repl.site.storage_type == Site.TYPE_MSS:
                    ontape = True

            if not ondisk:
                no_disk.append(line)
                if not ontape:
                    unrecoverable.append(line)

            if ondisk or ontape:
                rlfsm.subscribe_file(siteobj, fileobj)
                # Log only when a subscription was made; files without any
                # source are reported through the returned lists instead.
                LOG.info('Copying %s', path)

    finally:
        rlfsm.db.close()

    return no_disk, unrecoverable

コード例 #6

0

ファイルを表示

ファイル: rlfsmcopy.py プロジェクト: SmartDataProjects/dynamo

class RLFSMCopyInterface(CopyInterface):
    """
    CopyInterface using the Dynamo RLFSM.
    """

    def __init__(self, config = None):
        """
        :param config: Configuration object; its 'rlfsm' entry is handed to RLFSM.
        """
        # NOTE(review): config.get is called unconditionally, so the None
        # default cannot actually be used - confirm whether it is needed.
        CopyInterface.__init__(self, config)
        self.rlfsm = RLFSM(config.get('rlfsm', None))

    def set_read_only(self, value = True): #override
        """
        Set the read-only flag on this interface and on the underlying RLFSM.
        """
        self._read_only = value
        self.rlfsm.set_read_only(value)

    def schedule_copies(self, replica_list, operation_id, comments = ''): #override
        """
        Subscribe the missing files of every block replica and return clones.

        :param replica_list: Dataset replicas to copy; all must be at the same site.
        :param operation_id: Operation id; only used for logging here.
        :param comments: Unused in this implementation.
        :returns: List of cloned dataset replicas, one per entry of replica_list.
        :raises OperationalError: If the replicas do not all belong to exactly one site.
        """
        sites = set(r.site for r in replica_list)
        if len(sites) != 1:
            raise OperationalError('schedule_copies should be called with a list of replicas at a single site.')

        LOG.info('Scheduling copy of %d replicas to %s using RLFSM (operation %d)', len(replica_list), list(sites)[0], operation_id)

        result = []

        for replica in replica_list:
            # Function spec is to return clones (so that if specific block fails to copy, we can return a dataset replica without the block)
            clone_replica = DatasetReplica(replica.dataset, replica.site)
            clone_replica.copy(replica)
            result.append(clone_replica)

            for block_replica in replica.block_replicas:
                LOG.debug('Subscribing files for %s', str(block_replica))

                if block_replica.file_ids is None:
                    LOG.debug('No file to subscribe for %s', str(block_replica))
                    # Skip only this block. A bare return here used to abort the
                    # whole call and hand None back to the caller, dropping the
                    # remaining replicas.
                    # NOTE(review): the block is left out of the clone, as in the
                    # original early exit - confirm whether it should be included.
                    continue

                all_files = block_replica.block.files
                missing_files = all_files - block_replica.files()

                for lfile in missing_files:
                    self.rlfsm.subscribe_file(block_replica.site, lfile)

                clone_block_replica = BlockReplica(block_replica.block, block_replica.site, block_replica.group)
                clone_block_replica.copy(block_replica)
                clone_block_replica.last_update = int(time.time())
                clone_replica.block_replicas.add(clone_block_replica)

        # no external dependency - everything is a success
        return result

コード例 #7

0

ファイルを表示

def delete(site, files):
    """
    Enters files into the deletion queue for a site
    :param str site: Site to execute deletion
    :param files: Iterable of full LFNs of files or directories to delete.
                  May be a one-shot iterator; it is consumed exactly once.
    :returns: Number of paths entered into the deletion queue
    :rtype: int
    """

    rlfsm = RLFSM()

    # Counted while iterating so that the result does not depend on len(files),
    # which is unavailable for generators.
    num_queued = 0

    # Close the RLFSM database handle even when a lookup or desubscription fails.
    try:
        siteobj = inventory.sites[site]

        for path in files:
            path = path.strip()
            LOG.info('Deleting %s', path)

            rlfsm.desubscribe_file(siteobj, inventory.find_file(path))
            num_queued += 1

    finally:
        rlfsm.db.close()

    return num_queued

コード例 #8

0

ファイルを表示

ファイル: rlfsmcopy.py プロジェクト: SmartDataProjects/dynamo

 def __init__(self, config = None):
     """
     Run the CopyInterface initializer, then create the RLFSM from the
     'rlfsm' entry of config (None is passed as the fallback).
     """
     CopyInterface.__init__(self, config)

     rlfsm_config = config.get('rlfsm', None)
     self.rlfsm = RLFSM(rlfsm_config)

コード例 #9

0

ファイルを表示

ファイル: rlfsmphedexcopy.py プロジェクト: SmartDataProjects/dynamo-cms

 def __init__(self, config = None):
     """
     Run the CopyInterface initializer, then create the RLFSM from the
     'rlfsm' entry of config and the MySQL handle from reserve_db_params.
     """
     CopyInterface.__init__(self, config)

     rlfsm_config = config.get('rlfsm', None)
     self.rlfsm = RLFSM(rlfsm_config)

     reserve_params = config.reserve_db_params
     self.mysql = MySQL(reserve_params)

コード例 #10

0

ファイルを表示

ファイル: rlfsmdeletion.py プロジェクト: kpark1/dynamo

 def __init__(self, config=None):
     """
     Run the DeletionInterface initializer, then create the RLFSM from the
     'rlfsm' entry of config (None is passed as the fallback).
     """
     DeletionInterface.__init__(self, config)

     rlfsm_config = config.get('rlfsm', None)
     self.rlfsm = RLFSM(rlfsm_config)

コード例 #11

0

ファイルを表示

ファイル: rlfsmdeletion.py プロジェクト: kpark1/dynamo

class RLFSMDeletionInterface(DeletionInterface):
    """
    DeletionInterface using the Dynamo RLFSM.
    """
    def __init__(self, config=None):
        """
        :param config: Configuration object; its 'rlfsm' entry is handed to RLFSM.
        """
        # NOTE(review): config.get is called unconditionally, so the None
        # default cannot actually be used - confirm whether it is needed.
        DeletionInterface.__init__(self, config)
        self.rlfsm = RLFSM(config.get('rlfsm', None))

    def set_read_only(self, value=True):  #override
        """
        Set the read-only flag on this interface and on the underlying RLFSM.
        """
        self._read_only = value
        self.rlfsm.set_read_only(value)

    def schedule_deletions(self,
                           replica_list,
                           operation_id,
                           comments=''):  #override
        """
        Desubscribe all files of the given replicas and return clones of them.

        :param replica_list: List of (dataset replica, block replicas) pairs. When
                             the second element is None, all block replicas of the
                             dataset replica are deleted.
        :param operation_id: Operation id; only used for logging here.
        :param comments: Unused in this implementation.
        :returns: List of (cloned dataset replica, cloned block replicas or None),
                  parallel to replica_list.
        :raises OperationalError: If the replicas do not all belong to exactly one site.
        """
        sites = set(r.site for r, _ in replica_list)
        if len(sites) != 1:
            # The message used to name schedule_copies (copied from the copy interface).
            raise OperationalError(
                'schedule_deletions should be called with a list of replicas at a single site.'
            )

        site = list(sites)[0]

        LOG.info(
            'Scheduling deletion of %d replicas from %s using RLFSM (operation %d)',
            len(replica_list), site.name, operation_id)

        clones = []

        for dataset_replica, block_replicas in replica_list:
            if block_replicas is None:
                to_delete = dataset_replica.block_replicas
            else:
                to_delete = block_replicas

            for block_replica in to_delete:
                for lfile in block_replica.files():
                    self.rlfsm.desubscribe_file(block_replica.site, lfile)

            # No external dependency -> all operations are successful

            clone_replica = DatasetReplica(dataset_replica.dataset,
                                           dataset_replica.site)
            clone_replica.copy(dataset_replica)

            if block_replicas is None:
                clones.append((clone_replica, None))
            else:
                clone_blocks = []
                for block_replica in block_replicas:
                    clone_block_replica = BlockReplica(block_replica.block,
                                                       block_replica.site)
                    clone_block_replica.copy(block_replica)
                    clone_block_replica.last_update = int(time.time())
                    clone_blocks.append(clone_block_replica)

                clones.append((clone_replica, clone_blocks))

        return clones

    def deletion_status(self, operation_id):  #override
        """
        Not available for this interface; always raises NotImplementedError.
        """
        raise NotImplementedError('deletion_status')

コード例 #12

0

ファイルを表示

ファイル: release_subscriptions.py プロジェクト: dr-stringfellow/dynamo

# Command-line options used below to select which held subscriptions to act on.
# (The parser object itself is created before this excerpt.)
parser.add_argument('--site', '-s', metavar = 'SITE', dest = 'site', help = 'Site name.')
parser.add_argument('--reason', '-r', metavar = 'REASON', dest = 'reason', help = 'Hold reason.')
parser.add_argument('--id', '-i', metavar = 'ID', dest = 'ids', nargs = '+', type = int, help = 'Subscription ids.')

args = parser.parse_args()
# NOTE(review): presumably cleared so that the dynamo imports below do not see
# this script's arguments - confirm.
sys.argv = []

# Refuse to run without at least one selection criterion.
if args.site is None and args.reason is None and args.ids is None:
    sys.stderr.write('Cannot release all subscriptions.')
    sys.exit(1)

# Imported only after argument handling is finished.
from dynamo.core.executable import inventory, authorized
from dynamo.fileop.rlfsm import RLFSM

rlfsm = RLFSM()

# Unauthorized runs get a read-only RLFSM.
if not authorized:
    rlfsm.set_read_only()

# Only transfer subscriptions with status 'held' are considered.
subscriptions = rlfsm.get_subscriptions(inventory, op = 'transfer', status = ['held'])

num_released = 0

for subscription in subscriptions:
    # Skip subscriptions that do not match the requested ids.
    if args.ids is not None and subscription.id not in args.ids:
        continue

    # Skip subscriptions whose destination is not the requested site.
    if args.site is not None and subscription.destination.name != args.site:
        continue

コード例 #13

0

ファイルを表示

ファイル: current.py プロジェクト: SmartDataProjects/dynamo

    def __init__(self, config):
        """
        Initialize the base web module and attach an RLFSM set to read-only.
        """
        WebModule.__init__(self, config)

        read_only_rlfsm = RLFSM()
        self.rlfsm = read_only_rlfsm
        read_only_rlfsm.set_read_only(True)

コード例 #14

0

ファイルを表示

ファイル: rates.py プロジェクト: ellenlee1/dynamo

    def __init__(self, config):
        """
        Set up the base web module and keep a read-only RLFSM handle.
        """
        WebModule.__init__(self, config)

        rlfsm_handle = RLFSM()
        self.rlfsm = rlfsm_handle
        rlfsm_handle.set_read_only(True)