Source code for dbs.apis.dbsClient

from __future__ import print_function
from dbs.exceptions.dbsClientException import dbsClientException
from RestClient.ErrorHandling.RestClientExceptions import HTTPError
from RestClient.RestApi import RestApi
from RestClient.AuthHandling.X509Auth import X509Auth
from RestClient.ProxyPlugins.Socks5Proxy import Socks5Proxy

import cjson
import os
import socket
import sys
import urllib

[docs]def slicedIterator(sourceList, sliceSize): """ :param: sourceList: list which need to be sliced :type: list :param: sliceSize: size of the slice :type: int :return: iterator of the sliced list """ start = 0 end = 0 while len(sourceList) > end: end = start + sliceSize yield sourceList[start: end] start = end
[docs]def checkInputParameter(method, parameters, validParameters, requiredParameters=None): """ Helper function to check input by using before sending to the server :param method: Name of the API :type method: str :param validParameters: Allow parameters for the API call :type validParameters: list :param requiredParameters: Required parameters for the API call (Default: None) :type requiredParameters: list """ for parameter in parameters: if parameter not in validParameters: raise dbsClientException("Invalid input", "API %s does not support parameter %s. Supported parameters are %s" \ % (method, parameter, validParameters)) if requiredParameters is not None: if 'multiple' in requiredParameters: match = False for requiredParameter in requiredParameters['multiple']: if requiredParameter!='detail' and requiredParameter in parameters: match = True break if not match: raise dbsClientException("Invalid input", "API %s does require one of the parameters %s" \ % (method, requiredParameters['multiple'])) if 'forced' in requiredParameters: for requiredParameter in requiredParameters['forced']: if requiredParameter not in parameters: raise dbsClientException("Invalid input", "API %s does require the parameter %s. Forced required parameters are %s" \ % (method, requiredParameter, requiredParameters['forced'])) if 'standalone' in requiredParameters: overlap = [] for requiredParameter in requiredParameters['standalone']: if requiredParameter in parameters: overlap.append(requiredParameter) if len(overlap) != 1: raise dbsClientException("Invalid input", "API %s does requires only *one* of the parameters %s." \ % (method, requiredParameters['standalone']))
[docs]def list_parameter_splitting(data, key, size_limit=8000, method='GET'): """ Helper function split list used as input parameter for requests, since Apache has a limitation to 8190 Bytes for the lenght of an URI. We extended it to also split lfn and dataset list length for POST calls to avoid DB abuse even if there is no limit on hoe long the list can be. YG 2015-5-13 :param data: url parameters :type data: dict :param key: key of parameter dictionary to split by lenght :type used_size: str :param size_limit: Split list in chunks of maximal size_limit bytes :type size_limit: int """ values = list(data[key]) data[key] = [] for element in values: data[key].append(element) if method =='GET': size = len(urllib.urlencode(data)) else: size = len(data) if size > size_limit: last_element = data[key].pop() yield data data[key] = [last_element] yield data
[docs]def split_calls(func): """ Decorator to split up server calls for methods using url parameters, due to the lenght limitation of the URI in Apache. By default 8190 bytes """ def wrapper(*args, **kwargs): #The size limit is 8190 bytes minus url and api to call #For example (https://cmsweb-testbed.cern.ch/dbs/prod/global/filechildren), so 192 bytes should be safe. size_limit = 8000 encoded_url = urllib.urlencode(kwargs) if len(encoded_url) > size_limit: for key, value in kwargs.iteritems(): ###only one (first) list at a time is splitted, ###currently only file lists are supported if key in ('logical_file_name', 'block_name', 'lumi_list', 'run_num') and isinstance(value, list): ret_val = [] for splitted_param in list_parameter_splitting(data=dict(kwargs), #make a copy, since it is manipulated key=key, size_limit=size_limit): try: ret_val.extend(func(*args, **splitted_param)) except (TypeError, AttributeError):#update function call do not return lists ret_val= [] return ret_val raise dbsClientException("Invalid input", "The lenght of the urlencoded parameters to API %s \ is exceeding %s bytes and cannot be splitted." % (func.__name__, size_limit)) else: return func(*args, **kwargs) return wrapper
[docs]class DbsApi(object): """DbsApi class""" #added CAINFO and userAgent (see github issue #431 & #432) def __init__(self, url="", proxy=None, key=None, cert=None, verifypeer=True, debug=0, ca_info=None, userAgent=""): """ DbsApi Constructor :param url: server URL. :type url: str :param proxy: socks5 proxy format=(socks5://username:password@host:port) :type proxy: str :param key: full path to the private key to use :type key: str :param cert: full path to the certificate to use :type cert: str .. note:: By default the DbsApi is trying to lookup the private key and the certificate in the common locations """ self.url = url self.proxy = proxy self.key = key self.cert = cert self.userAgent = userAgent self.rest_api = RestApi(auth=X509Auth(ssl_cert=cert, ssl_key=key, ssl_verifypeer=verifypeer, ca_info=ca_info), proxy=Socks5Proxy(proxy_url=self.proxy) if self.proxy else None) def __callServer(self, method="", params={}, data={}, callmethod='GET', content='application/json'): """ A private method to make HTTP call to the DBS Server :param method: REST API to call, e.g. 'datasets, blocks, files, ...'. :type method: str :param params: Parameters to the API call, e.g. {'dataset':'/PrimaryDS/ProcessedDS/TIER'}. :type params: dict :param callmethod: The HTTP method used, by default it is HTTP-GET, possible values are GET, POST and PUT. :type callmethod: str :param content: The type of content the server is expected to return. DBS3 only supports application/json :type content: str """ UserID = os.environ['USER']+'@'+socket.gethostname() try: UserAgent = "DBSClient/"+os.environ['DBS3_CLIENT_VERSION']+"/"+ self.userAgent except: UserAgent = "DBSClient/Unknown"+"/"+ self.userAgent request_headers = {"Content-Type": content, "Accept": content, "UserID": UserID, "User-Agent":UserAgent } method_func = getattr(self.rest_api, callmethod.lower()) data = cjson.encode(data) try: self.http_response = method_func(self.url, method, params, data, request_headers) except HTTPError as http_error: self.__parseForException(http_error) if content != "application/json": return self.http_response.body try: json_ret=cjson.decode(self.http_response.body) except cjson.DecodeError: print("The server output is not a valid json, most probably you have a typo in the url.\n%s.\n" % self.url, file=sys.stderr) raise dbsClientException("Invalid url", "Possible urls are %s" %self.http_response.body) return json_ret def __parseForException(self, http_error): """ An internal method, should not be used by clients :param httperror: Thrown httperror by the server """ data = http_error.body try: if isinstance(data, str): data = cjson.decode(data) except: raise http_error if isinstance(data, dict) and 'exception' in data:# re-raise with more details raise HTTPError(http_error.url, data['exception'], data['message'], http_error.header, http_error.body) raise http_error @property def requestTimingInfo(self): """ Returns the time needed to process the request by the frontend server in microseconds and the EPOC timestamp of the request in microseconds. :rtype: tuple containing processing time and timestamp """ try: return tuple(item.split('=')[1] for item in self.http_response.header.get('CMS-Server-Time').split()) except AttributeError: return None, None @property def requestContentLength(self): """ Returns the content-length of the content return by the server :rtype: str """ try: return self.http_response.header.get('Content-Length') except AttributeError: return None
[docs] def blockDump(self,**kwargs): """ API the list all information related with the block_name :param block_name: Name of the block to be dumped (Required) :type block_name: str """ validParameters = ['block_name'] requiredParameters = {'forced':validParameters} checkInputParameter(method="blockDump", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("blockdump", params=kwargs)
[docs] def help(self, **kwargs): """ API to get a list of supported REST APIs. In the case a particular API is specified, the docstring of that API is displayed. :param call: REST API call for which help is desired (Optional) :type call: str :return: List of APIs or detailed information about a specific call (parameters and docstring) :rtype: List of strings or a dictionary containing params and doc keys depending on the input parameter """ validParameters = ['call'] checkInputParameter(method="help", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("help", params=kwargs)
[docs] def insertAcquisitionEra(self, acqEraObj): """ API to insert an Acquisition Era in DBS :param acqEraObj: Acquisition Era object :type acqEraObj: dict :key acquisition_era_name: Acquisition Era Name (Required) :key start_date: start date of the acquisition era (unixtime, int) (Optional, default current date) :key end_date: end data of the acquisition era (unixtime, int) (Optional) """ return self.__callServer("acquisitioneras", data=acqEraObj, callmethod='POST' )
[docs] def insertBlock(self, blockObj): """ API to insert a block into DBS :param blockObj: Block object :type blockObj: dict :key open_for_writing: Open For Writing (1/0) (Optional, default 1) :key block_size: Block Size (Optional, default 0) :key file_count: File Count (Optional, default 0) :key block_name: Block Name (Required) :key origin_site_name: Origin Site Name (Required) """ return self.__callServer("blocks", data=blockObj, callmethod='POST' )
[docs] def insertBulkBlock(self, blockDump): """ API to insert a bulk block :param blockDump: Output of the block dump command, example can be found in https://svnweb.cern.ch/trac/CMSDMWM/browser/DBS/trunk/Client/tests/dbsclient_t/unittests/blockdump.dict :type blockDump: dict """ return self.__callServer("bulkblocks", data=blockDump, callmethod='POST' )
[docs] def insertDataset(self, datasetObj): """ API to insert a dataset in DBS :param datasetObj: Dataset object :type datasetObj: dict :key primary_ds_name: Primary Dataset Name (Required) :key dataset: Name of the dataset (Required) :key dataset_access_type: Dataset Access Type (Required) :key processed_ds_name: Processed Dataset Name (Required) :key data_tier_name: Data Tier Name (Required) :key acquisition_era_name: Acquisition Era Name (Required) :key processing_version: Processing Version (Required) :key physics_group_name: Physics Group Name (Optional, default None) :key prep_id: ID of the Production and Reprocessing management tool (Optional, default None) :key xtcrosssection: Xtcrosssection (Optional, default None) :key output_configs: List(dict) with keys release_version, pset_hash, app_name, output_module_label and global tag """ return self.__callServer("datasets", data = datasetObj, callmethod='POST' )
[docs] def insertDataTier(self, dataTierObj): """ API to insert A Data Tier in DBS :param dataTierObj: Data Tier object :type dataTierObj: dict :key data_tier_name: Data Tier that needs to be inserted """ return self.__callServer("datatiers", data = dataTierObj, callmethod='POST' )
[docs] def insertFiles(self, filesList, qInserts=False): """ API to insert a list of file into DBS in DBS. Up to 10 files can be inserted in one request. :param qInserts: True means that inserts will be queued instead of done immediately. INSERT QUEUE Manager will perform the inserts, within few minutes. :type qInserts: bool :param filesList: List of dictionaries containing following information :type filesList: list of dicts :key logical_file_name: File to be inserted (str) (Required) :key is_file_valid: (optional, default = 1): (bool) :key block: required: /a/b/c#d (str) :key dataset: required: /a/b/c (str) :key file_type: (optional, default = EDM) one of the predefined types, (str) :key check_sum: (optional, default = '-1') (str) :key event_count: (optional, default = -1) (int) :key file_size: (optional, default = -1.) (float) :key adler32: (optional, default = '') (str) :key md5: (optional, default = '') (str) :key auto_cross_section: (optional, default = -1.) (float) :key file_lumi_list: (optional, default = []) [{'run_num': 123, 'lumi_section_num': 12},{}....] :key file_parent_list: (optional, default = []) [{'file_parent_lfn': 'mylfn'},{}....] :key file_assoc_list: (optional, default = []) [{'file_parent_lfn': 'mylfn'},{}....] :key file_output_config_list: (optional, default = []) [{'app_name':..., 'release_version':..., 'pset_hash':...., output_module_label':...},{}.....] """ if not qInserts: #turn off qInserts return self.__callServer("files", params={'qInserts': qInserts}, data=filesList, callmethod='POST' ) return self.__callServer("files", data=filesList, callmethod='POST' )
[docs] def insertOutputConfig(self, outputConfigObj): """ API to insert An OutputConfig in DBS :param outputConfigObj: Output Config object :type outputConfigObj: dict :key app_name: App Name (Required) :key release_version: Release Version (Required) :key pset_hash: Pset Hash (Required) :key output_module_label: Output Module Label (Required) :key global_tag: Global Tag (Required) :key scenario: Scenario (Optional, default is None) :key pset_name: Pset Name (Optional, default is None) """ return self.__callServer("outputconfigs", data=outputConfigObj, callmethod='POST' )
[docs] def insertPrimaryDataset(self, primaryDSObj): """ API to insert A primary dataset in DBS :param primaryDSObj: primary dataset object :type primaryDSObj: dict :key primary_ds_type: TYPE (out of valid types in DBS, MC, DATA) (Required) :key primary_ds_name: Name of the primary dataset (Required) """ return self.__callServer("primarydatasets", data=primaryDSObj, callmethod='POST' )
[docs] def insertProcessingEra(self, procEraObj): """ API to insert A Processing Era in DBS :param procEraObj: Processing Era object :type procEraObj: dict :key processing_version: Processing Version (Required) :key description: Description (Optional) """ return self.__callServer("processingeras", data=procEraObj, callmethod='POST' )
[docs] def listApiDocumentation(self): """ API to retrieve the auto-generated documentation page from server """ return self.__callServer(content="text/html")
[docs] def listAcquisitionEras(self, **kwargs): """ API to list all Acquisition Eras in DBS. :param acquisition_era_name: Acquisition era name (Optional, wild cards allowed) :type acquisition_era_name: str :returns: List of dictionaries containing following keys (description, end_date, acquisition_era_name, create_by, creation_date and start_date) :rtype: list of dicts """ validParameters = ['acquisition_era_name'] checkInputParameter(method="listAcquisitionEras", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("acquisitioneras", params=kwargs)
[docs] def listAcquisitionEras_ci(self, **kwargs): """ API to list all Acquisition Eras (case insensitive) in DBS. :param acquisition_era_name: Acquisition era name (Optional, wild cards allowed) :type acquisition_era_name: str :returns: List of dictionaries containing following keys (description, end_date, acquisition_era_name, create_by, creation_date and start_date) :rtype: list of dicts """ validParameters = ['acquisition_era_name'] checkInputParameter(method="listAcquisitionEras", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("acquisitioneras_ci", params=kwargs)
[docs] def listBlockChildren(self, **kwargs): """ API to list block children. :param block_name: name of block who's children needs to be found (Required) :type block_name: str :returns: List of dictionaries containing following keys (block_name) :rtype: list of dicts """ validParameters = ['block_name'] requiredParameters = {'forced': validParameters} checkInputParameter(method="listBlockChildren", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("blockchildren", params=kwargs)
[docs] def listBlockParents(self, **kwargs): """ API to list block parents. :param block_name: name of block who's parents needs to be found (Required) :type block_name: str :returns: List of dictionaries containing following keys (block_name) :rtype: list of dicts """ validParameters = ['block_name'] requiredParameters = {'forced': validParameters} checkInputParameter(method="listBlockParents", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) if isinstance(kwargs["block_name"], list): return self.__callServer("blockparents", data=kwargs, callmethod='POST') else: return self.__callServer("blockparents", params=kwargs)
[docs] def listBlocks(self, **kwargs): """ API to list a block in DBS. At least one of the parameters block_name, dataset, data_tier_name or logical_file_name are required. If data_tier_name is provided, min_cdate and max_cdate have to be specified and the difference in time have to be less than 31 days. :param block_name: name of the block :type block_name: str :param dataset: dataset :type dataset: str :param data_tier_name: data tier :type data_tier_name: str :param logical_file_name: Logical File Name :type logical_file_name: str :param origin_site_name: Origin Site Name (Optional) :type origin_site_name: str :param run_num: run numbers (Optional). Possible format: run_num, "run_min-run_max", or ["run_min-run_max", run1, run2, ...] :type run_num: int, list of runs or list of run ranges :param min_cdate: Lower limit for the creation date (unixtime) (Optional) :type min_cdate: int, str :param max_cdate: Upper limit for the creation date (unixtime) (Optional) :type max_cdate: int, str :param min_ldate: Lower limit for the last modification date (unixtime) (Optional) :type min_ldate: int, str :param max_ldate: Upper limit for the last modification date (unixtime) (Optional) :type max_ldate: int, str :param cdate: creation date (unixtime) (Optional) :type cdate: int, str :param ldate: last modification date (unixtime) (Optional) :type ldate: int, str :param detail: Get detailed information of a block (Optional) :type detail: bool :returns: List of dictionaries containing following keys (block_name). If option detail is used the dictionaries contain the following keys (block_id, create_by, creation_date, open_for_writing, last_modified_by, dataset, block_name, file_count, origin_site_name, last_modification_date, dataset_id and block_size) :rtype: list of dicts """ validParameters = ['dataset', 'block_name', 'data_tier_name', 'origin_site_name', 'logical_file_name', 'run_num', 'open_for_writing', 'min_cdate', 'max_cdate', 'min_ldate', 'max_ldate', 'cdate', 'ldate', 'detail'] #requiredParameters = {'multiple': validParameters} requiredParameters = {'multiple': ['dataset', 'block_name', 'data_tier_name', 'logical_file_name']} #set defaults if 'detail' not in kwargs.keys(): kwargs['detail'] = False checkInputParameter(method="listBlocks", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("blocks", params=kwargs)
@split_calls def listBlockSummaries(self, **kwargs): """ API that returns summary information like total size and total number of events in a dataset or a list of blocks :param block_name: list block summaries for block_name(s) :type block_name: str, list :param dataset: list block summaries for all blocks in dataset :type dataset: str :param detail: list block summary by block names if detail=True, default=False :type detail: str, bool :returns: list of dicts containing total block_sizes, file_counts and event_counts of dataset or blocks provided """ validParameters = ['block_name', 'dataset', 'detail'] requiredParameters = {'standalone': ['block_name', 'dataset']} checkInputParameter(method="listBlockSummaries", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer('blocksummaries', params=kwargs)
[docs] def listBlockOrigin(self, **kwargs): """ API to list blocks first generated in origin_site_name. :param origin_site_name: Origin Site Name (Optional No wildcards) :type origin_site_name: str :param dataset: dataset (Either dataset or block_name is required, No wildcards) :type dataset: str :param block_name: block (Either dataset or block_name is required, No wildcards) :type block_name: str :returns: List of dictionaries containing the following keys (create_by, creation_date, open_for_writing, last_modified_by, dataset, block_name, file_count, origin_site_name, last_modification_date, block_size) :rtype: list of dicts """ validParameters = ['origin_site_name', 'dataset', 'block_name'] requiredParameters = {'multiple': ['dataset', 'block_name']} checkInputParameter(method="listBlockOrigin", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer('blockorigin', params=kwargs)
[docs] def listDatasets(self, **kwargs): """ API to list dataset(s) in DBS * You can use ANY combination of these parameters in this API * In absence of parameters, all valid datasets known to the DBS instance will be returned :param dataset: Full dataset (path) of the dataset :type dataset: str :param parent_dataset: Full dataset (path) of the dataset :type parent_dataset: str :param release_version: cmssw version :type release_version: str :param pset_hash: pset hash :type pset_hash: str :param app_name: Application name (generally it is cmsRun) :type app_name: str :param output_module_label: output_module_label :type output_module_label: str :param processing_version: Processing Version :type processing_version: str :param acquisition_era_name: Acquisition Era :type acquisition_era_name: str :param run_num: Specify a specific run number or range: Possible format: run_num, "run_min-run_max", or ["run_min-run_max", run1, run2, ...] :type run_num: int,list,str :param physics_group_name: List only dataset having physics_group_name attribute :type physics_group_name: str :param logical_file_name: List dataset containing the logical_file_name :type logical_file_name: str :param primary_ds_name: Primary Dataset Name :type primary_ds_name: str :param primary_ds_type: Primary Dataset Type (Type of data, MC/DATA) :type primary_ds_type: str :param processed_ds_name: List datasets having this processed dataset name :type processed_ds_name: str :param data_tier_name: Data Tier :type data_tier_name: str :param dataset_access_type: Dataset Access Type ( PRODUCTION, DEPRECATED etc.) :type dataset_access_type: str :param prep_id: prep_id :type prep_id: str :param create_by: Creator of the dataset :type create_by: str :param last_modified_by: Last modifier of the dataset :type last_modified_by: str :param min_cdate: Lower limit for the creation date (unixtime) (Optional) :type min_cdate: int, str :param max_cdate: Upper limit for the creation date (unixtime) (Optional) :type max_cdate: int, str :param min_ldate: Lower limit for the last modification date (unixtime) (Optional) :type min_ldate: int, str :param max_ldate: Upper limit for the last modification date (unixtime) (Optional) :type max_ldate: int, str :param cdate: creation date (unixtime) (Optional) :type cdate: int, str :param ldate: last modification date (unixtime) (Optional) :type ldate: int, str :param detail: List all details of a dataset :type detail: bool :param dataset_id: DB primary key of datasets table. :type dataset_id: int, str :returns: List of dictionaries containing the following keys (dataset). If the detail option is used. The dictionary contain the following keys (primary_ds_name, physics_group_name, acquisition_era_name, create_by, dataset_access_type, data_tier_name, last_modified_by, creation_date, processing_version, processed_ds_name, xtcrosssection, last_modification_date, dataset_id, dataset, prep_id, primary_ds_type) :rtype: list of dicts """ validParameters = ['dataset', 'parent_dataset', 'is_dataset_valid', 'release_version', 'pset_hash', 'app_name', 'output_module_label', 'processing_version', 'acquisition_era_name', 'run_num', 'physics_group_name', 'logical_file_name', 'primary_ds_name', 'primary_ds_type', 'data_tier_name', 'dataset_access_type', 'prep_id', 'create_by', 'last_modified_by', 'min_cdate', 'max_cdate', 'min_ldate', 'max_ldate', 'cdate', 'ldate', 'detail', 'dataset_id'] #set defaults if 'detail' not in kwargs.keys(): kwargs['detail'] = False checkInputParameter(method="listDatasets", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("datasets", params=kwargs)
[docs] def listDatasetAccessTypes(self, **kwargs): """ API to list dataset access types. :param dataset_access_type: List that dataset access type (Optional) :type dataset_access_type: str :returns: List of dictionary containing the following key (dataset_access_type). :rtype: List of dicts """ validParameters = ['dataset_access_type'] checkInputParameter(method="listDatasetAccessTypes", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("datasetaccesstypes", params=kwargs)
[docs] def listDatasetArray(self, **kwargs): """ API to list datasets in DBS. :param dataset: list of datasets [dataset1,dataset2,..,dataset n] (Required if dataset_id is not presented), Max length 1000. :type dataset: list :param dataset_id: list of dataset_ids that are the primary keys of datasets table: [dataset_id1,dataset_id2,..,dataset_idn] (Required if dataset is not presented), Max length 1000. :type dataset: list :param dataset_access_type: List only datasets with that dataset access type (Optional) :type dataset_access_type: str :param detail: brief list or detailed list 1/0 :type detail: bool :returns: List of dictionaries containing the following keys (dataset). If the detail option is used. The dictionary contains the following keys (primary_ds_name, physics_group_name, acquisition_era_name, create_by, dataset_access_type, data_tier_name, last_modified_by, creation_date, processing_version, processed_ds_name, xtcrosssection, last_modification_date, dataset_id, dataset, prep_id, primary_ds_type) :rtype: list of dicts """ validParameters = ['dataset', 'dataset_access_type', 'detail', 'dataset_id'] requiredParameters = {'multiple': ['dataset', 'dataset_id']} checkInputParameter(method="listDatasetArray", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) #set defaults if 'detail' not in kwargs.keys(): kwargs['detail'] = False return self.__callServer("datasetlist", data=kwargs, callmethod='POST')
[docs] def listDatasetChildren(self, **kwargs): """ API to list A datasets children in DBS. :param dataset: dataset (Required) :type dataset: str :returns: List of dictionaries containing the following keys (child_dataset_id, child_dataset, dataset) :rtype: list of dicts """ validParameters = ['dataset'] requiredParameters = {'forced': validParameters} checkInputParameter(method="listDatasetChildren", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("datasetchildren", params=kwargs)
[docs] def listDatasetParents(self, **kwargs): """ API to list A datasets parents in DBS. :param dataset: dataset (Required) :type dataset: str :returns: List of dictionaries containing the following keys (this_dataset, parent_dataset_id, parent_dataset) :rtype: list of dicts """ validParameters = ['dataset'] requiredParameters = {'forced': validParameters} checkInputParameter(method="listDatasetParents", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("datasetparents", params=kwargs)
[docs] def listDataTiers(self, **kwargs): """ API to list data tiers known to DBS. :param data_tier_name: List details on that data tier (Optional) :type data_tier_name: str :returns: List of dictionaries containing the following keys (data_tier_id, data_tier_name, create_by, creation_date) :rtype: list of dicts """ validParameters = ['data_tier_name'] checkInputParameter(method="listDataTiers", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("datatiers", params=kwargs)
[docs] def listDataTypes(self, **kwargs): """ API to list data types known to dbs (when no parameter supplied). :param dataset: Returns data type (of primary dataset) of the dataset (Optional) :type dataset: str :param datatype: List specific data type :type datatype: str :returns: List of dictionaries containing the following keys (primary_ds_type_id, data_type) :rtype: list of dicts """ validParameters = ['datatype', 'dataset'] checkInputParameter(method="listDataTypes", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("datatypes", params=kwargs)
[docs] def listFileChildren_doc(self, **kwargs): """ API to list file children. One of the parameters in mandatory. :param logical_file_name: logical_file_name of file :type logical_file_name: str, list :param block_name: block_name :type block_name: str :param block_id: block_id :type block_id: str, int :returns: List of dictionaries containing the following keys (child_logical_file_name, logical_file_name) :rtype: List of dicts """ pass
@split_calls def listFileChildren(self, **kwargs): """ API to list file children. One of the parameters in mandatory. :param logical_file_name: logical_file_name of file :type logical_file_name: str, list :param block_name: block_name :type block_name: str :param block_id: block_id :type block_id: str, int :returns: List of dictionaries containing the following keys (child_logical_file_name, logical_file_name) :rtype: List of dicts """ validParameters = ['logical_file_name', 'block_name', 'block_id'] requiredParameters = {'standalone': validParameters} checkInputParameter(method="listFileChildren", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("filechildren", params=kwargs)
[docs] def listFileLumis(self, **kwargs): """ API to list Lumi for files. Either logical_file_name or block_name is required. No wild card support in this API :param block_name: Name of the block :type block_name: str :param logical_file_name: logical_file_name of file :type logical_file_name: str :param run_num: List lumi sections for a given run number (Optional). Possible format: run_num, "run_min-run_max", or ["run_min-run_max", run1, run2, ...] . run_num=1 is MC data and it will cause almost whole table scan, so run_num=1 will cause an input error. :type run_num: int,str,list :param validFileOnly: default value is 0 (optional), when set to 1, only valid files counted. :type validFileOnly: int, str :returns: List of dictionaries containing the following keys (lumi_section_num, logical_file_name, run) :rtype: list of dicts """ validParameters = ['logical_file_name', 'block_name', 'run_num', 'validFileOnly'] requiredParameters = {'standalone': ['logical_file_name', 'block_name']} checkInputParameter(method="listFileLumis", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("filelumis", params=kwargs)
[docs] def listFileLumiArray(self, **kwargs): """ API to list Lumiis for a list of files. A list of logical_file_names is required. No wild card support in this API :param logical_file_name: logical_file_name of file, Max length 1000. :type logical_file_name: str, list :param run_num: List lumi sections for a given run number (Optional). Possible format: run_num, "run_min-run_max", or ["run_min-run_max", run1, run2, ...] . run_num=1 is MC data and it will cause almost whole table scan, so run_num=1 will cause an input error. Max length 1000. :type run_num: int,str,list :param validFileOnly: default value is 0 (optional), when set to 1, only valid files counted. :type validFileOnly: int, str :returns: List of dictionaries containing the following keys (lumi_section_num, logical_file_name, run) :rtype: list of dicts """ validParameters = ['logical_file_name', 'run_num', 'validFileOnly'] requiredParameters = {'forced': ['logical_file_name']} checkInputParameter(method="listFileLumiArray", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("filelumis", data=kwargs, callmethod="POST")
[docs] def listFileParents_doc(self, **kwargs): """ API to list file parents :param logical_file_name: logical_file_name of file (Required) :type logical_file_name: str :param block_id: ID of the a block, whose files should be listed :type block_id: int, str :param block_name: Name of the block, whose files should be listed :type block_name: int, str :returns: List of dictionaries containing the following keys (parent_logical_file_name, logical_file_name) :rtype: list of dicts """ pass
@split_calls def listFileParents(self, **kwargs): """ API to list file parents :param logical_file_name: logical_file_name of file (Required) :type logical_file_name: str :param block_id: ID of the a block, whose files should be listed :type block_id: int, str :param block_name: Name of the block, whose files should be listed :type block_name: int, str :returns: List of dictionaries containing the following keys (parent_logical_file_name, logical_file_name) :rtype: list of dicts """ validParameters = ['logical_file_name', 'block_id', 'block_name'] requiredParameters = {'standalone': validParameters} checkInputParameter(method="listFileParents", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("fileparents", params=kwargs)
[docs] def listFiles_doc(self, **kwargs): """ API to list files in DBS. Either non-wildcarded logical_file_name, non-wildcarded dataset, non-wildcarded block_name is required. The combination of a non-wildcarded dataset or block_name with an wildcarded logical_file_name is supported. - For lumi_list the following two json formats are supported: - [a1, a2, a3,] - [[a,b], [c, d],] - lumi_list can be either a list of lumi section numbers as [a1, a2, a3,] or a list of lumi section range as [[a,b], [c, d],]. Thay cannot be mixed. - If lumi_list is provided run only run_num=single-run-number is allowed - When lfn list is present, no run or lumi list is allowed. - There are five dataset access types: VALID, INVALID, PRODUCTION, DEPRECATED and DELETED. - One file status: IS_FILE_VALID: 1 or 0. - There are five dataset access types: VALID, INVALID, PRODUCTION, DEPRECATED and DELETED. - One file status: IS_FILE_VALID: 1 or 0. - When a dataset is INVALID/ DEPRECATED/ DELETED, DBS will consider all the files under it is invalid not matter what value is_file_valid has. In general, when the dataset is in one of INVALID/ DEPRECATED/ DELETED, is_file_valid should all marked as 0, but some old DBS2 data was not. - When Dataset is VALID/PRODUCTION, by default is_file_valid is all 1. But if individual file is invalid, then the file's is_file_valid is set to 0. - DBS use this logical in its APIs that have validFileOnly variable. :param logical_file_name: logical_file_name of the file :type logical_file_name: str :param dataset: dataset :type dataset: str :param block_name: block name :type block_name: str :param release_version: release version :type release_version: str :param pset_hash: parameter set hash :type pset_hash: str :param app_name: Name of the application :type app_name: str :param output_module_label: name of the used output module :type output_module_label: str :param run_num: run , run ranges, and run list. Possible format: run_num, "run_min-run_max", or ["run_min-run_max", run1, run2, ...]. :type run_num: int, list, string :param origin_site_name: site where the file was created :type origin_site_name: str :param lumi_list: List containing luminosity sections :type lumi_list: list :param detail: Get detailed information about a file :type detail: bool :param validFileOnly: 0 or 1. default=0. Return only valid files if set to 1. :type validFileOnly: int :returns: List of dictionaries containing the following keys (logical_file_name). If detail parameter is true, the dictionaries contain the following keys (check_sum, branch_hash_id, adler32, block_id, event_count, file_type, create_by, logical_file_name, creation_date, last_modified_by, dataset, block_name, file_id, file_size, last_modification_date, dataset_id, file_type_id, auto_cross_section, md5, is_file_valid) :rtype: list of dicts """ pass
@split_calls def listFiles(self, **kwargs): """ listFiles(**kwargs) API to list files in DBS. Either non-wildcarded logical_file_name, non-wildcarded dataset, non-wildcarded block_name is required. The combination of a non-wildcarded dataset or block_name with an wildcarded logical_file_name is supported. * For lumi_list the following two json formats are supported: - [a1, a2, a3,] - [[a,b], [c, d],] * lumi_list can be either a list of lumi section numbers as [a1, a2, a3,] or a list of lumi section range as [[a,b], [c, d],]. Thay cannot be mixed. * If lumi_list is provided run only run_num=single-run-number is allowed * When lfn list is present, no run or lumi list is allowed. * There are five dataset access types: VALID, INVALID, PRODUCTION, DEPRECATED and DELETED. * One file status: IS_FILE_VALID: 1 or 0. * There are five dataset access types: VALID, INVALID, PRODUCTION, DEPRECATED and DELETED. * One file status: IS_FILE_VALID: 1 or 0. * When a dataset is INVALID/ DEPRECATED/ DELETED, DBS will consider all the files under it is invalid not matter what value is_file_valid has. In general, when the dataset is in one of INVALID/ DEPRECATED/ DELETED, is_file_valid should all marked as 0, but some old DBS2 data was not. * When Dataset is VALID/PRODUCTION, by default is_file_valid is all 1. But if individual file is invalid, then the file's is_file_valid is set to 0. * DBS use this logical in its APIs that have validFileOnly variable. :param logical_file_name: logical_file_name of the file :type logical_file_name: str :param dataset: dataset :type dataset: str :param block_name: block name :type block_name: str :param release_version: release version :type release_version: str :param pset_hash: parameter set hash :type pset_hash: str :param app_name: Name of the application :type app_name: str :param output_module_label: name of the used output module :type output_module_label: str :param run_num: run , run ranges, and run list. Possible format: run_num, "run_min-run_max", or ["run_min-run_max", run1, run2, ...]. :type run_num: int, list, string :param origin_site_name: site where the file was created :type origin_site_name: str :param lumi_list: List containing luminosity sections :type lumi_list: list :param detail: Get detailed information about a file :type detail: bool :param validFileOnly: 0 or 1. default=0. Return only valid files if set to 1. :type validFileOnly: int :returns: List of dictionaries containing the following keys (logical_file_name). If detail parameter is true, the dictionaries contain the following keys (check_sum, branch_hash_id, adler32, block_id, event_count, file_type, create_by, logical_file_name, creation_date, last_modified_by, dataset, block_name, file_id, file_size, last_modification_date, dataset_id, file_type_id, auto_cross_section, md5, is_file_valid) :rtype: list of dicts """ validParameters = ['dataset', 'block_name', 'logical_file_name', 'release_version', 'pset_hash', 'app_name', 'output_module_label', 'run_num', 'origin_site_name', 'lumi_list', 'detail', 'validFileOnly'] requiredParameters = {'multiple': validParameters} #set defaults if 'detail' not in kwargs.keys(): kwargs['detail'] = False checkInputParameter(method="listFiles", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("files", params=kwargs)
[docs] def listFileArray(self, **kwargs): """ API to list files in DBS. Non-wildcarded logical_file_name, non-wildcarded dataset, non-wildcarded block_name or non-wildcarded lfn list is required. The combination of a non-wildcarded dataset or block_name with an wildcarded logical_file_name is supported. * For lumi_list the following two json formats are supported: - [a1, a2, a3,] - [[a,b], [c, d],] * lumi_list can be either a list of lumi section numbers as [a1, a2, a3,] or a list of lumi section range as [[a,b], [c, d],]. They cannot be mixed. * If lumi_list is provided run only run_num=single-run-number is allowed. * When run_num=1, one has to provide logical_file_name. * When lfn list is present, no run or lumi list is allowed. :param logical_file_name: logical_file_name of the file, Max length 1000. :type logical_file_name: str, list :param dataset: dataset :type dataset: str :param block_name: block name :type block_name: str :param release_version: release version :type release_version: str :param pset_hash: parameter set hash :type pset_hash: str :param app_name: Name of the application :type app_name: str :param output_module_label: name of the used output module :type output_module_label: str :param run_num: run , run ranges, and run list, Max list length 1000. :type run_num: int, list, string :param origin_site_name: site where the file was created :type origin_site_name: str :param lumi_list: List containing luminosity sections, Max length 1000. :type lumi_list: list :param detail: Get detailed information about a file :type detail: bool :param validFileOnly: 0 or 1. default=0. Return only valid files if set to 1. :type validFileOnly: int :returns: List of dictionaries containing the following keys (logical_file_name). If detail parameter is true, the dictionaries contain the following keys (check_sum, branch_hash_id, adler32, block_id, event_count, file_type, create_by, logical_file_name, creation_date, last_modified_by, dataset, block_name, file_id, file_size, last_modification_date, dataset_id, file_type_id, auto_cross_section, md5, is_file_valid) :rtype: list of dicts """ validParameters = ['dataset', 'block_name', 'logical_file_name', 'release_version', 'pset_hash', 'app_name', 'output_module_label', 'run_num', 'origin_site_name', 'lumi_list', 'detail', 'validFileOnly'] requiredParameters = {'multiple': ['dataset', 'block_name', 'logical_file_name']} #set defaults if 'detail' not in kwargs.keys(): kwargs['detail'] = False checkInputParameter(method="listFileArray", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) # In order to protect DB and make sure the query can be return in 300 seconds, we limit the length of # logical file names, lumi and run num to 1000. These number may be adjusted later if # needed. YG May-20-2015. # CMS has all MC data with run_num=1. It almost is a full table scan if run_num=1 without lfn. So we will request lfn # to be present when run_num=1. YG Jan 14, 2016 if 'logical_file_name' in kwargs.keys() and isinstance(kwargs['logical_file_name'], list)\ and len(kwargs['logical_file_name']) > 1: if 'run_num' in kwargs.keys() and isinstance(kwargs['run_num'],list) and len(kwargs['run_num']) > 1 : raise dbsClientException('Invalid input', 'files API does not supprt two lists: run_num and lfn. ') elif 'lumi_list' in kwargs.keys() and kwargs['lumi_list'] and len(kwargs['lumi_list']) > 1 : raise dbsClientException('Invalid input', 'files API does not supprt two lists: lumi_lis and lfn. ') elif 'lumi_list' in kwargs.keys() and kwargs['lumi_list']: if 'run_num' not in kwargs.keys() or not kwargs['run_num'] or kwargs['run_num'] ==-1 : raise dbsClientException('Invalid input', 'When Lumi section is present, a single run is required. ') else: if 'run_num' in kwargs.keys(): if isinstance(kwargs['run_num'], list): if 1 in kwargs['run_num'] or '1' in kwargs['run_num']: raise dbsClientException('Invalid input', 'files API does not supprt run_num=1 when no lumi.') else: if kwargs['run_num']==1 or kwargs['run_num']=='1': raise dbsClientException('Invalid input', 'files API does not supprt run_num=1 when no lumi.') #check if no lfn is given, but run_num=1 is used for searching if ('logical_file_name' not in kwargs.keys() or not kwargs['logical_file_name']) and 'run_num' in kwargs.keys(): if isinstance(kwargs['run_num'], list): if 1 in kwargs['run_num'] or '1' in kwargs['run_num']: raise dbsClientException('Invalid input', 'files API does not supprt run_num=1 without logical_file_name.') else: if kwargs['run_num'] == 1 or kwargs['run_num'] == '1': raise dbsClientException('Invalid input', 'files API does not supprt run_num=1 without logical_file_name.') results = [] mykey = None total_lumi_len = 0 split_lumi_list = [] max_list_len = 1000 #this number is defined in DBS server for key, value in kwargs.iteritems(): if key == 'lumi_list' and isinstance(kwargs['lumi_list'], list)\ and kwargs['lumi_list'] and isinstance(kwargs['lumi_list'][0], list): lapp = 0 l = 0 sm = [] for i in kwargs['lumi_list']: while i[0]+max_list_len < i[1]: split_lumi_list.append([[i[0], i[0]+max_list_len-1]]) i[0] = i[0] + max_list_len else: l += (i[1]-i[0]+1) if l <= max_list_len: sm.append([i[0], i[1]]) lapp = l #number lumis in sm else: split_lumi_list.append(sm) sm=[] sm.append([i[0], i[1]]) lapp = i[1]-i[0]+1 if sm: split_lumi_list.append(sm) elif key in ('logical_file_name', 'run_num', 'lumi_list') and isinstance(value, list) and len(value)>max_list_len: mykey =key # if mykey: sourcelist = [] #create a new list to slice sourcelist = kwargs[mykey][:] for slice in slicedIterator(sourcelist, max_list_len): kwargs[mykey] = slice results.extend(self.__callServer("fileArray", data=kwargs, callmethod="POST")) elif split_lumi_list: for item in split_lumi_list: kwargs['lumi_list'] = item results.extend(self.__callServer("fileArray", data=kwargs, callmethod="POST")) else: return self.__callServer("fileArray", data=kwargs, callmethod="POST") #make sure only one dictionary per lfn. #Make sure this changes when we move to 2.7 or 3.0 #http://stackoverflow.com/questions/11092511/python-list-of-unique-dictionaries # YG May-26-2015 return dict((v['logical_file_name'], v) for v in results).values()
[docs] def listFileSummaries(self, **kwargs): """ API to list number of files, event counts and number of lumis in a given block or dataset. If the optional run parameter is used, output are: - The number of files which have data (lumis) for that run number; - The total number of events in those files; - The total number of lumis for that run_number. Note that in general this is different from the total number of lumis in those files, since lumis are filtered by the run_number they belong to, while events are only counted as total per file; - The total num blocks that have the run_num; Either block_name or dataset name is required. No wild-cards are allowed :param block_name: Block name :type block_name: str :param dataset: Dataset name :type dataset: str :param run_num: Run number (Optional). Possible format: run_num, "run_min-run_max", or ["run_min-run_max", run1, run2, ...]. run_num=1 is MC data and it will cause almost whole table scan, so run_num=1 will cause an input error. :type run_num: int, str, list :param validFileOnly: default=0 all files included. if 1, only valid file counted. :type validFileOnly: int :returns: List of dictionaries containing the following keys (num_files, num_lumi, num_block, num_event, file_size) :rtype: list of dicts """ validParameters = ['block_name', 'dataset', 'run_num', 'validFileOnly'] requiredParameters = {'standalone': ['block_name', 'dataset']} checkInputParameter(method="listFileSummaries", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("filesummaries", params=kwargs)
[docs] def listOutputConfigs(self, **kwargs): """ API to list OutputConfigs in DBS. * You can use any combination of these parameters in this API * All parameters are optional, if you do not provide any parameter, all configs will be listed from DBS :param dataset: Full dataset (path) of the dataset :type dataset: str :param logical_file_name: logical_file_name of the file :type logical_file_name: str :param release_version: cmssw version :type release_version: str :param pset_hash: pset hash :type pset_hash: str :param app_name: Application name (generally it is cmsRun) :type app_name: str :param output_module_label: output_module_label :type output_module_label: str :param block_id: ID of the block :type block_id: int :param global_tag: Global Tag :type global_tag: str :returns: List of dictionaries containing the following keys (app_name, output_module_label, create_by, pset_hash, creation_date, release_version, global_tag, pset_name) :rtype: list of dicts """ validParameters = ['dataset', 'logical_file_name', 'release_version', 'pset_hash', 'app_name', 'output_module_label', 'block_id', 'global_tag'] checkInputParameter(method="listOutputConfigs", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("outputconfigs", params=kwargs)
[docs] def listPhysicsGroups(self, **kwargs): """ API to list all physics groups. :param physics_group_name: List that specific physics group (Optional) :type physics_group_name: str :returns: List of dictionaries containing the following key (physics_group_name) :rtype: list of dicts """ validParameters = ['physics_group_name'] checkInputParameter(method="listPhysicsGroups", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("physicsgroups", params=kwargs)
[docs] def listPrimaryDatasets(self, **kwargs): """ API to list primary datasets :param primary_ds_type: List primary datasets with primary dataset type (Optional) :type primary_ds_type: str :param primary_ds_name: List that primary dataset (Optional) :type primary_ds_name: str :returns: List of dictionaries containing the following keys (create_by, primary_ds_type, primary_ds_id, primary_ds_name, creation_date) :rtype: list of dicts """ validParameters = ['primary_ds_name', 'primary_ds_type'] checkInputParameter(method="listPrimaryDatasets", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("primarydatasets", params=kwargs)
[docs] def listPrimaryDSTypes(self, **kwargs): """ API to list primary dataset types :param primary_ds_type: List that primary dataset type (Optional) :type primary_ds_type: str :param dataset: List the primary dataset type for that dataset (Optional) :type dataset: str :returns: List of dictionaries containing the following keys (primary_ds_type_id, data_type) :rtype: list of dicts """ validParameters = ['primary_ds_type', 'dataset'] checkInputParameter(method="listPrimaryDSTypes", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("primarydstypes", params=kwargs)
[docs] def listProcessingEras(self, **kwargs): """ API to list all Processing Eras in DBS. :param processing_version: Processing Version (Optional). If provided just this processing_version will be listed :type processing_version: str :returns: List of dictionaries containing the following keys (create_by, processing_version, description, creation_date) :rtype: list of dicts """ validParameters = ['processing_version'] checkInputParameter(method="listProcessingEras", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("processingeras", params=kwargs)
[docs] def listReleaseVersions(self, **kwargs): """ API to list all release versions in DBS :param release_version: List only that release version :type release_version: str :param dataset: List release version of the specified dataset :type dataset: str :param logical_file_name: List release version of the logical file name :type logical_file_name: str :returns: List of dictionaries containing following keys (release_version) :rtype: list of dicts """ validParameters = ['dataset', 'release_version', 'logical_file_name'] checkInputParameter(method="listReleaseVersions", parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("releaseversions", params=kwargs)
[docs] def listRuns(self, **kwargs): """ API to list all run dictionary, for example: [{'run_num': [160578, 160498, 160447, 160379]}]. At least one parameter is mandatory. :param logical_file_name: List all runs in the file :type logical_file_name: str :param block_name: List all runs in the block :type block_name: str :param dataset: List all runs in that dataset :type dataset: str :param run_num: List all runs :type run_num: int, string or list """ validParameters = ['run_num', 'logical_file_name', 'block_name', 'dataset'] requiredParameters = {'multiple': validParameters} checkInputParameter(method="listRuns", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("runs", params=kwargs)
[docs] def listRunSummaries(self, **kwargs): """ API to list run summaries, like the maximal lumisection in a run. :param dataset: dataset name (Optional) :type dataset: str :param run_num: Run number (Required) :type run_num: str, long, int :returns: list containing a dictionary with key max_lumi :rtype: list of dicts """ validParameters = ['dataset', 'run_num'] requiredParameters = {'forced': ['run_num']} checkInputParameter(method="listRunSummaries", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("runsummaries", params=kwargs)
[docs] def submitMigration(self, migrationObj): """ Submit a migration request to the migration service :param migrationObj: migration request object :type migrationObj: dict :key migration_url: The source DBS url for migration (required) :key migration_input: The block or dataset names to be migrated (required) """ return self.__callServer("submit", data=migrationObj, callmethod='POST')
[docs] def statusMigration(self, **kwargs): """ Check the status of migration request: 0-request created; 1-migration in process; 2-migration successed; 3-migration failed, but has three chances to try; 9-migration Permanently failed. :param migration_rqst_id: Migration Request ID :type migration_rqst_id: str, int, long :param block_name: Block name :type block_name: str :param dataset: Dataset name :type dataset: str :param user: user :type user: str """ validParameters = ['migration_rqst_id', 'block_name', 'dataset', 'user'] checkInputParameter(method='statusMigration', parameters=kwargs.keys(), validParameters=validParameters) return self.__callServer("status", params=kwargs)
[docs] def removeMigration(self, migrationObj): """ Remove a migration request from the queue. Only Permanently FAILED (status 9) and PENDING (status 0) requests can be removed. Running and succeeded requests cannot be removed. :param migrationObj: migration request object :type migrationObj: dict :key migration_rqst_id: The migration request id (required) """ return self.__callServer("remove", data=migrationObj, callmethod='POST')
[docs] def serverinfo(self): """ Method that provides information about DBS Server to the clients The information includes :return: Server Version - CVS Tag, Schema Version - Version of Schema this DBS instance is working with, ETC - TBD :rtype: dictionary containing tagged_version, schema, and components keys """ return self.__callServer("serverinfo")
[docs] def updateAcqEraEndDate(self, **kwargs): """ API to update the end_date of an acquisition era :param acquisition_era_name: acquisition_era_name to update (Required) :type acquisition_era_name: str :param end_date: end_date not zero (Required) :type end_date: int """ validParameters = ['end_date', 'acquisition_era_name'] requiredParameters = {'forced': validParameters} checkInputParameter(method="updateAcqEraEndDate", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("acquisitioneras", params=kwargs, callmethod='PUT')
[docs] def updateBlockStatus(self, **kwargs): """ API to update block status :param block_name: block name (Required) :type block_name: str :param open_for_writing: open_for_writing=0 (close), open_for_writing=1 (open) (Required) :type open_for_writing: str """ validParameters = ['block_name', 'open_for_writing'] requiredParameters = {'forced': validParameters} checkInputParameter(method="updateBlockStatus", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("blocks", params=kwargs, callmethod='PUT')
[docs] def updateBlockSiteName(self, **kwargs): """ API to update origin_site_name of a block :param block_name: block name (Required) :type block_name: str :param origin_site_name: New origin site name of the block (Required) :type open_for_writing: str """ validParameters = ['block_name', 'origin_site_name'] requiredParameters = {'forced': validParameters} checkInputParameter(method="updateBlockSiteName", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("blocks", params=kwargs, callmethod='PUT')
[docs] def updateDatasetType(self, **kwargs): """ API to update dataset type :param dataset: Dataset to update (Required) :type dataset: str :param dataset_access_type: production, deprecated, etc (Required) :type dataset_access_type: str """ validParameters = ['dataset', 'dataset_access_type'] requiredParameters = {'forced': validParameters} checkInputParameter(method="updateDatasetType", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("datasets", params=kwargs, callmethod='PUT')
@split_calls def updateFileStatus(self, **kwargs): """ API to update file status :param logical_file_name: logical_file_name to update (Required if no dataset). :type logical_file_name: str or a list of str :param dataset : dataset name to update all the files under it (Required if no lfn). :type dataset: basestring :param is_file_valid: valid=1, invalid=0 (Required) :type is_file_valid: bool :param lost: default lost=0 to indicate a file is not lost in transfer :type lost: bool """ validParameters = ['logical_file_name', 'is_file_valid', 'lost', 'dataset'] requiredParameters = {'forced': ['is_file_valid'], 'multiple': ['logical_file_name', 'dataset']} checkInputParameter(method="updateFileStatus", parameters=kwargs.keys(), validParameters=validParameters, requiredParameters=requiredParameters) return self.__callServer("files", params=kwargs, callmethod='PUT')
if __name__ == "__main__": # DBS Service URL url="http://cmssrv18.fnal.gov:8585/dbs3" #read_proxy="http://cmst0frontier1.cern.ch:3128" #read_proxy="http://cmsfrontier1.fnal.gov:3128" read_proxy="" api = DbsApi(url=url, proxy=read_proxy) print(api.serverinfo()) #print api.listPrimaryDatasets() #print api.listAcquisitionEras() #print api.listProcessingEras()