forked from CMSCompOps/WmAgentScripts
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathMissingRuns.py
57 lines (50 loc) · 1.68 KB
/
MissingRuns.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
#!/usr/bin/env python
import urllib2,urllib, httplib, sys, re, os, json, dbsTest, phedexSubscription
from xml.dom.minidom import getDOMImplementation
from das_client import get_data
das_host='https://cmsweb.cern.ch'
#Return true if a run is not present in any of the output datasets of a request, false if it is present in at least one
def runsNotPresent(url, workflow):
runWhitelist=dbsTest.getRunWhitelist(url, workflow)
newRunWhiteList=[]
for run in runWhitelist:
if not runNotinAllDatasets(url, run, workflow):
newRunWhiteList.append(run)
print run
print newRunWhiteList
def runNotinAllDatasets(url, run, workflow):
Datasets=phedexSubscription.outputdatasetsWorkflow(url, workflow)
InputDataset=dbsTest.getInputDataSet(url, workflow)
runInputDataset=runInDataset(url, run, InputDataset)
if not runInputDataset:
return True
for dataset in Datasets:
if runInDataset(url, run, dataset):#the run is in at least one of the output datasets
return True
return False
def runInDataset(url, run, dataset):
query="file run="+str(run)+ " dataset="+dataset
output = {}
das_data = get_data(das_host,query,0,0,0)
if isinstance(das_data, basestring):
result = json.loads(das_data)
else:
result = das_data
if result['status'] == 'fail' :
print 'DAS query failed with reason:',result['reason']
else:
if len(result['data'])>0:
return True
else:
return False
def main():
url='cmsweb.cern.ch'
args=sys.argv[1:]
if not len(args)==1:
print "usage:runsMissing workflowname"
sys.exit(0);
workflow=args[0]
runsNotPresent(url, workflow)
sys.exit(0);
if __name__ == "__main__":
main()