Skip to content

Commit

Permalink
autopep8 action fixes
Browse files Browse the repository at this point in the history
  • Loading branch information
alexanderrichards authored Nov 27, 2023
1 parent 45bf8f9 commit 4e1c029
Showing 1 changed file with 17 additions and 17 deletions.
34 changes: 17 additions & 17 deletions ganga/GangaDirac/Lib/Splitters/OfflineGangaDiracSplitter.py
Original file line number Diff line number Diff line change
Expand Up @@ -57,7 +57,7 @@
number of SE add this subset to the list of used LFN and continue to the next
unallocated LFN.
So on the first iteration of the splitter we identify how many files we can put
into a larger subset of files.
i.e. how many jobs >= 0.75 * 100LFN and <= 100LFN with 2 site redundancy
Expand Down Expand Up @@ -86,7 +86,7 @@
This favours generating larger subsets with multiple sites where the jobs can run
This favours generating larger subsets with multiple sites where the jobs can run
but when there are LFN which can't be allocated to sites with multiple SE the algorithm
will attempt to find larger subsets with reduced redundancy.
"""
Expand Down Expand Up @@ -133,7 +133,7 @@ def find_random_site(original_SE_list, banned_SE):
while chosen_element == "" and len(input_list) > 0:
global global_random
this_element = global_random.sample(input_list, 1)[0]
if not this_element in banned_SE:
if this_element not in banned_SE:
chosen_element = this_element
break
else:
Expand Down Expand Up @@ -305,7 +305,7 @@ def lookUpLFNReplicas(inputs, ignoremissing):
"""
This method launches several worker threads to collect the replica information for all LFNs which are given as inputs and stores this in allLFNData

Check failure on line 306 in ganga/GangaDirac/Lib/Splitters/OfflineGangaDiracSplitter.py

View workflow job for this annotation

GitHub Actions / Linting

E501 line too long (151 > 127 characters)
Args:
inputs (list): This is a list of input DiracFile which are
inputs (list): This is a list of input DiracFile which are
Returns:
bad_lfns (list): A list of LFN which have no replica information when querying `getReplicasForJobs` from DIRAC
"""
Expand Down Expand Up @@ -336,7 +336,7 @@ def lookUpLFNReplicas(inputs, ignoremissing):

file_replicas = {}
for _lfn in LFNdict:
if not _lfn in bad_lfns:
if _lfn not in bad_lfns:
file_replicas[_lfn] = LFNdict[_lfn].locations

# Check if we have any bad lfns
Expand Down Expand Up @@ -377,17 +377,17 @@ def updateLFNData(bad_lfns, allLFNs, LFNdict, ignoremissing, allLFNData):
if upper_limit > len(allLFNs):
upper_limit = len(allLFNs)

#logger.debug("Updating LFN Physical Locations: [%s:%s] of %s" % (str(i * LFN_parallel_limit), str(upper_limit), str(len(allLFNs))))
# logger.debug("Updating LFN Physical Locations: [%s:%s] of %s" % (str(i * LFN_parallel_limit), str(upper_limit), str(len(allLFNs))))

Check failure on line 380 in ganga/GangaDirac/Lib/Splitters/OfflineGangaDiracSplitter.py

View workflow job for this annotation

GitHub Actions / Linting

E501 line too long (141 > 127 characters)

for this_lfn in values.keys():
#logger.debug("LFN: %s" % str(this_lfn))
# logger.debug("LFN: %s" % str(this_lfn))
this_dict = {}
this_dict[this_lfn] = values.get(this_lfn)

if this_lfn in LFNdict:
#logger.debug("Updating RemoteURLs")
# logger.debug("Updating RemoteURLs")
LFNdict[this_lfn]._updateRemoteURLs(this_dict)
#logger.debug("This_dict: %s" % str(this_dict))
# logger.debug("This_dict: %s" % str(this_dict))
else:
logger.error("Error updating remoteURLs for: %s" % str(this_lfn))

Expand Down Expand Up @@ -468,8 +468,8 @@ def OfflineGangaDiracSplitter(_inputs, filesPerJob, maxFiles, ignoremissing, ban

logger.debug("Found all SE in use")

#logger.info("%s" % str(CE_to_SE_mapping))
#logger.info("%s" % str(SE_to_CE_mapping))
# logger.info("%s" % str(CE_to_SE_mapping))
# logger.info("%s" % str(SE_to_CE_mapping))

# BELOW IS WHERE THE ACTUAL SPLITTING IS DONE

Expand Down Expand Up @@ -581,13 +581,13 @@ def performSplitting(site_dict, filesPerJob, allChosenSets, wanted_common_site,

# If subset is too small throw it away
if len(_this_subset) < limit and len(_this_subset) < max_limit:
#logger.debug("%s < %s" % (str(len(_this_subset)), str(limit)))
# logger.debug("%s < %s" % (str(len(_this_subset)), str(limit)))
allChosenSets[iterating_LFN] = generate_site_selection(
site_dict[iterating_LFN], wanted_common_site, uniqueSE, CE_to_SE_mapping, SE_to_CE_mapping)
continue
else:
#logger.info("found common LFN for: " + str(allChosenSets[iterating_LFN]))
#logger.info("%s > %s" % (str(len(_this_subset)), str(limit)))
# logger.info("found common LFN for: " + str(allChosenSets[iterating_LFN]))
# logger.info("%s > %s" % (str(len(_this_subset)), str(limit)))
# else Dataset was large enough to be considered useful
logger.debug("Generating Dataset of size: %s" % str(len(_this_subset)))
# Construct DiracFile here as we want to keep the above combination
Expand All @@ -601,8 +601,8 @@ def performSplitting(site_dict, filesPerJob, allChosenSets, wanted_common_site,
# Lets keep track of how many times we've tried this
iterations = iterations + 1

#logger.info("Iteration: %s" % iterations)
#logger.info("%s %s" % (good_fraction, bad_fraction))
# logger.info("Iteration: %s" % iterations)
# logger.info("%s %s" % (good_fraction, bad_fraction))

# Can take a while so lets not let threads become un-locked
import GangaCore.Runtime.Repository_runtime
Expand All @@ -623,7 +623,7 @@ def performSplitting(site_dict, filesPerJob, allChosenSets, wanted_common_site,
bad_fraction = 0.75
else:
good_fraction = good_fraction * 0.75
#bad_fraction = bad_fraction * 0.75
# bad_fraction = bad_fraction * 0.75

logger.debug("good_fraction: %s" % str(good_fraction))

Expand Down

0 comments on commit 4e1c029

Please sign in to comment.