-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathfcm_bdiff.py
249 lines (212 loc) · 9.22 KB
/
fcm_bdiff.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
#!/usr/bin/env python3
# *********************************COPYRIGHT************************************
# (C) Crown copyright Met Office. All rights reserved.
# For further details please refer to the file COPYRIGHT.txt
# which you should have received as part of this distribution.
# *********************************COPYRIGHT************************************
"""
This module provides the functionality to return a list of local files to
run tests on based on the branch-difference (to allow checking of only files
which a developer has actually modified on their branch)
"""
import re
import os
import subprocess
import time
# ------------------------------------------------------------------------------
class FCMError(Exception):
    """
    Raised when an FCM command cannot be completed successfully.

    The message is built from the first two positional arguments:
    ``args[0]`` is joined with spaces (so it is expected to be the command
    as a sequence of strings) and ``args[1]`` is the error text, which is
    reported with surrounding whitespace removed.
    """
    def __str__(self):
        command_line = " ".join(self.args[0])
        error_text = self.args[1].strip()
        template = ("\nFCM command: \"{0:s}\""
                    "\nFailed with error: \"{1:s}\"")
        return template.format(command_line, error_text)
# ------------------------------------------------------------------------------
def is_trunk(url):
    """
    Report whether an FCM url looks like it refers to a trunk.

    The url is searched (not fully matched) against three alternative
    layouts, so anything following the ``trunk`` component - a sub-path or
    a revision suffix, for example - does not prevent a match.

    Returns True when any of the layouts is found, False otherwise.
    """
    # Verbose-mode pattern: whitespace and newlines inside it are ignored
    trunk_pattern = r"""
        (svn://fcm\d+/\w+_svn/\w+/trunk|
        .*/svn/[\w\.]+/\w+/trunk|
        ..*_svn/\w+/trunk)
        """
    found = re.search(trunk_pattern, url, flags=re.VERBOSE)
    return bool(found)
# ------------------------------------------------------------------------------
def text_decoder(bytes_type_string, codecs=("utf8", "cp1252")):
    """
    Decode a bytes object, trying each of the given codecs in turn.

    Arguments:
      bytes_type_string: the bytes object to decode.
      codecs: an iterable of codec names, tried in the order given
              (defaults to utf8 followed by cp1252).

    Returns the text produced by the first codec that decodes the input
    without error.

    Raises ValueError if no codecs are supplied.  If every codec fails,
    each decoding error is printed and the error from the first codec is
    re-raised (a UnicodeDecodeError).
    """
    # Materialise once so that any iterable (including a generator) can be
    # checked for emptiness and then iterated
    codecs = tuple(codecs)
    if not codecs:
        raise ValueError("text_decoder requires at least one codec")

    errors = []
    for codec in codecs:
        try:
            return bytes_type_string.decode(codec)
        except UnicodeDecodeError as err:
            errors.append(err)

    # Nothing worked; report every failure before raising the first one
    for error in errors:
        print(error)
    raise errors[0]
# ------------------------------------------------------------------------------
def get_branch_info(branch, snooze=300, retries=0):
    """
    Return the output of `fcm binfo` for the given branch.

    The retries and snooze arguments are handed on to run_fcm_command;
    they exist so that a request against a mirror, which may not yet have
    picked up the latest commit, can be attempted more than once.
    """
    return run_fcm_command(["fcm", "binfo", branch], retries, snooze)
# ------------------------------------------------------------------------------
def get_bdiff_summarize(branch, snooze=300, retries=0):
    """
    Return the output of `fcm bdiff --summarize` for the given branch.

    The retries and snooze arguments are handed on to run_fcm_command;
    they exist so that a request against a mirror, which may not yet have
    picked up the latest commit, can be attempted more than once.
    """
    return run_fcm_command(["fcm", "bdiff", "--summarize", branch],
                           retries, snooze)
# ------------------------------------------------------------------------------
def get_branch_diff_filenames(branch=".", path_override=None):
    """
    Main entry point of the module: list the files modified or added on a
    branch, according to the FCM branch diff.

    Arguments:
      branch: path to a working copy or URL of a branch (defaults to the
              current directory).  Replaced by the mirror location when
              use_mirror() finds one configured.
      path_override: optional base path which the returned names are
                     joined onto (useful in suites).

    Returns a list of file names.  The base they are joined onto is, in
    order of preference: path_override, the SOURCE_UM_BASE environment
    variable, or the branch path/URL itself.  An empty list is returned
    if the branch turns out to be the trunk.
    """
    branch, retries = use_mirror(branch)

    # Look up the branch details
    info = get_branch_info(branch, retries=retries)
    branch_url = get_url(info)

    # A branch-diff of the trunk against itself would be meaningless
    if is_trunk(branch_url):
        print("{} appears to be the trunk, nothing to do!".format(branch_url))
        return []

    # Walk up through any branch-of-branch (test branch) levels until the
    # parent is the trunk; the diff is then taken for that ancestor branch
    parent = get_branch_parent(info)
    while not is_trunk(parent):
        branch = parent
        info = get_branch_info(branch, retries=retries)
        parent = get_branch_parent(info)

    # NOTE: `fcm bdiff --summarize <branch_name>` reports entries such as
    #   svn://fcm1/um.xm_svn/main/trunk/rose-stem/bin/suite_report.py
    # but for a branch that has been reversed off the trunk it reports
    #   svn://fcm1/um.xm_svn/main/branches/dev/USER/BRANCH_NAME/PATH
    # in which case the relative paths computed below are not valid
    bdiff = get_bdiff_summarize(branch, retries=retries)

    # Keep the second field of every non-blank line whose status field is
    # modified (M) or added (A)
    changed_urls = []
    for raw_line in bdiff.split("\n"):
        entry = raw_line.strip()
        if not entry:
            continue
        fields = entry.split()
        if fields[0] in ("M", "A"):
            changed_urls.append(fields[1])

    # Express each entry relative to the trunk URL of the repository
    trunk_url = os.path.join(get_repository_root(info), "main", "trunk")
    relative_paths = [os.path.relpath(changed, trunk_url)
                      for changed in changed_urls]

    # Choose the base which the relative paths are joined onto
    base_source_key = "SOURCE_UM_BASE"
    if path_override is not None:
        # 'User directed' reconstruction; particularly useful in rose stem
        base = path_override
    elif base_source_key in os.environ:
        # Running as a suite: use the working copy base path.  This is
        # only of use to a task running on a machine which shares that
        # path to the working copy
        base = os.environ[base_source_key]
    else:
        # Fall back on the path/URL of the branch itself
        base = branch

    return [os.path.join(base, relative) for relative in relative_paths]
# ------------------------------------------------------------------------------
def run_fcm_command(command, max_retries, snooze):
    """
    Run an fcm command, optionally retrying on failure.

    Arguments:
      command: the command and its arguments, as a list of strings.
      max_retries: how many times a failed command is re-run before
                   giving up (0 means a single attempt).
      snooze: time in seconds to sleep between attempts.

    Returns the decoded standard output of the first attempt that exits
    with a zero return code.

    Raises FCMError, carrying the command and the decoded standard error
    of the last attempt, once the retries are exhausted.
    """
    failures = 0
    while True:
        # communicate() drains both pipes while waiting for the process;
        # calling wait() with piped output can deadlock once the child
        # fills a pipe buffer.  The context manager closes the pipes.
        with subprocess.Popen(command,
                              stdout=subprocess.PIPE,
                              stderr=subprocess.PIPE) as process:
            stdout, stderr = process.communicate()

        if process.returncode == 0:
            return text_decoder(stdout)

        failures += 1
        if failures > max_retries:
            raise FCMError(command, text_decoder(stderr))
        time.sleep(snooze)
# ------------------------------------------------------------------------------
def use_mirror(branch):
    """
    Redirect the request to an FCM mirror when one is configured.

    If the SOURCE_UM_MIRROR environment variable is set (as it may be when
    running as part of a suite) its value replaces the branch and a
    message saying so is printed.  Calls to fcm against the mirror can
    sometimes fail, so in that case a number of retries is suggested for
    other routines to use.

    Returns a tuple of (branch, retries): the mirror value and 2 when the
    variable is set, otherwise the branch unchanged and 0.
    """
    mirror_branch = os.environ.get("SOURCE_UM_MIRROR")
    if mirror_branch is None:
        return branch, 0

    print("[INFO] Switching branch used for fcm command to : {0:}".format(
        mirror_branch))
    return mirror_branch, 2
# ------------------------------------------------------------------------------
def get_repository_root(branch_info):
    """
    Given the raw output from an fcm binfo command - which can be retrieved by
    calling get_branch_info() - returns the Repository Root field

    The value is returned with leading and trailing whitespace removed
    (including any carriage return left by CRLF line endings).

    Raises an Exception if the field is absent or has no value.
    """
    # Capture only the remainder of the field's own line and strip it
    # afterwards; matching whitespace in the pattern could run on past an
    # empty field into the following line
    found = re.search(r"^Repository Root:(?P<url>.*)$",
                      branch_info, flags=re.MULTILINE)
    repos_root = found.group("url").strip() if found else ""
    if not repos_root:
        raise Exception("Could not find Repository Root field")
    return repos_root
# ------------------------------------------------------------------------------
def get_branch_parent(branch_info):
    """
    Given the raw output from an fcm binfo command - which can be retrieved by
    calling get_branch_info() - returns the Branch Parent Field

    The value is returned with leading and trailing whitespace removed
    (including any carriage return left by CRLF line endings).

    Raises an Exception if the field is absent or has no value.
    """
    # Capture only the remainder of the field's own line and strip it
    # afterwards; matching whitespace in the pattern could run on past an
    # empty field into the following line
    found = re.search(r"^Branch Parent:(?P<parent>.*)$", branch_info,
                      flags=re.MULTILINE)
    parent = found.group("parent").strip() if found else ""
    if not parent:
        raise Exception("Could not find Branch Parent field")
    return parent
# ------------------------------------------------------------------------------
def get_url(branch_info):
    """
    Given the raw output from an fcm binfo command - which can be retrieved by
    calling get_branch_info() - returns the URL field

    The value is returned with leading and trailing whitespace removed
    (including any carriage return left by CRLF line endings).

    Raises an Exception if the field is absent or has no value.
    """
    # Capture only the remainder of the field's own line and strip it
    # afterwards; matching whitespace in the pattern could run on past an
    # empty field into the following line
    found = re.search(r"^URL:(?P<url>.*)$", branch_info, flags=re.MULTILINE)
    url = found.group("url").strip() if found else ""
    if not url:
        raise Exception("Could not find URL field")
    return url