forked from ptodev/Distributed-Resilient-Storage
-
Notifications
You must be signed in to change notification settings - Fork 0
/
add-ec.py
473 lines (385 loc) · 16.9 KB
/
add-ec.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
#!/usr/bin/env python
'''
A script to erasure code and upload a single file to a location on the catalogue.
The required input parameters are "total", "split", "input_file", "temporary_directory" and "remote_directory"
IMORTANT: ONLY ABSOLUTE PATHS SHOULD BE USED
Example:
$ python add-ec.py --total 15
--split 10
--input_file Penguins.jpg
--temporary_directory /home/paulin/Distributed-Resilient-Storage/fec/
--remote_directory /gridpp/ptodev/
--se_list se_list.txt
--processes 4
"split" is the number of files the original will be split into.
"total" is the total number of files, ie the erasure coded files will be (total-split).
"se_list" is a file containing the SEs used for uploading and looks like this:
GLASGOW-disk
BIRMINGHAM-disk
LIVERPOOL-disk
"processes" is the number of concurrent processes that will be ran.
"temporary_directory" is where the .fec (intermediate) files will be stored
'''
#######################################################################
######################### GET INPUT AGRUMENTS #########################
#######################################################################
import zfec, sys, os, glob, multiprocessing, time, itertools, math, subprocess
from DIRAC import S_OK, S_ERROR, gLogger, exit
from DIRAC.Core.Base import Script
class Params:
def __init__(self):
self.SEList = ''
self.Processes = int(math.ceil(multiprocessing.cpu_count()/2.0))
def setSplit(self, value):
self.Split = value
return S_OK()
def getSplit(self):
return self.Split
def setTotal(self, value):
self.Total = value
return S_OK()
def getTotal(self):
return self.Total
def setRemDir(self, value):
self.RemDir = value
return S_OK()
def getRemDir(self):
return self.RemDir
def setTempDir(self, value):
self.TempDir = value
return S_OK()
def getTempDir(self):
return self.TempDir
def setInputFile(self, value):
self.InputFile = value
return S_OK()
def getInputFile(self):
return self.InputFile
def setSEList(self, value):
self.SEList = value
return S_OK()
def getSEList(self):
return self.SEList
def setProcesses(self, value):
self.Processes = value
return S_OK()
def getProcesses(self):
return self.Processes
# Instantiate the params class
cliParams = Params()
# Register accepted switches and their callbacks
Script.registerSwitch("sp:", "split=", "Number of files the original will be split into.", cliParams.setSplit)
Script.registerSwitch("t:", "total=", "Total number of files (split + EC generated ones).", cliParams.setTotal)
Script.registerSwitch("rd:", "remote_directory=", "Direcory where the files will be uploaded.", cliParams.setRemDir)
Script.registerSwitch("td:", "temporary_directory=", "Location of the temporary files until they are uploaded.", cliParams.setTempDir)
Script.registerSwitch("i:", "input_file=", "Location of the file to be uploaded.", cliParams.setInputFile)
Script.registerSwitch("se:", "se_list=", "A file with names of usable SEs.", cliParams.setSEList)
Script.registerSwitch("pr:", "processes=", "Number of processes to run concurrently.", cliParams.setProcesses)
# Parse the command line and initialize DIRAC
Script.parseCommandLine(ignoreErrors = False)
switches = dict(Script.getUnprocessedSwitches())
# Get the list of services
servicesList = Script.getPositionalArgs()
import DIRAC.Interfaces.API.Dirac as dirac_api
import DIRAC.Resources.Catalog.FileCatalogClient as FCC
def get_se_status(testdir):
# A function that tests the SEs visible by dirac-dms-show-se-status
# by adding a file to them to see if they work.
# Name of the file on the SE
testfile_remote = '1'
# Create a file to upload for testing
testfile_local = '1'
while(True):
if(os.path.isfile(testfile_local)):
testfile_local = str(int(testfile_local)+1)
else:
break
local_file = open(testfile_local, 'w')
local_file.write('A file for testing whether an SE works.')
local_file.close()
####### GET A LIST OF THE SEs #########
se_stat = subprocess.Popen("dirac-dms-show-se-status", shell=True, stdout=subprocess.PIPE).stdout.read()
# Split into lines
se_stat = se_stat.split('\n')
# Clean unnecessary lines
se_stat = se_stat[2:-1]
# Split each line into strings
for se_index in range(len(se_stat)):
se_stat[se_index] = se_stat[se_index].split()
# Create a list with the names of the SEs
ses = []
for se in se_stat:
ses.append(se[0])
######### TEST WHICH SEs WORK #########
dirac = dirac_api.Dirac()
ses_not_working = []
ses_working = []
small_log = ''
existing_file_error = "{'Message': 'putAndRegister: \
This file GUID already exists for another file. \
Please remove it and try again. True', 'OK': False}"
# This is for surpressing any print statements from dirac.addFile()
old_stdout = sys.stdout
sys.stdout = open(os.devnull, 'w')
for se in ses:
while (True):
# Try adding a test file
output = dirac.addFile(testdir+testfile_remote, testfile_local, se)
if(str(output) == existing_file_error):
testfile_remote = str(int(testfile_remote)+1)
else:
# Remove the test file
dirac.removeFile(testdir+testfile_remote)
break
if(not output['OK']):
ses_not_working.append(se)
else:
ses_working.append(se)
sys.stdout.close()
sys.stdout = old_stdout
try:
os.remove(testfile_local)
except OSError as e:
print "Failed to remove file" + testfile_local + " with:", e.strerror
print "Error code:", e.code
return ses_working, ses_not_working
class Counter(object):
# A counter class for easier incrementing
def __init__(self, initval, manager):
self.val = manager.Value('i', initval)
self.lock = manager.Lock()
def increment(self):
with self.lock:
self.val.value += 1
return self.val.value
def value(self):
with self.lock:
return self.val.value
def addFileCC(remote_path, local_path, se):
# A function to upload files via LFNs
dirac = dirac_api.Dirac()
time1 = time.time()
output = dirac.addFile(remote_path, local_path, se)
time2 = time.time()
local_counter = counter.increment()
result_queue.put([local_counter, remote_path, se, str(time2-time1), output])
def addFileCC_func(args):
# A function needed to unpack the two arguments
return addFileCC(*args)
def get_parameters(total, loc_dir, rem_ec_dir, ses_working):
# Set a counter for the current SE
i = 0
# Set a counter for the current file
j = 0
local_paths = []
remote_paths = []
ses = []
while(True):
# Break the loop when all the arrays are completed
if(j == total):
break
# Go back to the first SE when you run out of them
if(i == len(ses_working)):
i = 0
# Get the file numbering right, like "Penguins.jpg.01_15.fec" ...
# The number of zeros depends on the total number of files
# eg. Penguins.jpg.0_1.fec or Penguins.jpg.00_15.fec
num = ('0'*(len(str(total))-len(str(j)))) + str(j)
# ...and for such as "Penguins.jpg.13_15.fec"
local_path = loc_dir + ec_file.name.split('/')[-1] + "." + num + "_" + str(total) + ".fec"
local_paths.append(local_path)
remote_path = rem_ec_dir + ec_file.name.split('/')[-1] + "." + num + "_" + str(total) + ".fec"
remote_paths.append(remote_path)
ses.append(ses_working[i])
i += 1
j += 1
return (remote_paths, local_paths, ses)
def sanitize_directory(input_str):
# Add a / to the end of the string if there isn't one
if(input_str[-1] != '/'):
input_str = input_str + '/'
return input_str
def sanitizeProcesses(processes):
if(processes <= 0):
return 1
return processes
def format_time(num, precision):
total_time = str(num)
total_time = total_time.split('.')
if(precision <= 0):
return num[0]
return total_time[0] + '.' + total_time[1][:precision]
if __name__ == '__main__':
split = int(cliParams.getSplit())
total = int(cliParams.getTotal())
rem_dir = cliParams.getRemDir()
loc_dir = cliParams.getTempDir()
ec_file = open(cliParams.getInputFile(), 'rb')
if(cliParams.getSEList() != ''):
se_list = open(cliParams.getSEList())
else:
se_list = cliParams.getSEList()
processes = int(cliParams.getProcesses())
#######################################################################
########################### INPUT SANITIZING ##########################
#######################################################################
rem_dir = sanitize_directory(rem_dir)
loc_dir = sanitize_directory(loc_dir)
processes = sanitizeProcesses(processes)
#######################################################################
######################## CHECK SE AVAILABILITY ########################
#######################################################################
# Import a file with SE names if it is given
if(se_list):
print "Importing a list with SEs...",
ses_working = se_list.readlines()
for i in range(len(ses_working)):
ses_working[i] = ses_working[i].strip()
# If there is no list with SEs, check which ones are available with the se_check.py script
else:
print "Checking SE availability...",
res = get_se_status(rem_dir)
ses_working = res[0]
ses_not_working = res[1]
# Make sure the list with working SEs is not empty
if not ses_working:
print "None of the SEs work!"
sys.exit()
print 'done!'
#######################################################################
######################### DO ERASURE ENCODING #########################
#######################################################################
# Clean the local fec folder
print "Cleaning up the " + loc_dir + " folder... ",
files = glob.glob(loc_dir + '*')
for f in files:
os.remove(f)
print "done!"
print "Starting erasure encoding...",
# Find the size of the file
ec_file.seek(0, 2)
fsize = ec_file.tell()
ec_file.seek(0, 0)
# Split the file and do erasure encosing
zfec.filefec.encode_to_files(ec_file, fsize, loc_dir, ec_file.name.split('/')[-1], split, total, overwrite=False, verbose=False)
print 'done!'
#######################################################################
########################### CREATE DIRECTORY ##########################
#######################################################################
fc = FCC.FileCatalogClient()
rem_ec_dir = rem_dir + '_' + ec_file.name.split('/')[-1] + '/'
# See if the directory exists
output = fc.isDirectory(rem_ec_dir)
# Here we need the [:-1], because DIRAC return the name without a "/"
if(output['Value']['Successful'][rem_ec_dir[:-1]] == True):
print "ERROR! The remote directory already exists!"
while(True):
prompt = raw_input("Would you like to remove " + rem_ec_dir + "? (yes/no):")
if(prompt == 'yes'):
print 'Removing directory' + rem_ec_dir + '... ',
# List the files in the directory
output_ls = fc.listDirectory(rem_ec_dir)
# Check if the directory has subdirectories - if it does, it cannot be deleted
if(output_ls['Value']['Successful'][rem_ec_dir[:-1]]['SubDirs'] != {}):
print 'ERROR: Cannot delete a directory if it has subdirectories!'
sys.exit()
# loop and delete with fc.removeFile()
output_ls = output_ls['Value']['Successful'][rem_ec_dir[:-1]]['Files'].keys()
for file_to_be_deleted in output_ls:
fc.removeFile(file_to_be_deleted)
# Remove the empty directory
output_rm = fc.removeDirectory(rem_ec_dir)
# Check if the directory has been removed successfully
if(not output_rm['Value']['Successful']):
print 'ERROR: ' + output_rm['Value']['Failed'][rem_ec_dir[:-1]]
else:
print 'done!'
break
elif(prompt == 'no'):
print 'The directory was not removed. Exiting program...'
sys.exit()
else:
print 'Please type "yes" or "no"!'
# Create the directory
print 'Creating a directory "' + rem_ec_dir + '"... ',
fc.createDirectory(rem_ec_dir)
print 'done!'
#######################################################################
############################# UPLOAD FILES ############################
#######################################################################
(remote_paths, local_paths, ses) = get_parameters(total, loc_dir, rem_ec_dir, ses_working)
print 'Uploading files to ' + rem_ec_dir
if(processes == 1):
print 'A serial download method will be used.'
time1 = time.time()
dirac = dirac_api.Dirac()
#SCS Refactor loops more functionally
count = 0
for rp,lp,se in zip(remote_paths,local_paths,ses):
count += 1
# Print a counter showing the number of the
# downloaded file, like [3/10]
print '[' + str(count) + '/' + str(total) + ']',
print 'Uploading ' + lp + ' on ' + se + '...',
time_single_1 = time.time()
# Upload the files on the grid
output = dirac.addFile(rp, lp, se)
# See if the upload was successful
time_single_2 = time.time()
if(output['OK'] == True):
print 'done in ' + str(time_single_2-time_single_1)[:4] + ' seconds!'
else:
print 'ERROR DETECTED:'
print 'ERROR: ' + output['Message']
time2 = time.time()
print 'Total time for upload: ' + format_time(time2-time1, 2) + ' seconds.'
else:
print 'A multiprocessing download method will be used!'
print 'Number of cores on the computer: ' + str(multiprocessing.cpu_count())
print 'Number of processes used: ' + str(processes)
# The Pool() class takes an intit argument for how many
# processes the pool should have
manager = multiprocessing.Manager()
result_queue = manager.Queue()
counter = Counter(0, manager)
pool = multiprocessing.Pool(4)
time1 = time.time()
pool.map_async(addFileCC_func, itertools.izip(remote_paths, local_paths, ses))
queue_results = []
# Get results from the queue
while(True):
queue_results.append(result_queue.get())
# queue_results[-1][4] contains the output from dirac.addFile()
if(queue_results[-1][4]['OK'] == False):
print 'ERROR in uploading file ' + queue_results[-1][1] + ':'
print queue_results[-1][4]['Message']
else:
print '[' + str(queue_results[-1][0]) + '/' + str(len(ses)) + ']',
print 'File ' + queue_results[-1][1] + ' uploaded on ' + queue_results[-1][2] + ' in ' + str(queue_results[-1][3])[:4] + ' seconds!'
if(len(queue_results) == len(ses)):
pool.close()
pool.join()
break
time2 = time.time()
print 'Total time for upload: ' + format_time(time2-time1, 2) + ' seconds.'
#######################################################################
################# CLEAN THE LOCAL ERASURE CODED FILES #################
#######################################################################
print "Cleaning up the local EC files... ",
files = glob.glob(loc_dir + '*')
for f in files:
os.remove(f)
print "done!"
#######################################################################
############################# ADD METADATA ############################
#######################################################################
print 'Adding metadata... ',
#SCS make this a proper dict as fc expects
metadata = {'EC_FILE': ec_file.name.split('/')[-1], 'EC_VERSION': '0.1', 'TOTAL': total, 'SPLIT': split}
#SCS refactoring loops
for rp in remote_paths:
output = fc.setMetadata(rp, metadata)
if (output['OK'] == False):
print 'ERROR! Could not add metadata for ' + remote_paths[i] + ':'
print output['Message']
print 'done!'