88 lines
3.5 KiB
Python
88 lines
3.5 KiB
Python
|
# Copyright (c) 2006,2007 Mitch Garnaat http://garnaat.org/
|
||
|
#
|
||
|
# Permission is hereby granted, free of charge, to any person obtaining a
|
||
|
# copy of this software and associated documentation files (the
|
||
|
# "Software"), to deal in the Software without restriction, including
|
||
|
# without limitation the rights to use, copy, modify, merge, publish, dis-
|
||
|
# tribute, sublicense, and/or sell copies of the Software, and to permit
|
||
|
# persons to whom the Software is furnished to do so, subject to the fol-
|
||
|
# lowing conditions:
|
||
|
#
|
||
|
# The above copyright notice and this permission notice shall be included
|
||
|
# in all copies or substantial portions of the Software.
|
||
|
#
|
||
|
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
|
||
|
# OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABIL-
|
||
|
# ITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT
|
||
|
# SHALL THE AUTHOR BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
|
||
|
# WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
||
|
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
|
||
|
# IN THE SOFTWARE.
|
||
|
import time
|
||
|
import os
|
||
|
|
||
|
|
||
|
class Submitter(object):
|
||
|
|
||
|
def __init__(self, sd):
|
||
|
self.sd = sd
|
||
|
self.input_bucket = self.sd.get_obj('input_bucket')
|
||
|
self.output_bucket = self.sd.get_obj('output_bucket')
|
||
|
self.output_domain = self.sd.get_obj('output_domain')
|
||
|
self.queue = self.sd.get_obj('input_queue')
|
||
|
|
||
|
def get_key_name(self, fullpath, prefix):
|
||
|
key_name = fullpath[len(prefix):]
|
||
|
l = key_name.split(os.sep)
|
||
|
return '/'.join(l)
|
||
|
|
||
|
def write_message(self, key, metadata):
|
||
|
if self.queue:
|
||
|
m = self.queue.new_message()
|
||
|
m.for_key(key, metadata)
|
||
|
if self.output_bucket:
|
||
|
m['OutputBucket'] = self.output_bucket.name
|
||
|
self.queue.write(m)
|
||
|
|
||
|
def submit_file(self, path, metadata=None, cb=None, num_cb=0, prefix='/'):
|
||
|
if not metadata:
|
||
|
metadata = {}
|
||
|
key_name = self.get_key_name(path, prefix)
|
||
|
k = self.input_bucket.new_key(key_name)
|
||
|
k.update_metadata(metadata)
|
||
|
k.set_contents_from_filename(path, replace=False, cb=cb, num_cb=num_cb)
|
||
|
self.write_message(k, metadata)
|
||
|
|
||
|
def submit_path(self, path, tags=None, ignore_dirs=None, cb=None, num_cb=0, status=False, prefix='/'):
|
||
|
path = os.path.expanduser(path)
|
||
|
path = os.path.expandvars(path)
|
||
|
path = os.path.abspath(path)
|
||
|
total = 0
|
||
|
metadata = {}
|
||
|
if tags:
|
||
|
metadata['Tags'] = tags
|
||
|
l = []
|
||
|
for t in time.gmtime():
|
||
|
l.append(str(t))
|
||
|
metadata['Batch'] = '_'.join(l)
|
||
|
if self.output_domain:
|
||
|
self.output_domain.put_attributes(metadata['Batch'], {'type' : 'Batch'})
|
||
|
if os.path.isdir(path):
|
||
|
for root, dirs, files in os.walk(path):
|
||
|
if ignore_dirs:
|
||
|
for ignore in ignore_dirs:
|
||
|
if ignore in dirs:
|
||
|
dirs.remove(ignore)
|
||
|
for file in files:
|
||
|
fullpath = os.path.join(root, file)
|
||
|
if status:
|
||
|
print('Submitting %s' % fullpath)
|
||
|
self.submit_file(fullpath, metadata, cb, num_cb, prefix)
|
||
|
total += 1
|
||
|
elif os.path.isfile(path):
|
||
|
self.submit_file(path, metadata, cb, num_cb)
|
||
|
total += 1
|
||
|
else:
|
||
|
print('problem with %s' % path)
|
||
|
return (metadata['Batch'], total)
|