2013-09-25 21:50:03 +00:00
|
|
|
import cStringIO as StringIO
|
|
|
|
import os
|
2013-10-20 06:39:23 +00:00
|
|
|
import logging
|
2013-09-25 21:50:03 +00:00
|
|
|
|
|
|
|
import boto.s3.connection
|
|
|
|
import boto.s3.key
|
|
|
|
|
2014-04-03 21:31:46 +00:00
|
|
|
from storage.basestorage import BaseStorage
|
2013-09-25 21:50:03 +00:00
|
|
|
|
|
|
|
|
2013-10-20 06:39:23 +00:00
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
|
|
|
class StreamReadKeyAsFile(object):
|
2013-10-31 15:32:08 +00:00
|
|
|
def __init__(self, key):
|
|
|
|
self._key = key
|
|
|
|
self._finished = False
|
2013-10-20 06:39:23 +00:00
|
|
|
|
2013-10-31 15:32:08 +00:00
|
|
|
def __enter__(self):
|
|
|
|
return self
|
2013-10-20 06:39:23 +00:00
|
|
|
|
2013-10-31 15:32:08 +00:00
|
|
|
def __exit__(self, type, value, tb):
|
|
|
|
self._key.close(fast=True)
|
2013-10-20 06:39:23 +00:00
|
|
|
|
2013-10-31 15:32:08 +00:00
|
|
|
def read(self, amt=None):
|
|
|
|
if self._finished:
|
|
|
|
return None
|
2013-10-20 06:39:23 +00:00
|
|
|
|
2013-10-31 15:32:08 +00:00
|
|
|
resp = self._key.read(amt)
|
|
|
|
if not resp:
|
|
|
|
self._finished = True
|
|
|
|
return resp
|
2013-10-20 06:39:23 +00:00
|
|
|
|
|
|
|
|
2014-04-03 21:31:46 +00:00
|
|
|
class S3Storage(BaseStorage):
|
2013-09-25 21:50:03 +00:00
|
|
|
|
2013-10-31 15:32:08 +00:00
|
|
|
def __init__(self, storage_path, s3_access_key, s3_secret_key, s3_bucket):
|
2013-12-04 00:39:07 +00:00
|
|
|
self._initialized = False
|
2013-12-04 00:43:56 +00:00
|
|
|
self._bucket_name = s3_bucket
|
2013-12-04 00:39:07 +00:00
|
|
|
self._access_key = s3_access_key
|
|
|
|
self._secret_key = s3_secret_key
|
2013-10-31 15:32:08 +00:00
|
|
|
self._root_path = storage_path
|
2013-12-04 00:39:07 +00:00
|
|
|
self._s3_conn = None
|
|
|
|
self._s3_bucket = None
|
|
|
|
|
|
|
|
def _initialize_s3(self):
|
|
|
|
if not self._initialized:
|
|
|
|
self._s3_conn = boto.s3.connection.S3Connection(self._access_key,
|
|
|
|
self._secret_key)
|
2013-12-04 00:43:56 +00:00
|
|
|
self._s3_bucket = self._s3_conn.get_bucket(self._bucket_name)
|
2013-12-04 00:39:07 +00:00
|
|
|
self._initialized = True
|
2013-10-31 15:32:08 +00:00
|
|
|
|
|
|
|
def _debug_key(self, key):
|
|
|
|
"""Used for debugging only."""
|
|
|
|
orig_meth = key.bucket.connection.make_request
|
|
|
|
|
|
|
|
def new_meth(*args, **kwargs):
|
|
|
|
print '#' * 16
|
|
|
|
print args
|
|
|
|
print kwargs
|
|
|
|
print '#' * 16
|
|
|
|
return orig_meth(*args, **kwargs)
|
|
|
|
key.bucket.connection.make_request = new_meth
|
|
|
|
|
|
|
|
def _init_path(self, path=None):
|
|
|
|
path = os.path.join(self._root_path, path) if path else self._root_path
|
|
|
|
if path and path[0] == '/':
|
|
|
|
return path[1:]
|
|
|
|
return path
|
|
|
|
|
|
|
|
def get_content(self, path):
|
2013-12-04 00:39:07 +00:00
|
|
|
self._initialize_s3()
|
2013-10-31 15:32:08 +00:00
|
|
|
path = self._init_path(path)
|
|
|
|
key = boto.s3.key.Key(self._s3_bucket, path)
|
|
|
|
if not key.exists():
|
|
|
|
raise IOError('No such key: \'{0}\''.format(path))
|
|
|
|
return key.get_contents_as_string()
|
|
|
|
|
|
|
|
def put_content(self, path, content):
|
2013-12-04 00:39:07 +00:00
|
|
|
self._initialize_s3()
|
2013-10-31 15:32:08 +00:00
|
|
|
path = self._init_path(path)
|
|
|
|
key = boto.s3.key.Key(self._s3_bucket, path)
|
|
|
|
key.set_contents_from_string(content, encrypt_key=True)
|
|
|
|
return path
|
|
|
|
|
2013-12-04 00:39:07 +00:00
|
|
|
def get_direct_download_url(self, path, expires_in=60):
|
|
|
|
self._initialize_s3()
|
|
|
|
path = self._init_path(path)
|
|
|
|
k = boto.s3.key.Key(self._s3_bucket, path)
|
|
|
|
return k.generate_url(expires_in)
|
|
|
|
|
2013-10-31 15:32:08 +00:00
|
|
|
def stream_read(self, path):
|
2013-12-04 00:39:07 +00:00
|
|
|
self._initialize_s3()
|
2013-10-31 15:32:08 +00:00
|
|
|
path = self._init_path(path)
|
|
|
|
key = boto.s3.key.Key(self._s3_bucket, path)
|
|
|
|
if not key.exists():
|
|
|
|
raise IOError('No such key: \'{0}\''.format(path))
|
|
|
|
while True:
|
|
|
|
buf = key.read(self.buffer_size)
|
|
|
|
if not buf:
|
|
|
|
break
|
|
|
|
yield buf
|
|
|
|
|
|
|
|
def stream_read_file(self, path):
|
2013-12-04 00:39:07 +00:00
|
|
|
self._initialize_s3()
|
2013-10-31 15:32:08 +00:00
|
|
|
path = self._init_path(path)
|
|
|
|
key = boto.s3.key.Key(self._s3_bucket, path)
|
|
|
|
if not key.exists():
|
|
|
|
raise IOError('No such key: \'{0}\''.format(path))
|
|
|
|
return StreamReadKeyAsFile(key)
|
|
|
|
|
|
|
|
def stream_write(self, path, fp):
|
|
|
|
# Minimum size of upload part size on S3 is 5MB
|
2013-12-04 00:39:07 +00:00
|
|
|
self._initialize_s3()
|
2013-10-31 15:32:08 +00:00
|
|
|
buffer_size = 5 * 1024 * 1024
|
|
|
|
if self.buffer_size > buffer_size:
|
|
|
|
buffer_size = self.buffer_size
|
|
|
|
path = self._init_path(path)
|
|
|
|
mp = self._s3_bucket.initiate_multipart_upload(path, encrypt_key=True)
|
|
|
|
num_part = 1
|
|
|
|
while True:
|
|
|
|
try:
|
|
|
|
buf = fp.read(buffer_size)
|
|
|
|
if not buf:
|
|
|
|
break
|
|
|
|
io = StringIO.StringIO(buf)
|
|
|
|
mp.upload_part_from_file(io, num_part)
|
|
|
|
num_part += 1
|
|
|
|
io.close()
|
|
|
|
except IOError:
|
|
|
|
break
|
|
|
|
mp.complete_upload()
|
|
|
|
|
|
|
|
def list_directory(self, path=None):
|
2013-12-04 00:39:07 +00:00
|
|
|
self._initialize_s3()
|
2013-10-31 15:32:08 +00:00
|
|
|
path = self._init_path(path)
|
|
|
|
if not path.endswith('/'):
|
|
|
|
path += '/'
|
|
|
|
ln = 0
|
|
|
|
if self._root_path != '/':
|
|
|
|
ln = len(self._root_path)
|
|
|
|
exists = False
|
|
|
|
for key in self._s3_bucket.list(prefix=path, delimiter='/'):
|
|
|
|
exists = True
|
|
|
|
name = key.name
|
|
|
|
if name.endswith('/'):
|
|
|
|
yield name[ln:-1]
|
|
|
|
else:
|
|
|
|
yield name[ln:]
|
|
|
|
if exists is False:
|
|
|
|
# In order to be compliant with the LocalStorage API. Even though
|
|
|
|
# S3 does not have a concept of folders.
|
|
|
|
raise OSError('No such directory: \'{0}\''.format(path))
|
|
|
|
|
|
|
|
def exists(self, path):
|
2013-12-04 00:39:07 +00:00
|
|
|
self._initialize_s3()
|
2013-10-31 15:32:08 +00:00
|
|
|
path = self._init_path(path)
|
|
|
|
key = boto.s3.key.Key(self._s3_bucket, path)
|
|
|
|
return key.exists()
|
|
|
|
|
|
|
|
def remove(self, path):
|
2013-12-04 00:39:07 +00:00
|
|
|
self._initialize_s3()
|
2013-10-31 15:32:08 +00:00
|
|
|
path = self._init_path(path)
|
|
|
|
key = boto.s3.key.Key(self._s3_bucket, path)
|
|
|
|
if key.exists():
|
|
|
|
# It's a file
|
|
|
|
key.delete()
|
|
|
|
return
|
|
|
|
# We assume it's a directory
|
|
|
|
if not path.endswith('/'):
|
|
|
|
path += '/'
|
|
|
|
for key in self._s3_bucket.list(prefix=path):
|
|
|
|
key.delete()
|