deb-gnocchi/gnocchi/storage/incoming/s3.py

# -*- encoding: utf-8 -*-
#
# Copyright © 2016 Red Hat, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
from collections import defaultdict
import contextlib
import datetime
import json
import uuid

import six

from gnocchi.storage.common import s3
from gnocchi.storage.incoming import _carbonara

boto3 = s3.boto3
botocore = s3.botocore


class S3Storage(_carbonara.CarbonaraBasedStorage):
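    """Incoming measure storage driver keeping unprocessed measures in S3.

    Each batch of new measures is written as a single S3 object under a
    per-sack, per-metric key prefix; processing lists, reads and then
    bulk-deletes those objects.
    """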

    def __init__(self, conf):
        super(S3Storage, self).__init__(conf)
        self.s3, self._region_name, self._bucket_prefix = (
            s3.get_connection(conf)
        )
        self._bucket_name_measures = (
            self._bucket_prefix + "-" + self.MEASURE_PREFIX
        )

    def get_storage_sacks(self):
        try:
            response = self.s3.get_object(Bucket=self._bucket_name_measures,
                                          Key=self.CFG_PREFIX)
            return json.loads(
                response['Body'].read().decode())[self.CFG_SACKS]
        except botocore.exceptions.ClientError as e:
            # A missing key just means the storage has not been upgraded
            # yet; any other client error is real and must propagate.
            if e.response['Error'].get('Code') == "NoSuchKey":
                return
            raise

    def set_storage_settings(self, num_sacks):
        data = {self.CFG_SACKS: num_sacks}
        self.s3.put_object(Bucket=self._bucket_name_measures,
                           Key=self.CFG_PREFIX,
                           Body=json.dumps(data).encode())
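    # A quick sketch of the stored settings object, assuming the base
    # class defines CFG_SACKS as "sacks": set_storage_settings(128)
    # writes the JSON document {"sacks": 128} under the CFG_PREFIX key.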

    def get_sack_prefix(self, num_sacks=None):
        # NOTE(gordc): override to follow s3 partitioning logic
        return '%s-' + ('%s/' % (num_sacks if num_sacks else self.NUM_SACKS))
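    # Illustrative example: with NUM_SACKS = 128 (a hypothetical value),
    # get_sack_prefix() returns the format string '%s-128/', so sack 3
    # maps to the key prefix '3-128/'.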

    @staticmethod
    def remove_sack_group(num_sacks):
        # nothing to cleanup since sacks are part of path
        pass

    def upgrade(self, indexer, num_sacks):
        try:
            s3.create_bucket(self.s3, self._bucket_name_measures,
                             self._region_name)
        except botocore.exceptions.ClientError as e:
            if e.response['Error'].get('Code') not in (
                    "BucketAlreadyExists", "BucketAlreadyOwnedByYou"):
                raise
        # need to create bucket first to store storage settings object
        super(S3Storage, self).upgrade(indexer, num_sacks)

    def _store_new_measures(self, metric, data):
        now = datetime.datetime.utcnow().strftime("_%Y%m%d_%H:%M:%S")
        self.s3.put_object(
            Bucket=self._bucket_name_measures,
            Key=(self.get_sack_name(self.sack_for_metric(metric.id))
                 + six.text_type(metric.id) + "/"
                 + six.text_type(uuid.uuid4()) + now),
            Body=data)
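    # Resulting key layout (illustrative values):
    #   3-128/<metric uuid>/<random uuid>_20170102_03:04:05
    # i.e. sack prefix, then metric id, then one object per batch of
    # measures, suffixed with a creation timestamp.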

    def _build_report(self, details):
        metric_details = defaultdict(int)
        response = {}
        # Page through list_objects_v2 results: each response is capped
        # (1000 keys by default) and carries IsTruncated plus a
        # NextContinuationToken while more pages remain.
        while response.get('IsTruncated', True):
            if 'NextContinuationToken' in response:
                kwargs = {
                    'ContinuationToken': response['NextContinuationToken']
                }
            else:
                kwargs = {}
            response = self.s3.list_objects_v2(
                Bucket=self._bucket_name_measures,
                **kwargs)
            # FIXME(gordc): this can be streamlined if not details
            for c in response.get('Contents', ()):
                if c['Key'] != self.CFG_PREFIX:
                    __, metric, metric_file = c['Key'].split("/", 2)
                    metric_details[metric] += 1
        return (len(metric_details), sum(metric_details.values()),
                metric_details if details else None)

    def list_metric_with_measures_to_process(self, sack):
        limit = 1000  # 1000 is the default anyway
        metrics = set()
        response = {}
        # Handle pagination
        while response.get('IsTruncated', True):
            if 'NextContinuationToken' in response:
                kwargs = {
                    'ContinuationToken': response['NextContinuationToken']
                }
            else:
                kwargs = {}
            # Delimiter="/" makes S3 roll keys up at the first "/" past
            # the sack prefix, so each metric id comes back once as a
            # CommonPrefixes entry instead of once per measure object.
            response = self.s3.list_objects_v2(
                Bucket=self._bucket_name_measures,
                Prefix=self.get_sack_name(sack),
                Delimiter="/",
                MaxKeys=limit,
                **kwargs)
            for p in response.get('CommonPrefixes', ()):
                metrics.add(p['Prefix'].split('/', 2)[1])
        return metrics

    def _list_measure_files_for_metric_id(self, sack, metric_id):
        files = set()
        response = {}
        while response.get('IsTruncated', True):
            if 'NextContinuationToken' in response:
                kwargs = {
                    'ContinuationToken': response['NextContinuationToken']
                }
            else:
                kwargs = {}
            response = self.s3.list_objects_v2(
                Bucket=self._bucket_name_measures,
                Prefix=(self.get_sack_name(sack)
                        + six.text_type(metric_id) + "/"),
                **kwargs)
            for c in response.get('Contents', ()):
                files.add(c['Key'])
        return files

    def delete_unprocessed_measures_for_metric_id(self, metric_id):
        sack = self.sack_for_metric(metric_id)
        files = self._list_measure_files_for_metric_id(sack, metric_id)
        s3.bulk_delete(self.s3, self._bucket_name_measures, files)

    def has_unprocessed(self, metric):
        sack = self.sack_for_metric(metric.id)
        return bool(self._list_measure_files_for_metric_id(sack, metric.id))

    @contextlib.contextmanager
    def process_measure_for_metric(self, metric):
        sack = self.sack_for_metric(metric.id)
        files = self._list_measure_files_for_metric_id(sack, metric.id)
        measures = []
        for f in files:
            response = self.s3.get_object(
                Bucket=self._bucket_name_measures,
                Key=f)
            measures.extend(
                self._unserialize_measures(f, response['Body'].read()))
        yield measures
        # Now clean objects
        s3.bulk_delete(self.s3, self._bucket_name_measures, files)
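

# Usage sketch (illustrative only): how a metricd-style worker might
# drive this driver. `storage` stands in for a configured S3Storage
# instance and `metric` for an indexer metric object; both names, and
# the `handle` aggregation step, are hypothetical.
#
#     sack = storage.sack_for_metric(metric.id)
#     for metric_id in storage.list_metric_with_measures_to_process(sack):
#         ...
#     if storage.has_unprocessed(metric):
#         with storage.process_measure_for_metric(metric) as measures:
#             # on a clean exit the context manager bulk-deletes the
#             # processed measure objects from the bucket
#             handle(measures)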