Merge "Add opensearch/elasticsearch datastreams support"

Zuul, 2025-01-20 15:07:22 +00:00, committed by Gerrit Code Review
5 changed files with 83 additions and 27 deletions

View File

@@ -52,6 +52,10 @@ elasticsearch_storage_opts = [
                    "should be kept alive.",
               advanced=True,
               default=30, min=0, max=300),
+    cfg.BoolOpt('use_datastream',
+                help='Use a datastream rather than an index. This is useful '
+                     'starting with Elasticsearch 7.17.',
+                default=False),
 ]
 
 CONF.register_opts(elasticsearch_storage_opts, ELASTICSEARCH_STORAGE_GROUP)
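Note that the hunks shown here do not provision anything on the cluster side. Elasticsearch only auto-creates a data stream on first write if an index template with a `data_stream` section already matches the target name; without one, bulk `create` actions fail. A minimal sketch of registering such a template by hand, in the same `requests` style as the client code below; the endpoint, template name and index pattern are illustrative assumptions, not part of this change:

import requests

# Illustrative values; in a real deployment these come from the
# [storage_elasticsearch] connection options.
ES_URL = 'http://localhost:9200'
INDEX_NAME = 'cloudkitty'

def create_datastream_template(sess=None):
    """Register an index template so that the first bulk 'create'
    targeting INDEX_NAME auto-creates a data stream, not an index."""
    sess = sess or requests.Session()
    template = {
        'index_patterns': [INDEX_NAME],
        # An empty data_stream object is enough to mark matching names
        # as data streams; their documents must then carry @timestamp.
        'data_stream': {},
        'priority': 500,
    }
    r = sess.put(
        '/'.join((ES_URL, '_index_template', INDEX_NAME + '-template')),
        json=template)
    r.raise_for_status()
    return r.json()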

View File

@@ -12,11 +12,13 @@
 # License for the specific language governing permissions and limitations
 # under the License.
 #
+from datetime import datetime
 import itertools
 
 from oslo_log import log
 import requests
 
+from cloudkitty.storage.v2 import elasticsearch
 from cloudkitty.storage.v2.elasticsearch import exceptions
 from cloudkitty.utils import json
 
@@ -248,6 +250,10 @@ class ElasticsearchClient(object):
         data = '\n'.join(itertools.chain(
             *[(instruction, json.dumps(term)) for term in terms]
         )) + '\n'
-        url = '/'.join(
-            (self._url, self._index_name, self._mapping_name, '_bulk'))
+        if elasticsearch.CONF.storage_elasticsearch.use_datastream:
+            url = '/'.join(
+                (self._url, self._index_name, '_bulk'))
+        else:
+            url = '/'.join(
+                (self._url, self._index_name, self._mapping_name, '_bulk'))
         return self._req(self._sess.post, url, data, None, deserialize=False)
@@ -259,6 +265,9 @@ class ElasticsearchClient(object):
         :type terms: collections.abc.Iterable
         """
         LOG.debug("Indexing {} documents".format(len(terms)))
-        return self.bulk_with_instruction({"index": {}}, terms)
+        if elasticsearch.CONF.storage_elasticsearch.use_datastream:
+            return self.bulk_with_instruction({"create": {}}, terms)
+        else:
+            return self.bulk_with_instruction({"index": {}}, terms)
 
     def commit(self):
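The switch from "index" to "create" is not stylistic: data streams are append-only, and the bulk API rejects plain "index" actions against them (the OpenSearch client below makes the identical switch). A standalone sketch of the NDJSON payload that bulk_with_instruction assembles, using a hypothetical document:

import itertools
import json

def build_bulk_payload(instruction, terms):
    # Mirrors bulk_with_instruction: one serialized action line per
    # document line, with a terminating newline.
    action = json.dumps(instruction)
    return '\n'.join(itertools.chain(
        *[(action, json.dumps(term)) for term in terms]
    )) + '\n'

doc = {'@timestamp': '2025-01-20T15:07:22', 'type': 'instance', 'qty': 1.0}
print(build_bulk_payload({'create': {}}, [doc]))  # data stream: append only
print(build_bulk_payload({'index': {}}, [doc]))   # classic index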
@@ -275,6 +284,20 @@ class ElasticsearchClient(object):
         :param type_: type of the DataPoint
         :type type_: str
         """
-        self._docs.append({
-            'start': start,
-            'end': end,
+        if elasticsearch.CONF.storage_elasticsearch.use_datastream:
+            self._docs.append({
+                '@timestamp': datetime.now().strftime("%Y-%m-%dT%H:%M:%S"),
+                'start': start,
+                'end': end,
+                'type': type_,
+                'unit': point.unit,
+                'description': point.description,
+                'qty': point.qty,
+                'price': point.price,
+                'groupby': point.groupby,
+                'metadata': point.metadata,
+            })
+        else:
+            self._docs.append({
+                'start': start,
+                'end': end,
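Every document routed into a data stream must carry an @timestamp field, which is the substantive difference between the two branches. A sketch of the document shape the datastream branch produces, with hypothetical field values; note that datetime.now() is timezone-naive, so the recorded timestamp is the local time of the CloudKitty worker at push time:

from datetime import datetime

# Hypothetical values for illustration; in the real code start, end,
# type_ and point come from CloudKitty's rating pipeline.
doc = {
    '@timestamp': datetime.now().strftime("%Y-%m-%dT%H:%M:%S"),
    'start': '2025-01-20T14:00:00',
    'end': '2025-01-20T15:00:00',
    'type': 'instance',
    'unit': 'instance',
    'description': '',
    'qty': 1.0,
    'price': 0.42,
    'groupby': {'project_id': 'abc123'},
    'metadata': {'flavor': 'm1.small'},
}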

View File

@@ -52,6 +52,9 @@ opensearch_storage_opts = [
                    "contexts should be kept alive.",
               advanced=True,
               default=30, min=0, max=300),
+    cfg.BoolOpt('use_datastream',
+                help='Use a datastream rather than an index.',
+                default=False),
 ]
 
 CONF.register_opts(opensearch_storage_opts, OPENSEARCH_STORAGE_GROUP)

View File

@@ -12,11 +12,13 @@
 # License for the specific language governing permissions and limitations
 # under the License.
 #
+from datetime import datetime
 import itertools
 
 from oslo_log import log
 import requests
 
+from cloudkitty.storage.v2 import opensearch
 from cloudkitty.storage.v2.opensearch import exceptions
 from cloudkitty.utils import json
 
@@ -246,8 +248,7 @@ class OpenSearchClient(object):
         data = '\n'.join(itertools.chain(
             *[(instruction, json.dumps(term)) for term in terms]
         )) + '\n'
-        url = '/'.join(
-            (self._url, self._index_name, '_bulk'))
+        url = '/'.join((self._url, self._index_name, '_bulk'))
         return self._req(self._sess.post, url, data, None, deserialize=False)
 
     def bulk_index(self, terms):
@@ -257,6 +258,9 @@ class OpenSearchClient(object):
         :type terms: collections.abc.Iterable
         """
         LOG.debug("Indexing {} documents".format(len(terms)))
-        return self.bulk_with_instruction({"index": {}}, terms)
+        if opensearch.CONF.storage_opensearch.use_datastream:
+            return self.bulk_with_instruction({"create": {}}, terms)
+        else:
+            return self.bulk_with_instruction({"index": {}}, terms)
 
     def commit(self):
@@ -273,6 +277,20 @@ class OpenSearchClient(object):
         :param type_: type of the DataPoint
         :type type_: str
         """
-        self._docs.append({
-            'start': start,
-            'end': end,
+        if opensearch.CONF.storage_opensearch.use_datastream:
+            self._docs.append({
+                '@timestamp': datetime.now().strftime("%Y-%m-%dT%H:%M:%S"),
+                'start': start,
+                'end': end,
+                'type': type_,
+                'unit': point.unit,
+                'description': point.description,
+                'qty': point.qty,
+                'price': point.price,
+                'groupby': point.groupby,
+                'metadata': point.metadata,
+            })
+        else:
+            self._docs.append({
+                'start': start,
+                'end': end,

View File

@@ -0,0 +1,8 @@
+---
+features:
+  - |
+    Adds support to the OpenSearch and Elasticsearch v2 storage backends for
+    using datastreams, rather than indices. These are useful when a cluster
+    has multiple storage types, as data can be rotated from hot to cold storage
+    when not in active use. The option ``use_datastream`` can be set under
+    either ``[storage_elasticsearch]`` or ``[storage_opensearch]``.
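For operators, enabling the feature is then a single flag. A minimal cloudkitty.conf sketch; everything except use_datastream is an illustrative default rather than something introduced by this change:

[storage_elasticsearch]
host = http://localhost:9200
index_name = cloudkitty
use_datastream = true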