Create new metrics earlier #888
base: master
@@ -90,64 +90,67 @@ def getbatch(self, maxsize=1):
 tagQueue = TagQueue(maxsize=settings.TAG_QUEUE_SIZE, update_interval=settings.TAG_UPDATE_INTERVAL)


-def writeCachedDataPoints():
-  "Write datapoints until the MetricCache is completely empty"
-
-  cache = MetricCache()
-  while cache:
-    (metric, datapoints) = cache.drain_metric()
-    if metric is None:
-      # end the loop
-      break
-
-    dbFileExists = state.database.exists(metric)
-
-    if not dbFileExists:
-      if CREATE_BUCKET and not CREATE_BUCKET.drain(1):
-        # If our tokenbucket doesn't have enough tokens available to create a new metric
-        # file then we'll just drop the metric on the ground and move on to the next
-        # metric.
-        # XXX This behavior should probably be configurable to no tdrop metrics
-        # when rate limitng unless our cache is too big or some other legit
-        # reason.
-        instrumentation.increment('droppedCreates')
-        continue
-
-      archiveConfig = None
-      xFilesFactor, aggregationMethod = None, None
-
-      for schema in SCHEMAS:
-        if schema.matches(metric):
-          if settings.LOG_CREATES:
-            log.creates('new metric %s matched schema %s' % (metric, schema.name))
-          archiveConfig = [archive.getTuple() for archive in schema.archives]
-          break
-
-      for schema in AGGREGATION_SCHEMAS:
-        if schema.matches(metric):
-          if settings.LOG_CREATES:
-            log.creates('new metric %s matched aggregation schema %s'
-                        % (metric, schema.name))
-          xFilesFactor, aggregationMethod = schema.archives
-          break
-
-      if not archiveConfig:
-        raise Exception(("No storage schema matched the metric '%s',"
-                         " check your storage-schemas.conf file.") % metric)
-
-      if settings.LOG_CREATES:
-        log.creates("creating database metric %s (archive=%s xff=%s agg=%s)" %
-                    (metric, archiveConfig, xFilesFactor, aggregationMethod))
-      try:
-        state.database.create(metric, archiveConfig, xFilesFactor, aggregationMethod)
-        if settings.ENABLE_TAGS:
-          tagQueue.add(metric)
-        instrumentation.increment('creates')
-      except Exception as e:
-        log.err()
-        log.msg("Error creating %s: %s" % (metric, e))
-        instrumentation.increment('errors')
-        continue
+def create_database(metric):
+  if CREATE_BUCKET and not CREATE_BUCKET.drain(1):
+    # If our tokenbucket doesn't have enough tokens available to create a new metric
+    # file then we'll just drop the metric on the ground and move on to the next
+    # metric.
+    # XXX This behavior should probably be configurable to not drop metrics
+    # when rate limiting unless our cache is too big or some other legit
+    # reason.
+    instrumentation.increment('droppedCreates')
+    return
+
+  archiveConfig = None
+  xFilesFactor, aggregationMethod = None, None
+
+  for schema in SCHEMAS:
+    if schema.matches(metric):
+      if settings.LOG_CREATES:
+        log.creates('new metric %s matched schema %s' % (metric, schema.name))
+      archiveConfig = [archive.getTuple() for archive in schema.archives]
+      break
+
+  for schema in AGGREGATION_SCHEMAS:
+    if schema.matches(metric):
+      if settings.LOG_CREATES:
+        log.creates('new metric %s matched aggregation schema %s'
+                    % (metric, schema.name))
+      xFilesFactor, aggregationMethod = schema.archives
+      break
+
+  if not archiveConfig:
+    raise Exception(("No storage schema matched the metric '%s',"
+                     " check your storage-schemas.conf file.") % metric)
+
+  if settings.LOG_CREATES:
+    log.creates("creating database metric %s (archive=%s xff=%s agg=%s)" %
+                (metric, archiveConfig, xFilesFactor, aggregationMethod))
+
+  try:
+    state.database.create(metric, archiveConfig, xFilesFactor, aggregationMethod)
+    if settings.ENABLE_TAGS:
+      tagQueue.add(metric)
+    instrumentation.increment('creates')
+  except Exception as e:
+    log.err()
+    log.msg("Error creating %s: %s" % (metric, e))
+    instrumentation.increment('errors')
+
+
+def writeCachedDataPoints():
+  "Write datapoints until the MetricCache is completely empty"
+
+  cache = MetricCache()
+  while cache:
+    new_metric = cache.pop_new_metric()
+    if not state.database.exists(new_metric):
+      create_database(new_metric)
+
+    (metric, datapoints) = cache.drain_metric()
+    if metric is None:
+      # end the loop
+      break
Reviewer: This will only create new files as long as there are also updates to process, is that what we want?

Author: Not sure if I am following: new files are created first, on every loop; the break comes later. Notice that the diff is kinda screwed, the part with the break is old code.

Reviewer: Imagine if there is more to get from ... but that seems impossible, there can't be more new metrics than total cached metrics, right? But I understand how one might be unsure when looking at this code in isolation. Here's another question: is it possible for ...? I also have an alternate design idea: keep the original logic here in this loop, and instead modify ...

Author: Yup, that should be impossible.

Yes, that is possible when the MAX_CREATES_PER_MINUTE limiter is hit. This is on purpose; currently the metrics get dropped as well, see the old XXX TODO part.

That is exactly what the naive strategy does. That one is not efficient, as it does not write the metric with the most datapoints, resulting in small writes. The cache doesn't know if a metric is really new (as in not on disk); it can only see that it is not in the cache dict. I didn't want to add IO to the cache thread to check if it is on disk; no particular reason, it just felt bad to mix it. Maybe it would be better?

Reviewer: Hmm, you're exactly right ... my idea was equivalent to the existing naive strategy. That is an intriguing idea, doing the ... I don't have any better ideas, maybe your current method will work well in practice :)
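To make the idea in this exchange concrete, here is a minimal, hypothetical sketch of a cache that tracks names it has not seen in its dict before. The class, attribute, and metric names below are invented for illustration only; the real MetricCache in carbon is not part of this diff and may work differently.

class NewMetricTrackingCache(dict):
  """Hypothetical sketch only: remembers which metric names were not in the
  cache dict when first stored, so a writer loop can pop them and create
  their database files early."""

  def __init__(self):
    super().__init__()
    self.new_metrics = []  # names first seen since the last pop

  def store(self, metric, datapoint):
    if metric not in self:
      # "new" only means "not in the cache dict yet", not "missing on disk"
      self.new_metrics.append(metric)
    self.setdefault(metric, []).append(datapoint)

  def pop_new_metric(self):
    # raises IndexError when nothing new is queued (see the review note further down)
    return self.new_metrics.pop()

cache = NewMetricTrackingCache()
cache.store('carbon.agents.host-a.cpuUsage', (1700000000, 0.42))
print(cache.pop_new_metric())  # -> 'carbon.agents.host-a.cpuUsage'

Newness here only means the name was absent from the cache dict; as the author notes, checking whether the file already exists on disk would require IO in the cache thread, which this design deliberately avoids.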

     # If we've got a rate limit configured lets makes sure we enforce it
     waitTime = 0
@@ -166,6 +169,10 @@ def writeCachedDataPoints():
       if settings.ENABLE_TAGS:
         tagQueue.update(metric)
       updateTime = time.time() - t1
+    except FileNotFoundError:  # don't log full stack trace when the db does not exist.
+      log.msg("Error writing %s: File does not exist (yet). " % metric +
+              "Increase MAX_CREATES_PER_MINUTE")
+      instrumentation.increment('errors')
     except Exception as e:
       log.err()
       log.msg("Error writing to %s: %s" % (metric, e))
Reviewer: This can raise "IndexError: pop from empty list", which does not appear to be handled where this is called.

Author: Thanks, it was caught later on and not logged, so it got lost. Changed the code so we log exceptions and handled this.
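For illustration, a sketch of a guarded version of the per-iteration "create new metric files first" step follows. It reuses names from the diff above (cache.pop_new_metric, state.database, create_database, log), but the helper name and the exact handling are assumptions, not the code that landed in the PR.

def maybe_create_new_metric(cache):
  # Sketch only: guard pop_new_metric() so "nothing new queued" is a no-op
  # instead of an unhandled IndexError, and log other failures.
  try:
    new_metric = cache.pop_new_metric()
  except IndexError:
    return  # no new metrics queued this iteration
  except Exception:
    log.err()  # log instead of silently losing the error
    return
  if not state.database.exists(new_metric):
    create_database(new_metric)

Treating the empty queue as a no-op keeps the shape of the loop in the diff (at most one create attempt per drained metric) while making this failure mode explicit.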