From c6b1b9f2115c40be4a77be075844f584c0612795 Mon Sep 17 00:00:00 2001
From: Jacob Cody Wimer <jacob.wimer@gmail.com>
Date: Fri, 25 Dec 2020 09:57:18 -0500
Subject: [PATCH] Changed api response time to milliseconds, updated grafan
 dashbaords, and updated README to reflect that.

---
 README.md                                |   2 +-
 grafana-dashboards/Openstack Health.json | 164 ++++++++++++-----------
 lib/api_metrics.py                       |  29 ++--
 3 files changed, 100 insertions(+), 95 deletions(-)

diff --git a/README.md b/README.md
index f697d56..238b176 100644
--- a/README.md
+++ b/README.md
@@ -37,7 +37,7 @@ openstack_api_status{api_name="horizon",cloud_name="CLOUD_NAME"}
 ### Standard Metrics Provided
 | Metric | Metric Labels | Description|
 | :--- | :--- | :--- |
-| `openstack_api_response_seconds` | `{api_name="API_NAME",cloud_name="CLOUD_NAME"}` | Seconds for the api to respond via openstack sdk. nova, neutron, and cinder are currently recorded. |
+| `openstack_api_response_milliseconds` | `{api_name="API_NAME",cloud_name="CLOUD_NAME"}` | Milliseconds for the api to respond via openstack sdk. nova, neutron, and cinder are currently recorded. |
 | `openstack_api_status` | `{api_name="API_NAME",cloud_name="CLOUD_NAME"}` | Status of the openstack api. 1 = up 0 = down. nova, neutron, and cinder are currently recorded. |
 | `openstack_hypervisor_running_vms` | `{hypervisor_hostname="HYPERVISOR_NAME",cloud_name="CLOUD_NAME",aggregate="AGGREGATE_NAME"}` | Number of running VMs on every hypervisor in the region. |
 | `openstack_hypervisor_used_ram_mb` | `{hypervisor_hostname="HYPERVISOR_NAME",cloud_name="CLOUD_NAME",aggregate="AGGREGATE_NAME"}` | Amount of RAM in MB used (as reported by nova-compute) for every hypervisor in the region. |
diff --git a/grafana-dashboards/Openstack Health.json b/grafana-dashboards/Openstack Health.json
index b38924d..55f0d74 100644
--- a/grafana-dashboards/Openstack Health.json	
+++ b/grafana-dashboards/Openstack Health.json	
@@ -64,7 +64,7 @@
   "gnetId": null,
   "graphTooltip": 0,
   "id": null,
-  "iteration": 1606267613619,
+  "iteration": 1608835196471,
   "links": [],
   "panels": [
     {
@@ -361,7 +361,7 @@
         "#d44a3a"
       ],
       "datasource": "${DS_PROMETHEUS}",
-      "format": "none",
+      "format": "ms",
       "gauge": {
         "maxValue": 100,
         "minValue": 0,
@@ -393,7 +393,7 @@
       "nullPointMode": "connected",
       "nullText": null,
       "options": {},
-      "postfix": " Seconds",
+      "postfix": "",
       "postfixFontSize": "50%",
       "prefix": "",
       "prefixFontSize": "50%",
@@ -409,12 +409,12 @@
       "tableColumn": "",
       "targets": [
         {
-          "expr": "openstack_api_response_seconds{api_name=\"nova\", cloud_name=\"$cloud\"}",
+          "expr": "openstack_api_response_milliseconds{api_name=\"nova\", cloud_name=\"$cloud\"}",
           "instant": false,
           "refId": "A"
         }
       ],
-      "thresholds": "5,10",
+      "thresholds": "5000,10000",
       "timeFrom": null,
       "timeShift": null,
       "title": "Nova API Avg Response Time",
@@ -439,7 +439,8 @@
         "#d44a3a"
       ],
       "datasource": "${DS_PROMETHEUS}",
-      "format": "none",
+      "decimals": null,
+      "format": "ms",
       "gauge": {
         "maxValue": 100,
         "minValue": 0,
@@ -471,7 +472,7 @@
       "nullPointMode": "connected",
       "nullText": null,
       "options": {},
-      "postfix": " Seconds",
+      "postfix": "",
       "postfixFontSize": "50%",
       "prefix": "",
       "prefixFontSize": "50%",
@@ -487,12 +488,12 @@
       "tableColumn": "",
       "targets": [
         {
-          "expr": "openstack_api_response_seconds{api_name=\"neutron\", cloud_name=\"$cloud\"}",
+          "expr": "openstack_api_response_milliseconds{api_name=\"neutron\", cloud_name=\"$cloud\"}",
           "instant": false,
           "refId": "A"
         }
       ],
-      "thresholds": "5,10",
+      "thresholds": "5000,10000",
       "timeFrom": null,
       "timeShift": null,
       "title": "Neutron API Avg Response Time",
@@ -517,7 +518,7 @@
         "#d44a3a"
       ],
       "datasource": "${DS_PROMETHEUS}",
-      "format": "none",
+      "format": "ms",
       "gauge": {
         "maxValue": 100,
         "minValue": 0,
@@ -549,7 +550,7 @@
       "nullPointMode": "connected",
       "nullText": null,
       "options": {},
-      "postfix": " Seconds",
+      "postfix": "",
       "postfixFontSize": "50%",
       "prefix": "",
       "prefixFontSize": "50%",
@@ -565,12 +566,12 @@
       "tableColumn": "",
       "targets": [
         {
-          "expr": "openstack_api_response_seconds{api_name=\"cinder\", cloud_name=\"$cloud\"}",
+          "expr": "openstack_api_response_milliseconds{api_name=\"cinder\", cloud_name=\"$cloud\"}",
           "instant": false,
           "refId": "A"
         }
       ],
-      "thresholds": "5,10",
+      "thresholds": "5000,10000",
       "timeFrom": null,
       "timeShift": null,
       "title": "Cinder API Avg Response Time",
@@ -595,7 +596,7 @@
         "#d44a3a"
       ],
       "datasource": "${DS_PROMETHEUS}",
-      "format": "none",
+      "format": "s",
       "gauge": {
         "maxValue": 100,
         "minValue": 0,
@@ -627,7 +628,7 @@
       "nullPointMode": "connected",
       "nullText": null,
       "options": {},
-      "postfix": " Seconds",
+      "postfix": "",
       "postfixFontSize": "50%",
       "prefix": "",
       "prefixFontSize": "50%",
@@ -648,7 +649,7 @@
           "refId": "A"
         }
       ],
-      "thresholds": "5,10",
+      "thresholds": "8,12",
       "timeFrom": null,
       "timeShift": null,
       "title": "Horizon API Avg Response Time",
@@ -678,10 +679,10 @@
       "type": "row"
     },
     {
-      "content": "\n# Current Status\n\nAPIs marked as \"Good\" and in green have a current 10 minute average response time of below 5 seconds. \n\nAPIs marked as \"Degraded\" and in orange have a current 10 minute average response time of above 5 seconds and below 8 seconds.\n\nAPIs marked as \"Unusable\" and in red have a current 10 minute average response time above 8 seconds.\n\n\n",
+      "content": "\n# API Current Status\n\nAPIs marked as \"Good\" and in green have a current 10 minute average response time of below 5000 milliseconds. \n\nAPIs marked as \"Degraded\" and in orange have a current 10 minute average response time of above 5000 seconds and below 10000 milliseconds.\n\nAPIs marked as \"Unusable\" and in red have a current 10 minute average response time above 10000 milliseconds.\n\n# Horizon Current Status\n\nHorizon marked as \"Good\" and in green have a current 10 minute average response time of below 8 seconds. \n\nHorizon marked as \"Degraded\" and in orange have a current 10 minute average response time of above 8 seconds and below 12 seconds.\n\nHorizon marked as \"Unusable\" and in red have a current 10 minute average response time above 12 seconds.\n",
       "datasource": "${DS_PROMETHEUS}",
       "gridPos": {
-        "h": 4,
+        "h": 8,
         "w": 12,
         "x": 0,
         "y": 21
@@ -718,7 +719,7 @@
         "h": 3,
         "w": 3,
         "x": 0,
-        "y": 25
+        "y": 29
       },
       "id": 11,
       "interval": null,
@@ -746,15 +747,15 @@
         {
           "from": "0",
           "text": "Good",
-          "to": "4.99"
-        },
-        {
-          "from": "5",
-          "text": "Degraded",
           "to": "7.99"
         },
         {
           "from": "8",
+          "text": "Degraded",
+          "to": "11.99"
+        },
+        {
+          "from": "12",
           "text": "Unusable",
           "to": "600"
         }
@@ -775,7 +776,7 @@
           "refId": "A"
         }
       ],
-      "thresholds": "5,8",
+      "thresholds": "8,12",
       "timeFrom": null,
       "timeShift": null,
       "title": "Horizon Response Time",
@@ -800,7 +801,7 @@
         "#d44a3a"
       ],
       "datasource": "${DS_PROMETHEUS}",
-      "format": "none",
+      "format": "ms",
       "gauge": {
         "maxValue": 100,
         "minValue": 0,
@@ -812,7 +813,7 @@
         "h": 3,
         "w": 3,
         "x": 3,
-        "y": 25
+        "y": 29
       },
       "id": 10,
       "interval": null,
@@ -840,17 +841,17 @@
         {
           "from": "0",
           "text": "Good",
-          "to": "4.99"
+          "to": "4999.99"
         },
         {
-          "from": "5",
+          "from": "5000",
           "text": "Degraded",
-          "to": "9.99"
+          "to": "9999.99"
         },
         {
-          "from": "10",
+          "from": "10000",
           "text": "Unusable",
-          "to": "600"
+          "to": "600000"
         }
       ],
       "sparkline": {
@@ -864,12 +865,12 @@
       "tableColumn": "",
       "targets": [
         {
-          "expr": "avg_over_time(openstack_api_response_seconds{api_name=\"nova\", cloud_name=\"$cloud\"}[10m])",
+          "expr": "avg_over_time(openstack_api_response_milliseconds{api_name=\"nova\", cloud_name=\"$cloud\"}[10m])",
           "instant": true,
           "refId": "A"
         }
       ],
-      "thresholds": "5,10",
+      "thresholds": "5000,10000",
       "timeFrom": null,
       "timeShift": null,
       "title": "Nova API Response Time",
@@ -906,7 +907,7 @@
         "h": 3,
         "w": 3,
         "x": 6,
-        "y": 25
+        "y": 29
       },
       "id": 14,
       "interval": null,
@@ -934,17 +935,17 @@
         {
           "from": "0",
           "text": "Good",
-          "to": "4.99"
+          "to": "4999.99"
         },
         {
-          "from": "5",
+          "from": "5000",
           "text": "Degraded",
-          "to": "9.99"
+          "to": "9999.99"
         },
         {
-          "from": "10",
+          "from": "10000",
           "text": "Unusable",
-          "to": "600"
+          "to": "600000"
         }
       ],
       "sparkline": {
@@ -958,12 +959,12 @@
       "tableColumn": "",
       "targets": [
         {
-          "expr": "avg_over_time(openstack_api_response_seconds{api_name=\"neutron\", cloud_name=\"$cloud\"}[10m])",
+          "expr": "avg_over_time(openstack_api_response_milliseconds{api_name=\"neutron\", cloud_name=\"$cloud\"}[10m])",
           "instant": true,
           "refId": "A"
         }
       ],
-      "thresholds": "5,10",
+      "thresholds": "5000,10000",
       "timeFrom": null,
       "timeShift": null,
       "title": "Neutron API Response Time",
@@ -1000,7 +1001,7 @@
         "h": 3,
         "w": 3,
         "x": 9,
-        "y": 25
+        "y": 29
       },
       "id": 18,
       "interval": null,
@@ -1028,17 +1029,17 @@
         {
           "from": "0",
           "text": "Good",
-          "to": "4.99"
+          "to": "4999.99"
         },
         {
-          "from": "5",
+          "from": "5000",
           "text": "Degraded",
-          "to": "9.99"
+          "to": "9999.99"
         },
         {
-          "from": "10",
+          "from": "10000",
           "text": "Unusable",
-          "to": "600"
+          "to": "600000"
         }
       ],
       "sparkline": {
@@ -1052,12 +1053,12 @@
       "tableColumn": "",
       "targets": [
         {
-          "expr": "avg_over_time(openstack_api_response_seconds{api_name=\"cinder\", cloud_name=\"$cloud\"}[10m])",
+          "expr": "avg_over_time(openstack_api_response_milliseconds{api_name=\"cinder\", cloud_name=\"$cloud\"}[10m])",
           "instant": true,
           "refId": "A"
         }
       ],
-      "thresholds": "5,10",
+      "thresholds": "5000,10000",
       "timeFrom": null,
       "timeShift": null,
       "title": "Cinder API Response Time",
@@ -1094,7 +1095,7 @@
         "h": 3,
         "w": 3,
         "x": 0,
-        "y": 28
+        "y": 32
       },
       "id": 12,
       "interval": null,
@@ -1188,7 +1189,7 @@
         "h": 3,
         "w": 3,
         "x": 3,
-        "y": 28
+        "y": 32
       },
       "id": 13,
       "interval": null,
@@ -1282,7 +1283,7 @@
         "h": 3,
         "w": 3,
         "x": 6,
-        "y": 28
+        "y": 32
       },
       "id": 15,
       "interval": null,
@@ -1376,7 +1377,7 @@
         "h": 3,
         "w": 3,
         "x": 9,
-        "y": 28
+        "y": 32
       },
       "id": 19,
       "interval": null,
@@ -1455,7 +1456,7 @@
         "h": 1,
         "w": 24,
         "x": 0,
-        "y": 31
+        "y": 35
       },
       "id": 28,
       "panels": [],
@@ -1474,7 +1475,7 @@
         "h": 8,
         "w": 12,
         "x": 0,
-        "y": 32
+        "y": 36
       },
       "id": 30,
       "legend": {
@@ -1560,7 +1561,7 @@
         "h": 8,
         "w": 12,
         "x": 12,
-        "y": 32
+        "y": 36
       },
       "id": 31,
       "legend": {
@@ -1646,7 +1647,7 @@
         "h": 8,
         "w": 12,
         "x": 0,
-        "y": 40
+        "y": 44
       },
       "id": 32,
       "legend": {
@@ -1732,7 +1733,7 @@
         "h": 8,
         "w": 12,
         "x": 12,
-        "y": 40
+        "y": 44
       },
       "id": 33,
       "legend": {
@@ -1813,7 +1814,7 @@
         "h": 1,
         "w": 24,
         "x": 0,
-        "y": 48
+        "y": 52
       },
       "id": 6,
       "panels": [],
@@ -1832,7 +1833,7 @@
         "h": 9,
         "w": 12,
         "x": 0,
-        "y": 49
+        "y": 53
       },
       "id": 2,
       "legend": {
@@ -1860,7 +1861,7 @@
       "steppedLine": false,
       "targets": [
         {
-          "expr": "openstack_api_response_seconds{api_name=\"nova\", cloud_name=\"$cloud\"}",
+          "expr": "openstack_api_response_milliseconds{api_name=\"nova\", cloud_name=\"$cloud\"}",
           "legendFormat": "{{ app }}",
           "refId": "A"
         }
@@ -1885,7 +1886,8 @@
       },
       "yaxes": [
         {
-          "format": "short",
+          "decimals": 1,
+          "format": "ms",
           "label": null,
           "logBase": 1,
           "max": null,
@@ -1918,7 +1920,7 @@
         "h": 9,
         "w": 12,
         "x": 12,
-        "y": 49
+        "y": 53
       },
       "id": 16,
       "legend": {
@@ -1946,7 +1948,7 @@
       "steppedLine": false,
       "targets": [
         {
-          "expr": "openstack_api_response_seconds{api_name=\"neutron\", cloud_name=\"$cloud\"}",
+          "expr": "openstack_api_response_milliseconds{api_name=\"neutron\", cloud_name=\"$cloud\"}",
           "legendFormat": "{{ app }}",
           "refId": "A"
         }
@@ -1971,7 +1973,7 @@
       },
       "yaxes": [
         {
-          "format": "short",
+          "format": "ms",
           "label": null,
           "logBase": 1,
           "max": null,
@@ -1979,7 +1981,7 @@
           "show": true
         },
         {
-          "format": "short",
+          "format": "ms",
           "label": null,
           "logBase": 1,
           "max": null,
@@ -2004,7 +2006,7 @@
         "h": 9,
         "w": 12,
         "x": 0,
-        "y": 58
+        "y": 62
       },
       "id": 17,
       "legend": {
@@ -2032,7 +2034,7 @@
       "steppedLine": false,
       "targets": [
         {
-          "expr": "openstack_api_response_seconds{api_name=\"cinder\", cloud_name=\"$cloud\"}",
+          "expr": "openstack_api_response_milliseconds{api_name=\"cinder\", cloud_name=\"$cloud\"}",
           "legendFormat": "{{ app }}",
           "refId": "A"
         }
@@ -2057,7 +2059,7 @@
       },
       "yaxes": [
         {
-          "format": "short",
+          "format": "ms",
           "label": null,
           "logBase": 1,
           "max": null,
@@ -2065,7 +2067,7 @@
           "show": true
         },
         {
-          "format": "short",
+          "format": "ms",
           "label": null,
           "logBase": 1,
           "max": null,
@@ -2090,7 +2092,7 @@
         "h": 9,
         "w": 12,
         "x": 12,
-        "y": 58
+        "y": 62
       },
       "id": 4,
       "legend": {
@@ -2143,7 +2145,7 @@
       },
       "yaxes": [
         {
-          "format": "short",
+          "format": "s",
           "label": null,
           "logBase": 1,
           "max": null,
@@ -2151,7 +2153,7 @@
           "show": true
         },
         {
-          "format": "short",
+          "format": "s",
           "label": null,
           "logBase": 1,
           "max": null,
@@ -2171,7 +2173,7 @@
         "h": 1,
         "w": 24,
         "x": 0,
-        "y": 67
+        "y": 71
       },
       "id": 60,
       "panels": [],
@@ -2190,7 +2192,7 @@
         "h": 8,
         "w": 12,
         "x": 0,
-        "y": 68
+        "y": 72
       },
       "id": 62,
       "legend": {
@@ -2244,7 +2246,7 @@
       },
       "yaxes": [
         {
-          "format": "short",
+          "format": "s",
           "label": null,
           "logBase": 1,
           "max": null,
@@ -2252,7 +2254,7 @@
           "show": true
         },
         {
-          "format": "short",
+          "format": "s",
           "label": null,
           "logBase": 1,
           "max": null,
@@ -2276,14 +2278,14 @@
         "allValue": null,
         "current": {},
         "datasource": "${DS_PROMETHEUS}",
-        "definition": "label_values(openstack_api_response_seconds, cloud_name)",
+        "definition": "label_values(openstack_api_status, cloud_name)",
         "hide": 0,
         "includeAll": false,
         "label": "Cloud",
         "multi": false,
         "name": "cloud",
         "options": [],
-        "query": "label_values(openstack_api_response_seconds, cloud_name)",
+        "query": "label_values(openstack_api_status, cloud_name)",
         "refresh": 1,
         "regex": "",
         "skipUrlSync": false,
@@ -2317,5 +2319,5 @@
   "timezone": "",
   "title": "Openstack Health",
   "uid": "so14pR0Mz",
-  "version": 7
+  "version": 11
 }
\ No newline at end of file
diff --git a/lib/api_metrics.py b/lib/api_metrics.py
index c22407c..10a1865 100644
--- a/lib/api_metrics.py
+++ b/lib/api_metrics.py
@@ -5,19 +5,20 @@ import datetime
 import traceback
 import prometheus_client as prom
 
-api_metrics = prom.Gauge('openstack_api_response_seconds', 'Time for openstack api to execute.', ['api_name','cloud_name'])
+api_metrics = prom.Gauge('openstack_api_response_milliseconds', 'Time for openstack api to execute in milliseconds.', ['api_name','cloud_name'])
 api_status = prom.Gauge('openstack_api_status', 'API current status. 1 = up 0 = down.',['api_name','cloud_name'])
 
 def generate_nova_metrics(connection,cloud_name):
     try:
         start_time = datetime.datetime.now()
         for server in connection.compute.servers():
-            name = server
+            name = server.name
+            break
         end_time = datetime.datetime.now()
         time_took = end_time - start_time
-        seconds_took = time_took.seconds
-        print(f'Nova took {seconds_took} seconds')
-        api_metrics.labels('nova',cloud_name).set(seconds_took)
+        milliseconds_took = time_took.microseconds / 1000
+        print(f'Nova took {milliseconds_took} milliseconds')
+        api_metrics.labels('nova',cloud_name).set(milliseconds_took)
         api_status.labels('nova',cloud_name).set(1)
     except:
         print(traceback.print_exc())
@@ -29,12 +30,13 @@ def generate_neutron_metrics(connection,cloud_name):
         project = connection.current_project
         start_time = datetime.datetime.now()
         for network in connection.network.networks(project_id=project.id):
-            name = network
+            name = network.name
+            break
         end_time = datetime.datetime.now()
         time_took = end_time - start_time
-        seconds_took = time_took.seconds
-        print(f'Neutron took {seconds_took} seconds')
-        api_metrics.labels('neutron',cloud_name).set(seconds_took)
+        milliseconds_took = time_took.microseconds / 1000
+        print(f'Neutron took {milliseconds_took} milliseconds')
+        api_metrics.labels('neutron',cloud_name).set(milliseconds_took)
         api_status.labels('neutron',cloud_name).set(1)
     except:
         print(traceback.print_exc())
@@ -45,12 +47,13 @@ def generate_cinder_metrics(connection,cloud_name):
     try:
         start_time = datetime.datetime.now()
         for volume in  connection.volume.volumes():
-            name = volume
+            name = volume.name
+            break
         end_time = datetime.datetime.now()
         time_took = end_time - start_time
-        seconds_took = time_took.seconds
-        print(f'Cinder took {seconds_took} seconds')
-        api_metrics.labels('cinder',cloud_name).set(seconds_took)
+        milliseconds_took = time_took.microseconds / 1000
+        print(f'Cinder took {milliseconds_took} milliseconds')
+        api_metrics.labels('cinder',cloud_name).set(milliseconds_took)
         api_status.labels('cinder',cloud_name).set(1)
     except:
         print(traceback.print_exc())