Add separate influxrepo for legacy clusters

-Reasons include legacy flux queries and bucket definitions
2026-06-26 20:20:38 +02:00 · 2022-03-18 12:57:57 +01:00
parent ed18df2ecf
commit 7632f10f2b
3 changed files with 245 additions and 52 deletions
@@ -0,0 +1,216 @@
+package metricdata
+
+import (
+	"context"
+	"errors"
+	"fmt"
+	"log"
+	"strings"
+	"time"
+	"crypto/tls"
+	"encoding/json"
+
+	"github.com/ClusterCockpit/cc-backend/config"
+	"github.com/ClusterCockpit/cc-backend/schema"
+	influxdb2 "github.com/influxdata/influxdb-client-go/v2"
+	influxdb2Api "github.com/influxdata/influxdb-client-go/v2/api"
+)
+
+// LegacyInfluxDBv2DataRepositoryConfig is the JSON configuration decoded by
+// LegacyInfluxDBv2DataRepository.Init.
+//
+// Url and Token are handed to the InfluxDB client, Org selects the query API,
+// Bucket and Measurement are inserted into the generated Flux queries, and
+// SkipTls is used as the client's tls.Config.InsecureSkipVerify setting.
+type LegacyInfluxDBv2DataRepositoryConfig struct {
+	Url         string `json:"url"`
+	Token       string `json:"token"`
+	Bucket      string `json:"bucket"`
+	Org         string `json:"org"`
+	Measurement string `json:"measurement"`
+	SkipTls     bool   `json:"skiptls"`
+}
+
+// LegacyInfluxDBv2DataRepository is the metric data repository selected by the
+// "legacyinfluxdb" kind. All fields are populated by Init.
+type LegacyInfluxDBv2DataRepository struct {
+	// client is the InfluxDB v2 client created from the configured URL and token.
+	client influxdb2.Client
+	// queryClient is the query API obtained from client for the configured organization.
+	queryClient influxdb2Api.QueryAPI
+	// bucket is the bucket name inserted into every generated Flux query.
+	bucket string
+	// measurement is the measurement name the generated Flux queries filter on.
+	measurement string
+}
+
+func (idb *LegacyInfluxDBv2DataRepository) Init(rawConfig json.RawMessage) error {
+	var config LegacyInfluxDBv2DataRepositoryConfig
+	if err := json.Unmarshal(rawConfig, &config); err != nil {
+		return err
+	}
+
+	idb.client 			= influxdb2.NewClientWithOptions(config.Url, config.Token, influxdb2.DefaultOptions().SetTLSConfig(&tls.Config {InsecureSkipVerify: config.SkipTls,} ))
+	idb.queryClient = idb.client.QueryAPI(config.Org)
+	idb.bucket      = config.Bucket
+  idb.measurement = config.Measurement
+
+	return nil
+}
+
+func (idb *LegacyInfluxDBv2DataRepository) formatTime(t time.Time) string {
+	return t.Format(time.RFC3339) // Like “2006-01-02T15:04:05Z07:00”
+}
+
+func (idb *LegacyInfluxDBv2DataRepository) epochToTime(epoch int64) time.Time {
+	return time.Unix(epoch, 0)
+}
+
+func (idb *LegacyInfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string, scopes []schema.MetricScope, ctx context.Context) (schema.JobData, error) {
+
+	fieldsConds := make([]string, 0, len(metrics))
+	for _, m := range metrics {
+		fieldsConds = append(fieldsConds, fmt.Sprintf(`r["_field"] == "%s"`, m))
+	}
+	fieldsCond := strings.Join(fieldsConds, " or ")
+
+	hostsConds := make([]string, 0, len(job.Resources))
+	for _, h := range job.Resources {
+		if h.HWThreads != nil || h.Accelerators != nil {
+			return nil, errors.New("the legacy InfluxDB metric data repository does not support HWThreads or Accelerators")
+		}
+
+		hostsConds = append(hostsConds, fmt.Sprintf(`r["host"] == "%s"`, h.Hostname))
+	}
+	hostsCond := strings.Join(hostsConds, " or ")
+
+	query := fmt.Sprintf(`
+		from(bucket: "%s")
+	  |> range(start: %s, stop: %s)
+	  |> filter(fn: (r) => r["_measurement"] == "%s" )
+	  |> filter(fn: (r) => %s )
+	  |> filter(fn: (r) => %s )
+	  |> drop(columns: ["_start", "_stop", "_measurement"])`,
+	 	idb.bucket,
+	 	idb.formatTime(job.StartTime), idb.formatTime(idb.epochToTime(job.StartTimeUnix + int64(job.Duration) + int64(1) )),
+	 	idb.measurement, hostsCond, fieldsCond)
+
+	rows, err := idb.queryClient.Query(ctx, query)
+	if err != nil {
+		return nil, err
+	}
+
+	jobData := make(schema.JobData) // map[<string>FIELD]map[<MetricScope>SCOPE]<*JobMetric>METRIC
+	scope 	:= schema.MetricScope("node") // Legacy Clusters only have Node Scope
+
+	for _, met := range metrics {
+		 	jobMetric, ok := jobData[met]
+		 	if !ok {
+		 			mc 		:= config.GetMetricConfig(job.Cluster, met)
+		 			jobMetric = map[schema.MetricScope]*schema.JobMetric{
+		 					scope: { // uses scope var from above
+		 							Unit:     mc.Unit,
+		 							Scope:    "node", // Legacy Clusters only have Node Scope
+		 							Timestep: mc.Timestep,
+		 							Series:   make([]schema.Series, 0, len(job.Resources)),
+		 							StatisticsSeries: nil, // Should be: &schema.StatsSeries{},
+		 					},
+		 			}
+		 	}
+			jobData[met] = jobMetric
+	}
+
+	field, host, hostSeries := "", "", schema.Series{}
+
+	for rows.Next() {
+		row := rows.Record()
+		if ( host == "" || host != row.ValueByKey("host").(string) || rows.TableChanged() ) {
+				if ( host != "" ) {
+				  	jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries) // add to jobData before resetting
+				}
+				// (Re-)Set new Series
+				field, host = row.Field(), row.ValueByKey("host").(string)
+				hostSeries  = schema.Series{
+						Hostname:   host,
+						Statistics: nil,
+						Data:       make([]schema.Float, 0),
+				}
+		}
+		val := row.Value().(float64)
+		hostSeries.Data = append(hostSeries.Data, schema.Float(val))
+	}
+
+  jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries)
+
+	stats, err := idb.LoadStats(job, metrics, ctx)
+	if err != nil {
+		return nil, err
+	}
+
+	for metric, nodes := range stats {
+		for node, stats := range nodes {
+			for index, _ := range jobData[metric][scope].Series {
+				if jobData[metric][scope].Series[index].Hostname == node {
+					jobData[metric][scope].Series[index].Statistics = &schema.MetricStatistics{Avg: stats.Avg, Min: stats.Min, Max: stats.Max}
+				}
+			}
+		}
+	}
+
+	// DEBUG:
+	// for _, met := range metrics {
+	//    for _, series := range jobData[met][scope].Series {
+	//    log.Println(fmt.Sprintf("<< Result: %d data points for metric %s on %s, Stats: Min %.2f, Max %.2f, Avg %.2f >>",
+	// 		 	len(series.Data), met, series.Hostname,
+	// 			series.Statistics.Min, series.Statistics.Max, series.Statistics.Avg))
+  //    }
+	// }
+	return jobData, nil
+}
+
+func (idb *LegacyInfluxDBv2DataRepository) LoadStats(job *schema.Job, metrics []string, ctx context.Context) (map[string]map[string]schema.MetricStatistics, error) {
+
+	stats := map[string]map[string]schema.MetricStatistics{}
+
+	hostsConds := make([]string, 0, len(job.Resources))
+	for _, h := range job.Resources {
+			if h.HWThreads != nil || h.Accelerators != nil {
+					return nil, errors.New("the legacy InfluxDB metric data repository does not support HWThreads or Accelerators")
+			}
+
+			hostsConds = append(hostsConds, fmt.Sprintf(`r.host == "%s"`, h.Hostname))
+	}
+	hostsCond := strings.Join(hostsConds, " or ")
+
+	for _, metric := range metrics {
+			query := fmt.Sprintf(`
+				  data = from(bucket: "%s")
+				  |> range(start: %s, stop: %s)
+				  |> filter(fn: (r) => r._measurement == "%s" and r._field == "%s" and (%s))
+				  union(tables: [data |> mean(column: "_value") |> set(key: "_field", value: "avg"),
+				                 data |>  min(column: "_value") |> set(key: "_field", value: "min"),
+				                 data |>  max(column: "_value") |> set(key: "_field", value: "max")])
+				  |> pivot(rowKey: ["host"], columnKey: ["_field"], valueColumn: "_value")
+				  |> group()`,
+					idb.bucket,
+					idb.formatTime(job.StartTime), idb.formatTime(idb.epochToTime(job.StartTimeUnix + int64(job.Duration) + int64(1) )),
+					idb.measurement, metric, hostsCond)
+
+			rows, err := idb.queryClient.Query(ctx, query)
+			if err != nil {
+				return nil, err
+			}
+
+			nodes := map[string]schema.MetricStatistics{}
+			for rows.Next() {
+					row := rows.Record()
+					host := row.ValueByKey("host").(string)
+					avg, min, max := row.ValueByKey("avg").(float64),
+						row.ValueByKey("min").(float64),
+						row.ValueByKey("max").(float64)
+
+					nodes[host] = schema.MetricStatistics{
+						Avg: avg,
+						Min: min,
+						Max: max,
+					}
+			}
+			stats[metric] = nodes
+	}
+
+	return stats, nil
+}
+
+func (idb *LegacyInfluxDBv2DataRepository) LoadNodeData(cluster, partition string, metrics, nodes []string, scopes []schema.MetricScope, from, to time.Time, ctx context.Context) (map[string]map[string][]*schema.JobMetric, error) {
+	// TODO : Implement to be used in Analysis- und System/Node-View
+	log.Println(fmt.Sprintf("LoadNodeData unimplemented for LegacyInfluxDBv2DataRepository, Args: cluster %s, partition %s, metrics %v, nodes %v, scopes %v", cluster, partition, metrics, nodes, scopes))
+
+	return nil, errors.New("unimplemented for LegacyInfluxDBv2DataRepository")
+}
@@ -54,15 +54,12 @@ func (idb *InfluxDBv2DataRepository) epochToTime(epoch int64) time.Time {
 func (idb *InfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string, scopes []schema.MetricScope, ctx context.Context) (schema.JobData, error) {

 	// Set Bucket & Prepare Measurement
-	if (job.Cluster == "woody" || job.Cluster == "emmy" || job.Cluster == "meggie") {
-			idb.measurement = "data"  // Temporary: Old Line Protocol for old cluster
-	} else {
-			// idb.measurement = nil  // New: Measurement = metric; Placeholder at this stage
+	if (job.Cluster == "fritz" || job.Cluster == "alex") {
 			log.Println(fmt.Sprintf("New line protocol unimplemented for influx: %s", job.Cluster))
 			return nil, errors.New("new line protocol unimplemented")
 	}
-	// DEBUG

+	// DEBUG
 	// log.Println("<< Requested Metrics >> ")
 	// log.Println(metrics)
 	// log.Println("<< Requested Scope >> ")
@@ -82,8 +79,6 @@ func (idb *InfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string,
 	// 		log.Println(influxPing)
 	// } else { log.Println("Influx Ping Error") }

-	// END DEBUG
-
 	fieldsConds := make([]string, 0, len(metrics))
 	for _, m := range metrics {
 		fieldsConds = append(fieldsConds, fmt.Sprintf(`r["_field"] == "%s"`, m))
@@ -93,8 +88,8 @@ func (idb *InfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string,
 	hostsConds := make([]string, 0, len(job.Resources))
 	for _, h := range job.Resources {
 		if h.HWThreads != nil || h.Accelerators != nil {
-			// TODO/FIXME...
-			return nil, errors.New("the InfluxDB metric data repository does not support HWThreads or Accelerators")
+			// TODO
+			return nil, errors.New("the InfluxDB metric data repository does not yet support HWThreads or Accelerators")
 		}

 		hostsConds = append(hostsConds, fmt.Sprintf(`r["host"] == "%s"`, h.Hostname))
@@ -114,14 +109,12 @@ func (idb *InfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string,

 	rows, err := idb.queryClient.Query(ctx, query)
 	if err != nil {
-		log.Println("<< THE QUERY THREW AN ERROR >>")
 		return nil, err
 	}

 	jobData := make(schema.JobData) // Empty Schema: map[<string>FIELD]map[<MetricScope>SCOPE]<*JobMetric>METRIC
-	scope 	:= schema.MetricScope("node") // use scopes argument here?
+	scope 	:= schema.MetricScope("node") // use scopes argument here

-	// Build Basic JobData Structure based on requested metrics and scope
 	for _, met := range metrics {
 		 	jobMetric, ok := jobData[met]
 		 	if !ok {
@@ -129,53 +122,43 @@ func (idb *InfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string,
 		 			jobMetric = map[schema.MetricScope]*schema.JobMetric{
 		 					scope: { // uses scope var from above!
 		 							Unit:     mc.Unit,
-		 							Scope:    mc.Scope, // was "node" hardcode, fixme?
+		 							Scope:    mc.Scope,
 		 							Timestep: mc.Timestep,
-		 							Series:   make([]schema.Series, 0, len(job.Resources)), // One series per node / resource
+		 							Series:   make([]schema.Series, 0, len(job.Resources)),
 		 							StatisticsSeries: nil, // Should be: &schema.StatsSeries{},
 		 					},
 		 			}
 		 	}
-			// Set Initialized JobMetric for field
-			jobData[met] = jobMetric

-			// log.Println(fmt.Sprintf("<< BUILT jobData >> Unit: %s >> Scope: %s >> Timestep: %d", jobData[met][scope].Unit, jobData[met][scope].Scope, jobData[met][scope].Timestep))
+			jobData[met] = jobMetric
 	}

-	// Fill Data Structure
 	field, host, hostSeries := "", "", schema.Series{}

 	for rows.Next() {
 		row := rows.Record()

-		// Build new Series for initial run, new host, or new metric (tablechange)
 		if ( host == "" || host != row.ValueByKey("host").(string) || rows.TableChanged() ) {

-				if ( host != "" ) { // Not in initial loop
-					  // log.Println(fmt.Sprintf("<< Save Series for : Field %s @  Host %s >>", field, host))
-				  	jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries) // add filled data to jobData **before resetting** for new field or new host
+				if ( host != "" ) {
+				  	jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries)
 				}
-				// (Re-)Set new Series
 				field, host = row.Field(), row.ValueByKey("host").(string)
 				hostSeries  = schema.Series{
 						Hostname:   host,
 						Statistics: nil,
 						Data:       make([]schema.Float, 0),
 				}
-				// log.Println(fmt.Sprintf("<< New Series for : Field %s @  Host %s >>", field, host))
 		}

 		val := row.Value().(float64)
 		hostSeries.Data = append(hostSeries.Data, schema.Float(val))
 	}

-	// Append last state also
-	// log.Println(fmt.Sprintf("<< Save Final Series for : Field %s @  Host %s >>", field, host))
  jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries)

 	stats, err := idb.LoadStats(job, metrics, ctx)
 	if err != nil {
-		log.Println("<< LOAD STATS THREW AN ERROR >>")
 		return nil, err
 	}

@@ -208,13 +191,7 @@ func (idb *InfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string,

 func (idb *InfluxDBv2DataRepository) LoadStats(job *schema.Job, metrics []string, ctx context.Context) (map[string]map[string]schema.MetricStatistics, error) {

-	// Set Bucket & Prepare Measurement
-	if (job.Cluster == "woody" || job.Cluster == "emmy" || job.Cluster == "meggie") {
-			idb.bucket = "ClusterCockpit/data" // Temporary: Old Line Protocol for old cluster
-			idb.measurement = "data"  // Temporary: Old Line Protocol for old cluster
-	} else {
-			// idb.bucket = job.Cluster // New: Bucket per Cluster
-			// idb.measurement = nil  // New: Measurement = metric; Placeholder at this stage
+	if (job.Cluster == "fritz" || job.Cluster == "alex") {
 			log.Println(fmt.Sprintf("New line protocol unimplemented for influx: %s", job.Cluster))
 			return nil, errors.New("new line protocol unimplemented")
 	}
@@ -224,8 +201,8 @@ func (idb *InfluxDBv2DataRepository) LoadStats(job *schema.Job, metrics []string
 	hostsConds := make([]string, 0, len(job.Resources))
 	for _, h := range job.Resources {
 			if h.HWThreads != nil || h.Accelerators != nil {
-					// TODO/FIXME...
-					return nil, errors.New("the InfluxDB metric data repository does not support HWThreads or Accelerators")
+					// TODO
+					return nil, errors.New("the InfluxDB metric data repository does not yet support HWThreads or Accelerators")
 			}

 			hostsConds = append(hostsConds, fmt.Sprintf(`r.host == "%s"`, h.Hostname))
@@ -237,7 +214,6 @@ func (idb *InfluxDBv2DataRepository) LoadStats(job *schema.Job, metrics []string
 				  data = from(bucket: "%s")
 				  |> range(start: %s, stop: %s)
 				  |> filter(fn: (r) => r._measurement == "%s" and r._field == "%s" and (%s))
-
 				  union(tables: [data |> mean(column: "_value") |> set(key: "_field", value: "avg"),
 				                 data |>  min(column: "_value") |> set(key: "_field", value: "min"),
 				                 data |>  max(column: "_value") |> set(key: "_field", value: "max")])
@@ -249,7 +225,6 @@ func (idb *InfluxDBv2DataRepository) LoadStats(job *schema.Job, metrics []string

 			rows, err := idb.queryClient.Query(ctx, query)
 			if err != nil {
-				log.Println("<< THE QUERY for STATS THREW AN ERROR >>")
 				return nil, err
 			}

@@ -51,6 +51,8 @@ func Init(jobArchivePath string, disableArchive bool) error {
 				mdr = &CCMetricStore{}
 			case "influxdb":
 				mdr = &InfluxDBv2DataRepository{}
+			case "legacyinfluxdb":
+				mdr = &LegacyInfluxDBv2DataRepository{}
 			case "test":
 				mdr = &TestMetricDataRepository{}
 			default: