mirror of
				https://github.com/ClusterCockpit/cc-backend
				synced 2025-10-26 14:25:06 +01:00 
			
		
		
		
	Correct return of node data from higher granularity in influxdb source
This commit is contained in:
		| @@ -113,9 +113,9 @@ func (idb *LegacyInfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []s | |||||||
| 		row := rows.Record() | 		row := rows.Record() | ||||||
| 		if ( host == "" || host != row.ValueByKey("host").(string) || rows.TableChanged() ) { | 		if ( host == "" || host != row.ValueByKey("host").(string) || rows.TableChanged() ) { | ||||||
| 				if ( host != "" ) { | 				if ( host != "" ) { | ||||||
|  | 					  // Append Series before reset | ||||||
| 				  	jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries) // add to jobData before resetting | 				  	jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries) // add to jobData before resetting | ||||||
| 				} | 				} | ||||||
| 				// (Re-)Set new Series |  | ||||||
| 				field, host = row.Field(), row.ValueByKey("host").(string) | 				field, host = row.Field(), row.ValueByKey("host").(string) | ||||||
| 				hostSeries  = schema.Series{ | 				hostSeries  = schema.Series{ | ||||||
| 						Hostname:   host, | 						Hostname:   host, | ||||||
| @@ -126,7 +126,7 @@ func (idb *LegacyInfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []s | |||||||
| 		val := row.Value().(float64) | 		val := row.Value().(float64) | ||||||
| 		hostSeries.Data = append(hostSeries.Data, schema.Float(val)) | 		hostSeries.Data = append(hostSeries.Data, schema.Float(val)) | ||||||
| 	} | 	} | ||||||
|  | 	// Append last series | ||||||
|   jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries) |   jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries) | ||||||
|  |  | ||||||
| 	stats, err := idb.LoadStats(job, metrics, ctx) | 	stats, err := idb.LoadStats(job, metrics, ctx) | ||||||
|   | |||||||
| @@ -53,37 +53,17 @@ func (idb *InfluxDBv2DataRepository) epochToTime(epoch int64) time.Time { | |||||||
|  |  | ||||||
| func (idb *InfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string, scopes []schema.MetricScope, ctx context.Context) (schema.JobData, error) { | func (idb *InfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string, scopes []schema.MetricScope, ctx context.Context) (schema.JobData, error) { | ||||||
|  |  | ||||||
| 	// Set Bucket & Prepare Measurement |  | ||||||
| 	if (job.Cluster == "fritz" || job.Cluster == "alex") { |  | ||||||
| 			log.Println(fmt.Sprintf("New line protocol unimplemented for influx: %s", job.Cluster)) |  | ||||||
| 			return nil, errors.New("new line protocol unimplemented") |  | ||||||
| 	} |  | ||||||
|  |  | ||||||
| 	// DEBUG | 	// DEBUG | ||||||
| 	// log.Println("<< Requested Metrics >> ") | 	// log.Println("<< Requested Metrics >> ") | ||||||
| 	// log.Println(metrics) | 	// log.Println(metrics) | ||||||
|   // log.Println("<< Requested Scope >> ") |   // log.Println("<< Requested Scope >> ") | ||||||
| 	// log.Println(scopes) | 	// log.Println(scopes) | ||||||
|  |  | ||||||
| 	// influxHealth, healthErr := idb.client.Health(ctx) | 	measurementsConds := make([]string, 0, len(metrics)) | ||||||
| 	// influxReady, rdyErr := idb.client.Ready(ctx) |  | ||||||
| 	// influxPing, pingErr := idb.client.Ping(ctx) |  | ||||||
| 	// |  | ||||||
| 	// log.Println("<< Influx Health Status >> ") |  | ||||||
| 	// if healthErr == nil {	log.Println(fmt.Sprintf("{Commit:%s, Message:%s, Name:%s, Status:%s, Version:%s}", *influxHealth.Commit, *influxHealth.Message, influxHealth.Name, influxHealth.Status, *influxHealth.Version)) |  | ||||||
| 	// } else { log.Println("Influx Health Error") } |  | ||||||
| 	// if rdyErr == nil { log.Println(fmt.Sprintf("{Started:%s, Status:%s, Up:%s}", *influxReady.Started, *influxReady.Status, *influxReady.Up)) |  | ||||||
| 	// } else { log.Println("Influx Ready Error") } |  | ||||||
| 	// if pingErr == nil { |  | ||||||
| 	// 		log.Println("<< PING >>") |  | ||||||
| 	// 		log.Println(influxPing) |  | ||||||
| 	// } else { log.Println("Influx Ping Error") } |  | ||||||
|  |  | ||||||
| 	fieldsConds := make([]string, 0, len(metrics)) |  | ||||||
| 	for _, m := range metrics { | 	for _, m := range metrics { | ||||||
| 		fieldsConds = append(fieldsConds, fmt.Sprintf(`r["_field"] == "%s"`, m)) | 		measurementsConds = append(measurementsConds, fmt.Sprintf(`r["_measurement"] == "%s"`, m)) | ||||||
| 	} | 	} | ||||||
| 	fieldsCond := strings.Join(fieldsConds, " or ") | 	measurementsCond := strings.Join(measurementsConds, " or ") | ||||||
|  |  | ||||||
| 	hostsConds := make([]string, 0, len(job.Resources)) | 	hostsConds := make([]string, 0, len(job.Resources)) | ||||||
| 	for _, h := range job.Resources { | 	for _, h := range job.Resources { | ||||||
| @@ -92,76 +72,89 @@ func (idb *InfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string, | |||||||
| 			return nil, errors.New("the InfluxDB metric data repository does not yet support HWThreads or Accelerators") | 			return nil, errors.New("the InfluxDB metric data repository does not yet support HWThreads or Accelerators") | ||||||
| 		} | 		} | ||||||
|  |  | ||||||
| 		hostsConds = append(hostsConds, fmt.Sprintf(`r["host"] == "%s"`, h.Hostname)) | 		hostsConds = append(hostsConds, fmt.Sprintf(`r["hostname"] == "%s"`, h.Hostname)) | ||||||
| 	} | 	} | ||||||
| 	hostsCond := strings.Join(hostsConds, " or ") | 	hostsCond := strings.Join(hostsConds, " or ") | ||||||
|  |  | ||||||
| 	query := fmt.Sprintf(` | 	jobData := make(schema.JobData) // Empty Schema: map[<string>FIELD]map[<MetricScope>SCOPE]<*JobMetric>METRIC | ||||||
|  | 	// Requested Scopes | ||||||
|  | 	for _, scope := range scopes { | ||||||
|  |  | ||||||
|  | 			// Query Influxdb | ||||||
|  | 			query := "" | ||||||
|  |  | ||||||
|  | 			switch scope { | ||||||
|  | 					case "node": | ||||||
|  | 							// Get Finest Granularity, Group By Measurement and Hostname (== Metric / Node), Calculate Mean, Set NULL to 0.0 | ||||||
|  | 							query = fmt.Sprintf(` | ||||||
| 								from(bucket: "%s") | 								from(bucket: "%s") | ||||||
| 								|> range(start: %s, stop: %s) | 								|> range(start: %s, stop: %s) | ||||||
| 	  |> filter(fn: (r) => r["_measurement"] == "%s" ) |  | ||||||
| 								|> filter(fn: (r) => %s ) | 								|> filter(fn: (r) => %s ) | ||||||
| 								|> filter(fn: (r) => %s ) | 								|> filter(fn: (r) => %s ) | ||||||
| 	  |> drop(columns: ["_start", "_stop", "_measurement"])`, | 								|> drop(columns: ["_start", "_stop"]) | ||||||
|  | 								|> group(columns: ["hostname", "_measurement"]) | ||||||
|  | 		            |> aggregateWindow(every: 60s, fn: mean) | ||||||
|  | 								|> map(fn: (r) => (if exists r._value then {r with _value: r._value} else {r with _value: 0.0}))`, | ||||||
| 								idb.bucket, | 								idb.bucket, | ||||||
| 								idb.formatTime(job.StartTime), idb.formatTime(idb.epochToTime(job.StartTimeUnix + int64(job.Duration) + int64(1) )), | 								idb.formatTime(job.StartTime), idb.formatTime(idb.epochToTime(job.StartTimeUnix + int64(job.Duration) + int64(1) )), | ||||||
| 	 	idb.measurement, hostsCond, fieldsCond) | 								measurementsCond, hostsCond) | ||||||
|  | 					default: | ||||||
|  | 							return nil, errors.New("the InfluxDB metric data repository does not yet support other scopes than 'node'") | ||||||
|  | 			} | ||||||
|  |  | ||||||
| 			rows, err := idb.queryClient.Query(ctx, query) | 			rows, err := idb.queryClient.Query(ctx, query) | ||||||
| 			if err != nil { | 			if err != nil { | ||||||
| 				return nil, err | 				return nil, err | ||||||
| 			} | 			} | ||||||
|  |  | ||||||
| 	jobData := make(schema.JobData) // Empty Schema: map[<string>FIELD]map[<MetricScope>SCOPE]<*JobMetric>METRIC | 			// Init Metrics | ||||||
| 	scope 	:= schema.MetricScope("node") // use scopes argument here | 			for _, metric := range metrics { | ||||||
|  | 					jobMetric, ok := jobData[metric] | ||||||
| 	for _, met := range metrics { |  | ||||||
| 		 	jobMetric, ok := jobData[met] |  | ||||||
| 					if !ok { | 					if !ok { | ||||||
| 		 			mc 		:= config.GetMetricConfig(job.Cluster, met) | 							mc 		:= config.GetMetricConfig(job.Cluster, metric) | ||||||
| 							jobMetric = map[schema.MetricScope]*schema.JobMetric{ | 							jobMetric = map[schema.MetricScope]*schema.JobMetric{ | ||||||
| 									scope: { // uses scope var from above! | 									scope: { // uses scope var from above! | ||||||
| 											Unit:     mc.Unit, | 											Unit:     mc.Unit, | ||||||
| 		 							Scope:    mc.Scope, | 											Scope:    scope, | ||||||
| 											Timestep: mc.Timestep, | 											Timestep: mc.Timestep, | ||||||
| 											Series:   make([]schema.Series, 0, len(job.Resources)), | 											Series:   make([]schema.Series, 0, len(job.Resources)), | ||||||
| 											StatisticsSeries: nil, // Should be: &schema.StatsSeries{}, | 											StatisticsSeries: nil, // Should be: &schema.StatsSeries{}, | ||||||
| 									}, | 									}, | ||||||
| 							} | 							} | ||||||
| 					} | 					} | ||||||
|  | 					jobData[metric] = jobMetric | ||||||
| 			jobData[met] = jobMetric |  | ||||||
| 			} | 			} | ||||||
|  |  | ||||||
|  | 			// Process Result: Time-Data | ||||||
| 			field, host, hostSeries := "", "", schema.Series{} | 			field, host, hostSeries := "", "", schema.Series{} | ||||||
|  |  | ||||||
| 			for rows.Next() { | 			for rows.Next() { | ||||||
| 				  row := rows.Record() | 				  row := rows.Record() | ||||||
|  | 					if ( host == "" || host != row.ValueByKey("hostname").(string) || rows.TableChanged() ) { | ||||||
| 		if ( host == "" || host != row.ValueByKey("host").(string) || rows.TableChanged() ) { |  | ||||||
|  |  | ||||||
| 					 		if ( host != "" ) { | 					 		if ( host != "" ) { | ||||||
|  | 									// Append Series before reset | ||||||
| 					 		  	jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries) | 					 		  	jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries) | ||||||
| 					 		} | 					 		} | ||||||
| 				field, host = row.Field(), row.ValueByKey("host").(string) | 					 		field, host = row.Measurement(), row.ValueByKey("hostname").(string) | ||||||
| 					 		hostSeries  = schema.Series{ | 					 		hostSeries  = schema.Series{ | ||||||
| 					 				Hostname:   host, | 					 				Hostname:   host, | ||||||
| 					 				Statistics: nil, | 					 				Statistics: nil, | ||||||
| 					 				Data:       make([]schema.Float, 0), | 					 				Data:       make([]schema.Float, 0), | ||||||
| 					 		} | 					 		} | ||||||
| 					} | 					} | ||||||
|  |  | ||||||
| 					val := row.Value().(float64) | 					val := row.Value().(float64) | ||||||
| 					hostSeries.Data = append(hostSeries.Data, schema.Float(val)) | 					hostSeries.Data = append(hostSeries.Data, schema.Float(val)) | ||||||
| 			} | 			} | ||||||
|  | 			// Append last Series | ||||||
| 		  jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries) | 		  jobData[field][scope].Series = append(jobData[field][scope].Series, hostSeries) | ||||||
|  | 	} | ||||||
|  |  | ||||||
|  | 	// Get Stats | ||||||
| 	stats, err := idb.LoadStats(job, metrics, ctx) | 	stats, err := idb.LoadStats(job, metrics, ctx) | ||||||
| 	if err != nil { | 	if err != nil { | ||||||
| 		return nil, err | 		return nil, err | ||||||
| 	} | 	} | ||||||
|  |  | ||||||
|  | 	for _, scope := range scopes { | ||||||
| 		for metric, nodes := range stats { | 		for metric, nodes := range stats { | ||||||
| 			// log.Println(fmt.Sprintf("<< Add Stats for : Field %s >>", metric)) | 			// log.Println(fmt.Sprintf("<< Add Stats for : Field %s >>", metric)) | ||||||
| 			for node, stats := range nodes { | 			for node, stats := range nodes { | ||||||
| @@ -176,26 +169,24 @@ func (idb *InfluxDBv2DataRepository) LoadData(job *schema.Job, metrics []string, | |||||||
| 				} | 				} | ||||||
| 			} | 			} | ||||||
| 		} | 		} | ||||||
|  | 	} | ||||||
|  |  | ||||||
| 	// DEBUG: | 	// DEBUG: | ||||||
| 	for _, met := range metrics { | 	// for _, scope := range scopes { | ||||||
| 	   for _, series := range jobData[met][scope].Series { | 	// 		for _, met := range metrics { | ||||||
| 	   log.Println(fmt.Sprintf("<< Result: %d data points for metric %s on %s, Stats: Min %.2f, Max %.2f, Avg %.2f >>", | 	// 		   for _, series := range jobData[met][scope].Series { | ||||||
| 			 	len(series.Data), met, series.Hostname, | 	// 		   log.Println(fmt.Sprintf("<< Result: %d data points for metric %s on %s with scope %s, Stats: Min %.2f, Max %.2f, Avg %.2f >>", | ||||||
| 				series.Statistics.Min, series.Statistics.Max, series.Statistics.Avg)) | 	// 				 	len(series.Data), met, series.Hostname, scope, | ||||||
|      } | 	// 					series.Statistics.Min, series.Statistics.Max, series.Statistics.Avg)) | ||||||
| 	} | 	// 		   } | ||||||
|  | 	// 		} | ||||||
|  | 	// } | ||||||
|  |  | ||||||
| 	return jobData, nil | 	return jobData, nil | ||||||
| } | } | ||||||
|  |  | ||||||
| func (idb *InfluxDBv2DataRepository) LoadStats(job *schema.Job, metrics []string, ctx context.Context) (map[string]map[string]schema.MetricStatistics, error) { | func (idb *InfluxDBv2DataRepository) LoadStats(job *schema.Job, metrics []string, ctx context.Context) (map[string]map[string]schema.MetricStatistics, error) { | ||||||
|  |  | ||||||
| 	if (job.Cluster == "fritz" || job.Cluster == "alex") { |  | ||||||
| 			log.Println(fmt.Sprintf("New line protocol unimplemented for influx: %s", job.Cluster)) |  | ||||||
| 			return nil, errors.New("new line protocol unimplemented") |  | ||||||
| 	} |  | ||||||
|  |  | ||||||
| 	stats := map[string]map[string]schema.MetricStatistics{} | 	stats := map[string]map[string]schema.MetricStatistics{} | ||||||
|  |  | ||||||
| 	hostsConds := make([]string, 0, len(job.Resources)) | 	hostsConds := make([]string, 0, len(job.Resources)) | ||||||
| @@ -204,8 +195,7 @@ func (idb *InfluxDBv2DataRepository) LoadStats(job *schema.Job, metrics []string | |||||||
| 				// TODO | 				// TODO | ||||||
| 				return nil, errors.New("the InfluxDB metric data repository does not yet support HWThreads or Accelerators") | 				return nil, errors.New("the InfluxDB metric data repository does not yet support HWThreads or Accelerators") | ||||||
| 			} | 			} | ||||||
|  | 			hostsConds = append(hostsConds, fmt.Sprintf(`r["hostname"] == "%s"`, h.Hostname)) | ||||||
| 			hostsConds = append(hostsConds, fmt.Sprintf(`r.host == "%s"`, h.Hostname)) |  | ||||||
| 	} | 	} | ||||||
| 	hostsCond := strings.Join(hostsConds, " or ") | 	hostsCond := strings.Join(hostsConds, " or ") | ||||||
|  |  | ||||||
| @@ -213,15 +203,15 @@ func (idb *InfluxDBv2DataRepository) LoadStats(job *schema.Job, metrics []string | |||||||
| 			query := fmt.Sprintf(` | 			query := fmt.Sprintf(` | ||||||
| 				  data = from(bucket: "%s") | 				  data = from(bucket: "%s") | ||||||
| 				  |> range(start: %s, stop: %s) | 				  |> range(start: %s, stop: %s) | ||||||
| 				  |> filter(fn: (r) => r._measurement == "%s" and r._field == "%s" and (%s)) | 				  |> filter(fn: (r) => r._measurement == "%s" and r._field == "value" and (%s)) | ||||||
| 				  union(tables: [data |> mean(column: "_value") |> set(key: "_field", value: "avg"), | 				  union(tables: [data |> mean(column: "_value") |> set(key: "_field", value: "avg"), | ||||||
| 				                 data |>  min(column: "_value") |> set(key: "_field", value: "min"), | 				                 data |>  min(column: "_value") |> set(key: "_field", value: "min"), | ||||||
| 				                 data |>  max(column: "_value") |> set(key: "_field", value: "max")]) | 				                 data |>  max(column: "_value") |> set(key: "_field", value: "max")]) | ||||||
| 				  |> pivot(rowKey: ["host"], columnKey: ["_field"], valueColumn: "_value") | 				  |> pivot(rowKey: ["hostname"], columnKey: ["_field"], valueColumn: "_value") | ||||||
| 				  |> group()`, | 				  |> group()`, | ||||||
| 					idb.bucket, | 					idb.bucket, | ||||||
| 					idb.formatTime(job.StartTime), idb.formatTime(idb.epochToTime(job.StartTimeUnix + int64(job.Duration) + int64(1) )), | 					idb.formatTime(job.StartTime), idb.formatTime(idb.epochToTime(job.StartTimeUnix + int64(job.Duration) + int64(1) )), | ||||||
| 					idb.measurement, metric, hostsCond) | 					metric, hostsCond) | ||||||
|  |  | ||||||
| 			rows, err := idb.queryClient.Query(ctx, query) | 			rows, err := idb.queryClient.Query(ctx, query) | ||||||
| 			if err != nil { | 			if err != nil { | ||||||
| @@ -231,7 +221,7 @@ func (idb *InfluxDBv2DataRepository) LoadStats(job *schema.Job, metrics []string | |||||||
| 			nodes := map[string]schema.MetricStatistics{} | 			nodes := map[string]schema.MetricStatistics{} | ||||||
| 			for rows.Next() { | 			for rows.Next() { | ||||||
| 					row := rows.Record() | 					row := rows.Record() | ||||||
| 					host := row.ValueByKey("host").(string) | 					host := row.ValueByKey("hostname").(string) | ||||||
| 					avg, min, max := row.ValueByKey("avg").(float64), | 					avg, min, max := row.ValueByKey("avg").(float64), | ||||||
| 						row.ValueByKey("min").(float64), | 						row.ValueByKey("min").(float64), | ||||||
| 						row.ValueByKey("max").(float64) | 						row.ValueByKey("max").(float64) | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user