2024-08-21 09:47:16 +02:00
|
|
|
package resampler
|
|
|
|
|
|
|
|
import (
|
|
|
|
"errors"
|
2024-08-25 16:12:43 +02:00
|
|
|
"fmt"
|
2024-08-21 09:47:16 +02:00
|
|
|
"math"
|
|
|
|
|
|
|
|
"github.com/ClusterCockpit/cc-metric-store/internal/util"
|
|
|
|
)
|
|
|
|
|
|
|
|
func SimpleResampler(data []util.Float, old_frequency int64, new_frequency int64) ([]util.Float, error) {
|
|
|
|
if old_frequency == 0 || new_frequency == 0 {
|
|
|
|
return nil, errors.New("either old or new frequency is set to 0")
|
|
|
|
}
|
|
|
|
|
|
|
|
if new_frequency%old_frequency != 0 {
|
|
|
|
return nil, errors.New("new sampling frequency should be multiple of the old frequency")
|
|
|
|
}
|
|
|
|
|
|
|
|
var step int = int(new_frequency / old_frequency)
|
|
|
|
var new_data_length = len(data) / step
|
|
|
|
|
|
|
|
if new_data_length == 0 || len(data) < 100 || new_data_length >= len(data) {
|
|
|
|
return data, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
new_data := make([]util.Float, new_data_length)
|
|
|
|
|
|
|
|
for i := 0; i < new_data_length; i++ {
|
|
|
|
new_data[i] = data[i*step]
|
|
|
|
}
|
|
|
|
|
|
|
|
return new_data, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Inspired by one of the algorithms from https://skemman.is/bitstream/1946/15343/3/SS_MSthesis.pdf
|
|
|
|
// Adapted from https://github.com/haoel/downsampling/blob/master/core/lttb.go
|
2024-08-26 13:18:06 +02:00
|
|
|
func LargestTriangleThreeBucket(data []util.Float, old_frequency int64, new_frequency int64) ([]util.Float, int64, error) {
|
2024-08-21 09:47:16 +02:00
|
|
|
|
|
|
|
if old_frequency == 0 || new_frequency == 0 {
|
|
|
|
return data, old_frequency, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
if new_frequency%old_frequency != 0 {
|
2024-09-17 10:49:32 +02:00
|
|
|
return nil, 0, fmt.Errorf("new sampling frequency : %d should be multiple of the old frequency : %d", new_frequency, old_frequency)
|
2024-08-21 09:47:16 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
var step int = int(new_frequency / old_frequency)
|
|
|
|
var new_data_length = len(data) / step
|
|
|
|
|
|
|
|
if new_data_length == 0 || len(data) < 100 || new_data_length >= len(data) {
|
|
|
|
return data, old_frequency, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
new_data := make([]util.Float, 0, new_data_length)
|
|
|
|
|
|
|
|
// Bucket size. Leave room for start and end data points
|
|
|
|
bucketSize := float64(len(data)-2) / float64(new_data_length-2)
|
|
|
|
|
|
|
|
new_data = append(new_data, data[0]) // Always add the first point
|
|
|
|
|
|
|
|
// We have 3 pointers represent for
|
|
|
|
// > bucketLow - the current bucket's beginning location
|
|
|
|
// > bucketMiddle - the current bucket's ending location,
|
|
|
|
// also the beginning location of next bucket
|
|
|
|
// > bucketHight - the next bucket's ending location.
|
|
|
|
bucketLow := 1
|
|
|
|
bucketMiddle := int(math.Floor(bucketSize)) + 1
|
|
|
|
|
|
|
|
var prevMaxAreaPoint int
|
|
|
|
|
|
|
|
for i := 0; i < new_data_length-2; i++ {
|
|
|
|
|
|
|
|
bucketHigh := int(math.Floor(float64(i+2)*bucketSize)) + 1
|
|
|
|
if bucketHigh >= len(data)-1 {
|
|
|
|
bucketHigh = len(data) - 2
|
|
|
|
}
|
|
|
|
|
|
|
|
// Calculate point average for next bucket (containing c)
|
|
|
|
avgPointX, avgPointY := calculateAverageDataPoint(data[bucketMiddle:bucketHigh+1], int64(bucketMiddle))
|
|
|
|
|
|
|
|
// Get the range for current bucket
|
|
|
|
currBucketStart := bucketLow
|
|
|
|
currBucketEnd := bucketMiddle
|
|
|
|
|
|
|
|
// Point a
|
|
|
|
pointX := prevMaxAreaPoint
|
|
|
|
pointY := data[prevMaxAreaPoint]
|
|
|
|
|
|
|
|
maxArea := -1.0
|
|
|
|
|
|
|
|
var maxAreaPoint int
|
2024-08-25 16:12:43 +02:00
|
|
|
flag_ := 0
|
2024-08-21 09:47:16 +02:00
|
|
|
for ; currBucketStart < currBucketEnd; currBucketStart++ {
|
|
|
|
|
|
|
|
area := calculateTriangleArea(util.Float(pointX), pointY, avgPointX, avgPointY, util.Float(currBucketStart), data[currBucketStart])
|
|
|
|
if area > maxArea {
|
|
|
|
maxArea = area
|
|
|
|
maxAreaPoint = currBucketStart
|
|
|
|
}
|
2024-08-25 16:12:43 +02:00
|
|
|
if math.IsNaN(float64(avgPointY)) {
|
|
|
|
flag_ = 1
|
|
|
|
}
|
2024-08-21 09:47:16 +02:00
|
|
|
}
|
|
|
|
|
2024-08-25 16:12:43 +02:00
|
|
|
if flag_ == 1 {
|
|
|
|
new_data = append(new_data, util.NaN) // Pick this point from the bucket
|
|
|
|
|
|
|
|
} else {
|
|
|
|
new_data = append(new_data, data[maxAreaPoint]) // Pick this point from the bucket
|
|
|
|
}
|
|
|
|
prevMaxAreaPoint = maxAreaPoint // This MaxArea point is the next's prevMAxAreaPoint
|
2024-08-21 09:47:16 +02:00
|
|
|
|
|
|
|
//move to the next window
|
|
|
|
bucketLow = bucketMiddle
|
|
|
|
bucketMiddle = bucketHigh
|
|
|
|
}
|
|
|
|
|
|
|
|
new_data = append(new_data, data[len(data)-1]) // Always add last
|
|
|
|
|
|
|
|
return new_data, new_frequency, nil
|
|
|
|
}
|