Commit 4a19620

Merge pull request #169 from deploymenttheory/dev
Refactor concurrency package to include new metrics and adjust concur…
2 parents 8fb326d + 79c9451 commit 4a19620

10 files changed: +389 -194 lines changed

concurrency/const.go

Lines changed: 19 additions & 0 deletions
@@ -4,6 +4,16 @@ package concurrency
 import "time"
 
 const (
+	// MaxConcurrency defines the upper limit of concurrent requests the system can handle.
+	MaxConcurrency = 10
+
+	// MinConcurrency defines the lower limit of concurrent requests the system will maintain.
+	MinConcurrency = 1
+
+	// EvaluationInterval specifies the frequency at which the system evaluates its performance metrics
+	// to decide if concurrency adjustments are needed.
+	EvaluationInterval = 1 * time.Minute
+
 	// MaxAcceptableTTFB represents the maximum acceptable Time to First Byte (TTFB) in milliseconds.
 	// TTFB is the time taken for the server to start sending the first byte of data in response to a request.
 	// Adjustments in concurrency will be made if the TTFB exceeds this threshold.
@@ -22,4 +32,13 @@ const (
 	// Error rate is calculated as (TotalRateLimitErrors + 5xxErrors) / TotalRequests.
 	// Adjustments in concurrency will be made if the error rate exceeds this threshold. A threshold of 0.1 (or 10%) is common.
 	ErrorRateThreshold = 0.1
+
+	// Weight assigned to each metric feedback type
+	WeightRateLimit     = 0.5 // Weight for rate limit feedback, less if not all APIs provide this data
+	WeightResponseCodes = 1.0 // Weight for server response codes
+	WeightResponseTime  = 1.5 // Higher weight for response time variability
+
+	// Thresholds for semaphore scaling actions
+	ThresholdScaleDown = -1.5 // Threshold to decide scaling down
+	ThresholdScaleUp   = 1.5  // Threshold to decide scaling up
 )
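The weight and threshold constants above feed the weighted scoring that concurrency/metrics.go applies later in this diff. A minimal, self-contained sketch of that arithmetic, with hypothetical feedback values of -1, -1 and +1 from the three monitors (the constant values are copied here only so the example compiles on its own):

package main

import "fmt"

const (
	WeightRateLimit     = 0.5
	WeightResponseCodes = 1.0
	WeightResponseTime  = 1.5
	ThresholdScaleDown  = -1.5
	ThresholdScaleUp    = 1.5
)

func main() {
	// Hypothetical monitor outputs: each is -1 (scale down), 0 (neutral), or +1 (scale up).
	rateLimitFeedback, responseCodeFeedback, responseTimeFeedback := -1, -1, 1

	// Weighted score: (-1)(0.5) + (-1)(1.0) + (1)(1.5) = 0.0
	weighted := float64(rateLimitFeedback)*WeightRateLimit +
		float64(responseCodeFeedback)*WeightResponseCodes +
		float64(responseTimeFeedback)*WeightResponseTime

	switch {
	case weighted <= ThresholdScaleDown:
		fmt.Println("scale down, score =", weighted)
	case weighted >= ThresholdScaleUp:
		fmt.Println("scale up, score =", weighted)
	default:
		fmt.Println("hold, score =", weighted) // 0.0 lies inside (-1.5, 1.5), so concurrency is left unchanged
	}
}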

concurrency/handler.go

Lines changed: 31 additions & 18 deletions
@@ -6,23 +6,26 @@ import (
 	"time"
 
 	"github.com/deploymenttheory/go-api-http-client/logger"
-)
-
-// Constants and Data Structures:
-const (
-	MaxConcurrency     = 10              // Maximum allowed concurrent requests
-	MinConcurrency     = 1               // Minimum allowed concurrent requests
-	EvaluationInterval = 1 * time.Minute // Time interval for evaluating metrics and adjusting concurrency
+	"golang.org/x/sync/semaphore"
 )
 
 // ConcurrencyHandler controls the number of concurrent HTTP requests.
+// type ConcurrencyHandler struct {
+// 	sem                      chan struct{}
+// 	logger                   logger.Logger
+// 	AcquisitionTimes         []time.Duration
+// 	lock                     sync.Mutex
+// 	lastTokenAcquisitionTime time.Time
+// 	Metrics                  *ConcurrencyMetrics
+// }
+
 type ConcurrencyHandler struct {
-	sem                      chan struct{}
-	logger                   logger.Logger
-	AcquisitionTimes         []time.Duration
-	lock                     sync.Mutex
-	lastTokenAcquisitionTime time.Time
-	Metrics                  *ConcurrencyMetrics
+	sem             *semaphore.Weighted
+	lock            sync.RWMutex
+	logger          logger.Logger
+	Metrics         *ConcurrencyMetrics
+	currentCapacity int64
+	activePermits   int64
 }
 
 // ConcurrencyMetrics captures various metrics related to managing concurrency for the client's interactions with the API.
@@ -60,12 +63,22 @@ type ConcurrencyMetrics struct {
 // concurrency limit, logger, and concurrency metrics. The ConcurrencyHandler ensures
 // no more than a certain number of concurrent requests are made.
 // It uses a semaphore to control concurrency.
-func NewConcurrencyHandler(limit int, logger logger.Logger, metrics *ConcurrencyMetrics) *ConcurrencyHandler {
+//
+// func NewConcurrencyHandler(limit int, logger logger.Logger, metrics *ConcurrencyMetrics) *ConcurrencyHandler {
+// 	return &ConcurrencyHandler{
+// 		sem:              make(chan struct{}, limit),
+// 		logger:           logger,
+// 		AcquisitionTimes: []time.Duration{},
+// 		Metrics:          metrics,
+// 	}
+// }
+func NewConcurrencyHandler(limit int64, logger logger.Logger, metrics *ConcurrencyMetrics) *ConcurrencyHandler {
 	return &ConcurrencyHandler{
-		sem:              make(chan struct{}, limit),
-		logger:           logger,
-		AcquisitionTimes: []time.Duration{},
-		Metrics:          metrics,
+		sem:             semaphore.NewWeighted(limit),
+		logger:          logger,
+		Metrics:         metrics,
+		currentCapacity: limit,
+		activePermits:   0,
 	}
 }
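The handler now wraps golang.org/x/sync/semaphore instead of a buffered channel. The acquire/release paths are not part of this commit, so the following is only a rough sketch of how a weighted semaphore is typically driven; the doRequest helper and its wiring are hypothetical, not the package's API:

package main

import (
	"context"
	"fmt"
	"net/http"

	"golang.org/x/sync/semaphore"
)

// doRequest is a hypothetical helper showing the usual acquire/release pattern
// around a weighted semaphore; it is not part of the commit above.
func doRequest(ctx context.Context, sem *semaphore.Weighted, url string) error {
	// Block until a permit is available (or the context is cancelled).
	if err := sem.Acquire(ctx, 1); err != nil {
		return err
	}
	defer sem.Release(1) // Always return the permit.

	req, err := http.NewRequestWithContext(ctx, http.MethodGet, url, nil)
	if err != nil {
		return err
	}
	resp, err := http.DefaultClient.Do(req)
	if err != nil {
		return err
	}
	defer resp.Body.Close()

	fmt.Println(url, resp.StatusCode)
	return nil
}

func main() {
	// 10 mirrors the MaxConcurrency constant added in concurrency/const.go.
	sem := semaphore.NewWeighted(10)
	_ = doRequest(context.Background(), sem, "https://example.com")
}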

concurrency/metrics.go

Lines changed: 124 additions & 87 deletions
@@ -27,49 +27,57 @@ import (
 //
 // It logs the specific reason for scaling decisions, helping in traceability and fine-tuning system performance.
 func (ch *ConcurrencyHandler) EvaluateAndAdjustConcurrency(resp *http.Response, responseTime time.Duration) {
-	// Call monitoring functions
 	rateLimitFeedback := ch.MonitorRateLimitHeaders(resp)
 	responseCodeFeedback := ch.MonitorServerResponseCodes(resp)
 	responseTimeFeedback := ch.MonitorResponseTimeVariability(responseTime)
 
-	// Log the feedback from each monitoring function for debugging
-	ch.logger.Debug("Concurrency Adjustment Feedback",
-		zap.Int("RateLimitFeedback", rateLimitFeedback),
-		zap.Int("ResponseCodeFeedback", responseCodeFeedback),
-		zap.Int("ResponseTimeFeedback", responseTimeFeedback))
-
-	// Determine overall action based on feedback
-	suggestions := []int{rateLimitFeedback, responseCodeFeedback, responseTimeFeedback}
-	scaleDownCount := 0
-	scaleUpCount := 0
-
-	for _, suggestion := range suggestions {
-		switch suggestion {
-		case -1:
-			scaleDownCount++
-		case 1:
-			scaleUpCount++
-		}
-	}
+	// Compute the weighted feedback
+	weightedFeedback := float64(rateLimitFeedback)*WeightRateLimit +
+		float64(responseCodeFeedback)*WeightResponseCodes +
+		float64(responseTimeFeedback)*WeightResponseTime
 
-	// Log the counts for scale down and up suggestions
-	ch.logger.Info("Scaling Decision Counts",
-		zap.Int("ScaleDownCount", scaleDownCount),
-		zap.Int("ScaleUpCount", scaleUpCount))
+	// Log the feedback and weighted result for debugging
+	ch.logger.Debug("Concurrency Adjustment Feedback",
+		zap.Float64("WeightedFeedback", weightedFeedback))
 
-	// Decide on scaling action
-	if scaleDownCount > scaleUpCount {
-		ch.logger.Info("Scaling down the concurrency", zap.String("Reason", "More signals suggested to decrease concurrency"))
+	// Apply thresholds to determine scaling action
+	if weightedFeedback <= ThresholdScaleDown {
+		ch.logger.Info("Scaling down the concurrency", zap.Float64("WeightedFeedback", weightedFeedback))
 		ch.ScaleDown()
-	} else if scaleUpCount > scaleDownCount {
-		ch.logger.Info("Scaling up the concurrency", zap.String("Reason", "More signals suggested to increase concurrency"))
+	} else if weightedFeedback >= ThresholdScaleUp {
+		ch.logger.Info("Scaling up the concurrency", zap.Float64("WeightedFeedback", weightedFeedback))
		ch.ScaleUp()
 	} else {
-		ch.logger.Info("No change in concurrency", zap.String("Reason", "Equal signals for both scaling up and down"))
+		ch.logger.Info("Maintaining current concurrency level", zap.Float64("WeightedFeedback", weightedFeedback))
 	}
 }
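EvaluateAndAdjustConcurrency expects the caller to hand it each completed *http.Response together with the measured request duration. That wiring is not part of this diff, so the call site below is only an illustrative assumption; adjust is a stand-in marking where ch.EvaluateAndAdjustConcurrency would be invoked:

package main

import (
	"fmt"
	"net/http"
	"time"
)

// adjust stands in for ch.EvaluateAndAdjustConcurrency: it receives the same
// (response, elapsed) pair after every request.
func adjust(resp *http.Response, elapsed time.Duration) {
	fmt.Printf("status=%d elapsed=%s\n", resp.StatusCode, elapsed)
}

func main() {
	start := time.Now()
	resp, err := http.Get("https://example.com")
	if err != nil {
		fmt.Println("request failed:", err)
		return
	}
	defer resp.Body.Close()

	// Feed the response and its measured duration into the evaluator.
	adjust(resp, time.Since(start))
}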

 // MonitorRateLimitHeaders monitors the rate limit headers in the response and suggests a concurrency adjustment.
+// func (ch *ConcurrencyHandler) MonitorRateLimitHeaders(resp *http.Response) int {
+// 	remaining := resp.Header.Get("X-RateLimit-Remaining")
+// 	retryAfter := resp.Header.Get("Retry-After")
+// 	suggestion := 0
+
+// 	if remaining != "" {
+// 		remainingValue, err := strconv.Atoi(remaining)
+// 		if err == nil && remainingValue < 10 {
+// 			// Suggest decrease concurrency if X-RateLimit-Remaining is below the threshold
+// 			suggestion = -1
+// 		}
+// 	}
+
+// 	if retryAfter != "" {
+// 		// Suggest decrease concurrency if Retry-After is specified
+// 		suggestion = -1
+// 	} else {
+// 		// Suggest increase concurrency if currently below maximum limit and no other decrease suggestion has been made
+// 		if len(ch.sem) < MaxConcurrency && suggestion == 0 {
+// 			suggestion = 1
+// 		}
+// 	}
+
+// 	return suggestion
+// }
 func (ch *ConcurrencyHandler) MonitorRateLimitHeaders(resp *http.Response) int {
 	remaining := resp.Header.Get("X-RateLimit-Remaining")
 	retryAfter := resp.Header.Get("Retry-After")
@@ -78,99 +86,128 @@ func (ch *ConcurrencyHandler) MonitorRateLimitHeaders(resp *http.Response) int {
 	if remaining != "" {
 		remainingValue, err := strconv.Atoi(remaining)
 		if err == nil && remainingValue < 10 {
-			// Suggest decrease concurrency if X-RateLimit-Remaining is below the threshold
 			suggestion = -1
 		}
 	}
 
 	if retryAfter != "" {
-		// Suggest decrease concurrency if Retry-After is specified
 		suggestion = -1
-	} else {
-		// Suggest increase concurrency if currently below maximum limit and no other decrease suggestion has been made
-		if len(ch.sem) < MaxConcurrency && suggestion == 0 {
-			suggestion = 1
-		}
 	}
 
 	return suggestion
 }
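A small standalone sketch of how the simplified header logic behaves, using hand-built headers; the suggestFromHeaders helper mirrors the function above but is illustrative only, not part of the package:

package main

import (
	"fmt"
	"net/http"
	"strconv"
)

// suggestFromHeaders mirrors the simplified logic above: -1 when the API signals
// pressure via Retry-After or a low X-RateLimit-Remaining, otherwise 0. The
// "scale up" branch tied to channel capacity was removed in this commit.
func suggestFromHeaders(h http.Header) int {
	suggestion := 0
	if remaining := h.Get("X-RateLimit-Remaining"); remaining != "" {
		if v, err := strconv.Atoi(remaining); err == nil && v < 10 {
			suggestion = -1
		}
	}
	if h.Get("Retry-After") != "" {
		suggestion = -1
	}
	return suggestion
}

// headerWith builds a header via Set so the key is canonicalized the same way
// a real response header would be.
func headerWith(key, value string) http.Header {
	h := http.Header{}
	h.Set(key, value)
	return h
}

func main() {
	fmt.Println(suggestFromHeaders(headerWith("X-RateLimit-Remaining", "250"))) // 0  -> plenty of quota left
	fmt.Println(suggestFromHeaders(headerWith("X-RateLimit-Remaining", "3")))   // -1 -> fewer than 10 requests remaining
	fmt.Println(suggestFromHeaders(headerWith("Retry-After", "30")))            // -1 -> server asked the client to back off
}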

 // MonitorServerResponseCodes monitors the response status codes and suggests a concurrency adjustment.
+// func (ch *ConcurrencyHandler) MonitorServerResponseCodes(resp *http.Response) int {
+// 	statusCode := resp.StatusCode
+
+// 	// Lock the metrics to ensure thread safety
+// 	ch.Metrics.Lock.Lock()
+// 	defer ch.Metrics.Lock.Unlock()
+
+// 	// Update the appropriate error count based on the response status code
+// 	switch {
+// 	case statusCode >= 500 && statusCode < 600:
+// 		ch.Metrics.TotalRateLimitErrors++
+// 	case statusCode >= 400 && statusCode < 500:
+// 		// Assuming 4xx errors as client errors
+// 		ch.Metrics.TotalRetries++
+// 	}
+
+// 	// Calculate error rate
+// 	totalRequests := float64(ch.Metrics.TotalRequests)
+// 	totalErrors := float64(ch.Metrics.TotalRateLimitErrors + ch.Metrics.TotalRetries)
+// 	errorRate := totalErrors / totalRequests
+
+// 	// Set the new error rate in the metrics
+// 	ch.Metrics.ResponseCodeMetrics.ErrorRate = errorRate
+
+// 	// Determine action based on the error rate
+// 	if errorRate > ErrorRateThreshold {
+// 		// Suggest decrease concurrency
+// 		return -1
+// 	} else if errorRate <= ErrorRateThreshold && len(ch.sem) < MaxConcurrency {
+// 		// Suggest increase concurrency if there is capacity
+// 		return 1
+// 	}
+// 	return 0
+// }
 func (ch *ConcurrencyHandler) MonitorServerResponseCodes(resp *http.Response) int {
 	statusCode := resp.StatusCode
-
-	// Lock the metrics to ensure thread safety
 	ch.Metrics.Lock.Lock()
 	defer ch.Metrics.Lock.Unlock()
 
-	// Update the appropriate error count based on the response status code
-	switch {
-	case statusCode >= 500 && statusCode < 600:
+	if statusCode >= 500 {
 		ch.Metrics.TotalRateLimitErrors++
-	case statusCode >= 400 && statusCode < 500:
-		// Assuming 4xx errors as client errors
+		return -1
+	} else if statusCode >= 400 {
 		ch.Metrics.TotalRetries++
-	}
-
-	// Calculate error rate
-	totalRequests := float64(ch.Metrics.TotalRequests)
-	totalErrors := float64(ch.Metrics.TotalRateLimitErrors + ch.Metrics.TotalRetries)
-	errorRate := totalErrors / totalRequests
-
-	// Set the new error rate in the metrics
-	ch.Metrics.ResponseCodeMetrics.ErrorRate = errorRate
-
-	// Determine action based on the error rate
-	if errorRate > ErrorRateThreshold {
-		// Suggest decrease concurrency
 		return -1
-	} else if errorRate <= ErrorRateThreshold && len(ch.sem) < MaxConcurrency {
-		// Suggest increase concurrency if there is capacity
-		return 1
 	}
+
 	return 0
 }
153+
// ch.Metrics.Lock.Lock()
154+
// defer ch.Metrics.Lock.Unlock()
155+
156+
// // Update ResponseTimeVariability metrics
157+
// ch.Metrics.ResponseTimeVariability.Lock.Lock()
158+
// defer ch.Metrics.ResponseTimeVariability.Lock.Unlock()
159+
// ch.Metrics.ResponseTimeVariability.Total += responseTime
160+
// ch.Metrics.ResponseTimeVariability.Count++
161+
162+
// // Calculate average response time
163+
// ch.Metrics.ResponseTimeVariability.Average = ch.Metrics.ResponseTimeVariability.Total / time.Duration(ch.Metrics.ResponseTimeVariability.Count)
164+
165+
// // Calculate variance of response times
166+
// ch.Metrics.ResponseTimeVariability.Variance = ch.calculateVariance(ch.Metrics.ResponseTimeVariability.Average, responseTime)
167+
168+
// // Calculate standard deviation of response times
169+
// stdDev := math.Sqrt(ch.Metrics.ResponseTimeVariability.Variance)
170+
171+
// // Determine action based on standard deviation
172+
// if stdDev > ch.Metrics.ResponseTimeVariability.StdDevThreshold {
173+
// // Suggest decrease concurrency
174+
// return -1
175+
// } else if stdDev <= ch.Metrics.ResponseTimeVariability.StdDevThreshold && len(ch.sem) < MaxConcurrency {
176+
// // Suggest increase concurrency if there is capacity
177+
// return 1
178+
// }
179+
// return 0
180+
// }
136181
func (ch *ConcurrencyHandler) MonitorResponseTimeVariability(responseTime time.Duration) int {
137182
ch.Metrics.Lock.Lock()
138183
defer ch.Metrics.Lock.Unlock()
139184

140-
// Update ResponseTimeVariability metrics
141-
ch.Metrics.ResponseTimeVariability.Lock.Lock()
142-
defer ch.Metrics.ResponseTimeVariability.Lock.Unlock()
185+
// Update total response time and count
143186
ch.Metrics.ResponseTimeVariability.Total += responseTime
144187
ch.Metrics.ResponseTimeVariability.Count++
145188

146-
// Calculate average response time
147-
ch.Metrics.ResponseTimeVariability.Average = ch.Metrics.ResponseTimeVariability.Total / time.Duration(ch.Metrics.ResponseTimeVariability.Count)
189+
// Calculate the average response time
190+
averageResponseTime := ch.Metrics.ResponseTimeVariability.Total / time.Duration(ch.Metrics.ResponseTimeVariability.Count)
148191

149-
// Calculate variance of response times
150-
ch.Metrics.ResponseTimeVariability.Variance = ch.calculateVariance(ch.Metrics.ResponseTimeVariability.Average, responseTime)
192+
// Calculate variance
193+
variance := ch.calculateVariance(averageResponseTime, responseTime)
194+
// Calculate standard deviation
195+
stdDev := math.Sqrt(variance)
151196

152-
// Calculate standard deviation of response times
153-
stdDev := math.Sqrt(ch.Metrics.ResponseTimeVariability.Variance)
197+
// Convert MaxAcceptableResponseTimeVariability to seconds for comparison
198+
maxStdDev := MaxAcceptableResponseTimeVariability.Seconds()
154199

155-
// Determine action based on standard deviation
156-
if stdDev > ch.Metrics.ResponseTimeVariability.StdDevThreshold {
157-
// Suggest decrease concurrency
158-
return -1
159-
} else if stdDev <= ch.Metrics.ResponseTimeVariability.StdDevThreshold && len(ch.sem) < MaxConcurrency {
160-
// Suggest increase concurrency if there is capacity
161-
return 1
200+
if stdDev > maxStdDev {
201+
return -1 // Suggest to decrease concurrency if stdDev exceeds the maximum threshold
162202
}
163-
return 0
203+
return 1 // Suggest to increase concurrency if stdDev is within the acceptable range
164204
}
165205

166-
// calculateVariance calculates the variance of response times.
167-
func (ch *ConcurrencyHandler) calculateVariance(averageResponseTime time.Duration, responseTime time.Duration) float64 {
168-
// Convert time.Duration values to seconds
169-
averageSeconds := averageResponseTime.Seconds()
170-
responseSeconds := responseTime.Seconds()
171-
172-
// Calculate variance
173-
variance := (float64(ch.Metrics.ResponseTimeVariability.Count-1)*math.Pow(averageSeconds-responseSeconds, 2) + ch.Metrics.ResponseTimeVariability.Variance) / float64(ch.Metrics.ResponseTimeVariability.Count)
174-
ch.Metrics.ResponseTimeVariability.Variance = variance
175-
return variance
206+
// calculateVariance calculates the variance between the average response time and a new sample.
207+
func (ch *ConcurrencyHandler) calculateVariance(average, newSample time.Duration) float64 {
208+
mean := average.Seconds() // Convert to seconds
209+
newValue := newSample.Seconds() // Convert to seconds
210+
newVariance := (float64(ch.Metrics.ResponseTimeVariability.Count-1)*math.Pow(mean-newValue, 2) + ch.Metrics.ResponseTimeVariability.Variance) / float64(ch.Metrics.ResponseTimeVariability.Count)
211+
ch.Metrics.ResponseTimeVariability.Variance = newVariance // Update the variance in metrics
212+
return newVariance
176213
}
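calculateVariance keeps a running variance: newVariance = ((count-1)*(mean-newValue)^2 + oldVariance) / count, with durations converted to seconds. A standalone numeric check of that update rule, using made-up sample values:

package main

import (
	"fmt"
	"math"
	"time"
)

func main() {
	// Made-up running state: 4 samples seen so far, prior variance of 0.09 s².
	count := int64(4)
	oldVariance := 0.09

	average := 800 * time.Millisecond    // running average response time
	newSample := 1400 * time.Millisecond // latest response time

	mean := average.Seconds()       // 0.8
	newValue := newSample.Seconds() // 1.4

	// Same update rule as calculateVariance above:
	// ((count-1)*(mean-newValue)^2 + oldVariance) / count
	newVariance := (float64(count-1)*math.Pow(mean-newValue, 2) + oldVariance) / float64(count)
	stdDev := math.Sqrt(newVariance)

	fmt.Printf("variance=%.4f stdDev=%.4fs\n", newVariance, stdDev)
	// (3*(0.8-1.4)^2 + 0.09) / 4 = (1.08 + 0.09) / 4 = 0.2925, so stdDev ≈ 0.5408s
}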
