* add ui for maintenance * valid config loading. fix workers page. * refactor * grpc between admin and workers * add a long-running bidirectional grpc call between admin and worker * use the grpc call to heartbeat * use the grpc call to communicate * worker can remove the http client * admin uses http port + 10000 as its default grpc port * one task one package * handles connection failures gracefully with exponential backoff * grpc with insecure tls * grpc with optional tls * fix detecting tls * change time config from nano seconds to seconds * add tasks with 3 interfaces * compiles reducing hard coded * remove a couple of tasks * remove hard coded references * reduce hard coded values * remove hard coded values * remove hard coded from templ * refactor maintenance package * fix import cycle * simplify * simplify * auto register * auto register factory * auto register task types * self register types * refactor * simplify * remove one task * register ui * lazy init executor factories * use registered task types * DefaultWorkerConfig remove hard coded task types * remove more hard coded * implement get maintenance task * dynamic task configuration * "System Settings" should only have system level settings * adjust menu for tasks * ensure menu not collapsed * render job configuration well * use templ for ui of task configuration * fix ordering * fix bugs * saving duration in seconds * use value and unit for duration * Delete WORKER_REFACTORING_PLAN.md * Delete maintenance.json * Delete custom_worker_example.go * remove address from workers * remove old code from ec task * remove creating collection button * reconnect with exponential backoff * worker use security.toml * start admin server with tls info from security.toml * fix "weed admin" cli description
140 lines
3.7 KiB
Go
140 lines
3.7 KiB
Go
package erasure_coding
|
|
|
|
import (
|
|
"time"
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/glog"
|
|
"github.com/seaweedfs/seaweedfs/weed/worker/types"
|
|
)
|
|
|
|
// EcDetector decides which volumes should be converted to erasure coding.
// It holds the thresholds and schedule that ScanForTasks applies to each
// volume's health metrics.
type EcDetector struct {
	// enabled gates detection; when false ScanForTasks reports nothing.
	enabled bool

	// scanInterval is the value reported by ScanInterval.
	scanInterval time.Duration

	// volumeAgeHours is the minimum volume age, in hours, required before a
	// volume is considered for conversion.
	volumeAgeHours int

	// fullnessRatio is the minimum fullness ratio required before a volume is
	// considered for conversion.
	fullnessRatio float64
}
|
|
|
|
// Compile-time interface assertions
|
|
var (
|
|
_ types.TaskDetector = (*EcDetector)(nil)
|
|
)
|
|
|
|
// NewEcDetector creates a new erasure coding detector
|
|
func NewEcDetector() *EcDetector {
|
|
return &EcDetector{
|
|
enabled: false, // Conservative default
|
|
volumeAgeHours: 24 * 7, // 1 week
|
|
fullnessRatio: 0.9, // 90% full
|
|
scanInterval: 2 * time.Hour,
|
|
}
|
|
}
|
|
|
|
// GetTaskType returns the task type
|
|
func (d *EcDetector) GetTaskType() types.TaskType {
|
|
return types.TaskTypeErasureCoding
|
|
}
|
|
|
|
// ScanForTasks scans for volumes that should be converted to erasure coding
|
|
func (d *EcDetector) ScanForTasks(volumeMetrics []*types.VolumeHealthMetrics, clusterInfo *types.ClusterInfo) ([]*types.TaskDetectionResult, error) {
|
|
if !d.enabled {
|
|
return nil, nil
|
|
}
|
|
|
|
var results []*types.TaskDetectionResult
|
|
now := time.Now()
|
|
ageThreshold := time.Duration(d.volumeAgeHours) * time.Hour
|
|
|
|
for _, metric := range volumeMetrics {
|
|
// Skip if already EC volume
|
|
if metric.IsECVolume {
|
|
continue
|
|
}
|
|
|
|
// Check age and fullness criteria
|
|
if metric.Age >= ageThreshold && metric.FullnessRatio >= d.fullnessRatio {
|
|
// Check if volume is read-only (safe for EC conversion)
|
|
if !metric.IsReadOnly {
|
|
continue
|
|
}
|
|
|
|
result := &types.TaskDetectionResult{
|
|
TaskType: types.TaskTypeErasureCoding,
|
|
VolumeID: metric.VolumeID,
|
|
Server: metric.Server,
|
|
Collection: metric.Collection,
|
|
Priority: types.TaskPriorityLow, // EC is not urgent
|
|
Reason: "Volume is old and full enough for EC conversion",
|
|
Parameters: map[string]interface{}{
|
|
"age_hours": int(metric.Age.Hours()),
|
|
"fullness_ratio": metric.FullnessRatio,
|
|
},
|
|
ScheduleAt: now,
|
|
}
|
|
results = append(results, result)
|
|
}
|
|
}
|
|
|
|
glog.V(2).Infof("EC detector found %d tasks to schedule", len(results))
|
|
return results, nil
|
|
}
|
|
|
|
// ScanInterval returns how often this task type should be scanned
|
|
func (d *EcDetector) ScanInterval() time.Duration {
|
|
return d.scanInterval
|
|
}
|
|
|
|
// IsEnabled returns whether this task type is enabled
|
|
func (d *EcDetector) IsEnabled() bool {
|
|
return d.enabled
|
|
}
|
|
|
|
// Configuration setters
|
|
|
|
func (d *EcDetector) SetEnabled(enabled bool) {
|
|
d.enabled = enabled
|
|
}
|
|
|
|
func (d *EcDetector) SetVolumeAgeHours(hours int) {
|
|
d.volumeAgeHours = hours
|
|
}
|
|
|
|
func (d *EcDetector) SetFullnessRatio(ratio float64) {
|
|
d.fullnessRatio = ratio
|
|
}
|
|
|
|
func (d *EcDetector) SetScanInterval(interval time.Duration) {
|
|
d.scanInterval = interval
|
|
}
|
|
|
|
// GetVolumeAgeHours returns the current volume age threshold in hours
|
|
func (d *EcDetector) GetVolumeAgeHours() int {
|
|
return d.volumeAgeHours
|
|
}
|
|
|
|
// GetFullnessRatio returns the current fullness ratio threshold
|
|
func (d *EcDetector) GetFullnessRatio() float64 {
|
|
return d.fullnessRatio
|
|
}
|
|
|
|
// GetScanInterval returns the scan interval
|
|
func (d *EcDetector) GetScanInterval() time.Duration {
|
|
return d.scanInterval
|
|
}
|
|
|
|
// ConfigureFromPolicy configures the detector based on the maintenance policy
|
|
func (d *EcDetector) ConfigureFromPolicy(policy interface{}) {
|
|
// Type assert to the maintenance policy type we expect
|
|
if maintenancePolicy, ok := policy.(interface {
|
|
GetECEnabled() bool
|
|
GetECVolumeAgeHours() int
|
|
GetECFullnessRatio() float64
|
|
}); ok {
|
|
d.SetEnabled(maintenancePolicy.GetECEnabled())
|
|
d.SetVolumeAgeHours(maintenancePolicy.GetECVolumeAgeHours())
|
|
d.SetFullnessRatio(maintenancePolicy.GetECFullnessRatio())
|
|
} else {
|
|
glog.V(1).Infof("Could not configure EC detector from policy: unsupported policy type")
|
|
}
|
|
}
|