2023-05-05 07:57:07 +00:00
package control
import (
"crypto/ecdsa"
"fmt"
"strings"
2023-05-19 15:06:20 +00:00
"sync/atomic"
2023-05-05 07:57:07 +00:00
"time"
"git.frostfs.info/TrueCloudLab/frostfs-node/cmd/frostfs-cli/internal/key"
commonCmd "git.frostfs.info/TrueCloudLab/frostfs-node/cmd/internal/common"
"git.frostfs.info/TrueCloudLab/frostfs-node/pkg/local_object_storage/shard"
"git.frostfs.info/TrueCloudLab/frostfs-node/pkg/services/control"
2024-11-07 14:32:10 +00:00
"git.frostfs.info/TrueCloudLab/frostfs-sdk-go/api/rpc/client"
2023-05-05 07:57:07 +00:00
clientSDK "git.frostfs.info/TrueCloudLab/frostfs-sdk-go/client"
"github.com/spf13/cobra"
)
// Names of the flags registered on the evacuation "start" command.
const (
	awaitFlag                = "await"
	noProgressFlag           = "no-progress"
	scopeFlag                = "scope"
	repOneOnlyFlag           = "rep-one-only"
	containerWorkerCountFlag = "container-worker-count"
	objectWorkerCountFlag    = "object-worker-count"
)

// Values recognised for the scope flag.
const (
	scopeAll     = "all"
	scopeObjects = "objects"
	scopeTrees   = "trees"
)
// evacuationShardCmd is the parent "evacuation" command. It has no Run
// handler of its own; subcommands are attached in
// initControlEvacuationShardCmd.
var evacuationShardCmd = &cobra.Command{
	Long:  "Objects evacuation from shard to other shards",
	Short: "Objects evacuation from shard",
	Use:   "evacuation",
}
// startEvacuationShardCmd is the "start" subcommand, handled by
// startEvacuateShard.
var startEvacuationShardCmd = &cobra.Command{
	Run:   startEvacuateShard,
	Use:   "start",
	Short: "Start evacuate objects from shard",
	Long:  "Start evacuate objects from shard to other shards",
}
// getEvacuationShardStatusCmd is the "status" subcommand, handled by
// getEvacuateShardStatus.
var getEvacuationShardStatusCmd = &cobra.Command{
	Run:   getEvacuateShardStatus,
	Use:   "status",
	Short: "Get evacuate objects from shard status",
	Long:  "Get evacuate objects from shard to other shards status",
}
// stopEvacuationShardCmd is the "stop" subcommand, handled by
// stopEvacuateShardStatus.
var stopEvacuationShardCmd = &cobra.Command{
	Run:   stopEvacuateShardStatus,
	Use:   "stop",
	Short: "Stop running evacuate process",
	Long:  "Stop running evacuate process from shard to other shards",
}
2024-03-13 07:40:44 +00:00
// resetEvacuationStatusShardCmd is the "reset" subcommand, handled by
// resetEvacuateShardStatus.
var resetEvacuationStatusShardCmd = &cobra.Command{
	Run:   resetEvacuateShardStatus,
	Use:   "reset",
	Short: "Reset evacuate objects from shard status",
	Long:  "Reset evacuate objects from shard to other shards status",
}
2023-05-05 07:57:07 +00:00
func startEvacuateShard ( cmd * cobra . Command , _ [ ] string ) {
pk := key . Get ( cmd )
ignoreErrors , _ := cmd . Flags ( ) . GetBool ( ignoreErrorsFlag )
2024-09-18 09:15:32 +00:00
containerWorkerCount , _ := cmd . Flags ( ) . GetUint32 ( containerWorkerCountFlag )
objectWorkerCount , _ := cmd . Flags ( ) . GetUint32 ( objectWorkerCountFlag )
2024-09-03 12:42:38 +00:00
repOneOnly , _ := cmd . Flags ( ) . GetBool ( repOneOnlyFlag )
2023-05-05 07:57:07 +00:00
req := & control . StartShardEvacuationRequest {
Body : & control . StartShardEvacuationRequest_Body {
2024-09-18 09:15:32 +00:00
Shard_ID : getShardIDList ( cmd ) ,
IgnoreErrors : ignoreErrors ,
Scope : getEvacuationScope ( cmd ) ,
ContainerWorkerCount : containerWorkerCount ,
ObjectWorkerCount : objectWorkerCount ,
2024-09-03 12:42:38 +00:00
RepOneOnly : repOneOnly ,
2023-05-05 07:57:07 +00:00
} ,
}
signRequest ( cmd , pk , req )
cli := getClient ( cmd , pk )
var resp * control . StartShardEvacuationResponse
var err error
err = cli . ExecRaw ( func ( client * client . Client ) error {
2023-05-26 08:26:54 +00:00
resp , err = control . StartShardEvacuation ( client , req )
2023-05-05 07:57:07 +00:00
return err
} )
commonCmd . ExitOnErr ( cmd , "Start evacuate shards failed, rpc error: %w" , err )
verifyResponse ( cmd , resp . GetSignature ( ) , resp . GetBody ( ) )
cmd . Println ( "Shard evacuation has been successfully started." )
if awaitCompletion , _ := cmd . Flags ( ) . GetBool ( awaitFlag ) ; awaitCompletion {
noProgress , _ := cmd . Flags ( ) . GetBool ( noProgressFlag )
waitEvacuateCompletion ( cmd , pk , cli , ! noProgress , true )
}
}
2024-02-05 13:33:09 +00:00
// getEvacuationScope reads the scope flag and converts it to the numeric
// scope value used in the start request: "objects" and "trees" map to their
// respective scope constants, "all" to the bitwise OR of both. A flag lookup
// error or an unrecognised value is reported through commonCmd.ExitOnErr.
func getEvacuationScope(cmd *cobra.Command) uint32 {
	scope, err := cmd.Flags().GetString(scopeFlag)
	commonCmd.ExitOnErr(cmd, "Invalid scope value: %w", err)

	objects := uint32(control.StartShardEvacuationRequest_Body_OBJECTS)
	trees := uint32(control.StartShardEvacuationRequest_Body_TREES)

	switch scope {
	case scopeObjects:
		return objects
	case scopeTrees:
		return trees
	case scopeAll:
		return objects | trees
	}

	commonCmd.ExitOnErr(cmd, "Invalid scope value: %w", fmt.Errorf("unknown scope %s", scope))
	// Fallback result for the case where the call above returns.
	return uint32(control.StartShardEvacuationRequest_Body_NONE)
}
2023-05-05 07:57:07 +00:00
func getEvacuateShardStatus ( cmd * cobra . Command , _ [ ] string ) {
pk := key . Get ( cmd )
req := & control . GetShardEvacuationStatusRequest {
Body : & control . GetShardEvacuationStatusRequest_Body { } ,
}
signRequest ( cmd , pk , req )
cli := getClient ( cmd , pk )
var resp * control . GetShardEvacuationStatusResponse
var err error
err = cli . ExecRaw ( func ( client * client . Client ) error {
2023-05-26 08:26:54 +00:00
resp , err = control . GetShardEvacuationStatus ( client , req )
2023-05-05 07:57:07 +00:00
return err
} )
commonCmd . ExitOnErr ( cmd , "Get evacuate shards status failed, rpc error: %w" , err )
verifyResponse ( cmd , resp . GetSignature ( ) , resp . GetBody ( ) )
printStatus ( cmd , resp )
}
func stopEvacuateShardStatus ( cmd * cobra . Command , _ [ ] string ) {
pk := key . Get ( cmd )
req := & control . StopShardEvacuationRequest {
Body : & control . StopShardEvacuationRequest_Body { } ,
}
signRequest ( cmd , pk , req )
cli := getClient ( cmd , pk )
var resp * control . StopShardEvacuationResponse
var err error
err = cli . ExecRaw ( func ( client * client . Client ) error {
2023-05-26 08:26:54 +00:00
resp , err = control . StopShardEvacuation ( client , req )
2023-05-05 07:57:07 +00:00
return err
} )
commonCmd . ExitOnErr ( cmd , "Stop evacuate shards failed, rpc error: %w" , err )
verifyResponse ( cmd , resp . GetSignature ( ) , resp . GetBody ( ) )
waitEvacuateCompletion ( cmd , pk , cli , false , false )
cmd . Println ( "Evacuation stopped." )
}
2024-03-13 07:40:44 +00:00
// resetEvacuateShardStatus is the Run handler of the "reset" subcommand: it
// sends a reset-status request through the control client, passes the
// response to verifyResponse and prints a confirmation.
func resetEvacuateShardStatus(cmd *cobra.Command, _ []string) {
	pk := key.Get(cmd)

	req := new(control.ResetShardEvacuationStatusRequest)
	req.Body = &control.ResetShardEvacuationStatusRequest_Body{}
	signRequest(cmd, pk, req)

	cli := getClient(cmd, pk)

	var (
		resp *control.ResetShardEvacuationStatusResponse
		err  error
	)
	err = cli.ExecRaw(func(c *client.Client) error {
		resp, err = control.ResetShardEvacuationStatus(c, req)
		return err
	})
	commonCmd.ExitOnErr(cmd, "Reset shards evacuation status failed, rpc error: %w", err)

	verifyResponse(cmd, resp.GetSignature(), resp.GetBody())
	cmd.Println("Shards evacuation status has been reset.")
}
2023-05-05 07:57:07 +00:00
func waitEvacuateCompletion ( cmd * cobra . Command , pk * ecdsa . PrivateKey , cli * clientSDK . Client , printProgress , printCompleted bool ) {
const statusPollingInterval = 1 * time . Second
const reportIntervalSeconds = 5
var resp * control . GetShardEvacuationStatusResponse
2023-05-19 15:06:20 +00:00
reportResponse := new ( atomic . Pointer [ control . GetShardEvacuationStatusResponse ] )
2023-05-05 07:57:07 +00:00
pollingCompleted := make ( chan struct { } )
progressReportCompleted := make ( chan struct { } )
go func ( ) {
defer close ( progressReportCompleted )
if ! printProgress {
return
}
cmd . Printf ( "Progress will be reported every %d seconds.\n" , reportIntervalSeconds )
for {
select {
case <- pollingCompleted :
return
case <- time . After ( reportIntervalSeconds * time . Second ) :
r := reportResponse . Load ( )
if r == nil || r . GetBody ( ) . GetStatus ( ) == control . GetShardEvacuationStatusResponse_Body_COMPLETED {
continue
}
printStatus ( cmd , r )
}
}
} ( )
for {
req := & control . GetShardEvacuationStatusRequest {
Body : & control . GetShardEvacuationStatusRequest_Body { } ,
}
signRequest ( cmd , pk , req )
var err error
err = cli . ExecRaw ( func ( client * client . Client ) error {
2023-05-26 08:26:54 +00:00
resp , err = control . GetShardEvacuationStatus ( client , req )
2023-05-05 07:57:07 +00:00
return err
} )
reportResponse . Store ( resp )
if err != nil {
commonCmd . ExitOnErr ( cmd , "Failed to get evacuate status, rpc error: %w" , err )
return
}
if resp . GetBody ( ) . GetStatus ( ) != control . GetShardEvacuationStatusResponse_Body_RUNNING {
break
}
time . Sleep ( statusPollingInterval )
}
close ( pollingCompleted )
<- progressReportCompleted
if printCompleted {
printCompletedStatusMessage ( cmd , resp )
}
}
// printCompletedStatusMessage prints a completion notice followed by a single
// line built from the response: shard IDs, counts, error, start time and
// duration, in that order.
func printCompletedStatusMessage(cmd *cobra.Command, resp *control.GetShardEvacuationStatusResponse) {
	cmd.Println("Shard evacuation has been completed.")

	sections := []func(*strings.Builder, *control.GetShardEvacuationStatusResponse){
		appendShardIDs,
		appendCounts,
		appendError,
		appendStartedAt,
		appendDuration,
	}

	var sb strings.Builder
	for _, appendSection := range sections {
		appendSection(&sb, resp)
	}
	cmd.Println(sb.String())
}
func printStatus ( cmd * cobra . Command , resp * control . GetShardEvacuationStatusResponse ) {
if resp . GetBody ( ) . GetStatus ( ) == control . GetShardEvacuationStatusResponse_Body_EVACUATE_SHARD_STATUS_UNDEFINED {
cmd . Println ( "There is no running or completed evacuation." )
return
}
sb := & strings . Builder { }
appendShardIDs ( sb , resp )
appendStatus ( sb , resp )
appendCounts ( sb , resp )
appendError ( sb , resp )
appendStartedAt ( sb , resp )
appendDuration ( sb , resp )
2023-05-29 15:44:46 +00:00
appendEstimation ( sb , resp )
2023-05-05 07:57:07 +00:00
cmd . Println ( sb . String ( ) )
}
2023-05-29 15:44:46 +00:00
func appendEstimation ( sb * strings . Builder , resp * control . GetShardEvacuationStatusResponse ) {
if resp . GetBody ( ) . GetStatus ( ) != control . GetShardEvacuationStatusResponse_Body_RUNNING ||
resp . GetBody ( ) . GetDuration ( ) == nil ||
2024-02-05 14:49:09 +00:00
( resp . GetBody ( ) . GetTotalObjects ( ) == 0 && resp . GetBody ( ) . GetTotalTrees ( ) == 0 ) ||
( resp . GetBody ( ) . GetEvacuatedObjects ( ) + resp . GetBody ( ) . GetFailedObjects ( ) + resp . GetBody ( ) . GetSkippedObjects ( ) == 0 &&
resp . GetBody ( ) . GetEvacuatedTrees ( ) + resp . GetBody ( ) . GetFailedTrees ( ) == 0 ) {
2023-05-29 15:44:46 +00:00
return
}
durationSeconds := float64 ( resp . GetBody ( ) . GetDuration ( ) . GetSeconds ( ) )
2024-02-05 14:49:09 +00:00
evacuated := float64 ( resp . GetBody ( ) . GetEvacuatedObjects ( ) + resp . GetBody ( ) . GetFailedObjects ( ) + resp . GetBody ( ) . GetSkippedObjects ( ) +
resp . GetBody ( ) . GetEvacuatedTrees ( ) + resp . GetBody ( ) . GetFailedTrees ( ) )
2023-05-29 15:44:46 +00:00
avgObjEvacuationTimeSeconds := durationSeconds / evacuated
2024-02-05 14:49:09 +00:00
objectsLeft := float64 ( resp . GetBody ( ) . GetTotalObjects ( ) + resp . GetBody ( ) . GetTotalTrees ( ) ) - evacuated
2023-05-29 15:44:46 +00:00
leftSeconds := avgObjEvacuationTimeSeconds * objectsLeft
leftMinutes := int ( leftSeconds / 60 )
sb . WriteString ( fmt . Sprintf ( " Estimated time left: %d minutes." , leftMinutes ) )
}
2023-05-05 07:57:07 +00:00
// appendDuration appends the evacuation duration formatted as HH:MM:SS. It
// writes nothing when the response carries no duration.
func appendDuration(sb *strings.Builder, resp *control.GetShardEvacuationStatusResponse) {
	reported := resp.GetBody().GetDuration()
	if reported == nil {
		return
	}

	elapsed := time.Duration(reported.GetSeconds()) * time.Second
	secs := elapsed.Seconds()

	hours := int(secs / 3600)
	minutes := int(secs/60) % 60
	seconds := int(secs) % 60

	fmt.Fprintf(sb, " Duration: %02d:%02d:%02d.", hours, minutes, seconds)
}
// appendStartedAt appends the evacuation start time, converted from a Unix
// timestamp in seconds to UTC and formatted as RFC 3339. It writes nothing
// when the response carries no start time.
func appendStartedAt(sb *strings.Builder, resp *control.GetShardEvacuationStatusResponse) {
	started := resp.GetBody().GetStartedAt()
	if started == nil {
		return
	}

	stamp := time.Unix(started.GetValue(), 0).UTC().Format(time.RFC3339)
	fmt.Fprintf(sb, " Started at: %s UTC.", stamp)
}
func appendError ( sb * strings . Builder , resp * control . GetShardEvacuationStatusResponse ) {
2023-12-11 10:18:34 +00:00
if len ( resp . GetBody ( ) . GetErrorMessage ( ) ) > 0 {
sb . WriteString ( fmt . Sprintf ( " Error: %s." , resp . GetBody ( ) . GetErrorMessage ( ) ) )
2023-05-05 07:57:07 +00:00
}
}
// appendStatus appends the evacuation status as text: "completed", "running",
// or "undefined" for any other value.
func appendStatus(sb *strings.Builder, resp *control.GetShardEvacuationStatusResponse) {
	label := "undefined"
	switch resp.GetBody().GetStatus() {
	case control.GetShardEvacuationStatusResponse_Body_RUNNING:
		label = "running"
	case control.GetShardEvacuationStatusResponse_Body_COMPLETED:
		label = "completed"
	}
	fmt.Fprintf(sb, " Status: %s.", label)
}
// appendShardIDs appends the "Shard IDs: " prefix followed by the
// comma-separated string forms of the shard IDs and a closing period. When
// the response lists no shards, only the prefix is written.
func appendShardIDs(sb *strings.Builder, resp *control.GetShardEvacuationStatusResponse) {
	sb.WriteString("Shard IDs: ")

	rawIDs := resp.GetBody().GetShard_ID()
	if len(rawIDs) == 0 {
		return
	}

	ids := make([]string, 0, len(rawIDs))
	for _, raw := range rawIDs {
		ids = append(ids, shard.NewIDFromBytes(raw).String())
	}

	sb.WriteString(strings.Join(ids, ", "))
	sb.WriteString(".")
}
func appendCounts ( sb * strings . Builder , resp * control . GetShardEvacuationStatusResponse ) {
2024-02-05 14:49:09 +00:00
sb . WriteString ( fmt . Sprintf ( " Evacuated %d objects out of %d, failed to evacuate: %d, skipped: %d; evacuated %d trees out of %d, failed to evacuate: %d." ,
resp . GetBody ( ) . GetEvacuatedObjects ( ) ,
resp . GetBody ( ) . GetTotalObjects ( ) ,
resp . GetBody ( ) . GetFailedObjects ( ) ,
resp . GetBody ( ) . GetSkippedObjects ( ) ,
resp . GetBody ( ) . GetEvacuatedTrees ( ) ,
resp . GetBody ( ) . GetTotalTrees ( ) ,
resp . GetBody ( ) . GetFailedTrees ( ) ) )
2023-05-05 07:57:07 +00:00
}
func initControlEvacuationShardCmd ( ) {
evacuationShardCmd . AddCommand ( startEvacuationShardCmd )
evacuationShardCmd . AddCommand ( getEvacuationShardStatusCmd )
evacuationShardCmd . AddCommand ( stopEvacuationShardCmd )
2024-03-13 07:40:44 +00:00
evacuationShardCmd . AddCommand ( resetEvacuationStatusShardCmd )
2023-05-05 07:57:07 +00:00
initControlStartEvacuationShardCmd ( )
initControlFlags ( getEvacuationShardStatusCmd )
initControlFlags ( stopEvacuationShardCmd )
2024-03-13 07:40:44 +00:00
initControlFlags ( resetEvacuationStatusShardCmd )
2023-05-05 07:57:07 +00:00
}
func initControlStartEvacuationShardCmd ( ) {
initControlFlags ( startEvacuationShardCmd )
flags := startEvacuationShardCmd . Flags ( )
flags . StringSlice ( shardIDFlag , nil , "List of shard IDs in base58 encoding" )
flags . Bool ( shardAllFlag , false , "Process all shards" )
flags . Bool ( ignoreErrorsFlag , true , "Skip invalid/unreadable objects" )
2024-02-05 13:33:09 +00:00
flags . String ( scopeFlag , scopeAll , fmt . Sprintf ( "Evacuation scope; possible values: %s, %s, %s" , scopeTrees , scopeObjects , scopeAll ) )
2023-05-05 07:57:07 +00:00
flags . Bool ( awaitFlag , false , "Block execution until evacuation is completed" )
flags . Bool ( noProgressFlag , false , fmt . Sprintf ( "Print progress if %s provided" , awaitFlag ) )
2024-09-18 09:15:32 +00:00
flags . Uint32 ( containerWorkerCountFlag , 0 , "Count of concurrent container evacuation workers" )
flags . Uint32 ( objectWorkerCountFlag , 0 , "Count of concurrent object evacuation workers" )
2024-09-03 12:42:38 +00:00
flags . Bool ( repOneOnlyFlag , false , "Evacuate objects only from containers with policy 'REP 1 ...'" )
2023-05-05 07:57:07 +00:00
startEvacuationShardCmd . MarkFlagsMutuallyExclusive ( shardIDFlag , shardAllFlag )
}