123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290 |
- package shell
- import (
- "context"
- "flag"
- "fmt"
- "github.com/chrislusf/seaweedfs/weed/glog"
- "github.com/chrislusf/seaweedfs/weed/pb"
- "github.com/chrislusf/seaweedfs/weed/storage/types"
- "io"
- "time"
- "google.golang.org/grpc"
- "github.com/chrislusf/seaweedfs/weed/operation"
- "github.com/chrislusf/seaweedfs/weed/pb/master_pb"
- "github.com/chrislusf/seaweedfs/weed/pb/volume_server_pb"
- "github.com/chrislusf/seaweedfs/weed/storage/erasure_coding"
- "github.com/chrislusf/seaweedfs/weed/storage/needle"
- )
- func init() {
- Commands = append(Commands, &commandEcDecode{})
- }
- type commandEcDecode struct {
- }
- func (c *commandEcDecode) Name() string {
- return "ec.decode"
- }
- func (c *commandEcDecode) Help() string {
- return `decode a erasure coded volume into a normal volume
- ec.decode [-collection=""] [-volumeId=<volume_id>]
- `
- }
- func (c *commandEcDecode) Do(args []string, commandEnv *CommandEnv, writer io.Writer) (err error) {
- encodeCommand := flag.NewFlagSet(c.Name(), flag.ContinueOnError)
- volumeId := encodeCommand.Int("volumeId", 0, "the volume id")
- collection := encodeCommand.String("collection", "", "the collection name")
- forceChanges := encodeCommand.Bool("force", false, "force the encoding even if the cluster has less than recommended 4 nodes")
- if err = encodeCommand.Parse(args); err != nil {
- return nil
- }
- if err = commandEnv.confirmIsLocked(args); err != nil {
- return
- }
- vid := needle.VolumeId(*volumeId)
- // collect topology information
- topologyInfo, _, err := collectTopologyInfo(commandEnv, 0)
- if err != nil {
- return err
- }
- if !*forceChanges {
- var nodeCount int
- eachDataNode(topologyInfo, func(dc string, rack RackId, dn *master_pb.DataNodeInfo) {
- nodeCount++
- })
- if nodeCount < erasure_coding.ParityShardsCount {
- glog.V(0).Infof("skip erasure coding with %d nodes, less than recommended %d nodes", nodeCount, erasure_coding.ParityShardsCount)
- return nil
- }
- }
- // volumeId is provided
- if vid != 0 {
- return doEcDecode(commandEnv, topologyInfo, *collection, vid)
- }
- // apply to all volumes in the collection
- volumeIds := collectEcShardIds(topologyInfo, *collection)
- fmt.Printf("ec encode volumes: %v\n", volumeIds)
- for _, vid := range volumeIds {
- if err = doEcDecode(commandEnv, topologyInfo, *collection, vid); err != nil {
- return err
- }
- }
- return nil
- }
- func doEcDecode(commandEnv *CommandEnv, topoInfo *master_pb.TopologyInfo, collection string, vid needle.VolumeId) (err error) {
- // find volume location
- nodeToEcIndexBits := collectEcNodeShardBits(topoInfo, vid)
- fmt.Printf("ec volume %d shard locations: %+v\n", vid, nodeToEcIndexBits)
- // collect ec shards to the server with most space
- targetNodeLocation, err := collectEcShards(commandEnv, nodeToEcIndexBits, collection, vid)
- if err != nil {
- return fmt.Errorf("collectEcShards for volume %d: %v", vid, err)
- }
- // generate a normal volume
- err = generateNormalVolume(commandEnv.option.GrpcDialOption, vid, collection, targetNodeLocation)
- if err != nil {
- return fmt.Errorf("generate normal volume %d on %s: %v", vid, targetNodeLocation, err)
- }
- // delete the previous ec shards
- err = mountVolumeAndDeleteEcShards(commandEnv.option.GrpcDialOption, collection, targetNodeLocation, nodeToEcIndexBits, vid)
- if err != nil {
- return fmt.Errorf("delete ec shards for volume %d: %v", vid, err)
- }
- return nil
- }
- func mountVolumeAndDeleteEcShards(grpcDialOption grpc.DialOption, collection string, targetNodeLocation pb.ServerAddress, nodeToEcIndexBits map[pb.ServerAddress]erasure_coding.ShardBits, vid needle.VolumeId) error {
- // mount volume
- if err := operation.WithVolumeServerClient(false, targetNodeLocation, grpcDialOption, func(volumeServerClient volume_server_pb.VolumeServerClient) error {
- _, mountErr := volumeServerClient.VolumeMount(context.Background(), &volume_server_pb.VolumeMountRequest{
- VolumeId: uint32(vid),
- })
- return mountErr
- }); err != nil {
- return fmt.Errorf("mountVolumeAndDeleteEcShards mount volume %d on %s: %v", vid, targetNodeLocation, err)
- }
- // unmount ec shards
- for location, ecIndexBits := range nodeToEcIndexBits {
- fmt.Printf("unmount ec volume %d on %s has shards: %+v\n", vid, location, ecIndexBits.ShardIds())
- err := unmountEcShards(grpcDialOption, vid, location, ecIndexBits.ToUint32Slice())
- if err != nil {
- return fmt.Errorf("mountVolumeAndDeleteEcShards unmount ec volume %d on %s: %v", vid, location, err)
- }
- }
- // delete ec shards
- for location, ecIndexBits := range nodeToEcIndexBits {
- fmt.Printf("delete ec volume %d on %s has shards: %+v\n", vid, location, ecIndexBits.ShardIds())
- err := sourceServerDeleteEcShards(grpcDialOption, collection, vid, location, ecIndexBits.ToUint32Slice())
- if err != nil {
- return fmt.Errorf("mountVolumeAndDeleteEcShards delete ec volume %d on %s: %v", vid, location, err)
- }
- }
- return nil
- }
- func generateNormalVolume(grpcDialOption grpc.DialOption, vid needle.VolumeId, collection string, sourceVolumeServer pb.ServerAddress) error {
- fmt.Printf("generateNormalVolume from ec volume %d on %s\n", vid, sourceVolumeServer)
- err := operation.WithVolumeServerClient(false, sourceVolumeServer, grpcDialOption, func(volumeServerClient volume_server_pb.VolumeServerClient) error {
- _, genErr := volumeServerClient.VolumeEcShardsToVolume(context.Background(), &volume_server_pb.VolumeEcShardsToVolumeRequest{
- VolumeId: uint32(vid),
- Collection: collection,
- })
- return genErr
- })
- return err
- }
- func collectEcShards(commandEnv *CommandEnv, nodeToEcIndexBits map[pb.ServerAddress]erasure_coding.ShardBits, collection string, vid needle.VolumeId) (targetNodeLocation pb.ServerAddress, err error) {
- maxShardCount := 0
- var exisitngEcIndexBits erasure_coding.ShardBits
- for loc, ecIndexBits := range nodeToEcIndexBits {
- toBeCopiedShardCount := ecIndexBits.MinusParityShards().ShardIdCount()
- if toBeCopiedShardCount > maxShardCount {
- maxShardCount = toBeCopiedShardCount
- targetNodeLocation = loc
- exisitngEcIndexBits = ecIndexBits
- }
- }
- fmt.Printf("collectEcShards: ec volume %d collect shards to %s from: %+v\n", vid, targetNodeLocation, nodeToEcIndexBits)
- var copiedEcIndexBits erasure_coding.ShardBits
- for loc, ecIndexBits := range nodeToEcIndexBits {
- if loc == targetNodeLocation {
- continue
- }
- needToCopyEcIndexBits := ecIndexBits.Minus(exisitngEcIndexBits).MinusParityShards()
- if needToCopyEcIndexBits.ShardIdCount() == 0 {
- continue
- }
- err = operation.WithVolumeServerClient(false, targetNodeLocation, commandEnv.option.GrpcDialOption, func(volumeServerClient volume_server_pb.VolumeServerClient) error {
- fmt.Printf("copy %d.%v %s => %s\n", vid, needToCopyEcIndexBits.ShardIds(), loc, targetNodeLocation)
- _, copyErr := volumeServerClient.VolumeEcShardsCopy(context.Background(), &volume_server_pb.VolumeEcShardsCopyRequest{
- VolumeId: uint32(vid),
- Collection: collection,
- ShardIds: needToCopyEcIndexBits.ToUint32Slice(),
- CopyEcxFile: false,
- CopyEcjFile: true,
- CopyVifFile: true,
- SourceDataNode: string(loc),
- })
- if copyErr != nil {
- return fmt.Errorf("copy %d.%v %s => %s : %v\n", vid, needToCopyEcIndexBits.ShardIds(), loc, targetNodeLocation, copyErr)
- }
- return nil
- })
- if err != nil {
- break
- }
- copiedEcIndexBits = copiedEcIndexBits.Plus(needToCopyEcIndexBits)
- }
- nodeToEcIndexBits[targetNodeLocation] = exisitngEcIndexBits.Plus(copiedEcIndexBits)
- return targetNodeLocation, err
- }
- func lookupVolumeIds(commandEnv *CommandEnv, volumeIds []string) (volumeIdLocations []*master_pb.LookupVolumeResponse_VolumeIdLocation, err error) {
- var resp *master_pb.LookupVolumeResponse
- err = commandEnv.MasterClient.WithClient(false, func(client master_pb.SeaweedClient) error {
- resp, err = client.LookupVolume(context.Background(), &master_pb.LookupVolumeRequest{VolumeOrFileIds: volumeIds})
- return err
- })
- if err != nil {
- return nil, err
- }
- return resp.VolumeIdLocations, nil
- }
- func collectTopologyInfo(commandEnv *CommandEnv, delayBeforeCollecting time.Duration) (topoInfo *master_pb.TopologyInfo, volumeSizeLimitMb uint64, err error) {
- if delayBeforeCollecting > 0 {
- time.Sleep(delayBeforeCollecting)
- }
- var resp *master_pb.VolumeListResponse
- err = commandEnv.MasterClient.WithClient(false, func(client master_pb.SeaweedClient) error {
- resp, err = client.VolumeList(context.Background(), &master_pb.VolumeListRequest{})
- return err
- })
- if err != nil {
- return
- }
- return resp.TopologyInfo, resp.VolumeSizeLimitMb, nil
- }
- func collectEcShardIds(topoInfo *master_pb.TopologyInfo, selectedCollection string) (vids []needle.VolumeId) {
- vidMap := make(map[uint32]bool)
- eachDataNode(topoInfo, func(dc string, rack RackId, dn *master_pb.DataNodeInfo) {
- if diskInfo, found := dn.DiskInfos[string(types.HardDriveType)]; found {
- for _, v := range diskInfo.EcShardInfos {
- if v.Collection == selectedCollection {
- vidMap[v.Id] = true
- }
- }
- }
- })
- for vid := range vidMap {
- vids = append(vids, needle.VolumeId(vid))
- }
- return
- }
- func collectEcNodeShardBits(topoInfo *master_pb.TopologyInfo, vid needle.VolumeId) map[pb.ServerAddress]erasure_coding.ShardBits {
- nodeToEcIndexBits := make(map[pb.ServerAddress]erasure_coding.ShardBits)
- eachDataNode(topoInfo, func(dc string, rack RackId, dn *master_pb.DataNodeInfo) {
- if diskInfo, found := dn.DiskInfos[string(types.HardDriveType)]; found {
- for _, v := range diskInfo.EcShardInfos {
- if v.Id == uint32(vid) {
- nodeToEcIndexBits[pb.NewServerAddressFromDataNode(dn)] = erasure_coding.ShardBits(v.EcIndexBits)
- }
- }
- }
- })
- return nodeToEcIndexBits
- }
|