filechunks2_test.go 3.7 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485
  1. package filer
  2. import (
  3. "github.com/stretchr/testify/assert"
  4. "golang.org/x/exp/slices"
  5. "log"
  6. "testing"
  7. "github.com/seaweedfs/seaweedfs/weed/glog"
  8. "github.com/seaweedfs/seaweedfs/weed/pb/filer_pb"
  9. )
  10. func TestDoMinusChunks(t *testing.T) {
  11. // https://github.com/seaweedfs/seaweedfs/issues/3328
  12. // clusterA and clusterB using filer.sync to sync file: hello.txt
  13. // clusterA append a new line and then clusterB also append a new line
  14. // clusterA append a new line again
  15. chunksInA := []*filer_pb.FileChunk{
  16. {Offset: 0, Size: 3, FileId: "11", ModifiedTsNs: 100},
  17. {Offset: 3, Size: 3, FileId: "22", SourceFileId: "2", ModifiedTsNs: 200},
  18. {Offset: 6, Size: 3, FileId: "33", ModifiedTsNs: 300},
  19. }
  20. chunksInB := []*filer_pb.FileChunk{
  21. {Offset: 0, Size: 3, FileId: "1", SourceFileId: "11", ModifiedTsNs: 100},
  22. {Offset: 3, Size: 3, FileId: "2", ModifiedTsNs: 200},
  23. {Offset: 6, Size: 3, FileId: "3", SourceFileId: "33", ModifiedTsNs: 300},
  24. }
  25. // clusterB using command "echo 'content' > hello.txt" to overwrite file
  26. // clusterA will receive two evenNotification, need to empty the whole file content first and add new content
  27. // the first one is oldEntry is chunksInB and newEntry is empty fileChunks
  28. firstOldEntry := chunksInB
  29. var firstNewEntry []*filer_pb.FileChunk
  30. // clusterA received the first one event, gonna empty the whole chunk, according the code in filer_sink 194
  31. // we can get the deleted chunks and newChunks
  32. firstDeletedChunks := DoMinusChunks(firstOldEntry, firstNewEntry)
  33. log.Println("first deleted chunks:", firstDeletedChunks)
  34. //firstNewEntry := DoMinusChunks(firstNewEntry, firstOldEntry)
  35. // clusterA need to delete all chunks in firstDeletedChunks
  36. emptiedChunksInA := DoMinusChunksBySourceFileId(chunksInA, firstDeletedChunks)
  37. // chunksInA supposed to be empty by minus the deletedChunks but it just delete the chunk which sync from clusterB
  38. log.Println("clusterA synced empty chunks event result:", emptiedChunksInA)
  39. // clusterB emptied it's chunks and clusterA must sync the change and empty chunks too
  40. assert.Equalf(t, firstNewEntry, emptiedChunksInA, "empty")
  41. }
  42. func TestCompactFileChunksRealCase(t *testing.T) {
  43. chunks := []*filer_pb.FileChunk{
  44. {FileId: "2,512f31f2c0700a", Offset: 0, Size: 25 - 0, ModifiedTsNs: 5320497},
  45. {FileId: "6,512f2c2e24e9e8", Offset: 868352, Size: 917585 - 868352, ModifiedTsNs: 5320492},
  46. {FileId: "7,514468dd5954ca", Offset: 884736, Size: 901120 - 884736, ModifiedTsNs: 5325928},
  47. {FileId: "5,5144463173fe77", Offset: 917504, Size: 2297856 - 917504, ModifiedTsNs: 5325894},
  48. {FileId: "4,51444c7ab54e2d", Offset: 2301952, Size: 2367488 - 2301952, ModifiedTsNs: 5325900},
  49. {FileId: "4,514450e643ad22", Offset: 2371584, Size: 2420736 - 2371584, ModifiedTsNs: 5325904},
  50. {FileId: "6,514456a5e9e4d7", Offset: 2449408, Size: 2490368 - 2449408, ModifiedTsNs: 5325910},
  51. {FileId: "3,51444f8d53eebe", Offset: 2494464, Size: 2555904 - 2494464, ModifiedTsNs: 5325903},
  52. {FileId: "4,5144578b097c7e", Offset: 2560000, Size: 2596864 - 2560000, ModifiedTsNs: 5325911},
  53. {FileId: "3,51445500b6b4ac", Offset: 2637824, Size: 2678784 - 2637824, ModifiedTsNs: 5325909},
  54. {FileId: "1,51446285e52a61", Offset: 2695168, Size: 2715648 - 2695168, ModifiedTsNs: 5325922},
  55. }
  56. printChunks("before", chunks)
  57. compacted, garbage := CompactFileChunks(nil, chunks)
  58. printChunks("compacted", compacted)
  59. printChunks("garbage", garbage)
  60. }
  61. func printChunks(name string, chunks []*filer_pb.FileChunk) {
  62. slices.SortFunc(chunks, func(a, b *filer_pb.FileChunk) int {
  63. if a.Offset == b.Offset {
  64. return int(a.ModifiedTsNs - b.ModifiedTsNs)
  65. }
  66. return int(a.Offset - b.Offset)
  67. })
  68. for _, chunk := range chunks {
  69. glog.V(0).Infof("%s chunk %s [%10d,%10d)", name, chunk.GetFileIdString(), chunk.Offset, chunk.Offset+int64(chunk.Size))
  70. }
  71. }