You cannot select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							95 lines
						
					
					
						
							2.5 KiB
						
					
					
				
			
		
		
		
			
			
			
		
		
	
	
							95 lines
						
					
					
						
							2.5 KiB
						
					
					
				
								package main
							 | 
						|
								
							 | 
						|
								import (
							 | 
						|
									"flag"
							 | 
						|
									"fmt"
							 | 
						|
									"os"
							 | 
						|
									"path/filepath"
							 | 
						|
								
							 | 
						|
									"github.com/chrislusf/seaweedfs/weed/glog"
							 | 
						|
									"github.com/chrislusf/seaweedfs/weed/storage"
							 | 
						|
									"github.com/chrislusf/seaweedfs/weed/storage/backend"
							 | 
						|
									"github.com/chrislusf/seaweedfs/weed/storage/needle"
							 | 
						|
									"github.com/chrislusf/seaweedfs/weed/storage/super_block"
							 | 
						|
								)
							 | 
						|
								
							 | 
						|
								// Command-line flags. Each one is registered on the default flag set and
								// holds its default value until flag.Parse is called.

								// volumePath is the value of -dir: the data directory to store files.
								var volumePath = flag.String("dir", "/tmp", "data directory to store files")

								// volumeCollection is the value of -collection: the volume collection name.
								var volumeCollection = flag.String("collection", "", "the volume collection name")

								// volumeId is the value of -volumeId; it defaults to -1 when the flag is
								// not given.
								var volumeId = flag.Int("volumeId", -1, "a volume id. The volume should already exist in the dir. The volume index file should not exist.")
							 | 
						|
								
							 | 
						|
								func Checksum(n *needle.Needle) string {
							 | 
						|
									return fmt.Sprintf("%s%x", n.Id, n.Cookie)
							 | 
						|
								}
							 | 
						|
								
							 | 
						|
								type VolumeFileScanner4SeeDat struct {
							 | 
						|
									version needle.Version
							 | 
						|
									block   super_block.SuperBlock
							 | 
						|
								
							 | 
						|
									dir        string
							 | 
						|
									hashes     map[string]bool
							 | 
						|
									dat        *os.File
							 | 
						|
									datBackend backend.BackendStorageFile
							 | 
						|
								}
							 | 
						|
								
							 | 
						|
								func (scanner *VolumeFileScanner4SeeDat) VisitSuperBlock(superBlock super_block.SuperBlock) error {
							 | 
						|
									scanner.version = superBlock.Version
							 | 
						|
									scanner.block = superBlock
							 | 
						|
									return nil
							 | 
						|
								
							 | 
						|
								}
							 | 
						|
								func (scanner *VolumeFileScanner4SeeDat) ReadNeedleBody() bool {
							 | 
						|
									return true
							 | 
						|
								}
							 | 
						|
								
							 | 
						|
								func (scanner *VolumeFileScanner4SeeDat) VisitNeedle(n *needle.Needle, offset int64, needleHeader, needleBody []byte) error {
							 | 
						|
								
							 | 
						|
									if scanner.datBackend == nil {
							 | 
						|
										newFileName := filepath.Join(*volumePath, "dat_fixed")
							 | 
						|
										newDatFile, err := os.Create(newFileName)
							 | 
						|
										if err != nil {
							 | 
						|
											glog.Fatalf("Write New Volume Data %v", err)
							 | 
						|
										}
							 | 
						|
										scanner.datBackend = backend.NewDiskFile(newDatFile)
							 | 
						|
										scanner.datBackend.WriteAt(scanner.block.Bytes(), 0)
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									checksum := Checksum(n)
							 | 
						|
								
							 | 
						|
									if scanner.hashes[checksum] {
							 | 
						|
										glog.V(0).Infof("duplicate checksum:%s fid:%d,%s%x @ offset:%d", checksum, *volumeId, n.Id, n.Cookie, offset)
							 | 
						|
										return nil
							 | 
						|
									}
							 | 
						|
									scanner.hashes[checksum] = true
							 | 
						|
								
							 | 
						|
									_, s, _, e := n.Append(scanner.datBackend, scanner.version)
							 | 
						|
									fmt.Printf("size %d error %v\n", s, e)
							 | 
						|
								
							 | 
						|
									return nil
							 | 
						|
								}
							 | 
						|
								
							 | 
						|
								func main() {
							 | 
						|
									flag.Parse()
							 | 
						|
								
							 | 
						|
									vid := needle.VolumeId(*volumeId)
							 | 
						|
								
							 | 
						|
									outpath, _ := filepath.Abs(filepath.Dir(os.Args[0]))
							 | 
						|
								
							 | 
						|
									scanner := &VolumeFileScanner4SeeDat{
							 | 
						|
										dir:    filepath.Join(outpath, "out"),
							 | 
						|
										hashes: map[string]bool{},
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									if _, err := os.Stat(scanner.dir); err != nil {
							 | 
						|
										if err := os.MkdirAll(scanner.dir, os.ModePerm); err != nil {
							 | 
						|
											glog.Fatalf("could not create output dir : %s", err)
							 | 
						|
										}
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
									err := storage.ScanVolumeFile(*volumePath, *volumeCollection, vid, storage.NeedleMapInMemory, scanner)
							 | 
						|
									if err != nil {
							 | 
						|
										glog.Fatalf("Reading Volume File [ERROR] %s\n", err)
							 | 
						|
									}
							 | 
						|
								
							 | 
						|
								}
							 |