Chris Lu
5 years ago
8 changed files with 180 additions and 33 deletions
-
134other/java/client/src/main/java/seaweedfs/client/FileChunkManifest.java
-
9other/java/client/src/main/java/seaweedfs/client/FilerClient.java
-
12other/java/client/src/main/java/seaweedfs/client/SeaweedRead.java
-
42other/java/client/src/main/java/seaweedfs/client/SeaweedWrite.java
-
5other/java/client/src/test/java/seaweedfs/client/SeaweedReadTest.java
-
7other/java/hdfs2/src/main/java/seaweed/hdfs/SeaweedInputStream.java
-
2other/java/hdfs2/src/main/java/seaweed/hdfs/SeaweedOutputStream.java
-
2other/java/hdfs3/src/main/java/seaweed/hdfs/SeaweedInputStream.java
@ -0,0 +1,134 @@ |
|||
package seaweedfs.client; |
|||
|
|||
import org.slf4j.Logger; |
|||
import org.slf4j.LoggerFactory; |
|||
|
|||
import java.io.IOException; |
|||
import java.util.ArrayList; |
|||
import java.util.List; |
|||
import java.util.Map; |
|||
|
|||
public class FileChunkManifest { |
|||
|
|||
private static final Logger LOG = LoggerFactory.getLogger(FileChunkManifest.class); |
|||
|
|||
private static final int mergeFactor = 3; |
|||
|
|||
public static boolean hasChunkManifest(List<FilerProto.FileChunk> chunks) { |
|||
for (FilerProto.FileChunk chunk : chunks) { |
|||
if (chunk.getIsChunkManifest()) { |
|||
return true; |
|||
} |
|||
} |
|||
return false; |
|||
} |
|||
|
|||
public static List<FilerProto.FileChunk> resolveChunkManifest( |
|||
final FilerGrpcClient filerGrpcClient, List<FilerProto.FileChunk> chunks) throws IOException { |
|||
|
|||
List<FilerProto.FileChunk> dataChunks = new ArrayList<>(); |
|||
|
|||
for (FilerProto.FileChunk chunk : chunks) { |
|||
if (!chunk.getIsChunkManifest()) { |
|||
dataChunks.add(chunk); |
|||
continue; |
|||
} |
|||
|
|||
// IsChunkManifest |
|||
LOG.debug("fetching chunk manifest:{}", chunk); |
|||
byte[] data = fetchChunk(filerGrpcClient, chunk); |
|||
FilerProto.FileChunkManifest m = FilerProto.FileChunkManifest.newBuilder().mergeFrom(data).build(); |
|||
List<FilerProto.FileChunk> resolvedChunks = new ArrayList<>(); |
|||
for (FilerProto.FileChunk t : m.getChunksList()) { |
|||
// avoid deprecated chunk.getFileId() |
|||
resolvedChunks.add(t.toBuilder().setFileId(FilerClient.toFileId(t.getFid())).build()); |
|||
} |
|||
dataChunks.addAll(resolveChunkManifest(filerGrpcClient, resolvedChunks)); |
|||
} |
|||
|
|||
return dataChunks; |
|||
} |
|||
|
|||
private static byte[] fetchChunk(final FilerGrpcClient filerGrpcClient, FilerProto.FileChunk chunk) throws IOException { |
|||
|
|||
FilerProto.LookupVolumeRequest.Builder lookupRequest = FilerProto.LookupVolumeRequest.newBuilder(); |
|||
String vid = "" + chunk.getFid().getVolumeId(); |
|||
lookupRequest.addVolumeIds(vid); |
|||
FilerProto.LookupVolumeResponse lookupResponse = filerGrpcClient |
|||
.getBlockingStub().lookupVolume(lookupRequest.build()); |
|||
Map<String, FilerProto.Locations> vid2Locations = lookupResponse.getLocationsMapMap(); |
|||
FilerProto.Locations locations = vid2Locations.get(vid); |
|||
|
|||
SeaweedRead.ChunkView chunkView = new SeaweedRead.ChunkView( |
|||
FilerClient.toFileId(chunk.getFid()), // avoid deprecated chunk.getFileId() |
|||
0, |
|||
-1, |
|||
0, |
|||
true, |
|||
chunk.getCipherKey().toByteArray(), |
|||
chunk.getIsCompressed()); |
|||
|
|||
byte[] chunkData = SeaweedRead.chunkCache.getChunk(chunkView.fileId); |
|||
if (chunkData == null) { |
|||
LOG.debug("doFetchFullChunkData:{}", chunkView); |
|||
chunkData = SeaweedRead.doFetchFullChunkData(chunkView, locations); |
|||
} |
|||
LOG.debug("chunk {} size {}", chunkView.fileId, chunkData.length); |
|||
SeaweedRead.chunkCache.setChunk(chunkView.fileId, chunkData); |
|||
|
|||
return chunkData; |
|||
|
|||
} |
|||
|
|||
public static List<FilerProto.FileChunk> maybeManifestize( |
|||
final FilerGrpcClient filerGrpcClient, List<FilerProto.FileChunk> inputChunks) throws IOException { |
|||
// the return variable |
|||
List<FilerProto.FileChunk> chunks = new ArrayList<>(); |
|||
|
|||
List<FilerProto.FileChunk> dataChunks = new ArrayList<>(); |
|||
for (FilerProto.FileChunk chunk : inputChunks) { |
|||
if (!chunk.getIsChunkManifest()) { |
|||
dataChunks.add(chunk); |
|||
} else { |
|||
chunks.add(chunk); |
|||
} |
|||
} |
|||
|
|||
int remaining = dataChunks.size(); |
|||
for (int i = 0; i + mergeFactor < dataChunks.size(); i += mergeFactor) { |
|||
FilerProto.FileChunk chunk = mergeIntoManifest(filerGrpcClient, dataChunks.subList(i, i + mergeFactor)); |
|||
chunks.add(chunk); |
|||
remaining -= mergeFactor; |
|||
} |
|||
|
|||
// remaining |
|||
for (int i = dataChunks.size() - remaining; i < dataChunks.size(); i++) { |
|||
chunks.add(dataChunks.get(i)); |
|||
} |
|||
return chunks; |
|||
} |
|||
|
|||
private static FilerProto.FileChunk mergeIntoManifest(final FilerGrpcClient filerGrpcClient, List<FilerProto.FileChunk> dataChunks) throws IOException { |
|||
// create and serialize the manifest |
|||
FilerProto.FileChunkManifest.Builder m = FilerProto.FileChunkManifest.newBuilder().addAllChunks(dataChunks); |
|||
byte[] data = m.build().toByteArray(); |
|||
|
|||
long minOffset = Long.MAX_VALUE; |
|||
long maxOffset = -1; |
|||
for (FilerProto.FileChunk chunk : dataChunks) { |
|||
minOffset = Math.min(minOffset, chunk.getOffset()); |
|||
maxOffset = Math.max(maxOffset, chunk.getSize() + chunk.getOffset()); |
|||
} |
|||
|
|||
FilerProto.FileChunk.Builder manifestChunk = SeaweedWrite.writeChunk( |
|||
filerGrpcClient.getReplication(), |
|||
filerGrpcClient, |
|||
minOffset, |
|||
data, 0, data.length); |
|||
manifestChunk.setIsChunkManifest(true); |
|||
manifestChunk.setSize(maxOffset - minOffset); |
|||
return manifestChunk.build(); |
|||
|
|||
} |
|||
|
|||
} |
Write
Preview
Loading…
Cancel
Save
Reference in new issue