Skip to content

Commit

Permalink
[CELEBORN-1612] Add a basic reader writer class to Tez
Browse files Browse the repository at this point in the history
### What changes were proposed in this pull request?
1. Add a basic reader writer class to Tez
2. Copy sort pusher from MR to Tez project and add unsort implementation

### Why are the changes needed?
Add basic utilities to support Tez client.

### Does this PR introduce _any_ user-facing change?
NO.

### How was this patch tested?
Cluster tests.

Closes #2969 from GH-Gloway/1610.

Authored-by: hongguangwei <[email protected]>
Signed-off-by: mingji <[email protected]>
  • Loading branch information
GH-Gloway authored and FMX committed Dec 3, 2024
1 parent c893287 commit 3dd810c
Show file tree
Hide file tree
Showing 3 changed files with 569 additions and 0 deletions.
Original file line number Diff line number Diff line change
@@ -0,0 +1,94 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.celeborn.client;

import java.io.IOException;

import org.slf4j.LoggerFactory;

import org.apache.celeborn.client.read.CelebornInputStream;
import org.apache.celeborn.client.read.MetricsCallback;
import org.apache.celeborn.common.exception.CelebornIOException;
import org.apache.celeborn.common.unsafe.Platform;

public class CelebornTezReader {
private static final org.slf4j.Logger logger = LoggerFactory.getLogger(CelebornTezReader.class);

private int shuffleId;
private int partitionId;
private int attemptNumber;
private ShuffleClient shuffleClient;
private long inputShuffleSize;
private CelebornInputStream celebornInputStream;

public CelebornTezReader(
ShuffleClient shuffleClient, int shuffleId, int partitionId, int attemptNumber) {
this.shuffleClient = shuffleClient;
this.partitionId = partitionId;
this.attemptNumber = attemptNumber;
this.shuffleId = shuffleId;
}

public void init() throws IOException {
MetricsCallback metricsCallback =
new MetricsCallback() {
@Override
public void incBytesRead(long bytesRead) {}

@Override
public void incReadTime(long time) {}
};
celebornInputStream =
shuffleClient.readPartition(
shuffleId, partitionId, attemptNumber, 0, Integer.MAX_VALUE, metricsCallback);
}

public byte[] getShuffleBlock() throws IOException {
// get len
byte[] header = new byte[4];
int count = celebornInputStream.read(header);
if (count == -1) {
return null;
}
while (count != header.length) {
count += celebornInputStream.read(header, count, 4 - count);
}

// get data
int blockLen = Platform.getInt(header, Platform.BYTE_ARRAY_OFFSET);
inputShuffleSize += blockLen;
byte[] shuffleData = new byte[blockLen];
count = celebornInputStream.read(shuffleData);
while (count != shuffleData.length) {
count += celebornInputStream.read(shuffleData, count, blockLen - count);
if (count == -1) {
// read shuffle is done.
throw new CelebornIOException("Read mr shuffle failed.");
}
}
return shuffleData;
}

public void close() throws IOException {
celebornInputStream.close();
}

public int getPartitionId() {
return partitionId;
}
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,128 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.celeborn.client;

import java.io.IOException;
import java.util.concurrent.atomic.LongAdder;

import org.apache.tez.runtime.library.api.IOInterruptedException;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import org.apache.celeborn.client.write.DataPusher;
import org.apache.celeborn.common.CelebornConf;
import org.apache.celeborn.common.identity.UserIdentifier;

public class CelebornTezWriter {
private final Logger logger = LoggerFactory.getLogger(CelebornTezWriter.class);

private final ShuffleClient shuffleClient;
private DataPusher dataPusher;
private final int shuffleId;
private final int mapId;
private final int attemptNumber;
private final int numMappers;
private final int numPartitions;

public CelebornTezWriter(
int shuffleId,
int mapId,
int attemptNumber,
long taskAttemptId,
int numMappers,
int numPartitions,
CelebornConf conf,
String appUniqueId,
String lifecycleManagerHost,
int lifecycleManagerPort,
UserIdentifier userIdentifier) {
shuffleClient =
ShuffleClient.get(
appUniqueId, lifecycleManagerHost, lifecycleManagerPort, conf, userIdentifier, null);
// TEZ_SHUFFLE_ID
this.shuffleId = shuffleId;
this.mapId = mapId;
this.attemptNumber = attemptNumber;
this.numMappers = numMappers;
this.numPartitions = numPartitions;

LongAdder[] mapStatusLengths = new LongAdder[numPartitions];
for (int i = 0; i < numPartitions; i++) {
mapStatusLengths[i] = new LongAdder();
}
try {
dataPusher =
new DataPusher(
shuffleId,
mapId,
attemptNumber,
taskAttemptId,
numMappers,
numPartitions,
conf,
shuffleClient,
null,
integer -> {},
mapStatusLengths);
} catch (InterruptedException e) {
throw new RuntimeException(e);
}
}

public void pushData(int partitionId, byte[] dataBuf, int size) throws IOException {
try {
dataPusher.addTask(partitionId, dataBuf, size);
} catch (InterruptedException e) {
throw new IOInterruptedException(e);
}
}

public void mergeData(int partitionId, byte[] dataBuf, int size) throws IOException {
int bytesWritten =
shuffleClient.mergeData(
shuffleId,
mapId,
attemptNumber,
partitionId,
dataBuf,
0,
size,
numMappers,
numPartitions);
}

public int getNumPartitions() {
return numPartitions;
}

public void close() throws IOException {
logger.info(
"Call mapper end shuffleId:{} mapId:{} attemptId:{} numMappers:{}",
0,
mapId,
attemptNumber,
numMappers);
try {
dataPusher.waitOnTermination();
shuffleClient.pushMergedData(shuffleId, mapId, attemptNumber);
shuffleClient.mapperEnd(shuffleId, mapId, attemptNumber, numMappers);
} catch (InterruptedException e) {
throw new IOInterruptedException(e);
}
}
}
Loading

0 comments on commit 3dd810c

Please sign in to comment.