[ISSUE-911] Decrease numConnectionsPerPeer to achieve better performance (#983)
This commit is contained in:
parent
fb6d1de108
commit
5ecb09d62a
@ -1046,7 +1046,7 @@ object CelebornConf extends Logging {
|
||||
.categories("network")
|
||||
.doc("Number of concurrent connections between two nodes.")
|
||||
.intConf
|
||||
.createWithDefault(8)
|
||||
.createWithDefault(2)
|
||||
|
||||
val NETWORK_IO_BACKLOG: ConfigEntry[Int] =
|
||||
buildConf("celeborn.<module>.io.backLog")
|
||||
|
||||
@ -19,9 +19,9 @@
|
||||
celeborn.rpc.io.mode NIO
|
||||
celeborn.rpc.io.clientThreads 8
|
||||
celeborn.rpc.io.serverThreads 8
|
||||
celeborn.rpc.io.numConnectionsPerPeer 8
|
||||
celeborn.rpc.io.numConnectionsPerPeer 2
|
||||
|
||||
celeborn.push.io.numConnectionsPerPeer 8
|
||||
celeborn.push.io.numConnectionsPerPeer 2
|
||||
celeborn.push.io.threads 8
|
||||
|
||||
celeborn.push.replicate.enabled true
|
||||
|
||||
@ -45,7 +45,7 @@ celeborn:
|
||||
celeborn.worker.monitor.disk.enabled: false
|
||||
rss.rpc.io.serverThreads: 64
|
||||
rss.worker.fetch.chunk.size: 8m
|
||||
rss.rpc.io.numConnectionsPerPeer: 8
|
||||
rss.rpc.io.numConnectionsPerPeer: 2
|
||||
celeborn.worker.flush.buffer.size: 256K
|
||||
celeborn.metrics.enabled: true
|
||||
rss.push.io.threads: 32
|
||||
|
||||
@ -28,7 +28,7 @@ license: |
|
||||
| celeborn.<module>.io.lazyFD | true | Whether to initialize FileDescriptor lazily or not. If true, file descriptors are created only when data is going to be transferred. This can reduce the number of open files. | |
|
||||
| celeborn.<module>.io.maxRetries | 3 | Max number of times we will retry IO exceptions (such as connection timeouts) per request. If set to 0, we will not do any retries. | |
|
||||
| celeborn.<module>.io.mode | NIO | Netty EventLoopGroup backend, available options: NIO, EPOLL. | |
|
||||
| celeborn.<module>.io.numConnectionsPerPeer | 8 | Number of concurrent connections between two nodes. | |
|
||||
| celeborn.<module>.io.numConnectionsPerPeer | 2 | Number of concurrent connections between two nodes. | |
|
||||
| celeborn.<module>.io.preferDirectBufs | true | If true, we will prefer allocating off-heap byte buffers within Netty. | |
|
||||
| celeborn.<module>.io.receiveBuffer | 0b | Receive buffer size (SO_RCVBUF). Note: the optimal size for receive buffer and send buffer should be latency * network_bandwidth. Assuming latency = 1ms, network_bandwidth = 10Gbps buffer size should be ~ 1.25MB. | 0.2.0 |
|
||||
| celeborn.<module>.io.retryWait | 5s | Time that we will wait in order to perform a retry after an IOException. Only relevant if `celeborn.<module>.io.maxRetries` > 0. | 0.2.0 |
|
||||
|
||||
Loading…
Reference in New Issue
Block a user