Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

WIP: feat: send data by chunk in websocket #3988

Open
wants to merge 4 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
7 changes: 4 additions & 3 deletions packages/connection/__test__/browser/index.test.ts
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
import { furySerializer } from '@opensumi/ide-connection';
import { WSWebSocketConnection, furySerializer } from '@opensumi/ide-connection';
import { ReconnectingWebSocketConnection } from '@opensumi/ide-connection/lib/common/connection/drivers/reconnecting-websocket';
import { sleep } from '@opensumi/ide-core-common';
import { Server, WebSocket } from '@opensumi/mock-socket';
Expand All @@ -21,10 +21,11 @@ describe('connection browser', () => {
let data2Received = false;

mockServer.on('connection', (socket) => {
socket.on('message', (msg) => {
const connection = new WSWebSocketConnection(socket as any);
connection.onMessage((msg) => {
const msgObj = furySerializer.deserialize(msg as Uint8Array);
if (msgObj.kind === 'open') {
socket.send(
connection.send(
furySerializer.serialize({
id: msgObj.id,
kind: 'server-ready',
Expand Down
10 changes: 6 additions & 4 deletions packages/connection/__test__/common/frame-decoder.test.ts
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,9 @@ console.timeEnd('createPayload');
// 1m
const pressure = 1024 * 1024;

const purePackets = [p1k, p64k, p128k, p5m, p10m].map((v) => [LengthFieldBasedFrameDecoder.construct(v), v] as const);
const purePackets = [p1k, p64k, p128k, p5m, p10m].map(
(v) => [LengthFieldBasedFrameDecoder.construct(v).dump(), v] as const,
);

const size = purePackets.reduce((acc, v) => acc + v[0].byteLength, 0);

Expand All @@ -48,7 +50,7 @@ purePackets.forEach((v) => {
});

const mixedPackets = [p1m, p5m].map((v) => {
const sumiPacket = LengthFieldBasedFrameDecoder.construct(v);
const sumiPacket = LengthFieldBasedFrameDecoder.construct(v).dump();
const newPacket = createPayload(1024 + sumiPacket.byteLength);
newPacket.set(sumiPacket, 1024);
return [newPacket, v] as const;
Expand All @@ -59,7 +61,7 @@ const packets = [...purePackets, ...mixedPackets];
describe('frame decoder', () => {
it('can create frame', () => {
const content = new Uint8Array([1, 2, 3]);
const packet = LengthFieldBasedFrameDecoder.construct(content);
const packet = LengthFieldBasedFrameDecoder.construct(content).dump();
const reader = BinaryReader({});

reader.reset(packet);
Expand Down Expand Up @@ -116,7 +118,7 @@ describe('frame decoder', () => {

it('can decode a stream it has no valid length info', (done) => {
const v = createPayload(1024);
const sumiPacket = LengthFieldBasedFrameDecoder.construct(v);
const sumiPacket = LengthFieldBasedFrameDecoder.construct(v).dump();

const decoder = new LengthFieldBasedFrameDecoder();
decoder.onData((data) => {
Expand Down
40 changes: 40 additions & 0 deletions packages/connection/src/common/buffers/buffers.ts
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@
*/

export const emptyBuffer = new Uint8Array(0);
export const buffer4Capacity = new Uint8Array(4);

export function copy(
source: Uint8Array,
Expand Down Expand Up @@ -72,6 +73,39 @@ export class Buffers {
return target;
}

slice4(start: number) {
let end = start + 4;
const buffers = this.buffers;

if (end > this.size) {
end = this.size;
}

if (start >= end) {
return emptyBuffer;
}

let startBytes = 0;
let si = 0;
for (; si < buffers.length && startBytes + buffers[si].length <= start; si++) {
startBytes += buffers[si].length;
}

const target = buffer4Capacity;

let ti = 0;
for (let ii = si; ti < end - start && ii < buffers.length; ii++) {
const len = buffers[ii].length;

const _start = ti === 0 ? start - startBytes : 0;
const _end = ti + len >= end - start ? Math.min(_start + (end - start) - ti, len) : len;
copy(buffers[ii], target, ti, _start, _end);
ti += _end - _start;
}

return target;
}

pos(i: number): { buf: number; offset: number } {
if (i < 0 || i >= this.size) {
throw new Error(`out of range, ${i} not in [0, ${this.size})`);
Expand Down Expand Up @@ -268,6 +302,12 @@ export class Cursor {
return buffers;
}

read4() {
const buffers = this.buffers.slice4(this.offset);
this.skip(4);
return buffers;
}

skip(n: number) {
let count = 0;
while (this.chunkIndex < this.buffers.buffers.length) {
Expand Down
53 changes: 31 additions & 22 deletions packages/connection/src/common/connection/drivers/frame-decoder.ts
Original file line number Diff line number Diff line change
@@ -1,21 +1,37 @@
import { BinaryWriter } from '@furyjs/fury/dist/lib/writer';

import { Emitter, readUInt32LE } from '@opensumi/ide-core-common';
import { MaybeNull, readUInt32LE } from '@opensumi/ide-core-common';

import { Buffers } from '../../buffers/buffers';

/**
* You can use `Buffer.from('\r\n\r\n')` to get this indicator.
*/
export const indicator = new Uint8Array([0x0d, 0x0a, 0x0d, 0x0a]);
export const indicator = new Uint8Array([0x0d, 0x0a, 0x0a, 0x0d]);

/**
* The number of bytes in the length field.
*
* How many bytes are used to represent data length.
*
* For example, if the length field is 4 bytes, then the maximum length of the data is 2^32 = 4GB
*/
const lengthFieldLength = 4;

/**
* sticky packet unpacking problems are generally problems at the transport layer.
* we use a length field to represent the length of the data, and then read the data according to the length
*/
export class LengthFieldBasedFrameDecoder {
protected dataEmitter = new Emitter<Uint8Array>();
onData = this.dataEmitter.event;
private _onDataListener: MaybeNull<(data: Uint8Array) => void>;
onData(listener: (data: Uint8Array) => void) {
this._onDataListener = listener;
return {
dispose: () => {
this._onDataListener = null;
},
};
}
Comment on lines +26 to +34
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

监听器管理方式的重大变更

这个变更将之前基于 Emitter 的多监听器方法改为了单一监听器方法。虽然这简化了事件处理机制,但也限制了类只能同时处理一个监听器。

考虑以下几点:

  1. 这种改变可能会影响依赖多个监听器的现有代码。
  2. 单一监听器模式可能会在某些使用场景下造成限制。

建议考虑以下改进:

  1. 如果确实需要多个监听器,可以考虑使用数组来存储多个监听器函数。
  2. 添加清晰的文档注释,说明这个类现在只支持单一监听器,以防止误用。
  3. 考虑添加一个 removeListener 方法,使 API 更加完整和直观。
private _onDataListeners: Array<(data: Uint8Array) => void> = [];

onData(listener: (data: Uint8Array) => void) {
  this._onDataListeners.push(listener);
  return {
    dispose: () => {
      const index = this._onDataListeners.indexOf(listener);
      if (index > -1) {
        this._onDataListeners.splice(index, 1);
      }
    },
  };
}

removeListener(listener: (data: Uint8Array) => void) {
  const index = this._onDataListeners.indexOf(listener);
  if (index > -1) {
    this._onDataListeners.splice(index, 1);
  }
}

这样的实现既保持了简单性,又提供了更大的灵活性。


protected buffers = new Buffers();
protected cursor = this.buffers.cursor();
Expand All @@ -24,15 +40,6 @@ export class LengthFieldBasedFrameDecoder {

protected state = 0;

/**
* The number of bytes in the length field.
*
* How many bytes are used to represent data length.
*
* For example, if the length field is 4 bytes, then the maximum length of the data is 2^32 = 4GB
*/
lengthFieldLength = 4;

reset() {
this.contentLength = -1;
this.state = 0;
Expand All @@ -57,7 +64,9 @@ export class LengthFieldBasedFrameDecoder {

const binary = this.buffers.slice(start, end);

this.dataEmitter.fire(binary);
if (this._onDataListener) {
this._onDataListener(binary);
}

if (this.buffers.byteLength > end) {
this.contentLength = -1;
Expand Down Expand Up @@ -93,13 +102,13 @@ export class LengthFieldBasedFrameDecoder {
}

if (this.contentLength === -1) {
if (this.cursor.offset + this.lengthFieldLength > bufferLength) {
if (this.cursor.offset + lengthFieldLength > bufferLength) {
// Not enough data yet, wait for more data
return false;
}

// read the content length
const buf = this.cursor.read(this.lengthFieldLength);
const buf = this.cursor.read4();
// fury writer use little endian
this.contentLength = readUInt32LE(buf, 0);
}
Expand All @@ -123,8 +132,8 @@ export class LengthFieldBasedFrameDecoder {
case 0:
this.state = 1;
break;
case 2:
this.state = 3;
case 3:
this.state = 4;
break;
default:
this.state = 0;
Expand All @@ -136,8 +145,8 @@ export class LengthFieldBasedFrameDecoder {
case 1:
this.state = 2;
break;
case 3:
this.state = 4;
case 2:
this.state = 3;
iter.return();
break;
default:
Expand All @@ -154,7 +163,7 @@ export class LengthFieldBasedFrameDecoder {
}

dispose() {
this.dataEmitter.dispose();
this._onDataListener = undefined;
this.buffers.dispose();
}

Expand All @@ -165,6 +174,6 @@ export class LengthFieldBasedFrameDecoder {
LengthFieldBasedFrameDecoder.writer.buffer(indicator);
LengthFieldBasedFrameDecoder.writer.uint32(content.byteLength);
LengthFieldBasedFrameDecoder.writer.buffer(content);
return LengthFieldBasedFrameDecoder.writer.dump();
return LengthFieldBasedFrameDecoder.writer;
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -4,17 +4,34 @@ import ReconnectingWebSocket, {
UrlProvider,
} from '@opensumi/reconnecting-websocket';

import { chunkSize } from '../../constants';

import { BaseConnection } from './base';
import { LengthFieldBasedFrameDecoder } from './frame-decoder';

import type { ErrorEvent } from '@opensumi/reconnecting-websocket';

export class ReconnectingWebSocketConnection extends BaseConnection<Uint8Array> {
constructor(private socket: ReconnectingWebSocket) {
protected decoder = new LengthFieldBasedFrameDecoder();

protected constructor(private socket: ReconnectingWebSocket) {
super();

if (socket.binaryType === 'arraybuffer') {
this.socket.addEventListener('message', this.arrayBufferHandler);
} else if (socket.binaryType === 'blob') {
throw new Error('blob is not implemented');
}
}

send(data: Uint8Array): void {
this.socket.send(data);
const handle = LengthFieldBasedFrameDecoder.construct(data).dumpAndOwn();
const packet = handle.get();
for (let i = 0; i < packet.byteLength; i += chunkSize) {
this.socket.send(packet.subarray(i, i + chunkSize));
}

handle.dispose();
}

isOpen(): boolean {
Expand All @@ -29,29 +46,8 @@ export class ReconnectingWebSocketConnection extends BaseConnection<Uint8Array>
},
};
}

onMessage(cb: (data: Uint8Array) => void): IDisposable {
const handler = (e: MessageEvent) => {
let buffer: Promise<ArrayBuffer>;
if (e.data instanceof Blob) {
buffer = e.data.arrayBuffer();
} else if (e.data instanceof ArrayBuffer) {
buffer = Promise.resolve(e.data);
} else if (e.data?.constructor?.name === 'Buffer') {
// Compatibility with nodejs Buffer in test environment
buffer = Promise.resolve(e.data);
} else {
throw new Error('unknown message type, expect Blob or ArrayBuffer, received: ' + typeof e.data);
}
buffer.then((v) => cb(new Uint8Array(v, 0, v.byteLength)));
};

this.socket.addEventListener('message', handler);
return {
dispose: () => {
this.socket.removeEventListener('message', handler);
},
};
return this.decoder.onData(cb);
}
onceClose(cb: (code?: number, reason?: string) => void): IDisposable {
const disposable = this.onClose(wrapper);
Expand Down Expand Up @@ -91,8 +87,13 @@ export class ReconnectingWebSocketConnection extends BaseConnection<Uint8Array>
};
}

private arrayBufferHandler = (e: MessageEvent<ArrayBuffer>) => {
const buffer: ArrayBuffer = e.data;
this.decoder.push(new Uint8Array(buffer, 0, buffer.byteLength));
};

dispose(): void {
// do nothing
this.socket.removeEventListener('message', this.arrayBufferHandler);
}

static forURL(url: UrlProvider, protocols?: string | string[], options?: ReconnectingWebSocketOptions) {
Expand Down
5 changes: 3 additions & 2 deletions packages/connection/src/common/connection/drivers/stream.ts
Original file line number Diff line number Diff line change
Expand Up @@ -21,10 +21,11 @@ export class StreamConnection extends BaseConnection<Uint8Array> {
}

send(data: Uint8Array): void {
const result = LengthFieldBasedFrameDecoder.construct(data);
this.writable.write(result, () => {
const handle = LengthFieldBasedFrameDecoder.construct(data).dumpAndOwn();
this.writable.write(handle.get(), () => {
// TODO: logger error
});
handle.dispose();
}

onMessage(cb: (data: Uint8Array) => void): IDisposable {
Expand Down
24 changes: 17 additions & 7 deletions packages/connection/src/common/connection/drivers/ws-websocket.ts
Original file line number Diff line number Diff line change
@@ -1,24 +1,34 @@
import { IDisposable } from '@opensumi/ide-core-common';

import { chunkSize } from '../../constants';

import { BaseConnection } from './base';
import { LengthFieldBasedFrameDecoder } from './frame-decoder';

import type WebSocket from 'ws';

export class WSWebSocketConnection extends BaseConnection<Uint8Array> {
protected decoder = new LengthFieldBasedFrameDecoder();

constructor(public socket: WebSocket) {
super();
this.socket.on('message', (data: Buffer) => {
this.decoder.push(data);
});
bytemain marked this conversation as resolved.
Show resolved Hide resolved
}

send(data: Uint8Array): void {
this.socket.send(data);
const handle = LengthFieldBasedFrameDecoder.construct(data).dumpAndOwn();
const packet = handle.get();
for (let i = 0; i < packet.byteLength; i += chunkSize) {
this.socket.send(packet.subarray(i, i + chunkSize));
}

handle.dispose();
Comment on lines +21 to +27
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

send 方法的改进很好,但可以考虑进一步优化。

新的 send 方法使用 LengthFieldBasedFrameDecoder 构造数据包并分块发送,这是一个很好的改进,可以更好地处理大型消息。

为了进一步优化性能,您可以考虑以下建议:

  1. 使用 ArrayBufferSharedArrayBuffer 来减少内存复制。
  2. 考虑使用 WebSocket.bufferedAmount 来控制发送速率,避免缓冲区溢出。

示例实现:

send(data: Uint8Array): void {
  const handle = LengthFieldBasedFrameDecoder.construct(data).dumpAndOwn();
  const packet = handle.get();
  
  const sendChunk = (start: number) => {
    while (start < packet.byteLength && this.socket.bufferedAmount < 1024 * 1024) { // 1MB buffer threshold
      const end = Math.min(start + chunkSize, packet.byteLength);
      this.socket.send(packet.subarray(start, end));
      start = end;
    }
    if (start < packet.byteLength) {
      setTimeout(() => sendChunk(start), 0);
    } else {
      handle.dispose();
    }
  };

  sendChunk(0);
}

这个实现使用了递归的方式来控制发送速率,避免一次性将所有数据推入缓冲区。

}

onMessage(cb: (data: Uint8Array) => void): IDisposable {
this.socket.on('message', cb);
return {
dispose: () => {
this.socket.off('message', cb);
},
};
return this.decoder.onData(cb);
}
onceClose(cb: () => void): IDisposable {
this.socket.once('close', cb);
Expand Down
5 changes: 5 additions & 0 deletions packages/connection/src/common/constants.ts
Original file line number Diff line number Diff line change
@@ -1 +1,6 @@
export const METHOD_NOT_REGISTERED = '$$METHOD_NOT_REGISTERED';

/**
* 分片大小, 8MB
*/
export const chunkSize = 8 * 1024 * 1024;
3 changes: 1 addition & 2 deletions packages/connection/src/node/common-channel-handler.ts
Original file line number Diff line number Diff line change
Expand Up @@ -42,8 +42,7 @@ export class CommonChannelHandler extends BaseCommonChannelHandler implements We
...this.options.wsServerOptions,
});
this.wsServer.on('connection', (connection: WebSocket) => {
const wsConnection = new WSWebSocketConnection(connection);
this.receiveConnection(wsConnection);
this.receiveConnection(new WSWebSocketConnection(connection));
});
}

Expand Down
Loading
Loading