WebSocket 是一种基于 TCP 的网络协议。它诞生于 2009 年,2011 年被 IETF 定为标准 RFC 6455,并由 RFC 7936 补充规范。WebSocket API 也被 W3C 定为标准。
WebSocket 也是一种全双工通信的协议,既允许客户端向服务器主动发送消息,也允许服务器主动向客户端发送消息。在 WebSocket 中,浏览器和服务器只需要完成一次握手,两者之间就可以建立持久性的连接,进行双向数据传输。
先用带有 Upgrade: websocket 请求头的 HTTP 请求向服务器端发起连接请求,实现握手(HandShake)。客户端 HTTP 请求的 Header 头信息如下:
Connection: Upgrade
Sec-WebSocket-Extensions: permessage-deflate; client_max_window_bits
Sec-WebSocket-Key: IRQYhWINfX5Fh1zdocDl6Q==
Sec-WebSocket-Version: 13
Upgrade: websocket
GET /chat HTTP/1.1
Upgrade: websocket
Connection: Upgrade
Sec-WebSocket-Key: hj0eNqbhE/A0GkBXDRrYYw==
Sec-WebSocket-Version: 13
# key: the Sec-WebSocket-Key value sent by the client
def compute_accept_value(key):
    """Compute the value for the Sec-WebSocket-Accept header.

    The accept value is the base64 encoding of the SHA-1 digest of the
    client's Sec-WebSocket-Key concatenated with the fixed GUID defined by
    RFC 6455.

    :param key: value of the Sec-WebSocket-Key request header (str or bytes)
    :return: the Sec-WebSocket-Accept value as a str
    """
    import base64
    import hashlib

    if isinstance(key, str):
        key = key.encode("utf-8")
    sha1 = hashlib.sha1()
    # The client key has to be hashed before the GUID; without this line
    # every client would receive the same accept value.
    sha1.update(key)
    sha1.update(b"258EAFA5-E914-47DA-95CA-C5AB0DC85B11")  # Magic value
    return base64.b64encode(sha1.digest()).decode("ascii")
握手成功后,由 HTTP 协议升级成 Websocket 协议,进行长连接通信,两端相互传递信息。服务端响应的 HTTP Header 头信息如下:
Connection: upgrade
Sec-Websocket-Accept: TSF8/KitM+yYRbXmjclgl7DwbHk=
Upgrade: websocket
HTTP/1.1 101 Switching Protocols # 必须
Content-Length: 0
Upgrade: websocket # 必须
Sec-Websocket-Accept: ZEs+c+VBk8Aj01+wJGN7Y15796g= # 必须
Server: TornadoServer/4.5.1 # 无所谓
Connection: Upgrade # 必须
Date: Wed, 21 Jun 2017 03:29:14 GMT # 无所谓
  0                   1                   2                   3
  0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
 +-+-+-+-+-------+-+-------------+-------------------------------+
 |F|R|R|R| opcode|M| Payload len |    Extended payload length    |
 |I|S|S|S|  (4)  |A|     (7)     |             (16/64)           |
 |N|V|V|V|       |S|             |   (if payload len==126/127)   |
 | |1|2|3|       |K|             |                               |
 +-+-+-+-+-------+-+-------------+ - - - - - - - - - - - - - - - +
 |     Extended payload length continued, if payload len == 127  |
 + - - - - - - - - - - - - - - - +-------------------------------+
 |                               |Masking-key, if MASK set to 1  |
 +-------------------------------+-------------------------------+
 | Masking-key (continued)       |          Payload Data         |
 +-------------------------------- - - - - - - - - - - - - - - - +
 :                     Payload Data continued ...                :
 + - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - +
 |                     Payload Data continued ...                |
 +---------------------------------------------------------------+
通过上图得知,一帧WebSocket数据=头 + Payload载荷,头的消息最小为2字节,最大为14字节(基本2个字节 + Extended payload length 8字节 + Masking-key 4字节 )。
摘选自: RFC 6455
操作代码,Opcode的值决定了应该如何解析后续的数据载荷(data payload)。如果操作代码是不认识的,那么接收端应该断开连接(fail the connection)。
// Frame classification used by the codec. For the data and control frame
// entries the low byte is the first byte of a frame on the wire
// (FIN bit 0x80 | opcode); the 0xFF00/0xFE00/0x3300 values are codec-internal
// status codes that never appear on the wire.
enum WebSocketFrameType {
    ERROR_FRAME = 0xFF00,            // malformed frame
    INCOMPLETE_FRAME = 0xFE00,       // frame not complete yet
    OPENING_FRAME = 0x3300,          // handshake
    INCOMPLETE_TEXT_FRAME = 0x01,    // text fragment (FIN clear)
    INCOMPLETE_BINARY_FRAME = 0x02,  // binary fragment (FIN clear)
    TEXT_FRAME = 0x81,               // text data (FIN | opcode 0x1)
    BINARY_FRAME = 0x82,             // binary data (FIN | opcode 0x2)
    // Control frames must carry FIN and must not set the RSV bits, so the
    // wire bytes are 0x89/0x8A (0x19/0x1A would clear FIN and set RSV3).
    PING_FRAME = 0x89,               // ping (FIN | opcode 0x9)
    PONG_FRAME = 0x8A                // pong (FIN | opcode 0xA)
};
如果Mask是1,那么在Masking-key中会定义一个掩码键(masking key),并用这个掩码键来对数据载荷进行反掩码。所有客户端发送到服务端的数据帧,Mask都是1。
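假设 Payload length === x,如果:x 为 0~125,则数据长度为 x 字节;x 为 126,则后续 2 个字节表示一个 16 位无符号整数,其值为数据长度;x 为 127,则后续 8 个字节表示一个 64 位无符号整数(最高位为 0),其值为数据长度。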
备注:载荷数据的长度,不包括mask key的长度。
应用数据:任意的应用数据,在扩展数据之后(如果存在扩展数据),占据了数据帧剩余的位置。载荷数据长度 减去 扩展数据长度,就得到应用数据的长度。
// unmask data: every payload byte is XOR-ed with one of the four masking-key
// bytes, selected by the byte's index modulo 4; the result goes to out_buffer.
const uint8_t *c = in_buffer + pos; // start of the bytes to unmask
for (int i = 0; i < payload_length; i++) {
// (unsigned char *)(&mask) views the 32-bit mask as its four bytes in memory order
out_buffer[i] = c[i] ^ ((unsigned char *) (&mask))[i % 4];
/** @file ws.h
 * @brief
 * @author teng.qing
 * @date 2021/5/21
 */
// WebSocket, v1.00 2012-09-13
// Description: WebSocket RFC6455 codec, written in C++.
// Homepage: http://katzarsky.github.com/WebSocket
// Author: [email protected]
#include <stdint.h> /* uint8_t */
#include <stdio.h> /* sscanf */
#include <ctype.h> /* isdigit */
#include <stddef.h> /* int */
#include <string.h> /* memcpy */
// std c++
#include <string>
#include <vector>
using namespace std;
namespace evpp {
namespace ws {
/** @enum WebSocketFrameType
 * @brief WebSocket frame classification.
 *
 * For the data and control frame entries the low byte is the first byte of a
 * frame on the wire (FIN bit 0x80 | opcode). The 0xFF00/0xFE00/0x3300 values
 * are codec-internal status codes that never appear on the wire.
 */
enum WebSocketFrameType {
    ERROR_FRAME = 0xFF00,            // malformed frame
    INCOMPLETE_FRAME = 0xFE00,       // frame not complete yet
    OPENING_FRAME = 0x3300,          // handshake
    INCOMPLETE_TEXT_FRAME = 0x01,    // text fragment (FIN clear)
    INCOMPLETE_BINARY_FRAME = 0x02,  // binary fragment (FIN clear)
    TEXT_FRAME = 0x81,               // text data (FIN | opcode 0x1)
    BINARY_FRAME = 0x82,             // binary data (FIN | opcode 0x2)
    // Control frames must carry FIN and must not set the RSV bits, so the
    // wire bytes are 0x89/0x8A (0x19/0x1A would clear FIN and set RSV3).
    PING_FRAME = 0x89,               // ping (FIN | opcode 0x9)
    PONG_FRAME = 0x8A                // pong (FIN | opcode 0xA)
};
/** @struct HandshakeInfo
 * @brief Fields extracted from the client's opening handshake request.
 *
 * Members are spelled with std:: so the struct does not depend on a
 * using-directive being in effect.
 */
struct HandshakeInfo {
    std::string resource;    // request target from the GET line, e.g. /sub
    std::string host;        // Host
    std::string origin;      // Origin
    std::string protocol;    // Sec-WebSocket-Protocol
    std::string key;         // Sec-WebSocket-Key
    std::string version;     // Sec-WebSocket-Version
    std::string extensions;  // Sec-WebSocket-Extensions
};
/** @class ws
* @brief
class WebSocketHelper {
WebSocketHelper() = default;
WebSocketHelper(const WebSocketHelper &) = delete;
WebSocketHelper &operator=(const WebSocketHelper &) = delete;
* @param input_frame .in. pointer to input frame
* @param input_len .in. length of input frame
/**@fn parseHandshake
*@brief 获取握手信息
*@param [in]input_frame: 缓冲区
*@param [in]input_len: 缓冲区
*@param [out]info: 握手信息
WebSocketFrameType parseHandshake(const char *input_frame, int input_len, HandshakeInfo &info);
/** @fn answerHandshake
* @brief 获取握手响应数据
* @param [in]info: 握手信息
* @return 握手响应帧数据,tcp直接发送即可
string answerHandshake(const HandshakeInfo &info);
/** @fn makeFrame
* @brief encode
* @param [in]msg: 裸数据
* @param [in]msg_len: 裸数据长度
* @param [out]buffer: 输出缓冲区
* @param [int]buffer_len: 输出缓冲区长度
* @return 帧长度
int makeFrame(WebSocketFrameType frame_type, const uint8_t *msg,
int msg_len, uint8_t *buffer, int buffer_len);
/** @fn getFrame
* @brief 解析客户端发来的数据,需要经过掩码处理。服务器发给客户端的不需要
* @param [in]in_buffer: 接收缓冲区
* @param [in]in_length: 接收缓冲区大小
* @param [in]out_buffer: 输出缓冲区
* @param [in]out_size: 输出缓冲区大小
* @param [out]out_length: payload载荷数据长度
* @param [out]use_count: 帧头数据长度+载荷数据长度,即in_buffer已使用长度
* @return 帧类型
WebSocketFrameType getFrame(const uint8_t *in_buffer, int in_length, uint8_t *out_buffer,
int out_size, int &out_length, int &use_count);
string trim(string str);
vector<string> explode(string theString, string theDelimiter, bool theIncludeEmptyStrings = false);
/** @file ws.h
 * @brief
 * @author teng.qing
 * @date 2021/5/21
 */
#include "web_socket_helper.h"
// WebSocketHelper, v1.00 2012-09-13
// Description: WebSocketHelper RFC6455 codec, written in C++.
// Homepage: http://katzarsky.github.com/WebSocketHelper
// Author: [email protected]
#include "base64.h"
#include "evpp/sha1/sha1.h"
using namespace std;
namespace evpp {
namespace ws {
// Parses the client's HTTP upgrade request and stores the recognised fields
// in `info`: the request target from the GET line and the Host, Origin and
// Sec-WebSocket-* header values.
//
// input_frame / input_len: received bytes and their count.
// info: output, filled field by field as headers are recognised.
//
// NOTE(review): this listing is truncated. The closing braces, the return
// statements and the body of the final `key_count` check are not visible, and
// key_count is never modified in the visible part.
// NOTE(review): header names are compared with == (case-sensitive); HTTP
// header names are case-insensitive, so e.g. "sec-websocket-key" would not be
// recognised. Confirm whether this is acceptable.
WebSocketFrameType WebSocketHelper::parseHandshake(const char *input_frame, int input_len, HandshakeInfo &info) {
// 1. copy char*/len into string
// 2. try to parse headers until \r\n occurs
string headers(input_frame, input_len);
// Position of the blank line that terminates the header section.
int header_end = headers.find("\r\n\r\n");
if (header_end == string::npos) { // end-of-headers not found - do not parse
headers.resize(header_end); // trim off any data we don't need after the headers
int key_count = 0;
// One entry per header line (explode is called without theIncludeEmptyStrings).
vector<string> headers_rows = explode(headers, string("\r\n"));
for (int i = 0; i < headers_rows.size(); i++) {
string &header = headers_rows[i];
// Request line: the second space-separated token is the requested resource.
if (header.find("GET") == 0) {
vector<string> get_tokens = explode(header, string(" "));
if (get_tokens.size() >= 2) {
info.resource = get_tokens[1];
} else {
// Header line: split at the first ':' into name and trimmed value.
int pos = header.find(":");
if (pos != string::npos) {
string header_key(header, 0, pos);
string header_value(header, pos + 1);
header_value = trim(header_value);
if (header_key == "Host") info.host = header_value;
else if (header_key == "Origin") info.origin = header_value;
else if (header_key == "Sec-WebSocket-Key") info.key = header_value;
else if (header_key == "Sec-WebSocket-Protocol") info.protocol = header_value;
else if (header_key == "Sec-WebSocket-Version") info.version = header_value;
else if (header_key == "Sec-WebSocket-Extensions") info.extensions = header_value;
if (key_count < 2) {
string WebSocketHelper::trim(string str) {
char *whitespace = " \t\r\n";
string::size_type pos = str.find_last_not_of(whitespace);
if (pos != string::npos) {
str.erase(pos + 1);
pos = str.find_first_not_of(whitespace);
if (pos != string::npos) str.erase(0, pos);
} else {
return string();
return str;
vector<string> WebSocketHelper::explode(
string theString,
string theDelimiter,
bool theIncludeEmptyStrings) {
//UASSERT( theDelimiter.size(), >, 0 );
vector<string> theStringVector;
int start = 0, end = 0, length = 0;
while (end != string::npos) {
end = theString.find(theDelimiter, start);
// If at end, use length=maxLength. Else use length=end-start.
length = (end == string::npos) ? string::npos : end - start;
if (theIncludeEmptyStrings
|| ((length > 0) /* At end, end == length == string::npos */
&& (start < theString.size())))
theStringVector.push_back(theString.substr(start, length));
// If at end, use start=maxSize. Else use start=end+delimiter.
start = ((end > (string::npos - theDelimiter.size()))
? string::npos : end + theDelimiter.size());
return theStringVector;
string WebSocketHelper::answerHandshake(const HandshakeInfo &info) {
unsigned char digest[20]; // 160 bit sha1 digest
string answer;
answer += "HTTP/1.1 101 Switching Protocols\r\n";
answer += "Upgrade: WebSocket\r\n";
answer += "Connection: Upgrade\r\n";
if (!info.key.empty()) {
string accept_key;
accept_key += info.key;
accept_key += "258EAFA5-E914-47DA-95CA-C5AB0DC85B11"; //RFC6544_MAGIC_KEY
//printf("INTERMEDIATE_KEY:(%s)\n", accept_key.data());
SHA1 sha;
sha.Input(accept_key.data(), accept_key.size());
sha.Result((unsigned *) digest);
//printf("DIGEST:"); for(int i=0; i<20; i++) printf("%02x ",digest[i]); printf("\n");
//little endian to big endian
for (int i = 0; i < 20; i += 4) {
unsigned char c;
c = digest[i];
digest[i] = digest[i + 3];
digest[i + 3] = c;
c = digest[i + 1];
digest[i + 1] = digest[i + 2];
digest[i + 2] = c;
//printf("DIGEST:"); for(int i=0; i<20; i++) printf("%02x ",digest[i]); printf("\n");
accept_key = base64_encode2((const unsigned char *) digest, 20); //160bit = 20 bytes/chars
answer += "Sec-WebSocket-Accept: " + (accept_key) + "\r\n";
if (info.protocol.length() > 0) {
answer += "Sec-WebSocket-Protocol: " + (info.protocol) + "\r\n";
answer += "\r\n";
return answer;
/** @fn makeFrame
 * @brief Encode a payload into a single unmasked frame.
 *
 * Layout written to buffer: one byte taken from frame_type, the payload
 * length (7 bits, or 126 + 16 bits, or 127 + 64 bits, big-endian), then the
 * payload itself.
 *
 * @param [in]frame_type: frame type; its low byte becomes the first frame byte
 * @param [in]msg: raw payload (may be null only when msg_len is 0)
 * @param [in]msg_len: raw payload length in bytes
 * @param [out]buffer: output buffer
 * @param [in]buffer_len: capacity of buffer in bytes
 * @return total frame length, or 0 when the arguments are invalid or the
 *         frame does not fit into buffer_len bytes (a valid frame is never
 *         shorter than 2 bytes, so 0 is unambiguous)
 */
int WebSocketHelper::makeFrame(WebSocketFrameType frame_type, const uint8_t *msg,
                               int msg_len, uint8_t *buffer, int buffer_len) {
    if (buffer == nullptr || msg_len < 0 || (msg == nullptr && msg_len > 0)) {
        return 0;
    }

    const int size = msg_len;

    // Header size depends on which length encoding is needed.
    int header_len = 2;
    if (size > 65535) {
        header_len = 10;
    } else if (size > 125) {
        header_len = 4;
    }

    // buffer_len used to be ignored, which allowed writes past the buffer.
    if (buffer_len < header_len || size > buffer_len - header_len) {
        return 0;
    }

    int pos = 0;
    buffer[pos++] = (unsigned char) frame_type; // FIN/opcode byte

    if (size <= 125) {
        buffer[pos++] = size;
    } else if (size <= 65535) {
        buffer[pos++] = 126; // 16 bit length follows
        buffer[pos++] = (size >> 8) & 0xFF; // leftmost first
        buffer[pos++] = size & 0xFF;
    } else { // > 2^16-1 (65535)
        buffer[pos++] = 127; // 64 bit length follows
        // msg_len is an int, so the upper 4 bytes of the 64-bit length are zero
        for (int i = 3; i >= 0; i--) {
            buffer[pos++] = 0;
        }
        // the actual length goes into the lower 4 bytes, most significant first
        for (int i = 3; i >= 0; i--) {
            buffer[pos++] = ((size >> 8 * i) & 0xFF);
        }
    }

    if (size > 0) {
        memcpy((void *) (buffer + pos), msg, size);
    }
    return (size + pos);
}
/** @fn getFrame
 * @brief Decode one frame from in_buffer and write its payload to out_buffer.
 *
 * Masked payloads (client to server) are unmasked while being copied;
 * unmasked payloads are copied verbatim.
 *
 * @param [in]in_buffer: receive buffer
 * @param [in]in_length: number of bytes available in in_buffer
 * @param [out]out_buffer: receives the payload
 * @param [in]out_size: capacity of out_buffer
 * @param [out]out_length: payload length; set once the whole frame is available
 * @param [out]use_count: header length + payload length, i.e. the number of
 *                        bytes of in_buffer consumed; set together with out_length
 * @return INCOMPLETE_FRAME when more bytes are needed (outputs untouched);
 *         ERROR_FRAME when the declared length does not fit an int, the
 *         payload does not fit out_buffer, or the opcode is not handled;
 *         otherwise the frame type derived from the opcode and the FIN bit
 */
WebSocketFrameType WebSocketHelper::getFrame(const uint8_t *in_buffer, int in_length, uint8_t *out_buffer,
                                             int out_size, int &out_length, int &use_count) {
    /* ws frame: RFC6455
      0                   1                   2                   3
      0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
     +-+-+-+-+-------+-+-------------+-------------------------------+
     |F|R|R|R| opcode|M| Payload len |    Extended payload length    |
     |I|S|S|S|  (4)  |A|     (7)     |             (16/64)           |
     |N|V|V|V|       |S|             |   (if payload len==126/127)   |
     | |1|2|3|       |K|             |                               |
     +-+-+-+-+-------+-+-------------+ - - - - - - - - - - - - - - - +
     |     Extended payload length continued, if payload len == 127  |
     + - - - - - - - - - - - - - - - +-------------------------------+
     |                               |Masking-key, if MASK set to 1  |
     +-------------------------------+-------------------------------+
     | Masking-key (continued)       |          Payload Data         |
     +-------------------------------- - - - - - - - - - - - - - - - +
     :                     Payload Data continued ...                :
     + - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - +
     |                     Payload Data continued ...                |
     +---------------------------------------------------------------+
     * see:
     * RFC6455: https://datatracker.ietf.org/doc/html/rfc6455
     * frame format and masking: https://www.cnblogs.com/laohaozi/p/12537571.html
     */

    // The two fixed header bytes are the minimum needed to know the layout.
    if (in_buffer == nullptr || in_length < 2) return INCOMPLETE_FRAME;

    const unsigned char msg_opcode = in_buffer[0] & 0x0F;
    const unsigned char msg_fin = (in_buffer[0] >> 7) & 0x01; // final frame
    const unsigned char msg_masked = (in_buffer[1] >> 7) & 0x01;
    const int length_field = in_buffer[1] & 0x7F;

    // Size of the extended length field selected by the 7-bit length.
    int length_bytes = 0;
    if (length_field == 126) {
        length_bytes = 2; // 16-bit length follows
    } else if (length_field == 127) {
        length_bytes = 8; // 64-bit length follows
    }

    // Make sure the whole header is present before reading any of it.
    const int header_len = 2 + length_bytes + (msg_masked ? 4 : 0);
    if (in_length < header_len) return INCOMPLETE_FRAME;

    // Payload length, big-endian over all extended length bytes.
    uint64_t declared_length = (uint64_t) length_field;
    if (length_bytes > 0) {
        declared_length = 0;
        for (int i = 0; i < length_bytes; i++) {
            declared_length = (declared_length << 8) | in_buffer[2 + i];
        }
    }

    // All lengths in this interface are ints; larger frames cannot be handled.
    if (declared_length > (uint64_t) (0x7FFFFFFF - header_len)) return ERROR_FRAME;

    const int payload_length = (int) declared_length;
    const int frame_length = header_len + payload_length;
    if (in_length < frame_length) {
        printf("%s\n", "return INCOMPLETE_FRAME");
        return INCOMPLETE_FRAME;
    }

    use_count = frame_length;
    out_length = payload_length;

    // Check the destination before writing a single byte to it.
    if (payload_length > out_size || (out_buffer == nullptr && payload_length > 0)) {
        return ERROR_FRAME;
    }

    const uint8_t *payload = in_buffer + header_len;
    if (msg_masked) {
        // The masking key is the last four header bytes; reading it bytewise
        // avoids an unaligned 32-bit load through a cast pointer.
        const uint8_t *mask = payload - 4;
        for (int i = 0; i < payload_length; i++) {
            out_buffer[i] = payload[i] ^ mask[i % 4];
        }
    } else if (payload_length > 0) {
        memcpy((void *) out_buffer, payload, payload_length);
    }

    if (msg_opcode == 0x0) return (msg_fin) ? TEXT_FRAME : INCOMPLETE_TEXT_FRAME; // continuation frame
    if (msg_opcode == 0x1) return (msg_fin) ? TEXT_FRAME : INCOMPLETE_TEXT_FRAME;
    if (msg_opcode == 0x2) return (msg_fin) ? BINARY_FRAME : INCOMPLETE_BINARY_FRAME;
    if (msg_opcode == 0x9) return PING_FRAME; // 9 ping
    if (msg_opcode == 0xA) return PONG_FRAME; // 10 pong

    // Any other opcode has no matching frame type.
    return ERROR_FRAME;
}