WINVNC源码分析（四）——IO之rdr库

来源：互联网发布：l型的橱柜的算法编辑：程序博客网时间：2024/05/20 07:33

rdr是winvnc用来io操作的一个库工程。

IO操作无非两种，写入和读取数据，所以这里每个类都相应地分成了IN和OUT两种操作，先分析IN。

view plain

class InStream { public: virtual ~InStream() {} // check() ensures there is buffer data for at least one item of size // itemSize bytes. Returns the number of items in the buffer (up to a // maximum of nItems). inline int check(int itemSize, int nItems=1) { if (ptr + itemSize * nItems > end) { if (ptr + itemSize > end) return overrun(itemSize, nItems); nItems = (end - ptr) / itemSize; } return nItems; } // readU/SN() methods read unsigned and signed N-bit integers. inline U8 readU8() { check(1); return *ptr++; } inline U16 readU16() { check(2); int b0 = *ptr++; int b1 = *ptr++; return b0 << 8 | b1; } inline U32 readU32() { check(4); int b0 = *ptr++; int b1 = *ptr++; int b2 = *ptr++; int b3 = *ptr++; return b0 << 24 | b1 << 16 | b2 << 8 | b3; } inline S8 readS8() { return (S8) readU8(); } inline S16 readS16() { return (S16)readU16(); } inline S32 readS32() { return (S32)readU32(); } // readString() reads a string - a U32 length followed by the data. // Returns a null-terminated string - the caller should delete[] it // afterwards. char* readString(); // maxStringLength protects against allocating a huge buffer. Set it // higher if you need longer strings. static U32 maxStringLength; inline void skip(int bytes) { while (bytes > 0) { int n = check(1, bytes); ptr += n; bytes -= n; } } // readBytes() reads an exact number of bytes. virtual void readBytes(void* data, int length) { U8* dataPtr = (U8*)data; U8* dataEnd = dataPtr + length; while (dataPtr < dataEnd) { int n = check(1, dataEnd - dataPtr); memcpy(dataPtr, ptr, n); ptr += n; dataPtr += n; } } // readOpaqueN() reads a quantity without byte-swapping. inline U8 readOpaque8() { return readU8(); } inline U16 readOpaque16() { check(2); U16 r; ((U8*)&r)[0] = *ptr++; ((U8*)&r)[1] = *ptr++; return r; } inline U32 readOpaque32() { check(4); U32 r; ((U8*)&r)[0] = *ptr++; ((U8*)&r)[1] = *ptr++; ((U8*)&r)[2] = *ptr++; ((U8*)&r)[3] = *ptr++; return r; } inline U32 readOpaque24A() { check(3); U32 r=0; ((U8*)&r)[0] = *ptr++; ((U8*)&r)[1] = *ptr++; ((U8*)&r)[2] = *ptr++; return r; } inline U32 readOpaque24B() { check(3); U32 r=0; ((U8*)&r)[1] = *ptr++; ((U8*)&r)[2] = *ptr++; ((U8*)&r)[3] = *ptr++; return r; } // pos() returns the position in the stream. virtual int pos() = 0; // getptr(), getend() and setptr() are "dirty" methods which allow you to // manipulate the buffer directly. This is useful for a stream which is a // wrapper around an underlying stream. inline const U8* getptr() const { return ptr; } inline const U8* getend() const { return end; } inline void setptr(const U8* p) { ptr = p; } private: // overrun() is implemented by a derived class to cope with buffer overrun. // It ensures there are at least itemSize bytes of buffer data. Returns // the number of items in the buffer (up to a maximum of nItems). itemSize // is supposed to be "small" (a few bytes). virtual int overrun(int itemSize, int nItems) = 0; protected: InStream() {} const U8* ptr; const U8* end; };

构造函数为protected权限，摆明是给子类提供接口规范，derived class。

两个变量根据名字来分析，ptr指向的应该是当前位置，end则是最后一个字节。

inline int check(int itemSize, int nItems=1)

检查剩余缓存是否够用，代码对三种情况进行了处理，当前缓存不足一个itemSize的时候会运行overrun。overrun在这里是一个纯虚函数，稍后我们可以在子类中它的应用。

readU系列

以readU32为例，这里没有用memcpy进行拷贝，而是将源低地址的8位赋值给目标变量的高8位，既默认大端字节序（网络字节序）。

readS只是将readU的返回值作一个有符号类型的强制转换。

char* InStream::readString()

这里默认当前缓存头32位保存的是将要读取内容的长度，然后动态分配了相应长度（+1保证C STYLE字符串），拷贝后返回头指针，意味着由调用函数者来释放。上限是U32 InStream::maxStringLength = 65535;

inline void skip(int bytes)

用来快进当前指针bytes个字节。

virtual void readBytes(void* data, int length)

读取指定长度length的内容到data。这里用了while循环，虽然之前看到了有overrun函数，所以貌似有不读到就阻塞的嫌疑。

readOpaque系列则

这里就是一个字节一个字节的原始拷贝了。因为一个类型指针在内存中永远指向的是低地址。附一个判断CPU大小端的函数

view plain

bool IsBig_Endian(){unsigned short test = 0x1100;if(*( (unsigned char*) &test ) == 0x11){#define HAVE_BIGENDIANreturn true;}else{#undef HAVE_BIGENDIANreturn false;}}

class FdInStream : public InStream

这个类是IO端口的一个缓存，从IO端口读取数据，并且计算流量。

view plain

int FdInStream::readWithTimeoutOrCallback(void* buf, int len){ struct timeval before, after; if (timing) gettimeofday(&before, 0); int n = checkReadable(fd, timeout);//查看端口是否有数据到达 if (n < 0) throw SystemException("select",errno); if (n == 0) { if (timeout) throw TimedOut(); if (blockCallback) (*blockCallback)(blockCallbackArg);//如果IO没有数据，则调用回调函数blockCallback } while (true) { n = ::read(fd, buf, len); if (n != -1 || errno != EINTR) break;//从IO读到数据就退出循环，出错则阻塞尝试 fprintf(stderr,"read returned EINTR/n"); } if (n < 0) throw SystemException("read",errno); if (n == 0) throw EndOfStream(); if (timing) { gettimeofday(&after, 0);// fprintf(stderr,"%d.%06d/n",(after.tv_sec - before.tv_sec),// (after.tv_usec - before.tv_usec)); int newTimeWaited = ((after.tv_sec - before.tv_sec) * 10000 + (after.tv_usec - before.tv_usec) / 100);//单位100微秒 int newKbits = n * 8 / 1000;//单位1000位 if (newTimeWaited == 0) { fprintf(stderr,"new kbps infinite t %d k %d/n", newTimeWaited, newKbits); } else { fprintf(stderr,"new kbps %d t %d k %d/n", newKbits * 10000 / newTimeWaited, newTimeWaited, newKbits); }//计算本次IO读取的kbps // limit rate to between 10kbit/s and 40Mbit/s if (newTimeWaited > newKbits*1000) newTimeWaited = newKbits*1000;//在10kbit/s以下的计为10kbit/s if (newTimeWaited < newKbits/4) newTimeWaited = newKbits/4;//在40Mbit/s以上的计为40Mbit/s timeWaitedIn100us += newTimeWaited; timedKbits += newKbits;//累计读取时间和数据量 } return n;}

这个是从IO读取长度len数据到buf。

1 用select函数检查端口是否有数据到达。

2 如果没有的话调用构造函数传入的回调函数blockCallback。

3 然后读取数据，虽然::read(fd, buf, len);用了全局符号，但是头文件有定义#define read(s,b,l) recv(s,(char*)b,l,0)。

4 计算流量，先看下获取时间的函数：尝试用两种办法获取当前时间

static void gettimeofday(struct timeval* tv, void*)

view plain

#ifdef _WIN32static void gettimeofday(struct timeval* tv, void*){ LARGE_INTEGER counts, countsPerSec; static double usecPerCount = 0.0; if (QueryPerformanceCounter(&counts)) { if (usecPerCount == 0.0) { QueryPerformanceFrequency(&countsPerSec); usecPerCount = 1000000.0 / countsPerSec.QuadPart; //一个CPU时钟时间单位微秒 } LONGLONG usecs = (LONGLONG)(counts.QuadPart * usecPerCount);//计算系统运行到现在过了多少微秒 tv->tv_usec = (long)(usecs % 1000000); tv->tv_sec = (long)(usecs / 1000000); } else { struct timeb tb; ftime(&tb); tv->tv_sec = tb.time; tv->tv_usec = tb.millitm * 1000;//tv保存的是1970.1.1到现在经过的时间 }}#endif

startTiming、stopTiming和kbitsPerSecond分别用于开始计算、停止计算和返回从开始至今的传输率。

但都作了最小和最大的传输率限制，暂时猜不透用意。

现在我们看看基类中没有实现的虚函数

FdInStream::overrun(int itemSize, int nItems)

view plain

int FdInStream::overrun(int itemSize, int nItems){ if (itemSize > bufSize) throw Exception("FdInStream overrun: max itemSize exceeded"); if (end - ptr != 0) memmove(start, ptr, end - ptr);//把缓冲区的未读数据拷贝到缓冲区的头部 offset += ptr - start; end -= ptr - start; ptr = start; while (end < start + itemSize) { int n = readWithTimeoutOrCallback((U8*)end, start + bufSize - end);//从IO读取数据填充缓冲区剩余部分 end += n; } if (itemSize * nItems > end - ptr) nItems = (end - ptr) / itemSize; return nItems;}

对于比缓冲还大的itemsize只能吼下“OUT”

overrun是在缓冲区剩余未读长度小于itemsize的时候运行的，我们先得理解下几个变量：

ptr 缓冲区中未读数据的首字节地址

end 缓冲区中未读数据的尾字节地址

start 永远都指向了缓冲区的首字节地址

offset 数据传输总量。

首先memmove(start, ptr, end - ptr);把缓冲区的未读数据拷贝到缓冲区的头部，然后调用FdInStream::readWithTimeoutOrCallback从IO读取数据填充缓冲区剩余部分。

对于大量的数据，我们首先把缓冲区中未读数据读取出来，然后调用FdInStream::readWithTimeoutOrCallback直接读取到目标地址，而不再经过缓存区，这样可以提高效率。

也就是说缓冲区虽然方便了管理数据读写管理，但对效率相应地有些影响。

class MemInStream : public InStream

int overrun(int itemSize, int nItems) { throw EndOfStream(); }

可以看出来这个类用于对内存数据的管理。

ZlibInStream : public InStream

本来想到研究zlib库的时候再说，但zlib的接口类非常简洁。它增加的几个变量

view plain

InStream* underlying;//压缩前数据存放的缓冲区，暂时把它叫做A，ZlibInStream是压缩后数据存放的缓冲区，为了区分叫C。z_stream_s* zs;//zlib接口类指针，把它看成是一个压缩加工车间B。int bytesIn;//记录当前A中需要压缩的数据长度

构造函数：

view plain

ZlibInStream::ZlibInStream(int bufSize_) : underlying(0), bufSize(bufSize_ ? bufSize_ : DEFAULT_BUF_SIZE), offset(0), bytesIn(0){ zs = new z_stream; zs->zalloc = Z_NULL; zs->zfree = Z_NULL; zs->opaque = Z_NULL; zs->next_in = Z_NULL; zs->avail_in = 0; if (inflateInit(zs) != Z_OK) { delete zs; throw Exception("ZlibInStream: inflateInit failed"); } ptr = end = start = new U8[bufSize];}

B的初始化。

void ZlibInStream::setUnderlying(InStream* is, int bytesIn_)

view plain

void ZlibInStream::setUnderlying(InStream* is, int bytesIn_){ underlying = is; bytesIn = bytesIn_; ptr = end = start;}

A的初始化。

int ZlibInStream::overrun(int itemSize, int nItems)

view plain

int ZlibInStream::overrun(int itemSize, int nItems){ if (itemSize > bufSize) throw Exception("ZlibInStream overrun: max itemSize exceeded"); if (!underlying) throw Exception("ZlibInStream overrun: no underlying stream"); if (end - ptr != 0) memmove(start, ptr, end - ptr); offset += ptr - start; end -= ptr - start; ptr = start; while (end - ptr < itemSize) { decompress(); } if (itemSize * nItems > end - ptr) nItems = (end - ptr) / itemSize; return nItems;}

对照FdInStream::overrun函数，看出它是调用了核心处理函数decompress来解决无数据可读的情况

void ZlibInStream::decompress()

view plain

void ZlibInStream::decompress(){ zs->next_out = (U8*)end; zs->avail_out = start + bufSize - end; //用C中保存被解压数据的控件指针初始化B的接口变量 underlying->check(1); zs->next_in = (U8*)underlying->getptr(); zs->avail_in = underlying->getend() - underlying->getptr(); if ((int)zs->avail_in > bytesIn) zs->avail_in = bytesIn; int rc = inflate(zs, Z_SYNC_FLUSH); if (rc != Z_OK) { throw Exception("ZlibInStream: inflate failed"); } bytesIn -= zs->next_in - underlying->getptr(); end = zs->next_out; //解压后zs->next_out会发生偏移，偏移量为缓冲接收到的被解压的数据量 underlying->setptr(zs->next_in); //解压后zs->next_in会发生偏移，偏移量为underlying中被解压的数据量}

它是逻辑很简单，压缩前初始化B的几个关键变量，然后直接调用压缩函数inflate，压缩完后，我们要相应地修改A和C的成员指针到相应地偏移量。

void ZlibInStream::reset()

view plain

void ZlibInStream::reset(){ ptr = end = start; if (!underlying) return; while (bytesIn > 0) { decompress(); end = start; // throw away any data } underlying = 0;}

把A中需要压缩的数据全部压缩完并输出到C中，然后初始化成员变量。我们可以通过函数setUnderlying来切换A，但是记住在之前调用RESET。

这个时候看OUT系列就轻松很多了。

class FdOutStream : public OutStream

void FdOutStream::flush()

view plain

void FdOutStream::flush(){ U8* sentUpTo = start; while (sentUpTo < ptr) { int n = write(fd, (const void*) sentUpTo, ptr - sentUpTo); if (n < 0) throw SystemException("write",errno); sentUpTo += n; offset += n; } ptr = start;}

所谓的flush就是把缓冲区的数据写入IO。

FdOutStream::writeBytes(const void* data, int length)

view plain

void FdOutStream::writeBytes(const void* data, int length){ if (length < MIN_BULK_SIZE) { OutStream::writeBytes(data, length); return; } const U8* dataPtr = (const U8*)data; flush(); while (length > 0) { int n = write(fd, dataPtr, length); if (n < 0) throw SystemException("write",errno); length -= n; dataPtr += n; offset += n; }}

发现对于大量数据写入也是先刷新缓冲区，然后绕过缓冲区直接IO写入。

在这里可以清晰地看出offset的用途

它就是用来记录写入IO的数据总量。

int FdOutStream::length()

{

return offset + ptr - start;

}

当然对于外界得到的只能是通过OutStream接口写入的数据总量，因为它会把缓冲区的当前数据量加上去。

MemOutStream

唯一要注意的就是int overrun(int itemSize, int nItems)

在这里如果原来的缓冲不够写，那我们就重新分配一个足够大的缓冲区，把原来缓冲区已写入的数据拷贝过来，然后释放掉旧的缓冲区。

class NullOutStream : public OutStream

这个家伙根本就没有作任何数据的操作，仅仅是计量，猜测是用来计算数据吞吐量的。

class ZlibOutStream : public OutStream

成员变量：

view plain

OutStream* underlying;//压缩后数据存放的缓冲区，暂时把它叫做C，ZlibOutStream 是压缩前数据存放的缓冲区，为了区分叫A。z_stream_s* zs;////zlib接口类指针，把它看成是一个解压加工车间B。

构造函数同样是初始化了B。但这里调用的deflateInit。

void ZlibOutStream::flush()

view plain

void ZlibOutStream::flush(){ zs->next_in = start; zs->avail_in = ptr - start; //用A需要压缩的数据头指针和长度初始化B接口// fprintf(stderr,"zos flush: avail_in %d/n",zs->avail_in); while (zs->avail_in != 0) {//循环保证A中数据能完全压缩完 do { underlying->check(1); zs->next_out = underlying->getptr(); zs->avail_out = underlying->getend() - underlying->getptr();// fprintf(stderr,"zos flush: calling deflate, avail_in %d, avail_out %d/n",// zs->avail_in,zs->avail_out); int rc = deflate(zs, Z_SYNC_FLUSH); if (rc != Z_OK) throw Exception("ZlibOutStream: deflate failed");// fprintf(stderr,"zos flush: after deflate: %d bytes/n",// zs->next_out-underlying->getptr()); underlying->setptr(zs->next_out); } while (zs->avail_out == 0);//第二个循环，检查C是否还有空余的空间，如果没有了，则通过check来刷新C获取足够空间来接收压缩后的数据。//deflate被循环调用，可以理解它是智能的，如果输出空间不够，它会自动记录上次压缩数据的状态，不用调用者操心next_in重置，next_in总是指向已压缩的数据源的后一个字节。 } offset += ptr - start; ptr = start;}

保证了A中所有需要压缩的数据全部压缩并输出。

int ZlibOutStream::overrun(int itemSize, int nItems)

view plain

int ZlibOutStream::overrun(int itemSize, int nItems){// fprintf(stderr,"ZlibOutStream overrun/n"); if (itemSize > bufSize) throw Exception("ZlibOutStream overrun: max itemSize exceeded"); while (end - ptr < itemSize) { zs->next_in = start; zs->avail_in = ptr - start; do { underlying->check(1); zs->next_out = underlying->getptr(); zs->avail_out = underlying->getend() - underlying->getptr();// fprintf(stderr,"zos overrun: calling deflate, avail_in %d, avail_out %d/n",// zs->avail_in,zs->avail_out); int rc = deflate(zs, 0); if (rc != Z_OK) throw Exception("ZlibOutStream: deflate failed");// fprintf(stderr,"zos overrun: after deflate: %d bytes/n",// zs->next_out-underlying->getptr()); underlying->setptr(zs->next_out); } while (zs->avail_out == 0); // output buffer not full if (zs->avail_in == 0) { offset += ptr - start; ptr = start; } else { // but didn't consume all the data? try shifting what's left to the // start of the buffer. fprintf(stderr,"z out buf not full, but in data not consumed/n"); memmove(start, zs->next_in, ptr - zs->next_in); offset += zs->next_in - start; ptr -= zs->next_in - start; } } if (itemSize * nItems > end - ptr) nItems = (end - ptr) / itemSize; return nItems;}

这个函数并没直接调用flush来解决A空间不足的问题，因为只要保证A中有空间满足itemSize就好，而不是flush这种函数完全清空。

void ZlibOutStream::setUnderlying(OutStream* os)

view plain

void ZlibOutStream::setUnderlying(OutStream* os){ underlying = os;}

重置A，记得在它之前调用ZlibOutStream::flush。

0 0