minix中关于如何判定一个字符的类型,如大写、小写、数字……
如果采用传统的方法,如判断一个字母大写的方法:
if(c>='A' && c<'Z') return true;
但是如果判断一个字符是数字或是字母,则采用下面的代码:
if((c<'z' && c>'a') || (c<'Z' && c>'A') || (c>'0' && c<'9')) return true
如果假设更多的局限,效率明显下降
minix的做法是定义一个256元素的unsigned char _ctypes[]数组,由于8位需要8种属性分别描述,如下:
#define _U 0x01 /* this bit is for upper-case letters [A-Z] */ #define _L 0x02 /* this bit is for lower-case letters [a-z] */ #define _N 0x04 /* this bit is for numbers [0-9] */ #define _S 0x08 /* this bit is for white space \t \n \f etc */ #define _P 0x10 /* this bit is for punctuation characters */ #define _C 0x20 /* this bit is for control characters */ #define _X 0x40 /* this bit is for hex digits [a-f] and [A-F]*/#define _PROTOTYPE(function, params) function params
判断字符函数原型:
_PROTOTYPE( int isalnum, (int _c) ); /* alphanumeric [a-z], [A-Z], [0-9] */ _PROTOTYPE( int isalpha, (int _c) ); /* alphabetic */ _PROTOTYPE( int iscntrl, (int _c) ); /* control characters */ _PROTOTYPE( int isdigit, (int _c) ); /* digit [0-9] */ _PROTOTYPE( int isgraph, (int _c) ); /* graphic character */ _PROTOTYPE( int islower, (int _c) ); /* lower-case letter [a-z] */ _PROTOTYPE( int isprint, (int _c) ); /* printable character */ _PROTOTYPE( int ispunct, (int _c) ); /* punctuation mark */ _PROTOTYPE( int isspace, (int _c) ); /* white space sp, \f, \n, \r, \t, \v*/ _PROTOTYPE( int isupper, (int _c) ); /* upper-case letter [A-Z] */ _PROTOTYPE( int isxdigit,(int _c) ); /* hex digit [0-9], [a-f], [A-F] */ _PROTOTYPE( int tolower, (int _c) ); /* convert to lower-case */ _PROTOTYPE( int toupper, (int _c) ); /* convert to upper-case */
以上函数都是通过宏定义:
#define isalnum(c) ((__ctype+1)[c]&(_U|_L|_N)) #define isalpha(c) ((__ctype+1)[c]&(_U|_L)) #define iscntrl(c) ((__ctype+1)[c]&_C) #define isgraph(c) ((__ctype+1)[c]&(_P|_U|_L|_N)) #define ispunct(c) ((__ctype+1)[c]&_P) #define isspace(c) ((__ctype+1)[c]&_S) #define isxdigit(c) ((__ctype+1)[c]&(_N|_X)) #define isdigit(c) ((unsigned) ((c)-'0') < 10) #define islower(c) ((unsigned) ((c)-'a') < 26) #define isupper(c) ((unsigned) ((c)-'A') < 26) #define isprint(c) ((unsigned) ((c)-' ') < 95) #define isascii(c) ((unsigned) (c) < 128)
minix将_ctype[]初始化为:
char __ctype[] = { 0, _C, _C, _C, _C, _C, _C, _C, _C, _C, _C|_S, _C|_S, _C|_S, _C|_S, _C|_S, _C, _C, _C, _C, _C, _C, _C, _C, _C, _C, _C, _C, _C, _C, _C, _C, _C, _C, _S, _P, _P, _P, _P, _P, _P, _P, _P, _P, _P, _P, _P, _P, _P, _P, _N, _N, _N, _N, _N, _N, _N, _N, _N, _N, _P, _P, _P, _P, _P, _P, _P, _U|_X, _U|_X, _U|_X, _U|_X, _U|_X, _U|_X, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _U, _P, _P, _P, _P, _P, _P, _L|_X, _L|_X, _L|_X, _L|_X, _L|_X, _L|_X, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _L, _P, _P, _P, _P, _C, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, };