爬虫Larbin解析(二)——sequencer()

分析的函数: void sequencer() 

//位置:larbin-2.6.3/src/fetch/sequencer.cc
void sequencer()
{
    bool testPriority = true;
    if (space == 0)                // uint space = 0
    {
        space = global::inter->putAll();
    }
    int still = space;
    if (still > maxPerCall)        // #define maxPerCall 100
        still = maxPerCall;
    while (still)
    {
        if (canGetUrl(&testPriority))
        {
            --space;
            --still;
        }
        else
        {
            still = 0;
        }
    }
}

所在的文件

larbin-2.6.3/src/fetch/sequencer.h、larbin-2.6.3/src/fetch/sequencer.cc

爬虫Larbin解析(二)——sequencer()
// Larbin

// Sebastien Ailleret

// 15-11-99 -> 15-11-99



#ifndef SEQUENCER_H

#define SEQUENCER_H



/** only for debugging, handle with care */

extern uint space;



/** Call the sequencer */

void sequencer ();



#endif
View Code
爬虫Larbin解析(二)——sequencer()
// Larbin

// Sebastien Ailleret

// 15-11-99 -> 04-01-02



#include <iostream.h>



#include "options.h"



#include "global.h"

#include "types.h"

#include "utils/url.h"

#include "utils/debug.h"

#include "fetch/site.h"



static bool canGetUrl (bool *testPriority);

uint space = 0;



#define maxPerCall 100



/** start the sequencer*/

//按优先度将URL放到代爬站点

// Move as many urls as the global budget ("space") allows — at most
// maxPerCall per invocation — from the central FIFOs into the per-site
// queues (via canGetUrl). Stops early when no queue can supply a url.
void sequencer() 

{

    // Priority queues are tried first; canGetUrl() clears this flag once
    // they are empty so later iterations skip straight to the disk FIFOs.
    bool testPriority = true;

    if (space == 0) 

    {

        // Budget exhausted: ask the global Interval for all remaining slots.
        space = global::inter->putAll();

    }

    int still = space;

    if (still > maxPerCall)  //#define maxPerCall 100

        still = maxPerCall;

    while (still) 

    {

        if (canGetUrl(&testPriority)) 

        {

            space--; 

            still--; 

        } 

        else 

        { 

            // nothing left in any queue: stop for this call
            still = 0; 

        } 

    }

}



/* Get the next url

 * here is defined how priorities are handled

 按优先级从各个URL队列

 (比如URLsDisk,URLsDiskWait或URLsPriority,URLsPriorityWait)

 获取url保存到某个NameSite(通过url的hash值)

 */

/* Fetch the next url and dispatch it to its NamedSite
 * (selected by the hash of its host name).
 * Order of precedence:
 *   1. URLsPriorityWait (while readPriorityWait credits remain)
 *   2. URLsPriority     (only while *testPriority is still true)
 *   3. URLsDiskWait     (while readWait credits remain)
 *   4. URLsDisk
 * Returns false when no queue can supply a url.
 */
static bool canGetUrl (bool *testPriority) 

{

    url *u;

    if (global::readPriorityWait)  // credit counter, refilled periodically by cron() in main.cc

    {

        global::readPriorityWait--;

        u = global::URLsPriorityWait->get();

        global::namedSiteList[u->hostHashCode()].putPriorityUrlWait(u);

        return true;

    } 

    else if (*testPriority && (u=global::URLsPriority->tryGet()) != NULL) 

    {

        // We've got one url (priority)

        global::namedSiteList[u->hostHashCode()].putPriorityUrl(u);

        return true;

    } 

    else 

    {

        // priority queue empty: remember it so the caller's loop
        // does not retry it on every iteration
        *testPriority = false;

        // Try to get an ordinary url

        if (global::readWait) 

        {

          global::readWait--;

          u = global::URLsDiskWait->get();

          global::namedSiteList[u->hostHashCode()].putUrlWait(u);

          return true;

        } 

        else 

        {

            u = global::URLsDisk->tryGet();

            if (u != NULL) 

            {

                global::namedSiteList[u->hostHashCode()].putUrl(u);

                return true;

            }

            else 

            {

                return false;

            }

        }

    }

}
View Code

 

一、 对于space = global::inter->putAll();

1. interf在global.cc(位置:/larbin-2.6.3/src/global.cc)中的定义为

inter = new Interval(ramUrls);   //#define ramUrls 100000  (位置:larbin-2.6.3/src/types.h)

批注:区别 inter = new Interval(ramUrls);  和 inter = new Interval[ramUrls];  前一个()内是参数,要传入构造函数的;后一个[]内是开辟数组的个数。

2. 类 Interval定义(位置:/larbin-2.6.3/src/fetch/site.h)

爬虫Larbin解析(二)——sequencer()
/** This class is intended to make sure the sum of the

 * sizes of the fifo included in the different sites

 * are not too big

 */

/** Budget counter bounding the total number of urls held in the
 * fifos of the different sites, so that their combined size
 * cannot grow unchecked.
 */
class Interval 
{
    public:
        /** Create a budget of @a sizes urls, none consumed yet. */
        Interval (uint sizes) : size(sizes), pos(0) {}

        ~Interval () {}

        /** Grant every remaining slot at once.
         * Answers 0 when the budget is already exhausted. */
        inline uint putAll () 
        {
            uint granted = size - pos;
            pos = size;
            return granted;
        }

        /** Warn an url has been retrieved: one slot becomes free again. */
        inline void getOne () { pos--; }

        /** only for debugging, handle with care */
        inline uint getPos () { return pos; }

    private:
        /** Total size of the interval (maximum budget). */
        uint size;

        /** How much of the interval is currently in use. */
        uint pos;
};
View Code

批注:类内的函数定义为inline。对内联函数的几点说明:

  • 内联函数避免函数调用的开销。将函数指定为内联函数,(通常)就是将它在程序的每个调用点上“内联地”展开,消除调用函数进行的额外开销(调用前先保存寄存器,并在返回时回复)。内联说明(在函数返回值前加inline)对编译器来说只是一个建议,编译器可以选择忽略。一般内敛函数适用于优化小的、只有几行、经常被调用的函数。大多数编译器不支持递归函数的内敛。
  • 把内联函数放在头文件。以便编译器能够在调用点展开同一个函数(保证编译器可见、所有的定义相同)。
  • 编译器隐式地将在类内定义的成员函数当作为内联函数.

 

二、 对于canGetUrl(&testPriority)

函数定义(位置larbin-2.6.3/src/fetch/sequencer.cc)

/* Get the next url

 * here is defined how priorities are handled

 按优先级从各个URL队列

 (比如URLsDisk,URLsDiskWait或URLsPriority,URLsPriorityWait)

 获取url保存到某个NameSite(通过url的hash值)



at "global.cc"

// FIFOs

URLsDisk         = new PersistentFifo(reload, fifoFile);

URLsDiskWait     = new PersistentFifo(reload, fifoFileWait);

URLsPriority     = new SyncFifo<url>;

URLsPriorityWait = new SyncFifo<url>;



 */

/* Fetch the next url and hand it to the NamedSite chosen by the
 * hash of its host. Wait-queues are drained first while their
 * credit counters (readPriorityWait / readWait) are non-zero;
 * returns false only when every queue is empty.
 */
static bool canGetUrl (bool *testPriority) 

{

    url *u;

    if (global::readPriorityWait != 0)  // declared in global.cc as: uint global::readPriorityWait = 0;

    {

        global::readPriorityWait--;

        u = global::URLsPriorityWait->get();

        global::namedSiteList[u->hostHashCode()].putPriorityUrlWait(u);

        return true;

    } 

    else if (*testPriority && (u=global::URLsPriority->tryGet()) != NULL) 

    {

        // We've got one url (priority)

        global::namedSiteList[u->hostHashCode()].putPriorityUrl(u);

        return true;

    } 

    else 

    {

        // priority queue exhausted: skip it on subsequent iterations
        *testPriority = false;

        // Try to get an ordinary url

        if (global::readWait) 

        {

          global::readWait--;

          u = global::URLsDiskWait->get();

          global::namedSiteList[u->hostHashCode()].putUrlWait(u);

          return true;

        } 

        else 

        {

            u = global::URLsDisk->tryGet();

            if (u != NULL) 

            {

                global::namedSiteList[u->hostHashCode()].putUrl(u);

                return true;

            }

            else 

            {

                return false;

            }

        }

    }

}

1. 为什么disk和priority的队列都是成对出现的?因为可以认为每个site在namedSiteList当中都有一个小的队列来保存它的url,这个队列中url的个数是有限制的,当超过这个限制的时候就不能再把该site下的url放入,但也不能丢弃,而是放入wait队列。Larbin会控制一段时间在disk队列中取url,一段时间在diskWait当中取url。disk和priority的区别只是优先级的区别。namedSiteList的作用是实现了DNS缓存。

          爬虫Larbin解析(二)——sequencer()

2. global::readPriorityWait 的值由main.cc的cron()函数中变化得知

// see if we should read again urls in fifowait

if ((global::now % 300) == 0) {

    global::readPriorityWait = global::URLsPriorityWait->getLength();

    global::readWait = global::URLsDiskWait->getLength();

}

if ((global::now % 300) == 150) {

    global::readPriorityWait = 0;

    global::readWait = 0;

}

这里global::now%300是判断这次是对wait队列里的url进行处理,还是对非wait队列里的url进行处理;%300等于0和150的概率都是1/300,所以大约每300次切换一次。readPriorityWait是URLsPriorityWait的长度(也就是其中url的数量);readWait是URLsDiskWait中url的个数。

3. 在canGetUrl中,在对于每个站点,将相应的url放进去。putPriorityUrlWait, putPriorityUrl, putUrlWait, putUrl在site.h的定义如下

/** Put an url in the fifo

 * If there are too much, put it back in UrlsInternal

 * Never fill totally the fifo => call at least with 1 */

void putGenericUrl(url *u, int limit, bool prio);

inline void putUrl(url *u) {

    putGenericUrl(u, 15, false);

}

inline void putUrlWait(url *u) {

    putGenericUrl(u, 10, false);

}

inline void putPriorityUrl(url *u) {

    putGenericUrl(u, 5, true);

}

inline void putPriorityUrlWait(url *u) {

    putGenericUrl(u, 1, true);

}

 可以发现,每次都是调用函数putGenericUrl,其定义如下

/* Put an url in the fifo if their are not too many */

void NamedSite::putGenericUrl(url *u, int limit, bool prio)
{
    if (nburls > maxUrlsBySite - limit)
    {
        // Already enough Urls in memory for this Site
        // first check if it can already be forgotten
        if (!strcmp(name, u->getHost()))
        {
            if (dnsState == errorDns)
            {
                nburls++;
                forgetUrl(u, noDNS);
                return;
            }
            if (dnsState == noConnDns)
            {
                nburls++;
                forgetUrl(u, noConnection);
                return;
            }
            if (u->getPort() == port && dnsState == doneDns && !testRobots(u->getFile()))
            {
                nburls++;
                forgetUrl(u, forbiddenRobots);
                return;
            }
        }
        // else put it back in URLsDisk
        refUrl();
        global::inter->getOne();
        if (prio)
        {
            global::URLsPriorityWait->put(u);
        }
        else
        {
            global::URLsDiskWait->put(u);
        }
    }

如果已经有足够多的url在内存里,执行这里if中的代码。strcmp(name, u->getHost())是判断这个主机是不是已经进行过dns方面的判断,也就是说对于一个站点,只做一次dns解析的判断,以后就按这个结果进行处理;dnsState有noDns、noConnDns,还有robots.txt不允许的情况。如果都不能直接丢弃,就把它放回wait队列(URLsPriorityWait或URLsDiskWait)中。

else {

    nburls++;

    if (dnsState == waitDns || strcmp(name, u->getHost()) || port

           != u->getPort() || global::now > dnsTimeout) {

       // dns not done or other site

       putInFifo(u);

       addNamedUrl();

       // Put Site in fifo if not yet in

       if (!isInFifo) {

           isInFifo = true;

           global::dnsSites->put(this);

       }

    } else

       switch (dnsState) {

       case doneDns:

           transfer(u);

           break;

       case errorDns:

           forgetUrl(u, noDNS);

           break;

       default: // noConnDns

           forgetUrl(u, noConnection);

       }

}

 如果需要判断dns能不能解析,就将它放到dnsSites里,这个会在fetchDns中判断。或是如果还能放到内存里,并且又是doneDns,表示可以解析,就调用transfer

/** Hand the url over to the IPSite fifo of the resolved address,
 * unless robots.txt forbids fetching this file. */
void NamedSite::transfer(url *u) {

    if (testRobots(u->getFile())) {

       if (global::proxyAddr == NULL) {

           // no proxy: cache the resolved ip inside the url itself
           memcpy(&u->addr, &addr, sizeof(struct in_addr));

       }

       global::IPSiteList[ipHash].putUrl(u);

    } else {

       forgetUrl(u, forbiddenRobots);

    }

}

这里是将url放入到IPSiteList的相应ipHash中。

 

附类的定义

类url定义(larbin-2.6.3/src/utils/url.h  larbin-2.6.3/src/utils/url.cc

爬虫Larbin解析(二)——sequencer()
// Larbin

// Sebastien Ailleret

// 15-11-99 -> 14-03-02



/* This class describes an URL */



#ifndef URL_H

#define URL_H



#include <netinet/in.h>

#include <sys/types.h>

#include <sys/socket.h>

#include <stdlib.h>



#include "types.h"



bool fileNormalize (char *file);



class url {

 private:

  char *host;

  char *file;

  uint16_t port; // the order of variables is important for physical size

  int8_t depth;

  /* parse the url */

  void parse (char *s);

  /** parse a file with base */

  void parseWithBase (char *u, url *base);

  /* normalize file name */

  bool normalize (char *file);

  /* Does this url starts with a protocol name */

  bool isProtocol (char *s);

  /* constructor used by giveBase */

  url (char *host, uint port, char *file);



 public:

  /* Constructor : Parses an url (u is deleted) */

  url (char *u, int8_t depth, url *base);



  /* constructor used by input */

  url (char *line, int8_t depth);



  /* Constructor : read the url from a file (cf serialize) */

  url (char *line);



  /* Destructor */

  ~url ();



  /* inet addr (once calculated) */

  struct in_addr addr;



  /* Is it a valid url ? */

  bool isValid ();



  /* print an URL */

  void print ();



  /* return the host */

  inline char *getHost () { return host; }



  /* return the port */

  inline uint getPort () { return port; }



  /* return the file */

  inline char *getFile () { return file; }



  /** Depth in the Site */

  inline int8_t getDepth () { return depth; }



  /* Set depth to max if we are at an entry point in the site

   * try to find the ip addr

   * answer false if forbidden by robots.txt, true otherwise */

  bool initOK (url *from);



  /** return the base of the url

   * give means that you have to delete the string yourself

   */

  url *giveBase ();



  /** return a char * representation of the url

   * give means that you have to delete the string yourself

   */

  char *giveUrl ();



  /** write the url in a buffer

   * buf must be at least of size maxUrlSize

   * returns the size of what has been written (not including '\0')

   */

  int writeUrl (char *buf);



  /* serialize the url for the Persistent Fifo */

  char *serialize ();



  /* very thread unsafe serialisation in a static buffer */

  char *getUrl();



  /* return a hashcode for the host of this url */

  uint hostHashCode ();



  /* return a hashcode for this url */

  uint hashCode ();



#ifdef URL_TAGS

  /* tag associated to this url */

  uint tag;

#endif // URL_TAGS



#ifdef COOKIES

  /* cookies associated with this page */

  char *cookie;

  void addCookie(char *header);

#else // COOKIES

  inline void addCookie(char *header) {}

#endif // COOKIES

};



#endif // URL_H
View Code
爬虫Larbin解析(二)——sequencer()
// Larbin

// Sebastien Ailleret

// 15-11-99 -> 16-03-02



/* This class describes an URL */



#include <assert.h>

#include <stdlib.h>

#include <stdio.h>

#include <string.h>

#include <ctype.h>

#include <sys/types.h>

#include <sys/socket.h>



#include "options.h"



#include "types.h"

#include "global.h"

#include "utils/url.h"

#include "utils/text.h"

#include "utils/connexion.h"

#include "utils/debug.h"



#ifdef COOKIES

#define initCookie() cookie=NULL

#else // COOKIES

#define initCookie() ((void) 0)

#endif // COOKIES



/* small functions used later */

/* Hash a host name into an index of global::namedSiteList
 * (classic polynomial rolling hash with base 37). */
static uint siteHashCode (char *host) {
  uint acc = 0;
  for (uint k = 0; host[k] != 0; k++) {
    acc = 37 * acc + host[k];
  }
  return acc % namedSiteListSize;
}



/* return the int with correspond to a char

 * -1 if not an hexa char */

/* Decode a single hexadecimal digit ('0'-'9', 'a'-'f', 'A'-'F').
 * Returns its value 0..15, or -1 when c is not a hexa char. */
static int int_of_hexa (char c) {
  if ('0' <= c && c <= '9') return c - '0';
  if ('a' <= c && c <= 'f') return c - 'a' + 10;
  if ('A' <= c && c <= 'F') return c - 'A' + 10;
  return -1;
}



/* normalize a file name : also called by robots.txt parser

 * return true if it is ok, false otherwise (cgi-bin)

 */

/* Normalize a file name in place (also called by the robots.txt parser):
 * collapses "/./" and "//", resolves "/../", handles trailing "/." and
 * "/..", decodes safe %XX escapes, and truncates at '#' (fragment).
 * Returns true if the name is ok, false otherwise (bad escape, or
 * "/../" escaping above the root).
 */
bool fileNormalize (char *file) {

  int i=0;

  while (file[i] != 0 && file[i] != '#') {

    if (file[i] == '/') {

      if (file[i+1] == '.' && file[i+2] == '/') {

        // suppress /./  (shift the tail left by 2)

        int j=i+3;

        while (file[j] != 0) {

          file[j-2] = file[j];

          j++;

        }

        file[j-2] = 0;

      } else if (file[i+1] == '/') {

        // replace // by /  (shift the tail left by 1)

        int j=i+2;

        while (file[j] != 0) {

          file[j-1] = file[j];

          j++;

        }

        file[j-1] = 0;

      } else if (file[i+1] == '.' && file[i+2] == '.' && file[i+3] == '/') {

        // suppress /../ together with the preceding path component

        if (i == 0) {

          // the file name starts with /../ : error

          return false;

        } else {

          int j = i+4, dec;

          i--;

          // back up to the start of the previous component

          while (file[i] != '/') { i--; }

          dec = i+1-j; // dec < 0

          while (file[j] != 0) {

            file[j+dec] = file[j];

            j++;

          }

          file[j+dec] = 0;

        }

      } else if (file[i+1] == '.' && file[i+2] == 0) {

        // suppress trailing /.

        file[i+1] = 0;

        return true;

      } else if (file[i+1] == '.' && file[i+2] == '.' && file[i+3] == 0) {

        // suppress trailing /.. and the preceding component

        if (i == 0) {

          // the file name starts with /.. : error

          return false;

        } else {

          i--;

          while (file[i] != '/') {

            i--;

          }

          file[i+1] = 0;

          return true;

        }

      } else { // nothing special, go forward

        i++;

      }

    } else if (file[i] == '%') {

      // try to decode a %XX escape

      int v1 = int_of_hexa(file[i+1]);

      int v2 = int_of_hexa(file[i+2]);

      if (v1 < 0 || v2 < 0) return false;

      char c = 16 * v1 + v2;

      if (isgraph(c)) {

        // printable char: decode it and shift the tail left by 2

        file[i] = c;

        int j = i+3;

        while (file[j] != 0) {

          file[j-2] = file[j];

          j++;

        }

        file[j-2] = 0;

        i++;

      } else if (c == ' ' || c == '/') { // keep it with the % notation

        i += 3;

      } else { // bad url

        return false;

      }

    } else { // nothing special, go forward

      i++;

    }

  }

  // cut the fragment part (or just re-terminate the string)

  file[i] = 0;

  return true;

}



/**************************************/

/* definition of methods of class url */

/**************************************/



/* Constructor : Parses an url */

url::url (char *u, int8_t depth, url *base) {

  newUrl();

  this->depth = depth;

  host = NULL;

  port = 80;

  file = NULL;

  initCookie();

#ifdef URL_TAGS

  tag = 0;

#endif // URL_TAGS

  if (startWith("http://", u)) {

    // absolute url

    parse (u + 7);

    // normalize file name

    if (file != NULL && !normalize(file)) {

      delete [] file;

      file = NULL;

      delete [] host;

      host = NULL;

    }

  } else if (base != NULL) {

    if (startWith("http:", u)) {

      parseWithBase(u+5, base);

    } else if (isProtocol(u)) {

      // Unknown protocol (mailto, ftp, news, file, gopher...)

    } else {

      parseWithBase(u, base);

    }

  }

}



/* constructor used by input */

url::url (char *line,  int8_t depth) {

  newUrl();

  this->depth = depth;

  host = NULL;

  port = 80;

  file = NULL;

  initCookie();

  int i=0;

#ifdef URL_TAGS

  tag = 0;

  while (line[i] >= '0' && line[i] <= '9') {

    tag = 10*tag + line[i] - '0';

    i++;

  }

  i++;

#endif // URL_TAGS

  if (startWith("http://", line+i)) {

    parse(line+i+7);

    // normalize file name

    if (file != NULL && !normalize(file)) {

      delete [] file;

      file = NULL;

      delete [] host;

      host = NULL;

    }

  }

}



/* Constructor : read the url from a file (cf serialize)

 */

url::url (char *line) {

  newUrl();

  int i=0;

  // Read depth

  depth = 0;

  while (line[i] >= '0' && line[i] <= '9') {

    depth = 10*depth + line[i] - '0';

    i++;

  }

#ifdef URL_TAGS

  // read tag

  tag = 0; i++;

  while (line[i] >= '0' && line[i] <= '9') {

    tag = 10*tag + line[i] - '0';

    i++;

  }

#endif // URL_TAGS

  int deb = ++i;

  // Read host

  while (line[i] != ':') {

    i++;

  }

  line[i] = 0;

  host = newString(line+deb);

  i++;

  // Read port

  port = 0;

  while (line[i] >= '0' && line[i] <= '9') {

    port = 10*port + line[i] - '0';

    i++;

  }

#ifndef COOKIES

  // Read file name

  file = newString(line+i);

#else // COOKIES

  char *cpos = strchr(line+i, ' ');

  if (cpos == NULL) {

    cookie = NULL;

  } else {

    *cpos = 0;

    // read cookies

    cookie = new char[maxCookieSize];

    strcpy(cookie, cpos+1);

  }

  // Read file name

  file = newString(line+i);

#endif // COOKIES

}



/* constructor used by giveBase */

url::url (char *host, uint port, char *file) {

  newUrl();

  initCookie();

  this->host = host;

  this->port = port;

  this->file = file;

}



/* Destructor */

url::~url () {

  delUrl();

  delete [] host;

  delete [] file;

#ifdef COOKIES

  delete [] cookie;

#endif // COOKIES

}



/* Is it a valid url ? */

bool url::isValid () {

  if (host == NULL) return false;

  int lh = strlen(host);

  return file!=NULL && lh < maxSiteSize

    && lh + strlen(file) + 18 < maxUrlSize;

}



/* print an URL */

void url::print () {

  printf("http://%s:%u%s\n", host, port, file);

}



/* Set depth to max if necessary

 * try to find the ip addr

 * answer false if forbidden by robots.txt, true otherwise */

bool url::initOK (url *from) {

#if defined(DEPTHBYSITE) || defined(COOKIES)

  if (strcmp(from->getHost(), host)) { // different site

#ifdef DEPTHBYSITE

    depth = global::depthInSite;

#endif // DEPTHBYSITE

  } else { // same site

#ifdef COOKIES

    if (from->cookie != NULL) {

      cookie = new char[maxCookieSize];

      strcpy(cookie, from->cookie);

    }

#endif // COOKIES

  }

#endif // defined(DEPTHBYSITE) || defined(COOKIES)

  if (depth < 0) {

    errno = tooDeep;

    return false;

  }

  NamedSite *ns = global::namedSiteList + (hostHashCode());

  if (!strcmp(ns->name, host) && ns->port == port) {

    switch (ns->dnsState) {

    case errorDns:

      errno = fastNoDns;

      return false;

    case noConnDns:

      errno = fastNoConn;

      return false;

    case doneDns:

      if (!ns->testRobots(file)) {

        errno = fastRobots;

        return false;

      }

    }

  }

  return true;

}



/* return the base of the url */

url *url::giveBase () {

  int i = strlen(file);

  assert (file[0] == '/');

  while (file[i] != '/') {

    i--;

  }

  char *newFile = new char[i+2];

  memcpy(newFile, file, i+1);

  newFile[i+1] = 0;

  return new url(newString(host), port, newFile);

}



/** return a char * representation of the url

 * give means that you have to delete the string yourself

 */

char *url::giveUrl () {

  char *tmp;

  int i = strlen(file);

  int j = strlen(host);



  tmp = new char[18+i+j];  // 7 + j + 1 + 9 + i + 1

                           // http://(host):(port)(file)\0

  strcpy(tmp, "http://");

  strcpy (tmp+7, host);

  j += 7;

  if (port != 80) {

    j += sprintf(tmp + j, ":%u", port);

  }

  // Copy file name

  while (i >= 0) {

    tmp [j+i] = file[i];

    i--;

  }

  return tmp;

}



/** write the url in a buffer

 * buf must be at least of size maxUrlSize

 * returns the size of what has been written (not including '\0')

 */

int url::writeUrl (char *buf) {

  if (port == 80)

    return sprintf(buf, "http://%s%s", host, file);

  else

    return sprintf(buf, "http://%s:%u%s", host, port, file);

}



/* serialize the url for the Persistent Fifo */

char *url::serialize () {

  // this buffer is protected by the lock of PersFifo

  static char statstr[maxUrlSize+40+maxCookieSize];

  int pos = sprintf(statstr, "%u ", depth);

#ifdef URL_TAGS

  pos += sprintf(statstr+pos, "%u ", tag);

#endif // URL_TAGS

  pos += sprintf(statstr+pos, "%s:%u%s", host, port, file);

#ifdef COOKIES

  if (cookie != NULL) {

    pos += sprintf(statstr+pos, " %s", cookie);

  }

#endif // COOKIES

  statstr[pos] = '\n';

  statstr[pos+1] = 0;

  return statstr;

}



/* very thread unsafe serialisation in a static buffer */

char *url::getUrl() {

  static char statstr[maxUrlSize+40];

  sprintf(statstr, "http://%s:%u%s", host, port, file);

  return statstr;

}



/* return a hashcode for the host of this url */

uint url::hostHashCode () {

  return siteHashCode (host);

}



/* return a hashcode for this url */

/* Hashcode for the whole url: folds the port, then every char of
 * the host and of the file into a base-31 rolling hash, reduced
 * modulo the global hash table size. */
uint url::hashCode () {
  unsigned int acc = port;
  for (unsigned int k = 0; host[k] != 0; k++) {
    acc = 31*acc + host[k];
  }
  for (unsigned int k = 0; file[k] != 0; k++) {
    acc = 31*acc + file[k];
  }
  return acc % hashSize;
}



/* parses a url : 

 * at the end, arg must have its initial state, 

 * http:// has allready been suppressed

 */

void url::parse (char *arg) {

  int deb = 0, fin = deb;

  // Find the end of host name (put it into lowerCase)

  while (arg[fin] != '/' && arg[fin] != ':' && arg[fin] != 0) {

    fin++;

  }

  if (fin == 0) return;



  // get host name

  host = new char[fin+1];

  for (int  i=0; i<fin; i++) {

    host[i] = lowerCase(arg[i]);

  }

  host[fin] = 0;



  // get port number

  if (arg[fin] == ':') {

    port = 0;

    fin++;

    while (arg[fin] >= '0' && arg[fin] <= '9') {

      port = port*10 + arg[fin]-'0';

      fin++;

    }

  }



  // get file name

  if (arg[fin] != '/') {

    // www.inria.fr => add the final /

    file = newString("/");

  } else {

    file = newString(arg + fin);

  }

}



/** parse a file with base

 */

void url::parseWithBase (char *u, url *base) {

  // cat filebase and file

  if (u[0] == '/') {

    file = newString(u);

  } else {

    uint lenb = strlen(base->file);

    char *tmp = new char[lenb + strlen(u) + 1];

    memcpy(tmp, base->file, lenb);

    strcpy(tmp + lenb, u);

    file = tmp;

  }

  if (!normalize(file)) {

    delete [] file;

    file = NULL;

    return;

  }

  host = newString(base->host);

  port = base->port;

}



/** normalize file name

 * return true if it is ok, false otherwise (cgi-bin)

 */

bool url::normalize (char *file) {

  return fileNormalize(file);

}



/* Does this url starts with a protocol name */

/* Does this url start with a protocol name, i.e. a run of
 * alphanumeric chars immediately followed by ':' ? */
bool url::isProtocol (char *s) {
  uint k = 0;
  while (isalnum(s[k])) {
    ++k;
  }
  return s[k] == ':';
}



#ifdef COOKIES

#define addToCookie(s) len = strlen(cookie); \

    strncpy(cookie+len, s, maxCookieSize-len); \

    cookie[maxCookieSize-1] = 0;



/* see if a header contain a new cookie */

void url::addCookie(char *header) {

  if (startWithIgnoreCase("set-cookie: ", header)) {

    char *pos = strchr(header+12, ';');

    if (pos != NULL) {

      int len;

      if (cookie == NULL) {

        cookie = new char[maxCookieSize];

        cookie[0] = 0;

      } else {

        addToCookie("; ");

      }

      *pos = 0;

      addToCookie(header+12);

      *pos = ';';

    }

  }

}

#endif // COOKIES
View Code

global::namedSiteList

NamedSite *global::namedSiteList;

namedSiteList = new NamedSite[namedSiteListSize];
爬虫Larbin解析(二)——sequencer()
class NamedSite 

{

    private:

        /* string used for following CNAME chains (just one jump) */

        char *cname;

        /** we've got a good dns answer

        * get the robots.txt */

        void dnsOK ();

        /** Cannot get the inet addr

        * dnsState must have been set properly before the call */

        void dnsErr ();

        /** Delete the old identity of the site */

        void newId ();

        /** put this url in its IPSite */

        void transfer (url *u);

        /** forget this url for this reason */

        void forgetUrl (url *u, FetchError reason);

    public:

        /** Constructor */

        NamedSite ();

        /** Destructor : never used */

        ~NamedSite ();

        /* name of the site */

        char name[maxSiteSize];

        /* port of the site */

        uint16_t port;

        /* numbers of urls in ram for this site */

        uint16_t nburls;

        /* fifo of urls waiting to be fetched */

        url *fifo[maxUrlsBySite];

        uint8_t inFifo;

        uint8_t outFifo;

        void putInFifo(url *u);

        url *getInFifo();

        short fifoLength();

        /** Is this Site in a dnsSites */

        bool isInFifo;

        /** internet addr of this server */

        char dnsState;

        struct in_addr addr;

        uint ipHash;

        /* Date of expiration of dns call and robots.txt fetch */

        time_t dnsTimeout;

        /** test if a file can be fetched thanks to the robots.txt */

        bool testRobots(char *file);

        /* forbidden paths : given by robots.txt */

        Vector<char> forbidden;

        /** Put an url in the fifo

        * If there are too much, put it back in UrlsInternal

        * Never fill totally the fifo => call at least with 1 */

        void putGenericUrl(url *u, int limit, bool prio);

        inline void putUrl (url *u) { putGenericUrl(u, 15, false); }

        inline void putUrlWait (url *u) { putGenericUrl(u, 10, false); }

        inline void putPriorityUrl (url *u) { putGenericUrl(u, 5, true); }

        inline void putPriorityUrlWait (url *u) { putGenericUrl(u, 1, true); }

        /** Init a new dns query */

        void newQuery ();

        /** The dns query ended with success */

        void dnsAns (adns_answer *ans);

        /** we got the robots.txt, transfer what must be in IPSites */

        void robotsResult (FetchError res);

};
View Code
爬虫Larbin解析(二)——sequencer()
///////////////////////////////////////////////////////////

// class NamedSite

///////////////////////////////////////////////////////////



/** Constructor : initiate fields used by the program

 */

NamedSite::NamedSite () 

{

  name[0] = 0;

  nburls = 0;

  inFifo = 0; outFifo = 0;

  isInFifo = false;

  dnsState = waitDns;

  cname = NULL;

}



/** Destructor : This one is never used

 */

NamedSite::~NamedSite () {

  assert(false);

}



/* Management of the Fifo */

void NamedSite::putInFifo(url *u) {

  fifo[inFifo] = u;

  inFifo = (inFifo + 1) % maxUrlsBySite;

  assert(inFifo!=outFifo);

}



url *NamedSite::getInFifo() {

  assert (inFifo != outFifo);

  url *tmp = fifo[outFifo];

  outFifo = (outFifo + 1) % maxUrlsBySite;

  return tmp;

}



short NamedSite::fifoLength() {

  return (inFifo + maxUrlsBySite - outFifo) % maxUrlsBySite;

}



/* Put an url in the fifo if their are not too many */

void NamedSite::putGenericUrl(url *u, int limit, bool prio) {

  if (nburls > maxUrlsBySite-limit) {

    // Already enough Urls in memory for this Site

    // first check if it can already be forgotten

    if (!strcmp(name, u->getHost())) {

      if (dnsState == errorDns) {

        nburls++;

        forgetUrl(u, noDNS);

        return;

      }

      if (dnsState == noConnDns) {

        nburls++;

        forgetUrl(u, noConnection);

        return;

      }

      if (u->getPort() == port

          && dnsState == doneDns && !testRobots(u->getFile())) {

        nburls++;

        forgetUrl(u, forbiddenRobots);

        return;

      }

    }

    // else put it back in URLsDisk

    refUrl();

    global::inter->getOne();

    if (prio) {

      global::URLsPriorityWait->put(u);

    } else {

      global::URLsDiskWait->put(u);

    }

  } else {

    nburls++;

    if (dnsState == waitDns

        || strcmp(name, u->getHost())

        || port != u->getPort()

        || global::now > dnsTimeout) {

      // dns not done or other site

      putInFifo(u);

      addNamedUrl();

      // Put Site in fifo if not yet in

      if (!isInFifo) {

        isInFifo = true;

        global::dnsSites->put(this);

      }

    } else switch (dnsState) {

    case doneDns:

      transfer(u);

      break;

    case errorDns:

      forgetUrl(u, noDNS);

      break;

    default: // noConnDns

      forgetUrl(u, noConnection);

    }

  }

}



/** Init a new dns query

 */

void NamedSite::newQuery () 

{

    // Update our stats

    newId();

    if (global::proxyAddr != NULL) 

    {

        // we use a proxy, no need to get the sockaddr

        // give anything for going on

        siteSeen();

        siteDNS();

        // Get the robots.txt

        dnsOK();

    } 

    else if (isdigit(name[0])) 

    {

        // the name already in numbers-and-dots notation

        siteSeen();

        if (inet_aton(name, &addr)) 

        {

              // Yes, it is in numbers-and-dots notation

              siteDNS();

              // Get the robots.txt

              dnsOK();

        } 

        else 

        {

            // No, it isn't : this site is a non sense

            dnsState = errorDns;

            dnsErr();

        }

    } 

    else 

    {

        // submit an adns query

        global::nbDnsCalls++;

        adns_query quer = NULL;

        adns_submit(global::ads, name,

                    (adns_rrtype) adns_r_addr,

                    (adns_queryflags) 0,

                    this, &quer);

    }

}



/** The dns query ended with success

 * assert there is a freeConn

 */

void NamedSite::dnsAns (adns_answer *ans) 

{

    if (ans->status == adns_s_prohibitedcname) 

    {

        if (cname == NULL) 

        {

            // try to find ip for cname of cname

            cname = newString(ans->cname);

            global::nbDnsCalls++;

            adns_query quer = NULL;

            adns_submit(global::ads, cname,

                  (adns_rrtype) adns_r_addr,

                  (adns_queryflags) 0,

                  this, &quer);

        } 

        else 

        {

            // dns chains too long => dns error

            // cf nslookup or host for more information

            siteSeen();

            delete [] cname; cname = NULL;

            dnsState = errorDns;

            dnsErr();

        }

    } 

    else 

    {

        siteSeen();

        if (cname != NULL) 

        { 

            delete [] cname; 

            cname = NULL; 

        }

        if (ans->status != adns_s_ok) 

        {

          // No addr inet

          dnsState = errorDns;

          dnsErr();

        } 

        else 

        {

          siteDNS();

          // compute the new addr

          memcpy (&addr,

                  &ans->rrs.addr->addr.inet.sin_addr,

                  sizeof (struct in_addr));

          // Get the robots.txt

          dnsOK();

        }

    }

}



/** we've got a good dns answer

 * get the robots.txt

 * assert there is a freeConn

 */

void NamedSite::dnsOK () {
  // take a free connection (the caller guarantees one is available)
  Connexion *conn = global::freeConns->get();
  char res = getFds(conn, &addr, port);
  if (res != emptyC) {
    conn->timeout = timeoutPage;
    if (global::proxyAddr != NULL) {
      // use a proxy : the request line must carry the absolute url
      conn->request.addString("GET http://");
      conn->request.addString(name);
      char tmp[15];
      sprintf(tmp, ":%u", port);
      conn->request.addString(tmp);
      conn->request.addString("/robots.txt HTTP/1.0\r\nHost: ");
    } else {
      // direct connection
      conn->request.addString("GET /robots.txt HTTP/1.0\r\nHost: ");
    }
    conn->request.addString(name);
    conn->request.addString(global::headersRobots);
    // the answer will be parsed as a robots.txt file
    conn->parser = new robots(this, conn);
    conn->pos = 0;
    conn->err = success;
    conn->state = res;
  } else {
    // Unable to get a socket : give the connection back and fail the site
    global::freeConns->put(conn);
    dnsState = noConnDns;
    dnsErr();
  }
}



/** Cannot get the inet addr

 * dnsState must have been set properly before the call

 */

void NamedSite::dnsErr () {
  // translate the dns state into the error reported to the caller
  FetchError theErr;
  if (dnsState == errorDns) {
    theErr = noDNS;
  } else {
    theErr = noConnection;
  }
  int ss = fifoLength();
  // scan the queue
  for (int i=0; i<ss; i++) {
    url *u = getInFifo();
    if (!strcmp(name, u->getHost())) {
      // same host : this url can never be fetched, report the failure
      delNamedUrl();
      forgetUrl(u, theErr);
    } else { // different name
      // the slot was reused by another host : keep its urls queued
      putInFifo(u);
    }
  }
  // where should now lie this site
  if (inFifo==outFifo) {
    isInFifo = false;
  } else {
    // urls of another host remain : submit the site for dns again
    global::dnsSites->put(this);
  }
}



/** test if a file can be fetched thanks to the robots.txt */

bool NamedSite::testRobots(char *file) {

  uint pos = forbidden.getLength();

  for (uint i=0; i<pos; i++) {

    if (robotsMatch(forbidden[i], file))

      return false;

  }

  return true;

}



/** Delete the old identity of the site */

void NamedSite::newId () {
  // ip expires or new name or just new port
  // Change the identity of this site
#ifndef NDEBUG
  if (name[0] == 0) {
    // debug statistics : this slot is used for the first time
    addsite();
  }
#endif // NDEBUG
  // adopt the host and port of the next queued url
  url *u = fifo[outFifo];
  strcpy(name, u->getHost());
  port = u->getPort();
  // the resolved address will be considered valid until this deadline
  dnsTimeout = global::now + dnsValidTime;
  dnsState = waitDns;
}



/** we got the robots.txt,

 * compute ipHashCode

 * transfer what must be in IPSites

 */

void NamedSite::robotsResult (FetchError res) {
  bool ok = res != noConnection;
  if (ok) {
    dnsState = doneDns;
    // compute ip hashcode
    if (global::proxyAddr == NULL) {
      ipHash=0;
      // fold the raw bytes of the resolved address into a hash
      char *s = (char *) &addr;
      for (uint i=0; i<sizeof(struct in_addr); i++) {
        ipHash = ipHash*31 + s[i];
      }
    } else {
      // no ip and need to avoid rapidFire => use hostHashCode
      // (pointer difference = index of this site in namedSiteList)
      ipHash = this - global::namedSiteList;
    }
    ipHash %= IPSiteListSize;
  } else {
    dnsState = noConnDns;
  }
  int ss = fifoLength();
  // scan the queue
  for (int i=0; i<ss; i++) {
    url *u = getInFifo();
    if (!strcmp(name, u->getHost())) {
      delNamedUrl();
      if (ok) {
        if (port == u->getPort()) {
          // same identity : move the url to its IPSite
          transfer(u);
        } else {
          // same host but another port : needs its own robots.txt
          putInFifo(u);
        }
      } else {
        forgetUrl(u, noConnection);
      }
    } else {
      // slot reused by another host : keep the url queued
      putInFifo(u);
    }
  }
  // where should now lie this site
  if (inFifo==outFifo) {
    isInFifo = false;
  } else {
    global::dnsSites->put(this);
  }  
}



/** Hand a url over to its IPSite once robots.txt has been checked. */
void NamedSite::transfer (url *u) {
  if (!testRobots(u->getFile())) {
    // robots.txt forbids this path : drop the url
    forgetUrl(u, forbiddenRobots);
    return;
  }
  if (global::proxyAddr == NULL) {
    // no proxy : the url carries the resolved ip address along
    memcpy (&u->addr, &addr, sizeof (struct in_addr));
  }
  global::IPSiteList[ipHash].putUrl(u);
}



/** Drop a url definitively : update the statistics, report the error,
 * free the url and give its slot back to the global sequencer.
 */
void NamedSite::forgetUrl (url *u, FetchError reason) {
  urls();
  fetchFail(u, reason);
  answers(reason);
  nburls--;
  delete u;
  // one more url may now enter the fetch pipeline
  global::inter->getOne();
}
View Code

 

其中两个类的定义

larbin-2.6.3/src/utils/PersistentFifo.h、larbin-2.6.3/src/utils/PersistentFifo.cc

爬虫Larbin解析(二)——sequencer()
// Larbin

// Sebastien Ailleret

// 06-01-00 -> 12-06-01



/* this fifo is stored on disk */



#ifndef PERSFIFO_H

#define PERSFIFO_H



#include <dirent.h>

#include <unistd.h>

#include <sys/types.h>

#include <sys/stat.h>

#include <fcntl.h>

#include <errno.h>

#include <string.h>



#include "types.h"

#include "utils/url.h"

#include "utils/text.h"

#include "utils/connexion.h"

#include "utils/mypthread.h"



/** A fifo of urls persisted on disk as a series of numbered files:
 * urls are appended to file number `fin` and consumed from file
 * number `fout`; a read file is deleted once fully consumed.
 */
class PersistentFifo 
{
    protected:
        // urls written (in) / read (out) in the current file window
        uint in, out;
        #ifdef THREAD_OUTPUT
        pthread_mutex_t lock;
        #endif
        // length of a full file name (base name + numeric suffix)
        uint fileNameLength;
        // numbers of the files used for writing (fin) and reading (fout)
        int fin, fout;
        // buffer holding the current file name (baseName + number)
        char *fileName;

    protected:
        // Make fileName fit with this number
        void makeName(uint nb);
        // Extract the number encoded at the end of this file name
        int getNumber(char *file);
        // Change the file used for reading
        void updateRead ();
        // Change the file used for writing
        void updateWrite ();

    protected:
        // buffer used for writeUrl (buffered output)
        char outbuf[BUF_SIZE];
        // number of char used in this buffer
        uint outbufPos;
        // buffer used for readLine
        char buf[BUF_SIZE];
        // number of char used in this buffer
        uint bufPos, bufEnd;
        // file descriptors for reading (rfds) and writing (wfds)
        int rfds, wfds;
    protected:
        // read a line on rfds
        char *readLine ();
        // write an url in the out file (buffered write)
        void writeUrl (char *s);
        // Flush the out Buffer in the outFile
        void flushOut ();

    public:
        PersistentFifo (bool reload, char *baseName);
        ~PersistentFifo ();

        /* get the first object (non blocking)
        * return NULL if there is none
        */
        url *tryGet ();

        /* get the first object (non totally blocking)
        * probably crash if there is none
        */
        url *get ();

        /* add an object in the fifo (the fifo takes ownership) */
        void put (url *obj);

        /* how many items are there inside ? */
        int getLength ();
};



#endif // PERSFIFO_H
View Code
爬虫Larbin解析(二)——sequencer()
// Larbin

// Sebastien Ailleret

// 27-05-01 -> 04-01-02



#include <string.h>

#include <assert.h>

#include <stdlib.h>

#include <stdio.h>

#include <string.h>

#include <ctype.h>

#include <iostream.h>



#include "types.h"

#include "global.h"

#include "utils/mypthread.h"

#include "utils/PersistentFifo.h"



/** Build the fifo over numbered files "<baseName>NNNNNN" in the cwd.
 * reload == true resumes from files left by a previous crawl;
 * otherwise old fifo files are deleted and numbering restarts at 0.
 */
PersistentFifo::PersistentFifo (bool reload, char *baseName) 
{
  // room for the base name, the numeric suffix and the terminator
  fileNameLength = strlen(baseName)+5;
  fileName = new char[fileNameLength+2];
  strcpy(fileName, baseName);
  fileName[fileNameLength+1] = 0;
  outbufPos = 0;
  bufPos = 0;
  bufEnd = 0;
  mypthread_mutex_init(&lock, NULL);
  if (reload) 
  {
    // scan the current directory for files left by a previous run
    // NOTE(review): opendir's result is not checked — presumably "."
    // is always readable; confirm before reusing this pattern
    DIR *dir = opendir(".");
    struct dirent *name;

    fin = -1;
    fout = -1;
    name = readdir(dir);
    while (name != NULL) 
    {
      if (startWith(fileName, name->d_name)) 
      {
        int tmp = getNumber(name->d_name);
        if (fin == -1) 
        {
          fin = tmp;
          fout = tmp;
        } 
        else 
        {
          // keep the highest number for writing, the lowest for reading
          if (tmp > fin)  { fin = tmp; }
          if (tmp < fout) { fout = tmp; }
        }
      }
      name = readdir(dir);
    }
    if (fin == -1) 
    {
      fin = 0;
      fout = 0;
    }
    if (fin == fout && fin != 0) 
    {
      // a single non-zero file is ambiguous : we cannot tell how many
      // of its urls were already consumed
      cerr << "previous crawl was too little, cannot reload state\n"
           << "please restart larbin with -scratch option\n";
      exit(1);
    }
    closedir(dir);
    // estimate of pending urls : full files between fout and fin
    in = (fin - fout) * urlByFile;
    out = 0;
    makeName(fin);
    wfds = creat (fileName, S_IRUSR | S_IWUSR);
    makeName(fout);
    rfds = open (fileName, O_RDONLY);
  } 
  else 
  {
    // Delete old fifos
    DIR *dir = opendir(".");
    struct dirent *name;
    name = readdir(dir);
    while (name != NULL) 
    {
      if (startWith(fileName, name->d_name)) 
      {
        unlink(name->d_name);
      }
      name = readdir(dir);
    }
    closedir(dir);

    fin = 0;
    fout = 0;
    in = 0;
    out = 0;
    makeName(0);
    wfds = creat (fileName, S_IRUSR | S_IWUSR);
    rfds = open (fileName, O_RDONLY);
  }
}



/** Release the mutex and both file descriptors.
 * Note: urls still buffered in outbuf are not flushed here.
 */
PersistentFifo::~PersistentFifo () 
{
  mypthread_mutex_destroy (&lock);
  close(rfds);
  close(wfds);
}



/** Non-blocking get : return the next url, or NULL if the fifo is empty. */
url *PersistentFifo::tryGet () 
{
  url *tmp = NULL;
  mypthread_mutex_lock(&lock);
  if (in != out) 
  {
    // The stack is not empty
    char *line = readLine();
    tmp = new url(line);
    out++;
    // possibly switch to the next file on disk
    updateRead();
  }
  mypthread_mutex_unlock(&lock);
  return tmp;
}



/** Get the next url, assuming the fifo is not empty
 * (readLine loops on the file until a complete line is available).
 */
url *PersistentFifo::get () 
{
  mypthread_mutex_lock(&lock);
  char *line = readLine();
  url *res = new url(line);
  out++;
  // possibly switch to the next file on disk
  updateRead();
  mypthread_mutex_unlock(&lock);
  return res;
}



/** Put something in the fifo

 * The objet is then deleted

 */

void PersistentFifo::put (url *obj) 
{
  mypthread_mutex_lock(&lock);
  char *s = obj->serialize(); // statically allocated string
  writeUrl(s);
  in++;
  // possibly switch to the next file on disk
  updateWrite();
  mypthread_mutex_unlock(&lock);
  // the fifo takes ownership : the in-memory url is destroyed here
  delete obj;
} 

/** Number of urls currently stored.
 * NOTE(review): reads in/out without taking the lock — under concurrent
 * use the result is only a snapshot; confirm callers tolerate that.
 */
int PersistentFifo::getLength () 
{
  return in - out;
}



/** Write the 6-digit decimal suffix of file number nb into fileName.
 * Digits occupy positions fileNameLength-5 .. fileNameLength, least
 * significant digit last; nb is effectively taken modulo 10^6.
 * Fixed: the original loop tested an unsigned index with
 * `i >= fileNameLength-5`, which never terminates when
 * fileNameLength == 5 (uint >= 0 is always true); counting the six
 * digits explicitly makes the loop bound independent of the index type.
 */
void PersistentFifo::makeName (uint nb) 
{
  uint pos = fileNameLength;
  for (int digit = 0; digit < 6; digit++) 
  {
    fileName[pos] = (nb % 10) + '0';
    nb /= 10;
    pos--;
  }
}



/** Decode the 6-digit decimal suffix at the end of a fifo file name. */
int PersistentFifo::getNumber (char *file) 
{
  uint len = strlen(file);
  int value = 0;
  // the number is stored in the last 6 characters of the name
  for (char *p = file + len - 6; p < file + len; p++) 
  {
    value = (value * 10) + (*p - '0');
  }
  return value;
}



/** Called after each get : when a whole file (urlByFile urls) has been
 * consumed, delete it and switch reading to the next numbered file.
 */
void PersistentFifo::updateRead () 
{
  if ((out % urlByFile) == 0) 
  {
    close(rfds);
    makeName(fout);
    // the file has been fully consumed
    unlink(fileName);
    makeName(++fout);
    rfds = open(fileName, O_RDONLY);
    // rebase the counters so `out` restarts at 0 for the new file
    in -= out;
    out = 0;
    // no partial line may span two files
    assert(bufPos == bufEnd);
  }
}



/** Called after each put : when the current file holds urlByFile urls,
 * flush it and start writing to the next numbered file.
 */
void PersistentFifo::updateWrite () 
{
  if ((in % urlByFile) == 0) 
  {
    flushOut();
    close(wfds);
    makeName(++fin);
    wfds = creat(fileName, S_IRUSR | S_IWUSR);
#ifdef RELOAD
    // checkpoint the hashtables so a crash can resume from this point
    global::seen->save();
#ifdef NO_DUP
    global::hDuplicate->save();
#endif
#endif
  }
}



/* read a line from the file

 * uses a buffer

 */

char *PersistentFifo::readLine () {
  // Returns a pointer into buf to the next '\n'-terminated line
  // (newline replaced by NUL); valid until the next call.
  if (bufPos == bufEnd) {
    // buffer fully consumed : restart from the beginning
    bufPos = 0; bufEnd = 0; buf[0] = 0;
  }
  char *posn = strchr(buf + bufPos, '\n');
  while (posn == NULL) {
    if (!(bufEnd - bufPos < maxUrlSize + 40 + maxCookieSize)) {
      // A pending line longer than any legal url : dump diagnostics.
      // Fixed: use an explicit "%s" format — the original passed the
      // data itself as the printf format string, so a '%' inside a
      // file name or url was interpreted as a conversion directive.
      printf("%s", fileName);
      printf("%s", buf+bufPos);
    }
    if (bufPos*2 > BUF_SIZE) {
      // more than half the buffer is dead space : compact it
      bufEnd -= bufPos;
      memmove(buf, buf+bufPos, bufEnd);
      bufPos = 0;
    }
    int postmp = bufEnd;
    bool noRead = true;
    while (noRead) {
      int rd = read(rfds, buf+bufEnd, BUF_SIZE-1-bufEnd);
      switch (rd) {
      case 0 :
        // end of file : the data we want is still in the write buffer;
        // we need to flush the output in order to read it
        flushOut();
        break;
      case -1 :
        // We have a trouble here
        if (errno != EINTR) {
          cerr << "Big Problem while reading (persistentFifo.h)\n";
          perror("reason");
          assert(false);
        } else {
          // interrupted by a signal : simply retry the read
          perror("Warning in PersistentFifo: ");
        }
        break;
      default:
        noRead = false;
        bufEnd += rd;
        // keep buf NUL-terminated so strchr stops at the data end
        buf[bufEnd] = 0;
        break;
      }
    }
    // only rescan the freshly read part for a newline
    posn = strchr(buf + postmp, '\n');
  }
  *posn = 0;                    // cut the line at the newline
  char *res = buf + bufPos;
  bufPos = posn + 1 - buf;      // next call starts after this line
  return res;
}



// write an url in the out file (buffered write)

void PersistentFifo::writeUrl (char *s) {
  size_t len = strlen(s);
  assert(len < maxUrlSize + 40 + maxCookieSize);
  if (outbufPos + len >= BUF_SIZE) {
    // not enough room left : empty the buffer first
    // (flushOut resets outbufPos to 0)
    flushOut ();
  }
  // append the serialized url to the output buffer
  memcpy(outbuf + outbufPos, s, len);
  outbufPos += len;
}



// Flush the out Buffer in the outFile

void PersistentFifo::flushOut () {
  // ecrireBuff writes outbufPos bytes of outbuf to wfds (project helper)
  ecrireBuff (wfds, outbuf, outbufPos);
  outbufPos = 0;
}
View Code

Larbin-2.6.3/src/utils/syncFifo.h

爬虫Larbin解析(二)——sequencer()
// Larbin

// Sebastien Ailleret

// 09-11-99 -> 07-12-01



/* fifo in RAM with synchronisations */



#ifndef SYNCFIFO_H

#define SYNCFIFO_H



#define std_size 100



#include "utils/mypthread.h"



/** A growable circular fifo of pointers kept in RAM, protected by a
 * mutex and a condition variable (when THREAD_OUTPUT is enabled).
 */
template <class T>
class SyncFifo {
 protected:
  // in : next write slot, out : next read slot (empty when in == out)
  uint in, out;
  // current capacity of tab
  uint size;
  T **tab;
#ifdef THREAD_OUTPUT
  pthread_mutex_t lock;
  pthread_cond_t nonEmpty;
#endif

 public:
  /* Specific constructor */
  SyncFifo (uint size = std_size);

  /* Destructor */
  ~SyncFifo ();

  /* get the first object (blocks while the fifo is empty) */
  T *get ();

  /* get the first object (non totally blocking)
   * return NULL if there is none
   */
  T *tryGet ();

  /* add an object in the Fifo */
  void put (T *obj);

  /* how many items are there inside ? */
  int getLength ();
};



/** Allocate the circular buffer and init the synchronisation objects. */
template <class T>
SyncFifo<T>::SyncFifo (uint size) {
  tab = new T*[size];
  this->size = size;
  in = 0;
  out = 0;
  mypthread_mutex_init (&lock, NULL);
  mypthread_cond_init (&nonEmpty, NULL);
}



/** Free the slot array (the stored objects themselves are NOT deleted). */
template <class T>
SyncFifo<T>::~SyncFifo () {
  delete [] tab;
  mypthread_mutex_destroy (&lock);
  mypthread_cond_destroy (&nonEmpty);
}



/** Pop the first object, blocking while the fifo is empty.
 * NOTE(review): mypthread_cond_wait presumably waits on nonEmpty as
 * long as the predicate (in == out) holds — confirm in mypthread.h.
 */
template <class T>
T *SyncFifo<T>::get () {
  T *tmp;
  mypthread_mutex_lock(&lock);
  mypthread_cond_wait(in == out, &nonEmpty, &lock);
  tmp = tab[out];
  out = (out + 1) % size;
  mypthread_mutex_unlock(&lock);
  return tmp;
}



/** Pop the first object without blocking; NULL when the fifo is empty. */
template <class T>
T *SyncFifo<T>::tryGet () {
  T *result = NULL;
  mypthread_mutex_lock(&lock);
  bool isEmpty = (in == out);
  if (!isEmpty) {
    // at least one element : take it and advance the read index
    result = tab[out];
    out = (out + 1) % size;
  }
  mypthread_mutex_unlock(&lock);
  return result;
}



/** Push an object : wakes up waiters when the fifo becomes non-empty
 * and doubles the circular buffer when it becomes full.
 */
template <class T>
void SyncFifo<T>::put (T *obj) {
  mypthread_mutex_lock(&lock);
  tab[in] = obj;
  if (in == out) {
    // the fifo was empty : wake up every blocked get()
    mypthread_cond_broadcast(&nonEmpty);
  }
  in = (in + 1) % size;
  if (in == out) {
    // full : grow to 2*size, unrolling the circular layout —
    // out..size-1 keeps its place, 0..in-1 moves just after it
    T **tmp;
    tmp = new T*[2*size];
    for (uint i=out; i<size; i++) {
      tmp[i] = tab[i];
    }
    for (uint i=0; i<in; i++) {
      tmp[i+size] = tab[i];
    }
    in += size;
    size *= 2;
    delete [] tab;
    tab = tmp;
  }
  mypthread_mutex_unlock(&lock);
}



/** Number of objects currently stored (taken under the lock). */
template <class T>
int SyncFifo<T>::getLength () {
  mypthread_mutex_lock(&lock);
  // distance from out to in on the circular buffer
  int count = (in + size - out) % size;
  mypthread_mutex_unlock(&lock);
  return count;
}



#endif // SYNCFIFO_H
View Code

 

你可能感兴趣的:(sequence)