pongo庞果:xml字符串文件的解析——为什么我的代码效率低?

最近正在学习C++ STL,尝试着使用C++解庞果上面的在线编程挑战题目,结果总是说超过3s时间。这是为啥呀为啥呀?哥只是用了个string 而已啊

题目 :http://hero.pongo.cn/Home/Index  蓝港在线:xml字符串文件的解析

代码贴出来,留待日后有能力了改进效率:

#include 
#include 
#include 
#include 

using namespace std;
using namespace boost;

string intToString(const int n )
{
   std::stringstream newstr;
   newstr << n;
   return newstr.str();
}

void ltrim(string& s)
{
   const char drop = ' ';
   // trim right
   s.erase(s.find_last_not_of(drop)+1);
   // trim left
   //s.erase(0,s.find_first_not_of(drop));
}

// LAB means Left Angle Brace: "<"
void jumpTilEndorLAB(string& str, int& pos)
{
   while((str[pos] != '\0') && (str[pos] != '<'))
   {
      pos++;
   }
}

//parse xml header: 
void parseXmlHeader(string& str, int& pos)
{
   if(('<' == str[pos]) && ('?' == str[pos+1]))
   {
      while(('?' != str[pos]) && ('>' != str[pos+1]))
      {
         pos++;
      }
      pos += 2;   //jump over ?>
      jumpTilEndorLAB(str, pos);
   }
   return ;
}

// parse the xml
string ParsingXML(string str)
{
   string   result;
   result.reserve(1024);
   int bodyPos = 0;
   int length = str.length(); 

   parseXmlHeader(str, bodyPos);

   if(bodyPos == length)
   {
      return result;
   }

   // Body format:
   //
   //    
   //          
   //    
   //    
   //

   int categoryStart = bodyPos;
   int categoryEndAll = length;
   // parse all categories
   while( categoryStart != categoryEndAll)
   {
      string category(str.substr(categoryStart+1, str.find_first_of('>', categoryStart)-categoryStart-1));

      //cout << category << endl;
      result += (category + "\r\n");

      int entityStart = categoryStart + category.length() + 2; //jump over 
      int entityEndAll = str.find((""), categoryStart);
      jumpTilEndorLAB(str, entityStart);

      //parse the category's entities
      int entityIndex = 1;
      while(entityStart != entityEndAll)
      {
         string entity(str.substr(entityStart+1, str.find_first_of('>', entityStart)-entityStart-1));
         //cout << "\t" << entity << " " << entityIndex++ << endl;
         result += "\t";
         result += (entity + " " + intToString(entityIndex) + "\r\n");

         entityIndex++;

         int attrStart = entityStart + 2 + entity.length();  //jump over 
         while(str[attrStart] != '<') 
         {
            attrStart++;
         }
         attrStart++;   //jump over the "<" before attribute
         while((str[attrStart] == ' ') || (str[attrStart] == '\t') || 
            (str[attrStart] == '\r') || (str[attrStart] == '\n'))   // jump over ' ' before attribute if spaces exist
         {
            attrStart++;
         }
         // parse the attributes
         while((str[attrStart] != '/') && (str[attrStart+1] != '>'))
         {
            int equivalentPos = str.find_first_of('=', attrStart);
            string attrName = str.substr(attrStart, equivalentPos-attrStart);
            ltrim(attrName);
            //cout << "\t\t" << attrName << ":";
            result += "\t\t";
            result += (attrName + ":");

            int valueBegin = str.find_first_of('\"', equivalentPos+1)+1;
            int valueEnd = str.find_first_of('\"', valueBegin+1);
            string attrValue = str.substr(valueBegin, valueEnd-valueBegin);
            //cout << attrValue << endl;
            result += (attrValue + "\r\n");

            attrStart = valueEnd + 1;  //parse next attribute
            while((str[attrStart] == ' ') || (str[attrStart] == '\t') || 
               (str[attrStart] == '\r') || (str[attrStart] == '\n'))   // jump over ' ' before attribute if spaces exist
            {
               attrStart++;
            }
         }
         entityStart = attrStart + 5 + entity.length();   //jump over "/>"
         jumpTilEndorLAB(str, entityStart);   //parse next entity
      }
      categoryStart = entityStart + 3 + category.length();   //jump over 
      jumpTilEndorLAB(str, categoryStart);         //parse next category
   }

   return result;
}

int main()
{   
   string str1(
"\
\r\n\
\r\n\t\
\r\n\t\t\
\r\n\t\r\n\t\
\r\n\t\t\
\r\n\t\
\r\n");

   //cout << str1 << endl;

   string result1;
   {
      progress_timer pt;
      for(int i = 0; i < 1000; i++)
      {
         result1 = ParsingXML(str1);
      }
   }
   cout << result1;

   return 1;

} 

注:此代码效率低,需要改进!





你可能感兴趣的:(C/C++,C++,STL,String,xml)