rootm0s
diff --git a/‎PeProtector/Compile/CCompile.cpp
+725 b/‎PeProtector/Compile/CCompile.cpp
+725
diff --git a/‎PeProtector/Compile/CCompile.h
+18 b/‎PeProtector/Compile/CCompile.h
+18
diff --git a/‎PeProtector/Compile/CLexicalAnalizer.cpp
+324 b/‎PeProtector/Compile/CLexicalAnalizer.cpp
+324
@@ -0,0 +1,18 @@
+#ifndef CCOMPILE_H
+#define CCOMPILE_H
+
+#include "..\Library\SCommand.h"
+#include <istream>
+#include <iosfwd>
+
+namespace NPeProtector
+{
+   /**
+    * @brief Compile source code into SCommand array for next processing in Protector
+    * @param[in] input character stream of source code
+    * @return Array of SCommand
+    */
+   std::vector<SCommand> compile(std::basic_istream<char, std::char_traits<char> > & input);
+}
+
+#endif
@@ -0,0 +1,324 @@
+#include "CLexicalAnalizer.h"
+#include "ctype.h"
+#include <string>
+#include "..\library\Types.h"
+#include <assert.h>
+#include <iostream>
+
+using std::vector;
+using std::string;
+using std::basic_istream;
+using std::char_traits;
+using std::getline;
+using std::exception;
+using std::stoul;
+
+#define ARRAY_SIZE(array) (sizeof((array))/sizeof((array[0])))
+
+namespace NPeProtector
+{
+namespace
+{
+   // todo move to impl
+   const char * const sCategories[] =
+   {
+      ",",
+//      ".",
+      ":",
+      "-",
+      "+",
+      "(",
+      ")",
+      "[",
+      "]",
+      "*",
+      // keywords
+      "IMPORT",
+      "EXTERN",
+      "DUP",
+      "PTR",
+      "SECTION",
+      "DIRECTIVE"
+   };
+
+   vector<string> splitLine(string line)
+   {
+      vector<string> result;
+
+      // skip comments
+      line = string(line, 0, line.find(';'));
+
+      for (unsigned int beginPosition = 0, length = 0; beginPosition < line.size();)
+      {
+         if ((beginPosition + length == line.size()) || line[beginPosition + length] == ' ' || line[beginPosition + length] == '\t')
+         {
+            if (length > 0)
+            {
+               // add name
+               result.push_back(line.substr(beginPosition, length));
+               beginPosition += length + 1;
+               length = 0;
+            }
+            else
+            {
+               // skip space
+               beginPosition += 1;
+            }
+         }
+         else if (line[beginPosition + length] == '"')
+         {
+            if (length > 0)
+            {
+               // add name
+               result.push_back(line.substr(beginPosition, length));
+            }
+
+            const size_t beginStringPosition = beginPosition + length;
+
+            // add string
+            const size_t quotePosition = line.find("\"", beginStringPosition + 1);
+            if (quotePosition == string::npos)
+            {
+               throw exception("wrong quote");
+            }
+            else
+            {
+               const size_t endStringPosition = quotePosition + 1;
+               result.push_back(line.substr(beginStringPosition, endStringPosition - beginStringPosition));
+            }
+            beginPosition = quotePosition + 1;
+            length = 0;
+         }
+         else if (!isalnum(line[beginPosition + length]) && line[beginPosition + length] != '_' && line[beginPosition + length] != '.')
+         {
+            if (length > 0)
+            {
+               // add name
+               result.push_back(line.substr(beginPosition, length)); 
+
+               // add character
+               result.push_back(line.substr(beginPosition + length, 1));
+
+               beginPosition += length + 1;
+               length = 0;
+            }
+            else
+            {
+               // add character
+               result.push_back(line.substr(beginPosition, 1));
+               beginPosition += 1;
+            }
+         }
+         else
+         {
+            length += 1;
+         }
+      }
+      return result;
+   }
+
+   vector<string> splitFile(basic_istream<char, char_traits<char> > & input)
+   {
+      vector<string> lines;
+      string line;
+      while (getline(input, line))
+      {
+         lines.push_back(line);
+      }
+      return lines;
+   }
+
+   vector<vector<string> > split(basic_istream<char, char_traits<char> > & input)
+   {
+      vector<vector<string> > tokens;
+
+      const vector<string> & lines = splitFile(input);
+
+      for (unsigned int i = 0; i < lines.size(); ++i)
+      {
+         tokens.push_back(splitLine(lines[i]));
+      }
+      return tokens;
+   }
+
+   //TODO find count of vector
+   SToken getToken(const string & stringToken)
+   {
+      assert(!stringToken.empty());
+
+      // scan for standard tokens
+      for (int i = 0; i < ARRAY_SIZE(sCategories); ++i)
+      {
+         if (!_strcmpi(stringToken.c_str(), sCategories[i]))
+         {
+            return SToken(NCategory::EType(i));
+         }
+      }
+
+      // TODO: create loop for this
+
+      // scan for instructions
+      for (int i = 0; i < NInstruction::gSize; ++i)
+      {
+         if (!_strcmpi(stringToken.c_str(), NInstruction::gStrings[i]))
+         {
+            return SToken(NCategory::INSTRUCTION, i);
+         }
+      }
+
+      // scan for registers
+      for (int i = 0; i < NRegister::gSize; ++i)
+      {
+         if (!_strcmpi(stringToken.c_str(), NRegister::gStrings[i]))
+         {
+            return SToken(NCategory::REGISTER, i);
+         }
+      }
+
+      // scan for prefixes
+      for (int i = 0; i < NPrefix::gSize; ++i)
+      {
+         if (!_strcmpi(stringToken.c_str(), NPrefix::gStrings[i]))
+         {
+            return SToken(NCategory::PREFIX, i);
+         }
+      }
+
+      // scan for data types
+      for (int i = 0; i < NDataType::gSize; ++i)
+      {
+         if (!_strcmpi(stringToken.c_str(), NDataType::gStrings[i]))
+         {
+            return SToken(NCategory::DATA_TYPE, i);
+         }
+      }
+
+      // scan for segments
+      for (int i = 0; i < NSegment::gSize; ++i)
+      {
+         if (!_strcmpi(stringToken.c_str(), NSegment::gStrings[i]))
+         {
+            return SToken(NCategory::SEGMENT, i);
+         }
+      }
+
+      if (stringToken[0] == '"')
+      {
+         return SToken(NCategory::STRING, 0, stringToken.substr(1, stringToken.size() - 2));
+      }
+
+      if (isdigit(stringToken[0]))
+      {
+         int base = 10;
+         string digits = stringToken;
+
+         if (stringToken.back() == 'h' || stringToken.back() == 'H')
+         {
+            base = 16;
+            digits = stringToken.substr(0, stringToken.size() - 1);
+         }
+
+         size_t index = 0;
+         const unsigned int constant = stoul(digits, &index, base);
+         if (index != digits.size())
+         {
+            throw exception(("wrong number : " + stringToken).c_str());
+         }
+         return SToken(NCategory::CONSTANT, 0, "", constant);
+      }
+
+      return SToken(NCategory::NAME, 0, stringToken);
+   }
+}
+
+namespace NCategory
+{
+   const char * const gStrings[] =
+   {
+      "COMMA",         // ','
+      //"DOT",           // '.' for import
+      "COLON",         // ':'
+      "MINUS",         // '-'
+      "PLUS",          // '+'
+      "OP_BRACKET",    // '('
+      "CL_BRACKET",    // ')'
+      "OP_SQ_BRACKET", // '['
+      "CL_SQ_BRACKET", // ']'
+      "ASTERIX",       // '*'
+      // keywords
+      "IMPORT",
+      "EXTERN",
+      "DUP",
+      "PTR",
+      "SECTION",
+      "DIRECTIVE",
+      // groups
+      "DATA_TYPE",   // map to type NDataType::EType
+      "PREFIX",      // map to type NPrefix::EType
+      "INSTRUCTION", // map to type NInstruction::EType
+      "REGISTER",    // map to type NRegister::EType
+      "SEGMENT",     // map to type NSegment::EType
+      // undefined string
+      "NAME",
+      "STRING",
+      "CONSTANT"
+   };
+   const int gSize = ARRAY_SIZE(gStrings);
+}
+
+   SToken::SToken() 
+      : mType()
+      , mIndex()
+      , mData()
+      , mConstant()
+   {
+   }
+
+   SToken::SToken(const NCategory::EType type, int index /*= 0*/, string name /*= string()*/, DWORD constant /*= 0*/)
+      : mType(type)
+      , mIndex(index)
+      , mData(name)
+      , mConstant(constant)
+   {
+   }
+
+   bool isMatch(const vector<SToken> & tokens, const vector<NCategory::EType> & categories)
+   {
+      bool result = categories.empty();
+      if (!result)
+      {
+         unsigned int i = 0;
+         for (; i < categories.size() && i < tokens.size(); ++i)
+         {
+            if (tokens[i].mType != categories[i])
+            {
+               break;
+            }
+         }
+         result = i == categories.size();
+      }
+      return result;
+   }
+
+   vector<vector<SToken> > parse(basic_istream<char, char_traits<char> > & input)
+   {
+      const vector<vector<string> > & tokens = split(input);
+      
+      vector<vector<SToken> > result;
+
+      for (unsigned int i = 0; i < tokens.size(); ++i)
+      {
+         vector<SToken> lineTokens;
+
+         for (unsigned int j = 0; j < tokens[i].size(); ++j)
+         {
+            if (!tokens[i][j].empty())
+            {
+               lineTokens.push_back(getToken(tokens[i][j]));
+            }
+         }
+         result.push_back(lineTokens);
+      }
+      return result;
+   }
+}