ES-DE/es-core/src/utils/StringUtil.cpp

#include "utils/StringUtil.h"

namespace Utils
{
	namespace String
	{
		unsigned int chars2Unicode(const std::string& _string, size_t& _cursor)
		{
			const char&  c      = _string[_cursor];
			unsigned int result = '?';

			if((c & 0x80) == 0) // 0xxxxxxx, one byte character
			{
				// 0xxxxxxx
				result = ((_string[_cursor++]       )      );
			}
			else if((c & 0xE0) == 0xC0) // 110xxxxx, two byte character
			{
				// 110xxxxx 10xxxxxx
				result = ((_string[_cursor++] & 0x1F) <<  6) |
						 ((_string[_cursor++] & 0x3F)      );
			}
			else if((c & 0xF0) == 0xE0) // 1110xxxx, three byte character
			{
				// 1110xxxx 10xxxxxx 10xxxxxx
				result = ((_string[_cursor++] & 0x0F) << 12) |
						 ((_string[_cursor++] & 0x3F) <<  6) |
						 ((_string[_cursor++] & 0x3F)      );
			}
			else if((c & 0xF8) == 0xF0) // 11110xxx, four byte character
			{
				// 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
				result = ((_string[_cursor++] & 0x07) << 18) |
						 ((_string[_cursor++] & 0x3F) << 12) |
						 ((_string[_cursor++] & 0x3F) <<  6) |
						 ((_string[_cursor++] & 0x3F)      );
			}
			else
			{
				// error, invalid unicode
				++_cursor;
			}

			return result;

		} // chars2Unicode

		std::string unicode2Chars(const unsigned int _unicode)
		{
			std::string result;

			if(_unicode < 0x80) // one byte character
			{
				result += ((_unicode      ) & 0xFF);
			}
			else if(_unicode < 0x800) // two byte character
			{
				result += ((_unicode >>  6) & 0xFF) | 0xC0;
				result += ((_unicode      ) & 0x3F) | 0x80;
			}
			else if(_unicode < 0xFFFF) // three byte character
			{
				result += ((_unicode >> 12) & 0xFF) | 0xE0;
				result += ((_unicode >>  6) & 0x3F) | 0x80;
				result += ((_unicode      ) & 0x3F) | 0x80;
			}
			else if(_unicode <= 0x1fffff) // four byte character
			{
				result += ((_unicode >> 18) & 0xFF) | 0xF0;
				result += ((_unicode >> 12) & 0x3F) | 0x80;
				result += ((_unicode >>  6) & 0x3F) | 0x80;
				result += ((_unicode      ) & 0x3F) | 0x80;
			}
			else
			{
				// error, invalid unicode
				result += '?';
			}

			return result;

		} // unicode2Chars

		size_t nextCursor(const std::string& _string, const size_t _cursor)
		{
			size_t result = _cursor;

			while(result < _string.length())
			{
				++result;

				if((_string[result] & 0xC0) != 0x80) // break if current character is not 10xxxxxx
					break;
			}

			return result;

		} // nextCursor

		size_t prevCursor(const std::string& _string, const size_t _cursor)
		{
			size_t result = _cursor;

			while(result > 0)
			{
				--result;

				if((_string[result] & 0xC0) != 0x80) // break if current character is not 10xxxxxx
					break;
			}

			return result;

		} // prevCursor

		size_t moveCursor(const std::string& _string, const size_t _cursor, const int _amount)
		{
			size_t result = _cursor;

			if(_amount > 0)
			{
				for(int i = 0; i < _amount; ++i)
					result = nextCursor(_string, result);
			}
			else if(_amount < 0)
			{
				for(int i = _amount; i < 0; ++i)
					result = prevCursor(_string, result);
			}

			return result;

		} // moveCursor

		void trim(std::string& _string)
		{
			if(_string.size())
			{
				size_t cursorB = 0;
				size_t cursorE = _string.size();
			
				while((cursorB < _string.size()) && _string[cursorB] == ' ')
					++cursorB;

				while((cursorE > 0) && _string[cursorE - 1] == ' ')
					--cursorE;

				_string.erase(_string.begin() + cursorE, _string.end());
				_string.erase(_string.begin(), _string.begin() + cursorB);
			}

		} // trim

	} // String::

} // Utils::
Move StringUtil to utils subfolder Added utils/FileSystemUtils which will replace some boost::filesystem functions in the future 2017-11-15 15:59:39 +00:00			`#include "utils/StringUtil.h"`

			`namespace Utils`
			`{`
			`namespace String`
			`{`
			`unsigned int chars2Unicode(const std::string& _string, size_t& _cursor)`
			`{`
			`const char& c = _string[_cursor];`
			`unsigned int result = '?';`

			`if((c & 0x80) == 0) // 0xxxxxxx, one byte character`
			`{`
			`// 0xxxxxxx`
			`result = ((_string[_cursor++] ) );`
			`}`
			`else if((c & 0xE0) == 0xC0) // 110xxxxx, two byte character`
			`{`
			`// 110xxxxx 10xxxxxx`
			`result = ((_string[_cursor++] & 0x1F) << 6) \|`
			`((_string[_cursor++] & 0x3F) );`
			`}`
			`else if((c & 0xF0) == 0xE0) // 1110xxxx, three byte character`
			`{`
			`// 1110xxxx 10xxxxxx 10xxxxxx`
			`result = ((_string[_cursor++] & 0x0F) << 12) \|`
			`((_string[_cursor++] & 0x3F) << 6) \|`
			`((_string[_cursor++] & 0x3F) );`
			`}`
			`else if((c & 0xF8) == 0xF0) // 11110xxx, four byte character`
			`{`
			`// 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx`
			`result = ((_string[_cursor++] & 0x07) << 18) \|`
			`((_string[_cursor++] & 0x3F) << 12) \|`
			`((_string[_cursor++] & 0x3F) << 6) \|`
			`((_string[_cursor++] & 0x3F) );`
			`}`
			`else`
			`{`
			`// error, invalid unicode`
			`++_cursor;`
			`}`

			`return result;`

			`} // chars2Unicode`

			`std::string unicode2Chars(const unsigned int _unicode)`
			`{`
			`std::string result;`

			`if(_unicode < 0x80) // one byte character`
			`{`
Silence warnings 2017-11-17 14:58:52 +00:00			`result += ((_unicode ) & 0xFF);`
Move StringUtil to utils subfolder Added utils/FileSystemUtils which will replace some boost::filesystem functions in the future 2017-11-15 15:59:39 +00:00			`}`
			`else if(_unicode < 0x800) // two byte character`
			`{`
Silence warnings 2017-11-17 14:58:52 +00:00			`result += ((_unicode >> 6) & 0xFF) \| 0xC0;`
Move StringUtil to utils subfolder Added utils/FileSystemUtils which will replace some boost::filesystem functions in the future 2017-11-15 15:59:39 +00:00			`result += ((_unicode ) & 0x3F) \| 0x80;`
			`}`
			`else if(_unicode < 0xFFFF) // three byte character`
			`{`
Silence warnings 2017-11-17 14:58:52 +00:00			`result += ((_unicode >> 12) & 0xFF) \| 0xE0;`
Move StringUtil to utils subfolder Added utils/FileSystemUtils which will replace some boost::filesystem functions in the future 2017-11-15 15:59:39 +00:00			`result += ((_unicode >> 6) & 0x3F) \| 0x80;`
			`result += ((_unicode ) & 0x3F) \| 0x80;`
			`}`
			`else if(_unicode <= 0x1fffff) // four byte character`
			`{`
Silence warnings 2017-11-17 14:58:52 +00:00			`result += ((_unicode >> 18) & 0xFF) \| 0xF0;`
Move StringUtil to utils subfolder Added utils/FileSystemUtils which will replace some boost::filesystem functions in the future 2017-11-15 15:59:39 +00:00			`result += ((_unicode >> 12) & 0x3F) \| 0x80;`
			`result += ((_unicode >> 6) & 0x3F) \| 0x80;`
			`result += ((_unicode ) & 0x3F) \| 0x80;`
			`}`
			`else`
			`{`
			`// error, invalid unicode`
			`result += '?';`
			`}`

			`return result;`

			`} // unicode2Chars`

			`size_t nextCursor(const std::string& _string, const size_t _cursor)`
			`{`
			`size_t result = _cursor;`

			`while(result < _string.length())`
			`{`
			`++result;`

			`if((_string[result] & 0xC0) != 0x80) // break if current character is not 10xxxxxx`
			`break;`
			`}`

			`return result;`

			`} // nextCursor`

			`size_t prevCursor(const std::string& _string, const size_t _cursor)`
			`{`
			`size_t result = _cursor;`

			`while(result > 0)`
			`{`
			`--result;`

			`if((_string[result] & 0xC0) != 0x80) // break if current character is not 10xxxxxx`
			`break;`
			`}`

			`return result;`

			`} // prevCursor`

			`size_t moveCursor(const std::string& _string, const size_t _cursor, const int _amount)`
			`{`
			`size_t result = _cursor;`

			`if(_amount > 0)`
			`{`
			`for(int i = 0; i < _amount; ++i)`
			`result = nextCursor(_string, result);`
			`}`
			`else if(_amount < 0)`
			`{`
			`for(int i = _amount; i < 0; ++i)`
			`result = prevCursor(_string, result);`
			`}`

			`return result;`

			`} // moveCursor`

			`void trim(std::string& _string)`
			`{`
			`if(_string.size())`
			`{`
			`size_t cursorB = 0;`
			`size_t cursorE = _string.size();`

			`while((cursorB < _string.size()) && _string[cursorB] == ' ')`
			`++cursorB;`

			`while((cursorE > 0) && _string[cursorE - 1] == ' ')`
			`--cursorE;`

			`_string.erase(_string.begin() + cursorE, _string.end());`
			`_string.erase(_string.begin(), _string.begin() + cursorB);`
			`}`

			`} // trim`

			`} // String::`

			`} // Utils::`