jucipp/src/utility.cpp

#include "utility.hpp"
#include <algorithm>
#include <cstring>
#include <vector>

/// Invokes the on_exit callback when the guard is destroyed, provided a callback is set.
ScopeGuard::~ScopeGuard() {
  if(!on_exit)
    return; // Nothing registered
  on_exit();
}

/// Counts the UTF-8 encoded characters in a byte range of text.
///
/// @param text   UTF-8 encoded bytes.
/// @param pos    Byte offset where counting starts.
/// @param length Maximum number of bytes to examine from pos; std::string::npos means
///               "until the end of text". The range is clamped to the end of text.
/// @return Number of UTF-8 lead bytes (including ASCII bytes) found in the range. Bytes that
///         cannot start a character (continuation bytes and bytes >= 0xF8) are skipped
///         without being counted. A character that starts inside the range is counted even
///         if its trailing bytes lie outside of it.
size_t utf8_character_count(const std::string &text, size_t pos, size_t length) noexcept {
  if(pos >= text.size())
    return 0;
  // Clamp through subtraction: pos + length would wrap around for large lengths other than npos
  const size_t end = pos + std::min(length, text.size() - pos);

  size_t characters = 0;
  while(pos < end) {
    const auto byte = static_cast<unsigned char>(text[pos]);
    if(byte <= 0b01111111) { // Single byte (ASCII)
      ++characters;
      ++pos;
    }
    else if(byte >= 0b11111000) // Invalid UTF-8 byte
      ++pos;
    else if(byte >= 0b11110000) { // Lead byte of a 4-byte sequence
      ++characters;
      pos += 4;
    }
    else if(byte >= 0b11100000) { // Lead byte of a 3-byte sequence
      ++characters;
      pos += 3;
    }
    else if(byte >= 0b11000000) { // Lead byte of a 2-byte sequence
      ++characters;
      pos += 2;
    }
    else // Invalid start of UTF-8 character (continuation byte)
      ++pos;
  }
  return characters;
}

/// Returns how many UTF-8 bytes, starting at start_pos, make up the given number of UTF-16 code units.
///
/// @param text       UTF-8 encoded bytes.
/// @param code_units Number of UTF-16 code units to cover. A 4-byte UTF-8 sequence counts as two
///                   code units, every other lead byte (including ASCII) as one.
/// @param start_pos  Byte offset in text where scanning starts.
/// @return Number of bytes from start_pos needed to reach at least code_units code units, or the
///         number of bytes left in text if it ends first. Returns 0 when code_units is 0 or
///         start_pos is at or past the end of text. The result never reaches past the end of text.
size_t utf16_code_units_byte_count(const std::string &text, size_t code_units, size_t start_pos) {
  if(code_units == 0 || start_pos >= text.size())
    return 0;

  size_t pos = start_pos;
  size_t current_code_units = 0;
  while(pos < text.size() && current_code_units < code_units) {
    const auto byte = static_cast<unsigned char>(text[pos]);
    if(byte <= 0b01111111) { // Single byte (ASCII)
      ++current_code_units;
      ++pos;
    }
    else if(byte >= 0b11111000) // Invalid UTF-8 byte
      ++pos;
    else if(byte >= 0b11110000) { // 4-byte sequence: encoded as a surrogate pair in UTF-16
      current_code_units += 2;
      pos += 4;
    }
    else if(byte >= 0b11100000) { // 3-byte sequence
      ++current_code_units;
      pos += 3;
    }
    else if(byte >= 0b11000000) { // 2-byte sequence
      ++current_code_units;
      pos += 2;
    }
    else // Invalid start of UTF-8 character (continuation byte)
      ++pos;
  }
  // A multi-byte sequence truncated at the end of text would otherwise move pos past the last
  // byte, making the returned byte count larger than what is actually available
  pos = std::min(pos, text.size());
  return pos - start_pos;
}

/// Counts the UTF-16 code units needed to represent a byte range of UTF-8 encoded text.
///
/// @param text   UTF-8 encoded bytes.
/// @param pos    Byte offset where counting starts.
/// @param length Maximum number of bytes to examine from pos; std::string::npos means
///               "until the end of text". The range is clamped to the end of text.
/// @return Number of UTF-16 code units: two for each 4-byte UTF-8 sequence, one for every other
///         lead byte (including ASCII). Bytes that cannot start a character (continuation bytes
///         and bytes >= 0xF8) are skipped without being counted.
size_t utf16_code_unit_count(const std::string &text, size_t pos, size_t length) {
  if(pos >= text.size())
    return 0;
  // Clamp through subtraction: pos + length would wrap around for large lengths other than npos
  const size_t end = pos + std::min(length, text.size() - pos);

  size_t code_units = 0;
  while(pos < end) {
    const auto byte = static_cast<unsigned char>(text[pos]);
    if(byte <= 0b01111111) { // Single byte (ASCII)
      ++code_units;
      ++pos;
    }
    else if(byte >= 0b11111000) // Invalid UTF-8 byte
      ++pos;
    else if(byte >= 0b11110000) { // 4-byte sequence: encoded as a surrogate pair in UTF-16
      code_units += 2;
      pos += 4;
    }
    else if(byte >= 0b11100000) { // 3-byte sequence
      ++code_units;
      pos += 3;
    }
    else if(byte >= 0b11000000) { // 2-byte sequence
      ++code_units;
      pos += 2;
    }
    else // Invalid start of UTF-8 character (continuation byte)
      ++pos;
  }
  return code_units;
}

/// Checks whether the null-terminated string str begins with test.
///
/// @param str  Null-terminated string to inspect.
/// @param test Prefix to look for.
/// @return true if every character of test matches str from its start; false on the first
///         mismatch or if str terminates before test has been fully matched.
bool starts_with(const char *str, const std::string &test) noexcept {
  const char *cursor = str;
  for(const char expected : test) {
    // Reaching the terminator means str is shorter than test
    if(*cursor == '\0' || *cursor != expected)
      return false;
    ++cursor;
  }
  return true;
}

/// Checks whether the null-terminated string str begins with the null-terminated string test.
///
/// @param str  Null-terminated string to inspect.
/// @param test Null-terminated prefix to look for.
/// @return true if all of test matches the start of str; false on the first mismatch or if
///         str ends before test does.
bool starts_with(const char *str, const char *test) noexcept {
  while(*test != '\0') {
    // Reaching the terminator of str means it is shorter than test
    if(*str == '\0' || *str != *test)
      return false;
    ++str;
    ++test;
  }
  return true;
}

/// Checks whether str begins with test.
///
/// @param str  String to inspect.
/// @param test Prefix to look for.
/// @return true if test is no longer than str and matches its leading characters.
bool starts_with(const std::string &str, const std::string &test) noexcept {
  if(test.size() > str.size())
    return false; // A prefix cannot be longer than the string itself
  return std::equal(test.begin(), test.end(), str.begin());
}

/// Checks whether str begins with the null-terminated string test.
///
/// @param str  String to inspect.
/// @param test Null-terminated prefix to look for.
/// @return true if all of test matches the start of str; false on the first mismatch or if
///         str is exhausted before test ends.
bool starts_with(const std::string &str, const char *test) noexcept {
  auto it = str.begin();
  for(; *test != '\0'; ++test, ++it) {
    // Running out of str while test still has characters means str is too short
    if(it == str.end() || *it != *test)
      return false;
  }
  return true;
}

/// Checks whether the part of str beginning at byte offset pos starts with test.
///
/// @param str  String to inspect.
/// @param pos  Offset in str where the comparison starts.
/// @param test Prefix to look for.
/// @return false if pos is past the end of str; otherwise true if test fits in the remaining
///         characters and matches them.
bool starts_with(const std::string &str, size_t pos, const std::string &test) noexcept {
  if(pos > str.size())
    return false;
  const size_t remaining = str.size() - pos;
  if(test.size() > remaining)
    return false; // Not enough characters left to hold test
  return std::equal(test.begin(), test.end(), str.data() + pos);
}

/// Checks whether the part of str beginning at byte offset pos starts with the
/// null-terminated string test.
///
/// @param str  String to inspect.
/// @param pos  Offset in str where the comparison starts.
/// @param test Null-terminated prefix to look for.
/// @return false if pos is past the end of str; otherwise true if all of test matches the
///         characters of str from pos on.
bool starts_with(const std::string &str, size_t pos, const char *test) noexcept {
  const size_t size = str.size();
  if(pos > size)
    return false;
  for(size_t index = pos; *test != '\0'; ++index, ++test) {
    // Running out of str while test still has characters means the remainder is too short
    if(index >= size || str[index] != *test)
      return false;
  }
  return true;
}

/// Checks whether str ends with test.
///
/// @param str  String to inspect.
/// @param test Suffix to look for.
/// @return true if test is no longer than str and matches its trailing characters.
bool ends_with(const std::string &str, const std::string &test) noexcept {
  if(str.size() < test.size())
    return false; // A suffix cannot be longer than the string itself
  // Walk both strings backwards so no offset arithmetic is needed
  return std::equal(test.rbegin(), test.rend(), str.rbegin());
}

/// Checks whether str ends with the null-terminated string test.
///
/// @param str  String to inspect.
/// @param test Null-terminated suffix to look for.
/// @return true if test is no longer than str and matches its trailing characters.
bool ends_with(const std::string &str, const char *test) noexcept {
  const size_t suffix_size = std::strlen(test);
  if(str.size() < suffix_size)
    return false; // A suffix cannot be longer than the string itself
  const char *tail = str.data() + (str.size() - suffix_size);
  return std::equal(test, test + suffix_size, tail);
}

/// Returns a copy of input where every character found in escape_chars is preceded by a backslash.
///
/// @param input        Text to escape.
/// @param escape_chars Characters that should get a backslash in front of them.
/// @return The escaped text; characters not in escape_chars are copied unchanged.
std::string escape(const std::string &input, const std::set<char> &escape_chars) {
  std::string escaped;
  escaped.reserve(input.size()); // Lower bound: grows further for each escaped character
  for(const char chr : input) {
    if(escape_chars.count(chr) > 0)
      escaped.push_back('\\');
    escaped.push_back(chr);
  }
  return escaped;
}

/// Converts every byte of input to its two-digit lowercase hexadecimal representation.
///
/// @param input Bytes to convert.
/// @return A string twice as long as input, with the high nibble of each byte first.
std::string to_hex_string(const std::string &input) {
  static constexpr char digits[] = "0123456789abcdef";
  std::string hex;
  hex.reserve(input.size() * 2);
  for(const char chr : input) {
    // Go through unsigned char so bytes >= 0x80 do not produce negative indices
    const auto byte = static_cast<unsigned char>(chr);
    hex.push_back(digits[byte >> 4]);
    hex.push_back(digits[byte & 0x0f]);
  }
  return hex;
}

/// Compares two dot-separated version strings part by part.
///
/// Each string is split on '.' into integer parts. Digits are used as-is, while any other
/// character is replaced by the decimal value of its byte (for instance 'a' becomes "97"),
/// so letters take part in the comparison as numbers. Empty parts are ignored, and a part
/// that std::stoi cannot convert (value out of range for int) is silently left out.
///
/// @param lhs First version string.
/// @param rhs Second version string.
/// @return 0 if both strings yield the same parts, -1 if the parts of lhs order
///         lexicographically before those of rhs, and 1 otherwise.
int version_compare(const std::string &lhs, const std::string &rhs) {
  const auto parse_parts = [](const std::string &version) {
    std::vector<int> parts;
    std::string digits;
    // Turns the digits collected so far into one part and resets the buffer
    const auto flush = [&parts, &digits] {
      if(digits.empty())
        return;
      try {
        parts.emplace_back(std::stoi(digits));
      }
      catch(...) {
        // Best effort: a part that cannot be converted is dropped
      }
      digits.clear();
    };
    for(const char chr : version) {
      if(chr == '.')
        flush();
      else if(chr >= '0' && chr <= '9')
        digits += chr;
      else
        digits += std::to_string(static_cast<unsigned char>(chr)); // Convert for instance letters to numbers
    }
    flush();
    return parts;
  };

  const auto lhs_parts = parse_parts(lhs);
  const auto rhs_parts = parse_parts(rhs);
  if(lhs_parts == rhs_parts)
    return 0;
  return lhs_parts < rhs_parts ? -1 : 1;
}
Renamed C++ header and source files to use proper C++ file extensions. 6 years ago			`#include "utility.hpp"`
Made use of prettier library when possible to speed up prettier formatting 4 years ago			`#include <algorithm>`
Added and made use of string functions starts_with and ends_with, and minor cleanup for selection window code 6 years ago			`#include <cstring>`
Added version_compare and adds parallel to default value in preference item project.cmake.compile_command 4 years ago			`#include <vector>`
Added and made use of ScopeGuard class 7 years ago
			`ScopeGuard::~ScopeGuard() {`
			`if(on_exit)`
			`on_exit();`
			`}`
Added and made use of string functions starts_with and ends_with, and minor cleanup for selection window code 6 years ago
Improved resource use of Terminal::print 5 years ago			`size_t utf8_character_count(const std::string &text, size_t pos, size_t length) noexcept {`
Language client: added support for type declaration and implementation location. Also fixes to utf-8 byte count and regular utf-16 offsets, and cleaned up write_request and write_notification calls 5 years ago			`size_t characters = 0;`
Improved resource use of Terminal::print 5 years ago			`auto size = length == std::string::npos ? text.size() : std::min(pos + length, text.size());`
Language client: improved support for both UTF-16 offsets and offsetEncoding set to utf-8 5 years ago			`for(; pos < size;) {`
			`if(static_cast<unsigned char>(text[pos]) <= 0b01111111) {`
Language client: added support for type declaration and implementation location. Also fixes to utf-8 byte count and regular utf-16 offsets, and cleaned up write_request and write_notification calls 5 years ago			`++characters;`
Language client: improved support for both UTF-16 offsets and offsetEncoding set to utf-8 5 years ago			`++pos;`
			`}`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11111000) // Invalid UTF-8 byte`
			`++pos;`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11110000) {`
Language client: added support for type declaration and implementation location. Also fixes to utf-8 byte count and regular utf-16 offsets, and cleaned up write_request and write_notification calls 5 years ago			`++characters;`
Language client: improved support for both UTF-16 offsets and offsetEncoding set to utf-8 5 years ago			`pos += 4;`
			`}`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11100000) {`
Language client: added support for type declaration and implementation location. Also fixes to utf-8 byte count and regular utf-16 offsets, and cleaned up write_request and write_notification calls 5 years ago			`++characters;`
Language client: improved support for both UTF-16 offsets and offsetEncoding set to utf-8 5 years ago			`pos += 3;`
			`}`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11000000) {`
Language client: added support for type declaration and implementation location. Also fixes to utf-8 byte count and regular utf-16 offsets, and cleaned up write_request and write_notification calls 5 years ago			`++characters;`
Language client: improved support for both UTF-16 offsets and offsetEncoding set to utf-8 5 years ago			`pos += 2;`
			`}`
			`else // // Invalid start of UTF-8 character`
			`++pos;`
Fixed snippet argument offsets 6 years ago			`}`
Language client: added support for type declaration and implementation location. Also fixes to utf-8 byte count and regular utf-16 offsets, and cleaned up write_request and write_notification calls 5 years ago			`return characters;`
Fixed snippet argument offsets 6 years ago			`}`

Language client: improved support for both UTF-16 offsets and offsetEncoding set to utf-8 5 years ago			`size_t utf16_code_units_byte_count(const std::string &text, size_t code_units, size_t start_pos) {`
			`if(code_units == 0)`
			`return 0;`

			`size_t pos = start_pos;`
			`size_t current_code_units = 0;`
			`for(; pos < text.size();) {`
			`if(static_cast<unsigned char>(text[pos]) <= 0b01111111) {`
			`++current_code_units;`
			`++pos;`
			`if(current_code_units >= code_units)`
			`break;`
			`}`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11111000) // Invalid UTF-8 byte`
			`++pos;`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11110000) {`
			`current_code_units += 2;`
			`pos += 4;`
			`if(current_code_units >= code_units)`
			`break;`
			`}`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11100000) {`
			`++current_code_units;`
			`pos += 3;`
			`if(current_code_units >= code_units)`
			`break;`
			`}`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11000000) {`
			`++current_code_units;`
			`pos += 2;`
			`if(current_code_units >= code_units)`
			`break;`
			`}`
			`else // // Invalid start of UTF-8 character`
			`++pos;`
			`}`
			`return pos - start_pos;`
			`}`

Language client: added support for type declaration and implementation location. Also fixes to utf-8 byte count and regular utf-16 offsets, and cleaned up write_request and write_notification calls 5 years ago			`size_t utf16_code_unit_count(const std::string &text, size_t pos, size_t length) {`
			`size_t code_units = 0;`
			`auto size = length == std::string::npos ? text.size() : std::min(pos + length, text.size());`
			`for(; pos < size;) {`
			`if(static_cast<unsigned char>(text[pos]) <= 0b01111111) {`
			`++code_units;`
			`++pos;`
			`}`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11111000) // Invalid UTF-8 byte`
			`++pos;`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11110000) {`
			`code_units += 2;`
			`pos += 4;`
			`}`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11100000) {`
			`++code_units;`
			`pos += 3;`
			`}`
			`else if(static_cast<unsigned char>(text[pos]) >= 0b11000000) {`
			`++code_units;`
			`pos += 2;`
			`}`
			`else // // Invalid start of UTF-8 character`
			`++pos;`
			`}`
			`return code_units;`
			`}`

Added and made use of string functions starts_with and ends_with, and minor cleanup for selection window code 6 years ago			`bool starts_with(const char *str, const std::string &test) noexcept {`
			`for(size_t i = 0; i < test.size(); ++i) {`
			`if(*str == '\0')`
			`return false;`
			`if(*str != test[i])`
			`return false;`
			`++str;`
			`}`
			`return true;`
			`}`

			`bool starts_with(const char str, const char test) noexcept {`
			`for(; *test != '\0'; ++test) {`
			`if(*str == '\0')`
			`return false;`
			`if(str != test)`
			`return false;`
			`++str;`
			`}`
			`return true;`
			`}`

			`bool starts_with(const std::string &str, const std::string &test) noexcept {`
			`return str.compare(0, test.size(), test) == 0;`
			`}`

			`bool starts_with(const std::string &str, const char *test) noexcept {`
			`for(size_t i = 0; i < str.size(); ++i) {`
			`if(*test == '\0')`
			`return true;`
			`if(str[i] != *test)`
			`return false;`
			`++test;`
			`}`
			`return *test == '\0';`
			`}`

			`bool starts_with(const std::string &str, size_t pos, const std::string &test) noexcept {`
			`if(pos > str.size())`
			`return false;`
			`return str.compare(pos, test.size(), test) == 0;`
			`}`

			`bool starts_with(const std::string &str, size_t pos, const char *test) noexcept {`
			`if(pos > str.size())`
			`return false;`
			`for(size_t i = pos; i < str.size(); ++i) {`
			`if(*test == '\0')`
			`return true;`
			`if(str[i] != *test)`
			`return false;`
			`++test;`
			`}`
			`return *test == '\0';`
			`}`

			`bool ends_with(const std::string &str, const std::string &test) noexcept {`
			`if(test.size() > str.size())`
			`return false;`
			`return str.compare(str.size() - test.size(), test.size(), test) == 0;`
			`}`

			`bool ends_with(const std::string &str, const char *test) noexcept {`
			`auto test_size = strlen(test);`
			`if(test_size > str.size())`
			`return false;`
			`return str.compare(str.size() - test_size, test_size, test) == 0;`
			`}`
Made use of prettier library when possible to speed up prettier formatting 4 years ago
			`std::string escape(const std::string &input, const std::set<char> &escape_chars) {`
			`std::string result;`
			`result.reserve(input.size());`
			`for(auto &chr : input) {`
			`if(escape_chars.find(chr) != escape_chars.end())`
			`result += '\\';`
			`result += chr;`
			`}`
			`return result;`
			`}`

			`std::string to_hex_string(const std::string &input) {`
			`std::string result;`
			`result.reserve(input.size() * 2);`
			`std::string hex_chars = "0123456789abcdef";`
			`for(auto &chr : input) {`
			`result += hex_chars[static_cast<unsigned char>(chr) >> 4];`
			`result += hex_chars[static_cast<unsigned char>(chr) & 0x0f];`
			`}`
			`return result;`
			`}`
Added version_compare and adds parallel to default value in preference item project.cmake.compile_command 4 years ago
			`int version_compare(const std::string &lhs, const std::string &rhs) {`
			`static auto get_parts = [](const std::string &str) {`
			`std::vector<int> result;`
			`std::string tmp;`
			`for(auto &chr : str) {`
			`if(chr >= '0' && chr <= '9')`
			`tmp += chr;`
			`else if(chr == '.') {`
			`if(!tmp.empty()) {`
			`try {`
			`result.emplace_back(std::stoi(tmp));`
			`}`
			`catch(...) {`
			`}`
			`tmp.clear();`
			`}`
			`}`
			`else`
			`tmp += std::to_string(static_cast<unsigned char>(chr)); // Convert for instance letters to numbers`
			`}`
			`if(!tmp.empty()) {`
			`try {`
			`result.emplace_back(std::stoi(tmp));`
			`}`
			`catch(...) {`
			`}`
			`tmp.clear();`
			`}`
			`return result;`
			`};`
			`auto lhs_parts = get_parts(lhs);`
			`auto rhs_parts = get_parts(rhs);`
			`if(std::equal(lhs_parts.begin(), lhs_parts.end(), rhs_parts.begin(), rhs_parts.end()))`
			`return 0;`
			`if(std::lexicographical_compare(lhs_parts.begin(), lhs_parts.end(), rhs_parts.begin(), rhs_parts.end()))`
			`return -1;`
			`return 1;`
			`}`