charman.cpp 1.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657
  1. #include <regex>
  2. #include <string>
  3. #include <vector>
  4. #include "charman.h"
  5. #include "zf_log.h"
  6. void CharMan::validate(void) {
  7. bool valid = true;
  8. for (int x = 0; x < text_offsets.size(); ++x) {
  9. int offset = text_offsets[x];
  10. if (offset >= 0) {
  11. if (text[x] != buffer[offset]) {
  12. ZF_LOGE("validate: %d off %d [%c != %c]", x, offset, text[x],
  13. buffer[offset]);
  14. valid = false;
  15. }
  16. if (text[x] != work[offset]) {
  17. ZF_LOGE("validate: %d off %d [%c != %c]", x, offset, text[x],
  18. work[offset]);
  19. valid = false;
  20. }
  21. }
  22. }
  23. if (!valid) {
  24. ZF_LOGE("* NOT VALID* Somethings hosed.");
  25. }
  26. }
  27. void CharMan::regular_expressions(void) {
  28. std::regex words("[a-zA-Z]+( [a-zA-Z]+)+");
  29. // I need position and length.
  30. for (auto it =
  31. std::sregex_iterator(this->text.begin(), this->text.end(), words);
  32. it != std::sregex_iterator(); ++it) {
  33. pos_len.push_back(std::make_pair(it->position(), it->length()));
  34. ZF_LOGD("pos %d len %d", (int)it->position(), (int)it->length());
  35. }
  36. }
  37. CharMan::CharMan(std::string &buffer, std::string &work, std::string &text,
  38. std::vector<int> &text_offsets)
  39. : buffer(buffer), work(work), text(text), text_offsets(text_offsets) {
  40. /*
  41. this->buffer = buffer;
  42. this->work = work;
  43. this->text = text;
  44. this->text_offsets = text_offsets;
  45. */
  46. validate();
  47. regular_expressions();
  48. ZF_LOGD("Found %d word groups", pos_len.size());
  49. };
  50. CharMan::~CharMan() { validate(); }