microjson.cpp 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302
  1. /*
  2. * MIT License
  3. *
  4. * Copyright (c) 2020 Alexey Edelev <semlanik@gmail.com>
  5. *
  6. * This file is part of microjson project https://git.semlanik.org/semlanik/microjson
  7. *
  8. * Permission is hereby granted, free of charge, to any person obtaining a copy of this
  9. * software and associated documentation files (the "Software"), to deal in the Software
  10. * without restriction, including without limitation the rights to use, copy, modify,
  11. * merge, publish, distribute, sublicense, and/or sell copies of the Software, and
  12. * to permit persons to whom the Software is furnished to do so, subject to the following
  13. * conditions:
  14. *
  15. * The above copyright notice and this permission notice shall be included in all copies
  16. * or substantial portions of the Software.
  17. *
  18. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
  19. * INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
  20. * PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE
  21. * FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  22. * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  23. * DEALINGS IN THE SOFTWARE.
  24. */
  25. #include "microjson.h"
  26. #include <iostream>
  27. #include <functional>
  // Debug log sink used throughout this file as `micorJsonDebug << ...`.
  // With MICROJSON_DEBUG defined the messages go to std::cout, otherwise they are dropped.
  #ifdef MICROJSON_DEBUG
  #define micorJsonDebug std::cout
  #else
  // Output stream without a stream buffer. Constructing std::ostream with a null buffer is the
  // standard way to get a stream in the bad state, so every insertion is a cheap no-op.
  // (std::ostream has no standard default constructor; relying on one is not portable.)
  struct micorJsonNull : public std::ostream {
      micorJsonNull() : std::ostream(nullptr) {}
  };
  static micorJsonNull nullout;
  #define micorJsonDebug nullout
  #endif
  namespace {

  // Phases of the `"name": value` scanner in extractNextProperty, listed in the order
  // in which a well-formed property passes through them.
  enum ParsingState {
      LookingForNameBegin = 0,  // before the opening quote of the name
      LookingForNameEnd = 1,    // inside the name, waiting for its closing quote
      LookingForSeparator = 2,  // after the name, waiting for ':'
      LookingForValueBegin = 3, // after ':', waiting for the first byte of the value
      LookingForValueEnd = 4    // inside the value, waiting for its last byte
  };

  } // namespace
  45. size_t microjson::extractNextProperty(const char *buffer, size_t size, JsonProperty &property) {
  46. if (buffer == nullptr || size == 0 || size == SIZE_MAX) {
  47. return SIZE_MAX;
  48. }
  49. property.nameBegin = SIZE_MAX;
  50. property.nameEnd = SIZE_MAX;
  51. property.valueBegin = SIZE_MAX;
  52. property.valueEnd = SIZE_MAX;
  53. property.type = JsonInvalidType;
  54. int valueBracesCounter = -1;
  55. int valueBracketsCounter = -1;
  56. int trueCounter = 3;
  57. int falseCounter = 4;
  58. std::function<bool(void)> valueEndMarker;
  59. ParsingState state = LookingForNameBegin;
  60. size_t i = 0;
  61. for (; i < size; i++) {
  62. const char byte = buffer[i];
  63. if (state == LookingForNameBegin) {
  64. if (byte == '\n' || byte == ' ' || byte == '\r' || byte == '\t') {
  65. micorJsonDebug << "Skip space" << std::endl;
  66. continue;
  67. }
  68. if (byte == '"') {
  69. micorJsonDebug << "Found name begin" << std::endl;
  70. property.nameBegin = i + 1;
  71. state = LookingForNameEnd;
  72. } else {
  73. std::cerr << "Not found name begin, unexpected" << std::endl;
  74. break;
  75. }
  76. } else if (state == LookingForNameEnd && byte == '"') {
  77. if (byte == '\n' || byte == ' ' || byte == '\r' || byte == '\t') {
  78. micorJsonDebug << "Skip space" << std::endl;
  79. continue;
  80. }
  81. if (i > 0 && buffer[i - 1] == '\\') {
  82. micorJsonDebug << "'\"' found in name" << std::endl;
  83. continue;
  84. }
  85. micorJsonDebug << "Found name end" << std::endl;
  86. property.nameEnd = i;
  87. state = LookingForSeparator;
  88. } else if (state == LookingForSeparator) {
  89. if (byte == '\n' || byte == ' ' || byte == '\r' || byte == '\t') {
  90. micorJsonDebug << "Skip space" << std::endl;
  91. continue;
  92. }
  93. if (byte == ':') {
  94. micorJsonDebug << "Found Separator" << std::endl;
  95. state = LookingForValueBegin;
  96. } else {
  97. break;
  98. }
  99. } else if (state == LookingForValueBegin) {
  100. if (byte == '\n' || byte == ' ' || byte == '\r' || byte == '\t') {
  101. micorJsonDebug << "Skip space" << std::endl;
  102. continue;
  103. }
  104. switch (byte) {
  105. case '"':
  106. valueEndMarker = [&](){
  107. return buffer[i] == '"' && buffer[i - 1] != '\\';
  108. };
  109. property.type = JsonStringType;
  110. break;
  111. case '-':
  112. case '0':
  113. case '1':
  114. case '2':
  115. case '3':
  116. case '4':
  117. case '5':
  118. case '6':
  119. case '7':
  120. case '8':
  121. case '9':
  122. valueEndMarker = [&buffer, &i](){
  123. if (buffer[i] != '+'
  124. && buffer[i] != '-'
  125. && buffer[i] != '0'
  126. && buffer[i] != '1'
  127. && buffer[i] != '2'
  128. && buffer[i] != '3'
  129. && buffer[i] != '4'
  130. && buffer[i] != '5'
  131. && buffer[i] != '6'
  132. && buffer[i] != '7'
  133. && buffer[i] != '8'
  134. && buffer[i] != '9'
  135. && buffer[i] != 'e'
  136. && buffer[i] != '.') {
  137. i--;
  138. return true;
  139. }
  140. return false;
  141. };
  142. property.type = JsonNumberType;
  143. break;
  144. case '{':
  145. valueBracesCounter++;
  146. valueEndMarker = [&valueBracesCounter](){
  147. return valueBracesCounter < 0;
  148. };
  149. property.type = JsonObjectType;
  150. break;
  151. case 't':
  152. valueEndMarker = [&trueCounter](){
  153. return trueCounter == 0;
  154. };
  155. property.type = JsonBoolType;
  156. break;
  157. case 'f':
  158. valueEndMarker = [&falseCounter](){
  159. return falseCounter == 0;
  160. };
  161. property.type = JsonBoolType;
  162. break;
  163. case '[':
  164. valueBracketsCounter++;
  165. valueEndMarker = [&valueBracketsCounter](){
  166. return valueBracketsCounter < 0;
  167. };
  168. property.type = JsonArrayType;
  169. break;
  170. }
  171. if (valueEndMarker) {
  172. micorJsonDebug << "Found value begin" << std::endl;
  173. property.valueBegin = i;
  174. state = LookingForValueEnd;
  175. } else {
  176. break;
  177. }
  178. } else if (state == LookingForValueEnd) {
  179. switch (byte) {
  180. case '}':
  181. --valueBracesCounter;
  182. break;
  183. case '{':
  184. ++valueBracesCounter;
  185. break;
  186. case ']':
  187. --valueBracketsCounter;
  188. break;
  189. case '[':
  190. ++valueBracketsCounter;
  191. break;
  192. default:
  193. --trueCounter;
  194. --falseCounter;
  195. break;
  196. }
  197. if (valueEndMarker()) {
  198. micorJsonDebug << "Found value end" << std::endl;
  199. property.valueEnd = i;
  200. break;
  201. }
  202. }
  203. }
  204. if (property.eofCheck()) {
  205. property.valueEnd = size - 1; //EOF case
  206. micorJsonDebug << "Found value end at EOF" << std::endl;
  207. }
  208. micorJsonDebug << property.nameBegin << " " << property.nameEnd << " " << property.valueBegin << " " << property.valueEnd << " " << property.type << std::endl;
  209. if (property.check()) {
  210. if (property.type == JsonStringType
  211. || property.type == JsonArrayType
  212. || property.type == JsonObjectType) {
  213. ++property.valueBegin;
  214. --property.valueEnd;
  215. }
  216. for (size_t j = i + 1; j < size; j++) {
  217. const char &byte = buffer[j];
  218. if (byte == ',') {
  219. return j + 1;
  220. } else if (byte != '\n' && byte != ' ' && byte != '\r' && byte != '\t') {
  221. micorJsonDebug << "Unexpected: " << byte;
  222. return SIZE_MAX;
  223. }
  224. }
  225. return size;
  226. } else {
  227. micorJsonDebug << "Property check failed" << std::endl;
  228. }
  229. return SIZE_MAX;
  230. }
  231. microjson::JsonObject microjson::parseObject(const char *buffer, size_t size) {
  232. JsonObject obj;
  233. if (buffer == nullptr || size == 0 || size == SIZE_MAX) {
  234. return obj;
  235. }
  236. size_t objectBeginPosition = SIZE_MAX;
  237. size_t objectEndPosition = SIZE_MAX;
  238. for (size_t i = 0; i < size; i++) {
  239. const char beginByte = buffer[i];
  240. const char endByte = buffer[size - i - 1];
  241. if (objectBeginPosition == SIZE_MAX) {
  242. if (beginByte == '{') {
  243. objectBeginPosition = i;
  244. } else if (beginByte != '\n' && beginByte != ' ' && beginByte != '\r' && beginByte != '\t') {
  245. std::cerr << "Unexpected begin byte" << beginByte << std::endl;
  246. break;
  247. }
  248. }
  249. if (objectEndPosition == SIZE_MAX) {
  250. if (endByte == '}') {
  251. objectEndPosition = size - i - 1;
  252. } else if (endByte != '\n' && endByte != ' ' && endByte != '\r' && endByte != '\t') {
  253. std::cerr << "Unexpected end byte" << endByte << std::endl;
  254. break;
  255. }
  256. }
  257. if (objectBeginPosition != SIZE_MAX && objectEndPosition != SIZE_MAX) {
  258. break;
  259. }
  260. }
  261. if (objectBeginPosition == SIZE_MAX || objectEndPosition == SIZE_MAX) {
  262. return obj;
  263. }
  264. JsonProperty property;
  265. buffer += objectBeginPosition + 1;//Skip '{'
  266. size = objectEndPosition - objectBeginPosition - 1;//Skip '}'
  267. micorJsonDebug << "Object buffer size: " << size << " buffer: " << std::string(buffer, size) << std::endl;
  268. for (size_t nextPropertyPosition = microjson::extractNextProperty(buffer, size, property); nextPropertyPosition != SIZE_MAX; ) {
  269. micorJsonDebug << "nextPropertyPosition: " << nextPropertyPosition << "size: " << size << std::endl;
  270. if (nextPropertyPosition != SIZE_MAX) {
  271. std::string name((buffer + property.nameBegin), property.nameSize());
  272. std::string value((buffer + property.valueBegin), property.valueSize());
  273. micorJsonDebug << "name: " << name << " value: " << value << std::endl;
  274. obj[name] = { value, property.type };
  275. }
  276. buffer += nextPropertyPosition;
  277. size = size - nextPropertyPosition;
  278. nextPropertyPosition = microjson::extractNextProperty(buffer, size, property);
  279. }
  280. return obj;
  281. }