microjson.cpp 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389
  1. /*
  2. * MIT License
  3. *
  4. * Copyright (c) 2020 Alexey Edelev <semlanik@gmail.com>
  5. *
  6. * This file is part of microjson project https://git.semlanik.org/semlanik/microjson
  7. *
  8. * Permission is hereby granted, free of charge, to any person obtaining a copy of this
  9. * software and associated documentation files (the "Software"), to deal in the Software
  10. * without restriction, including without limitation the rights to use, copy, modify,
  11. * merge, publish, distribute, sublicense, and/or sell copies of the Software, and
  12. * to permit persons to whom the Software is furnished to do so, subject to the following
  13. * conditions:
  14. *
  15. * The above copyright notice and this permission notice shall be included in all copies
  16. * or substantial portions of the Software.
  17. *
  18. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
  19. * INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
  20. * PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE
  21. * FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  22. * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  23. * DEALINGS IN THE SOFTWARE.
  24. */
  25. #include "microjson.h"
  26. #include <iostream>
  27. #ifdef MICROJSON_DEBUG
  28. #define microjsonDebug std::cout
  29. #else
  30. struct microjsonNull : public std::ostream {
  31. class nullBuffer : public std::streambuf {};
  32. microjsonNull() : std::ostream(new nullBuffer) {}
  33. };
  34. static microjsonNull nullout;
  35. #define microjsonDebug nullout
  36. #endif
  37. namespace {
  38. template<const char expectedBeginByte>
  39. void lookForBoundaries(const char *buffer, size_t size, size_t &begin, size_t &end) {
  40. const char expectedEndByte = expectedBeginByte + 2;
  41. begin = SIZE_MAX;
  42. end = SIZE_MAX;
  43. for (size_t i = 0; i < size; i++) {
  44. const char beginByte = buffer[i];
  45. const char endByte = buffer[size - i - 1];
  46. if (begin == SIZE_MAX) {
  47. if (beginByte == expectedBeginByte) {
  48. begin = i;
  49. } else if (beginByte != '\n' && beginByte != ' ' && beginByte != '\r' && beginByte != '\t') {
  50. std::cerr << "Unexpected begin byte" << beginByte << std::endl;
  51. break;
  52. }
  53. }
  54. if (end == SIZE_MAX) {
  55. if (endByte == expectedEndByte) {
  56. end = size - i - 1;
  57. } else if (endByte != '\n' && endByte != ' ' && endByte != '\r' && endByte != '\t') {
  58. std::cerr << "Unexpected end byte" << endByte << std::endl;
  59. break;
  60. }
  61. }
  62. if (begin != SIZE_MAX && end != SIZE_MAX) {
  63. break;
  64. }
  65. }
  66. }
  67. void lookForName(const char *buffer, size_t size, size_t &i, microjson::JsonProperty &property) {
  68. property.nameBegin = SIZE_MAX;
  69. property.nameEnd = SIZE_MAX;
  70. bool beginFound = false;
  71. for(; i < size; ++i) {
  72. const char byte = buffer[i];
  73. if (microjson::skipWhiteSpace(byte)) {
  74. microjsonDebug << "Skip space" << std::endl;
  75. continue;
  76. }
  77. if(!beginFound) {
  78. if (byte == '"') {
  79. microjsonDebug << "Found name begin" << std::endl;
  80. property.nameBegin = i + 1;
  81. beginFound = true;
  82. } else {
  83. std::cerr << "Not found name begin, unexpected" << std::endl;
  84. break;
  85. }
  86. } else if(byte == '"') {
  87. if (i > 0 && buffer[i - 1] == '\\') {
  88. microjsonDebug << "'\"' found in name" << std::endl;
  89. continue;
  90. }
  91. microjsonDebug << "Found name end" << std::endl;
  92. property.nameEnd = i;
  93. break;
  94. }
  95. }
  96. ++i;
  97. }
  98. bool lookForSeparator(const char* buffer, size_t size, size_t &i) {
  99. bool found = false;
  100. for(; i < size; ++i) {
  101. const char byte = buffer[i];
  102. if (microjson::skipWhiteSpace(byte)) {
  103. microjsonDebug << "Skip space" << std::endl;
  104. continue;
  105. }
  106. if (byte == ':') {
  107. microjsonDebug << "Found Separator" << std::endl;
  108. found = true;
  109. }
  110. break;
  111. }
  112. ++i;
  113. return found;
  114. }
  115. void lookForValue(const char *buffer, size_t size, size_t &i, microjson::JsonProperty &property) {
  116. int valueBracesCounter = -1;
  117. int valueBracketsCounter = -1;
  118. int trueCounter = 3;
  119. int falseCounter = 4;
  120. std::function<bool(void)> valueEndMarker;
  121. bool beginFound = false;
  122. bool stringScope = false;
  123. property.valueBegin = SIZE_MAX;
  124. property.valueEnd = SIZE_MAX;
  125. for(; i < size; i++) {
  126. const char byte = buffer[i];
  127. if (!beginFound) {
  128. microjsonDebug << "lookForValue at: " << i << " byte: " << byte << std::endl;
  129. if (microjson::skipWhiteSpace(byte)) {
  130. microjsonDebug << "Skip space" << std::endl;
  131. continue;
  132. }
  133. switch (byte) {
  134. case '"':
  135. valueEndMarker = [&](){
  136. return buffer[i] == '"' && buffer[i - 1] != '\\';
  137. };
  138. property.type = microjson::JsonStringType;
  139. break;
  140. case '-':
  141. case '0':
  142. case '1':
  143. case '2':
  144. case '3':
  145. case '4':
  146. case '5':
  147. case '6':
  148. case '7':
  149. case '8':
  150. case '9':
  151. valueEndMarker = [&buffer, &i](){
  152. if (buffer[i] != '+'
  153. && buffer[i] != '-'
  154. && buffer[i] != '0'
  155. && buffer[i] != '1'
  156. && buffer[i] != '2'
  157. && buffer[i] != '3'
  158. && buffer[i] != '4'
  159. && buffer[i] != '5'
  160. && buffer[i] != '6'
  161. && buffer[i] != '7'
  162. && buffer[i] != '8'
  163. && buffer[i] != '9'
  164. && buffer[i] != 'e'
  165. && buffer[i] != '.') {
  166. i--;
  167. return true;
  168. }
  169. return false;
  170. };
  171. property.type = microjson::JsonNumberType;
  172. break;
  173. case '{':
  174. valueBracesCounter++;
  175. valueEndMarker = [&stringScope, &byte, &valueBracesCounter](){
  176. if (!stringScope) {
  177. switch (byte) {
  178. case '}':
  179. --valueBracesCounter;
  180. break;
  181. case '{':
  182. ++valueBracesCounter;
  183. break;
  184. default:
  185. break;
  186. }
  187. }
  188. return valueBracesCounter < 0;
  189. };
  190. property.type = microjson::JsonObjectType;
  191. break;
  192. case 't':
  193. valueEndMarker = [&trueCounter](){
  194. --trueCounter;
  195. return trueCounter == 0;
  196. };
  197. property.type = microjson::JsonBoolType;
  198. break;
  199. case 'f':
  200. valueEndMarker = [&falseCounter](){
  201. --falseCounter;
  202. return falseCounter == 0;
  203. };
  204. property.type = microjson::JsonBoolType;
  205. break;
  206. case '[':
  207. valueBracketsCounter++;
  208. valueEndMarker = [&stringScope, &byte, &valueBracketsCounter](){
  209. if(!stringScope) {
  210. switch(byte) {
  211. case ']':
  212. --valueBracketsCounter;
  213. break;
  214. case '[':
  215. ++valueBracketsCounter;
  216. break;
  217. default:
  218. break;
  219. }
  220. }
  221. return valueBracketsCounter < 0;
  222. };
  223. property.type = microjson::JsonArrayType;
  224. break;
  225. }
  226. if (valueEndMarker) {
  227. microjsonDebug << "Found value begin" << std::endl;
  228. property.valueBegin = i;
  229. beginFound = true;
  230. } else {
  231. break;
  232. }
  233. } else {
  234. if (byte == '"' && (i == 0 || buffer[i - 1] != '\\')) {
  235. stringScope = !stringScope;
  236. }
  237. if (valueEndMarker()) {
  238. microjsonDebug << "Found value end" << std::endl;
  239. property.valueEnd = i;
  240. break;
  241. }
  242. }
  243. }
  244. if (property.checkEof()) {
  245. property.valueEnd = size - 1; //EOF case
  246. microjsonDebug << "Found value end at EOF" << std::endl;
  247. }
  248. if (property.type == microjson::JsonStringType) {
  249. ++property.valueBegin;
  250. --property.valueEnd;
  251. }
  252. }
  253. void findSeparator(const char *buffer, size_t size, size_t &i, const char expectedEndByte) {
  254. while (++i < size) {
  255. if(!microjson::skipWhiteSpace(buffer[i])) {
  256. break;
  257. }
  258. }
  259. const char endByte = buffer[i];
  260. if (endByte == expectedEndByte) {
  261. if(++i != size) {
  262. i = SIZE_MAX;
  263. }
  264. } else if(endByte == ',') {
  265. ++i;
  266. } else {
  267. i = SIZE_MAX;
  268. }
  269. }
  270. using Extractor = bool(*)(const char *, size_t, size_t &, const char, microjson::JsonProperty &);
  271. template<typename R,
  272. const char expectedBeginByte,
  273. Extractor extract,
  274. void(* collect)(const char *, R &, const microjson::JsonProperty &property)>
  275. R parseJsonCommon(const char *buffer, size_t size) {
  276. R returnValue;
  277. if (buffer == nullptr || size == 0 || size == SIZE_MAX) {
  278. return returnValue;
  279. }
  280. size_t objectBeginPosition = SIZE_MAX;
  281. size_t objectEndPosition = SIZE_MAX;
  282. lookForBoundaries<expectedBeginByte>(buffer, size, objectBeginPosition, objectEndPosition);
  283. if (objectBeginPosition == SIZE_MAX || objectEndPosition == SIZE_MAX) {
  284. return returnValue;
  285. }
  286. microjson::JsonProperty property;
  287. buffer += objectBeginPosition + 1;//Skip '{'
  288. size = objectEndPosition - objectBeginPosition;//Do not skip '}'
  289. microjsonDebug << "Object buffer size: " << size << " buffer: " << std::string(buffer, size) << std::endl;
  290. size_t nextPosition = 0;
  291. while (nextPosition < size) {
  292. microjsonDebug << "nextPropertyPosition: " << nextPosition << "size: " << size << std::endl;
  293. if(extract(buffer, size, nextPosition, expectedBeginByte + 2, property)) {
  294. collect(buffer, returnValue, property);
  295. }
  296. }
  297. return returnValue;
  298. }
  299. void appendProperty(const char* buffer, microjson::JsonObject &obj, const microjson::JsonProperty &property){
  300. std::string name((buffer + property.nameBegin), property.nameSize());
  301. std::string value;
  302. if(property.valueSize() > 0) {
  303. value = std::string((buffer + property.valueBegin), property.valueSize());
  304. }
  305. microjsonDebug << "name: " << name << " value: " << value << std::endl;
  306. obj[name] = { value, property.type };
  307. };
  308. void appendValue(const char* buffer, microjson::JsonArray &values, const microjson::JsonProperty &property){
  309. std::string value = std::string((buffer + property.valueBegin), property.valueSize());
  310. microjsonDebug << "value: " << value << std::endl;
  311. values.push_back({value, property.type});
  312. };
  313. }
  314. bool microjson::extractValue(const char *buffer, size_t size, size_t &i, const char expectedEndByte, microjson::JsonProperty &property) {
  315. if (size == 0) {
  316. i = SIZE_MAX;
  317. return false;
  318. }
  319. lookForValue(buffer, size, i, property);
  320. findSeparator(buffer, size, i, expectedEndByte);
  321. return property.checkValue();
  322. }
  323. bool microjson::extractProperty(const char *buffer, size_t size, size_t &i, const char expectedEndByte, microjson::JsonProperty &property) {
  324. if (size == 0) {
  325. i = SIZE_MAX;
  326. return false;
  327. }
  328. lookForName(buffer, size, i, property);
  329. if(property.nameBegin == SIZE_MAX && property.nameEnd == SIZE_MAX) {
  330. std::cerr << "Name not found" << std::endl;
  331. return false;
  332. }
  333. microjsonDebug << "Found name: " << std::string(buffer + property.nameBegin, property.nameSize()) << std::endl;
  334. if(!lookForSeparator(buffer, size, i)) {
  335. std::cerr << "Separator not found" << std::endl;
  336. return false;
  337. }
  338. lookForValue(buffer, size, i, property);
  339. microjsonDebug << "Found value: " << std::string(buffer + property.valueBegin, property.valueSize()) << std::endl;
  340. findSeparator(buffer, size, i, expectedEndByte);
  341. return property.check();
  342. }
  343. microjson::JsonObject microjson::parseJsonObject(const char *buffer, size_t size) {
  344. return parseJsonCommon<JsonObject, '{', extractProperty, appendProperty>(buffer, size);
  345. }
  346. microjson::JsonArray microjson::parseJsonArray(const char *buffer, size_t size) {
  347. return parseJsonCommon<JsonArray, '[', extractValue, appendValue>(buffer, size);
  348. }