microjson.cpp 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422
  1. /*
  2. * MIT License
  3. *
  4. * Copyright (c) 2020 Alexey Edelev <semlanik@gmail.com>
  5. *
  6. * This file is part of microjson project https://git.semlanik.org/semlanik/microjson
  7. *
  8. * Permission is hereby granted, free of charge, to any person obtaining a copy of this
  9. * software and associated documentation files (the "Software"), to deal in the Software
  10. * without restriction, including without limitation the rights to use, copy, modify,
  11. * merge, publish, distribute, sublicense, and/or sell copies of the Software, and
  12. * to permit persons to whom the Software is furnished to do so, subject to the following
  13. * conditions:
  14. *
  15. * The above copyright notice and this permission notice shall be included in all copies
  16. * or substantial portions of the Software.
  17. *
  18. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
  19. * INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
  20. * PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE
  21. * FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  22. * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  23. * DEALINGS IN THE SOFTWARE.
  24. */
  25. #include "microjson.h"
  26. #include <iostream>
  27. #ifdef MICROJSON_DEBUG
  28. #define microjsonDebug std::cout
  29. #else
  30. struct microjsonNull : public std::ostream {};
  31. static microjsonNull nullout;
  32. #define microjsonDebug nullout
  33. #endif
  34. namespace {
  35. struct JsonProperty {
  36. JsonProperty() : nameBegin(SIZE_MAX)
  37. , nameEnd(SIZE_MAX)
  38. , valueBegin(SIZE_MAX)
  39. , valueEnd(SIZE_MAX)
  40. , type(microjson::JsonInvalidType){}
  41. size_t nameBegin;
  42. size_t nameEnd;
  43. size_t valueBegin;
  44. size_t valueEnd;
  45. microjson::JsonType type;
  46. size_t nameSize() const {
  47. return nameEnd - nameBegin;
  48. }
  49. size_t valueSize() const {
  50. return valueEnd - valueBegin + 1;
  51. }
  52. bool checkValue() const {
  53. return type != microjson::JsonInvalidType && valueBegin != SIZE_MAX && valueEnd != SIZE_MAX &&
  54. valueBegin <= valueEnd;
  55. }
  56. bool checkEof() const {
  57. return (type == microjson::JsonNumberType || type == microjson::JsonBoolType) &&
  58. valueBegin != SIZE_MAX && valueEnd == SIZE_MAX;
  59. }
  60. bool check() const {
  61. return checkValue() && nameBegin != SIZE_MAX && nameEnd != SIZE_MAX &&
  62. nameBegin < nameEnd && nameEnd < valueBegin;
  63. }
  64. };
  65. inline bool skipWhiteSpace(const char byte) {
  66. return byte == '\n' || byte == ' ' || byte == '\r' || byte == '\t' || byte == '\f' || byte == '\v';
  67. }
  68. template<const char expectedBeginByte>
  69. void lookForBoundaries(const char *buffer, size_t size, size_t &begin, size_t &end) {
  70. const char expectedEndByte = expectedBeginByte + 2;
  71. begin = SIZE_MAX;
  72. end = SIZE_MAX;
  73. for (size_t i = 0; i < size; i++) {
  74. const char beginByte = buffer[i];
  75. const char endByte = buffer[size - i - 1];
  76. if (begin == SIZE_MAX) {
  77. if (beginByte == expectedBeginByte) {
  78. begin = i;
  79. } else if (beginByte != '\n' && beginByte != ' ' && beginByte != '\r' && beginByte != '\t') {
  80. std::cerr << "Unexpected begin byte" << beginByte << std::endl;
  81. break;
  82. }
  83. }
  84. if (end == SIZE_MAX) {
  85. if (endByte == expectedEndByte) {
  86. end = size - i - 1;
  87. } else if (endByte != '\n' && endByte != ' ' && endByte != '\r' && endByte != '\t') {
  88. std::cerr << "Unexpected end byte" << endByte << std::endl;
  89. break;
  90. }
  91. }
  92. if (begin != SIZE_MAX && end != SIZE_MAX) {
  93. break;
  94. }
  95. }
  96. }
  97. void lookForName(const char *buffer, size_t size, size_t &i, JsonProperty &property) {
  98. property.nameBegin = SIZE_MAX;
  99. property.nameEnd = SIZE_MAX;
  100. bool beginFound = false;
  101. for(; i < size; ++i) {
  102. const char byte = buffer[i];
  103. if (skipWhiteSpace(byte)) {
  104. microjsonDebug << "Skip space" << std::endl;
  105. continue;
  106. }
  107. if(!beginFound) {
  108. if (byte == '"') {
  109. microjsonDebug << "Found name begin" << std::endl;
  110. property.nameBegin = i + 1;
  111. beginFound = true;
  112. } else {
  113. std::cerr << "Not found name begin, unexpected" << std::endl;
  114. break;
  115. }
  116. } else if(byte == '"') {
  117. if (i > 0 && buffer[i - 1] == '\\') {
  118. microjsonDebug << "'\"' found in name" << std::endl;
  119. continue;
  120. }
  121. microjsonDebug << "Found name end" << std::endl;
  122. property.nameEnd = i;
  123. break;
  124. }
  125. }
  126. ++i;
  127. }
  128. bool lookForSeparator(const char* buffer, size_t size, size_t &i) {
  129. bool found = false;
  130. for(; i < size; ++i) {
  131. const char byte = buffer[i];
  132. if (skipWhiteSpace(byte)) {
  133. microjsonDebug << "Skip space" << std::endl;
  134. continue;
  135. }
  136. if (byte == ':') {
  137. microjsonDebug << "Found Separator" << std::endl;
  138. found = true;
  139. }
  140. break;
  141. }
  142. ++i;
  143. return found;
  144. }
  145. void lookForValue(const char *buffer, size_t size, size_t &i, JsonProperty &property) {
  146. int valueBracesCounter = -1;
  147. int valueBracketsCounter = -1;
  148. int trueCounter = 3;
  149. int falseCounter = 4;
  150. std::function<bool(void)> valueEndMarker;
  151. bool beginFound = false;
  152. bool stringScope = false;
  153. property.valueBegin = SIZE_MAX;
  154. property.valueEnd = SIZE_MAX;
  155. for(; i < size; i++) {
  156. const char byte = buffer[i];
  157. if (!beginFound) {
  158. microjsonDebug << "lookForValue at: " << i << " byte: " << byte << std::endl;
  159. if (skipWhiteSpace(byte)) {
  160. microjsonDebug << "Skip space" << std::endl;
  161. continue;
  162. }
  163. switch (byte) {
  164. case '"':
  165. valueEndMarker = [&](){
  166. return buffer[i] == '"' && buffer[i - 1] != '\\';
  167. };
  168. property.type = microjson::JsonStringType;
  169. break;
  170. case '-':
  171. case '0':
  172. case '1':
  173. case '2':
  174. case '3':
  175. case '4':
  176. case '5':
  177. case '6':
  178. case '7':
  179. case '8':
  180. case '9':
  181. valueEndMarker = [&buffer, &i](){
  182. if (buffer[i] != '+'
  183. && buffer[i] != '-'
  184. && buffer[i] != '0'
  185. && buffer[i] != '1'
  186. && buffer[i] != '2'
  187. && buffer[i] != '3'
  188. && buffer[i] != '4'
  189. && buffer[i] != '5'
  190. && buffer[i] != '6'
  191. && buffer[i] != '7'
  192. && buffer[i] != '8'
  193. && buffer[i] != '9'
  194. && buffer[i] != 'e'
  195. && buffer[i] != '.') {
  196. i--;
  197. return true;
  198. }
  199. return false;
  200. };
  201. property.type = microjson::JsonNumberType;
  202. break;
  203. case '{':
  204. valueBracesCounter++;
  205. valueEndMarker = [&stringScope, &byte, &valueBracesCounter](){
  206. if (!stringScope) {
  207. switch (byte) {
  208. case '}':
  209. --valueBracesCounter;
  210. break;
  211. case '{':
  212. ++valueBracesCounter;
  213. break;
  214. default:
  215. break;
  216. }
  217. }
  218. return valueBracesCounter < 0;
  219. };
  220. property.type = microjson::JsonObjectType;
  221. break;
  222. case 't':
  223. valueEndMarker = [&trueCounter](){
  224. --trueCounter;
  225. return trueCounter == 0;
  226. };
  227. property.type = microjson::JsonBoolType;
  228. break;
  229. case 'f':
  230. valueEndMarker = [&falseCounter](){
  231. --falseCounter;
  232. return falseCounter == 0;
  233. };
  234. property.type = microjson::JsonBoolType;
  235. break;
  236. case '[':
  237. valueBracketsCounter++;
  238. valueEndMarker = [&stringScope, &byte, &valueBracketsCounter](){
  239. if(!stringScope) {
  240. switch(byte) {
  241. case ']':
  242. --valueBracketsCounter;
  243. break;
  244. case '[':
  245. ++valueBracketsCounter;
  246. break;
  247. default:
  248. break;
  249. }
  250. }
  251. return valueBracketsCounter < 0;
  252. };
  253. property.type = microjson::JsonArrayType;
  254. break;
  255. }
  256. if (valueEndMarker) {
  257. microjsonDebug << "Found value begin" << std::endl;
  258. property.valueBegin = i;
  259. beginFound = true;
  260. } else {
  261. break;
  262. }
  263. } else {
  264. if (byte == '"' && (i == 0 || buffer[i - 1] != '\\')) {
  265. stringScope = !stringScope;
  266. }
  267. if (valueEndMarker()) {
  268. microjsonDebug << "Found value end" << std::endl;
  269. property.valueEnd = i;
  270. break;
  271. }
  272. }
  273. }
  274. }
  275. bool extractProperty(const char *buffer, size_t size, size_t &i, JsonProperty &property) {
  276. lookForName(buffer, size, i, property);
  277. if(property.nameBegin == SIZE_MAX && property.nameEnd == SIZE_MAX) {
  278. std::cerr << "Name not found" << std::endl;
  279. return false;
  280. }
  281. if(!lookForSeparator(buffer, size, i)) {
  282. std::cerr << "Separator not found" << std::endl;
  283. return false;
  284. }
  285. lookForValue(buffer, size, i, property);
  286. if (property.checkEof()) {
  287. property.valueEnd = size - 1; //EOF case
  288. microjsonDebug << "Found value end at EOF" << std::endl;
  289. }
  290. return property.check();
  291. }
  292. bool extractValue(const char *buffer, size_t size, size_t &i, JsonProperty &property) {
  293. lookForValue(buffer, size, i, property);
  294. if (property.checkEof()) {
  295. property.valueEnd = size - 1; //EOF case
  296. microjsonDebug << "Found value end at EOF" << std::endl;
  297. }
  298. return property.checkValue();
  299. }
  300. using Extractor = bool(*)(const char *, size_t, size_t &, JsonProperty &);
  301. template <Extractor extract>
  302. size_t extractNext(const char *buffer, size_t size, JsonProperty &property) {
  303. if (buffer == nullptr || size == 0 || size == SIZE_MAX) {
  304. return SIZE_MAX;
  305. }
  306. property.nameBegin = SIZE_MAX;
  307. property.nameEnd = SIZE_MAX;
  308. property.valueBegin = SIZE_MAX;
  309. property.valueEnd = SIZE_MAX;
  310. property.type = microjson::JsonInvalidType;
  311. size_t i = 0;
  312. if(!extract(buffer, size, i, property)) {
  313. return SIZE_MAX;
  314. }
  315. if (property.type == microjson::JsonStringType) {
  316. ++property.valueBegin;
  317. --property.valueEnd;
  318. }
  319. for (size_t j = i + 1; j < size; j++) {
  320. const char &byte = buffer[j];
  321. if (byte == ',') {
  322. return j + 1;
  323. } else if (!skipWhiteSpace(byte)) {
  324. microjsonDebug << "Unexpected: " << byte;
  325. return SIZE_MAX;
  326. }
  327. }
  328. return size;
  329. }
  330. template<typename R,
  331. const char expectedBeginByte,
  332. Extractor extract,
  333. void(* collect)(const char *, R &, const JsonProperty &property)>
  334. R parseJsonCommon(const char *buffer, size_t size) {
  335. R returnValue;
  336. if (buffer == nullptr || size == 0 || size == SIZE_MAX) {
  337. return returnValue;
  338. }
  339. size_t objectBeginPosition = SIZE_MAX;
  340. size_t objectEndPosition = SIZE_MAX;
  341. lookForBoundaries<expectedBeginByte>(buffer, size, objectBeginPosition, objectEndPosition);
  342. if (objectBeginPosition == SIZE_MAX || objectEndPosition == SIZE_MAX) {
  343. return returnValue;
  344. }
  345. JsonProperty property;
  346. buffer += objectBeginPosition + 1;//Skip '{'
  347. size = objectEndPosition - objectBeginPosition - 1;//Skip '}'
  348. microjsonDebug << "Object buffer size: " << size << " buffer: " << std::string(buffer, size) << std::endl;
  349. for (size_t nextPosition = extractNext<extract>(buffer, size, property); nextPosition != SIZE_MAX; ) {
  350. microjsonDebug << "nextPropertyPosition: " << nextPosition << "size: " << size << std::endl;
  351. if (nextPosition != SIZE_MAX) {
  352. collect(buffer, returnValue, property);
  353. }
  354. buffer += nextPosition;
  355. size = size - nextPosition;
  356. nextPosition = extractNext<extract>(buffer, size, property);
  357. }
  358. return returnValue;
  359. }
  360. void appendProperty(const char* buffer, microjson::JsonObject &obj, const JsonProperty &property){
  361. std::string name((buffer + property.nameBegin), property.nameSize());
  362. std::string value((buffer + property.valueBegin), property.valueSize());
  363. microjsonDebug << "name: " << name << " value: " << value << std::endl;
  364. obj[name] = { value, property.type };
  365. };
  366. void appendValue(const char* buffer, microjson::JsonArray &values, const JsonProperty &property){
  367. std::string value = std::string((buffer + property.valueBegin), property.valueSize());
  368. microjsonDebug << "value: " << value << std::endl;
  369. values.push_back({value, property.type});
  370. };
  371. }
  372. microjson::JsonObject microjson::parseJsonObject(const char *buffer, size_t size) {
  373. return parseJsonCommon<JsonObject, '{', extractProperty, appendProperty>(buffer, size);
  374. }
  375. microjson::JsonArray microjson::parseJsonArray(const char *buffer, size_t size) {
  376. return parseJsonCommon<JsonArray, '[', extractValue, appendValue>(buffer, size);
  377. }