tokenization.js 7.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197
  1. /*---------------------------------------------------------------------------------------------
  2. * Copyright (c) Microsoft Corporation. All rights reserved.
  3. * Licensed under the MIT License. See License.txt in the project root for license information.
  4. *--------------------------------------------------------------------------------------------*/
  5. import * as json from './_deps/jsonc-parser/main.js';
  /**
   * Builds the tokenization support object for JSON text.
   *
   * @param {boolean} supportComments - Forwarded to `tokenize` as its `comments`
   *     argument; when truthy, line and block comments receive comment scopes.
   * @returns {{getInitialState: function, tokenize: function}} An object exposing
   *     `getInitialState()` and `tokenize(line, state, offsetDelta, stopAtOffset)`.
   */
  export function createTokenizationSupport(supportComments) {
      // The initial state carries no state data, no scan error, no pending colon
      // and an empty parent stack.
      function getInitialState() {
          return new JSONState(null, null, false, null);
      }

      // Pre-binds the comment setting so callers only pass the per-line arguments.
      function tokenizeLine(line, state, offsetDelta, stopAtOffset) {
          return tokenize(supportComments, line, state, offsetDelta, stopAtOffset);
      }

      return {
          getInitialState: getInitialState,
          tokenize: tokenizeLine
      };
  }
  // Scope names attached to the tokens produced by `tokenize`.

  // Structural delimiters.
  export const TOKEN_DELIM_OBJECT = 'delimiter.bracket.json';
  export const TOKEN_DELIM_ARRAY = 'delimiter.array.json';
  export const TOKEN_DELIM_COLON = 'delimiter.colon.json';
  export const TOKEN_DELIM_COMMA = 'delimiter.comma.json';

  // Literal values; booleans and null intentionally share one scope.
  export const TOKEN_VALUE_BOOLEAN = 'keyword.json';
  export const TOKEN_VALUE_NULL = 'keyword.json';
  export const TOKEN_VALUE_STRING = 'string.value.json';
  export const TOKEN_VALUE_NUMBER = 'number.json';

  // Strings used as object keys.
  export const TOKEN_PROPERTY_NAME = 'string.key.json';

  // Comments (only emitted when comment support is enabled).
  export const TOKEN_COMMENT_BLOCK = 'comment.block.json';
  export const TOKEN_COMMENT_LINE = 'comment.line.json';
  /**
   * Immutable singly linked stack of the containers (objects / arrays) that
   * enclose the current tokenizer position.
   *
   * Each node stores the container `type` (the tokenizer pushes 0 for an object
   * and 1 for an array) and a link to the enclosing node. An empty stack is
   * represented by `null`. Nodes are never mutated, so stacks may share tails.
   */
  class ParentsStack {
      /**
       * @param {ParentsStack|null} parent - The enclosing stack node, or null.
       * @param {number} type - Container type of this node.
       */
      constructor(parent, type) {
          this.parent = parent;
          this.type = type;
      }

      /**
       * Returns the stack without its top node.
       *
       * @param {ParentsStack|null} parents - Stack to pop from.
       * @returns {ParentsStack|null} The enclosing stack, or null when `parents`
       *     is empty (popping an empty stack is tolerated).
       */
      static pop(parents) {
          return parents ? parents.parent : null;
      }

      /**
       * Returns a new stack with a node of the given type on top of `parents`.
       *
       * @param {ParentsStack|null} parents - Stack to extend.
       * @param {number} type - Container type of the new top node.
       * @returns {ParentsStack} The new top node.
       */
      static push(parents, type) {
          return new ParentsStack(parents, type);
      }

      /**
       * Structural equality: both stacks must have the same depth and the same
       * container type at every level.
       *
       * @param {ParentsStack|null} a - First stack.
       * @param {ParentsStack|null} b - Second stack.
       * @returns {boolean} True when the stacks describe the same nesting.
       */
      static equals(a, b) {
          while (a && b) {
              if (a === b) {
                  // Shared tail: everything below this node is identical.
                  return true;
              }
              if (a.type !== b.type) {
                  return false;
              }
              a = a.parent;
              b = b.parent;
          }
          // Equal only if both stacks ran out together; if one still has
          // entries the nesting depths differ.
          return !a && !b;
      }
  }
  /**
   * Tokenizer state carried from the end of one line to the start of the next.
   *
   * Fields:
   *  - `_state`: opaque data, only read and written through
   *    `getStateData` / `setStateData`.
   *  - `scanError`: scan error code stored with the state.
   *  - `lastWasColon`: whether the last significant token was a colon.
   *  - `parents`: the `ParentsStack` of enclosing containers (null when empty).
   */
  class JSONState {
      constructor(state, scanError, lastWasColon, parents) {
          this._state = state;
          this.scanError = scanError;
          this.lastWasColon = lastWasColon;
          this.parents = parents;
      }

      /**
       * @returns {JSONState} A new state holding the same four field values.
       */
      clone() {
          return new JSONState(this._state, this.scanError, this.lastWasColon, this.parents);
      }

      /**
       * Compares two states. The opaque state data is deliberately not part
       * of the comparison; only the scan error, the colon flag and the parent
       * stack are.
       *
       * @param {*} other - Candidate state.
       * @returns {boolean} True when `other` is an equivalent JSONState.
       */
      equals(other) {
          if (other === this) {
              return true;
          }
          // `instanceof` is false for null/undefined as well.
          if (!(other instanceof JSONState)) {
              return false;
          }
          if (this.scanError !== other.scanError) {
              return false;
          }
          if (this.lastWasColon !== other.lastWasColon) {
              return false;
          }
          return ParentsStack.equals(this.parents, other.parents);
      }

      /** @returns {*} The opaque state data. */
      getStateData() {
          return this._state;
      }

      /** @param {*} state - New opaque state data. */
      setStateData(state) {
          this._state = state;
      }
  }
  /**
   * Tokenizes a single line of JSON text.
   *
   * @param {boolean} comments - When truthy, line/block comments get comment
   *     scopes; otherwise they are emitted with an empty scope.
   * @param {string} line - The line to tokenize.
   * @param {JSONState} state - State at the start of the line.
   * @param {number} [offsetDelta=0] - Added to every reported token start index.
   * @param {number} [stopAtOffset] - Accepted for interface compatibility; not
   *     used by this implementation.
   * @returns {{tokens: Array<{startIndex: number, scopes: string}>, endState: JSONState}}
   *     One entry per scanned token (including trivia) and the state at the end
   *     of the line.
   * @throws {Error} If the scanner returns a token without advancing.
   */
  function tokenize(comments, line, state, offsetDelta = 0, stopAtOffset) {
      // If the previous line ended inside a string or block comment, re-open it
      // by prepending the opening delimiter so the scanner continues in the same
      // construct. Remember how many characters were prepended.
      let text = line;
      let prefixLength = 0;
      if (state.scanError === 2 /* UnexpectedEndOfString */) {
          text = '"' + line;
          prefixLength = 1;
      }
      else if (state.scanError === 1 /* UnexpectedEndOfComment */) {
          text = '/*' + line;
          prefixLength = 2;
      }

      const scanner = json.createScanner(text);
      const tokens = [];
      let sawColon = state.lastWasColon;
      let stack = state.parents;
      let lastTokenError;

      for (;;) {
          const before = offsetDelta + scanner.getPosition();
          const kind = scanner.scan();
          if (kind === 17 /* EOF */) {
              break;
          }

          // Guard against an endless loop if the scanner is stuck.
          const after = scanner.getPosition();
          if (before === offsetDelta + after) {
              throw new Error('Scanner did not advance, next 3 characters are: ' + text.slice(after, after + 3));
          }

          // The first token starts at the same index with or without the
          // prepended delimiter; every later token is shifted back by it.
          const startIndex = tokens.length > 0 && prefixLength > 0 ? before - prefixLength : before;

          let scopes = '';
          // Trivia, comments and unknown tokens must leave the
          // "last token was a colon" flag untouched.
          let isSignificant = true;
          switch (kind) {
              case 1 /* OpenBraceToken */:
                  stack = ParentsStack.push(stack, 0 /* Object */);
                  scopes = TOKEN_DELIM_OBJECT;
                  break;
              case 2 /* CloseBraceToken */:
                  stack = ParentsStack.pop(stack);
                  scopes = TOKEN_DELIM_OBJECT;
                  break;
              case 3 /* OpenBracketToken */:
                  stack = ParentsStack.push(stack, 1 /* Array */);
                  scopes = TOKEN_DELIM_ARRAY;
                  break;
              case 4 /* CloseBracketToken */:
                  stack = ParentsStack.pop(stack);
                  scopes = TOKEN_DELIM_ARRAY;
                  break;
              case 5 /* CommaToken */:
                  scopes = TOKEN_DELIM_COMMA;
                  break;
              case 6 /* ColonToken */:
                  scopes = TOKEN_DELIM_COLON;
                  break;
              case 7 /* NullKeyword */:
                  scopes = TOKEN_VALUE_NULL;
                  break;
              case 8 /* TrueKeyword */:
              case 9 /* FalseKeyword */:
                  scopes = TOKEN_VALUE_BOOLEAN;
                  break;
              case 10 /* StringLiteral */: {
                  // A string is a value after a colon or directly inside an
                  // array; otherwise it is a property name. With no enclosing
                  // container the context is treated like an object.
                  const inArray = Boolean(stack) && stack.type === 1 /* Array */;
                  scopes = sawColon || inArray ? TOKEN_VALUE_STRING : TOKEN_PROPERTY_NAME;
                  break;
              }
              case 11 /* NumericLiteral */:
                  scopes = TOKEN_VALUE_NUMBER;
                  break;
              case 12 /* LineCommentTrivia */:
                  if (comments) {
                      scopes = TOKEN_COMMENT_LINE;
                  }
                  isSignificant = false;
                  break;
              case 13 /* BlockCommentTrivia */:
                  if (comments) {
                      scopes = TOKEN_COMMENT_BLOCK;
                  }
                  isSignificant = false;
                  break;
              default:
                  isSignificant = false;
          }
          if (isSignificant) {
              sawColon = kind === 6 /* ColonToken */;
          }

          // Must be read before the next scan() replaces it.
          lastTokenError = scanner.getTokenError();
          tokens.push({
              startIndex: startIndex,
              scopes: scopes
          });
      }

      // With no tokens the incoming state carries over unchanged (as a copy);
      // otherwise the end state reflects the last scanned token.
      const endState = tokens.length > 0
          ? new JSONState(state.getStateData(), lastTokenError, sawColon, stack)
          : state.clone();

      return {
          tokens: tokens,
          endState: endState
      };
  }