css-selector-parser.js 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360
  1. /*
  2. * Copyright (c) Felix Böhm
  3. * All rights reserved.
  4. *
  5. * Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met:
  6. *
  7. * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer.
  8. *
  9. * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution.
  10. *
  11. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
  12. * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  13. */
  14. // Modified by Gildas Lormeau
  15. this.cssWhat = this.cssWhat || (() => {
"use strict";
// Matches, at the start of a string, a run of name characters: a backslash
// followed by any character, a word character, "-", or a character in the
// range U+00C0..U+FFFF.
const re_name = /^(?:\\.|[\w\-\u00c0-\uFFFF])+/,
  // Matches one CSS escape: a backslash followed by 1-6 hex digits (plus an
  // optional whitespace character), a single whitespace character (captured
  // separately as group 2), or any other character. Global and
  // case-insensitive so that replace() rewrites every escape in a string.
  re_escape = /\\([\da-f]{1,6}\s?|(\s)|.)/ig,
  //modified version of https://github.com/jquery/sizzle/blob/master/src/sizzle.js#L87
  // Matches the inside of an attribute selector (the text after "[", up to
  // and including "]"). Groups: 1 = attribute name, 2 = character preceding
  // "=", 3 = opening quote, 4 = quoted value, 5 = unquoted value,
  // 6 = "i" flag.
  re_attr = /^\s*((?:\\.|[\w\u00c0-\uFFFF-])+)\s*(?:(\S?)=\s*(?:(['"])([^]*?)\3|(#?(?:\\.|[\w\u00c0-\uFFFF-])*)|)|)\s*(i)?\]/;
// Maps group 2 of re_attr (the character before "=") to the token's action.
// The key "undefined" is hit when that group did not participate in the
// match, i.e. the selector only tests for the attribute's presence.
const actionTypes = {
  __proto__: null,
  "undefined": "exists",
  "": "equals",
  "~": "element",
  "^": "start",
  "$": "end",
  "*": "any",
  "!": "not",
  "|": "hyphen"
};
// Combinator characters and the token type emitted for each of them.
const simpleSelectors = {
  __proto__: null,
  ">": "child",
  "~": "sibling",
  "+": "adjacent"
};
// Shorthand prefixes that expand to an attribute token:
// prefix -> [attribute name, action].
const attribSelectors = {
  __proto__: null,
  "#": ["id", "equals"],
  ".": ["class", "element"]
};
//pseudos, whose data-property is parsed as well
const unpackPseudos = {
  __proto__: null,
  "has": true,
  "not": true,
  "matches": true
};
// Pseudos whose argument has one pair of surrounding quotes removed and its
// CSS escapes decoded before being stored on the token.
const stripQuotesFromPseudos = {
  __proto__: null,
  "contains": true,
  "icontains": true
};
// Characters recognised as string delimiters.
const quotes = {
  __proto__: null,
  "\"": true,
  "'": true
};
// Names that produce a "pseudo-element" token even when written with a
// single leading colon.
const pseudoElements = [
  "after", "before", "cue", "first-letter", "first-line", "selection", "slotted"
];
  63. const stringify = (() => {
  64. const actionTypes = {
  65. "equals": "",
  66. "element": "~",
  67. "start": "^",
  68. "end": "$",
  69. "any": "*",
  70. "not": "!",
  71. "hyphen": "|"
  72. };
  73. const simpleSelectors = {
  74. __proto__: null,
  75. child: " > ",
  76. sibling: " ~ ",
  77. adjacent: " + ",
  78. descendant: " ",
  79. universal: "*"
  80. };
  81. function stringify(token) {
  82. let value = "";
  83. token.forEach(token => value += stringifySubselector(token) + ",");
  84. return value.substring(0, value.length - 1);
  85. }
  86. function stringifySubselector(token) {
  87. let value = "";
  88. token.forEach(token => value += stringifyToken(token));
  89. return value;
  90. }
  91. function stringifyToken(token) {
  92. if (token.type in simpleSelectors) return simpleSelectors[token.type];
  93. if (token.type == "tag") return escapeName(token.name);
  94. if (token.type == "attribute") {
  95. if (token.action == "exists") return "[" + escapeName(token.name) + "]";
  96. if (token.expandedSelector && token.name == "id" && token.action == "equals" && !token.ignoreCase) return "#" + escapeName(token.value);
  97. if (token.expandedSelector && token.name == "class" && token.action == "element" && !token.ignoreCase) return "." + escapeName(token.value);
  98. return "[" +
  99. escapeName(token.name) + actionTypes[token.action] + "=\"" +
  100. escapeName(token.value) + "\"" + (token.ignoreCase ? "i" : "") + "]";
  101. }
  102. if (token.type == "pseudo") {
  103. if (token.data == null) return ":" + escapeName(token.name);
  104. if (typeof token.data == "string") return ":" + escapeName(token.name) + "(" + token.data + ")";
  105. return ":" + escapeName(token.name) + "(" + stringify(token.data) + ")";
  106. }
  107. if (token.type == "pseudo-element") {
  108. return "::" + escapeName(token.name);
  109. }
  110. }
  111. function escapeName(str) {
  112. return cssEscape(str).output;
  113. }
  114. return stringify;
  115. })();
// Matches a string that starts with "-" immediately followed by a digit;
// cssEscape uses it to decide whether a leading dash has to be escaped.
const REGEXP_STARTS_DASH_DECIMAL = /^-[\d]/;
// Public API of the module. The function declarations that follow this
// return statement are hoisted, so `parse` is already defined here.
return {
  parse,
  stringify
};
  121. // cssEscape taken from https://mathiasbynens.be/notes/css-escapes
  122. function cssEscape(string, escapeNonASCII) {
  123. const firstChar = string.charAt(0);
  124. const length = string.length;
  125. let value, character, charCode, output = "", counter = 0, surrogatePairCount = 0, extraCharCode; // low surrogate
  126. while (counter < length) {
  127. character = string.charAt(counter++);
  128. charCode = character.charCodeAt();
  129. if (escapeNonASCII && (charCode < 0x20 || charCode > 0x7E)) {
  130. if ((charCode & 0xF800) == 0xD800) {
  131. surrogatePairCount++;
  132. extraCharCode = string.charCodeAt(counter++);
  133. if ((charCode & 0xFC00) != 0xD800 || (extraCharCode & 0xFC00) != 0xDC00) {
  134. throw Error("UCS-2(decode): illegal sequence");
  135. }
  136. charCode = ((charCode & 0x3FF) << 10) + (extraCharCode & 0x3FF) + 0x10000;
  137. }
  138. value = "\\" + charCode.toString(16).toUpperCase() + " ";
  139. } else {
  140. if (character == "\t" || character == "\n" || character == "\v" || character == "\f" || character == ":") {
  141. value = "\\" + charCode.toString(16).toUpperCase() + " ";
  142. } else if (character == "[" || character == " " || character == "!" || character == "\"" || character == "#" || character == "$" || character == "%" || character == "&" || character == "'" || character == "(" || character == ")" || character == "*" || character == "+" || character == "," || character == "." || character == "/" || character == ";" || character == "<" || character == "=" || character == ">" || character == "?" || character == "@" || character == "[" || character == "\\" || character == "]" || character == "^" || character == "`" || character == "{," || character == "|" || character == "}" || character == "~" || character == "]") {
  143. value = "\\" + character;
  144. } else {
  145. value = character;
  146. }
  147. }
  148. output += value;
  149. }
  150. if (output.startsWith("_")) {
  151. output = "\\_" + output.slice(1);
  152. }
  153. if (output.match(REGEXP_STARTS_DASH_DECIMAL)) {
  154. output = "\\-" + output.slice(1);
  155. }
  156. if (firstChar == "0" || firstChar == "1" || firstChar == "2" || firstChar == "3" || firstChar == "4" || firstChar == "5" || firstChar == "6" || firstChar == "7" || firstChar == "8" || firstChar == "9") {
  157. output = "\\3" + firstChar + " " + output.slice(1);
  158. }
  159. return {
  160. "surrogatePairCount": surrogatePairCount,
  161. "output": output
  162. };
  163. }
  164. // unescape function taken from https://github.com/jquery/sizzle/blob/master/src/sizzle.js#L139
  165. function funescape(_, escaped, escapedWhitespace) {
  166. const high = "0x" + escaped - 0x10000;
  167. // NaN means non-codepoint
  168. // Support: Firefox
  169. // Workaround erroneous numeric interpretation of +"0x"
  170. return high != high || escapedWhitespace ?
  171. escaped :
  172. // BMP codepoint
  173. high < 0 ?
  174. String.fromCharCode(high + 0x10000) :
  175. // Supplemental Plane codepoint (surrogate pair)
  176. String.fromCharCode(high >> 10 | 0xD800, high & 0x3FF | 0xDC00);
  177. }
/**
 * Decodes the CSS escape sequences in `str`: every match of `re_escape` is
 * replaced with the value `funescape` returns for it.
 *
 * @param {string} str text that may contain backslash escapes
 * @returns {string} the text with its escapes decoded
 */
function unescapeCSS(str) {
  return str.replace(re_escape, funescape);
}
  181. function isWhitespace(c) {
  182. return c == " " || c == "\n" || c == "\t" || c == "\f" || c == "\r";
  183. }
  184. function parse(selector, options) {
  185. const subselects = [];
  186. selector = parseSelector(subselects, selector + "", options);
  187. if (selector != "") {
  188. throw new SyntaxError("Unmatched selector: " + selector);
  189. }
  190. return subselects;
  191. }
  192. function parseSelector(subselects, selector, options) {
  193. let tokens = [];
  194. let sawWS = false;
  195. let data, firstChar, name, quot;
  196. stripWhitespace(0);
  197. while (selector != "") {
  198. firstChar = selector.charAt(0);
  199. if (isWhitespace(firstChar)) {
  200. sawWS = true;
  201. stripWhitespace(1);
  202. } else if (firstChar in simpleSelectors) {
  203. tokens.push({ type: simpleSelectors[firstChar] });
  204. sawWS = false;
  205. stripWhitespace(1);
  206. } else if (firstChar == ",") {
  207. if (tokens.length == 0) {
  208. throw new SyntaxError("empty sub-selector");
  209. }
  210. subselects.push(tokens);
  211. tokens = [];
  212. sawWS = false;
  213. stripWhitespace(1);
  214. } else {
  215. if (sawWS) {
  216. if (tokens.length > 0) {
  217. tokens.push({ type: "descendant" });
  218. }
  219. sawWS = false;
  220. }
  221. if (firstChar == "*") {
  222. selector = selector.substr(1);
  223. tokens.push({ type: "universal" });
  224. } else if (firstChar in attribSelectors) {
  225. selector = selector.substr(1);
  226. tokens.push({
  227. expandedSelector: true,
  228. type: "attribute",
  229. name: attribSelectors[firstChar][0],
  230. action: attribSelectors[firstChar][1],
  231. value: getName(),
  232. ignoreCase: false
  233. });
  234. } else if (firstChar == "[") {
  235. selector = selector.substr(1);
  236. data = selector.match(re_attr);
  237. if (!data) {
  238. throw new SyntaxError("Malformed attribute selector: " + selector);
  239. }
  240. selector = selector.substr(data[0].length);
  241. name = unescapeCSS(data[1]);
  242. if (
  243. !options || (
  244. "lowerCaseAttributeNames" in options ?
  245. options.lowerCaseAttributeNames :
  246. !options.xmlMode
  247. )
  248. ) {
  249. name = name.toLowerCase();
  250. }
  251. tokens.push({
  252. type: "attribute",
  253. name: name,
  254. action: actionTypes[data[2]],
  255. value: unescapeCSS(data[4] || data[5] || ""),
  256. ignoreCase: !!data[6]
  257. });
  258. } else if (firstChar == ":") {
  259. if (selector.charAt(1) == ":") {
  260. selector = selector.substr(2);
  261. tokens.push({ type: "pseudo-element", name: getName().toLowerCase() });
  262. continue;
  263. }
  264. selector = selector.substr(1);
  265. name = getName().toLowerCase();
  266. data = null;
  267. if (selector.charAt(0) == "(") {
  268. if (name in unpackPseudos) {
  269. quot = selector.charAt(1);
  270. const quoted = quot in quotes;
  271. selector = selector.substr(quoted + 1);
  272. data = [];
  273. selector = parseSelector(data, selector, options);
  274. if (quoted) {
  275. if (selector.charAt(0) != quot) {
  276. throw new SyntaxError("unmatched quotes in :" + name);
  277. } else {
  278. selector = selector.substr(1);
  279. }
  280. }
  281. if (selector.charAt(0) != ")") {
  282. throw new SyntaxError("missing closing parenthesis in :" + name + " " + selector);
  283. }
  284. selector = selector.substr(1);
  285. } else {
  286. let pos = 1, counter = 1;
  287. for (; counter > 0 && pos < selector.length; pos++) {
  288. if (selector.charAt(pos) == "(" && !isEscaped(pos)) counter++;
  289. else if (selector.charAt(pos) == ")" && !isEscaped(pos)) counter--;
  290. }
  291. if (counter) {
  292. throw new SyntaxError("parenthesis not matched");
  293. }
  294. data = selector.substr(1, pos - 2);
  295. selector = selector.substr(pos);
  296. if (name in stripQuotesFromPseudos) {
  297. quot = data.charAt(0);
  298. if (quot == data.slice(-1) && quot in quotes) {
  299. data = data.slice(1, -1);
  300. }
  301. data = unescapeCSS(data);
  302. }
  303. }
  304. }
  305. tokens.push({ type: pseudoElements.indexOf(name) == -1 ? "pseudo" : "pseudo-element", name: name, data: data });
  306. } else if (re_name.test(selector)) {
  307. name = getName();
  308. if (!options || ("lowerCaseTags" in options ? options.lowerCaseTags : !options.xmlMode)) {
  309. name = name.toLowerCase();
  310. }
  311. tokens.push({ type: "tag", name: name });
  312. } else {
  313. if (tokens.length && tokens[tokens.length - 1].type == "descendant") {
  314. tokens.pop();
  315. }
  316. addToken(subselects, tokens);
  317. return selector;
  318. }
  319. }
  320. }
  321. addToken(subselects, tokens);
  322. return selector;
  323. function getName() {
  324. const sub = selector.match(re_name)[0];
  325. selector = selector.substr(sub.length);
  326. return unescapeCSS(sub);
  327. }
  328. function stripWhitespace(start) {
  329. while (isWhitespace(selector.charAt(start))) start++;
  330. selector = selector.substr(start);
  331. }
  332. function isEscaped(pos) {
  333. let slashCount = 0;
  334. while (selector.charAt(--pos) == "\\") slashCount++;
  335. return (slashCount & 1) == 1;
  336. }
  337. }
  338. function addToken(subselects, tokens) {
  339. if (subselects.length > 0 && tokens.length == 0) {
  340. throw new SyntaxError("empty sub-selector");
  341. }
  342. subselects.push(tokens);
  343. }
  344. })();