Skip to content

Commit

Permalink
Regex: Added aliases and minor improvements (#2325)
Browse files Browse the repository at this point in the history
This adds a lot of aliases to the regex tokens, so themes can apply their styles. It also makes a few improvements. See the PR for more details.
  • Loading branch information
RunDevelopment committed May 7, 2020
1 parent 6d663b6 commit 8a72830
Show file tree
Hide file tree
Showing 6 changed files with 132 additions and 30 deletions.
80 changes: 55 additions & 25 deletions components/prism-regex.js
Expand Up @@ -4,8 +4,15 @@
pattern: /\\[\\(){}[\]^$+*?|.]/,
alias: 'escape'
};
var escape = /\\(?:x[\da-fA-F]{2}|u[\da-fA-F]{4}|u\{[\da-fA-F]+\}|c[a-zA-Z]|0[0-7]{0,2}|[123][0-7]{2}|.)/
var charClass = /\\[wsd]|\.|\\p{[^{}]+}/i
var escape = /\\(?:x[\da-fA-F]{2}|u[\da-fA-F]{4}|u\{[\da-fA-F]+\}|c[a-zA-Z]|0[0-7]{0,2}|[123][0-7]{2}|.)/;
var charClass = {
pattern: /\.|\\[wsd]|\\p{[^{}]+}/i,
alias: 'class-name'
};
var charClassWithoutDot = {
pattern: /\\[wsd]|\\p{[^{}]+}/i,
alias: 'class-name'
};

var rangeChar = '(?:[^\\\\-]|' + escape.source + ')';
var range = RegExp(rangeChar + '-' + rangeChar);
Expand All @@ -17,16 +24,6 @@
alias: 'variable'
};

var backreference = [
/\\(?![123][0-7]{2})[1-9]/, // a backreference which is not an octal escape
{
pattern: /\\k<[^<>']+>/,
inside: {
'group-name': groupName
}
}
];

Prism.languages.regex = {
'charset': {
pattern: /((?:^|[^\\])(?:\\\\)*)\[(?:[^\\\]]|\\[\s\S])*\]/,
Expand All @@ -35,25 +32,47 @@
'charset-negation': {
pattern: /(^\[)\^/,
lookbehind: true,
alias: 'operator'
},
'charset-punctuation': {
pattern: /^\[|\]$/,
alias: 'punctuation'
},
'charset-punctuation': /^\[|\]$/,
'range': {
pattern: range,
inside: {
'escape': escape,
'range-punctuation': /-/
'range-punctuation': {
pattern: /-/,
alias: 'operator'
}
}
},
'special-escape': specialEscape,
'charclass': charClass,
'backreference': backreference,
'charclass': charClassWithoutDot,
'escape': escape
}
},
'special-escape': specialEscape,
'charclass': charClass,
'backreference': backreference,
'anchor': /[$^]|\\[ABbGZz]/,
'backreference': [
{
// a backreference which is not an octal escape
pattern: /\\(?![123][0-7]{2})[1-9]/,
alias: 'keyword'
},
{
pattern: /\\k<[^<>']+>/,
alias: 'keyword',
inside: {
'group-name': groupName
}
}
],
'anchor': {
pattern: /[$^]|\\[ABbGZz]/,
alias: 'function'
},
'escape': escape,
'group': [
{
Expand All @@ -62,14 +81,24 @@

// (), (?<name>), (?'name'), (?>), (?:), (?=), (?!), (?<=), (?<!), (?is-m), (?i-m:)
pattern: /\((?:\?(?:<[^<>']+>|'[^<>']+'|[>:]|<?[=!]|[idmnsuxU]+(?:-[idmnsuxU]+)?:?))?/,
alias: 'punctuation',
inside: {
'group-name': groupName
}
},
/\)/
{
pattern: /\)/,
alias: 'punctuation'
}
],
'quantifier': /[+*?]|\{(?:\d+,?\d*)\}/,
'alternation': /\|/
'quantifier': {
pattern: /(?:[+*?]|\{(?:\d+,?\d*)\})[?+]?/,
alias: 'number'
},
'alternation': {
pattern: /\|/,
alias: 'keyword'
}
};


Expand All @@ -84,12 +113,13 @@
var grammar = Prism.languages[lang];
if (grammar) {
grammar['regex'].inside = {
'regex-flags': /[a-z]+$/,
'regex-delimiter': /^\/|\/$/,
'language-regex': {
pattern: /[\s\S]+/,
pattern: /^(\/)[\s\S]+(?=\/[a-z]*$)/i,
lookbehind: true,
inside: Prism.languages.regex
}
},
'regex-flags': /[a-z]+$/i,
'regex-delimiter': /^\/|\/$/,
};
}
});
Expand Down
2 changes: 1 addition & 1 deletion components/prism-regex.min.js

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

46 changes: 46 additions & 0 deletions examples/prism-regex.html
@@ -0,0 +1,46 @@
<p>The regex languages con be used for inline regex snippets like <code>(?&lt;number>\d+)[-_ ]\k&lt;number></code> but it mainly adds itself to other languages such as:</p>

<h2>JavaScript</h2>
<pre class="language-javascript" data-dependencies="regex"><code>Prism.languages.markup = {
'comment': /&lt;!--[\s\S]*?-->/,
'prolog': /&lt;\?[\s\S]+?\?>/,
'doctype': {
pattern: /&lt;!DOCTYPE(?:[^>"'[\]]|"[^"]*"|'[^']*')+(?:\[(?:[^&lt;"'\]]|"[^"]*"|'[^']*'|&lt;(?!!--)|&lt;!--(?:[^-]|-(?!->))*-->)*\]\s*)?>/i,
greedy: true
},
'cdata': /&lt;!\[CDATA\[[\s\S]*?]]>/i,
'tag': {
pattern: /&lt;\/?(?!\d)[^\s>\/=$&lt;%]+(?:\s(?:\s*[^\s>\/=]+(?:\s*=\s*(?:"[^"]*"|'[^']*'|[^\s'">=]+(?=[\s>]))|(?=[\s/>])))+)?\s*\/?>/i,
greedy: true,
inside: {
'tag': {
pattern: /^&lt;\/?[^\s>\/]+/i,
inside: {
'punctuation': /^&lt;\/?/,
'namespace': /^[^\s>\/:]+:/
}
},
'attr-value': {
pattern: /=\s*(?:"[^"]*"|'[^']*'|[^\s'">=]+)/i,
inside: {
'punctuation': [
/^=/,
{
pattern: /^(\s*)["']|["']$/,
lookbehind: true
}
]
}
},
'punctuation': /\/?>/,
'attr-name': {
pattern: /[^\s>\/]+/,
inside: {
'namespace': /^[^\s>\/:]+:/
}
}

}
},
'entity': /&amp;#?[\da-z]{1,8};/i
};</code></pre>
4 changes: 1 addition & 3 deletions tests/examples-test.js
Expand Up @@ -13,9 +13,7 @@ describe('Examples', function () {
'markup-templating',
't4-templating',
// this does alter some languages but it's mainly a library
'javadoclike',
// Regex doesn't have any classes supported by our themes and mainly extends other languages
'regex'
'javadoclike'
]);
const validFiles = new Set();

Expand Down
8 changes: 8 additions & 0 deletions tests/languages/regex/charset_feature.test
Expand Up @@ -2,6 +2,7 @@
[^]
[foo]
[\]\b]
[.^$\1]

----------------------------------------------------

Expand All @@ -28,6 +29,13 @@
["special-escape", "\\]"],
["escape", "\\b"],
["charset-punctuation", "]"]
]],

["charset", [
["charset-punctuation", "["],
".^$",
["escape", "\\1"],
["charset-punctuation", "]"]
]]
]

Expand Down
22 changes: 21 additions & 1 deletion tests/languages/regex/quantifier_feature.test
@@ -1,6 +1,12 @@
* + ?
{2} {2,} {0,1}

*? +? ??
{2}? {2,}? {0,1}?

*+ ++ ?+
{2}+ {2,}+ {0,1}+

----------------------------------------------------

[
Expand All @@ -9,7 +15,21 @@
["quantifier", "?"],
["quantifier", "{2}"],
["quantifier", "{2,}"],
["quantifier", "{0,1}"]
["quantifier", "{0,1}"],

["quantifier", "*?"],
["quantifier", "+?"],
["quantifier", "??"],
["quantifier", "{2}?"],
["quantifier", "{2,}?"],
["quantifier", "{0,1}?"],

["quantifier", "*+"],
["quantifier", "++"],
["quantifier", "?+"],
["quantifier", "{2}+"],
["quantifier", "{2,}+"],
["quantifier", "{0,1}+"]
]

----------------------------------------------------
Expand Down

0 comments on commit 8a72830

Please sign in to comment.