66
|
1 package lexers
|
|
2
|
|
3 import (
|
|
4 "strings"
|
|
5
|
|
6 . "github.com/alecthomas/chroma/v2" // nolint
|
|
7 )
|
|
8
|
|
9 // Restructuredtext lexer.
|
|
10 var Restructuredtext = Register(MustNewLexer(
|
|
11 &Config{
|
|
12 Name: "reStructuredText",
|
|
13 Aliases: []string{"rst", "rest", "restructuredtext"},
|
|
14 Filenames: []string{"*.rst", "*.rest"},
|
|
15 MimeTypes: []string{"text/x-rst", "text/prs.fallenstein.rst"},
|
|
16 },
|
|
17 restructuredtextRules,
|
|
18 ))
|
|
19
|
|
20 func restructuredtextRules() Rules {
|
|
21 return Rules{
|
|
22 "root": {
|
|
23 {"^(=+|-+|`+|:+|\\.+|\\'+|\"+|~+|\\^+|_+|\\*+|\\++|#+)([ \\t]*\\n)(.+)(\\n)(\\1)(\\n)", ByGroups(GenericHeading, Text, GenericHeading, Text, GenericHeading, Text), nil},
|
|
24 {"^(\\S.*)(\\n)(={3,}|-{3,}|`{3,}|:{3,}|\\.{3,}|\\'{3,}|\"{3,}|~{3,}|\\^{3,}|_{3,}|\\*{3,}|\\+{3,}|#{3,})(\\n)", ByGroups(GenericHeading, Text, GenericHeading, Text), nil},
|
|
25 {`^(\s*)([-*+])( .+\n(?:\1 .+\n)*)`, ByGroups(Text, LiteralNumber, UsingSelf("inline")), nil},
|
|
26 {`^(\s*)([0-9#ivxlcmIVXLCM]+\.)( .+\n(?:\1 .+\n)*)`, ByGroups(Text, LiteralNumber, UsingSelf("inline")), nil},
|
|
27 {`^(\s*)(\(?[0-9#ivxlcmIVXLCM]+\))( .+\n(?:\1 .+\n)*)`, ByGroups(Text, LiteralNumber, UsingSelf("inline")), nil},
|
|
28 {`^(\s*)([A-Z]+\.)( .+\n(?:\1 .+\n)+)`, ByGroups(Text, LiteralNumber, UsingSelf("inline")), nil},
|
|
29 {`^(\s*)(\(?[A-Za-z]+\))( .+\n(?:\1 .+\n)+)`, ByGroups(Text, LiteralNumber, UsingSelf("inline")), nil},
|
|
30 {`^(\s*)(\|)( .+\n(?:\| .+\n)*)`, ByGroups(Text, Operator, UsingSelf("inline")), nil},
|
|
31 {`^( *\.\.)(\s*)((?:source)?code(?:-block)?)(::)([ \t]*)([^\n]+)(\n[ \t]*\n)([ \t]+)(.*)(\n)((?:(?:\8.*|)\n)+)`, EmitterFunc(rstCodeBlock), nil},
|
|
32 {`^( *\.\.)(\s*)([\w:-]+?)(::)(?:([ \t]*)(.*))`, ByGroups(Punctuation, Text, OperatorWord, Punctuation, Text, UsingSelf("inline")), nil},
|
|
33 {`^( *\.\.)(\s*)(_(?:[^:\\]|\\.)+:)(.*?)$`, ByGroups(Punctuation, Text, NameTag, UsingSelf("inline")), nil},
|
|
34 {`^( *\.\.)(\s*)(\[.+\])(.*?)$`, ByGroups(Punctuation, Text, NameTag, UsingSelf("inline")), nil},
|
|
35 {`^( *\.\.)(\s*)(\|.+\|)(\s*)([\w:-]+?)(::)(?:([ \t]*)(.*))`, ByGroups(Punctuation, Text, NameTag, Text, OperatorWord, Punctuation, Text, UsingSelf("inline")), nil},
|
|
36 {`^ *\.\..*(\n( +.*\n|\n)+)?`, CommentPreproc, nil},
|
|
37 {`^( *)(:[a-zA-Z-]+:)(\s*)$`, ByGroups(Text, NameClass, Text), nil},
|
|
38 {`^( *)(:.*?:)([ \t]+)(.*?)$`, ByGroups(Text, NameClass, Text, NameFunction), nil},
|
|
39 {`^(\S.*(?<!::)\n)((?:(?: +.*)\n)+)`, ByGroups(UsingSelf("inline"), UsingSelf("inline")), nil},
|
|
40 {`(::)(\n[ \t]*\n)([ \t]+)(.*)(\n)((?:(?:\3.*|)\n)+)`, ByGroups(LiteralStringEscape, Text, LiteralString, LiteralString, Text, LiteralString), nil},
|
|
41 Include("inline"),
|
|
42 },
|
|
43 "inline": {
|
|
44 {`\\.`, Text, nil},
|
|
45 {"``", LiteralString, Push("literal")},
|
|
46 {"(`.+?)(<.+?>)(`__?)", ByGroups(LiteralString, LiteralStringInterpol, LiteralString), nil},
|
|
47 {"`.+?`__?", LiteralString, nil},
|
|
48 {"(`.+?`)(:[a-zA-Z0-9:-]+?:)?", ByGroups(NameVariable, NameAttribute), nil},
|
|
49 {"(:[a-zA-Z0-9:-]+?:)(`.+?`)", ByGroups(NameAttribute, NameVariable), nil},
|
|
50 {`\*\*.+?\*\*`, GenericStrong, nil},
|
|
51 {`\*.+?\*`, GenericEmph, nil},
|
|
52 {`\[.*?\]_`, LiteralString, nil},
|
|
53 {`<.+?>`, NameTag, nil},
|
|
54 {"[^\\\\\\n\\[*`:]+", Text, nil},
|
|
55 {`.`, Text, nil},
|
|
56 },
|
|
57 "literal": {
|
|
58 {"[^`]+", LiteralString, nil},
|
|
59 {"``((?=$)|(?=[-/:.,; \\n\\x00\\\u2010\\\u2011\\\u2012\\\u2013\\\u2014\\\u00a0\\'\\\"\\)\\]\\}\\>\\\u2019\\\u201d\\\u00bb\\!\\?]))", LiteralString, Pop(1)},
|
|
60 {"`", LiteralString, nil},
|
|
61 },
|
|
62 }
|
|
63 }
|
|
64
|
|
65 func rstCodeBlock(groups []string, state *LexerState) Iterator {
|
|
66 iterators := []Iterator{}
|
|
67 tokens := []Token{
|
|
68 {Punctuation, groups[1]},
|
|
69 {Text, groups[2]},
|
|
70 {OperatorWord, groups[3]},
|
|
71 {Punctuation, groups[4]},
|
|
72 {Text, groups[5]},
|
|
73 {Keyword, groups[6]},
|
|
74 {Text, groups[7]},
|
|
75 }
|
|
76 code := strings.Join(groups[8:], "")
|
|
77 lexer := Get(groups[6])
|
|
78 if lexer == nil {
|
|
79 tokens = append(tokens, Token{String, code})
|
|
80 iterators = append(iterators, Literator(tokens...))
|
|
81 } else {
|
|
82 sub, err := lexer.Tokenise(nil, code)
|
|
83 if err != nil {
|
|
84 panic(err)
|
|
85 }
|
|
86 iterators = append(iterators, Literator(tokens...), sub)
|
|
87 }
|
|
88 return Concaterator(iterators...)
|
|
89 }
|