-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy pathcodehigh.lua
141 lines (124 loc) · 4.3 KB
/
codehigh.lua
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
local P, R, S, V, C, Cb, Cc, Cf, Cg, Cp, Cs, Ct = lpeg.P, lpeg.R, lpeg.S, lpeg.V,
lpeg.C, lpeg.Cb, lpeg.Cc, lpeg.Cf, lpeg.Cg, lpeg.Cp, lpeg.Cs, lpeg.Ct
lpeg.locale(lpeg)
local alnum, alpha, cntrl, digit, graph, lower, punct, space, upper, xdigit =
lpeg.alnum, lpeg.alpha, lpeg.cntrl, lpeg.digit, lpeg.graph,
lpeg.lower, lpeg.punct, lpeg.space, lpeg.upper, lpeg.xdigit
local function anywhere(p)
return P{ Cp() * p * Cp() + 1 * V(1) }
end
local language = {}
language["latex"] =
{
{1, "Package", P"\\" * (P"documentclass" + P"usepackage")},
{6, "NewCommand", P"\\newcommand"},
{3, "SetCommand", P"\\set" * alpha ^ 1},
{4, "BeginEnd", P"\\" * (P"begin" + P"end")},
{5, "Section", P"\\" * (P"part" + P"chapter" + P"section" + P"subsection")},
{2, "Command", P"\\" * alpha ^ 1},
{7, "Brace", S"{}"},
{8, "MathMode", P"$"},
{9, "Comment", P"%" * (P(1) - S"\r\n") ^ 0 * (S"\r\n" + -1)},
}
language["latex/math"] =
{
{6, "LeftRight", P"\\" * (P"left" + P"right")},
{2, "Command", P"\\" * alpha ^ 1},
{8, "MathMode", P"$"},
{4, "Script", S"_^"},
{5, "Number", digit ^ 1},
{1, "Brace", S"{}"},
{7, "Bracket", S"[]"},
{3, "Parenthesis", S"()"},
{9, "Comment", P"%" * (P(1) - S"\r\n") ^ 0 * (S"\r\n" + -1)},
}
language["latex/table"] =
{
{8, "Newline", P"\\\\"},
{1, "Alignment", P"&" },
{6, "BeginEnd", P"\\" * (P"begin" + P"end")},
{4, "Command", P"\\" * alpha ^ 1},
{2, "Brace", S"{}"},
{3, "Bracket", S"[]"},
{9, "Comment", P"%" * (P(1) - S"\r\n") ^ 0 * (S"\r\n" + -1)},
}
language["latex/latex2"] =
{
{1, "Argument", P"#" ^ 1 * digit},
{6, "NewCommand", P"\\" * (P"" + S"egx") * P"def"},
{5, "SetCommand", P"\\set" * alpha ^ 1},
{4, "PrivateCmd", P"\\" * alpha ^ 0 * P"@" * (alpha + "@") ^ 0},
{3, "Command", P"\\" * alpha ^ 1},
{2, "Brace", S"{}"},
{7, "Bracket", S"[]"},
{9, "Comment", P"%" * (P(1) - S"\r\n") ^ 0 * (S"\r\n" + -1)},
}
language["latex/latex3"] =
{
{1, "Argument", P"#" ^ 1 * digit},
{2, "PrivateVar", P"\\" * S"cgl" * P"__" * (alpha + S"_:@") ^ 1},
{5, "PrivateFun", P"\\" * P"__" * (alpha + S"_:@") ^ 1},
{4, "PublicVar", P"\\" * S"cgl" * P"_" * (alpha + S"_:@") ^ 1},
{6, "PublicFun", P"\\" * (alpha + S"_:@") ^ 1},
{8, "Brace", S"{}"},
{3, "Bracket", S"[]"},
{9, "Comment", P"%" * (P(1) - S"\r\n") ^ 0 * (S"\r\n" + -1)},
}
local function FindMatch(lang, code)
syntax = language[lang]
local b, e, s = -1, -1, ""
for _, v in ipairs(syntax) do
local p = v[3]
mb, me = anywhere(p):match(code)
if mb and (b == -1 or mb < b) then
b = mb
e = me
s = v[1]
end
end
--print(b, e, s)
return b, e, s
end
---- We can not use "catcodetable@string" because space has catcode 10 with it,
---- which causes multiple spaces are printed as single space in "tex.tprint".
-- local cctab = luatexbase.registernumber("catcodetable@string")
---- We don't have "catcodetable@other" inside source2e
-- local cctab = luatexbase.registernumber("catcodetable@other")
---- Here is the catcodetable from luatexbase package
local cctab = luatexbase.catcodetables.CatcodeTableOther
local function PrintCommand(name, content)
tex.tprint(
{"\\expandafter\\gdef\\csname " .. name .. "\\endcsname{"},
{cctab, content}, -- all characters including spaces have catcode 12
{"}"}
)
end
local count = 0
local function PrintCode(style, code)
count = count + 1
local name = "l__cdhh_parse_code_" .. count .. "_tl"
PrintCommand(name, code)
name = "l__cdhh_parse_style_" .. count .. "_tl"
PrintCommand(name, style)
end
function ParseCode(lang, code)
count = 0
while code ~= "" do
local b, e, s = FindMatch(lang, code)
--texio.write_nl(code)
--texio.write_nl("b = " .. b)
--texio.write_nl("e = " .. e)
--texio.write_nl("s = " .. s)
if b == -1 then
PrintCode(0, code)
code = ""
else
PrintCode(0, code:sub(1, b-1))
PrintCode(s, code:sub(b, e-1))
code = code:sub(e)
end
end
local name = "l__cdhh_parse_code_count_tl"
tex.sprint("\\expandafter\\gdef\\csname " .. name .. "\\endcsname{" .. count .. "}")
end
return { FindMatch = FindMatch, PrintCode = PrintCode, ParseCode = ParseCode }