summaryrefslogtreecommitdiff
path: root/tex/context/modules/mkiv/x-ldx.lua
blob: e88c4c79772fb597d6695dc93d237e9338b07750 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
if not modules then modules = { } end modules ['x-ldx'] = {
    version   = 1.001,
    comment   = "companion to x-ldx.mkiv",
    author    = "Hans Hagen, PRAGMA-ADE, Hasselt NL",
    copyright = "PRAGMA ADE / ConTeXt Development Team",
    license   = "see context related readme files"
}

-- --[[ldx--
-- <topic>Introduction</topic>
-- --ldx]]--

--[[ldx--
<source>Lua Documentation Module</source>

This file is part of the <logo label='context'/> documentation suite and
itself serves as an example of using <logo label='lua'/> in combination
with <logo label='tex'/>.

I will rewrite this using lpeg. On the other hand, we cannot expect proper
<logo label='tex'/> and for educational purposed the syntax might be wrong.

Todo: use the scite parser.
--ldx]]--

local banner = "version 1.0.1 - 2007+ - PRAGMA ADE / CONTEXT"

local report = logs.reporter("x-ldx")

--[[
This script needs a few libraries. Instead of merging the code here
we can use

<typing>
mtxrun --internal x-ldx.lua
</typing>

That way, the libraries included in the runner will be used.
]]--

-- libraries l-string.lua l-table.lua l-io.lua l-file.lua

-- begin library merge
-- end library merge

local gsub, find, sub = string.gsub, string.find, string.sub
local splitstring, emptystring = string.split, string.is_empty
local concat = table.concat

--[[
Just a demo comment line. We will handle such multiline comments but
only when they start and end at the beginning of a line. More rich
comments are tagged differently.
]]--

--[[ldx--
First we define a proper namespace for this module. The <q>l</q> stands for
<logo label='lua'/>, the <q>d</q> for documentation and the <q>x</q> for
<logo label='xml'/>.
--ldx]]--

if not ldx then ldx = { } end

--[[ldx--
We load the lua file into a table. The entries in this table themselves are
tables and have keys like <t>code</t> and <t>comment</t>.
--ldx]]--

function ldx.load(filename)
    local data = file.readdata(filename)
    local expr = "%s*%-%-%[%[ldx%-*%s*(.-)%s*%-%-ldx%]%]%-*%s*"
    local i, j, t = 0, 0, { }
    while true do
        local comment, ni
        ni, j, comment = find(data, expr, j)
        if not ni then break end
        t[#t+1] = { code = sub(data, i, ni-1) }
        t[#t+1] = { comment = comment }
        i = j + 1
    end
    local str = sub(data, i, #data)
    str = gsub(str, "^%s*(.-)%s*$", "%1")
    if #str > 0 then
        t[#t+1] = { code = str }
    end
    return t
end

--[[ldx--
We will tag keywords so that we can higlight them using a special font
or color. Users can extend this list when needed.
--ldx]]--

ldx.keywords = { }

--[[ldx--
Here come the reserved words:
--ldx]]--

ldx.keywords.reserved = {
    ["and"]      = 1,
    ["break"]    = 1,
    ["do"]       = 1,
    ["else"]     = 1,
    ["elseif"]   = 1,
    ["end"]      = 1,
    ["false"]    = 1,
    ["for"]      = 1,
    ["function"] = 1,
    ["if"]       = 1,
    ["in"]       = 1,
    ["local"]    = 1,
    ["nil"]      = 1,
    ["not"]      = 1,
    ["or"]       = 1,
    ["repeat"]   = 1,
    ["return"]   = 1,
    ["then"]     = 1,
    ["true"]     = 1,
    ["until"]    = 1,
    ["while"]    = 1
}

--[[ldx--
We need to escape a few tokens. We keep the hash local to the
definition but set it up only once, hence the <key>do</key>
construction.
--ldx]]--

do
    local e = { [">"] = "&gt;", ["<"] = "&lt;", ["&"] = "&amp;" }
    function ldx.escape(str)
        return (gsub(str, "([><&])",e))
    end
end

--[[ldx--
Enhancing the code is a bit tricky due to the fact that we have to
deal with strings and escaped quotes within these strings. Before we
mess around with the code, we hide the strings, and after that we
insert them again. Single and double quoted strings are tagged so
that we can use a different font to highlight them.
--ldx]]--

ldx.make_index = true

function ldx.enhance(data) -- i need to use lpeg and then we can properly autoindent -)
    local e = ldx.escape
    for k=1,#data do
        local v = data[k]
        if v.code then
            local dqs, sqs, com, cmt, cod = { }, { }, { }, { }, e(v.code)
            cod = gsub(cod, '\\"', "##d##")
            cod = gsub(cod, "\\'", "##s##")
            cod = gsub(cod, "%-%-%[%[.-%]%]%-%-", function(s)
                cmt[#cmt+1] = s
                return "<l<<<".. #cmt ..">>>l>"
            end)
            cod = gsub(cod, "%-%-([^\n]*)", function(s)
                com[#com+1] = s
                return "<c<<<".. #com ..">>>c>"
            end)
            cod = gsub(cod, "(%b\"\")", function(s)
                dqs[#dqs+1] = sub(s,2,-2) or ""
                return "<d<<<".. #dqs ..">>>d>"
            end)
            cod = gsub(cod, "(%b\'\')", function(s)
                sqs[#sqs+1] = sub(s,2,-2) or ""
                return "<s<<<".. #sqs ..">>>s>"
            end)
            cod = gsub(cod, "(%a+)",function(key)
                local class = ldx.keywords.reserved[key]
                if class then
                    return "<key class='" .. class .. "'>" .. key .. "</key>"
                else
                    return key
                end
            end)
            cod = gsub(cod, "<s<<<(%d+)>>>s>", function(s)
                return "<sqs>" .. sqs[tonumber(s)] .. "</sqs>"
            end)
            cod = gsub(cod, "<d<<<(%d+)>>>d>", function(s)
                return "<dqs>" .. dqs[tonumber(s)] .. "</dqs>"
            end)
            cod = gsub(cod, "<c<<<(%d+)>>>c>", function(s)
                return "<com>" .. com[tonumber(s)] .. "</com>"
            end)
            cod = gsub(cod, "<l<<<(%d+)>>>l>", function(s)
                return cmt[tonumber(s)]
            end)
            cod = gsub(cod, "##d##", "\\\"")
            cod = gsub(cod, "##s##", "\\\'")
            if ldx.make_index then
                local lines = splitstring(cod,"\n")
                local f = "(<key class='1'>function</key>)%s+([%w%.]+)%s*%("
                for k=1,#lines do
                    local v = lines[k]
                    -- functies
                    v = gsub(v,f,function(key, str)
                        return "<function>" .. str .. "</function>("
                    end)
                    -- variables
                    v = gsub(v,"^([%w][%w%,%s]-)(=[^=])",function(str, rest)
                        local t = splitstring(str,",%s*")
                        for k=1,#t do
                            t[k] = "<variable>" .. t[k] .. "</variable>"
                        end
                        return concat(t,", ") .. rest
                    end)
                    -- so far
                    lines[k] = v
                end
                v.code = concat(lines,"\n")
            else
                v.code = cod
            end
        end
    end
end

--[[ldx--
We're now ready to save the file in <logo label='xml'/> format. This boils
down to wrapping the code and comment as well as the whole document. We tag
lines in the code as such so that we don't need messy <t>CDATA</t> constructs
and by calculating the indentation we also avoid space troubles. It also makes
it possible to change the indentation afterwards.
--ldx]]--

local newmethod = true

function ldx.as_xml(data) -- ldx: not needed
    local t, cmode = { }, false
    t[#t+1] = "<?xml version='1.0' standalone='yes'?>\n"
    t[#t+1] = "\n<document xmlns:ldx='http://www.pragma-ade.com/schemas/ldx.rng' xmlns='http://www.pragma-ade.com/schemas/ldx.rng'>\n"
    for k=1,#data do
        local v = data[k]
        if v.code and not emptystring(v.code) then
            if newmethod then
                t[#t+1] = "\n<luacode><![CDATA[\n"
                t[#t+1] = v.code
                t[#t+1] = "]]></luacode>\n"
            else
                t[#t+1] = "\n<code>\n"
                local split = splitstring(v.code,"\n")
                for k=1,#split do -- make this faster
                    local v = split[k]
                    local a, b = find(v,"^(%s+)")
                    if v then v = gsub(v,"[\n\r ]+$","") end
                    if a and b then
                        v = sub(v,b+1,#v)
                        if cmode then
                            t[#t+1] = "<line comment='yes' n='" .. b .. "'>" .. v .. "</line>\n"
                        else
                            t[#t+1] = "<line n='" .. b .. "'>" .. v .. "</line>\n"
                        end
                    elseif emptystring(v) then
                        if cmode then
                            t[#t+1] = "<line comment='yes'/>\n"
                        else
                            t[#t+1] = "<line/>\n"
                        end
                    elseif find(v,"^%-%-%[%[") then
                        t[#t+1] = "<line comment='yes'>" .. v .. "</line>\n"
                        cmode= true
                    elseif find(v,"^%]%]%-%-") then
                        t[#t+1] = "<line comment='yes'>" .. v .. "</line>\n"
                        cmode= false
                    elseif cmode then
                        t[#t+1] = "<line comment='yes'>" .. v .. "</line>\n"
                    else
                        t[#t+1] = "<line>" .. v .. "</line>\n"
                    end
                end
                t[#t+1] = "</code>\n"
            end
        elseif v.comment then
            t[#t+1] = "\n<comment>\n" .. v.comment .. "\n</comment>\n"
        else
            -- cannot happen
        end
    end
    t[#t+1] = "\n</document>\n"
    return concat(t,"")
end

--[[ldx--
Saving the result is a trivial effort.
--ldx]]--

function ldx.save(filename,data)
    file.savedata(filename,ldx.as_xml(data))
end

--[[ldx--
The next function wraps it all in one call:
--ldx]]--

function ldx.convert(luaname,ldxname)
    if not lfs.isfile(luaname) then
        file.addsuffix(luaname,"lua")
    end
    if lfs.isfile(luaname) then
        if not ldxname then
            ldxname = file.replacesuffix(luaname,"ldx")
        end
        report("converting file %a to %a",luaname,ldxname)
        local data = ldx.load(luaname)
        if data then
--             ldx.enhance(data)
            if ldxname ~= luaname then
                ldx.save(ldxname,data)
            end
        else
            report("invalid file %a",luaname)
        end
    else
        report("unknown file %a",luaname)
    end
end

--[[ldx--
This module can be used directly:

<typing>
mtxrun --internal x-ldx somefile.lua
</typing>

will produce an ldx file that can be processed with <logo label='context'/>
by running:

<typing>
context --use=x-ldx --forcexml somefile.ldx
</typing>

You can do this in one step by saying:

<typing>
context --ctx=x-ldx somefile.lua
</typing>

This will trigger <logo label='context'/> into loading the mentioned
<logo label='ctx'/> file. That file describes the conversion as well
as the module to be used.

The main conversion call is:
--ldx]]--

-- todo: assume usage of "mtxrun --script x-ldx", maybe make it mtx-ldx

if environment.files and environment.files[1] then
    ldx.convert(environment.files[1],environment.files[2])
else
    report("no file given")
end