if not modules then modules = { } end modules ['back-exp'] = {
version = 1.001,
comment = "companion to back-exp.mkiv",
author = "Hans Hagen, PRAGMA-ADE, Hasselt NL",
copyright = "PRAGMA ADE / ConTeXt Development Team",
license = "see context related readme files"
}
-- Todo: share properties more with tagged pdf (or thge reverse)
-- Because we run into the 200 local limit we quite some do .. end wrappers .. not always
-- that nice but it has to be.
-- Experiments demonstrated that mapping to
and classes is messy because we have to
-- package attributes (some 30) into one set of (space seperatated but prefixed classes)
-- which only makes things worse .. so if you want something else, use xslt to get there.
-- language -> only mainlanguage, local languages should happen through start/stoplanguage
-- tocs/registers -> maybe add a stripper (i.e. just don't flush entries in final tree)
-- footnotes -> css 3
-- bodyfont -> in styles.css
-- Because we need to look ahead we now always build a tree (this was optional in
-- the beginning). The extra overhead in the frontend is neglectable.
--
-- We can optimize the code ... currently the overhead is some 10% for xml + html so
-- there is no hurry.
-- todo: move critital formatters out of functions
-- todo: delay loading (apart from basic tag stuff)
-- problem : too many local variables
-- check setting __i__
local next, type, tonumber = next, type, tonumber
local sub, gsub, match = string.sub, string.gsub, string.match
local validstring = string.valid
local lpegmatch = lpeg.match
local utfchar, utfvalues, utflen = utf.char, utf.values, utf.len
local concat, merge, sort, setmetatableindex = table.concat, table.merge, table.sort, table.setmetatableindex
local sortedhash, sortedkeys = table.sortedhash, table.sortedkeys
local formatters = string.formatters
local todimen = number.todimen
local replacetemplate = utilities.templates.replace
local settings_to_array = utilities.parsers.settings_to_array
local addsuffix, joinfile, nameonly, basename, filesuffix = file.addsuffix, file.join, file.nameonly, file.basename, file.suffix
local trace_export = false trackers.register ("export.trace", function(v) trace_export = v end)
local trace_spacing = false trackers.register ("export.trace.spacing", function(v) trace_spacing = v end)
local trace_details = false trackers.register ("export.trace.details", function(v) trace_details = v end)
local less_state = false directives.register("export.lessstate", function(v) less_state = v end)
local show_comment = true directives.register("export.comment", function(v) show_comment = v end)
-- maybe we will also support these:
--
-- local css_hyphens = false directives.register("export.css.hyphens", function(v) css_hyphens = v end)
-- local css_textalign = false directives.register("export.css.textalign", function(v) css_textalign = v end)
-- local css_bodyfontsize = false directives.register("export.css.bodyfontsize", function(v) css_bodyfontsize = v end)
-- local css_textwidth = false directives.register("export.css.textwidth", function(v) css_textwidth = v end)
local report_export = logs.reporter("backend","export")
local nodes = nodes
local attributes = attributes
local variables = interfaces.variables
local v_yes = variables.yes
local v_no = variables.no
local v_xml = variables.xml
local v_hidden = variables.hidden
local implement = interfaces.implement
local included = backends.included
local tasks = nodes.tasks
local fontchar = fonts.hashes.characters
local fontquads = fonts.hashes.quads
local languagenames = languages.numbers
local texgetcount = tex.getcount
local references = structures.references
local structurestags = structures.tags
local taglist = structurestags.taglist
local specifications = structurestags.specifications
local properties = structurestags.properties
local locatedtag = structurestags.locatedtag
structurestags.usewithcare = { }
local starttiming = statistics.starttiming
local stoptiming = statistics.stoptiming
local characterdata = characters.data
local overloads = fonts.mappings.overloads
-- todo: more locals (and optimize)
local exportversion = "0.35"
local mathmlns = "http://www.w3.org/1998/Math/MathML"
local contextns = "http://www.contextgarden.net/context/export" -- whatever suits
local cssnamespaceurl = "@namespace context url('%namespace%') ;"
local cssnamespace = "context|"
----- cssnamespacenop = "/* no namespace */"
local usecssnamespace = false
local nofcurrentcontent = 0 -- so we don't free (less garbage collection)
local currentcontent = { }
local currentnesting = nil
local currentattribute = nil
local last = nil
local currentparagraph = nil
local noftextblocks = 0
----- hyphencode = 0xAD
local hyphen = utfchar(0xAD) -- todo: also emdash etc
local tagsplitter = structurestags.patterns.splitter
----- colonsplitter = lpeg.splitat(":")
----- dashsplitter = lpeg.splitat("-")
local threshold = 65536
local indexing = false
local keephyphens = false
local exportproperties = false
local finetuning = { }
local treestack = { }
local nesting = { }
local currentdepth = 0
local wrapups = { }
local tree = { data = { }, fulltag == "root" } -- root
local treehash = { }
local extras = { }
local checks = { }
local fixes = { }
local finalizers = { }
local nofbreaks = 0
local used = { }
local exporting = false
local restart = false
local specialspaces = { [0x20] = " " } -- for conversion
local somespace = { [0x20] = true, [" "] = true } -- for testing
local entities = { ["&"] = "&", [">"] = ">", ["<"] = "<" }
local attribentities = { ["&"] = "&", [">"] = ">", ["<"] = "<", ['"'] = "quot;" }
local p_entity = lpeg.replacer(entities) -- was: entityremapper = utf.remapper(entities)
local p_attribute = lpeg.replacer(attribentities)
local p_escaped = lpeg.patterns.xml.escaped
local f_tagid = formatters["%s-%04i"]
-- local alignmapping = {
-- flushright = "right",
-- middle = "center",
-- flushleft = "left",
-- }
local defaultnature = "mixed" -- "inline"
setmetatableindex(used, function(t,k)
if k then
local v = { }
t[k] = v
return v
end
end)
local f_entity = formatters["%X;"]
local f_attribute = formatters[" %s=%q"]
local f_property = formatters[" %s%s=%q"]
setmetatableindex(specialspaces, function(t,k)
local v = utfchar(k)
t[k] = v
entities[v] = f_entity(k)
somespace[k] = true
somespace[v] = true
return v
end)
local namespaced = {
-- filled on
}
local namespaces = {
msubsup = "m",
msub = "m",
msup = "m",
mn = "m",
mi = "m",
ms = "m",
mo = "m",
mtext = "m",
mrow = "m",
mfrac = "m",
mroot = "m",
msqrt = "m",
munderover = "m",
munder = "m",
mover = "m",
merror = "m",
math = "m",
mrow = "m",
mtable = "m",
mtr = "m",
mtd = "m",
mfenced = "m",
maction = "m",
mspace = "m",
-- only when testing
mstacker = "m",
mstackertop = "m",
mstackermid = "m",
mstackerbot = "m",
}
setmetatableindex(namespaced, function(t,k)
if k then
local namespace = namespaces[k]
local v = namespace and namespace .. ":" .. k or k
t[k] = v
return v
end
end)
local function attribute(key,value)
if value and value ~= "" then
return f_attribute(key,lpegmatch(p_attribute,value))
else
return ""
end
end
local function setattribute(di,key,value,escaped)
if value and value ~= "" then
local a = di.attributes
if escaped then
value = lpegmatch(p_escaped,value)
end
if not a then
di.attributes = { [key] = value }
else
a[key] = value
end
end
end
local listdata = { } -- this has to be done otherwise: each element can just point back to ...
function wrapups.hashlistdata()
local c = structures.lists.collected
for i=1,#c do
local ci = c[i]
local tag = ci.references.tag
if tag then
local m = ci.metadata
local t = m.kind .. ">" .. tag -- todo: use internal (see strc-lst.lua where it's set)
listdata[t] = ci
end
end
end
function structurestags.setattributehash(attr,key,value) -- public hash
local specification = taglist[attr]
if specification then
specification[key] = value
else
-- some kind of error
end
end
local usedstyles = { }
local usedimages = { }
local referencehash = { } -- move ?
local destinationhash = { } -- move ?
structurestags.backend = {
setattribute = setattribute,
extras = extras,
checks = checks,
fixes = fixes,
listdata = listdata,
finalizers = finalizers,
usedstyles = usedstyles,
usedimages = usedimages,
referencehash = referencehash,
destinationhash = destinationhash,
}
local namespacetemplate = [[
/* %what% for file %filename% */
%cssnamespaceurl%
]]
do
-- experiment: styles and images
--
-- officially we should convert to bp but we round anyway
-- /* padding : ; */
-- /* text-justify : inter-word ; */
-- /* text-align : justify ; */
local documenttemplate = [[
document,
%namespace%div.document {
font-size : %size% !important ;
max-width : %width% !important ;
text-align : %align% !important ;
hyphens : %hyphens% !important ;
}]]
local styletemplate = [[
%element%[detail="%detail%"],
%namespace%div.%element%.%detail% {
display : inline ;
font-style : %style% ;
font-variant : %variant% ;
font-weight : %weight% ;
font-family : %family% ;
color : %color% ;
}]]
local numbertoallign = {
[0] = "justify", ["0"] = "justify", [variables.normal ] = "justify",
"right", ["1"] = "right", [variables.flushright] = "right",
"center", ["2"] = "center", [variables.middle ] = "center",
"left", ["3"] = "left", [variables.flushleft ] = "left",
}
function wrapups.allusedstyles(filename)
local result = { replacetemplate(namespacetemplate, {
what = "styles",
filename = filename,
namespace = contextns,
-- cssnamespaceurl = usecssnamespace and cssnamespaceurl or cssnamespacenop,
cssnamespaceurl = cssnamespaceurl,
},false,true) }
--
local bodyfont = finetuning.bodyfont
local width = finetuning.width
local hyphen = finetuning.hyphen
local align = finetuning.align
--
if type(bodyfont) == "number" then
bodyfont = todimen(bodyfont)
else
bodyfont = "12pt"
end
if type(width) == "number" then
width = todimen(width) or "50em"
else
width = "50em"
end
if hyphen == v_yes then
hyphen = "manual"
else
hyphen = "inherited"
end
if align then
align = numbertoallign[align]
end
if not align then
align = hyphen and "justify" or "inherited"
end
--
result[#result+1] = replacetemplate(documenttemplate,{
size = bodyfont,
width = width,
align = align,
hyphens = hyphen
})
--
local colorspecification = xml.css.colorspecification
local fontspecification = xml.css.fontspecification
for element, details in sortedhash(usedstyles) do
for detail, data in sortedhash(details) do
local s = fontspecification(data.style)
local c = colorspecification(data.color)
detail = gsub(detail,"[^A-Za-z0-9]+","-")
result[#result+1] = replacetemplate(styletemplate,{
namespace = usecssnamespace and cssnamespace or "",
element = element,
detail = detail,
style = s.style or "inherit",
variant = s.variant or "inherit",
weight = s.weight or "inherit",
family = s.family or "inherit",
color = c or "inherit",
display = s.display and "block" or nil,
})
end
end
return concat(result,"\n\n")
end
end
do
local imagetemplate = [[
%element%[id="%id%"], %namespace%div.%element%[id="%id%"] {
display : block ;
background-image : url('%url%') ;
background-size : 100%% auto ;
background-repeat : no-repeat ;
width : %width% ;
height : %height% ;
}]]
local f_svgname = formatters["%s.svg"]
local f_svgpage = formatters["%s-page-%s.svg"]
local collected = { }
local function usedname(name,page)
if filesuffix(name) == "pdf" then
-- temp hack .. we will have a remapper
if page and page > 1 then
name = f_svgpage(nameonly(name),page)
else
name = f_svgname(nameonly(name))
end
end
local scheme = url.hasscheme(name)
if not scheme or scheme == "file" then
-- or can we just use the name ?
return joinfile("../images",basename(url.filename(name)))
else
return name
end
end
function wrapups.allusedimages(filename)
local result = { replacetemplate(namespacetemplate, {
what = "images",
filename = filename,
namespace = contextns,
-- cssnamespaceurl = usecssnamespace and cssnamespaceurl or "",
cssnamespaceurl = cssnamespaceurl,
},false,true) }
for element, details in sortedhash(usedimages) do
for detail, data in sortedhash(details) do
local name = data.name
local page = tonumber(data.page) or 1
local spec = {
element = element,
id = data.id,
name = name,
page = page,
url = usedname(name,page),
width = data.width,
height = data.height,
used = data.used,
namespace = usecssnamespace and cssnamespace or "",
}
result[#result+1] = replacetemplate(imagetemplate,spec)
collected[detail] = spec
end
end
return concat(result,"\n\n")
end
function wrapups.uniqueusedimages() -- todo: combine these two
return collected
end
end
--
properties.vspace = { export = "break", nature = "display" }
----------------- = { export = "pagebreak", nature = "display" }
local function makebreaklist(list)
nofbreaks = nofbreaks + 1
local t = { }
local l = list and list.taglist
if l then
for i=1,#list do
t[i] = l[i]
end
end
t[#t+1] = "break>" .. nofbreaks -- maybe no number or 0
return { taglist = t }
end
local breakattributes = {
type = "collapse"
}
local function makebreaknode(attributes) -- maybe no fulltag
nofbreaks = nofbreaks + 1
return {
tg = "break",
fulltag = "break>" .. nofbreaks,
n = nofbreaks,
element = "break",
nature = "display",
attributes = attributes or nil,
-- data = { }, -- not needed
-- attribute = 0, -- not needed
-- parnumber = 0,
}
end
do
local fields = { "title", "subtitle", "author", "keywords", "url", "version" }
local ignoredelements = false
local function checkdocument(root)
local data = root.data
if data then
for i=1,#data do
local di = data[i]
local tg = di.tg
if tg == "noexport" then
local s = specifications[di.fulltag]
local u = s and s.userdata
if u then
local comment = u.comment
if comment then
di.element = "comment"
di.data = { { content = comment } }
u.comment = nil
else
data[i] = false
end
else
data[i] = false
end
elseif di.content then
-- okay
elseif tg == "ignore" then
di.element = ""
checkdocument(di)
elseif ignoredelements and ignoredelements[tg] then
di.element = ""
checkdocument(di)
else
checkdocument(di) -- new, else no noexport handling
end
end
end
end
function extras.document(di,element,n,fulltag)
setattribute(di,"language",languagenames[texgetcount("mainlanguagenumber")])
if not less_state then
setattribute(di,"file",tex.jobname)
if included.date then
setattribute(di,"date",os.fulltime())
end
setattribute(di,"context",environment.version)
setattribute(di,"version",exportversion)
setattribute(di,"xmlns:m",mathmlns)
local identity = interactions.general.getidentity()
for i=1,#fields do
local key = fields[i]
local value = identity[key]
if value and value ~= "" then
setattribute(di,key,value)
end
end
end
checkdocument(di)
end
implement {
name = "ignoretagsinexport",
arguments = "string",
actions = function(list)
for tag in string.gmatch(list,"[a-z]+") do
if ignoredelements then
ignoredelements[tag] = true
else
ignoredelements = { [tag] = true }
end
end
end,
}
end
-- flusher
do
local f_detail = formatters[' detail="%s"']
local f_chain = formatters[' chain="%s"']
local f_index = formatters[' n="%s"']
local f_spacing = formatters['%s']
local f_empty_inline = formatters["<%s/>"]
local f_empty_mixed = formatters["%w<%s/>\n"]
local f_empty_display = formatters["\n%w<%s/>\n"]
local f_empty_inline_attr = formatters["<%s%s/>"]
local f_empty_mixed_attr = formatters["%w<%s%s/>"]
local f_empty_display_attr = formatters["\n%w<%s%s/>\n"]
local f_begin_inline = formatters["<%s>"]
local f_begin_mixed = formatters["%w<%s>"]
local f_begin_display = formatters["\n%w<%s>\n"]
local f_begin_inline_attr = formatters["<%s%s>"]
local f_begin_mixed_attr = formatters["%w<%s%s>"]
local f_begin_display_attr = formatters["\n%w<%s%s>\n"]
local f_end_inline = formatters["%s>"]
local f_end_mixed = formatters["%s>\n"]
local f_end_display = formatters["%w%s>\n"]
local f_begin_inline_comment = formatters["<%s>"]
local f_begin_mixed_comment = formatters["%w<%s>"]
local f_begin_display_comment = formatters["\n%w\n%w<%s>\n"]
local f_begin_inline_attr_comment = formatters["<%s%s>"]
local f_begin_mixed_attr_comment = formatters["%w<%s%s>"]
local f_begin_display_attr_comment = formatters["\n%w\n%w<%s%s>\n"]
local f_comment_begin_inline = formatters[""]
local f_comment_begin_mixed = formatters["%w"]
local f_comment_begin_display = formatters["\n%w\n"]
local f_comment_end_inline = formatters[""]
local f_comment_end_mixed = formatters["\n"]
local f_comment_end_display = formatters["%w\n"]
local f_metadata_begin = formatters["\n%w\n"]
local f_metadata = formatters["%w%s\n"]
local f_metadata_end = formatters["%w\n"]
local function attributes(a)
local r = { }
local n = 0
for k, v in next, a do
n = n + 1
r[n] = f_attribute(k,tostring(v)) -- tostring because of %q
end
sort(r)
return concat(r,"")
end
local function properties(a)
local r = { }
local n = 0
for k, v in next, a do
n = n + 1
r[n] = f_property(exportproperties,k,tostring(v)) -- tostring because of %q
end
sort(r)
return concat(r,"")
end
local depth = 0
local inline = 0
local function emptytag(result,element,nature,di) -- currently only break but at some point
local a = di.attributes -- we might add detail etc
if a then -- happens seldom
if nature == "display" then
result[#result+1] = f_empty_display_attr(depth,namespaced[element],attributes(a))
elseif nature == "mixed" then
result[#result+1] = f_empty_mixed_attr(depth,namespaced[element],attributes(a))
else
result[#result+1] = f_empty_inline_attr(namespaced[element],attributes(a))
end
else
if nature == "display" then
result[#result+1] = f_empty_display(depth,namespaced[element])
elseif nature == "mixed" then
result[#result+1] = f_empty_mixed(depth,namespaced[element])
else
result[#result+1] = f_empty_inline(namespaced[element])
end
end
end
-- local function stripspaces(di)
-- local d = di.data
-- local n = #d
-- local m = 0
-- for i=1,n do
-- local di = d[i]
-- if di.tg then
-- m = m + 1
-- d[m] = di
-- end
-- end
-- for i=n,m+1,-1 do
-- d[i] = nil
-- end
-- end
--
-- -- simpler:
local function stripspaces(di)
local d = di.data
for i=1,#d do
local di = d[i]
if not di.tg then
di.content = ""
end
end
end
local function begintag(result,element,nature,di,skip)
local index = di.n
local fulltag = di.fulltag
local specification = specifications[fulltag] or { } -- we can have a dummy
local comment = di.comment
local detail = specification.detail
if skip == "comment" then
if show_comment then
if nature == "inline" or inline > 0 then
result[#result+1] = f_comment_begin_inline(namespaced[element])
inline = inline + 1
elseif nature == "mixed" then
result[#result+1] = f_comment_begin_mixed(depth,namespaced[element])
depth = depth + 1
inline = 1
else
result[#result+1] = f_comment_begin_display(depth,namespaced[element])
depth = depth + 1
end
end
elseif skip then
-- ignore
else
local n = 0
local r = { } -- delay this
if detail then
detail = gsub(detail,"[^A-Za-z0-9]+","-")
specification.detail = detail -- we use it later in for the div
n = n + 1
r[n] = f_detail(detail)
end
local parents = specification.parents
if parents then
parents = gsub(parents,"[^A-Za-z0-9 ]+","-")
specification.parents = parents -- we use it later in for the div
n = n + 1
r[n] = f_chain(parents)
end
if indexing and index then
n = n + 1
r[n] = f_index(index)
end
--
local extra = extras[element]
if extra then
extra(di,element,index,fulltag)
end
--
if di.record then
stripspaces(di)
end
--
if exportproperties then
local p = specification.userdata
if not p then
-- skip
elseif exportproperties == v_yes then
n = n + 1
r[n] = attributes(p)
else
n = n + 1
r[n] = properties(p)
end
end
local a = di.attributes
if a then
if trace_spacing then
a.p = di.parnumber or 0
end
n = n + 1
r[n] = attributes(a)
elseif trace_spacing then
n = n + 1
r[n] = attributes { p = di.parnumber or 0 }
end
if n == 0 then
if nature == "inline" or inline > 0 then
if show_comment and comment then
result[#result+1] = f_begin_inline_comment(comment,namespaced[element])
else
result[#result+1] = f_begin_inline(namespaced[element])
end
inline = inline + 1
elseif nature == "mixed" then
if show_comment and comment then
result[#result+1] = f_begin_mixed_comment(depth,comment,namespaced[element])
else
result[#result+1] = f_begin_mixed(depth,namespaced[element])
end
depth = depth + 1
inline = 1
else
if show_comment and comment then
result[#result+1] = f_begin_display_comment(depth,comment,depth,namespaced[element])
else
result[#result+1] = f_begin_display(depth,namespaced[element])
end
depth = depth + 1
end
else
r = concat(r,"",1,n)
if nature == "inline" or inline > 0 then
if show_comment and comment then
result[#result+1] = f_begin_inline_attr_comment(comment,namespaced[element],r)
else
result[#result+1] = f_begin_inline_attr(namespaced[element],r)
end
inline = inline + 1
elseif nature == "mixed" then
if show_comment and comment then
result[#result+1] = f_begin_mixed_attr_comment(depth,comment,namespaced[element],r)
else
result[#result+1] = f_begin_mixed_attr(depth,namespaced[element],r)
end
depth = depth + 1
inline = 1
else
if show_comment and comment then
result[#result+1] = f_begin_display_attr_comment(depth,comment,depth,namespaced[element],r)
else
result[#result+1] = f_begin_display_attr(depth,namespaced[element],r)
end
depth = depth + 1
end
end
end
used[element][detail or ""] = { nature, specification.parents } -- for template css
-- also in last else ?
local metadata = specification.metadata
if metadata and next(metadata) then
result[#result+1] = f_metadata_begin(depth)
for k, v in sortedhash(metadata) do
if v ~= "" then
result[#result+1] = f_metadata(depth+1,k,lpegmatch(p_entity,v))
end
end
result[#result+1] = f_metadata_end(depth)
end
end
local function endtag(result,element,nature,di,skip)
if skip == "comment" then
if show_comment then
if nature == "display" and (inline == 0 or inline == 1) then
depth = depth - 1
result[#result+1] = f_comment_end_display(depth,namespaced[element])
inline = 0
elseif nature == "mixed" and (inline == 0 or inline == 1) then
depth = depth - 1
result[#result+1] = f_comment_end_mixed(namespaced[element])
inline = 0
else
inline = inline - 1
result[#result+1] = f_comment_end_inline(namespaced[element])
end
end
elseif skip then
-- ignore
else
if nature == "display" and (inline == 0 or inline == 1) then
depth = depth - 1
result[#result+1] = f_end_display(depth,namespaced[element])
inline = 0
elseif nature == "mixed" and (inline == 0 or inline == 1) then
depth = depth - 1
result[#result+1] = f_end_mixed(namespaced[element])
inline = 0
else
inline = inline - 1
result[#result+1] = f_end_inline(namespaced[element])
end
end
end
local function flushtree(result,data,nature)
local nofdata = #data
for i=1,nofdata do
local di = data[i]
if not di then -- hm, di can be string
-- whatever
else
local content = di.content
-- also optimize for content == "" : trace that first
if content then
-- already has breaks
local content = lpegmatch(p_entity,content)
if i == nofdata and sub(content,-1) == "\n" then -- move check
-- can be an end of line in par but can also be the last line
if trace_spacing then
result[#result+1] = f_spacing(di.parnumber or 0,sub(content,1,-2))
else
result[#result+1] = sub(content,1,-2)
end
result[#result+1] = " "
else
if trace_spacing then
result[#result+1] = f_spacing(di.parnumber or 0,content)
else
result[#result+1] = content
end
end
elseif not di.collapsed then -- ignore collapsed data (is appended, reconstructed par)
local element = di.element
if not element then
-- skip
elseif element == "break" then -- or element == "pagebreak" -- todo: use empty flag
emptytag(result,element,nature,di)
elseif element == "mspace" then -- todo: use empty flag
emptytag(result,element,nature,di)
elseif element == "" or di.skip == "ignore" then
-- skip
else
if di.before then
flushtree(result,di.before,nature)
end
local natu = di.nature
local skip = di.skip
if di.breaknode then
emptytag(result,"break","display",di)
end
begintag(result,element,natu,di,skip)
flushtree(result,di.data,natu)
endtag(result,element,natu,di,skip)
if di.after then
flushtree(result,di.after,nature)
end
end
else
-- local element = di.element
-- if element == "mspace" then -- todo: use empty flag
-- emptytag(result,element,nature,di)
-- end
end
end
end
end
local function breaktree(tree,parent,parentelement) -- also removes double breaks
local data = tree.data
if data then
local nofdata = #data
local prevelement
local prevnature
local prevparnumber
local newdata = { }
local nofnewdata = 0
for i=1,nofdata do
local di = data[i]
if not di then
-- skip
elseif di.skip == "ignore" then
-- skip (new)
elseif di.tg == "ignore" then
-- skip (new)
elseif di.content then
if di.samepar then
prevparnumber = false
else
local parnumber = di.parnumber
if prevnature == "inline" and prevparnumber and prevparnumber ~= parnumber then
nofnewdata = nofnewdata + 1
if trace_spacing then
newdata[nofnewdata] = makebreaknode { type = "a", p = prevparnumber, n = parnumber }
else
newdata[nofnewdata] = makebreaknode()
end
end
prevelement = nil
prevparnumber = parnumber
end
prevnature = "inline"
nofnewdata = nofnewdata + 1
newdata[nofnewdata] = di
elseif not di.collapsed then
local element = di.element
if element == "break" then -- or element == "pagebreak"
if prevelement == "break" then
di.element = ""
end
prevelement = element
prevnature = "display"
nofnewdata = nofnewdata + 1
newdata[nofnewdata] = di
elseif element == "" or di.skip == "ignore" then
-- skip
else
if di.samepar then
prevnature = "inline"
prevparnumber = false
else
local nature = di.nature
local parnumber = di.parnumber
if prevnature == "inline" and nature == "inline" and prevparnumber and prevparnumber ~= parnumber then
nofnewdata = nofnewdata + 1
if trace_spacing then
newdata[nofnewdata] = makebreaknode { type = "b", p = prevparnumber, n = parnumber }
else
newdata[nofnewdata] = makebreaknode()
end
end
prevnature = nature
prevparnumber = parnumber
end
prevelement = element
breaktree(di,tree,element)
nofnewdata = nofnewdata + 1
newdata[nofnewdata] = di
end
else
if di.samepar then
prevnature = "inline"
prevparnumber = false
else
local nature = di.nature
local parnumber = di.parnumber
if prevnature == "inline" and nature == "inline" and prevparnumber and prevparnumber ~= parnumber then
nofnewdata = nofnewdata + 1
if trace_spacing then
newdata[nofnewdata] = makebreaknode { type = "c", p = prevparnumber, n = parnumber }
else
newdata[nofnewdata] = makebreaknode()
end
end
prevnature = nature
prevparnumber = parnumber
end
nofnewdata = nofnewdata + 1
newdata[nofnewdata] = di
end
end
tree.data = newdata
end
end
-- also tabulaterow reconstruction .. maybe better as a checker
-- i.e cell attribute
local function showtree(data,when,where)
if data then
for i=1,#data do
local d = data[i]
if type(d) == "table" and d.element then
print(when,where,i,d.element,d.parnumber or 0)
end
end
end
end
local function collapsetree(tree)
-- showtree(data,"before","collapse")
-- for tag, trees in sortedhash(treehash) do
for tag, trees in next, treehash do
local d = trees[1].data
if d then
local nd = #d
if nd > 0 then
for i=2,#trees do
local currenttree = trees[i]
local currentdata = currenttree.data
local currentpar = currenttree.parnumber
local previouspar = trees[i-1].parnumber
currenttree.collapsed = true
-- is the next ok?
if previouspar == 0 or not (di and di.content) then
previouspar = nil -- no need anyway so no further testing needed
end
for j=1,#currentdata do
local cd = currentdata[j]
if not cd or cd == "" then
-- skip
elseif cd.skip == "ignore" then
-- skip
elseif cd.content then
if not currentpar then
-- add space ?
elseif not previouspar then
-- add space ?
elseif currentpar ~= previouspar then
nd = nd + 1
if trace_spacing then
d[nd] = makebreaknode { type = "d", p = previouspar, n = currentpar }
else
d[nd] = makebreaknode()
end
end
previouspar = currentpar
nd = nd + 1
d[nd] = cd
else
nd = nd + 1
d[nd] = cd
end
currentdata[j] = false
end
end
end
end
end
-- showtree(data,"after","collapse")
end
local function finalizetree(tree)
-- showtree(data,"before","finalize")
for _, finalizer in next, finalizers do
finalizer(tree)
end
-- showtree(data,"after","finalize")
end
local function indextree(tree)
local data = tree.data
if data then
-- showtree(data,"before","index")
local n, new = 0, { }
for i=1,#data do
local d = data[i]
if not d then
-- skip
elseif d.content then
n = n + 1
new[n] = d
elseif not d.collapsed then
n = n + 1
d.__i__ = n
d.__p__ = tree
indextree(d)
new[n] = d
end
end
tree.data = new
-- showtree(new,"after","index")
end
end
local function checktree(tree)
local data = tree.data
if data then
-- showtree(data,"before","check")
for i=1,#data do
local d = data[i]
if type(d) == "table" then
local tg = d.tg
if tg then
local check = checks[tg]
if check then
check(d,data,i)
end
end
checktree(d) -- so parts can pass twice
end
end
-- showtree(data,"after","check")
end
end
local function fixtree(tree)
local data = tree.data
if data then
-- showtree(data,"before","fix")
for i=1,#data do
local d = data[i]
if type(d) == "table" then
local tg = d.tg
if tg then
local fix = fixes[tg]
if fix then
fix(d,data,i)
end
end
fixtree(d) -- so parts can pass twice
end
end
-- showtree(data,"after","fix")
end
end
wrapups.flushtree = flushtree
wrapups.breaktree = breaktree
wrapups.collapsetree = collapsetree
wrapups.finalizetree = finalizetree
wrapups.indextree = indextree
wrapups.checktree = checktree
wrapups.fixtree = fixtree
end
-- collector code
local function push(fulltag,depth)
local tg, n, detail, element, nature, record
local specification = specifications[fulltag]
if specification then
tg = specification.tagname
n = specification.tagindex
detail = specification.detail
else
-- a break (more efficient if we don't store those in specifications)
tg, n = lpegmatch(tagsplitter,fulltag)
n = tonumber(n) -- to tonumber in tagsplitter
end
local p = properties[tg]
if p then
element = p.export or tg
nature = p.nature or "inline" -- defaultnature
record = p.record
end
local treedata = tree.data
local t = { -- maybe we can use the tag table
tg = tg,
fulltag = fulltag,
detail = detail,
n = n, -- already a number
element = element,
nature = nature,
data = { },
attribute = currentattribute,
parnumber = currentparagraph,
record = record, -- we can consider storing properties
}
treedata[#treedata+1] = t
currentdepth = currentdepth + 1
nesting[currentdepth] = fulltag
treestack[currentdepth] = tree
if trace_export then
if detail and detail ~= "" then
report_export("%w<%s trigger=%q n=%q paragraph=%q index=%q detail=%q>",currentdepth-1,tg,n,currentattribute or 0,currentparagraph or 0,#treedata,detail)
else
report_export("%w<%s trigger=%q n=%q paragraph=%q index=%q>",currentdepth-1,tg,n,currentattribute or 0,currentparagraph or 0,#treedata)
end
end
tree = t
if tg == "break" then
-- no need for this
else
local h = treehash[fulltag]
if h then
h[#h+1] = t
else
treehash[fulltag] = { t }
end
end
end
local function pop()
if currentdepth > 0 then
local top = nesting[currentdepth]
tree = treestack[currentdepth]
currentdepth = currentdepth - 1
if trace_export then
if top then
report_export("%w%s>",currentdepth,match(top,"[^>]+"))
else
report_export("")
end
end
else
report_export("%w",currentdepth)
end
end
local function continueexport()
if nofcurrentcontent > 0 then
if trace_export then
report_export("%w",currentdepth)
end
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = " " -- pagebreak
end
end
local function pushentry(current)
if not current then
-- bad news
return
end
current = current.taglist
if not current then
-- even worse news
return
end
if restart then
continueexport()
restart = false
end
local newdepth = #current
local olddepth = currentdepth
if trace_export then
report_export("%w",currentdepth,olddepth,newdepth,current[newdepth])
end
if olddepth <= 0 then
for i=1,newdepth do
push(current[i],i)
end
else
local difference
if olddepth < newdepth then
for i=1,olddepth do
if current[i] ~= nesting[i] then
difference = i
break
end
end
else
for i=1,newdepth do
if current[i] ~= nesting[i] then
difference = i
break
end
end
end
if difference then
for i=olddepth,difference,-1 do
pop()
end
for i=difference,newdepth do
push(current[i],i)
end
elseif newdepth > olddepth then
for i=olddepth+1,newdepth do
push(current[i],i)
end
elseif newdepth < olddepth then
for i=olddepth,newdepth,-1 do
pop()
end
elseif trace_export then
report_export("%w",currentdepth,newdepth,nesting[newdepth] or "?")
end
end
return olddepth, newdepth
end
local function pushcontent(oldparagraph,newparagraph)
if nofcurrentcontent > 0 then
if oldparagraph then
if currentcontent[nofcurrentcontent] == "\n" then
if trace_export then
report_export("%w",currentdepth)
end
nofcurrentcontent = nofcurrentcontent - 1
end
end
local content = concat(currentcontent,"",1,nofcurrentcontent)
if content == "" then
-- omit; when oldparagraph we could push, remove spaces, pop
elseif somespace[content] and oldparagraph then
-- omit; when oldparagraph we could push, remove spaces, pop
else
local olddepth, newdepth
local list = taglist[currentattribute]
if list then
olddepth, newdepth = pushentry(list)
end
if tree then
local td = tree.data
local nd = #td
td[nd+1] = { parnumber = oldparagraph or currentparagraph, content = content }
if trace_export then
report_export("%w",currentdepth,utflen(content))
report_export("%w%s",currentdepth,(gsub(content,"\n","\\n")))
report_export("%w",currentdepth)
end
if olddepth then
for i=newdepth-1,olddepth,-1 do
pop()
end
end
end
end
nofcurrentcontent = 0
end
if oldparagraph then
pushentry(makebreaklist(currentnesting))
if trace_export then
report_export("%w",currentdepth,oldparagraph,newparagraph)
end
end
end
local function finishexport()
if trace_export then
report_export("%w",currentdepth)
end
if nofcurrentcontent > 0 then
if somespace[currentcontent[nofcurrentcontent]] then
if trace_export then
report_export("%w",currentdepth)
end
nofcurrentcontent = nofcurrentcontent - 1
end
pushcontent()
end
for i=currentdepth,1,-1 do
pop()
end
currentcontent = { } -- we're nice and do a cleanup
if trace_export then
report_export("%w",currentdepth)
end
end
-- inserts ?
local collectresults do -- too many locals otherwise
local nodecodes = nodes.nodecodes
local gluecodes = nodes.gluecodes
local listcodes = nodes.listcodes
local whatsitcodes = nodes.whatsitcodes
local subtypes = nodes.subtypes
local hlist_code = nodecodes.hlist
local vlist_code = nodecodes.vlist
local glyph_code = nodecodes.glyph
local glue_code = nodecodes.glue
local kern_code = nodecodes.kern
local disc_code = nodecodes.disc
local whatsit_code = nodecodes.whatsit
local par_code = nodecodes.par
local userskip_code = gluecodes.userskip
local rightskip_code = gluecodes.rightskip
local parfillskip_code = gluecodes.parfillskip
local spaceskip_code = gluecodes.spaceskip
local xspaceskip_code = gluecodes.xspaceskip
local intermathskip_code = gluecodes.intermathskip
local linelist_code = listcodes.line
local userdefinedwhatsit_code = whatsitcodes.userdefined
local privateattribute = attributes.private
local a_image = privateattribute('image')
local a_reference = privateattribute('reference')
local a_destination = privateattribute('destination')
local a_characters = privateattribute('characters')
local a_exportstatus = privateattribute('exportstatus')
local a_tagged = privateattribute('tagged')
local a_taggedpar = privateattribute("taggedpar")
local a_textblock = privateattribute("textblock")
local inline_mark = nodes.pool.userids["margins.inline"]
local nuts = nodes.nuts
local getnext = nuts.getnext
local getdisc = nuts.getdisc
local getlist = nuts.getlist
local getid = nuts.getid
local getattr = nuts.getattr
local setattr = nuts.setattr -- maybe use properties
local isglyph = nuts.isglyph
local getkern = nuts.getkern
local getwidth = nuts.getwidth
local startofpar = nuts.startofpar
local nexthlist = nuts.traversers.hlist
local nextnode = nuts.traversers.node
local function addtomaybe(maybewrong,c,case)
if trace_export then
report_export("%w",currentdepth,c,case)
else
local s = formatters["%C"](c)
if maybewrong then
maybewrong[#maybewrong+1] = s
else
maybewrong = { s }
end
return maybewrong
end
end
local function showmaybe(maybewrong)
if not trace_export then
report_export("fuzzy paragraph: % t",maybewrong)
end
end
local function showdetail(n,id,subtype)
local a = getattr(n,a_tagged)
local t = taglist[a]
local c = nodecodes[id]
local s = subtypes[id][subtype]
if a and t then
report_export("node %a, subtype %a, tag %a, element %a, tree '% t'",c,s,a,t.tagname,t.taglist)
else
report_export("node %a, subtype %a, untagged",c,s)
end
end
local function collectresults(head,list,pat,pap) -- is last used (we also have currentattribute)
local p
local paragraph
local maybewrong
local pid
for n, id, subtype in nextnode, head do
if trace_details then
showdetail(n,id,subtype)
end
if id == glyph_code then
local c, f = isglyph(n)
local at = getattr(n,a_tagged) or pat
if not at then
-- we need to tag the pagebody stuff as being valid skippable
--
-- report_export("skipping character: %C (no attribute)",n.char)
else
if last ~= at then
local tl = taglist[at]
local ap = getattr(n,a_taggedpar) or pap
if paragraph and (not ap or ap < paragraph) then
maybewrong = addtomaybe(maybewrong,c,1)
end
pushcontent()
currentnesting = tl
currentparagraph = ap
currentattribute = at
last = at
pushentry(currentnesting)
if trace_export then
report_export("%w",currentdepth,c,at)
end
-- We need to intercept this here; maybe I will also move this
-- to a regular setter at the tex end.
local r = getattr(n,a_reference)
if r then
local t = tl.taglist
referencehash[t[#t]] = r -- fulltag
end
local d = getattr(n,a_destination)
if d then
local t = tl.taglist
destinationhash[t[#t]] = d -- fulltag
end
--
elseif last then
-- we can consider tagging the pars (lines) in the parbuilder but then we loose some
-- information unless we inject a special node (but even then we can run into nesting
-- issues)
local ap = getattr(n,a_taggedpar) or pap
if ap ~= currentparagraph then
pushcontent(currentparagraph,ap)
pushentry(currentnesting)
currentattribute = last
currentparagraph = ap
end
if paragraph and (not ap or ap < paragraph) then
maybewrong = addtomaybe(maybewrong,c,2)
end
if trace_export then
report_export("%w",currentdepth,c,last)
end
else
if trace_export then
report_export("%w",currentdepth,c,at)
end
end
local s = getattr(n,a_exportstatus)
if s then
c = s
end
if c == 0 then
if trace_export then
report_export("%w",currentdepth)
end
elseif c == 0x20 then
local a = getattr(n,a_characters)
nofcurrentcontent = nofcurrentcontent + 1
if a then
if trace_export then
report_export("%w",currentdepth,a)
end
currentcontent[nofcurrentcontent] = specialspaces[a] -- special space
else
currentcontent[nofcurrentcontent] = " "
end
else
local fc = fontchar[f]
if fc then
fc = fc and fc[c]
if fc then
local u = fc.unicode
if not u then
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = utfchar(c)
elseif type(u) == "table" then
for i=1,#u do
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = utfchar(u[i])
end
else
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = utfchar(u)
end
elseif c > 0 then
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = utfchar(c)
else
-- we can have -1 as side effect of an explicit hyphen (unless we expand)
end
elseif c > 0 then
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = utfchar(c)
else
-- we can have -1 as side effect of an explicit hyphen (unless we expand)
end
end
end
elseif id == glue_code then
-- we need to distinguish between hskips and vskips
local ca = getattr(n,a_characters)
if ca == 0 then
-- skip this one ... already converted special character (node-acc)
elseif ca then
local a = getattr(n,a_tagged) or pat
if a then
local c = specialspaces[ca]
if last ~= a then
local tl = taglist[a]
if trace_export then
report_export("%w",currentdepth,ca,a)
end
pushcontent()
currentnesting = tl
currentparagraph = getattr(n,a_taggedpar) or pap
currentattribute = a
last = a
pushentry(currentnesting)
-- no reference check (see above)
elseif last then
local ap = getattr(n,a_taggedpar) or pap
if ap ~= currentparagraph then
pushcontent(currentparagraph,ap)
pushentry(currentnesting)
currentattribute = last
currentparagraph = ap
end
if trace_export then
report_export("%w",currentdepth,ca,last)
end
end
-- if somespace[currentcontent[nofcurrentcontent]] then
-- if trace_export then
-- report_export("%w",currentdepth)
-- end
-- nofcurrentcontent = nofcurrentcontent - 1
-- end
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = c
end
elseif subtype == userskip_code then
-- local at = getattr(n,a_tagged)
-- local tl = taglist[at]
-- if tl and structurestags.strip(tl.taglist[#tl.taglist]) == "mspace" then
-- if nofcurrentcontent > 0 then
-- pushcontent()
-- pushentry(currentnesting) -- ??
-- end
-- -- in the past we'd push a space here ... check mkiv : otherwise no threshold with mspace
-- pushentry(tl)
-- if trace_export then
-- report_export("%w",currentdepth)
end
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = " "
elseif a then
-- e.g LOGOLOGO
if trace_export then
report_export("%w",currentdepth,last,a)
end
pushcontent()
if trace_export then
report_export("%w",currentdepth)
end
last = a
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = " "
currentnesting = taglist[last]
pushentry(currentnesting)
currentattribute = last
end
end
end
-- end
elseif subtype == spaceskip_code or subtype == xspaceskip_code then
if not somespace[currentcontent[nofcurrentcontent]] then
local a = getattr(n,a_tagged) or pat
if a == last then
if trace_export then
report_export("%w",currentdepth)
end
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = " "
else
if trace_export then
report_export("%w",currentdepth)
end
last = a
pushcontent()
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = " "
currentnesting = taglist[last]
pushentry(currentnesting)
currentattribute = last
end
end
elseif subtype == intermathskip_code then
-- put this as attribute when it differs, maybe more ... check mathml
elseif subtype == rightskip_code then
-- a line
if nofcurrentcontent > 0 then
local r = currentcontent[nofcurrentcontent]
if r == hyphen then
if not keephyphens then
nofcurrentcontent = nofcurrentcontent - 1
end
elseif pid == disc_code then
-- go on .. tricky: we should mark the glyhs as coming from a disc
elseif not somespace[r] then
local a = getattr(n,a_tagged) or pat
if a == last then
if trace_export then
report_export("%w",currentdepth)
end
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = " "
else
if trace_export then
report_export("%w",currentdepth)
end
last = a
pushcontent()
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = " "
currentnesting = taglist[last]
pushentry(currentnesting)
currentattribute = last
end
end
end
elseif subtype == parfillskip_code then
-- deal with paragraph endings (crossings) elsewhere and we quit here
-- as we don't want the rightskip space addition
if maybewrong then
showmaybe(maybewrong)
end
return
end
elseif id == hlist_code or id == vlist_code then
local ai = getattr(n,a_image)
if ai then
local at = getattr(n,a_tagged) or pat
if nofcurrentcontent > 0 then
pushcontent()
pushentry(currentnesting) -- ??
end
pushentry(taglist[at]) -- has an index, todo: flag empty element
if trace_export then
report_export("%w",currentdepth,kern)
end
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = " "
end
elseif a then
-- e.g LOGOLOGO
if trace_export then
report_export("%w",currentdepth,limit,last,a)
end
last = a
pushcontent()
if trace_export then
report_export("%w",currentdepth,kern)
end
nofcurrentcontent = nofcurrentcontent + 1
currentcontent[nofcurrentcontent] = " "
-- currentnesting = taglist[last]
currentnesting = t
pushentry(currentnesting)
currentattribute = last
end
end
end
end
end
elseif id == whatsit_code then
-- todo (lmtx)
if subtype == userdefinedwhatsit_code then
-- similar to images, see above
local at = getattr(n,a_tagged)
if nofcurrentcontent > 0 then
pushcontent()
pushentry(currentnesting) -- ??
end
pushentry(taglist[at])
if trace_export then
report_export("%w",currentdepth)
end
-- continueexport()
restart = true
collectresults(head)
if trace_export then
report_export("%w",currentdepth)
end
stoptiming(treehash)
return head
end
function nodes.handlers.checkparcounter(p)
setattr(p,a_taggedpar,texgetcount("tagparcounter") + 1)
return p
end
function builders.paragraphs.tag(head)
noftextblocks = noftextblocks + 1
for n, subtype in nexthlist, head do
if subtype == linelist_code then
setattr(n,a_textblock,noftextblocks)
elseif subtype == glue_code or subtype == kern_code then -- no need to set fontkerns
setattr(n,a_textblock,0)
end
end
return false
end
end
do
local xmlcollected = xml.collected
local xmlsetcomment = xml.setcomment
local xmlpreamble_nop = [[
]]
local xmlpreamble_yes = [[
]]
local flushtree = wrapups.flushtree
local function wholepreamble(standalone,nocomment)
return replacetemplate(nocomment and xmlpreamble_nop or xmlpreamble_yes, {
standalone = standalone and "yes" or "no",
filename = tex.jobname,
date = included.date and os.fulltime(),
contextversion = environment.version,
exportversion = exportversion,
})
end
local csspreamble = [[
]]
local cssheadlink = [[
]]
local function allusedstylesheets(cssfiles,files,path)
local done = { }
local result = { }
local extras = { }
for i=1,#cssfiles do
local cssfile = cssfiles[i]
if type(cssfile) ~= "string" then
-- error
elseif cssfile == "export-example.css" then
-- ignore
elseif not done[cssfile] then
cssfile = joinfile(path,basename(cssfile))
report_export("adding css reference '%s'",cssfile)
files[#files+1] = cssfile
result[#result+1] = replacetemplate(csspreamble, { filename = cssfile })
extras[#extras+1] = replacetemplate(cssheadlink, { filename = cssfile })
done[cssfile] = true
end
end
return concat(result), concat(extras)
end
local elementtemplate = [[
/* element="%element%" detail="%detail%" chain="%chain%" */
%element%,
%namespace%div.%element% {
display: %display% ;
}]]
local detailtemplate = [[
/* element="%element%" detail="%detail%" chain="%chain%" */
%element%[detail=%detail%],
%namespace%div.%element%.%detail% {
display: %display% ;
}]]
--
local htmltemplate = [[
%preamble%
%title%
%style%
Rendering can be suboptimal because there is no default/fallback css loaded.
%body%
]]
local displaymapping = {
inline = "inline",
display = "block",
mixed = "inline",
}
local function allusedelements(filename)
local result = { replacetemplate(namespacetemplate, {
what = "template",
filename = filename,
namespace = contextns,
-- cssnamespaceurl = usecssnamespace and cssnamespaceurl or "",
cssnamespaceurl = cssnamespaceurl,
},false,true) }
for element, details in sortedhash(used) do
if namespaces[element] then
-- skip math
else
for detail, what in sortedhash(details) do
local nature = what[1] or "display"
local chain = what[2]
local display = displaymapping[nature] or "block"
if detail == "" then
result[#result+1] = replacetemplate(elementtemplate, {
element = element,
display = display,
chain = chain,
namespace = usecssnamespace and namespace or "",
})
else
result[#result+1] = replacetemplate(detailtemplate, {
element = element,
display = display,
detail = detail,
chain = chain,
namespace = usecssnamespace and cssnamespace or "",
})
end
end
end
end
return concat(result,"\n\n")
end
local function allcontent(tree)
local result = { }
local data = tree.data
for i=1,#data do
if data[i].tg ~= "document" then
data[i] = { }
end
end
flushtree(result,tree.data,"display") -- we need to collect images
result = concat(result)
-- no need to lpeg .. fast enough
result = gsub(result,"\n *\n","\n")
result = gsub(result,"\n +([^< ])","\n%1")
--
return result
end
-- local xhtmlpreamble = [[
--
-- ]]
local function cleanxhtmltree(xmltree)
if xmltree then
local implicits = { }
local explicits = { }
local overloads = { }
for e in xmlcollected(xmltree,"*") do
local at = e.at
if at then
local explicit = at.explicit
local implicit = at.implicit
if explicit then
if not explicits[explicit] then
explicits[explicit] = true
at.id = explicit
if implicit then
overloads[implicit] = explicit
end
end
else
if implicit and not implicits[implicit] then
implicits[implicit] = true
at.id = "aut:" .. implicit
end
end
end
end
for e in xmlcollected(xmltree,"*") do
local at = e.at
if at then
local internal = at.internal
local location = at.location
if internal then
if location then
local explicit = overloads[location]
if explicit then
at.href = "#" .. explicit
else
at.href = "#aut:" .. internal
end
else
at.href = "#aut:" .. internal
end
else
if location then
at.href = "#" .. location
else
local url = at.url
if url then
at.href = url
else
local file = at.file
if file then
at.href = file
end
end
end
end
end
end
return xmltree
else
return xml.convert('\ninvalid xhtml tree')
end
end
-- maybe the reverse: be explicit about what is permitted
local private = {
destination = true,
prefix = true,
reference = true,
--
id = true,
href = true,
--
implicit = true,
explicit = true,
--
url = true,
file = true,
internal = true,
location = true,
--
name = true, -- image name
used = true, -- image name
page = true, -- image name
width = true,
height = true,
--
}
local addclicks = true
local f_onclick = formatters[ [[location.href='%s']] ]
local f_onclick = formatters[ [[location.href='%s']] ]
local p_cleanid = lpeg.replacer { [":"] = "-" }
local p_cleanhref = lpeg.Cs(lpeg.P("#") * p_cleanid)
local p_splitter = lpeg.Ct ( (
lpeg.Carg(1) * lpeg.C((1-lpeg.P(" "))^1) / function(d,s) if not d[s] then d[s] = true return s end end
* lpeg.P(" ")^0 )^1 )
local classes = table.setmetatableindex(function(t,k)
local v = concat(lpegmatch(p_splitter,k,1,{})," ")
t[k] = v
return v
end)
local function makeclass(tg,at)
local detail = at.detail
local chain = at.chain
local extra = nil
local classes = { }
local nofclasses = 0
at.detail = nil
at.chain = nil
for k, v in next, at do
if not private[k] then
nofclasses = nofclasses + 1
classes[nofclasses] = k .. "-" .. v
end
end
if detail and detail ~= "" then
if chain and chain ~= "" then
if chain ~= detail then
extra = classes[tg .. " " .. chain .. " " .. detail]
elseif tg ~= detail then
extra = detail
end
elseif tg ~= detail then
extra = detail
end
elseif chain and chain ~= "" then
if tg ~= chain then
extra = chain
end
end
-- in this order
if nofclasses > 0 then
sort(classes)
classes = concat(classes," ")
if extra then
return tg .. " " .. extra .. " " .. classes
else
return tg .. " " .. classes
end
else
if extra then
return tg .. " " .. extra
else
return tg
end
end
end
-- Some elements are not supported (well) in css so we need to retain them. For
-- instance, tablecells have no colspan so basically that renders css table div
-- elements quite useless. A side effect is that we nwo can have conflicts when
-- we mix in with other html (as there is no reset). Of course, when it eventually
-- gets added, there is a change then that those not using the div abstraction
-- will be rediculed.
--
-- a table tr td th thead tbody tfoot
--
local crappycss = {
table = "table", tabulate = "table",
tablehead = "thead", tabulatehead = "thead",
tablebody = "tbody", tabulatebody = "tbody",
tablefoot = "tfoot", tabulatefoot = "tfoot",
tablerow = "tr", tabulaterow = "tr",
tablecell = "td", tabulatecell = "td",
}
local cssmapping = false
directives.register("export.nativetags", function(v)
cssmapping = v and crappycss or false
end)
local function remap(specification,source,target)
local comment = nil -- share comments
for c in xmlcollected(source,"*") do
if not c.special then
local tg = c.tg
local ns = c.ns
if ns == "m" then
if false then -- yes or no
c.ns = ""
c.at["xmlns:m"] = nil
end
-- elseif tg == "a" then
-- c.ns = ""
else
local dt = c.dt
local nt = #dt
if nt == 0 or (nt == 1 and dt[1] == "") then
if comment then
c.dt = comment
else
xmlsetcomment(c,"empty")
comment = c.dt
end
end
local at = c.at
local class = nil
local label = nil
if tg == "document" then
at.href = nil
at.detail = nil
at.chain = nil
elseif tg == "metavariable" then
label = at.name
at.detail = "metaname-" .. label
class = makeclass(tg,at)
else
class = makeclass(tg,at)
end
local id = at.id
local href = at.href
local attr = nil
if id then
id = lpegmatch(p_cleanid, id) or id
if href then
href = lpegmatch(p_cleanhref,href) or href
attr = {
class = class,
id = id,
href = href,
onclick = addclicks and f_onclick(href) or nil,
}
else
attr = {
class = class,
id = id,
}
end
else
if href then
href = lpegmatch(p_cleanhref,href) or href
attr = {
class = class,
href = href,
onclick = addclicks and f_onclick(href) or nil,
}
else
attr = {
class = class,
}
end
end
c.at = attr
if label then
attr.label = label
end
c.tg = cssmapping and cssmapping[tg] or "div"
end
end
end
end
-- local cssfile = nil directives.register("backend.export.css", function(v) cssfile = v end)
local embedfile = false directives.register("export.embed",function(v) embedfile = v end)
local justexport = nodes.handlers.export
local function wrapuptree(tree)
wrapups.fixtree(tree)
wrapups.collapsetree(tree)
wrapups.indextree(tree)
wrapups.checktree(tree)
wrapups.breaktree(tree)
wrapups.finalizetree(tree)
end
local function localexport(head)
starttiming(treehash)
local saved_treestack = treestack
local saved_nesting = nesting
local saved_currentdepth = currentdepth
local saved_tree = tree
local saved_treehash = treehash
local saved_nofbreaks = nofbreaks
local saved_show_comment = show_comment
treestack = { }
nesting = { }
currentdepth = 0
tree = { data = { }, fulltag == "root" } -- root
treehash = { }
nofbreaks = 0
show_comment = false
justexport(head)
finishexport()
wrapuptree(tree)
-- tree.data = tree.data[1].data
local result = concat {
wholepreamble(true,true),
allcontent(tree),
}
treestack = saved_treestack
nesting = saved_nesting
currentdepth = saved_currentdepth
tree = saved_tree
treehash = saved_treehash
nofbreaks = saved_nofbreaks
show_comment = saved_show_comment
stoptiming(treehash)
return result
end
structurestags.localexport = localexport
function structures.tags.exportbox(n,filename,buffername)
local list = nodes.nuts.getbox(n)
if n then
local e = localexport(list)
if filename and filename ~= "" then
io.savedata(filename,e)
elseif buffername then
buffers.assign(buffername == interfaces.variables.yes and "" or buffername,e)
else
return e
end
end
end
interfaces.implement {
name = "exportbox",
arguments = { "integer", "string", "string" },
actions = structures.tags.exportbox
}
function structurestags.finishexport()
if exporting then
exporting = false
else
return
end
local onlyxml = finetuning.export == v_xml
starttiming(treehash)
--
finishexport()
--
report_export("")
if onlyxml then
report_export("exporting xml, no other files")
else
report_export("exporting xml, xhtml, html and css files")
end
report_export("")
--
wrapuptree(tree)
--
local askedname = finetuning.file
--
-- we use a dedicated subpath:
--
-- ./jobname-export
-- ./jobname-export/images
-- ./jobname-export/styles
-- ./jobname-export/styles
-- ./jobname-export/jobname-export.xml
-- ./jobname-export/jobname-export.xhtml
-- ./jobname-export/jobname-export.html
-- ./jobname-export/jobname-specification.lua
-- ./jobname-export/styles/jobname-defaults.css
-- ./jobname-export/styles/jobname-styles.css
-- ./jobname-export/styles/jobname-images.css
-- ./jobname-export/styles/jobname-templates.css
if type(askedname) ~= "string" or askedname == "" then
askedname = tex.jobname
end
local usedname = nameonly(askedname)
local basepath = usedname .. "-export"
local imagepath = joinfile(basepath,"images")
local stylepath = joinfile(basepath,"styles")
local function validpath(what,pathname)
if lfs.isdir(pathname) then
report_export("using existing %s path %a",what,pathname)
return pathname
end
lfs.mkdir(pathname)
if lfs.isdir(pathname) then
report_export("using cretated %s path %a",what,basepath)
return pathname
else
report_export("unable to create %s path %a",what,basepath)
return false
end
end
if not (validpath("export",basepath) and validpath("images",imagepath) and validpath("styles",stylepath)) then
return
end
-- we're now on the dedicated export subpath so we can't clash names
--
-- a xhtml suffix no longer seems to be work well with browsers
local xmlfilebase = addsuffix(usedname .. "-raw","xml" )
local xhtmlfilebase = addsuffix(usedname .. "-tag","xhtml")
local htmlfilebase = addsuffix(usedname .. "-div","html")
local specificationfilebase = addsuffix(usedname .. "-pub","lua" )
local xmlfilename = joinfile(basepath, xmlfilebase )
local xhtmlfilename = joinfile(basepath, xhtmlfilebase )
local htmlfilename = joinfile(basepath, htmlfilebase )
local specificationfilename = joinfile(basepath, specificationfilebase)
--
local defaultfilebase = addsuffix(usedname .. "-defaults", "css")
local imagefilebase = addsuffix(usedname .. "-images", "css")
local stylefilebase = addsuffix(usedname .. "-styles", "css")
local templatefilebase = addsuffix(usedname .. "-templates","css")
--
local defaultfilename = joinfile(stylepath,defaultfilebase )
local imagefilename = joinfile(stylepath,imagefilebase )
local stylefilename = joinfile(stylepath,stylefilebase )
local templatefilename = joinfile(stylepath,templatefilebase)
local cssfile = finetuning.cssfile
-- we keep track of all used files
local files = {
}
-- we always load the defaults and optionally extra css files; we also copy the example
-- css file so that we always have the latest version
local cssfiles = {
defaultfilebase,
imagefilebase,
stylefilebase,
}
local cssextra = cssfile and table.unique(settings_to_array(cssfile)) or { }
-- at this point we're ready for the content; the collector also does some
-- housekeeping and data collecting; at this point we still have an xml
-- representation that uses verbose element names and carries information in
-- attributes
local result = allcontent(tree)
-- ugly but so be it:
local extradata = structures.tags.getextradata()
if extradata then
local t = { "" }
t[#t+1] = ""
for name, action in sortedhash(extradata) do
t[#t+1] = action()
end
t[#t+1] = ""
t[#t+1] = ""
-- we use a function because otherwise we can have a bad capture index
result = gsub(result,"",function()
return concat(t,"\n")
end)
end
-- done with ugly
if onlyxml then
os.remove(defaultfilename)
os.remove(imagefilename)
os.remove(stylefilename)
os.remove(templatefilename)
for i=1,#cssextra do
os.remove(joinfile(stylepath,basename(source)))
end
-- os.remove(xmlfilename)
os.remove(imagefilename)
os.remove(stylefilename)
os.remove(templatefilename)
os.remove(xhtmlfilename)
os.remove(specificationfilename)
os.remove(htmlfilename)
result = concat {
wholepreamble(true,true),
"\n",
result,
}
report_export("saving xml data in %a",xmlfilename)
io.savedata(xmlfilename,result)
return
end
local examplefilename = resolvers.findfile("export-example.css")
if examplefilename then
local data = io.loaddata(examplefilename)
if not data or data == "" then
data = "/* missing css file */"
elseif not usecssnamespace then
data = gsub(data,cssnamespace,"")
end
io.savedata(defaultfilename,data)
end
if cssfile then
for i=1,#cssextra do
local source = addsuffix(cssextra[i],"css")
local target = joinfile(stylepath,basename(source))
cssfiles[#cssfiles+1] = source
if not lfs.isfile(source) then
source = joinfile("../",source)
end
if lfs.isfile(source) then
report_export("copying %s",source)
file.copy(source,target)
end
end
end
local x_styles, h_styles = allusedstylesheets(cssfiles,files,"styles")
local attach = backends.nodeinjections.attachfile
if embedfile and attach then
-- only for testing
attach {
data = concat{ wholepreamble(true), result },
name = basename(xmlfilename),
registered = "export",
title = "raw xml export",
method = v_hidden,
mimetype = "application/mathml+xml",
}
end
result = concat {
wholepreamble(true),
x_styles, -- adds to files
result,
}
cssfiles = table.unique(cssfiles)
-- we're now ready for saving the result in the xml file
report_export("saving xml data in %a",xmlfilename)
io.savedata(xmlfilename,result)
report_export("saving css image definitions in %a",imagefilename)
io.savedata(imagefilename,wrapups.allusedimages(usedname))
report_export("saving css style definitions in %a",stylefilename)
io.savedata(stylefilename,wrapups.allusedstyles(usedname))
report_export("saving css template in %a",templatefilename)
io.savedata(templatefilename,allusedelements(usedname))
-- additionally we save an xhtml file; for that we load the file as xml tree
report_export("saving xhtml variant in %a",xhtmlfilename)
local xmltree = cleanxhtmltree(xml.convert(result))
-- local xmltree = xml.convert(result)
-- for c in xml.collected(xmltree,"m:mtext[lastindex()=1]/m:mrow") do
-- print(c)
-- end
-- for c in xml.collected(xmltree,"mtext/mrow") do
-- print(c)
-- end
-- local xmltree = cleanxhtmltree(xmltree)
xml.save(xmltree,xhtmlfilename)
-- now we save a specification file that can b eused for generating an epub file
-- looking at identity is somewhat redundant as we also inherit from interaction
-- at the tex end
local identity = interactions.general.getidentity()
local metadata = structures.tags.getmetadata()
local specification = {
name = usedname,
identifier = os.uuid(),
images = wrapups.uniqueusedimages(),
imagefile = joinfile("styles",imagefilebase),
imagepath = "images",
stylepath = "styles",
xmlfiles = { xmlfilebase },
xhtmlfiles = { xhtmlfilebase },
htmlfiles = { htmlfilebase },
styles = cssfiles,
htmlroot = htmlfilebase,
language = languagenames[texgetcount("mainlanguagenumber")],
title = validstring(finetuning.title) or validstring(identity.title),
subtitle = validstring(finetuning.subtitle) or validstring(identity.subtitle),
author = validstring(finetuning.author) or validstring(identity.author),
firstpage = validstring(finetuning.firstpage),
lastpage = validstring(finetuning.lastpage),
metadata = metadata,
}
report_export("saving specification in %a",specificationfilename,specificationfilename)
xml.wipe(xmltree,"metadata") -- maybe optional
io.savedata(specificationfilename,table.serialize(specification,true))
-- the html export for epub is different in the sense that it uses div's instead of
-- specific tags
report_export("saving div based alternative in %a",htmlfilename)
remap(specification,xmltree)
-- believe it or not, but a can prevent viewing in browsers
local title = specification.title
if not title or title == "" then
title = metadata.title
if not title or title == "" then
title = usedname -- was: "no title"
end
end
local variables = {
style = h_styles,
body = xml.tostring(xml.first(xmltree,"/div")),
preamble = wholepreamble(false),
title = title,
}
io.savedata(htmlfilename,replacetemplate(htmltemplate,variables,"xml"))
-- finally we report how an epub file can be made (using the specification)
report_export("")
report_export('create epub with: mtxrun --script epub --make "%s" [--purge --rename --svgmath]',usedname)
report_export("")
stoptiming(treehash)
end
local enableaction = nodes.tasks.enableaction
function structurestags.initializeexport()
if not exporting then
report_export("enabling export to xml")
enableaction("shipouts","nodes.handlers.export")
enableaction("shipouts","nodes.handlers.accessibility")
enableaction("math", "noads.handlers.tags")
enableaction("everypar","nodes.handlers.checkparcounter")
luatex.registerstopactions(structurestags.finishexport)
exporting = true
end
end
function structurestags.setupexport(t)
merge(finetuning,t)
keephyphens = finetuning.hyphen == v_yes
exportproperties = finetuning.properties
if exportproperties == v_no then
exportproperties = false
end
end
statistics.register("xml exporting time", function()
if exporting then
return string.format("%s seconds, version %s", statistics.elapsedtime(treehash),exportversion)
end
end)
end
-- These are called at the tex end:
implement {
name = "setupexport",
actions = structurestags.setupexport,
arguments = {
{
{ "align" },
{ "bodyfont", "dimen" },
{ "width", "dimen" },
{ "properties" },
{ "hyphen" },
{ "title" },
{ "subtitle" },
{ "author" },
{ "firstpage" },
{ "lastpage" },
{ "svgstyle" },
{ "cssfile" },
{ "file" },
{ "export" },
}
}
}
implement {
name = "finishexport",
actions = structurestags.finishexport,
}
implement {
name = "initializeexport",
actions = structurestags.initializeexport,
}