1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
|
-- Register this file's metadata under the key 'node-acc' in the global
-- `modules` table; the table is created first when it does not exist yet.
if not modules then modules = { } end modules ['node-acc'] = {
version = 1.001,
comment = "companion to node-ini.mkiv",
author = "Hans Hagen, PRAGMA-ADE, Hasselt NL",
copyright = "PRAGMA ADE / ConTeXt Development Team",
license = "see context related readme files"
}
local nodes, node = nodes, node
local nodecodes = nodes.nodecodes
local tasks = nodes.tasks
local nuts = nodes.nuts
local tonut = nodes.tonut
local tonode = nodes.tonode
local getid = nuts.getid
local getfield = nuts.getfield
local getattr = nuts.getattr
local getlist = nuts.getlist
local getchar = nuts.getchar
local getnext = nuts.getnext
local setfield = nuts.setfield
local setattr = nuts.setattr
local setlink = nuts.setlink
local setchar = nuts.setchar
local setsubtype = nuts.setsubtype
local getwidth = nuts.getwidth
local setwidth = nuts.setwidth
----- traverse_nodes = nuts.traverse
local traverse_id = nuts.traverse_id
----- copy_node = nuts.copy
local insert_after = nuts.insert_after
local copy_no_components = nuts.copy_no_components
local glue_code = nodecodes.glue
----- kern_code = nodecodes.kern
local glyph_code = nodecodes.glyph
local hlist_code = nodecodes.hlist
local vlist_code = nodecodes.vlist
-- Value returned for the private attribute named "characters"; it is used as
-- the attribute argument of getattr/setattr in injectspaces below.
local a_characters = attributes.private("characters")
local threshold = 65536 -- not used
-- Running count of glyphs inserted by injectspaces; reported through
-- statistics.register further down.
local nofreplaced = 0
-- todo: nbsp etc
-- todo: collapse kerns (not needed, backend does this)
-- todo: maybe cache as we now create many nodes
-- todo: check for subtype related to spacing (13/14 but most seem to be user anyway)
-- Walks the list starting at `head` (nut/direct representation, as it is
-- accessed through the nuts.* helpers) and, for every glue node that directly
-- follows a glyph node, inserts a glyph with character code 32 between them.
-- The glue is narrowed by the width of the inserted glyph so the sum of the
-- widths stays the same. Nested hlists and vlists are processed recursively.
--
-- head    : first node of the list (may be nil, in which case nothing happens)
-- returns : the unchanged head and `true` (the caller always gets "done")
--
-- Side effect: increments the file-level counter `nofreplaced` for every
-- glyph that gets inserted.
local function injectspaces(head)
    local previous = nil
    local current  = head
    while current do
        local id = getid(current)
        if id == glue_code then
            if previous and getid(previous) == glyph_code then
                -- The preceding glyph is copied (without components) so the
                -- new glyph starts out with that glyph's fields; a cheaper
                -- plain copy was considered by the original author.
                local space      = copy_no_components(previous)
                local characters = getattr(current,a_characters)
                setchar(space,32)
                setlink(previous,space,current)
                -- compensate for the width taken by the inserted glyph
                setwidth(current,getwidth(current) - getwidth(space))
                -- move the "characters" attribute value from the glue to the
                -- inserted glyph and reset it on the glue
                if characters then
                    setattr(space,a_characters,characters)
                end
                setattr(current,a_characters,0)
                nofreplaced = nofreplaced + 1
            end
        elseif id == hlist_code or id == vlist_code then
            -- the function takes a single argument; the original call passed
            -- an undefined global as a second one, which was ignored
            injectspaces(getlist(current))
        end
        previous = current
        current  = getnext(current)
    end
    return head, true -- always done anyway
end
-- Handler entry point: converts the incoming head with tonut, runs
-- injectspaces over the list, and hands back the head converted with tonode
-- together with the "done" flag that injectspaces reported.
nodes.handlers.accessibility = function(head)
    local nuthead, changed = injectspaces(tonut(head))
    return tonode(nuthead), changed
end
-- Registers a statistics callback that yields the number of inserted glyphs,
-- or nothing at all when no glyph has been inserted.
statistics.register("inserted spaces in output", function()
    if nofreplaced <= 0 then
        return
    end
    return nofreplaced
end)
-- todo:
-- local a_hyphenated = attributes.private('hyphenated')
--
-- local hyphenated, codes = { }, { }
--
-- local function compact(n)
-- local t = { }
-- for n in traverse_id(glyph_code,n) do
-- t[#t+1] = utfchar(getchar(n)) -- check for unicode
-- end
-- return concat(t,"")
-- end
--
-- local function injectspans(head)
-- local done = false
-- for n in traverse_nodes(tonuts(head)) do
-- local id = getid(n)
-- if id == disc then
-- local r = getfield(n,"replace")
-- local p = getfield(n,"pre")
-- if r and p then
-- local str = compact(r)
-- local hsh = hyphenated[str]
-- if not hsh then
-- hsh = #codes + 1
-- hyphenated[str] = hsh
-- codes[hsh] = str
-- end
-- setattr(n,a_hyphenated,hsh)
-- done = true
-- end
-- elseif id == hlist_code or id == vlist_code then
-- injectspans(getlist(n))
-- end
-- end
-- return tonodes(head), done
-- end
--
-- nodes.injectspans = injectspans
--
-- tasks.appendaction("processors", "words", "nodes.injectspans")
--
-- local pdfpageliteral = nuts.pool.pdfpageliteral
--
-- local function injectspans(head)
-- local done = false
-- for n in traverse_nodes(tonut(head)) do
-- local id = getid(n)
-- if id == disc then
-- local a = getattr(n,a_hyphenated)
-- if a then
-- local str = codes[a]
-- local b = pdfpageliteral(format("/Span << /ActualText %s >> BDC", lpdf.tosixteen(str)))
-- local e = pdfpageliteral("EMC")
-- insert_before(head,n,b)
-- insert_after(head,n,e)
-- done = true
-- end
-- elseif id == hlist_code or id == vlist_code then
-- injectspans(getlist(n))
-- end
-- end
-- return tonodes(head), done
-- end
|