• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

sile-typesetter / sile / 9490661318

12 Jun 2024 10:35PM UTC coverage: 63.543% (-5.6%) from 69.177%
9490661318

push

github

web-flow
Merge abd81ea2a into 8887271be

15 of 15 new or added lines in 3 files covered. (100.0%)

1031 existing lines in 36 files now uncovered.

10965 of 17256 relevant lines covered (63.54%)

4698.75 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

84.03
/languages/unicode.lua
1
local icu = require("justenoughicu")
80✔
2

3
local chardata = require("char-def")
80✔
4

5
-- Register the boolean setting that the node maker's
-- isActiveNonBreakingSpace check reads; it defaults to false.
SILE.settings:declare({
   parameter = "languages.fixedNbsp",
   help = "Whether to treat U+00A0 (NO-BREAK SPACE) as a fixed-width space",
   type = "boolean",
   default = false,
})
11

12
-- Base class for node makers. It accumulates input items into a pending
-- token and hands finished nodes to the consumer through coroutine.yield,
-- so its make* methods must run inside a coroutine. The character-class
-- predicates index lookup tables (breakingTypes, spaceTypes, quoteTypes,
-- wordTypes, puctuationTypes) that are not defined in this class and must
-- be supplied by whatever derives from it.
SILE.nodeMakers.base = pl.class({

   -- Start with an empty pending token and remember the caller's options.
   _init = function (self, options)
      self.options = options
      self.contents = {}
      self.token = ""
      self.lasttype = false
      self.lastnode = false
   end,

   -- Flush the pending token. Does nothing when no items were collected;
   -- otherwise yields the shaper's nnode for them and resets the buffer.
   makeToken = function (self)
      if #self.contents == 0 then
         return
      end
      coroutine.yield(SILE.shaper:formNnode(self.contents, self.token, self.options))
      SU.debug("tokenizer", "Token:", self.token)
      self.lastnode = "nnode"
      self.token = ""
      self.contents = {}
   end,

   -- Append one character (and the item it came from) to the pending token.
   addToken = function (self, char, item)
      self.token = self.token .. char
      table.insert(self.contents, item)
   end,

   -- Yield a space node, except when the previous node was already glue
   -- and typesetter.obeyspaces is off (consecutive spaces collapse).
   -- The state is marked as glue/"sp" whether or not a node was yielded.
   makeGlue = function (self, item)
      local obeyspaces = SILE.settings:get("typesetter.obeyspaces")
      if obeyspaces or self.lastnode ~= "glue" then
         SU.debug("tokenizer", "Space node")
         coroutine.yield(SILE.shaper:makeSpaceNode(self.options, item))
      end
      self.lasttype = "sp"
      self.lastnode = "glue"
   end,

   -- Yield a penalty node of value p (0 when p is nil/false), unless the
   -- previous node was a penalty or glue. lastnode becomes "penalty" in
   -- every case.
   makePenalty = function (self, p)
      local previous = self.lastnode
      if not (previous == "penalty" or previous == "glue") then
         coroutine.yield(SILE.types.node.penalty({ penalty = p or 0 }))
      end
      self.lastnode = "penalty"
   end,

   -- Yield a kern built from the shaper's measured space and record it in
   -- the state as if it were glue.
   makeNonBreakingSpace = function (self)
      -- Unicode Line Breaking Algorithm (UAX 14) specifies that U+00A0
      -- (NO-BREAK SPACE) is expanded or compressed like a normal space.
      coroutine.yield(SILE.types.node.kern(SILE.shaper:measureSpace(self.options)))
      self.lasttype = "sp"
      self.lastnode = "glue"
   end,

   -- Abstract: the base class only raises an error here.
   iterator = function (_, _)
      SU.error("Abstract function nodemaker:iterator called", true)
   end,

   -- Look up the char-def entry for the character's codepoint; a fresh
   -- empty table is returned when there is no entry, so callers can index
   -- the result unconditionally.
   charData = function (_, char)
      return chardata[SU.codepoint(char)] or {}
   end,

   -- A no-break space counts as "active" only while the
   -- languages.fixedNbsp setting is falsy.
   isActiveNonBreakingSpace = function (self, char)
      local nbsp = self:isNonBreakingSpace(char)
      return nbsp and not SILE.settings:get("languages.fixedNbsp")
   end,

   -- Truthy when the character's linebreak class is in breakingTypes.
   isBreaking = function (self, char)
      local lbclass = self:charData(char).linebreak
      return self.breakingTypes[lbclass]
   end,

   -- Truthy when the char-def entry names the character "nobreakspace".
   isNonBreakingSpace = function (self, char)
      local name = self:charData(char).contextname
      return name and name == "nobreakspace"
   end,

   -- Truthy when the character's category is in puctuationTypes.
   -- The field name is spelled exactly this way where the unicode node
   -- maker declares it, so the spelling is kept here.
   isPunctuation = function (self, char)
      local category = self:charData(char).category
      return self.puctuationTypes[category]
   end,

   -- Truthy when the character's linebreak class is in spaceTypes.
   isSpace = function (self, char)
      local lbclass = self:charData(char).linebreak
      return self.spaceTypes[lbclass]
   end,

   -- Truthy when the character's linebreak class is in quoteTypes.
   isQuote = function (self, char)
      local lbclass = self:charData(char).linebreak
      return self.quoteTypes[lbclass]
   end,

   -- Truthy when the character's linebreak class is in wordTypes.
   isWord = function (self, char)
      local lbclass = self:charData(char).linebreak
      return self.wordTypes[lbclass]
   end,
})
80✔
102

103
-- The unicode node maker derives from the base node maker and supplies the
-- lookup tables that the base class predicates index. The first four tables
-- are indexed by a char-def linebreak class, puctuationTypes by a char-def
-- category.
do
   local unicode = pl.class(SILE.nodeMakers.base)
   SILE.nodeMakers.unicode = unicode

   unicode.breakingTypes = { ba = true, zw = true }
   unicode.puctuationTypes = { po = true }
   -- quote linebreak category is ambiguous depending on the language
   unicode.quoteTypes = {}
   unicode.spaceTypes = { sp = true }
   unicode.wordTypes = { cm = true }
end
80✔
110

111
-- Handle one item at a position that is not an ICU breakpoint: classify its
-- text and either emit glue / a non-breaking space / a penalty, or add the
-- character to the pending token. Afterwards lasttype is set to the
-- character's char-def linebreak class (nil when there is no entry).
function SILE.nodeMakers.unicode:dealWith (item)
   local char = item.text
   local entry = chardata[SU.codepoint(char)]
   local thistype = entry and entry.linebreak

   if self:isSpace(char) then
      self:makeToken()
      self:makeGlue(item)
   elseif self:isActiveNonBreakingSpace(char) then
      self:makeToken()
      self:makeNonBreakingSpace()
   elseif self:isBreaking(char) then
      -- The breaking character closes the current token, then a
      -- zero-cost break opportunity follows it.
      self:addToken(char, item)
      self:makeToken()
      self:makePenalty(0)
   elseif self:isQuote(char) then
      self:addToken(char, item)
      self:makeToken()
   else
      -- NOTE(review): isWord receives the linebreak class here, although
      -- it looks the value up as if it were a character — confirm intent.
      local classChanged = self.lasttype
         and (thistype and thistype ~= self.lasttype and not self:isWord(thistype))
      -- Letterspacing is only attempted when the class did not change.
      if not classChanged then
         self:letterspace()
      end
      self:addToken(char, item)
   end

   self.lasttype = thistype
end
136

137
-- Pass every leading space item to makeGlue.
-- Returns the index of the first item that is not a space (#items + 1 when
-- all of them are, 1 for an empty list), followed by the items list itself.
function SILE.nodeMakers.unicode:handleInitialGlue (items)
   local first = #items + 1
   for idx = 1, #items do
      local item = items[idx]
      if not self:isSpace(item.text) then
         first = idx
         break
      end
      self:makeGlue(item)
   end
   return first, items
end
150

151
-- When the document.letterspaceglue setting is set, flush the pending token
-- and, if something other than glue was emitted last, yield a kern whose
-- width comes from that setting. Does nothing when the setting is falsy.
function SILE.nodeMakers.unicode:letterspace ()
   if SILE.settings:get("document.letterspaceglue") then
      if self.token then
         self:makeToken()
      end
      local previous = self.lastnode
      if previous and previous ~= "glue" then
         local w = SILE.settings:get("document.letterspaceglue").width
         SU.debug("tokenizer", "Letter space glue:", w)
         coroutine.yield(SILE.types.node.kern({ width = w }))
         -- The kern is recorded as glue so that the next call does not
         -- emit a second one right after it.
         self.lasttype = "sp"
         self.lastnode = "glue"
      end
   end
end
166

167
-- Truthy when a pending breakpoint exists and the item's index has reached
-- (or passed) the index of the first one. Returns nil when chunks is empty.
function SILE.nodeMakers.unicode.isICUBreakHere (_, chunks, item)
   local nextBreak = chunks[1]
   return nextBreak and (item.index >= nextBreak.index)
end
170

171
-- Consume the ICU breakpoint reached at this item and dispatch on its type.
-- Expects chunks[1] to exist (the iterator only calls this after
-- isICUBreakHere returned a truthy value). Returns the same chunks table,
-- with the consumed breakpoints removed.
function SILE.nodeMakers.unicode:handleICUBreak (chunks, item)
   -- The ICU library has told us there is a breakpoint at this index.
   local breakpoint = chunks[1]

   -- Drop this breakpoint (and any out of order ones) so that chunks[1]
   -- becomes the next index to compare against the string.
   local head = breakpoint
   while head and item.index >= head.index do
      table.remove(chunks, 1)
      head = chunks[1]
   end

   -- Decide which kind of breakpoint we have and handle it; any type other
   -- than "word" or "line" is ignored.
   local kind = breakpoint.type
   if kind == "word" then
      self:handleWordBreak(item)
   elseif kind == "line" then
      self:handleLineBreak(item, breakpoint.subtype)
   end
   return chunks
end
190

191
-- Word boundary: flush the pending token, then emit glue for a space, a
-- kern for an active no-break space, or start a new token with the item.
function SILE.nodeMakers.unicode:handleWordBreak (item)
   self:makeToken()
   local text = item.text
   if self:isSpace(text) then
      -- Spacing word break
      self:makeGlue(item)
   elseif self:isActiveNonBreakingSpace(text) then
      -- Non-breaking space word break
      self:makeNonBreakingSpace()
   else
      -- A word break which isn't a space: the character opens the next token
      self:addToken(text, item)
   end
end
204

205
-- Word-break handler variant for languages where, when a break occurs at an
-- explicit hyphen, the hyphen is repeated at the beginning of the new line.
-- Any item other than "-" is delegated to the regular handleWordBreak.
function SILE.nodeMakers.unicode:_handleWordBreakRepeatHyphen (item)
   if item.text ~= "-" then
      SILE.nodeMakers.unicode.handleWordBreak(self, item)
      return
   end

   -- Keep the hyphen as part of the token that ends here.
   self:addToken(item.text, item)
   self:makeToken()

   -- Follow it with a discretionary whose postbreak is another hyphen.
   -- NOTE(review): with the base makeToken, lastnode is "nnode" at this
   -- point, so this guard appears to always pass — confirm.
   if self.lastnode ~= "discretionary" then
      local repeated = SILE.types.node.discretionary({
         postbreak = SILE.shaper:createNnodes("-", self.options),
      })
      coroutine.yield(repeated)
      self.lastnode = "discretionary"
   end
end
221

222
-- Line-break opportunity reported by ICU. Spaces (and active no-break
-- spaces) are handled as ordinary word breaks; anything else flushes the
-- token, emits a penalty (0 for subtype "soft", -1000 otherwise) and starts
-- a new token with the item.
function SILE.nodeMakers.unicode:handleLineBreak (item, subtype)
   -- Because we are in charge of paragraphing, we override space-type line
   -- breaks and treat them just as ordinary word spaces.
   if self:isSpace(item.text) or self:isActiveNonBreakingSpace(item.text) then
      self:handleWordBreak(item)
      return
   end

   -- Explicit line breaks become soft or hard breaks.
   self:makeToken()
   local penalty = -1000
   if subtype == "soft" then
      penalty = 0
   end
   self:makePenalty(penalty)

   local char = item.text
   self:addToken(char, item)

   -- Remember the linebreak class of the character just added (nil when
   -- char-def has no entry for it).
   local entry = chardata[SU.codepoint(char)]
   self.lasttype = entry and entry.linebreak
end
239

240
-- Line-break handler variant used together with the repeated-hyphen word
-- break: everything is delegated to the regular handleLineBreak, except
-- right after a discretionary.
function SILE.nodeMakers.unicode:_handleLineBreakRepeatHyphen (item, subtype)
   if self.lastnode ~= "discretionary" then
      SILE.nodeMakers.unicode.handleLineBreak(self, item, subtype)
      return
   end
   -- Initial word boundary after a discretionary:
   -- bypass it and just deal with the token.
   self:dealWith(item)
end
249

250
-- Build the node iterator for a list of items.
-- The text of all items is joined and passed to ICU together with
-- self.options.language to obtain the breakpoints. The returned function
-- (a wrapped coroutine) yields the nodes produced while walking the items:
-- leading spaces first, then each item either as an ICU breakpoint or as an
-- ordinary character, and finally whatever token is still pending.
-- Side effects: sets self.items, self.i and self.item while iterating.
function SILE.nodeMakers.unicode:iterator (items)
   -- Collect the pieces and join them once; appending with ".." inside the
   -- loop would copy the growing string on every iteration.
   local pieces = {}
   for i = 1, #items do
      pieces[i] = items[i].text
   end
   local fulltext = table.concat(pieces)

   local chunks = { icu.breakpoints(fulltext, self.options.language) }
   -- The first reported breakpoint is discarded (presumably the boundary at
   -- the very start of the text — confirm against justenoughicu).
   table.remove(chunks, 1)

   return coroutine.wrap(function ()
      local i
      i, self.items = self:handleInitialGlue(items)
      for j = i, #items do
         self.i = j
         self.item = self.items[self.i]
         if self:isICUBreakHere(chunks, self.item) then
            chunks = self:handleICUBreak(chunks, self.item)
         else
            self:dealWith(self.item)
         end
      end
      -- Flush whatever is left in the pending token.
      self:makeToken()
   end)
end
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2025 Coveralls, Inc