fs = require 'fs' punycode = require 'punycode' LineBreaker = require '../' assert = require 'assert' describe 'unicode line break tests', -> # these tests are weird, possibly incorrect or just tailored differently. we skip them. skip = [812, 814, 848, 850, 864, 866, 900, 902, 956, 958, 1068, 1070, 1072, 1074, 1224, 1226, 1228, 1230, 1760, 1762, 2932, 2934, 4100, 4101, 4102, 4103, 4340, 4342, 4496, 4498, 4568, 4570, 4704, 4706, 4707, 4708, 4710, 4711, 4712, 4714, 4715, 4716, 4718, 4719, 4722, 4723, 4726, 4727, 4730, 4731, 4734, 4735, 4736, 4738, 4739, 4742, 4743, 4746, 4747, 4748, 4750, 4751, 4752, 4754, 4755, 4756, 4758, 4759, 4760, 4762, 4763, 4764, 4766, 4767, 4768, 4770, 4771, 4772, 4774, 4775, 4778, 4779, 4780, 4782, 4783, 4784, 4786, 4787, 4788, 4790, 4791, 4794, 4795, 4798, 4799, 4800, 4802, 4803, 4804, 4806, 4807, 4808, 4810, 4811, 4812, 4814, 4815, 4816, 4818, 4819, 4820, 4822, 4823, 4826, 4827, 4830, 4831, 4834, 4835, 4838, 4839, 4840, 4842, 4843, 4844, 4846, 4847, 4848, 4850, 4851, 4852, 4854, 4855, 4856, 4858, 4859, 4960, 4962, 5036, 5038, 6126, 6135, 6140, 6225, 6226, 6227, 6228, 6229, 6230, 6232, 6233, 6234, 6235, 6236, 6332] data = fs.readFileSync __dirname + '/LineBreakTest.txt', 'utf8' lines = data.split '\n' lines.forEach (line, i) -> return if not line or /^#/.test(line) [cols, comment] = line.split('#') codePoints = cols.split(/\s*[×÷]\s*/).slice(1, -1).map (c) -> parseInt(c, 16) str = punycode.ucs2.encode codePoints breaker = new LineBreaker(str) breaks = [] last = 0 while bk = breaker.nextBreak() breaks.push str.slice(last, bk.position) last = bk.position expected = cols.split(/\s*÷\s*/).slice(0, -1).map (c) -> codes = c.split(/\s*×\s*/) codes.shift() if codes[0] is '' codes = codes.map (c) -> parseInt(c, 16) punycode.ucs2.encode codes if i in skip it.skip cols, -> return it cols, -> assert.deepEqual breaks, expected, i + ' ' + JSON.stringify(breaks) + ' != ' + JSON.stringify(expected) + ' #' + comment