if not modules then modules = { } end modules ['luaotfload-database'] = { version = "2.7", comment = "companion to luaotfload-main.lua", author = "Khaled Hosny, Elie Roux, Philipp Gesang", copyright = "Luaotfload Development Team", license = "GNU GPL v2.0" } --[[doc-- With version 2.7 we killed of the Fontforge libraries in favor of the Lua implementation of the OT format reader. There were many reasons to do this on top of the fact that FF won’t be around at version 1.0 anymore: In addition to maintainability, memory safety and general code hygiene, the new reader shows an amazing performance: Scanning of the 3200 font files on my system takes around 23 s now, as opposed to 74 s with the Fontforge libs. Memory usage has improved drastically as well, as illustrated by these profiles: GB 1.324^ # | # | ::# | : #:: | @: #: | @: #: | @@@: #: | @@@ @: #: | @@ @ @ @: #: | @ @@:@ @ @: #: : | @@ : @ :@ @ @: #: : | @@: ::@@ :@@ ::@ :@ @ @: #: : ::: | @@ : :: @@ :@ : @ :@ @ @: #: : :: : | @@ : ::: @@ :@ ::: @ :@ @ @: #: :: :: : | @@@@ :: :::: @@ :@ : : @ :@ @ @: #: :: :::: :: | :@ @@ :: :::: @@ :@ : :: : @ :@ @ @: #: :: :: :: :: | @:@ @@ :: ::::: @@ :@ : :::: : @ :@ @ @: #: :::: :::: :: :: | @@:@ @@ :: ::::::: @@ :@ : : :: : @ :@ @ @: #: ::: @: :: :: ::@ | @@@:@ @@ :: :: ::::: @@ :@ ::: :: : @ :@ @ @: #: ::: @: :: :: ::@ | @@@@@:@ @@ ::::::: ::::: @@ :@ ::: :: : @ :@ @ @: #: ::: ::@: :: :: ::@ 0 +----------------------------------------------------------------------->GB 0 16.29 This is the memory usage during a complete database rebuild with the Fontforge libraries. The same action using the new ``getinfo()`` method gives a different picture: MB 43.37^ # | @ @ @# | @@ @ @ @# : | @@@ : @: @ @ @# : | @ @@@ : : @: @ @: :@# : | @ @ @@@ : : @: @ @: :@# : | @ : : :@ @@@:::: @::@ @: :@#:: : | :: : @ : @ : :::@ @ :@@@:::::@::@ @:::@#:::: | : @ : :: : :@:: :@: :::::@ @ :@@@:::::@::@:@:::@#:::: | :: :@ : @ ::@:@:::@:: :@: :::::@: :@ :@@@:::::@::@:@:::@#:::: | :: :@::: :@ ::@:@: :@::::@::::::::@:::@::@@@:::::@::@:@:::@#:::: | :@::::@::: :@:::@:@: :@::::@::::::::@:::@::@@@:::::@::@:@:::@#:::: | :::::@::::@::: :@:::@:@: :@::::@::::::::@:::@::@@@:::::@::@:@:::@#:::: | ::: :@::::@::: :@:::@:@: :@::::@::::::::@:::@::@@@:::::@::@:@:::@#:::: | :::: :@::::@::: :@:::@:@: :@::::@::::::::@:::@::@@@:::::@::@:@:::@#:::: | :::: :@::::@::: :@:::@:@: :@::::@::::::::@:::@::@@@:::::@::@:@:::@#:::: | :::: :@::::@::: :@:::@:@: :@::::@::::::::@:::@::@@@:::::@::@:@:::@#:::: | :::: :@::::@::: :@:::@:@: :@::::@::::::::@:::@::@@@:::::@::@:@:::@#:::: | :::: :@::::@::: :@:::@:@: :@::::@::::::::@:::@::@@@:::::@::@:@:::@#:::: | :::: :@::::@::: :@:::@:@: :@::::@::::::::@:::@::@@@:::::@::@:@:::@#:::: 0 +----------------------------------------------------------------------->GB 0 3.231 FF peaks at around 1.4 GB after 12.5 GB worth of allocations, whereas the Lua implementation arrives at around 45 MB after 3.2 GB total: impl time(B) total(B) useful-heap(B) extra-heap(B) fontforge 12,496,407,184 1,421,150,144 1,327,888,638 93,261,506 lua 3,263,698,960 45,478,640 37,231,892 8,246,748 Much of the inefficiency of Fontforge is a direct consequence of having to parse the entire font to extract what essentially boils down to a couple hundred bytes of metadata per font. Since some information like design sizes (oh, Adobe!) is stuffed away in Opentype tables, the vastly more efficient approach of fontloader.info() proves insufficient for indexing. Thus, we ended up using fontloader.open() which causes even the character tables to be parsed, which incidentally are responsible for most of the allocations during that peak of 1.4 GB measured above, along with the encodings: 20.67% (293,781,048B) 0x6A8F72: SplineCharCreate (splineutil.c:3878) 09.82% (139,570,318B) 0x618ACD: _FontViewBaseCreate (fontviewbase.c:84) 08.77% (124,634,384B) 0x6A8FB3: SplineCharCreate (splineutil.c:3885) 04.53% (64,436,904B) in 80 places, all below massif's threshold (1.00%) 02.68% (38,071,520B) 0x64E14E: addKernPair (parsettfatt.c:493) 01.04% (14,735,320B) 0x64DE7D: addPairPos (parsettfatt.c:452) 39.26% (557,942,484B) 0x64A4E0: PsuedoEncodeUnencoded (parsettf.c:5706) What gives? For 2.7 we expect a rougher transition than a year back due to the complete revamp of the OT loading code. Breakage of fragile aspects like font and style names has been anticipated and addressed prior to the 2016 pretest release. In contrast to the earlier approach of letting FF do a complete dump and then harvest identifiers from the output we now have to coordinate with upstream as to which fields are actually needed in order to provide a similarly acceptable name → file lookup. On the bright side, these things are a lot simpler to fix than the rather tedious work of having users update their Luatex binary =) --doc]]-- local lpeg = require "lpeg" local P, Cc, lpegmatch = lpeg.P, lpeg.Cc, lpeg.match local log = luaotfload.log local logreport = log and log.report or print -- overriden later on local report_status = log.names_status local report_status_start = log.names_status_start local report_status_stop = log.names_status_stop --- Luatex builtins local load = load local next = next local require = require local tonumber = tonumber local unpack = table.unpack local fonts = fonts or { } local fontshandlers = fonts.handlers or { } local otfhandler = fonts.handlers.otf or { } fonts.handlers = fontshandlers local gzipload = gzip.load local gzipsave = gzip.save local iolines = io.lines local ioopen = io.open local iopopen = io.popen local kpseexpand_path = kpse.expand_path local kpsefind_file = kpse.find_file local kpselookup = kpse.lookup local kpsereadable_file = kpse.readable_file local lfsattributes = lfs.attributes local lfschdir = lfs.chdir local lfscurrentdir = lfs.currentdir local lfsdir = lfs.dir local mathabs = math.abs local mathmin = math.min local osgetenv = os.getenv local osgettimeofday = os.gettimeofday local osremove = os.remove local stringfind = string.find local stringformat = string.format local stringgmatch = string.gmatch local stringgsub = string.gsub local stringlower = string.lower local stringsub = string.sub local stringupper = string.upper local tableconcat = table.concat local tablesort = table.sort local utf8gsub = unicode.utf8.gsub local utf8lower = unicode.utf8.lower local utf8len = unicode.utf8.len local zlibcompress = zlib.compress --- these come from Lualibs/Context local filebasename = file.basename local filecollapsepath = file.collapsepath or file.collapse_path local filedirname = file.dirname local fileextname = file.extname local fileiswritable = file.iswritable local filejoin = file.join local filenameonly = file.nameonly local filereplacesuffix = file.replacesuffix local filesplitpath = file.splitpath or file.split_path local filesuffix = file.suffix local getwritablepath = caches.getwritablepath local lfsisdir = lfs.isdir local lfsisfile = lfs.isfile local lfsmkdirs = lfs.mkdirs local lpegsplitat = lpeg.splitat local stringis_empty = string.is_empty local stringsplit = string.split local stringstrip = string.strip local tableappend = table.append local tablecontains = table.contains local tablecopy = table.copy local tablefastcopy = table.fastcopy local tabletofile = table.tofile local tabletohash = table.tohash local tableserialize = table.serialize local names = fonts and fonts.names or { } local name_index = nil --> upvalue for names.data local lookup_cache = nil --> for names.lookups --- string -> (string * string) local make_luanames = function (path) return filereplacesuffix(path, "lua"), filereplacesuffix(path, "luc") end local format_precedence = { "otf", "ttc", "ttf", "afm", "pfb" } local location_precedence = { "local", "system", "texmf", } local set_location_precedence = function (precedence) location_precedence = precedence end --[[doc-- Auxiliary functions --doc]]-- --- fontnames contain all kinds of garbage; as a precaution we --- lowercase and strip them of non alphanumerical characters --- string -> string local invalidchars = "[^%a%d]" local sanitize_fontname = function (str) if str ~= nil then str = utf8gsub (utf8lower (str), invalidchars, "") return str end return nil end local sanitize_fontnames = function (rawnames) local result = { } for category, namedata in next, rawnames do if type (namedata) == "string" then result [category] = utf8gsub (utf8lower (namedata), invalidchars, "") else local target = { } for field, name in next, namedata do target [field] = utf8gsub (utf8lower (name), invalidchars, "") end result [category] = target end end return result end local find_files_indeed find_files_indeed = function (acc, dirs, filter) if not next (dirs) then --- done return acc end local pwd = lfscurrentdir () local dir = dirs[#dirs] dirs[#dirs] = nil if lfschdir (dir) then lfschdir (pwd) local newfiles = { } for ent in lfsdir (dir) do if ent ~= "." and ent ~= ".." then local fullpath = dir .. "/" .. ent if filter (fullpath) == true then if lfsisdir (fullpath) then dirs[#dirs+1] = fullpath elseif lfsisfile (fullpath) then newfiles[#newfiles+1] = fullpath end end end end return find_files_indeed (tableappend (acc, newfiles), dirs, filter) end --- could not cd into, so we skip it return find_files_indeed (acc, dirs, filter) end local dummyfilter = function () return true end --- the optional filter function receives the full path of a file --- system entity. a filter applies if the first argument it returns is --- true. --- string -> function? -> string list local find_files = function (root, filter) if lfsisdir (root) then return find_files_indeed ({}, { root }, filter or dummyfilter) end end --[[doc-- This is a sketch of the luaotfload db: type dbobj = { families : familytable; files : filemap; status : filestatus; mappings : fontentry list; meta : metadata; } and familytable = { local : (format, familyentry) hash; // specified with include dir texmf : (format, familyentry) hash; system : (format, familyentry) hash; } and familyentry = { r : sizes; // regular i : sizes; // italic b : sizes; // bold bi : sizes; // bold italic } and sizes = { default : int; // points into mappings or names optical : (int, int) list; // design size -> index entry } and metadata = { created : string // creation time formats : string list; // { "otf", "ttf", "ttc" } local : bool; (* set if local fonts were added to the db *) modified : string // modification time statistics : TODO; // created when built with "--stats" version : float; // index version } and filemap = { // created by generate_filedata() base : { local : (string, int) hash; // basename -> idx system : (string, int) hash; texmf : (string, int) hash; }; bare : { local : (string, (string, int) hash) hash; // location -> (barename -> idx) system : (string, (string, int) hash) hash; texmf : (string, (string, int) hash) hash; }; full : (int, string) hash; // idx -> full path } and fontentry = { // finalized by collect_families() basename : string; // file name without path "foo.otf" conflicts : { barename : int; basename : int }; // filename conflict with font at index; happens with subfonts familyname : string; // sanitized name of the font family the font belongs to, usually from the names table fontname : string; // sanitized name of the font format : string; // "otf" | "ttf" | "afm" (* | "pfb" *) fullname : string; // sanitized full name of the font including style modifiers fullpath : string; // path to font in filesystem index : int; // index in the mappings table italicangle : float; // italic angle; non-zero with oblique faces location : string; // "texmf" | "system" | "local" metafamily : string; // alternative family identifier if appropriate, sanitized plainname : string; // unsanitized font name typographicsubfamily : string; // sanitized preferred subfamily (names table 14) psname : string; // PostScript name size : (false | float * float * float); // if available, size info from the size table converted from decipoints subfamily : string; // sanitized subfamily (names table 2) subfont : (int | bool); // integer if font is part of a TrueType collection ("ttc") version : string; // font version string weight : int; // usWeightClass } and filestatus = (string, // fullname { index : int list; // pointer into mappings timestamp : int; }) dict beware that this is a reconstruction and may be incomplete or out of date. Last update: 2014-04-06, describing version 2.51. mtx-fonts has in names.tma: type names = { cache_uuid : uuid; cache_version : float; datastate : uuid list; fallbacks : (filetype, (basename, int) hash) hash; families : (basename, int list) hash; files : (filename, fullname) hash; indices : (fullname, int) hash; mappings : (filetype, (basename, int) hash) hash; names : ? (empty hash) ?; rejected : (basename, int) hash; specifications: fontentry list; } and fontentry = { designsize : int; familyname : string; filename : string; fontname : string; format : string; fullname : string; maxsize : int; minsize : int; modification : int; rawname : string; style : string; subfamily : string; variant : string; weight : string; width : string; } --doc]]-- --- string list -> string option -> dbobj local initialize_namedata = function (formats, created) local now = os.date "%Y-%m-%d %H:%M:%S" --- i. e. "%F %T" on POSIX systems return { status = { }, -- was: status; map abspath -> mapping mappings = { }, -- TODO: check if still necessary after rewrite files = { }, -- created later meta = { created = created or now, formats = formats, ["local"] = false, modified = now, statistics = { }, version = names.version, }, } end --- When loading a lua file we try its binary complement first, which --- is assumed to be located at an identical path, carrying the suffix --- .luc. --- string -> (string * table) local load_lua_file = function (path) local foundname = filereplacesuffix (path, "luc") local code = nil local fh = ioopen (foundname, "rb") -- try bin first if fh then local chunk = fh:read"*all" fh:close() code = load (chunk, "b") end if not code then --- fall back to text file foundname = filereplacesuffix (path, "lua") fh = ioopen(foundname, "rb") if fh then local chunk = fh:read"*all" fh:close() code = load (chunk, "t") end end if not code then --- probe gzipped file foundname = filereplacesuffix (path, "lua.gz") local chunk = gzipload (foundname) if chunk then code = load (chunk, "t") end end if not code then return nil, nil end return foundname, code () end --- define locals in scope local access_font_index local find_closest local flush_lookup_cache local generate_filedata local get_font_filter local group_modifiers local load_names local lookup_font_name local getmetadata local order_design_sizes local ot_fullinfo local read_blacklist local reload_db local lookup_fullpath local save_lookups local save_names local set_font_filter local t1_fullinfo local update_names --- state of the database local fonts_reloaded = false --- limit output when approximate font matching (luaotfload-tool -F) local fuzzy_limit = 1 --- display closest only --- bool? -> -> bool? -> dbobj option load_names = function (dry_run, no_rebuild) local starttime = osgettimeofday () local foundname, data = load_lua_file (config.luaotfload.paths.index_path_lua) if data then logreport ("log", 0, "db", "Font names database loaded from %s", foundname) logreport ("term", 3, "db", "Font names database loaded from %s", foundname) logreport ("info", 3, "db", "Loading took %0.f ms.", 1000 * (osgettimeofday () - starttime)) local db_version, names_version if data.meta then db_version = data.meta.version else --- Compatibility branch; the version info used to be --- stored in the table root which is why updating from --- an earlier index version broke. db_version = data.version or -42 --- invalid end names_version = names.version if db_version ~= names_version then logreport ("both", 0, "db", [[Version mismatch; expected %4.3f, got %4.3f.]], names_version, db_version) if not fonts_reloaded then logreport ("both", 0, "db", [[Force rebuild.]]) data = update_names (initialize_namedata (get_font_filter ()), true, false) if not data then logreport ("both", 0, "db", "Database creation unsuccessful.") end end end else if no_rebuild == true then logreport ("both", 2, "db", [[Database does not exist, skipping rebuild though.]]) return false end logreport ("both", 0, "db", [[Font names database not found, generating new one.]]) logreport ("both", 0, "db", [[This can take several minutes; please be patient.]]) data = update_names (initialize_namedata (get_font_filter ()), nil, dry_run) if not data then logreport ("both", 0, "db", "Database creation unsuccessful.") end end return data end --[[doc-- access_font_index -- Provide a reference of the index table. Will cause the index to be loaded if not present. --doc]]-- access_font_index = function () if not name_index then name_index = load_names () end return name_index end getmetadata = function () if not name_index then name_index = load_names (false, true) if name_index then return tablefastcopy (name_index.meta) end end return false end --- unit -> unit local load_lookups load_lookups = function ( ) local foundname, data = load_lua_file(config.luaotfload.paths.lookup_path_lua) if data then logreport ("log", 0, "cache", "Lookup cache loaded from %s.", foundname) logreport ("term", 3, "cache", "Lookup cache loaded from %s.", foundname) else logreport ("both", 1, "cache", "No lookup cache, creating empty.") data = { } end lookup_cache = data end local regular_synonym = { book = true, normal = true, plain = true, regular = true, roman = true, } local italic_synonym = { oblique = true, slanted = true, italic = true, } local bold_synonym = { bold = true, black = true, heavy = true, } local style_category = { regular = "r", bold = "b", bolditalic = "bi", italic = "i", r = "regular", b = "bold", bi = "bolditalic", i = "italic", } local type1_metrics = { "tfm", "ofm", } local lookup_filename = function (filename) if not name_index then name_index = load_names () end local files = name_index.files local basedata = files.base local baredata = files.bare for i = 1, #location_precedence do local location = location_precedence [i] local basenames = basedata [location] local barenames = baredata [location] local idx if basenames ~= nil then idx = basenames [filename] if idx then goto done end end if barenames ~= nil then for j = 1, #format_precedence do local format = format_precedence [j] local filemap = barenames [format] if filemap then idx = barenames [format] [filename] if idx then break end end end end ::done:: if idx then return files.full [idx] end end end --[[doc-- lookup_font_file -- The ``file:`` are ultimately delegated here. The lookups are kind of a blunt instrument since they try locating the file using every conceivable method, which is quite inefficient. Nevertheless, resolving files that way is rarely the bottleneck. --doc]]-- local dummy_findfile = resolvers.findfile -- from basics-gen --- string -> string * string * bool local lookup_font_file lookup_font_file = function (filename) local found = lookup_filename (filename) if not found then found = dummy_findfile(filename) end if found then return found, nil, true end for i=1, #type1_metrics do local format = type1_metrics[i] if resolvers.findfile(filename, format) then return file.addsuffix(filename, format), format, true end end if not fonts_reloaded and config.luaotfload.db.update_live == true then return reload_db (stringformat ("File not found: %s.", filename), lookup_font_file, filename) end return filename, nil, false end --[[doc-- get_font_file -- Look up the file of an entry in the mappings table. If the index is valid, pass on the name and subfont index after verifing the existence of the resolved file. This verification differs depending the index entry’s ``location`` field: * ``texmf`` fonts are verified using the (slow) function ``kpse.lookup()``; * other locations are tested by resolving the full path and checking for the presence of a file there. --doc]]-- --- int -> bool * (string * int) option local get_font_file = function (index) local entry = name_index.mappings [index] if not entry then return false end local basename = entry.basename if entry.location == "texmf" then if kpselookup(basename) then return true, basename, entry.subfont end else --- system, local local fullname = name_index.files.full [index] if lfsisfile (fullname) then return true, basename, entry.subfont end end return false end --[[doc-- We need to verify if the result of a cached lookup actually exists in the texmf or filesystem. Again, due to the schizoprenic nature of the font managment we have to check both the system path and the texmf. --doc]]-- local verify_font_file = function (basename) local path = lookup_fullpath (basename) if path and lfsisfile(path) then return true end if kpsefind_file(basename) then return true end return false end --[[doc-- Lookups can be quite costly, more so the less specific they are. Even if we find a matching font eventually, the next time the user compiles Eir document E will have to stand through the delay again. Thus, some caching of results -- even between runs -- is in order. We’ll just store successful name: lookups in a separate cache file. type lookup_cache = (string, (string * num)) dict The spec is expected to be modified in place (ugh), so we’ll have to catalogue what fields actually influence its behavior. Idk what the “spec” resolver is for. lookup inspects modifies ---------- ----------------- --------------------------- file: name forced, name name:[*] name, style, sub, resolved, sub, name, forced optsize, size spec: name, sub resolved, sub, name, forced [*] name: contains both the name resolver from luatex-fonts and lookup_font_name () below From my reading of font-def.lua, what a resolver does is basically rewrite the “name” field of the specification record with the resolution. Also, the fields “resolved”, “sub”, “force” etc. influence the outcome. --doc]]-- local concat_char = "#" local hash_fields = { --- order is important "specification", "style", "sub", "optsize", "size", } local n_hash_fields = #hash_fields --- spec -> string local hash_request = function (specification) local key = { } --- segments of the hash for i=1, n_hash_fields do local field = specification[hash_fields[i]] if field then key[#key+1] = field end end return tableconcat(key, concat_char) end --- 'a -> 'a -> table -> (string * int|boolean * boolean) local lookup_font_name_cached lookup_font_name_cached = function (specification) if not lookup_cache then load_lookups () end local request = hash_request(specification) logreport ("both", 4, "cache", "Looking for %q in cache ...", request) local found = lookup_cache [request] --- case 1) cache positive ---------------------------------------- if found then --- replay fields from cache hit logreport ("info", 4, "cache", "Found!") local basename = found[1] --- check the presence of the file in case it’s been removed local success = verify_font_file (basename) if success == true then return basename, found[2], true end logreport ("both", 4, "cache", "Cached file not found; resolving again.") else logreport ("both", 4, "cache", "Not cached; resolving.") end --- case 2) cache negative ---------------------------------------- --- first we resolve normally ... local filename, subfont = lookup_font_name (specification) if not filename then return nil, nil end --- ... then we add the fields to the cache ... ... local entry = { filename, subfont } logreport ("both", 4, "cache", "New entry: %s.", request) lookup_cache [request] = entry --- obviously, the updated cache needs to be stored. --- TODO this should trigger a save only once the --- document is compiled (finish_pdffile callback?) logreport ("both", 5, "cache", "Saving updated cache.") local success = save_lookups () if not success then --- sad, but not critical logreport ("both", 0, "cache", "Error writing cache.") end return filename, subfont end --- this used to be inlined; with the lookup cache we don’t --- have to be parsimonious wrt function calls anymore --- “found” is the match accumulator local add_to_match = function (found, size, face) local continue = true local optsize = face.size if optsize and next (optsize) then local dsnsize, maxsize, minsize dsnsize = optsize[1] maxsize = optsize[2] minsize = optsize[3] if size ~= nil and (dsnsize == size or (size > minsize and size <= maxsize)) then found[1] = face continue = false ---> break else found[#found+1] = face end else found[1] = face continue = false ---> break end return found, continue end local choose_closest = function (distances) local closest = 2^51 local match for i = 1, #distances do local d, index = unpack (distances [i]) if d < closest then closest = d match = index end end return match end --[[doc-- choose_size -- Pick a font face of appropriate size from the list of family members with matching style. There are three categories: 1. exact matches: if there is a face whose design size equals the asked size, it is returned immediately and no further candidates are inspected. 2. range matches: of all faces in whose design range the requested size falls the one whose center the requested size is closest to is returned. 3. out-of-range matches: of all other faces (i. e. whose range is above or below the asked size) the one is chosen whose boundary (upper or lower) is closest to the requested size. 4. default matches: if no design size or a design size of zero is requested, the face with the default size is returned. --doc]]-- --- int * int * int * int list -> int -> int local choose_size = function (sizes, askedsize) local mappings = name_index.mappings local match = sizes.default local exact local inrange = { } --- distance * index list local norange = { } --- distance * index list local fontname, subfont if askedsize ~= 0 then --- firstly, look for an exactly matching design size or --- matching range for i = 1, #sizes do local dsnsize, high, low, index = unpack (sizes [i]) if dsnsize == askedsize then --- exact match, this is what we were looking for exact = index goto skip elseif askedsize < low then --- below range, add to the norange table local d = low - askedsize norange [#norange + 1] = { d, index } elseif askedsize > high then --- beyond range, add to the norange table local d = askedsize - high norange [#norange + 1] = { d, index } else --- range match local d = ((low + high) / 2) - askedsize if d < 0 then d = -d end inrange [#inrange + 1] = { d, index } end end end ::skip:: if exact then match = exact elseif #inrange > 0 then match = choose_closest (inrange) elseif #norange > 0 then match = choose_closest (norange) end return match end --[[doc-- lookup_familyname -- Query the families table for an entry matching the specification. The parameters “name” and “style” are pre-sanitized. --doc]]-- --- spec -> string -> string -> int -> string * int local lookup_familyname = function (specification, name, style, askedsize) local families = name_index.families local mappings = name_index.mappings local candidates = nil --- arrow code alert for i = 1, #location_precedence do local location = location_precedence [i] local locgroup = families [location] for j = 1, #format_precedence do local format = format_precedence [j] local fmtgroup = locgroup [format] if fmtgroup then local familygroup = fmtgroup [name] if familygroup then local stylegroup = familygroup [style] if stylegroup then --- suitable match candidates = stylegroup goto done end end end end end if true then return nil, nil end ::done:: index = choose_size (candidates, askedsize) local success, resolved, subfont = get_font_file (index) if not success then return nil, nil end logreport ("info", 2, "db", "Match found: %s(%d).", resolved, subfont or 0) return resolved, subfont end local lookup_fontname = function (specification, name, style) local mappings = name_index.mappings local fallback = nil local lastresort = nil style = style_category [style] for i = 1, #mappings do local face = mappings [i] local typographicsubfamily = face.typographicsubfamily local subfamily = face.subfamily if face.fontname == name or face.fullname == name or face.psname == name then return face.basename, face.subfont elseif face.familyname == name then if typographicsubfamily == style or subfamily == style then fallback = face elseif regular_synonym [typographicsubfamily] or regular_synonym [subfamily] then lastresort = face end elseif face.metafamily == name and ( regular_synonym [typographicsubfamily] or regular_synonym [subfamily]) then lastresort = face end end if fallback then return fallback.basename, fallback.subfont end if lastresort then return lastresort.basename, lastresort.subfont end return nil, nil end --[[doc-- lookup_font_name -- Perform a name: lookup. This first queries the font families table and, if there is no match for the spec, the font names table. The return value is a pair consisting of the file name and the subfont index if appropriate.. the request specification has the fields: · features: table · normal: set of { ccmp clig itlc kern liga locl mark mkmk rlig } · ??? · forced: string · lookup: "name" · method: string · name: string · resolved: string · size: int · specification: string (== ":" ) · sub: string The “size” field deserves special attention: if its value is negative, then it actually specifies a scalefactor of the design size of the requested font. This happens e.g. if a font is requested without an explicit “at size”. If the font is part of a larger collection with different design sizes, this complicates matters a bit: Normally, the resolver prefers fonts that have a design size as close as possible to the requested size. If no size specified, then the design size is implied. But which design size should that be? Xetex appears to pick the “normal” (unmarked) size: with Adobe fonts this would be the one that is neither “caption” nor “subhead” nor “display” &c ... For fonts by Adobe this seems to be the one that does not receive a “typographicsubfamily” field. (IOW Adobe uses the “typographicsubfamily” field to encode the design size in more or less human readable format.) However, this is not true of LM and EB Garamond. As this matters only where there are multiple design sizes to a given font/style combination, we put a workaround in place that chooses that unmarked version. The first return value of “lookup_font_name” is the file name of the requested font (string). It can be passed to the fullname resolver get_font_file(). The second value is either “false” or an integer indicating the subfont index in a TTC. --doc]]-- --- table -> string * (int | bool) lookup_font_name = function (specification) local resolved, subfont if not name_index then name_index = load_names () end local name = sanitize_fontname (specification.name) local style = sanitize_fontname (specification.style) or "r" local askedsize = specification.optsize if askedsize then askedsize = tonumber (askedsize) else askedsize = specification.size if askedsize and askedsize >= 0 then askedsize = askedsize / 65536 else askedsize = 0 end end resolved, subfont = lookup_familyname (specification, name, style, askedsize) if not resolved then resolved, subfont = lookup_fontname (specification, name, style) end if not resolved then if not fonts_reloaded and config.luaotfload.db.update_live == true then return reload_db (stringformat ("Font %s not found.", specification.name or ""), lookup_font_name, specification) end end return resolved, subfont end lookup_fullpath = function (fontname, ext) --- getfilename() if not name_index then name_index = load_names () end local files = name_index.files local basedata = files.base local baredata = files.bare for i = 1, #location_precedence do local location = location_precedence [i] local basenames = basedata [location] local idx if basenames ~= nil then idx = basenames [fontname] end if ext then local barenames = baredata [location] [ext] if not idx and barenames ~= nil then idx = barenames [fontname] end end if idx then return files.full [idx] end end return "" end --- when reload is triggered we update the database --- and then re-run the caller with the arg list --- string -> ('a -> 'a) -> 'a list -> 'a reload_db = function (why, caller, ...) local namedata = name_index local formats = tableconcat (namedata.meta.formats, ",") logreport ("both", 0, "db", "Reload initiated (formats: %s); reason: %q.", formats, why) set_font_filter (formats) namedata = update_names (namedata, false, false) if namedata then fonts_reloaded = true name_index = namedata return caller (...) end logreport ("both", 0, "db", "Database update unsuccessful.") end --- string -> string -> int local iterative_levenshtein = function (s1, s2) local costs = { } local len1, len2 = #s1, #s2 for i = 0, len1 do local last = i for j = 0, len2 do if i == 0 then costs[j] = j else if j > 0 then local current = costs[j-1] if stringsub(s1, i, i) ~= stringsub(s2, j, j) then current = mathmin(current, last, costs[j]) + 1 end costs[j-1] = last last = current end end end if i > 0 then costs[len2] = last end end return costs[len2]--- lower right has the distance end --- string list -> string list local delete_dupes = function (lst) local n0 = #lst if n0 == 0 then return lst end tablesort (lst) local ret = { } local last for i = 1, n0 do local cur = lst[i] if cur ~= last then last = cur ret[#ret + 1] = cur end end logreport (false, 8, "query", "Removed %d duplicate names.", n0 - #ret) return ret end --- string -> int -> bool find_closest = function (name, limit) local name = sanitize_fontname (name) limit = limit or fuzzy_limit if not name_index then name_index = load_names () end if not name_index or type (name_index) ~= "table" then if not fonts_reloaded then return reload_db("Font index missing.", find_closest, name) end return false end local by_distance = { } --- (int, string list) dict local distances = { } --- int list local cached = { } --- (string, int) dict local mappings = name_index.mappings local n_fonts = #mappings for n = 1, n_fonts do local current = mappings[n] --[[ This is simplistic but surpisingly fast. Matching is performed against the “fullname” field of a db record in preprocessed form. We then store the raw “fullname” at its edit distance. We should probably do some weighting over all the font name categories as well as whatever agrep does. --]] local fullname = current.plainname local sfullname = current.fullname local dist = cached[sfullname]--- maybe already calculated if not dist then dist = iterative_levenshtein(name, sfullname) cached[sfullname] = dist end local namelst = by_distance[dist] if not namelst then --- first entry namelst = { fullname } distances[#distances+1] = dist else --- append namelst[#namelst+1] = fullname end by_distance[dist] = namelst end --- print the matches according to their distance local n_distances = #distances if n_distances > 0 then --- got some data tablesort(distances) limit = mathmin(n_distances, limit) logreport (false, 1, "query", "Displaying %d distance levels.", limit) for i = 1, limit do local dist = distances[i] local namelst = delete_dupes (by_distance[dist]) logreport (false, 0, "query", "Distance from \"%s\": %s\n " .. tableconcat (namelst, "\n "), name, dist) end return true end return false end --- find_closest() --- string -> uint -> bool * (string | rawdata) local read_font_file = function (filename, subfont) local fontdata = otfhandler.readers.getinfo (filename, { subfont = subfont , details = false , platformnames = true , rawfamilynames = true }) local msg = fontdata.comment if msg then return false, msg end return true, fontdata end local load_font_file = function (filename, subfont) local err, ret = read_font_file (filename, subfont) if err == false then logreport ("both", 1, "db", "ERROR: failed to open %q: %q.", tostring (filename), tostring (ret)) return end return ret end --- rawdata -> (int * int * int | bool) local get_size_info = function (rawinfo) local design_size = rawinfo.design_size local design_range_top = rawinfo.design_range_top local design_range_bottom = rawinfo.design_range_bottom local fallback_size = design_size ~= 0 and design_size or design_range_bottom ~= 0 and design_range_bottom or design_range_top ~= 0 and design_range_top if fallback_size then design_size = (design_size or fallback_size) / 10 design_range_top = (design_range_top or fallback_size) / 10 design_range_bottom = (design_range_bottom or fallback_size) / 10 return { design_size, design_range_top, design_range_bottom, } end return false end --[[doc-- map_enlish_names -- Names-table for Lua fontloader objects. This may vanish eventually once we ditch Fontforge completely. Only subset of entries of that table are actually relevant so we’ll stick to that part. --doc]]-- local get_english_names = function (metadata) local namesource local platformnames = metadata.platformnames --[[-- Hans added the “platformnames” option for us to access parts of the original name table. The names are unreliable and completely disorganized, sure, but the Windows variant of the field often contains the superior information. Case in point: ["platformnames"]={ ["macintosh"]={ ["compatiblefullname"]="Garamond Premr Pro Smbd It", ["family"]="Garamond Premier Pro", ["fullname"]="Garamond Premier Pro Semibold Italic", ["postscriptname"]="GaramondPremrPro-SmbdIt", ["subfamily"]="Semibold Italic", }, ["windows"]={ ["family"]="Garamond Premr Pro Smbd", ["fullname"]="GaramondPremrPro-SmbdIt", ["postscriptname"]="GaramondPremrPro-SmbdIt", ["subfamily"]="Italic", ["typographicfamily"]="Garamond Premier Pro", ["typographicsubfamily"]="Semibold Italic", }, }, The essential bit is contained as “typographicfamily” (which we call for historical reasons the “preferred family”) and the “subfamily”. Only Why this is the case, only Adobe knows for certain. --]]-- if platformnames then --namesource = platformnames.macintosh or platformnames.windows namesource = platformnames.windows or platformnames.macintosh end return namesource or metadata end --[[-- In case of broken PS names we set some dummies. For this reason we copy what is necessary whilst keeping the table structure the same as in the tfmdata. --]]-- local get_raw_info = function (metadata, basename) local fontname = metadata.fontname local fullname = metadata.fullname if not fontname or not fullname then --- Broken names table, e.g. avkv.ttf with UTF-16 strings; --- we put some dummies in place like the fontloader --- (font-otf.lua) does. logreport ("both", 3, "db", "Invalid names table of font %s, using dummies. \z Reported: fontname=%q, fullname=%q.", tostring (basename), tostring (fontname), tostring (fullname)) fontname = "bad-fontname-" .. basename fullname = "bad-fullname-" .. basename end return { familyname = metadata.familyname, fontname = fontname, fullname = fullname, italicangle = metadata.italicangle, names = metadata.names, units_per_em = metadata.units_per_em, version = metadata.version, design_size = metadata.design_size or metadata.designsize, design_range_top = metadata.design_range_top or metadata.maxsize, design_range_bottom = metadata.design_range_bottom or metadata.minsize, } end local organize_namedata = function (rawinfo, nametable, basename, info) local default_name = nametable.compatiblefullname or nametable.fullname or nametable.postscriptname or rawinfo.fullname or rawinfo.fontname or info.fullname or info.fontname local default_family = nametable.typographicfamily or nametable.family or rawinfo.familyname or info.familyname -- local default_modifier = nametable.typographicsubfamily -- or nametable.subfamily local fontnames = { --- see --- https://developer.apple.com/fonts/TTRefMan/RM06/Chap6name.html --- http://www.microsoft.com/typography/OTSPEC/name.htm#NameIDs english = { --- where a “compatiblefullname” field is given, the value --- of “fullname” is either identical or differs by --- separating the style with a hyphen and omitting spaces. --- (According to the spec, “compatiblefullname” is --- “Macintosh only”.) Of the three “fullname” fields, this --- one appears to be the one with the entire name given in --- a legible, non-abbreviated fashion, for most fonts at --- any rate. However, in some fonts (e.g. CMU) all three --- fields are identical. fullname = --[[ 18 ]] nametable.compatiblefullname or --[[ 4 ]] nametable.fullname or default_name, --- we keep both the “preferred family” and the “family” --- values around since both are valid but can turn out --- quite differently, e.g. with Latin Modern: --- typographicfamily: “Latin Modern Sans”, --- family: “LM Sans 10” family = --[[ 1 ]] nametable.family or default_family, subfamily = --[[ 2 ]] nametable.subfamily or rawinfo.subfamilyname, psname = --[[ 6 ]] nametable.postscriptname, typographicfamily = --[[ 16 ]] nametable.typographicfamily, typographicsubfamily = --[[ 17 ]] nametable.typographicsubfamily, }, metadata = { fullname = rawinfo.fullname, fontname = rawinfo.fontname, familyname = rawinfo.familyname, }, info = { fullname = info.fullname, familyname = info.familyname, fontname = info.fontname, }, } return { sanitized = sanitize_fontnames (fontnames), fontname = rawinfo.fontname, fullname = rawinfo.fullname, familyname = rawinfo.familyname, } end local dashsplitter = lpegsplitat "-" local split_fontname = function (fontname) --- sometimes the style hides in the latter part of the --- fontname, separated by a dash, e.g. “Iwona-Regular”, --- “GFSSolomos-Regular” local splitted = { lpegmatch (dashsplitter, fontname) } if next (splitted) then return sanitize_fontname (splitted [#splitted]) end end local organize_styledata = function (metadata, rawinfo, info) local pfminfo = metadata.pfminfo local names = rawinfo.names return { --- see http://www.microsoft.com/typography/OTSPEC/features_pt.htm#size size = get_size_info (rawinfo), pfmweight = pfminfo and pfminfo.weight or metadata.pfmweight or 400, weight = rawinfo.weight or metadata.weight or "unspecified", split = split_fontname (rawinfo.fontname), width = pfminfo and pfminfo.width or metadata.pfmwidth, italicangle = metadata.italicangle, --- this is for querying, see www.ntg.nl/maps/40/07.pdf for details units_per_em = metadata.units_per_em or metadata.units, version = metadata.version, } end --[[doc-- The data inside an Opentype font file can be quite heterogeneous. Thus in order to get the relevant information, parts of the original table as returned by the font file reader need to be relocated. --doc]]-- --- string -> int -> bool -> string -> fontentry ot_fullinfo = function (filename, subfont, location, basename, format, info) local metadata = load_font_file (filename, subfont) if not metadata then return nil end local rawinfo = get_raw_info (metadata, basename) local nametable = get_english_names (metadata) local namedata = organize_namedata (rawinfo, nametable, basename, info) local style = organize_styledata (metadata, rawinfo, info) local res = { file = { base = basename, full = filename, subfont = subfont, location = location or "system" }, format = format, names = namedata, style = style, version = rawinfo.version, } return res end --[[doc-- Type1 font inspector. In comparison with OTF, PFB’s contain a good deal less name fields which makes it tricky in some parts to find a meaningful representation for the database. Good read: http://www.adobe.com/devnet/font/pdfs/5004.AFM_Spec.pdf --doc]]-- --- string -> int -> bool -> string -> fontentry t1_fullinfo = function (filename, _subfont, location, basename, format) local sanitized local metadata = load_font_file (filename) local fontname = metadata.fontname local fullname = metadata.fullname local familyname = metadata.familyname local italicangle = metadata.italicangle local style = "" local weight sanitized = sanitize_fontnames ({ fontname = fontname, psname = fullname, metafamily = familyname, familyname = familyname, weight = metadata.weight, --- string identifier typographicsubfamily = style, }) weight = sanitized.weight if weight == "bold" then style = weight end if italicangle ~= 0 then style = style .. "italic" end return { basename = basename, fullpath = filename, subfont = false, location = location or "system", format = format, fullname = sanitized.fullname, fontname = sanitized.fontname, familyname = sanitized.familyname, plainname = fullname, psname = sanitized.fontname, version = metadata.version, size = false, typographicsubfamily = style ~= "" and style or weight, weight = metadata.pfminfo and pfminfo.weight or 400, italicangle = italicangle, } end local loaders = { otf = ot_fullinfo, ttc = ot_fullinfo, ttf = ot_fullinfo, afm = t1_fullinfo, pfb = t1_fullinfo, } --- not side-effect free! local compare_timestamps = function (fullname, currentstatus, currententrystatus, currentmappings, targetstatus, targetentrystatus, targetmappings) local currenttimestamp = currententrystatus and currententrystatus.timestamp local targettimestamp = lfsattributes (fullname, "modification") if targetentrystatus ~= nil and targetentrystatus.timestamp == targettimestamp then logreport ("log", 3, "db", "Font %q already read.", fullname) return false end targetentrystatus.timestamp = targettimestamp targetentrystatus.index = targetentrystatus.index or { } if currenttimestamp == targettimestamp and not targetentrystatus.index [1] then --- copy old namedata into new for _, currentindex in next, currententrystatus.index do local targetindex = #targetentrystatus.index local fullinfo = currentmappings [currentindex] local location = #targetmappings + 1 targetmappings [location] = fullinfo targetentrystatus.index [targetindex + 1] = location end logreport ("log", 3, "db", "Font %q already indexed.", fullname) return false end return true end local insert_fullinfo = function (fullname, basename, n_font, loader, format, location, targetmappings, targetentrystatus, info) local fullinfo = loader (fullname, n_font, location, basename, format, info) if not fullinfo then return false end local index = targetentrystatus.index [n_font] if not index then index = #targetmappings + 1 end targetmappings [index] = fullinfo targetentrystatus.index [n_font] = index return true end --- we return true if the font is new or re-indexed --- string -> dbobj -> dbobj -> bool local read_font_names = function (fullname, currentnames, targetnames, location) local targetmappings = targetnames.mappings local targetstatus = targetnames.status --- by full path local targetentrystatus = targetstatus [fullname] if targetentrystatus == nil then targetentrystatus = { } targetstatus [fullname] = targetentrystatus end local currentmappings = currentnames.mappings local currentstatus = currentnames.status local currententrystatus = currentstatus [fullname] local basename = filebasename (fullname) local barename = filenameonly (fullname) local entryname = fullname if location == "texmf" then entryname = basename end --- 1) skip if blacklisted if names.blacklist[fullname] or names.blacklist[basename] then logreport ("log", 2, "db", "Ignoring blacklisted font %q.", fullname) return false end --- 2) skip if known with same timestamp if not compare_timestamps (fullname, currentstatus, currententrystatus, currentmappings, targetstatus, targetentrystatus, targetmappings) then return false end --- 3) new font; choose a loader, abort if unknown local format = stringlower (filesuffix (basename)) local loader = loaders [format] --- ot_fullinfo, t1_fullinfo if not loader then logreport ("both", 0, "db", "Unknown format: %q, skipping.", format) return false end --- 4) get basic info, abort if fontloader can’t read it local err, info = read_font_file (fullname) if err == false then logreport ("log", 1, "db", "Failed to read basic information from %q: %q", basename, tostring (info)) return false end --- 5) check for subfonts and process each of them if type (info) == "table" and #info >= 1 then --- ttc local success = false --- true if at least one subfont got read for n_font = 1, #info do if insert_fullinfo (fullname, basename, n_font, loader, format, location, targetmappings, targetentrystatus, info) then success = true end end return success end return insert_fullinfo (fullname, basename, false, loader, format, location, targetmappings, targetentrystatus, info) end local path_normalize do --- os.type and os.name are constants so we --- choose a normalization function in advance --- instead of testing with every call local os_type, os_name = os.type, os.name local filecollapsepath = filecollapsepath local lfsreadlink = lfs.readlink --- windows and dos if os_type == "windows" or os_type == "msdos" then --- ms platfom specific stuff path_normalize = function (path) path = stringgsub(path, '\\', '/') path = stringlower(path) path = filecollapsepath(path) return path end --[[doc-- The special treatment for cygwin was removed with a patch submitted by Ken Brown. Reference: http://cygwin.com/ml/cygwin/2013-05/msg00006.html --doc]]-- else -- posix path_normalize = function (path) local dest = lfsreadlink(path) if dest then if kpsereadable_file(dest) then path = dest elseif kpsereadable_file(filejoin(filedirname(path), dest)) then path = filejoin(file.dirname(path), dest) else -- broken symlink? end end path = filecollapsepath(path) return path end end end local blacklist = { } local p_blacklist --- prefixes of dirs --- string list -> string list local collapse_prefixes = function (lst) --- avoid redundancies in blacklist if #lst < 2 then return lst end tablesort(lst) local cur = lst[1] local result = { cur } for i=2, #lst do local elm = lst[i] if stringsub(elm, 1, #cur) ~= cur then --- different prefix cur = elm result[#result+1] = cur end end return result end --- string list -> string list -> (string, bool) hash_t local create_blacklist = function (blacklist, whitelist) local result = { } local dirs = { } logreport ("info", 2, "db", "Blacklisting %d files and directories.", #blacklist) for i=1, #blacklist do local entry = blacklist[i] if lfsisdir(entry) then dirs[#dirs+1] = entry else result[blacklist[i]] = true end end logreport ("info", 2, "db", "Whitelisting %d files.", #whitelist) for i=1, #whitelist do result[whitelist[i]] = nil end dirs = collapse_prefixes(dirs) --- build the disjunction of the blacklisted directories for i=1, #dirs do local p_dir = P(dirs[i]) if p_blacklist then p_blacklist = p_blacklist + p_dir else p_blacklist = p_dir end end if p_blacklist == nil then --- always return false p_blacklist = Cc(false) end return result end --- unit -> unit read_blacklist = function () local files = { kpselookup ("luaotfload-blacklist.cnf", {all=true, format="tex"}) } local blacklist = { } local whitelist = { } if files and type(files) == "table" then for _, path in next, files do for line in iolines (path) do line = stringstrip(line) -- to get rid of lines like " % foo" local first_chr = stringsub(line, 1, 1) if first_chr == "%" or stringis_empty(line) then -- comment or empty line elseif first_chr == "-" then logreport ("both", 3, "db", "Whitelisted file %q via %q.", line, path) whitelist[#whitelist+1] = stringsub(line, 2, -1) else local cmt = stringfind(line, "%%") if cmt then line = stringsub(line, 1, cmt - 1) end line = stringstrip(line) logreport ("both", 3, "db", "Blacklisted file %q via %q.", line, path) blacklist[#blacklist+1] = line end end end end names.blacklist = create_blacklist(blacklist, whitelist) end local p_font_filter do local extension_pattern = function (list) if type (list) ~= "table" or #list == 0 then return P(-1) end local pat for i=#list, 1, -1 do local e = list[i] if not pat then pat = P(e) else pat = pat + P(e) end end pat = pat * P(-1) return (1 - pat)^1 * pat end --- small helper to adjust the font filter pattern (--formats --- option) local current_formats = { } set_font_filter = function (formats) if not formats or type (formats) ~= "string" then return end if splitcomma == nil then splitcomma = luaotfload.parsers and luaotfload.parsers.splitcomma end if stringsub (formats, 1, 1) == "+" then -- add formats = lpegmatch (splitcomma, stringsub (formats, 2)) if formats then current_formats = tableappend (current_formats, formats) end elseif stringsub (formats, 1, 1) == "-" then -- add formats = lpegmatch (splitcomma, stringsub (formats, 2)) if formats then local newformats = { } for i = 1, #current_formats do local fmt = current_formats[i] local include = true for j = 1, #formats do if current_formats[i] == formats[j] then include = false goto skip end end newformats[#newformats+1] = fmt ::skip:: end current_formats = newformats end else -- set formats = lpegmatch (splitcomma, formats) if formats then current_formats = formats end end p_font_filter = extension_pattern (current_formats) end get_font_filter = function (formats) return tablefastcopy (current_formats) end end local locate_matching_pfb = function (afmfile, dir) local pfbname = filereplacesuffix (afmfile, "pfb") local pfbpath = dir .. "/" .. pfbname if lfsisfile (pfbpath) then return pfbpath end --- Check for match in texmf too return kpsefind_file (pfbname, "type1 fonts") end local process_dir_tree process_dir_tree = function (acc, dirs, done) if not next (dirs) then --- done return acc end local pwd = lfscurrentdir () local dir = dirs[#dirs] dirs[#dirs] = nil if not lfschdir (dir) then --- Cannot cd; skip. return process_dir_tree (acc, dirs, done) end dir = lfscurrentdir () --- resolve symlinks lfschdir (pwd) if tablecontains (done, dir) then --- Already traversed. Note that it’d be unsafe to rely on the --- hash part above due to Lua only processing up to 32 bytes --- of string data. The lookup shouldn’t impact performance too --- much but we could check the performance of alternative data --- structures at some point. return process_dir_tree (acc, dirs, done) end local newfiles = { } local blacklist = names.blacklist for ent in lfsdir (dir) do --- filter right away if ent ~= "." and ent ~= ".." and not blacklist[ent] then local fullpath = dir .. "/" .. ent if lfsisdir (fullpath) and not lpegmatch (p_blacklist, fullpath) then dirs[#dirs+1] = fullpath elseif lfsisfile (fullpath) then ent = stringlower (ent) if lpegmatch (p_font_filter, ent) then newfiles[#newfiles+1] = fullpath if filesuffix (ent) == "afm" then local pfbpath = locate_matching_pfb (ent, dir) if pfbpath then newfiles[#newfiles+1] = pfbpath end else newfiles[#newfiles+1] = fullpath end end end end end done [#done + 1] = dir return process_dir_tree (tableappend (acc, newfiles), dirs, done) end local process_dir = function (dir) local pwd = lfscurrentdir () if lfschdir (dir) then dir = lfscurrentdir () --- resolve symlinks lfschdir (pwd) local files = { } local blacklist = names.blacklist for ent in lfsdir (dir) do if ent ~= "." and ent ~= ".." and not blacklist[ent] then local fullpath = dir .. "/" .. ent if lfsisfile (fullpath) then ent = stringlower (ent) if lpegmatch (p_font_filter, ent) then if filesuffix (ent) == "afm" then local pfbpath = locate_matching_pfb (ent, dir) if pfbpath then files[#files+1] = pfbpath end else files[#files+1] = fullpath end end end end end return files end return { } end --- string -> bool -> string list local find_font_files = function (root, recurse) if lfsisdir (root) then if recurse == true then return process_dir_tree ({}, { root }, {}) else --- kpathsea already delivered the necessary subdirs return process_dir (root) end end end --- truncate_string -- Cut the first part of a string to fit it --- into a given terminal width. The parameter “restrict” (int) --- indicates the number of characters already consumed on the --- line. local truncate_string = function (str, restrict) local tw = config.luaotfload.misc.termwidth local wd = tw - restrict local len = utf8len (str) if wd - len < 0 then --- combined length exceeds terminal, str = ".." .. stringsub(str, len - wd + 2) end return str end --[[doc-- collect_font_filenames_dir -- Traverse the directory root at ``dirname`` looking for font files. Returns a list of {*filename*; *location*} pairs. --doc]]-- --- string -> string -> string * string list local collect_font_filenames_dir = function (dirname, location) if lpegmatch (p_blacklist, dirname) then logreport ("both", 4, "db", "Skipping blacklisted directory %s.", dirname) --- ignore return { } end local found = find_font_files (dirname, location ~= "texmf" and location ~= "local") if not found then logreport ("both", 4, "db", "No such directory: %q; skipping.", dirname) return { } end local nfound = #found local files = { } logreport ("both", 4, "db", "%d font files detected in %s.", nfound, dirname) for j = 1, nfound do local fullname = found[j] files[#files + 1] = { path_normalize (fullname), location } end return files end --- string list -> string list local filter_out_pwd = function (dirs) local result = { } if stripslashes == nil then stripslashes = luaotfload.parsers and luaotfload.parsers.stripslashes end local pwd = path_normalize (lpegmatch (stripslashes, lfscurrentdir ())) for i = 1, #dirs do --- better safe than sorry local dir = path_normalize (lpegmatch (stripslashes, dirs[i])) if dir == "." or dir == pwd then logreport ("both", 3, "db", "Path “%s” matches $PWD (“%s”), skipping.", dir, pwd) else result[#result+1] = dir end end return result end local path_separator = os.type == "windows" and ";" or ":" --[[doc-- collect_font_filenames_texmf -- Scan texmf tree for font files relying on the kpathsea variables $OPENTYPEFONTS and $TTFONTS of texmf.cnf. The current working directory comes as “.” (texlive) or absolute path (miktex) and will always be filtered out. Returns a list of { *filename*; *location* } pairs. --doc]]-- --- unit -> string * string list local collect_font_filenames_texmf = function () local osfontdir = kpseexpand_path "$OSFONTDIR" if stringis_empty (osfontdir) then logreport ("both", 1, "db", "Scanning TEXMF for fonts...") else logreport ("both", 1, "db", "Scanning TEXMF and $OSFONTDIR for fonts...") if log.get_loglevel () > 3 then local osdirs = filesplitpath (osfontdir) logreport ("both", 0, "db", "$OSFONTDIR has %d entries:", #osdirs) for i = 1, #osdirs do logreport ("both", 0, "db", "[%d] %s", i, osdirs[i]) end end end fontdirs = kpseexpand_path "$OPENTYPEFONTS" fontdirs = fontdirs .. path_separator .. kpseexpand_path "$TTFONTS" fontdirs = fontdirs .. path_separator .. kpseexpand_path "$T1FONTS" fontdirs = fontdirs .. path_separator .. kpseexpand_path "$AFMFONTS" if stringis_empty (fontdirs) then return { } end local tasks = filter_out_pwd (filesplitpath (fontdirs)) logreport ("both", 3, "db", "Initiating scan of %d directories.", #tasks) local files = { } for _, dir in next, tasks do files = tableappend (files, collect_font_filenames_dir (dir, "texmf")) end logreport ("both", 3, "db", "Collected %d files.", #files) return files end --- unit -> string list local function get_os_dirs () if os.name == 'macosx' then return { filejoin(kpseexpand_path('~'), "Library/Fonts"), "/Library/Fonts", "/System/Library/Fonts", "/Network/Library/Fonts", } elseif os.type == "windows" or os.type == "msdos" then local windir = osgetenv("WINDIR") return { filejoin(windir, 'Fonts') } else local fonts_conves = { --- plural, much? "/usr/local/etc/fonts/fonts.conf", "/etc/fonts/fonts.conf", } if not luaotfload.parsers then logreport ("log", 0, "db", "Fatal: no fonts.conf parser.") end local os_dirs = luaotfload.parsers.read_fonts_conf(fonts_conves, find_files) return os_dirs end return {} end --[[doc-- count_removed -- Count paths that do not exist in the file system. --doc]]-- --- string list -> size_t local count_removed = function (files) if not files or not files.full then logreport ("log", 4, "db", "Empty file store; no data to work with.") return 0 end local old = files.full logreport ("log", 4, "db", "Checking removed files.") local nrem = 0 local nold = #old for i = 1, nold do local f = old[i] if not kpsereadable_file (f) then logreport ("log", 2, "db", "File %s does not exist in file system.") nrem = nrem + 1 end end return nrem end --[[doc-- retrieve_namedata -- Scan the list of collected fonts and populate the list of namedata. · dirname : name of the directory to scan · currentnames : current font db object · targetnames : font db object to fill · dry_run : don’t touch anything Returns the number of fonts that were actually added to the index. --doc]]-- --- string * string list -> dbobj -> dbobj -> bool? -> int * int local retrieve_namedata = function (files, currentnames, targetnames, dry_run) local nfiles = #files local nnew = 0 logreport ("info", 1, "db", "Scanning %d collected font files ...", nfiles) local bylocation = { texmf = { 0, 0 } , ["local"] = { 0, 0 } , system = { 0, 0 } } report_status_start (2, 4) for i = 1, nfiles do local fullname, location = unpack (files[i]) local count = bylocation[location] count[1] = count[1] + 1 if dry_run == true then local truncated = truncate_string (fullname, 43) logreport ("log", 2, "db", "Would have been loading %s.", fullname) report_status ("term", "db", "Would have been loading %s", truncated) --- skip the read_font_names part else local truncated = truncate_string (fullname, 32) logreport ("log", 2, "db", "Loading font %s.", fullname) report_status ("term", "db", "Loading font %s", truncated) local new = read_font_names (fullname, currentnames, targetnames, location) if new == true then nnew = nnew + 1 count[2] = count[2] + 1 end end end report_status_stop ("term", "db", "Scanned %d files, %d new.", nfiles, nnew) for location, count in next, bylocation do logreport ("term", 4, "db", " * %s: %d files, %d new", location, count[1], count[2]) end return nnew end --- unit -> string * string list local collect_font_filenames_system = function () local n_scanned, n_new = 0, 0 logreport ("info", 1, "db", "Scanning system fonts...") logreport ("info", 2, "db", "Searching in static system directories...") local files = { } for _, dir in next, get_os_dirs () do tableappend (files, collect_font_filenames_dir (dir, "system")) end logreport ("term", 3, "db", "Collected %d files.", #files) return files end --- unit -> bool flush_lookup_cache = function () lookup_cache = { } collectgarbage "collect" return true end --[[doc-- collect_font_filenames_local -- Scan $PWD (during a TeX run) for font files. Side effect: This sets the “local” flag in the subtable “meta” to prevent the merged table from being saved to disk. TODO the local tree could be cached in $PWD. --doc]]-- --- unit -> string * string list local collect_font_filenames_local = function () local pwd = lfscurrentdir () logreport ("both", 1, "db", "Scanning for fonts in $PWD (%q) ...", pwd) local files = collect_font_filenames_dir (pwd, "local") local nfiles = #files if nfiles > 0 then targetnames.meta["local"] = true --- prevent saving to disk logreport ("term", 1, "db", "Found %d files.", pwd) else logreport ("term", 1, "db", "Couldn’t find a thing here. What a waste.", pwd) end logreport ("term", 3, "db", "Collected %d files.", #files) return files end --- fontentry list -> filemap generate_filedata = function (mappings) logreport ("both", 2, "db", "Creating filename map.") local nmappings = #mappings local files = { bare = { ["local"] = { }, system = { }, --- mapped to mapping format -> index in full texmf = { }, --- mapped to mapping format -> “true” }, base = { ["local"] = { }, system = { }, --- mapped to index in “full” texmf = { }, --- set; all values are “true” }, full = { }, --- non-texmf } local base = files.base local bare = files.bare local full = files.full local conflicts = { basenames = 0, barenames = 0, } for index = 1, nmappings do local entry = mappings [index] local filedata = entry.file local format local location local fullpath local basename local barename local subfont if filedata then --- new entry format = entry.format --- otf, afm, ... location = filedata.location --- texmf, system, ... fullpath = filedata.full basename = filedata.base barename = filenameonly (fullpath) subfont = filedata.subfont else format = entry.format --- otf, afm, ... location = entry.location --- texmf, system, ... fullpath = entry.fullpath basename = entry.basename barename = filenameonly (fullpath) subfont = entry.subfont end entry.index = index --- 1) add to basename table local inbase = base [location] --- no format since the suffix is known if inbase then local present = inbase [basename] if present then logreport ("both", 4, "db", "Conflicting basename: %q already indexed \z in category %s, ignoring.", barename, location) conflicts.basenames = conflicts.basenames + 1 --- track conflicts per font local conflictdata = entry.conflicts if not conflictdata then entry.conflicts = { basename = present } else -- some conflicts already detected conflictdata.basename = present end else inbase [basename] = index end else inbase = { basename = index } base [location] = inbase end --- 2) add to barename table local inbare = bare [location] [format] if inbare then local present = inbare [barename] if present then logreport ("both", 4, "db", "Conflicting barename: %q already indexed \z in category %s/%s, ignoring.", barename, location, format) conflicts.barenames = conflicts.barenames + 1 --- track conflicts per font local conflictdata = entry.conflicts if not conflictdata then entry.conflicts = { barename = present } else -- some conflicts already detected conflictdata.barename = present end else inbare [barename] = index end else inbare = { [barename] = index } bare [location] [format] = inbare end --- 3) add to fullpath map full [index] = fullpath end --- mapping traversal return files end local bold_spectrum_low = 501 --- 500 is medium, 900 heavy/black local bold_weight = 700 local normal_width = 5 local pick_style local pick_fallback_style local check_regular do local choose_exact = function (field) --- only clean matches, without guessing if italic_synonym [field] then return "i" end if stringsub (field, 1, 10) == "bolditalic" or stringsub (field, 1, 11) == "boldoblique" then return "bi" end if stringsub (field, 1, 4) == "bold" then return "b" end if stringsub (field, 1, 6) == "italic" then return "i" end return false end pick_style = function (typographicsubfamily, subfamily) local style if typographicsubfamily then style = choose_exact (typographicsubfamily) if style then return style end elseif subfamily then style = choose_exact (subfamily) if style then return style end end return false end pick_fallback_style = function (italicangle, pfmweight, width) --[[-- More aggressive, but only to determine bold faces. Note: Before you make this test more inclusive, ensure no fonts are matched in the bold synonym spectrum over a literally “bold[italic]” one. In the past, heuristics been tried but ultimately caused unwanted modifiers polluting the lookup table. What doesn’t work is, e. g. treating weights > 500 as bold or allowing synonyms like “heavy”, “black”. --]]-- if width == normal_width and pfmweight == bold_weight then --- bold spectrum matches if italicangle == 0 then return "b" end return "bi" end return false end --- we use only exact matches here since there are constructs --- like “regularitalic” (Cabin, Bodoni Old Fashion) check_regular = function (typographicsubfamily, subfamily, italicangle, weight, width, pfmweight) local plausible_weight = false --[[-- This filters out undesirable candidates that specify their typographicsubfamily or subfamily as “regular” but are actually of “semibold” or other weight—another drawback of the oversimplifying classification into only three styles (r, i, b, bi). --]]-- if italicangle == 0 then if pfmweight == 400 then --[[-- Some fonts like Dejavu advertise an undistinguished regular and a “condensed” version with the same weight whilst also providing the style info in the typographic subfamily instead of the subfamily (i. e. the converse of what Adobe’s doing). The only way to weed out the undesired pseudo-regular shape is to peek at its advertised width (4 vs. 5). --]]-- if width then plausible_weight = width == normal_width else plausible_weight = true end elseif weight and regular_synonym [weight] then plausible_weight = true end end if plausible_weight then if subfamily then if regular_synonym [subfamily] then return "r" end elseif typographicsubfamily then if regular_synonym [typographicsubfamily] then return "r" end end end return false end end local pull_values = function (entry) local file = entry.file local names = entry.names local style = entry.style local sanitized = names.sanitized local english = sanitized.english local info = sanitized.info local metadata = sanitized.metadata --- pull file info ... entry.basename = file.base entry.fullpath = file.full entry.location = file.location entry.subfont = file.subfont --- pull name info ... entry.psname = english.psname entry.fontname = info.fontname or metadata.fontname entry.fullname = english.fullname or info.fullname entry.typographicsubfamily = english.typographicsubfamily entry.familyname = metadata.familyname or english.typographicfamily or english.family entry.plainname = names.fullname entry.subfamily = english.subfamily --- pull style info ... entry.italicangle = style.italicangle entry.size = style.size entry.weight = style.weight entry.width = style.width entry.pfmweight = style.pfmweight if config.luaotfload.db.strip == true then entry.file = nil entry.names = nil entry.style = nil end end local add_family = function (name, subtable, modifier, entry) if not name then --- probably borked font return end local familytable = subtable [name] if not familytable then familytable = { } subtable [name] = familytable end familytable [#familytable + 1] = { index = entry.index, modifier = modifier, } end local get_subtable = function (families, entry) local location = entry.location local format = entry.format local subtable = families [location] [format] if not subtable then subtable = { } families [location] [format] = subtable end return subtable end local collect_families = function (mappings) logreport ("info", 2, "db", "Analyzing families.") local families = { ["local"] = { }, system = { }, texmf = { }, } for i = 1, #mappings do local entry = mappings [i] if entry.file then pull_values (entry) end local subtable = get_subtable (families, entry) local familyname = entry.familyname local typographicsubfamily = entry.typographicsubfamily local subfamily = entry.subfamily local weight = entry.weight local width = entry.width local pfmweight = entry.pfmweight local italicangle = entry.italicangle local modifier = pick_style (typographicsubfamily, subfamily) if not modifier then --- regular, exact only modifier = check_regular (typographicsubfamily, subfamily, italicangle, weight, width, pfmweight) end if not modifier then modifier = pick_fallback_style (italicangle, pfmweight, width) end if modifier then add_family (familyname, subtable, modifier, entry) end end collectgarbage "collect" return families end --[[doc-- group_modifiers -- For not-quite-bold faces, determine whether they can fill in for a missing bold face slot in a matching family. Some families like Lucida do not contain real bold / bold italic members. Instead, they have semibold variants at weight 600 which we must add in a separate pass. --doc]]-- local style_categories = { "r", "b", "i", "bi" } local bold_categories = { "b", "bi" } group_modifiers = function (mappings, families) logreport ("info", 2, "db", "Analyzing shapes, weights, and styles.") for location, location_data in next, families do for format, format_data in next, location_data do for familyname, collected in next, format_data do local styledata = { } --- will replace the “collected” table --- First, fill in the ordinary style data that --- fits neatly into the four relevant modifier --- categories. for _, modifier in next, style_categories do local entries for key, info in next, collected do if info.modifier == modifier then if not entries then entries = { } end local index = info.index local entry = mappings [index] local size = entry.size if size then entries [#entries + 1] = { size [1], size [2], size [3], index, } else entries.default = index end collected [key] = nil end styledata [modifier] = entries end end --- At this point the family set may still lack --- entries for bold or bold italic. We will fill --- those in using the modifier with the numeric --- weight that is closest to bold (700). if next (collected) then --- there are uncategorized entries for _, modifier in next, bold_categories do if not styledata [modifier] then local closest local minimum = 2^51 for key, info in next, collected do local info_modifier = tonumber (info.modifier) and "b" or "bi" if modifier == info_modifier then local index = info.index local entry = mappings [index] local weight = entry.pfmweight local diff = weight < 700 and 700 - weight or weight - 700 if diff < minimum then minimum = diff closest = weight end end end if closest then --- We know there is a substitute face for the modifier. --- Now we scan the list again to extract the size data --- in case the shape is available at multiple sizes. local entries = { } for key, info in next, collected do local info_modifier = tonumber (info.modifier) and "b" or "bi" if modifier == info_modifier then local index = info.index local entry = mappings [index] local size = entry.size if entry.pfmweight == closest then if size then entries [#entries + 1] = { size [1], size [2], size [3], index, } else entries.default = index end end end end styledata [modifier] = entries end end end end format_data [familyname] = styledata end end end return families end local cmp_sizes = function (a, b) return a [1] < b [1] end order_design_sizes = function (families) logreport ("info", 2, "db", "Ordering design sizes.") for location, data in next, families do for format, data in next, data do for familyname, data in next, data do for style, data in next, data do tablesort (data, cmp_sizes) end end end end return families end --[[doc-- collect_font_filenames -- Scan the three search path categories for font files. This constitutes the first pass of the update mode. --doc]]-- --- unit -> string * string list local collect_font_filenames = function () logreport ("info", 4, "db", "Scanning the filesystem for font files.") local filenames = { } local bisect = config.luaotfload.misc.bisect local max_fonts = config.luaotfload.db.max_fonts --- XXX revisit for lua 5.3 wrt integers tableappend (filenames, collect_font_filenames_texmf ()) tableappend (filenames, collect_font_filenames_system ()) if config.luaotfload.db.scan_local == true then tableappend (filenames, collect_font_filenames_local ()) end --- Now drop everything above max_fonts. if max_fonts < #filenames then filenames = { unpack (filenames, 1, max_fonts) } end --- And choose the requested slice if in bisect mode. if bisect then return { unpack (filenames, bisect[1], bisect[2]) } end return filenames end --[[doc-- nth_font_file -- Return the filename of the nth font. --doc]]-- --- int -> string local nth_font_filename = function (n) logreport ("info", 4, "db", "Picking font file no. %d.", n) if not p_blacklist then read_blacklist () end local filenames = collect_font_filenames () return filenames[n] and filenames[n][1] or "" end --[[doc-- font_slice -- Return the fonts in the range from lo to hi. --doc]]-- local font_slice = function (lo, hi) logreport ("info", 4, "db", "Retrieving font files nos. %d--%d.", lo, hi) if not p_blacklist then read_blacklist () end local filenames = collect_font_filenames () local result = { } for i = lo, hi do result[#result + 1] = filenames[i][1] end return result end --[[doc count_font_files -- Return the number of files found by collect_font_filenames. This function is exported primarily for use with luaotfload-tool.lua in bisect mode. --doc]]-- --- unit -> int local count_font_files = function () logreport ("info", 4, "db", "Counting font files.") if not p_blacklist then read_blacklist () end return #collect_font_filenames () end --- dbobj -> stats local collect_statistics = function (mappings) local sum_dsnsize, n_dsnsize = 0, 0 local fullname, family, families = { }, { }, { } local subfamily, typographicsubfamily = { }, { } local addtohash = function (hash, item) if item then local times = hash [item] if times then hash [item] = times + 1 else hash [item] = 1 end end end local appendtohash = function (hash, key, value) if key and value then local entry = hash [key] if entry then entry [#entry + 1] = value else hash [key] = { value } end end end local addtoset = function (hash, key, value) if key and value then local set = hash [key] if set then set [value] = true else hash [key] = { [value] = true } end end end local setsize = function (set) local n = 0 for _, _ in next, set do n = n + 1 end return n end local hashsum = function (hash) local n = 0 for _, m in next, hash do n = n + m end return n end for _, entry in next, mappings do local style = entry.style local names = entry.names.sanitized local englishnames = names.english addtohash (fullname, englishnames.fullname) addtohash (family, englishnames.family) addtohash (subfamily, englishnames.subfamily) addtohash (typographicsubfamily, englishnames.typographicsubfamily) addtoset (families, englishnames.family, englishnames.fullname) local sizeinfo = entry.style.size if sizeinfo then sum_dsnsize = sum_dsnsize + sizeinfo [1] n_dsnsize = n_dsnsize + 1 end end --inspect (families) local n_fullname = setsize (fullname) local n_family = setsize (family) if log.get_loglevel () > 1 then local pprint_top = function (hash, n, set) local freqs = { } local items = { } for item, value in next, hash do if set then freq = setsize (value) else freq = value end local ifreq = items [freq] if ifreq then ifreq [#ifreq + 1] = item else items [freq] = { item } freqs [#freqs + 1] = freq end end tablesort (freqs) local from = #freqs local to = from - (n - 1) if to < 1 then to = 1 end for i = from, to, -1 do local freq = freqs [i] local itemlist = items [freq] if type (itemlist) == "table" then itemlist = tableconcat (itemlist, ", ") end logreport ("both", 0, "db", " · %4d × %s.", freq, itemlist) end end logreport ("both", 0, "", "~~~~ font index statistics ~~~~") logreport ("both", 0, "db", " · Collected %d fonts (%d names) in %d families.", #mappings, n_fullname, n_family) pprint_top (families, 4, true) logreport ("both", 0, "db", " · %d different “subfamily” kinds.", setsize (subfamily)) pprint_top (subfamily, 4) logreport ("both", 0, "db", " · %d different “typographicsubfamily” kinds.", setsize (typographicsubfamily)) pprint_top (typographicsubfamily, 4) end local mean_dsnsize = 0 if n_dsnsize > 0 then mean_dsnsize = sum_dsnsize / n_dsnsize end return { mean_dsnsize = mean_dsnsize, names = { fullname = n_fullname, families = n_family, }, -- style = { -- subfamily = subfamily, -- typographicsubfamily = typographicsubfamily, -- }, } end --- force: dictate rebuild from scratch --- dry_dun: don’t write to the db, just scan dirs --- dbobj? -> bool? -> bool? -> dbobj update_names = function (currentnames, force, dry_run) local targetnames local n_new = 0 local n_rem = 0 local conf = config.luaotfload if conf.run.live ~= false and conf.db.update_live == false then logreport ("info", 2, "db", "Skipping database update.") --- skip all db updates return currentnames or name_index end local starttime = osgettimeofday () --[[ The main function, scans everything - “targetnames” is the final table to return - force is whether we rebuild it from scratch or not ]] logreport ("both", 1, "db", "Updating the font names database" .. (force and " forcefully." or ".")) if config.luaotfload.db.skip_read == true then --- the difference to a “dry run” is that we don’t search --- for font files entirely. we also ignore the “force” --- parameter since it concerns only the font files. logreport ("info", 2, "db", "Ignoring font files, reusing old data.") currentnames = load_names (false) targetnames = currentnames else if force then currentnames = initialize_namedata (get_font_filter ()) else if not currentnames or not next (currentnames) then currentnames = load_names (dry_run) end if currentnames.meta.version ~= names.version then logreport ("both", 1, "db", "No font names database or old \z one found; generating new one.") currentnames = initialize_namedata (get_font_filter ()) end end targetnames = initialize_namedata (get_font_filter (), currentnames.meta and currentnames.meta.created) read_blacklist () --- pass 1: Collect the names of all fonts we are going to process. local font_filenames = collect_font_filenames () --- pass 2: read font files (normal case) or reuse information --- present in index n_rem = count_removed (currentnames.files) n_new = retrieve_namedata (font_filenames, currentnames, targetnames, dry_run) logreport ("info", 3, "db", "Found %d font files; %d new, %d stale entries.", #font_filenames, n_new, n_rem) end --- pass 3 (optional): collect some stats about the raw font info if config.luaotfload.misc.statistics == true then targetnames.meta.statistics = collect_statistics (targetnames.mappings) end --- we always generate the file lookup tables because --- non-texmf entries are redirected there and the mapping --- needs to be 100% consistent --- pass 4: build filename table targetnames.files = generate_filedata (targetnames.mappings) --- pass 5: build family lookup table targetnames.families = collect_families (targetnames.mappings) --- pass 6: arrange style and size info targetnames.families = group_modifiers (targetnames.mappings, targetnames.families) --- pass 7: order design size tables targetnames.families = order_design_sizes (targetnames.families) logreport ("info", 3, "db", "Rebuilt in %0.f ms.", 1000 * (osgettimeofday () - starttime)) name_index = targetnames if dry_run ~= true then if n_new + n_rem == 0 then logreport ("info", 2, "db", "No new or removed fonts, skip saving to disk.") else local success, reason = save_names () if not success then logreport ("both", 0, "db", "Failed to save database to disk: %s", reason) end end if flush_lookup_cache () and save_lookups () then logreport ("both", 2, "cache", "Lookup cache emptied.") return targetnames end end return targetnames end --- unit -> bool save_lookups = function ( ) local paths = config.luaotfload.paths local luaname, lucname = paths.lookup_path_lua, paths.lookup_path_luc if fileiswritable (luaname) and fileiswritable (lucname) then tabletofile (luaname, lookup_cache, true) osremove (lucname) caches.compile (lookup_cache, luaname, lucname) --- double check ... if lfsisfile (luaname) and lfsisfile (lucname) then logreport ("both", 3, "cache", "Lookup cache saved.") return true end logreport ("info", 0, "cache", "Could not compile lookup cache.") return false end logreport ("info", 0, "cache", "Lookup cache file not writable.") if not fileiswritable (luaname) then logreport ("info", 0, "cache", "Failed to write %s.", luaname) end if not fileiswritable (lucname) then logreport ("info", 0, "cache", "Failed to write %s.", lucname) end return false end --- save_names() is usually called without the argument --- dbobj? -> bool * string option save_names = function (currentnames) if not currentnames then currentnames = name_index end if not currentnames or type (currentnames) ~= "table" then return false, "invalid names table" elseif currentnames.meta and currentnames.meta["local"] then return false, "table contains local entries" end local paths = config.luaotfload.paths local luaname, lucname = paths.index_path_lua, paths.index_path_luc if fileiswritable (luaname) and fileiswritable (lucname) then osremove (lucname) local gzname = luaname .. ".gz" if config.luaotfload.db.compress then local serialized = tableserialize (currentnames, true) gzipsave (gzname, serialized) caches.compile (currentnames, "", lucname) else tabletofile (luaname, currentnames, true) caches.compile (currentnames, luaname, lucname) end logreport ("info", 2, "db", "Font index saved at ...") local success = false if lfsisfile (luaname) then logreport ("info", 2, "db", "Text: " .. luaname) success = true end if lfsisfile (gzname) then logreport ("info", 2, "db", "Gzip: " .. gzname) success = true end if lfsisfile (lucname) then logreport ("info", 2, "db", "Byte: " .. lucname) success = true end if success then return true else logreport ("info", 0, "db", "Could not compile font index.") return false end end logreport ("info", 0, "db", "Index file not writable") if not fileiswritable (luaname) then logreport ("info", 0, "db", "Failed to write %s.", luaname) end if not fileiswritable (lucname) then logreport ("info", 0, "db", "Failed to write %s.", lucname) end return false end --[[doc-- Below set of functions is modeled after mtx-cache. --doc]]-- --- string -> string -> string list -> string list -> string list -> unit local print_cache = function (category, path, luanames, lucnames, rest) local report_indeed = function (...) logreport ("info", 0, "cache", ...) end report_indeed("Luaotfload cache: %s", category) report_indeed("location: %s", path) report_indeed("[raw] %4i", #luanames) report_indeed("[compiled] %4i", #lucnames) report_indeed("[other] %4i", #rest) report_indeed("[total] %4i", #luanames + #lucnames + #rest) end --- string -> string -> string list -> bool -> bool local purge_from_cache = function (category, path, list, all) logreport ("info", 1, "cache", "Luaotfload cache: %s %s", (all and "erase" or "purge"), category) logreport ("info", 1, "cache", "location: %s", path) local n = 0 for i=1,#list do local filename = list[i] if stringfind(filename,"luatex%-cache") then -- safeguard if all then logreport ("info", 5, "cache", "Removing %s.", filename) osremove(filename) n = n + 1 else local suffix = filesuffix(filename) if suffix == "lua" then local checkname = file.replacesuffix( filename, "lua", "luc") if lfsisfile(checkname) then logreport ("info", 5, "cache", "Removing %s.", filename) osremove(filename) n = n + 1 end end end end end logreport ("info", 1, "cache", "Removed lua files : %i", n) return true end --- string -> string list -> int -> string list -> string list -> string list -> --- (string list * string list * string list * string list) local collect_cache collect_cache = function (path, all, n, luanames, lucnames, rest) if not all then local all = find_files (path) local luanames, lucnames, rest = { }, { }, { } return collect_cache(nil, all, 1, luanames, lucnames, rest) end local filename = all[n] if filename then local suffix = filesuffix(filename) if suffix == "lua" then luanames[#luanames+1] = filename elseif suffix == "luc" then lucnames[#lucnames+1] = filename else rest[#rest+1] = filename end return collect_cache(nil, all, n+1, luanames, lucnames, rest) end return luanames, lucnames, rest, all end local getwritablecachepath = function ( ) --- fonts.handlers.otf doesn’t exist outside a Luatex run, --- so we have to improvise local writable = getwritablepath (config.luaotfload.paths.cache_dir, "") if writable then return writable end end local getreadablecachepaths = function ( ) local readables = caches.getreadablepaths (config.luaotfload.paths.cache_dir) local result = { } if readables then for i=1, #readables do local readable = readables[i] if lfsisdir (readable) then result[#result+1] = readable end end end return result end --- unit -> unit local purge_cache = function ( ) local writable_path = getwritablecachepath () local luanames, lucnames, rest = collect_cache(writable_path) if log.get_loglevel() > 1 then print_cache("writable path", writable_path, luanames, lucnames, rest) end local success = purge_from_cache("writable path", writable_path, luanames, false) return success end --- unit -> unit local erase_cache = function ( ) local writable_path = getwritablecachepath () local luanames, lucnames, rest, all = collect_cache(writable_path) if log.get_loglevel() > 1 then print_cache("writable path", writable_path, luanames, lucnames, rest) end local success = purge_from_cache("writable path", writable_path, all, true) return success end local separator = function ( ) logreport ("info", 0, string.rep("-", 67)) end --- unit -> unit local show_cache = function ( ) local readable_paths = getreadablecachepaths () local writable_path = getwritablecachepath () local luanames, lucnames, rest = collect_cache(writable_path) separator () print_cache ("writable path", writable_path, luanames, lucnames, rest) texio.write_nl"" for i=1,#readable_paths do local readable_path = readable_paths[i] if readable_path ~= writable_path then local luanames, lucnames = collect_cache (readable_path) print_cache ("readable path", readable_path, luanames, lucnames, rest) end end separator() return true end ----------------------------------------------------------------------- --- API assumptions of the fontloader ----------------------------------------------------------------------- --- PHG: we need to investigate these, maybe they’re useful as early --- hooks local ignoredfile = function () return false end local reportmissingbase = function () logreport ("info", 0, "db", --> bug‽ "Font name database not found but expected by fontloader.") fonts.names.reportmissingbase = nil end local reportmissingname = function () logreport ("info", 0, "db", --> bug‽ "Fontloader attempted to lookup name before Luaotfload \z was initialized.") fonts.names.reportmissingname = nil end local getfilename = function (a1, a2) logreport ("info", 6, "db", --> bug‽ "Fontloader looked up font file (%s, %s) before Luaotfload \z was initialized.", tostring(a1), tostring(a2)) return lookup_fullpath (a1, a2) end local resolve = function (name, subfont) logreport ("info", 6, "db", --> bug‽ "Fontloader attempted to resolve name (%s, %s) before \z Luaotfload was initialized.", tostring(name), tostring(subfont)) return lookup_font_name { name = name, sub = subfont } end local api = { ignoredfile = ignoredfile, reportmissingbase = reportmissingbase, reportmissingname = reportmissingname, getfilename = getfilename, resolve = resolve, } ----------------------------------------------------------------------- --- export functionality to the namespace “fonts.names” ----------------------------------------------------------------------- local export = { set_font_filter = set_font_filter, flush_lookup_cache = flush_lookup_cache, save_lookups = save_lookups, load = load_names, access_font_index = access_font_index, data = function () return name_index end, save = save_names, update = update_names, lookup_font_file = lookup_font_file, lookup_font_name = lookup_font_name, lookup_font_name_cached = lookup_font_name_cached, getfilename = lookup_fullpath, lookup_fullpath = lookup_fullpath, read_blacklist = read_blacklist, sanitize_fontname = sanitize_fontname, getmetadata = getmetadata, set_location_precedence = set_location_precedence, count_font_files = count_font_files, nth_font_filename = nth_font_filename, font_slice = font_slice, --- font cache purge_cache = purge_cache, erase_cache = erase_cache, show_cache = show_cache, find_closest = find_closest, --- transitionary use_fontforge = false, } return { init = function () --- the font loader namespace is “fonts”, same as in Context --- we need to put some fallbacks into place for when running --- as a script if not fonts then return false end logreport = luaotfload.log.report local fonts = fonts fonts.names = fonts.names or names fonts.formats = fonts.formats or { } fonts.definers = fonts.definers or { resolvers = { } } names.blacklist = blacklist names.version = 2.9 names.data = nil --- contains the loaded database names.lookups = nil --- contains the lookup cache for sym, ref in next, export do names[sym] = ref end for sym, ref in next, api do names[sym] = names[sym] or ref end return true end } -- vim:tw=71:sw=4:ts=4:expandtab