blob: f1f7e86b1d1fd78821c671c0e27a9d60bbdf6fe2 [file] [log] [blame]
# liblouis Braille Translation and Back-Translation Library
#
# Copyright (C) 2017 Bert Frees
#
# This file is part of liblouis.
#
# liblouis is free software: you can redistribute it and/or modify it
# under the terms of the GNU Lesser General Public License as published
# by the Free Software Foundation, either version 2.1 of the License, or
# (at your option) any later version.
#
# liblouis is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public
# License along with liblouis. If not, see <http://www.gnu.org/licenses/>.
#
import argparse
from utils import *
def main():
parser = argparse.ArgumentParser(description="Export chunked words in patgen format.")
parser.add_argument('-d', '--dictionary', required=True, dest="DICTIONARY",
help="dictionary file")
parser.add_argument('-t', '--table', required=True, dest="TABLE",
help="translation table, possibly including hyphenation patterns to be used for showing the good and bad hyphens found")
args = parser.parse_args()
conn, c = open_dictionary(args.DICTIONARY)
c.execute("SELECT text,braille FROM dictionary WHERE braille IS NOT NULL")
load_table(args.TABLE)
hyphenation_enabled = liblouis.hyphenationEnabled()
for text, braille in c.fetchall():
# ignore long words for now
if len(text) > 48:
printerrln('WARNING: word is too long to be processed, may be translated incorrectly: %s' % text)
continue
if not is_letter(text):
printerrln('WARNING: word has non-letters: %s' % text)
continue
suggested_hyphen_string = suggest_chunks(text, braille)
if suggested_hyphen_string:
if hyphenation_enabled:
actual_hyphen_string = hyphenate(text)
else:
actual_hyphen_string = "".join(["0" * (len(text) - 1)])
println(my_zip(text,
# * = correct hyphen
# - = missed hyphen
# . = bad hyphen
# .0 = optional hyphen present
# 0 = optional hyphen not present
map(lambda e, a: ".0" if e == "x" and a == "1" else
"0" if e == "x" else
"*" if e == "1" and a == "1" else
"-" if e == "1" else
"." if a == "1" else None,
suggested_hyphen_string, actual_hyphen_string)))
conn.close()
if __name__ == "__main__": main()