#!/usr/bin/env python3
"""Convert a line-aligned bitext (two parallel text files) to TMX on stdout.

Usage: bitext2tmx SOURCE.LANG TARGET.LANG

Line *i* of SOURCE is paired with line *i* of TARGET.  The language code of
each side is whatever follows the last "." in its file name (for example
``corpus.en`` -> ``en``).

Provenance: script added as ``bitext2tmx`` in commit
b31ace79ea5f6b3f279c544cd3a443d6fbf2a24d ("overhaul", Patrick Simianer,
2026-02-26).

NOTE(review): in the copy this was rebuilt from, the string literals held
no element markup at all (it appears to have been stripped during
extraction), and the computed language codes were never used.  The TMX
skeleton below is reconstructed from the TMX 1.4b specification -- confirm
the header attribute values against the original script.
"""

import sys
from itertools import zip_longest
from xml.sax.saxutils import escape, quoteattr


def lang_from_path(path):
    """Return the text after the last "." in *path* (all of it if no ".")."""
    return path.split(".")[-1]


def pair_lines(src_lines, tgt_lines):
    """Yield ``(source, target)`` pairs with the trailing newline removed.

    Both arguments are iterables of lines (open text files work), consumed
    lazily so large corpora are never held in memory at once.

    Pairing stops at the end of the shorter side, as a plain ``zip`` would,
    but a warning is written to stderr so that a length mismatch -- which
    usually means the two files are not properly aligned -- does not pass
    unnoticed.
    """
    numbered = enumerate(zip_longest(src_lines, tgt_lines), start=1)
    for number, (src_line, tgt_line) in numbered:
        # Lines read from a file are never None, so None can only be the
        # zip_longest fill value marking an exhausted side.
        if src_line is None or tgt_line is None:
            shorter = "source" if src_line is None else "target"
            print(
                f"bitext2tmx: warning: {shorter} side ended before line "
                f"{number}; remaining lines of the other side are ignored",
                file=sys.stderr,
            )
            return
        yield src_line.rstrip("\n"), tgt_line.rstrip("\n")


def iter_tmx(pairs, src_lang, tgt_lang):
    """Yield the chunks of a TMX document holding one ``<tu>`` per pair.

    *pairs* is an iterable of ``(source_text, target_text)`` tuples.
    Segment text is XML-escaped; the language codes are emitted as quoted
    attribute values because they come from file names and may contain
    characters that are special in XML.
    """
    src_attr = quoteattr(src_lang)
    tgt_attr = quoteattr(tgt_lang)

    yield '<?xml version="1.0" encoding="UTF-8"?>\n'
    yield '<tmx version="1.4">\n'
    # The attributes below are the ones TMX 1.4b marks as required on
    # <header>; their values are placeholders chosen for plain-text input.
    yield (
        '  <header creationtool="bitext2tmx" creationtoolversion="1.0"'
        ' segtype="sentence" o-tmf="bitext" adminlang="en"'
        f' srclang={src_attr} datatype="plaintext"/>\n'
    )
    yield "  <body>\n"
    for src_text, tgt_text in pairs:
        yield (
            "    <tu>\n"
            f"      <tuv xml:lang={src_attr}>\n"
            f"        <seg>{escape(src_text)}</seg>\n"
            "      </tuv>\n"
            f"      <tuv xml:lang={tgt_attr}>\n"
            f"        <seg>{escape(tgt_text)}</seg>\n"
            "      </tuv>\n"
            "    </tu>\n"
        )
    yield "  </body>\n"
    yield "</tmx>\n"


def main(argv=None):
    """Run the converter; return the process exit status.

    *argv* defaults to ``sys.argv`` and must hold the program name followed
    by the source and target file paths.
    """
    argv = sys.argv if argv is None else argv
    if len(argv) != 3:
        program = argv[0] if argv else "bitext2tmx"
        print(f"usage: {program} SOURCE.LANG TARGET.LANG", file=sys.stderr)
        return 2

    src_path, tgt_path = argv[1], argv[2]

    # The XML declaration promises UTF-8, so make stdout honour it where the
    # stream supports reconfiguration (a real TextIOWrapper does).
    if hasattr(sys.stdout, "reconfigure"):
        sys.stdout.reconfigure(encoding="utf-8")

    with open(src_path, "r", encoding="utf-8") as src_file, \
            open(tgt_path, "r", encoding="utf-8") as tgt_file:
        sys.stdout.writelines(
            iter_tmx(
                pair_lines(src_file, tgt_file),
                lang_from_path(src_path),
                lang_from_path(tgt_path),
            )
        )
    return 0


if __name__ == "__main__":
    sys.exit(main())