#!/usr/bin/env ruby
# frozen_string_literal: true

# sentencepiece-decode
#
# Filter: reads lines of whitespace-separated pieces from standard input and
# writes one decoded line per input line to standard output.
#
# Provenance: commit 4bb4c4b4e35d00a4a8e96a3f1de4301f481b9cc6
# ("sentencepiece-decode"), Patrick Simianer, Wed, 19 Feb 2020 15:16:50 +0000.

# NOTE(review): nothing below refers to zipf by name; the require is kept
# because the gem may have load-time effects that are not visible from this
# file -- confirm before removing.
require 'zipf'

# Read input as UTF-8 regardless of the locale. The marker character below is
# multi-byte, and under a non-UTF-8 locale (e.g. LANG=C) lines containing
# non-ASCII bytes can raise an encoding error when matched against it.
$stdin.set_encoding(Encoding::UTF_8)

# Decodes one line of pieces.
#
# All whitespace between pieces (including the trailing newline) is dropped,
# gluing the pieces together, and every "▁" (U+2581) is then replaced by a
# single space. A line whose first piece starts with "▁" therefore comes out
# with a leading space; that space is deliberately left in place so the
# output stays identical to what this script has always produced.
#
# @param line [String] one input line of whitespace-separated pieces
# @return [String] the decoded text, without a trailing newline
def sentencepiece_decode(line)
  line.split.join.tr('▁', ' ')
end

$stdin.each_line { |line| puts sentencepiece_decode(line) }