From 6cafb943db279faa4fc0ddb400ad1326d129c5e6 Mon Sep 17 00:00:00 2001 From: Patrick Simianer Date: Fri, 11 Dec 2015 16:22:17 +0100 Subject: derivation_to_json: further cleanup --- derivation_to_json/example.0.json | 156 +++++++++++++++++++++++++ derivation_to_json/example.0.output | 2 + derivation_to_json/example.0.raw | 10 ++ derivation_to_json/example.1.json | 220 ++++++++++++++++++++++++++++++++++++ derivation_to_json/example.1.output | 2 + derivation_to_json/example.1.raw | 13 +++ 6 files changed, 403 insertions(+) create mode 100644 derivation_to_json/example.0.json create mode 100644 derivation_to_json/example.0.output create mode 100644 derivation_to_json/example.0.raw create mode 100644 derivation_to_json/example.1.json create mode 100644 derivation_to_json/example.1.output create mode 100644 derivation_to_json/example.1.raw diff --git a/derivation_to_json/example.0.json b/derivation_to_json/example.0.json new file mode 100644 index 0000000..cd69cde --- /dev/null +++ b/derivation_to_json/example.0.json @@ -0,0 +1,156 @@ +{ + "source_groups" : [ + "die", + "neuerung", + "bezieht sich auf gassensoren", + "auf basis von", + "metalloxid @-@ halbleitern ,", + "die sehr", + "empfindlich und wenig temperaturabhängig", + "sind ." + ], + "span_info" : { + "8" : [ + [ + 15, + 19 + ], + [] + ], + "6" : [ + [ + 1, + 2 + ], + [] + ], + "4" : [ + [ + 0, + 9 + ], + [ + [ + 1, + 6 + ] + ] + ], + "1" : [ + [ + 0, + 21 + ], + [] + ], + "3" : [ + [ + 0, + 13 + ], + [ + [ + 0, + 9 + ] + ] + ], + "7" : [ + [ + 13, + 21 + ], + [ + [ + 15, + 19 + ] + ] + ], + "5" : [ + [ + 1, + 6 + ], + [ + [ + 1, + 2 + ] + ] + ] + }, + "source_rgroups" : [ + 4, + 6, + 5, + 4, + 3, + 7, + 8, + 7 + ], + "phrase_alignment" : [ + [ + 0 + ], + [ + 1 + ], + [ + 2 + ], + [ + 3 + ], + [ + 4 + ], + [ + 5 + ], + [ + 6 + ], + [ + 7 + ] + ], + "target_rgroups" : [ + 4, + 6, + 5, + 4, + 3, + 7, + 8, + 7 + ], + "target_groups" : [ + "the", + "invention", + "relates to gas sensors", + "which are based on metal", + "@-@ oxide semiconductors and which", + "are very", + "sensitive and not appreciably temperature @-@ dependent", + "." + ], + "rules_by_span_id" : { + "8" : "[X] ||| empfindlich und wenig temperaturabhängig ||| sensitive and not appreciably temperature @-@ dependent ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=6.5059 MaxLexFgivenE=1.51642 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-0 1-1 2-3 3-3 3-4 3-6", + "6" : "[X] ||| neuerung ||| invention ||| ForceRule=1 ||| 0-0", + "4" : "[X] ||| die [X] auf basis von ||| the [1] which are based on metal ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=5.95916 MaxLexFgivenE=3.2265 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-0 2-4 3-4 3-5 4-6", + "3" : "[X] ||| [X] metalloxid @-@ halbleitern , ||| [1] @-@ oxide semiconductors and which ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=3.79715 MaxLexFgivenE=2.26688 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 1-2 2-1 3-3 4-5", + "7" : "[X] ||| die sehr [X] sind . ||| are very [1] . ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=0.456219 MaxLexFgivenE=2.16613 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-0 1-1 3-3 4-3", + "5" : "[X] ||| [X] bezieht sich auf gassensoren ||| [1] relates to gas sensors ||| IsSupportedOnline=0 IsSingletonFE=0 IsSingletonF=0 MaxLexEgivenF=1.45124 MaxLexFgivenE=2.73473 CountEF=0.477121 SampleCountF=0.477121 EgivenFCoherent=-0 ||| 1-1 1-2 2-1 4-3 4-4" + }, + "span2id" : { + "[0, 21]" : 1, + "[1, 2]" : 6, + "[0, 9]" : 4, + "[0, 13]" : 3, + "[15, 19]" : 8, + "[13, 21]" : 7, + "[1, 6]" : 5 + } +} diff --git a/derivation_to_json/example.0.output b/derivation_to_json/example.0.output new file mode 100644 index 0000000..440964b --- /dev/null +++ b/derivation_to_json/example.0.output @@ -0,0 +1,2 @@ +die neuerung bezieht sich auf gassensoren auf basis von metalloxid @-@ halbleitern , die sehr empfindlich und wenig temperaturabhängig sind . +the invention relates to gas sensors which are based on metal @-@ oxide semiconductors and which are very sensitive and not appreciably temperature @-@ dependent . diff --git a/derivation_to_json/example.0.raw b/derivation_to_json/example.0.raw new file mode 100644 index 0000000..7fed320 --- /dev/null +++ b/derivation_to_json/example.0.raw @@ -0,0 +1,10 @@ +({<0,21> [Goal] ||| [S] ||| [1]}({<0,21> [S] ||| [S] [X] ||| [1] [2]}({<0,13> [S] ||| [X] ||| [1]}({<0,13> [X] ||| [X] metalloxid @-@ halbleitern , ||| [1] @-@ oxide semiconductors and which}({<0,9> [X] ||| die [X] auf basis von ||| the [1] which are based on metal}({<1,6> [X] ||| [X] bezieht sich auf gassensoren ||| [1] relates to gas sensors}({<1,2> [X] ||| neuerung ||| invention}) ) ) ) ) ({<13,21> [X] ||| die sehr [X] sind . ||| are very [1] .}({<15,19> [X] ||| empfindlich und wenig temperaturabhängig ||| sensitive and not appreciably temperature @-@ dependent}) ) ) ) +[X] ||| neuerung ||| invention ||| ForceRule=1 ||| 0-0 +[X] ||| [X] bezieht sich auf gassensoren ||| [1] relates to gas sensors ||| IsSupportedOnline=0 IsSingletonFE=0 IsSingletonF=0 MaxLexEgivenF=1.45124 MaxLexFgivenE=2.73473 CountEF=0.477121 SampleCountF=0.477121 EgivenFCoherent=-0 ||| 1-1 1-2 2-1 4-3 4-4 +[X] ||| die [X] auf basis von ||| the [1] which are based on metal ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=5.95916 MaxLexFgivenE=3.2265 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-0 2-4 3-4 3-5 4-6 +[X] ||| [X] metalloxid @-@ halbleitern , ||| [1] @-@ oxide semiconductors and which ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=3.79715 MaxLexFgivenE=2.26688 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 1-2 2-1 3-3 4-5 +[S] ||| [X] ||| [1] +[X] ||| empfindlich und wenig temperaturabhängig ||| sensitive and not appreciably temperature @-@ dependent ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=6.5059 MaxLexFgivenE=1.51642 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-0 1-1 2-3 3-3 3-4 3-6 +[X] ||| die sehr [X] sind . ||| are very [1] . ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=0.456219 MaxLexFgivenE=2.16613 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-0 1-1 3-3 4-3 +[S] ||| [S] [X] ||| [1] [2] ||| Glue=1 +[Goal] ||| [S] ||| [1] diff --git a/derivation_to_json/example.1.json b/derivation_to_json/example.1.json new file mode 100644 index 0000000..b395061 --- /dev/null +++ b/derivation_to_json/example.1.json @@ -0,0 +1,220 @@ +{ + "source_groups" : [ + "in einer", + "favorisierten", + "ausführung", + "dient einer", + "der schwenkbolzen ( 8 )", + "zugleich", + "als messbolzen ,", + "indem", + "an ihm dehnungsmess @-@ streifen", + "( 12", + ") angebracht sind ." + ], + "span_info" : { + "6" : [ + [ + 4, + 11 + ], + [ + [ + 6, + 11 + ] + ] + ], + "11" : [ + [ + 16, + 21 + ], + [] + ], + "3" : [ + [ + 0, + 12 + ], + [ + [ + 2, + 12 + ] + ] + ], + "7" : [ + [ + 6, + 11 + ], + [] + ], + "9" : [ + [ + 12, + 23 + ], + [ + [ + 12, + 15 + ], + [ + 16, + 21 + ] + ] + ], + "8" : [ + [ + 12, + 27 + ], + [ + [ + 12, + 23 + ] + ] + ], + "1" : [ + [ + 0, + 27 + ], + [] + ], + "4" : [ + [ + 2, + 12 + ], + [ + [ + 2, + 3 + ], + [ + 4, + 11 + ] + ] + ], + "10" : [ + [ + 12, + 15 + ], + [] + ], + "5" : [ + [ + 2, + 3 + ], + [] + ] + }, + "source_rgroups" : [ + 3, + 5, + 4, + 6, + 7, + 4, + 10, + 9, + 11, + 9, + 8 + ], + "phrase_alignment" : [ + [ + 0 + ], + [ + 1 + ], + [ + 5 + ], + [ + 2, + 4 + ], + [ + 3 + ], + [ + 5 + ], + [ + 6 + ], + [ + 7, + 9 + ], + [ + 8 + ], + [ + 9, + 7 + ], + [ + 10 + ] + ], + "target_rgroups" : [ + 3, + 5, + 6, + 7, + 6, + 4, + 10, + 9, + 11, + 9, + 8 + ], + "target_groups" : [ + "in a", + "fuck that", + "of", + "the hinge bolts ( 8 )", + "is used", + "at the", + "time as", + "a measuring bolt ,", + "by having strain gauge strips", + "( 12", + ") attached to it ." + ], + "rules_by_span_id" : { + "6" : "[X] ||| dient einer [X] ||| of [1] is used ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=2.51875 MaxLexFgivenE=3.28665 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-2 0-3 1-0", + "11" : "[X] ||| an ihm dehnungsmess @-@ streifen ||| by having strain gauge strips ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=7.23159 MaxLexFgivenE=6.6978 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-4 2-2 3-0 4-3", + "3" : "[X] ||| in einer [X] ||| in a [1] ||| IsSupportedOnline=0 IsSingletonFE=0 IsSingletonF=0 MaxLexEgivenF=0.605196 MaxLexFgivenE=1.51196 CountEF=0.69897 SampleCountF=1.63347 EgivenFCoherent=1.02119 ||| 0-0 1-1", + "7" : "[X] ||| der schwenkbolzen ( 8 ) ||| the hinge bolts ( 8 ) ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=4.2972 MaxLexFgivenE=3.01678 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-0 1-2 2-1 2-3 2-5 3-4 4-5", + "9" : "[X] ||| [X] indem [X] ( 12 ||| [1] a measuring bolt , [2] ( 12 ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=10.3295 MaxLexFgivenE=3.69621 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 3-6 4-7", + "8" : "[X] ||| [X] ) angebracht sind . ||| [1] ) attached to it . ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=5.52044 MaxLexFgivenE=3.17712 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 1-1 2-2 3-3 4-5", + "4" : "[X] ||| [X] ausführung [X] zugleich ||| [1] [2] at the ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=2.87767 MaxLexFgivenE=7.30184 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 3-3", + "10" : "[X] ||| als messbolzen , ||| time as ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=0.328333 MaxLexFgivenE=2.60944 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-1 1-0 2-0", + "5" : "[X] ||| favorisierten ||| fuck that ||| ForceRule=1 ||| 0-0 0-1" + }, + "span2id" : { + "[4, 11]" : 6, + "[16, 21]" : 11, + "[12, 15]" : 10, + "[0, 27]" : 1, + "[12, 23]" : 9, + "[0, 12]" : 3, + "[12, 27]" : 8, + "[2, 3]" : 5, + "[2, 12]" : 4, + "[6, 11]" : 7 + } +} diff --git a/derivation_to_json/example.1.output b/derivation_to_json/example.1.output new file mode 100644 index 0000000..544b448 --- /dev/null +++ b/derivation_to_json/example.1.output @@ -0,0 +1,2 @@ +in einer favorisierten ausführung dient einer der schwenkbolzen ( 8 ) zugleich als messbolzen , indem an ihm dehnungsmess @-@ streifen ( 12 ) angebracht sind . +in a fuck that of the hinge bolts ( 8 ) is used at the time as a measuring bolt , by having strain gauge strips ( 12 ) attached to it . diff --git a/derivation_to_json/example.1.raw b/derivation_to_json/example.1.raw new file mode 100644 index 0000000..66a5743 --- /dev/null +++ b/derivation_to_json/example.1.raw @@ -0,0 +1,13 @@ +({<0,27> [Goal] ||| [S] ||| [1]}({<0,27> [S] ||| [S] [X] ||| [1] [2]}({<0,12> [S] ||| [X] ||| [1]}({<0,12> [X] ||| in einer [X] ||| in a [1]}({<2,12> [X] ||| [X] ausführung [X] zugleich ||| [1] [2] at the}({<2,3> [X] ||| favorisierten ||| fuck that}) ({<4,11> [X] ||| dient einer [X] ||| of [1] is used}({<6,11> [X] ||| der schwenkbolzen ( 8 ) ||| the hinge bolts ( 8 )}) ) ) ) ) ({<12,27> [X] ||| [X] ) angebracht sind . ||| [1] ) attached to it .}({<12,23> [X] ||| [X] indem [X] ( 12 ||| [1] a measuring bolt , [2] ( 12}({<12,15> [X] ||| als messbolzen , ||| time as}) ({<16,21> [X] ||| an ihm dehnungsmess @-@ streifen ||| by having strain gauge strips}) ) ) ) ) +[X] ||| favorisierten ||| fuck that ||| ForceRule=1 ||| 0-0 0-1 +[X] ||| der schwenkbolzen ( 8 ) ||| the hinge bolts ( 8 ) ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=4.2972 MaxLexFgivenE=3.01678 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-0 1-2 2-1 2-3 2-5 3-4 4-5 +[X] ||| dient einer [X] ||| of [1] is used ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=2.51875 MaxLexFgivenE=3.28665 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-2 0-3 1-0 +[X] ||| [X] ausführung [X] zugleich ||| [1] [2] at the ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=2.87767 MaxLexFgivenE=7.30184 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 3-3 +[X] ||| in einer [X] ||| in a [1] ||| IsSupportedOnline=0 IsSingletonFE=0 IsSingletonF=0 MaxLexEgivenF=0.605196 MaxLexFgivenE=1.51196 CountEF=0.69897 SampleCountF=1.63347 EgivenFCoherent=1.02119 ||| 0-0 1-1 +[S] ||| [X] ||| [1] +[X] ||| als messbolzen , ||| time as ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=0.328333 MaxLexFgivenE=2.60944 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-1 1-0 2-0 +[X] ||| an ihm dehnungsmess @-@ streifen ||| by having strain gauge strips ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=7.23159 MaxLexFgivenE=6.6978 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 0-4 2-2 3-0 4-3 +[X] ||| [X] indem [X] ( 12 ||| [1] a measuring bolt , [2] ( 12 ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=10.3295 MaxLexFgivenE=3.69621 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 3-6 4-7 +[X] ||| [X] ) angebracht sind . ||| [1] ) attached to it . ||| IsSupportedOnline=0 IsSingletonFE=1 IsSingletonF=1 MaxLexEgivenF=5.52044 MaxLexFgivenE=3.17712 CountEF=0.30103 SampleCountF=0.30103 EgivenFCoherent=-0 ||| 1-1 2-2 3-3 4-5 +[S] ||| [S] [X] ||| [1] [2] ||| Glue=1 +[Goal] ||| [S] ||| [1] -- cgit v1.2.3