Download Manual pages More Tools

Welcome to

View Semantics

What?

These tools illustrate ways to further process the results of Treebank Semantics.

The tools are distributed freely.

How?

The tools are all command-line scripts, written with sed, bash, awk, and Python. Other important dependencies are the tregex tool and the Tree module of NLTK for Python.

Acknowledgements

Development is funded by the Japan Society for the Promotion of Science (JSPS).

Feedback

Feedback is extremely welcome. Please email: ajb129 __AT__ hotmail __DOT__ com.



Manual pages

    add_zero(1) - modify parse
    fulltext_to_lu(1) - make lexical units from FrameNet fulltext XML
    fulltext_to_report(1) - return expanded report
    indexed_to_fulltext(1) - make FrameNet fulltext XML from indexed trees
    indexed_to_salsa(1) - transform indexed to TIGER/SALSA XML
    lu_merge(1) - merge FrameNet lexUnit XML
    parse_indexed(1) - creates argument-predicate information
    salsa_to_tiger(1) - change XML format
    tree_number_terminals(1) - add numbers to terminal nodes of a tree
    tree_positions(1) - manipulate "word:height" information for nodes

In the examples, munge-trees by Mark Johnson is used to reformat trees. Any other external tool is noted where it is used.



add_zero(1)add_zero(1)

NAME

add_zero - modify parse

SYNOPSIS

add_zero [OPTIONS]

DESCRIPTION

Filter to modify a parse by adding ZERO as a node to dominate all null elements.

Requires tsurgeon_script to work.

OPTIONS

--word)add WORD to all non-ZERO terminals
--example)show an example
*)show this help message

EXAMPLE

$ cat << EOF | add_zero --word | munge-trees -p
> ( (IP-MAT (NP-SBJ *speaker*)
>           (PP-OB1 (NP (IP-REL (NP-OB1 *T*)
>                               (NP-SBJ *pro*)
>                               (VB 落とし)
>                               (AXD た))
>                       (N お金))
>                   (P-ROLE を))
>           (VB 拾い)
>           (AX まし)
>           (AXD た)
>           (PU 。))
>   (ID 853_textbook_particles;o_page_170;AT68-2;JP))
> EOF
-| ( (IP-MAT (NP-SBJ (ZERO *speaker*))
-|           (PP-OB1 (NP (IP-REL (NP-OB1 (ZERO *T*))
-|                               (NP-SBJ (ZERO *pro*))
-|                               (VB (WORD 落とし))
-|                               (AXD (WORD た)))
-|                       (N (WORD お金)))
-|                   (P-ROLE (WORD を)))
-|           (VB (WORD 拾い))
-|           (AX (WORD まし))
-|           (AXD (WORD た))
-|           (PU (WORD 。)))
-|   (ID 853_textbook_particles;o_page_170;AT68-2;JP))


fulltext_to_lu(1)fulltext_to_lu(1)

NAME

fulltext_to_lu - make lexical units from FrameNet fulltext XML

SYNOPSIS

fulltext_to_lu [OPTIONS]

DESCRIPTION

Filter that transforms FrameNet fulltext XML into shell scripts for creating FrameNet lexUnit XML.

OPTIONS

--example)show an example
*)show this help message

EXAMPLE

$ cat << EOF | fulltext_to_lu
> <?xml version="1.0" encoding="UTF-8" standalone="yes"?>
> <?xml-stylesheet type="text/xsl" href="fullText.xsl"?>
> <fullTextAnnotation xsi:schemaLocation="../schema/fullText.xsd" xmlns="http://framenet.icsi.berkeley.edu" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
>   <header>
>     <corpus description="textbook_kisonihongo" name="textbook_kisonihongo" ID="28">
>       <document description="textbook_kisonihongo" name="textbook_kisonihongo" ID="9819"/>
>     </corpus>
>   </header>
>   <sentence corpID="28" docID="9819" sentNo="1" paragNo="1" aPos="0" ID="1_textbook_kisonihongo">
>     <text>A hoop rolls .</text>
>     <annotationSet cDate="02/10/2017 09:00:00 JST Fri" status="UNANN" ID="5462464">
>       <layer rank="1" name="WSL">
>         <label end="0" start="0" name="NT"/>
>         <label end="13" start="13" name="NT"/>
>       </layer>
>     </annotationSet>
>     <annotationSet cDate="02/10/2017 09:00:00 JST Fri" luID="0" luName="rolls.v" frameID="0" frameName="Unk" status="MANUAL" ID="5462465">
>       <layer rank="1" name="Target">
>         <label end="11" start="7" name="Target"/>
>       </layer>
>       <layer rank="1" name="FE">
>         <label feID="1" bgColor="FF0000" fgColor="FFFFFF" end="5" start="0" name="ARG0"/>
>       </layer>
>       <layer rank="1" name="GF">
>         <label end="5" start="0" name="Ext"/>
>       </layer>
>       <layer rank="1" name="PT">
>         <label end="5" start="0" name="NP-SBJ"/>
>       </layer>
>       <layer rank="1" name="Other"/>
>       <layer rank="1" name="Sent"/>
>       <layer rank="1" name="Noun"/>
>     </annotationSet>
>   </sentence>
> </fullTextAnnotation>
> EOF
-| #!/bin/bash
-| 
-| cat >> rolls.v.xml << EOF
-| <?xml version="1.0" encoding="UTF-8" standalone="yes"?>
-| <?xml-stylesheet type="text/xsl" href="lexUnit.xsl"?>
-| <lexUnit status="FN1_Sent" POS="v" name="rolls" ID="1000" frame="Unk" frameID="0000" totalAnnotated="1" xsi:schemaLocation="../schema/lexUnit.xsd" xmlns="http://framenet.icsi.berkeley.edu" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
-|   <header>
-|     <frame>
-|       <FE fgColor="FFFFFF" bgColor="FF0000" type="ARG0" abbrev="ARG0" name="ARG0"/>
-|     </frame>
-|   </header>
-|   <definition>rolls.v</definition>
-|   <lexeme POS="v" name="rolls"/>
-|   <valences>
-|     <FERealization total="1">
-|       <FE name="ARG0"/>
-|       <pattern total="1">
-|         <valenceUnit GF="Ext" PT="NP-SBJ" FE="ARG0"/>
-|         <annoSet ID="5462465"/>
-|       </pattern>
-|     </FERealization>
-|     <FEGroupRealization total="1">
-|       <FE name="ARG0"/>
-|       <pattern total="1">
-|         <valenceUnit GF="Ext" PT="NP-SBJ" FE="ARG0"/>
-|         <annoSet ID="5462465"/>
-|       </pattern>
-|     </FEGroupRealization>
-|   </valences>
-|   <subCorpus name="1_textbook_kisonihongo">
-|     <sentence sentNo="1" aPos="0" ID="1_textbook_kisonihongo">
-|       <text>A hoop rolls .</text>
-|       <annotationSet cDate="02/10/2017 09:00:00 JST Fri" status="UNANN" ID="5462464">
-|         <layer rank="1" name="WSL">
-|           <label end="0" start="0" name="NT"/>
-|           <label end="13" start="13" name="NT"/>
-|         </layer>
-|       </annotationSet>
-|       <annotationSet cDate="02/10/2017 09:00:00 JST Fri" status="MANUAL" ID="5462465">
-|         <layer rank="1" name="Target">
-|           <label end="11" start="7" name="Target"/>
-|         </layer>
-|         <layer rank="1" name="FE">
-|           <label feID="1" end="5" start="0" name="ARG0"/>
-|         </layer>
-|         <layer rank="1" name="GF">
-|           <label end="5" start="0" name="Ext"/>
-|         </layer>
-|         <layer rank="1" name="PT">
-|           <label end="5" start="0" name="NP-SBJ"/>
-|         </layer>
-|         <layer rank="1" name="Other"/>
-|         <layer rank="1" name="Sent"/>
-|         <layer rank="1" name="Noun"/>
-|       </annotationSet>
-|     </sentence>
-|   </subCorpus>
-| </lexUnit>
-| 
-| EOF
-| 

SEE ALSO

indexed_to_fulltext(1), lu_merge(1)



fulltext_to_report(1)fulltext_to_report(1)

NAME

fulltext_to_report - return expanded report

SYNOPSIS

fulltext_to_report [OPTIONS]

DESCRIPTION

Filter to expand fulltext report.

OPTIONS

--short)determine short fasta output (HTML default)
--fasta|--fst)determine fasta output (HTML default)
--html2)alternative HTML output
--xml)determine XML output (HTML default)
--rtf)determine rtf output (HTML default)
--tnt)determine tnt output (HTML default)
--db)set database
--lang)set language
*)show this help message

SEE ALSO

indexed_to_fulltext(1)



indexed_to_fulltext(1)indexed_to_fulltext(1)

NAME

indexed_to_fulltext - make FrameNet fulltext XML from indexed trees

SYNOPSIS

indexed_to_fulltext [OPTIONS]

DESCRIPTION

Filter that transforms indexed trees into FrameNet fulltext XML.

OPTIONS

--all)calculate all dependencies (notably, treat NPR as N)
--example)show an example
*)show this help message

EXAMPLE

$ cat << EOF | tree_positions --char --index | indexed_to_fulltext
> ( (IP-MAT (NP-SBJ;<ENTITY[1]> (D A) (N hoop)) (VBP;<,ENTITY[1]@ARG0,EVENT[2]@EVENT,> rolls) (PU .)) (ID 1_textbook_kisonihongo;page_13;AT1-1;EN))
> EOF
-| <?xml version="1.0" encoding="UTF-8" standalone="yes"?>
-| <?xml-stylesheet type="text/xsl" href="fullText.xsl"?>
-| <fullTextAnnotation xsi:schemaLocation="../schema/fullText.xsd" xmlns="http://framenet.icsi.berkeley.edu" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
-|   <header>
-|     <corpus description="textbook_kisonihongo" name="textbook_kisonihongo" ID="17305">
-|       <document description="textbook_kisonihongo" name="textbook_kisonihongo" ID="5615"/>
-|     </corpus>
-|   </header>
-|   <sentence corpID="17305" docID="5615" sentNo="1" paragNo="1" aPos="0" ID="1_textbook_kisonihongo">
-|     <text>A hoop rolls .</text>
-|     <annotationSet cDate="05/01/19 08:58:04 JST Wed" status="UNANN" ID="10438">
-|       <layer rank="1" name="WSL">
-|         <label end="0" start="0" name="NT"/>
-|         <label end="13" start="13" name="NT"/>
-|       </layer>
-|     </annotationSet>
-|     <annotationSet cDate="05/01/19 08:58:04 JST Wed" luID="0" luName="rolls.v" frameID="0" frameName="Target" status="MANUAL" ID="10439">
-|       <layer rank="1" name="Target">
-|         <label end="11" start="7" name="Target"/>
-|       </layer>
-|       <layer rank="1" name="FE">
-|         <label feID="1" bgColor="FF0000" fgColor="FFFFFF" end="5" start="0" name="ARG0"/>
-|       </layer>
-|       <layer rank="1" name="GF">
-|         <label end="5" start="0" name="Ext"/>
-|       </layer>
-|       <layer rank="1" name="PT">
-|         <label end="5" start="0" name="NP-SBJ"/>
-|       </layer>
-|       <layer rank="1" name="Other"/>
-|       <layer rank="1" name="Sent"/>
-|       <layer rank="1" name="Noun"/>
-|     </annotationSet>
-|   </sentence>
-| </fullTextAnnotation>

SEE ALSO

fulltext_to_lu(1), fulltext_to_report(1)



indexed_to_salsa(1)indexed_to_salsa(1)

NAME

indexed_to_salsa - transform indexed to TIGER/SALSA XML

SYNOPSIS

indexed_to_salsa [OPTIONS]

DESCRIPTION

Filter to transform indexed view to TIGER/SALSA XML.

OPTIONS

--full)consider all predicates
--addhead)add head to headless output
--headless)go headless
--example)show an example
*)show this help message

EXAMPLE

$ cat << EOF | indexed_to_salsa
> ( (IP-MAT;@1 (PP-SBJ;<2>;@2 (NP;@3 (PRO;@4 それ)) (P-OPTR;@5 は)) (PU;@6 、) (NP-PRD;<7>;@7 (CP-THT;<8>;@8 (CP-QUE;@9 (IP-SUB;@10 (PP-CND;<11>;@11 (IP-ADV;@12 (PP-SBJ;<13>;@13 (NP;@14 (N;@15 人)) (P-ROLE;@16 が)) (VB;<,13@ARG0,EVENT[6]@EVENT,>;@17 死ぬ)) (P-CONN;@18 と)) (NP-SBJ;{,13,};<19>;@19 (ZERO;@20 pro)) (IP-SMC;<21>;@21 (ADVP;@22 (WADV;@23 どう))) (VB;<,21@SMC,19@ARG0,11@と,EVENT[12]@EVENT,>;@24 なる)) (P-FINAL;@25 か)) (P-COMP;@26 という)) (N;<,7@h,8@EMB,>;@27 点)) (AX;<,7@ARG1,2@ARG0,EVENT[13]@EVENT,>;@28 で) (VB2;@29 ある) (PU;@30 。)) (ID 4_book_BCCWJ_PB10_00047;JP))
> EOF
-| <corpus corpusname="book_BCCWJ_PB10_00047" target="">
-|   <head>
-|     <meta>
-|       <name>book_BCCWJ_PB10_00047</name>
-|       <format>TigerXML</format>
-|     </meta>
-|     <frames>
-|       <frame name="4_book_BCCWJ_PB10_00047_17:ID|ARG0::"><element name="ARG0" optional="false"/></frame>
-|       <frame name="4_book_BCCWJ_PB10_00047_24:ID|SMC::|ARG0::|と::"><element name="SMC" optional="false"/><element name="ARG0" optional="false"/><element name="と" optional="false"/></frame>
-|       <frame name="4_book_BCCWJ_PB10_00047_28:ID|ARG1::|ARG0::"><element name="ARG1" optional="false"/><element name="ARG0" optional="false"/></frame>
-|     </frames>
-|     <wordtags>
-|     </wordtags>
-|     <flags>
-|     </flags>
-|     <annotation>
-|       <feature name="word" domain="T">
-|         <value name="pro"/>
-|         <value name="、"/>
-|         <value name="。"/>
-|         <value name="ある"/>
-|         <value name="か"/>
-|         <value name="が"/>
-|         <value name="それ"/>
-|         <value name="で"/>
-|         <value name="と"/>
-|         <value name="という"/>
-|         <value name="どう"/>
-|         <value name="なる"/>
-|         <value name="は"/>
-|         <value name="人"/>
-|         <value name="死ぬ"/>
-|         <value name="点"/>
-|       </feature>
-|       <feature name="pos" domain="T">
-|         <value name="AX">AX</value>
-|         <value name="N">N</value>
-|         <value name="P">P</value>
-|         <value name="PRO">PRO</value>
-|         <value name="PU">PU</value>
-|         <value name="VB">VB</value>
-|         <value name="VB2">VB2</value>
-|         <value name="WADV">WADV</value>
-|         <value name="ZERO">ZERO</value>
-|       </feature>
-|       <feature name="cat" domain="NT">
-|         <value name="ADVP"/>
-|         <value name="CP"/>
-|         <value name="IP"/>
-|         <value name="NP"/>
-|         <value name="PP"/>
-|         <value name="TOP"/>
-|       </feature>
-|       <edgelabel>
-|         <value name="--"/>
-|         <value name="ADV"/>
-|         <value name="CND"/>
-|         <value name="COMP"/>
-|         <value name="CONN"/>
-|         <value name="FINAL"/>
-|         <value name="MAT"/>
-|         <value name="OPTR"/>
-|         <value name="PRD"/>
-|         <value name="QUE"/>
-|         <value name="ROLE"/>
-|         <value name="SBJ"/>
-|         <value name="SMC"/>
-|         <value name="SUB"/>
-|         <value name="THT"/>
-|       </edgelabel>
-|       <secedgelabel>
-|         <value name="old"/>
-|       </secedgelabel>
-|     </annotation>
-|   </head>
-|   <body>
-|     <s id="4_book_BCCWJ_PB10_00047">
-|       <graph root="4_book_BCCWJ_PB10_00047_0">
-|         <terminals>
-|           <t id="4_book_BCCWJ_PB10_00047_4" word="それ" pos="PRO"/>
-|           <t id="4_book_BCCWJ_PB10_00047_5" word="は" pos="P"/>
-|           <t id="4_book_BCCWJ_PB10_00047_6" word="、" pos="PU"/>
-|           <t id="4_book_BCCWJ_PB10_00047_15" word="人" pos="N"/>
-|           <t id="4_book_BCCWJ_PB10_00047_16" word="が" pos="P"/>
-|           <t id="4_book_BCCWJ_PB10_00047_17" word="死ぬ" pos="VB"/>
-|           <t id="4_book_BCCWJ_PB10_00047_18" word="と" pos="P"/>
-|           <t id="4_book_BCCWJ_PB10_00047_20" word="pro" pos="ZERO"/>
-|           <t id="4_book_BCCWJ_PB10_00047_23" word="どう" pos="WADV"/>
-|           <t id="4_book_BCCWJ_PB10_00047_24" word="なる" pos="VB"/>
-|           <t id="4_book_BCCWJ_PB10_00047_25" word="か" pos="P"/>
-|           <t id="4_book_BCCWJ_PB10_00047_26" word="という" pos="P"/>
-|           <t id="4_book_BCCWJ_PB10_00047_27" word="点" pos="N"/>
-|           <t id="4_book_BCCWJ_PB10_00047_28" word="で" pos="AX"/>
-|           <t id="4_book_BCCWJ_PB10_00047_29" word="ある" pos="VB2"/>
-|           <t id="4_book_BCCWJ_PB10_00047_30" word="。" pos="PU"/>
-|         </terminals>
-|         <nonterminals>
-|           <nt id="4_book_BCCWJ_PB10_00047_0" cat="TOP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_1" label="MAT"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_22" cat="ADVP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_23" label="--"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_21" cat="IP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_22" label="--"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_19" cat="NP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_20" label="--"/>
-|             <secedge idref="4_book_BCCWJ_PB10_00047_13" label="old"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_14" cat="NP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_15" label="--"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_13" cat="PP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_14" label="--"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_16" label="ROLE"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_12" cat="IP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_13" label="SBJ"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_17" label="--"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_11" cat="PP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_12" label="ADV"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_18" label="CONN"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_10" cat="IP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_11" label="CND"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_19" label="SBJ"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_21" label="SMC"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_24" label="--"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_9" cat="CP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_10" label="SUB"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_25" label="FINAL"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_8" cat="CP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_9" label="QUE"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_26" label="COMP"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_7" cat="NP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_8" label="THT"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_27" label="--"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_3" cat="NP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_4" label="--"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_2" cat="PP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_3" label="--"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_5" label="OPTR"/>
-|           </nt>
-|           <nt id="4_book_BCCWJ_PB10_00047_1" cat="IP">
-|             <edge idref="4_book_BCCWJ_PB10_00047_2" label="SBJ"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_6" label="--"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_7" label="PRD"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_28" label="--"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_29" label="--"/>
-|             <edge idref="4_book_BCCWJ_PB10_00047_30" label="--"/>
-|           </nt>
-|         </nonterminals>
-|       </graph>
-|       <sem>
-|         <globals>
-|         </globals>
-|         <frames>
-|           <frame name="4_book_BCCWJ_PB10_00047_17:ID|ARG0::"><target>
-|               <fenode idref="4_book_BCCWJ_PB10_00047_17"/>
-|             </target><fe name="ARG0" id="4_book_BCCWJ_PB10_00047_f1_e1">
-|               <fenode idref="4_book_BCCWJ_PB10_00047_13"/>
-|             </fe></frame>
-|           <frame name="4_book_BCCWJ_PB10_00047_24:ID|SMC::|ARG0::|と::"><target>
-|               <fenode idref="4_book_BCCWJ_PB10_00047_24"/>
-|             </target><fe name="SMC" id="4_book_BCCWJ_PB10_00047_f2_e3">
-|               <fenode idref="4_book_BCCWJ_PB10_00047_21"/>
-|             </fe><fe name="ARG0" id="4_book_BCCWJ_PB10_00047_f2_e1">
-|               <fenode idref="4_book_BCCWJ_PB10_00047_19"/>
-|             </fe><fe name="と" id="4_book_BCCWJ_PB10_00047_f2_e4">
-|               <fenode idref="4_book_BCCWJ_PB10_00047_11"/>
-|             </fe></frame>
-|           <frame name="4_book_BCCWJ_PB10_00047_28:ID|ARG1::|ARG0::"><target>
-|               <fenode idref="4_book_BCCWJ_PB10_00047_28"/>
-|             </target><fe name="ARG1" id="4_book_BCCWJ_PB10_00047_f3_e2">
-|               <fenode idref="4_book_BCCWJ_PB10_00047_7"/>
-|             </fe><fe name="ARG0" id="4_book_BCCWJ_PB10_00047_f3_e1">
-|               <fenode idref="4_book_BCCWJ_PB10_00047_2"/>
-|             </fe></frame>
-|         </frames>
-|         <usp>
-|           <uspframes>
-|           </uspframes>
-|           <uspfes>
-|           </uspfes>
-|         </usp>
-|         <wordtags>
-|         </wordtags>
-|       </sem>
-|     </s>
-|   </body>
-| </corpus>

SEE ALSO

salsa_to_tiger(1)


lu_merge(1)lu_merge(1)

NAME

lu_merge - merge FrameNet lexUnit XML

SYNOPSIS

lu_merge [OPTIONS]

DESCRIPTION

Filter to merge FrameNet lexUnit XML.

OPTIONS

*)show this help message

SEE ALSO

fulltext_to_lu(1)



parse_indexed(1)parse_indexed(1)

NAME

parse_indexed - creates argument-predicate information

SYNOPSIS

parse_indexed [OPTIONS]

DESCRIPTION

Takes a parsed tree from stdin and outputs the same tree, but with argument and predicate information calculated.

OPTIONS

--iml)add CONJP IML layers
--word)include WORD and ZERO layers
--single)single tree rather than discourse output
--salsa)TIGER/SALSA support
--coindex)Coindexation
--frame*)Framenet support
--clean)remove argument roles and event
--debug)keep tree and sed information for debugging
*)show this help message


salsa_to_tiger(1)salsa_to_tiger(1)

NAME

salsa_to_tiger - change XML format

SYNOPSIS

salsa_to_tiger [OPTIONS]

DESCRIPTION

Filter that takes TIGER/SALSA XML input and returns TIGER XML output.

OPTIONS

*)show this help message

SEE ALSO

indexed_to_salsa(1)



tree_number_terminals(1)tree_number_terminals(1)

NAME

tree_number_terminals - add numbers to terminal nodes of a tree

SYNOPSIS

tree_number_terminals

DESCRIPTION

Filter to add numbers to terminal nodes of a tree.

Requires tsurgeon_script(1) and Python with NLTK to work.

OPTIONS

--all)number all terminals
--copy)copy numbering to restore the lost matching
--sent)include sentence number
--example)show an example
*)show this help message

EXAMPLE

$ cat << EOF | tree_number_terminals --copy
> ( (CP-FINAL (IP-SUB (PP *ICH*-1)
>                     (NP-SBJ *が*)
>                     (IP-ADV (VB 来)
>                             (AXD た))
>                     (CONJ *)
>                     (PU 、)
>                     (VB 来)
>                     (AXD た))
>             (PU 、)
>             (PP-1 (NP (N バス))
>                   (P が))
>             (PU 。))
>   (ID 990_textbook_kisonihongo;page_173;AT91-4;JP))
> EOF
-| ( (CP-FINAL (IP-SUB (PP *ICH*-1)
-|                     (NP-SBJ *が_0010*)
-|                     (IP-ADV (VB 来_0002)
-|                             (AXD た_0003))
-|                     (CONJ *)
-|                     (PU 、)
-|                     (VB 来_0006)
-|                     (AXD た_0007))
-|             (PU 、)
-|             (PP-1 (NP (N バス_0009))
-|                   (P が_0010))
-|             (PU 。))
-|   (ID 990_textbook_kisonihongo;page_173;AT91-4;JP))


tree_positions(1)tree_positions(1)

NAME

tree_positions - manipulate "word:height" information for nodes

SYNOPSIS

tree_positions [OPTIONS]

DESCRIPTION

Filter that, by default, adds "word:height" information (following PropBank), which specifies the token number of the first word and the number of levels to go up in the tree to find the appropriate node.

Requires Python with the NLTK library (http://www.nltk.org) to work.

OPTIONS

--word*|--height*)give word-height positions
--seq*)give sequential depth-first order positions
--rlc*)give sequential depth-first order without numbered pre-terminals
--char*)give character positions (default)
--remove|--clean)remove rather than add "word:height" information
--index*)change indexing information
--debug)debug indexing
--example)show an example
*)show this help message

EXAMPLE

$ cat << EOF | tree_positions | munge-trees -p
> (IP-MAT (NP-SBJ (D The)
>                 (N gostak))
>         (VP (VBP distims)
>             (NP-OB1 (D the)
>                     (N doshes)))
>         (. .))
> EOF
-| (IP-MAT (NP-SBJ;@0:9 (D;@0:2 The)
-|                      (N;@4:9 gostak))
-|         (VP;@11:28 (VBP;@0:6 distims)
-|                    (NP-OB1;@8:17 (D;@8:10 the)
-|                                  (N;@12:17 doshes)))
-|         (.;@30:30 .))


Last updated: May 01, 2019