PMLTQ-PML2BASE

 view release on metacpan or  search on metacpan

lib/PMLTQ/PML2BASE.pm  view on Meta::CPAN

                               # a given root node belongs to the top-level tree list
                               # of a file (i.e. it is not a nested #NODE within
                               # some non-#NODE and non-#TREES data structure)
#
# Generic SQL DB scheme for PML data:
#
# - every structure/container has a unique idx (Number) and carries attributes as columns
#
# - container has a '#content' column
#
# - cdata/constant/choice attributes are stored in the respective columns
#
# - structure/container members are in a separate table where they have a unique idx,
#   referred to by the member column
#
# - unordered-list/alt members are stored in a separate table, whose columns
#   are a 1:N idx referred to by the member column, and a LM/AM column
#   containing the value (following the rules described here);
#
# - sequence members are in a separate table whose columns correspond
#   to the elements, each containing a reference to a table

lib/PMLTQ/PML2BASE.pm  view on Meta::CPAN

#   '#elem-pos' containing the number of preceding elements of the same name in the sequence+1,
#   and the value, as usual. To retrieve the complete content of a certain sequence as a table,
#   one has to use a UNION on all the element tables, ordering by #pos and possibly outputting
#   a constant '#name' column
#
# - the table names should be derived from PML type names in a canonical way,
#   one per PML schema type decl
#
# Possible modifications:
#
# a) cast all cdata structure members also into separate tables and thus
#    keep varchar data in separate tables
#
# b) cast node attributes to a separate table, separating the tree structure
#    from node data, making the tree-structure table very thin
#    in fact: this is necessary, since nodes can be of different types
#
# c) use cdata format information to determine the table column format
#
#  some hacks:
#
#  - updating refs strips the .rf suffix if the member is a PMLREF, but
#    not if it is a list of PMLREFs
#
#  - the prefix of PMLREFs is stripped; it should be kept and
#    used to verify the target based on filename on UPDATE
#
#

xt/author/treebanks/pdt_test/resources/adata_30_schema.xml  view on Meta::CPAN

  <revision>1.0.0</revision>
  <description>PDT 3.0 analytical trees</description>
  <reference name="mdata" readas="pml"/>

  <import schema="mdata_30_schema.xml" type="m-node.type" minimal_revision="1.0.0"/>
  <import schema="wdata_30_schema.xml" type="bool.type"/>

  <derive type="m-node.type">
    <structure name="m-node">
      <member name="id" as_attribute="1" role="#ID" required="1">
        <cdata format="PMLREF"/>
      </member>
    </structure>
  </derive>

  <root name="adata" type="a-adata.type"/>

  <type name="a-adata.type">
    <structure>
      <member name="meta" required="0" type="a-meta.type"/>
      <member name="trees" role="#TREES" required="1">
        <list type="a-root.type" ordered="1"/>
      </member>
    </structure>
  </type>

  <type name="a-meta.type">
    <structure>
      <member name="annotation_info">
        <structure name="a-annotation-info">
          <member name="version_info"><cdata format="any"/></member>
          <member name="desc"><cdata format="any"/></member>
        </structure>
      </member>
    </structure>
  </type>

  <type name="a-root.type">
    <structure role="#NODE" name="a-root">
      <member name="id" role="#ID" as_attribute="1" required="1"><cdata format="ID"/></member>
      <member name="s.rf"><cdata format="PMLREF"/></member>
      <member name="afun"><constant>AuxS</constant></member>
      <member name="ord" role="#ORDER" required="1"><cdata format="nonNegativeInteger"/></member>
      <member name="clause_number"><cdata format="nonNegativeInteger"/></member>
      <member name="children" role="#CHILDNODES">
        <list type="a-node.type" ordered="1"/>
      </member>
      <member name="sentence" required="0"> <!-- for searching in PML-TQ only (not in the distributed data) -->
        <cdata format="any"/>
      </member>

    </structure>
  </type>

  <type name="a-node.type">
    <structure role="#NODE" name="a-node">
      <member name="id" role="#ID" as_attribute="1" required="1"><cdata format="ID"/></member>
      <member name="m.rf" role="#KNIT" type="m-node.type">
        <cdata format="PMLREF"/>
      </member>
      <member name="afun" type="a-afun.type" required="1"/>
      <member name="is_member" type="bool.type"/>
      <member name="is_parenthesis_root" type="bool.type"/>
      <member name="ord" role="#ORDER" required="1"><cdata format="nonNegativeInteger"/></member>
      <member name="clause_number"><cdata format="nonNegativeInteger"/></member>
      <member name="children" role="#CHILDNODES">
        <list type="a-node.type" ordered="1"/>
      </member>
    </structure>
  </type>
  
  <type name="a-afun.type">
    <choice>
      <value>Pred</value>
      <value>Pnom</value>

xt/author/treebanks/pdt_test/resources/mdata_30_schema.xml  view on Meta::CPAN

  <revision>1.0.0</revision>
  <description>PDT 3.0 morphological annotation</description>
  <reference name="wdata" readas="pml"/>

  <import schema="wdata_30_schema.xml" type="w-node.type" minimal_revision="1.0.0"/>
  <import schema="wdata_30_schema.xml" type="bool.type"/>

  <derive type="w-node.type">
    <structure name="w-node">
      <member as_attribute="1" name="id" role="#ID" required="1">
        <cdata format="PMLREF"/>
      </member>
    </structure>
  </derive>
  
  <root name="mdata" type="m-mdata.type"/>

  <type name="m-mdata.type">
    <sequence role="#TREES" content_pattern="meta?, s+">
      <element name="meta" type="m-meta.type"/>
      <element name="s" type="m-s.type"/>
    </sequence>
  </type>

  <type name="m-meta.type">
    <structure>
      <member name="lang"><cdata format="any"/></member>
      <member name="annotation_info">
        <list ordered="0" type="m-annotation-info.type"/>
      </member>
    </structure>
  </type>

  <type name="m-annotation-info.type">
    <structure name="m-annotation-info">
      <member as_attribute="1" name="id" role="#ID" required="1"><cdata format="ID"/></member>
      <member name="version_info"><cdata format="any"/></member>
      <member name="desc"><cdata format="any"/></member>
    </structure>
  </type>

  <type name="m-s.type">
    <container role="#NODE">
      <attribute name="id" role="#ID" required="1"><cdata format="ID"/></attribute>
      <sequence role="#CHILDNODES">
	<element name="m" type="m-m.type"/>
      </sequence>
    </container>
  </type>

  <type name="m-m.type">
    <container role="#NODE">
      <alt type="m-node.type"/>
    </container>
  </type>

  <type name="m-node.type">
    <structure name="m-node">
      <member as_attribute="1" name="id" role="#ID" required="1"><cdata format="ID"/></member>
      <member name="src.rf"><cdata format="PMLREF"/></member>
      <member name="w.rf">
        <list ordered="1" role="#KNIT" type="w-node.type"><cdata format="PMLREF"/></list>
      </member>
      <member name="form_change" type="m-form_change.type"/>
      <member name="form" required="1"><cdata format="any"/></member>
      <member name="lemma" required="1"><cdata format="any"/></member>
      <member name="tag" required="1"><cdata format="any"/></member>
    </structure>
  </type>

  <type name="m-form_change.type">
    <list ordered="0">
      <choice>
        <value>ctcd</value>
        <value>spell</value>
        <value>insert</value>
        <value>num_normalization</value>

xt/author/treebanks/pdt_test/resources/tdata_30_schema.xml  view on Meta::CPAN

  <type name="t-meta.type">
    <structure>
      <member name="annotation_info" type="t-annotation-info.type"/>
      <member name="genre" type="t-genre.type" required="0"/>
    </structure>
  </type>

  <type name="t-annotation-info.type">
    <structure name="t-annotation-info">
      <member name="version_info">
        <cdata format="any"/>
      </member>
      <member name="desc">
        <cdata format="any"/>
      </member>
    </structure>
  </type>

  <type name="t-genre.type">
    <choice>
      <value>review</value>
      <value>invitation</value>
      <value>letter</value>
      <value>advice</value>

xt/author/treebanks/pdt_test/resources/tdata_30_schema.xml  view on Meta::CPAN

      <value>collection</value>
      <value>caption</value>
      <value>metatext</value>
      <value>other</value>
    </choice>
  </type>

  <type name="t-root.type">
    <structure role="#NODE" name="t-root">
      <member as_attribute="1" name="id" role="#ID" required="1">
        <cdata format="ID"/>
      </member>
      <member name="atree.rf">
        <cdata format="PMLREF"/>
      </member>
      <member name="nodetype">
        <constant>root</constant>
      </member>
      <member name="deepord" role="#ORDER" required="0">
        <cdata format="nonNegativeInteger"/>
      </member>
      <member name="mwes" required="0">
        <list ordered="0" type="st-node.type"/>
      </member>
      <member name="genre" type="t-genre.type" required="0"/> <!-- for searching in PML-TQ only (not in the distributed data) -->
      <member name="children" role="#CHILDNODES">
        <list ordered="1" type="t-node.type"/>
      </member>
      <member name="sentence" required="0"> <!-- for searching in PML-TQ only (not in the distributed data) -->
        <cdata format="any"/>
      </member>
    </structure>
  </type>

  <type name="st-node.type">
    <structure name="st-node">
      <member as_attribute="1" name="id" role="#ID" required="1"><cdata format="ID"/></member>
      <member name="basic-form" required="0"><cdata format="any"/></member>
      <member name="type" required="1"><cdata format="any"/></member>
      <member name="tnode.rfs">
        <list ordered="0">
          <cdata format="PMLREF"/>
        </list>
      </member> 
    </structure>
  </type>

  <type name="t-node.type">
    <structure role="#NODE" name="t-node">
      <member as_attribute="1" name="id" role="#ID" required="1">
        <cdata format="ID"/>
      </member>
      <member name="a" type="t-a.type"/>
      <member name="nodetype" required="1" type="t-nodetype.type"/>
      <member name="is_generated" type="bool.type"/>
      <member name="t_lemma" required="1">
        <cdata format="any"/>
      </member>
      <member name="functor" required="1">
        <alt type="func.type"/>
      </member>
      <member name="subfunctor" type="t-subfunctor.type"/>
      <member name="sentmod" type="t-sentmod.type"/>
      <member name="quot">
        <list ordered="0">
          <structure>
            <member name="type" required="1" type="t-type.type"/>
            <member name="set_id" required="1">
              <cdata format="any"/>
            </member>
          </structure>
        </list>
      </member>
      <member name="is_dsp_root" type="bool.type"/>
      <member name="is_member" type="bool.type"/>
      <member name="is_name_of_person" type="bool.type"/>
      <member name="is_parenthesis" type="bool.type"/>
      <member name="is_state" type="bool.type"/>
      <member name="gram" type="t-gram.type"/>
      <member name="tfa" type="t-tfa.type"/>
      <member name="deepord" role="#ORDER" required="1">
        <cdata format="nonNegativeInteger"/>
      </member>
      <member name="discourse_special" type="t-discourse-special.type" required="0"/>
      <member name="discourse" required="0">
        <list ordered="0" type="t-discourse-link.type"/>
      </member>
      <member name="discourse_groups" required="0">
        <list ordered="0" type="t-discourse-groups.type"/>
      </member>
      <member name="bridging" required="0">
        <list ordered="0" type="t-bridging-link.type"/>
      </member>
      <member name="coref_text" required="0">
        <list ordered="0" type="t-coref_text-link.type"/>
      </member>
      <member name="coref_gram.rf">
        <list ordered="0">
          <cdata format="PMLREF"/>
        </list>
      </member>
      <member name="coref_special" type="coref_special.type"/>
      <member name="compl.rf">
        <list ordered="0">
          <cdata format="PMLREF"/>
        </list>
      </member>
      <member name="val_frame.rf">
        <alt>
          <cdata format="PMLREF"/>
        </alt>
      </member>
      <member name="children" role="#CHILDNODES">
        <list ordered="1" type="t-node.type"/>
      </member>
    </structure>
  </type>

  <type name="t-tfa.type">
    <choice>

xt/author/treebanks/pdt_test/resources/tdata_30_schema.xml  view on Meta::CPAN

      <value>dphr</value>
      <value>fphr</value>
      <value>list</value>
      <value>qcomplex</value>
    </choice>
  </type>

  <type name="t-a.type">
    <structure>
      <member name="lex.rf">
        <cdata format="PMLREF"/>
      </member>
      <member name="aux.rf">
        <list ordered="0">
          <cdata format="PMLREF"/>
        </list>
      </member>
    </structure>
  </type>

  <type name="coref_special.type">
    <choice>
      <value>segm</value>
      <value>exoph</value>
    </choice>

xt/author/treebanks/pdt_test/resources/tdata_30_schema.xml  view on Meta::CPAN

    <choice>
      <value>caption</value>
      <value>heading</value>
      <value>metatext</value>
    </choice>
  </type>

  <type name="t-discourse-groups.type">
    <structure>
      <member name="id" required="1">
        <cdata format="nonNegativeInteger"/>
      </member>
    </structure>
  </type>

  <type name="t-discourse-link.type">
    <structure>
      <member name="target_node.rf" required="0">
        <cdata format="PMLREF"/>
      </member>
      <member name="type" required="1">
        <choice>
          <value>discourse</value>
          <value>list</value>
        </choice>
      </member>
      <member name="start_group_id" required="0">
        <cdata format="nonNegativeInteger"/>
      </member>
      <member name="start_range" required="1">
        <cdata format="any"/>
      </member>
      <member name="target_group_id" required="0">
        <cdata format="nonNegativeInteger"/>
      </member>
      <member name="target_range" required="0">
        <cdata format="any"/>
      </member>
      <member name="discourse_type"  type="t-discourse-type.type" required="0"/>
      <member name="a-connectors.rf" required="0">
        <list ordered="0">
          <cdata format="PMLREF"/>
        </list>
      </member>
      <member name="t-connectors.rf" required="0">
        <list ordered="0">
          <cdata format="PMLREF"/>
        </list>
      </member>
      <member name="all_a-connectors.rf" required="0"> <!-- for searching in PML-TQ only (not in the distributed data) -->
        <list ordered="0">
          <cdata format="PMLREF"/>
        </list>
      </member>
      <member name="connective" required="0"> <!-- for searching in PML-TQ only (not in the distributed data) -->
        <cdata format="any"/>
      </member>
    </structure>
  </type>

  <type name="t-discourse-type.type">
    <choice>
      <value>conc</value>
      <value>cond</value>
      <value>confr</value>
      <value>conj</value>

xt/author/treebanks/pdt_test/resources/tdata_30_schema.xml  view on Meta::CPAN

      <value>restr</value>
      <value>spec</value>
      <value>synchr</value>
      <value>other</value>
    </choice>
  </type>

  <type name="t-bridging-link.type">
    <structure>
      <member name="target_node.rf" required="1">
        <cdata format="PMLREF"/>
      </member>
      <member name="type" type="t-bridging-type.type" required="1"/>
    </structure>
  </type>

  <type name="t-bridging-type.type">
    <choice>
      <value>CONTRAST</value>
      <value>SUB_SET</value>
      <value>SET_SUB</value>

xt/author/treebanks/pdt_test/resources/tdata_30_schema.xml  view on Meta::CPAN

      <value>FUNCT_P</value>
      <value>P_FUNCT</value>
      <value>REST</value>
      <value>ANAF</value>
    </choice>
  </type>

  <type name="t-coref_text-link.type">
    <structure>
      <member name="target_node.rf" required="1">
        <cdata format="PMLREF"/></member>
      <member name="type" required="1">
        <choice>
          <value>SPEC</value>
          <value>GEN</value>
        </choice>
      </member>
    </structure>
  </type>

</pml_schema>

xt/author/treebanks/pdt_test/resources/vallex_schema.xml  view on Meta::CPAN

<?xml version="1.0" encoding="utf-8"?>

<pml_schema xmlns="http://ufal.mff.cuni.cz/pdt/pml/schema/" version="1.1">
 <root name="valency_lexicon" type="v-valency_lexicon.type" />
 <type name="v-valency_lexicon.type">
  <structure>
   <member as_attribute="1" name="owner" required="1">
    <cdata format="PMLREF" />
   </member>
<!--   <member name="head" type="v-head.type" /> -->
   <member name="body" type="v-body.type" role="#TREES"/>
<!--   <member name="tail" type="v-tail.type" /> -->
  </structure>
 </type>
<!--
 <type name="v-head.type">
  <structure>
   <member name="global_history" type="v-global_history.type" />

xt/author/treebanks/pdt_test/resources/vallex_schema.xml  view on Meta::CPAN

  </structure>
 </type>
 <type name="v-tail.type">
  <sequence content_pattern="(forbid+)">
   <element name="forbid" type="v-forbid.type" />
  </sequence>
 </type>
 <type name="v-forbid.type">
  <container>
   <attribute name="id" role="#ID" required="1">
    <cdata format="ID" />
   </attribute>
  </container>
 </type>
-->
 <type name="v-body.type">
  <sequence content_pattern="(word+)">
   <element name="word" type="v-word.type" />
  </sequence>
 </type>
<!--
 <type name="v-global_history.type">
  <sequence content_pattern="(global_event*)">
   <element name="global_event" type="v-global_event.type" />
  </sequence>
 </type>
 <type name="v-global_event.type">
  <container>
   <attribute name="time_stamp" required="1">
    <cdata format="any" />
   </attribute>
   <attribute name="author" required="1">
    <cdata format="any" />
   </attribute>
   <cdata format="any" />
  </container>
 </type>
 <type name="v-list_of_users.type">
  <sequence content_pattern="(user+)">
   <element name="user" type="v-user.type" />
  </sequence>
 </type>
 <type name="v-user.type">
  <container>
   <attribute name="reviewer">
    <choice>
     <value>YES</value>
     <value>NO</value>
    </choice>
   </attribute>
   <attribute name="name" required="1">
    <cdata format="any" />
   </attribute>
   <attribute name="id" role="#ID" required="1">
    <cdata format="ID" />
   </attribute>
   <attribute name="annotator">
    <choice>
     <value>YES</value>
     <value>NO</value>
    </choice>
   </attribute>
  </container>
 </type>
-->
 <type name="v-word.type">
  <structure role="#NODE">
   <member as_attribute="1" name="id" role="#ID" required="1">
    <cdata format="ID" />
   </member>
   <member as_attribute="1" name="lemma" required="1">
    <cdata format="any" />
   </member>
   <member as_attribute="1" name="POS">
    <choice>
     <value>V</value>
     <value>A</value>
     <value>N</value>
     <value>D</value>
    </choice>
   </member>
   <member name="valency_frames" type="v-valency_frames.type" role="#CHILDNODES"/>

xt/author/treebanks/pdt_test/resources/vallex_schema.xml  view on Meta::CPAN

 </type>
 <type name="v-problem.type">
  <container>
   <attribute name="solved">
    <choice>
     <value>YES</value>
     <value>NO</value>
    </choice>
   </attribute>
   <attribute name="author">
    <cdata format="PMLREF" />
   </attribute>
   <cdata format="any" />
  </container>
 </type>
-->
 <type name="v-valency_frames.type">
  <sequence content_pattern="(frame*)">
   <element name="frame" type="v-frame.type" />
  </sequence>
 </type>
 <type name="v-frame.type">
  <structure role="#NODE">
   <member as_attribute="1" name="status">
    <choice>
     <value>active</value>
     <value>reviewed</value>
     <value>substituted</value>
     <value>obsolete</value>
     <value>deleted</value>
    </choice>
   </member>
   <member as_attribute="1" name="used">
    <cdata format="any" />
   </member>
   <member as_attribute="1" name="id" role="#ID" required="1">
    <cdata format="ID" />
   </member>
<!--
   <member as_attribute="1" name="hereditary_used">
    <cdata format="any" />
   </member>
-->
   <member as_attribute="1" name="substituted_with">
    <cdata format="IDREFS" />
   </member>
   <member name="example" type="v-example.type" />
   <member name="frame_elements" type="v-frame_elements.type" role="#CHILDNODES"/>
<!--   <member name="local_history" type="v-local_history.type" /> -->
<!--   <member name="problems" type="v-problems.type" /> -->
   <member name="note" type="v-note.type" />
  </structure>
 </type>
 <type name="v-example.type">
  <cdata format="any" />
 </type>
 <type name="v-note.type">
  <cdata format="any" />
 </type>
 <type name="v-frame_elements.type">
  <sequence content_pattern="(element|element_alternation)*">
   <element name="element_alternation" type="v-element_alternation.type" />
   <element name="element" type="v-element.type" />
  </sequence>
 </type>
 <type name="v-element_alternation.type">
   <container role="#NODE">
     <attribute name="id" role="#ID"><cdata format="ID" /></attribute>
     <sequence content_pattern="(element+)" role="#CHILDNODES">
       <element name="element" type="v-element.type" />
     </sequence>
   </container>
 </type>
 <type name="v-element.type">
  <container role="#NODE">
   <attribute name="id" role="#ID"><cdata format="ID" /></attribute>
   <attribute name="functor" required="1">
    <choice>
     <value>---</value>
     <value>ACT</value>
     <value>PAT</value>
     <value>ADDR</value>
     <value>EFF</value>
     <value>ORIG</value>
     <value>ACMP</value>
     <value>AIM</value>

xt/author/treebanks/pdt_test/resources/vallex_schema.xml  view on Meta::CPAN

     <value>TOWH</value>
     <value>TPAR</value>
     <value>TSIN</value>
     <value>TTILL</value>
     <value>TWHEN</value>
     <value>TOWH</value>
     <value>VOCAT</value>
    </choice>
   </attribute>
<!--   <attribute name="orig_type">
    <cdata format="any" />
   </attribute>
-->
   <attribute name="type">
    <choice>
     <value>oblig</value>
     <value>non-oblig</value>
    </choice>
   </attribute>
   <attribute name="forms">
    <cdata format="any" />
   </attribute>
   <sequence content_pattern="(form*)" role="#CHILDNODES">
    <element name="form" type="v-form.type" />
   </sequence>
  </container>
 </type>
 <type name="v-form.type">
  <container role="#NODE">
   <attribute name="id" role="#ID"><cdata format="ID" /></attribute>
   <attribute name="abbrev">
    <cdata format="any" />
   </attribute>
   <sequence content_pattern="(typical | elided | recip | state | (parent?, node*, (parentpos, node*)?))" role="#CHILDNODES">
    <element name="parentpos" type="v-parentpos.type" />
    <element name="elided" type="v-elided.type" />
    <element name="parent" type="v-parent.type" />
    <element name="recip" type="v-recip.type" />
    <element name="typical" type="v-typical.type" />
    <element name="node" type="v-node.type" />
    <element name="state" type="v-state.type" />
   </sequence>
  </container>
 </type>
 <type name="v-typical.type">
  <container role="#NODE"><attribute name="id" role="#ID"><cdata format="ID" /></attribute></container>
 </type>
 <type name="v-elided.type">
  <container role="#NODE"><attribute name="id" role="#ID"><cdata format="ID" /></attribute></container>
 </type>
 <type name="v-recip.type">
  <container role="#NODE"><attribute name="id" role="#ID"><cdata format="ID" /></attribute></container>
 </type>
 <type name="v-state.type">
  <container role="#NODE"><attribute name="id" role="#ID"><cdata format="ID" /></attribute></container>
 </type>
 <type name="v-parent.type">
  <structure role="#NODE">
   <member as_attribute="1" name="id" role="#ID"><cdata format="ID" /></member>
   <member name="node" type="v-node.type" />
  </structure>
 </type>
 <type name="v-parentpos.type">
  <container role="#NODE"><attribute name="id" role="#ID"><cdata format="ID" /></attribute></container>
 </type>
 <type name="v-node.type">
  <container role="#NODE">
   <attribute name="id" role="#ID"><cdata format="ID" /></attribute>
   <attribute name="num">
    <choice>
     <value>S</value>
     <value>P</value>
    </choice>
   </attribute>
   <attribute name="tagpos14">
    <cdata format="any" />
   </attribute>
   <attribute name="tagpos3">
    <cdata format="any" />
   </attribute>
   <attribute name="form">
    <cdata format="any" />
   </attribute>
   <attribute name="case">
    <choice>
     <value>1</value>
     <value>2</value>
     <value>3</value>
     <value>4</value>
     <value>5</value>
     <value>6</value>
     <value>7</value>
    </choice>
   </attribute>
   <attribute name="tagpos2">
    <cdata format="any" />
   </attribute>
   <attribute name="tagpos5">
    <cdata format="any" />
   </attribute>
   <attribute name="agreement">
    <choice>
     <value>0</value>
     <value>1</value>
    </choice>
   </attribute>
   <attribute name="pos">
    <choice>
     <value>a</value>

xt/author/treebanks/pdt_test/resources/vallex_schema.xml  view on Meta::CPAN

     <value>n</value>
     <value>j</value>
     <value>v</value>
     <value>u</value>
     <value>f</value>
     <value>s</value>
     <value>c</value>
    </choice>
   </attribute>
   <attribute name="tagpos13">
    <cdata format="any" />
   </attribute>
   <attribute name="afun">
    <choice>
     <value>Pred</value>
     <value>Pnom</value>
     <value>AuxV</value>
     <value>Sb</value>
     <value>Obj</value>
     <value>Atr</value>
     <value>Adv</value>

xt/author/treebanks/pdt_test/resources/vallex_schema.xml  view on Meta::CPAN

   </attribute>
   <attribute name="gen">
    <choice>
     <value>F</value>
     <value>M</value>
     <value>I</value>
     <value>N</value>
    </choice>
   </attribute>
   <attribute name="tagpos10">
    <cdata format="any" />
   </attribute>
   <attribute name="tagpos6">
    <cdata format="any" />
   </attribute>
   <attribute name="tagpos9">
    <cdata format="any" />
   </attribute>
   <attribute name="tagpos11">
    <cdata format="any" />
   </attribute>
   <attribute name="tagpos8">
    <cdata format="any" />
   </attribute>
   <attribute name="lemma">
    <cdata format="any" />
   </attribute>
   <attribute name="tagpos12">
    <cdata format="any" />
   </attribute>
   <attribute name="tagpos7">
    <cdata format="any" />
   </attribute>
   <attribute name="tagpos4">
    <cdata format="any" />
   </attribute>
   <attribute name="tagpos15">
    <cdata format="any" />
   </attribute>
   <attribute name="inherits">
    <choice>
     <value>0</value>
     <value>1</value>
    </choice>
   </attribute>
   <attribute name="deg">
    <choice>
     <value>1</value>
     <value>2</value>
     <value>3</value>
    </choice>
   </attribute>
   <attribute name="tagpos1">
    <cdata format="any" />
   </attribute>
   <sequence content_pattern="(node*)" role="#CHILDNODES">
    <element name="node" type="v-node.type" />
   </sequence>
  </container>
 </type>
<!--
 <type name="v-local_history.type">
  <sequence content_pattern="(local_event*)">
   <element name="local_event" type="v-local_event.type" />

xt/author/treebanks/pdt_test/resources/vallex_schema.xml  view on Meta::CPAN

     <value>create</value>
     <value>modify</value>
     <value>delete</value>
     <value>import</value>
     <value>review</value>
     <value>obsolete</value>
     <value>unreview</value>
    </choice>
   </attribute>
   <attribute name="time_stamp" required="1">
    <cdata format="any" />
   </attribute>
   <attribute name="author">
    <cdata format="PMLREF" />
   </attribute>
   <attribute name="imported_from">
    <cdata format="any" />
   </attribute>
  </container>
 </type>
-->
</pml_schema>

xt/author/treebanks/pdt_test/resources/wdata_30_schema.xml  view on Meta::CPAN


  <type name="w-wdata.type">
    <structure>
      <member name="meta" type="w-meta.type"/>
      <member name="doc" type="w-doc.type"/>
    </structure>
  </type>

  <type name="w-meta.type">
    <structure>
      <member name="lang"><cdata format="any"/></member>
      <member name="original_format"><cdata format="any"/></member>
    </structure>
  </type>

  <type name="w-doc.type">
    <container>
      <attribute name="id" required="1" role="#ID"><cdata format="ID"/></attribute>
      <attribute name="source_id"><cdata format="any"/></attribute>
      <sequence content_pattern="docmeta, para+">
	<element name="docmeta" type="w-docmeta.type"/>
	<element name="para" type="w-para.type"/>
      </sequence>
    </container>
  </type>

  <type name="w-docmeta.type">
    <sequence>
      <element name="othermeta" type="w-othermeta.type"/>
    </sequence>
  </type>

  <type name="w-othermeta.type">
    <container>
      <attribute name="origin"><cdata format="any"/></attribute>
      <cdata format="any"/>
    </container>
  </type>

  <type name="w-para.type">
    <sequence>
      <element name="othermarkup" type="w-othermarkup.type"/>
      <element name="w" type="w-node.type"/>
    </sequence>
  </type>

  <type name="w-othermarkup.type">
    <container>
      <attribute name="origin"><cdata format="any"/></attribute>
      <cdata format="any"/>
    </container>
  </type>

  <type name="w-node.type">
    <structure name="w-node">
      <member as_attribute="1" name="id" role="#ID" required="1"><cdata format="ID"/></member>
      <member name="token" required="1"><cdata format="any"/></member>
      <member name="no_space_after" type="bool.type"/>
    </structure>
  </type>
  
  <type name="bool.type">
    <choice>
      <value>0</value>
      <value>1</value>
    </choice>
  </type>

xt/author/treebanks/treex_test/resources/treex_schema.xml  view on Meta::CPAN

        <list ordered="1" type="bundle.type"/>
      </member>
    </structure>
  </root>


  <!-- Metainfo (info about the whole document) -->
  <type name="meta.type">
    <structure>

       <member name="description"><cdata format="any"/></member>

       <member name="zones">
         <sequence>
           <element name="zone" type="language_parametrized_doc_zone.type"/>
         </sequence>
       </member>

       <member name="wild_dump"><cdata format="any"/></member>
       
    </structure>
  </type>


  <type name="language_parametrized_doc_zone.type" >
    <structure>
      <member name="language" required="1" as_attribute="1" type="langcode.type"/>
      <member name="selector" as_attribute="1"><cdata format="any"/></member>
      <member name="text"><cdata format="any"/></member>
    </structure>
  </type>



  <type name="bundle.type" >
    <structure role="#NODE" name="bundle-root">
      <member as_attribute="1" name="id" role="#ID" required="1"><cdata format="ID"/></member>

      <!--CzEng meta information (not stable, may be changed/deleted in the future).
	      align_score is an alignment quality score which may be used in filters.
	      CzEng ids are very long, so we don't want to store them in bundle id,
	      because id of each node is derived from the id of its bundle (and zone and tree)
	      and we don't want to have so many long ids.
	  -->
      <member name="czeng">
        <structure>
          <member name="section"><cdata format="any"/></member>
          <member name="blockid"><cdata format="any"/></member>
          <member name="domain"><cdata format="any"/></member>
          <member name="id"><cdata format="any"/></member>
          <member name="missing_sents_before"><cdata format="any"/></member>
          <member name="filter_score"><cdata format="any"/></member>
          <member name="filter_features"><cdata format="any"/></member>
          <member name="align_score"><cdata format="any"/></member>
          <member name="origfile"><cdata format="any"/></member>
        </structure>
      </member>

      <member name="zones">
        <sequence>
          <element name="zone" type="zone.type"/>
        </sequence>
      </member>

      <member name="message_board">
        <list ordered="1">
           <cdata format="any"/>
        </list>
      </member>

      <!-- ptacek: -->
      <member name="dialog">
       		<structure>
       			<member name="from"><cdata format="any"/></member>
       			<member name="to"><cdata format="any"/></member>
       			<member name="body_asr_confidence"><cdata format="any"/></member>
       			<member name="body_gesture"><cdata format="any"/></member>
       			<member name="body_emotion"><cdata format="any"/></member>
       			<member name="dialog_act"><cdata format="any"/></member>
       			<member name="sentence_type"><cdata format="any"/></member>
       			<member name="utterance_datetime"><cdata format="any"/></member>
       			<member name="local_timezone"><cdata format="any"/></member>
       		</structure>
       </member>

       <member name="wild_dump"><cdata format="any"/></member>

    </structure>
  </type>


  <!-- generic (language- and purpose-parametrized) subbundle,
  containing trees and attributes -->

  <type name="zone.type" >
    <structure>
      <member name="language" required="1" as_attribute="1" type="langcode.type"/>
      <member name="selector" as_attribute="1"><cdata format="any"/></member>
      <member name="sentence"><cdata format="any"/></member>

      <!-- Trees attached to this zone: one member per tree kind, typed by the
           a-, t-, n- and p-layer root types respectively. -->
      <member name="trees">
        <structure>
          <member name="a_tree" type="a-root.type"/> <!-- caution: a-root.type will need to be changed!!! -->
          <member name="t_tree" type="t-root.type"/>
          <member name="n_tree" type="n-root.type"/>
          <member name="p_tree" type="p-nonterminal.type"/>
        </structure>
      </member>
    </structure>

xt/author/treebanks/treex_test/resources/treex_subschema_a_layer.xml  view on Meta::CPAN

<pml_schema xmlns="http://ufal.mff.cuni.cz/pdt/pml/schema/"  version="1.1">
  <revision>1.0.0</revision>
  <description>Subschema for a-layer trees</description>

  <import type="iset.type" schema="treex_subschema_interset.xml"/>

 <!--  a-layer representation (merged with m-layer) -->

  <!-- Root of an a-layer tree (role #NODE, element name "a-root").
       Its children are an ordered list of a-node.type nodes, and its afun
       is fixed to the constant AuxS. -->
  <type name="a-root.type">
    <structure role="#NODE" name="a-root">
      <member name="id" role="#ID" as_attribute="1"  required="1"><cdata format="ID"/></member>
      
      <!-- a PMLREF to a counterpart plus two free-form score values -->
      <member name="giza_scores">
        <structure>
           <member name="counterpart.rf">
              <cdata format="PMLREF"/>
           </member>
           <member name="therevalue">
              <cdata format="any"/>
           </member>
           <member name="backvalue">
              <cdata format="any"/>
           </member>
        </structure>
      </member>
      <member name="ptree.rf"><cdata format="PMLREF"/></member>
      <member name="s.rf"><cdata format="PMLREF"/></member>
      <member name="afun"><constant>AuxS</constant></member>
      <member name="ord" role="#ORDER" required="1"><cdata format="nonNegativeInteger"/></member>
      <member name="children" role="#CHILDNODES"><list type="a-node.type" ordered="1"/></member>
      <!-- Should the sentence be parsed once again?
           This is useful when tags have been fixed (with the knowledge of the parse). Popel 23.5.2009 -->
      <member name="reparse" type="bool.type"/>
      <member name="wild_dump"><cdata format="any"/></member>
    </structure>
  </type>


  <!-- Non-root node of an a-layer tree (role #NODE, element name "a-node").
       The type is recursive: `children` is an ordered list of a-node.type.
       Members are grouped below into those covered by Treex API methods and
       those not yet covered. -->
  <type name="a-node.type">
    <structure role="#NODE" name="a-node">
      <member name="children" role="#CHILDNODES"><list type="a-node.type" ordered="1"/></member>

      <!--**************  COVERED BY TREEX API METHODS ************-->
      <member name="id" role="#ID" as_attribute="1" required="1"><cdata format="ID"/></member>

      <!-- former m-layer attributes (reduced) -->
      <member name="form"><cdata format="any"/></member>
      <member name="lemma"><cdata format="any"/></member>
      <member name="tag"><cdata format="any"/></member>
      <!-- detailed list of morphosyntactic features (may correspond to the tag attribute) -->
      <member name="iset" type="iset.type"/>
      <member name="no_space_after" type="bool.type"/>
      <member name="translit"><cdata format="any"/></member>
      <member name="gloss"><cdata format="any"/></member>

      <!-- former a-layer attributes -->
      <member name="ord" role="#ORDER" required="1"><cdata format="nonNegativeInteger"/></member>
      <!-- Since we started working with the Universal Dependencies, deprel became our main attribute for the dependency relation label.
           Its usage is not restricted to UD though. It is just a general label. UD restrictions apply only if it is used in the UD context.
           In contrast, afun is a special case of deprel, useful only for the Prague-style trees. Its value range is pre-determined and
           some values imply specific treatment of the trees even in the Treex API.
           Finally, conll/deprel is a predecessor of deprel. Its name refers to one particular file format, CoNLL-X. It is deprecated. -->
      <member name="deprel"><cdata format="any"/></member>
      <member name="afun" type="afun.type" />
      <member name="is_member" type="bool.type"/>

      <!-- CoNLL shared task attributes (deprel, pos, cpos, feat) are grouped in one structure -->
      <member name="conll" type="a-conll.type"/>

      <!-- Shared modifiers of coordinations can be distinguished in PDT style
           just based on the fact they are hanged on the conjunction (coord. head).
           However, in other styles (e.g. Stanford) this attribute might be useful. -->
      <member name="is_shared_modifier" type="bool.type"/>

      <!-- attributes for conversion to t-tree -->
      <member name="edge_to_collapse" type="bool.type"/>
      <member name="is_auxiliary" type="bool.type"/>

      <!-- ??? -->
      <member name="is_parenthesis_root" type="bool.type" />

      <!-- clause segmentation -->
      <member name="clause_number"><cdata format="any"/></member>
      <member name="is_clause_head" type="bool.type"/> <!-- We mean finite clause head, but that's the same as with is_clause_head on t-layer!!! --> 

      <!--**************  NOT YET COVERED BY TREEX API METHODS ************-->
      <member name="morphcat" type="czech_morphcat.type"/> <!-- This should be in Treex API, i.e. not redundant with tag -->

      <!-- surface coreference -->
      <member name="coref" type="a_coreference.type"/>

      <!-- link to p-layer -->
      <member name="p_terminal.rf"><cdata format="PMLREF"/></member>

      <!-- unordered list of alignment links (align-links.type) -->
      <member name="alignment">
          <list ordered="0" type="align-links.type"/>
      </member>

      <!-- tentative -->
      <member name="chunks"><list ordered="0"><cdata format="any"/></list>
      </member>  

      <member name="wild_dump"><cdata format="any"/></member>
      <member name="iset_dump"><cdata format="any"/></member>

    </structure>
  </type>

  <!-- CoNLL shared-task attributes grouped in one structure; referenced by the
       `conll` member of a-node.type. All four members are free-form cdata. -->
  <type name="a-conll.type">
    <structure>
      <member name="deprel"><cdata format="any"/></member> <!--dependency relation-->
      <member name="cpos"><cdata format="any"/></member>   <!--coarse-grained part-of-speech tag-->
      <member name="pos"><cdata format="any"/></member>    <!--fine-grained part-of-speech tag-->
      <member name="feat"><cdata format="any"/></member>   <!--various other features separated by |-->
    </structure>
  </type>
      


  <!-- Surface (a-layer) coreference annotation; referenced by the `coref`
       member of a-node.type. -->
  <type name="a_coreference.type"> <!-- analytical coreference, for Jirka Mírovský -->
    <structure>
       <member name="markable" type="bool.type"/> <!-- a token to be considered as anaphor/antecedent -->
       <member name="introduction" type="bool.type"/> <!-- first introduction of the entity to the discourse -->
       <member name="anaphor_type"> <cdata format="any"/> </member> <!-- the type of the anaphor - pronoun, proper_noun, demonstrative_noun_phrase, common_noun -->
       <member name="target-node.rf"> <cdata format="PMLREF"/> </member>
       <member name="type"> <cdata format="any"/> </member>
       <member name="src"> <cdata format="any"/> </member>
    </structure>
  </type>

  <type name="afun.type">
    <choice>
      <value>Pred</value>
      <value>Pnom</value>
      <value>AuxV</value>
      <value>Sb</value>
      <value>Obj</value>

xt/author/treebanks/treex_test/resources/treex_subschema_a_layer.xml  view on Meta::CPAN

      <value>NumArg</value><!-- argument of number, if the style dictates that numbers are heads -->
      <value>PossArg</value><!-- argument of possessive expression (indicating the possessor, i.e. the argument is the possessed thing) -->
      <value>AdjArg</value><!-- argument of adjective, i.e. this is the modified noun, if the style dictates that adjectives shall govern -->
      <!-- afun for unrecognized value -->
      <value>NR</value>
    </choice>
  </type>

  <!-- Morphological categories; referenced by the `morphcat` member of
       a-node.type. Every member is declared as free-form cdata, so values
       are not restricted at the schema level. -->
  <type name="czech_morphcat.type">
    <structure>
        <member name="pos"><cdata format="any"/></member>
        <member name="subpos"><cdata format="any"/></member>
        <member name="synpos"><cdata format="any"/></member>
        <member name="gender"><cdata format="any"/></member>
        <member name="number"><cdata format="any"/></member>
        <member name="case"><cdata format="any"/></member>
        <member name="possgender"><cdata format="any"/></member>
        <member name="possnumber"><cdata format="any"/></member>
        <member name="person"><cdata format="any"/></member>
        <member name="tense"><cdata format="any"/></member>
        <member name="grade"><cdata format="any"/></member>
        <member name="negation"><cdata format="any"/></member>
        <member name="voice"><cdata format="any"/></member>
        <member name="reserve1"><cdata format="any"/></member>
        <member name="reserve2"><cdata format="any"/></member>
        <!-- ptacek 5.8.2008 for en/cz_generate -->
        <member name="compound_person"><cdata format="any"/></member>
        <member name="compound_number"><cdata format="any"/></member>
        <member name="compound_gender"><cdata format="any"/></member>
        <member name="ordering_type"><cdata format="any"/></member>
        <!-- zabokrtsky because of Arabic -->
        <member name="definiteness"><cdata format="any"/></member>
        <member name="mood"><cdata format="any"/></member>
    </structure>
  </type>

  <!-- One alignment link: a PMLREF to the counterpart plus a free-form link
       type. Used as the item type of the `alignment` list in a-node.type. -->
  <type name="align-links.type">
    <structure>
       <member name="counterpart.rf">
          <cdata format="PMLREF"/>
       </member>
       <member name="type">
          <cdata format="any"/>
       </member>
    </structure>
 </type>


  <type name="m-form_change.type">
    <choice>
      <value>ctcd</value>
      <value>spell</value>
      <value>insert</value>

xt/author/treebanks/treex_test/resources/treex_subschema_interset.xml  view on Meta::CPAN

<pml_schema xmlns="http://ufal.mff.cuni.cz/pdt/pml/schema/" version="1.1">
  <revision>1.0.0</revision>
  <description>DZ Interset features and values</description>

  <!-- Each Interset feature has a list of permitted values (see the iset-*.type definitions below)
       However, we declare the features as plain strings because value combinations (such as
       <gender>masc|neut</gender>) are also allowed. Type checking must be done elsewhere. -->

  <!-- Interset feature structure. Every feature is a separate member declared
       as free-form cdata (format "any"), so the schema itself does not
       validate feature values. -->
  <type name="iset.type">
    <structure>
      <member name="pos"><cdata format="any"/></member>
      <member name="nountype"><cdata format="any"/></member>
      <member name="nametype"><cdata format="any"/></member>
      <member name="adjtype"><cdata format="any"/></member>
      <member name="prontype"><cdata format="any"/></member>
      <member name="numtype"><cdata format="any"/></member>
      <member name="numform"><cdata format="any"/></member>
      <member name="numvalue"><cdata format="any"/></member>
      <member name="verbtype"><cdata format="any"/></member>
      <member name="advtype"><cdata format="any"/></member>
      <member name="adpostype"><cdata format="any"/></member>
      <member name="conjtype"><cdata format="any"/></member>
      <member name="parttype"><cdata format="any"/></member>
      <member name="punctype"><cdata format="any"/></member>
      <member name="puncside"><cdata format="any"/></member>
      <member name="synpos"><cdata format="any"/></member> <!-- deprecated -->
      <member name="poss"><cdata format="any"/></member>
      <member name="reflex"><cdata format="any"/></member>
      <member name="foreign"><cdata format="any"/></member>
      <member name="abbr"><cdata format="any"/></member>
      <member name="hyph"><cdata format="any"/></member>
      <member name="typo"><cdata format="any"/></member>
      <member name="echo"><cdata format="any"/></member>
      <member name="negativeness"><cdata format="any"/></member>
      <member name="definiteness"><cdata format="any"/></member>
      <member name="gender"><cdata format="any"/></member>
      <member name="animateness"><cdata format="any"/></member>
      <member name="number"><cdata format="any"/></member>
      <member name="case"><cdata format="any"/></member>
      <member name="prepcase"><cdata format="any"/></member>
      <member name="degree"><cdata format="any"/></member>
      <member name="person"><cdata format="any"/></member>
      <member name="politeness"><cdata format="any"/></member>
      <member name="possgender"><cdata format="any"/></member>
      <member name="possnumber"><cdata format="any"/></member>
      <member name="possperson"><cdata format="any"/></member>
      <member name="possednumber"><cdata format="any"/></member>
      <member name="absperson"><cdata format="any"/></member>
      <member name="ergperson"><cdata format="any"/></member>
      <member name="datperson"><cdata format="any"/></member>
      <member name="absnumber"><cdata format="any"/></member>
      <member name="ergnumber"><cdata format="any"/></member>
      <member name="datnumber"><cdata format="any"/></member>
      <member name="abspoliteness"><cdata format="any"/></member>
      <member name="ergpoliteness"><cdata format="any"/></member>
      <member name="datpoliteness"><cdata format="any"/></member>
      <member name="erggender"><cdata format="any"/></member>
      <member name="datgender"><cdata format="any"/></member>
      <member name="position"><cdata format="any"/></member>
      <member name="subcat"><cdata format="any"/></member>
      <member name="verbform"><cdata format="any"/></member>
      <member name="mood"><cdata format="any"/></member>
      <member name="tense"><cdata format="any"/></member>
      <member name="voice"><cdata format="any"/></member>
      <member name="aspect"><cdata format="any"/></member>
      <member name="variant"><cdata format="any"/></member>
      <member name="style"><cdata format="any"/></member>
    </structure>
  </type>

</pml_schema>

xt/author/treebanks/treex_test/resources/treex_subschema_n_layer.xml  view on Meta::CPAN

<?xml version="1.0" encoding="utf-8"?>

<pml_schema xmlns="http://ufal.mff.cuni.cz/pdt/pml/schema/"  version="1.1">
  <revision>1.0.0</revision>
  <description>N-layer (named-entity layer)</description>

  <!-- Root of an n-layer (named-entity) tree: role #NODE, element name
       "n-root", with a required #ID and an ordered list of n-node.type children. -->
  <type name="n-root.type">
    <structure role="#NODE" name="n-root">
      <member name="id" role="#ID" as_attribute="1"
      required="1"><cdata format="ID"/></member>
      <member name="children" role="#CHILDNODES">
        <list type="n-node.type" ordered="1"/>
      </member>
      <member name="wild_dump"><cdata format="any"/></member>
    </structure>
  </type>

  <!-- Non-root node of an n-layer tree (role #NODE, element name "n-node").
       Recursive: `children` is an ordered list of n-node.type. -->
  <type name="n-node.type">
    <structure role="#NODE" name="n-node">
      <member name="id" role="#ID" as_attribute="1"
      required="1"><cdata format="ID"/></member>
      <member name="ne_type" ><cdata format="any"/></member>
      <member name="normalized_name"><cdata format="any"/></member>
      <!-- unordered list of PMLREF references
           (presumably to a-layer nodes, judging by the name; TODO confirm) -->
      <member name="a.rf">
        <list ordered="0">
          <cdata format="PMLREF"/>
        </list>
      </member>
      <member name="children" role="#CHILDNODES">
        <list type="n-node.type" ordered="1"/>
      </member>
      <member name="wild_dump"><cdata format="any"/></member>
    </structure>
  </type>



</pml_schema>

xt/author/treebanks/treex_test/resources/treex_subschema_p_layer.xml  view on Meta::CPAN

<?xml version="1.0" encoding="utf-8"?>

<pml_schema xmlns="http://ufal.mff.cuni.cz/pdt/pml/schema/"  version="1.1">
  <revision>1.0.0</revision>
  <description>P-layer - Phrase-structure (constituency) trees in the Penn treebank style</description>
  <import type="bbn_tag.type" schema="treex_subschema_bbn.xml"/>

  <!-- Nonterminal node of a p-layer (phrase-structure) tree: role #NODE,
       element name "p-nonterminal". Its children form a sequence that may mix
       `nonterminal` (this same type) and `terminal` (p-terminal.type) elements. -->
  <type name="p-nonterminal.type">
   <structure role="#NODE" name="p-nonterminal">
    <member name="id" role="#ID" as_attribute="1" required="1"><cdata format="ID"/></member>
    <member name="is_head" ><cdata format="any"/></member>
    <!-- label of the incoming edge, as defined in the TIGER-XML and similar formats -->
    <member name="edgelabel"><cdata format="any"/></member>
    <member name="phrase"><cdata format="any"/></member>
    <!-- ordered list of p-function.type items (that type is declared outside this excerpt) -->
    <member name="functions">
      <list type="p-function.type" ordered="1"/>
    </member>
    <member name="index"><cdata format="any"/></member>
    <member name="coindex"><cdata format="any"/></member>
    <member name="children" role="#CHILDNODES">
      <sequence role="#CHILDNODES">
        <element name="nonterminal" type="p-nonterminal.type"/>
        <element name="terminal" type="p-terminal.type"/>
      </sequence>
    </member>
    <member name="wild_dump"><cdata format="any"/></member>
   </structure>
  </type>

  <!-- Terminal (leaf) node of a p-layer tree: role #NODE, element name
       "p-terminal". Declares no #CHILDNODES member. -->
  <type name="p-terminal.type">
     <structure role="#NODE" name="p-terminal">
        <member name="id" role="#ID" as_attribute="1" required="1"><cdata format="ID"/></member>
        <member name="is_head" ><cdata format="any"/></member>
        <member name="index"><cdata format="any"/></member>
        <member name="coindex"><cdata format="any"/></member>
        <!-- label of the incoming edge, as defined in the TIGER-XML and similar formats -->
        <member name="edgelabel"><cdata format="any"/></member>
        <member name="form"><cdata format="any"/></member>
        <member name="lemma"><cdata format="any"/></member>
        <member name="tag"><cdata format="any"/></member>
        <member name="bbn_tag" type="bbn_tag.type" />
        <!-- unordered list of alignment links (align-links.type) -->
        <member name="alignment">
            <list ordered="0" type="align-links.type"/>
        </member>
<!--        <member name="m.rf" role="#KNIT" type="m-node.type"/> -->
        <member name="wild_dump"><cdata format="any"/></member>
    </structure>
  </type>

  <type name="p-phrase.type">
    <choice>
      <value>S</value>
      <value>SBAR</value>
      <value>SBARQ</value>
      <value>SINV</value>
      <value>SQ</value>

xt/author/treebanks/treex_test/resources/treex_subschema_p_layer.xml  view on Meta::CPAN

      <value>PPS</value>
      <value>LRB</value>
      <value>RRB</value> -->

    </choice>
  </type>

  <!-- One alignment link: a PMLREF to the counterpart plus a free-form link
       type. Item type of the `alignment` list in p-terminal.type. -->
  <type name="align-links.type">
    <structure>
       <member name="counterpart.rf">
          <cdata format="PMLREF"/>
       </member>
       <member name="type">
          <cdata format="any"/>
       </member>
    </structure>
 </type>


</pml_schema>

xt/author/treebanks/treex_test/resources/treex_subschema_t_layer.xml  view on Meta::CPAN

  <description>T-layer schema</description>
  <!-- Treex PML schema  -->

  <import type="bbn_tag.type" schema="treex_subschema_bbn.xml"/>
  <import type="align-links.type" schema="treex_subschema_a_layer.xml"/>


  <!-- Root of a t-layer tree (role #NODE, element name "t-root").
       Its nodetype is fixed to the constant "root" and its children are an
       ordered list of t-node.type nodes. -->
  <type name="t-root.type">
    <structure role="#NODE" name="t-root">
      <member as_attribute="1" name="id" role="#ID" required="1">
        <cdata format="ID"/>
      </member>
      <member name="language" as_attribute="1" ><cdata format="any"/></member>
      <member name="direction" as_attribute="1"><cdata format="any"/></member>

      <member name="atree.rf">
        <cdata format="PMLREF"/>
      </member>
      <member name="nodetype">
        <constant>root</constant>
      </member>
      <!-- ptacek: adding ordering attr for pmltq queries using order-follows relations
           PML implementation allows for only one attr with #ORDER role
      -->
      <member name="ord" role="#ORDER" required="0">
	    <cdata format="nonNegativeInteger"/>
      </member>
      <member name="children" role="#CHILDNODES">
        <list ordered="1" type="t-node.type"/>
      </member>
      <member name="anot_error" type="t-anot_error.type" />
      <member name="pcedt_coref" type="t-pcedt_coref-root.type" />
      <member name="subtree_scores"  type="subtree_scores.type"/>
      <member name="src_tnode.rf"><cdata format="PMLREF"/></member>
      <member name="wild_dump"><cdata format="any"/></member>
    </structure>
  </type>

  <!-- Non-root node of a t-layer tree (role #NODE, element name "t-node").
       Recursive: `children` is an ordered list of t-node.type. Members are
       grouped below into those covered by Treex API methods, those not yet
       covered, and deprecated/questionable ones (kept only as comments). -->
  <type name="t-node.type">
    <structure role="#NODE" name="t-node">
       <member name="children" role="#CHILDNODES"><list ordered="1" type="t-node.type"/></member>

       <!--**************  COVERED BY TREEX API METHODS ************-->
       <!--**************  Unstructured attributes ************-->
      <member name="id" as_attribute="1" role="#ID" required="1"><cdata format="ID"/></member>
      <member name="nodetype"  type="t-nodetype.type"/>
      <member name="ord" role="#ORDER" required="0"><cdata format="nonNegativeInteger"/></member> <!-- ptacek: adding ordering attr for pmltq queries using order-follows relations; PML implementation allows for only one attr with #ORDER role -->

      <member name="t_lemma"><cdata format="any"/></member>
      <member name="functor"><alt type="func.type"/></member>
      <member name="subfunctor" type="t-subfunctor.type"/>
      <member name="is_member" type="bool.type"/>
      <member name="formeme"><cdata format="any"/></member>
      <member name="tfa" type="t-tfa.type"/>
      <member name="is_dsp_root" type="bool.type"/>
      <member name="sentmod" type="t-sentmod.type"/>
      <member name="is_parenthesis" type="bool.type"/>
      <member name="is_passive" type="bool.type"/>
      <member name="is_clause_head" type="bool.type"/>
      <member name="is_relclause_head" type="bool.type"/>
      <member name="clause_number"><cdata format="any"/></member>
      <member name="is_name_of_person" type="bool.type"/> <!-- this is redundant with API for accessing n-nodes, but it was in PDT 2.0 -->
      <member name="voice"><cdata format="any"/></member> <!-- for English: active/passive; for Czech there will be more values! -->
      <member name="t_lemma_origin"><cdata format="any"/></member> <!-- Values could be something like: clone, rule, dict,...  It is analogous to translation_model/t_lemma_variants/origin. popel 13.12.2008 -->
      <member name="formeme_origin"><cdata format="any"/></member> <!-- ditto -->

      <!--  References -->
      <member name="a" type="t-a.type"/> <!--name of getter/setter methods may be changed soon-->
      <member name="src_tnode.rf"><cdata format="PMLREF"/></member>

      <!-- Grammatemes accessible via $number = $node->gram_number; $node->set_gram_number('pl');  -->
      <member name="gram" type="t-gram.type"/>

      
      <!--**************  NOT YET COVERED BY TREEX API METHODS ************-->
      <member name="nombank_data"><cdata format="any" /></member>
      <member name="is_generated" type="bool.type"/>
      <member name="bbn_tag" type="bbn_tag.type"/>
      <member name="anot_error" type="t-anot_error.type" />
      <member name="mlayer_pos"><cdata format="any"/></member>
      <member name="is_state" type="bool.type"/>
      <member name="is_name" type="bool.type"/>
      <member name="is_infin" type="bool.type"/>
      <member name="is_reflexive" type="bool.type"/>
      <member name="is_optimizable" type="bool.type"/>

      <!--  References -->
      <member name="compl.rf"><list ordered="0"><cdata format="PMLREF"/></list></member>
      <member name="coref_text.rf"><list ordered="0"><cdata format="PMLREF"/></list></member>
      <member name="coref_text" required="0">
        <list ordered="0" type="t-coref_text-link.type"/>
      </member>
      <member name="coref_gram.rf"><list ordered="0"><cdata format="PMLREF"/></list></member>
      <member name="coref_special" type="coref_special.type"/>
      <member name="pcedt" type="t-pcedt.type"/>
      <member name="val_frame.rf"><alt><cdata format="PMLREF"/></alt></member>
      <member name="original_parent.rf"><cdata format="PMLREF"/></member><!-- When doing temporary changes of a tree structure, original parent  is saved before changing so it can be later restored. (popel 19.2.2009) -->

      <!-- Structured attributes -->
      <member name="translation_model" type="translation_model.type"/>
      <member name="pcedt_coref" type="t-pcedt_coref.type"/>
      <member name="quot">
        <list ordered="0">
          <structure>
            <member name="type"  type="t-type.type"/>
            <member name="set_id" >
              <cdata format="any"/>
            </member>
          </structure>
        </list>
      </member>
      
      <member name="alignment">
          <list ordered="0" type="align-links.type"/>
      </member>

      <!-- TimeML stuff (ptacek 22.2.2010)-->
      <member name="timeml">
	      <structure>
		      <member name="timex3">
			      <structure>
				      <member name="tid"><cdata format="any"/></member>
				      <member name="type" type="timex3-type.type" />
				      <member name="value"><cdata format="any"/></member>
				      <member name="mod" type="timex3-mod.type" />
				      <member name="freq"><cdata format="any"/></member>
				      <member name="quant"><cdata format="any"/></member>
			      </structure>
		      </member>
		      <member name="event">
			      <structure>
				      <member name="eid"><cdata format="any"/></member>
				      <member name="class" type="timeml-event-class.type" />
			      </structure>
		      </member>
		      <member name="signal">
			      <structure>
				      <member name="sid"><cdata format="any"/></member>
			      </structure>
		      </member>
	      </structure>
      </member>

      <!-- wordnet stuff (ptacek 16.2.2010)-->
      <member name="wn">
       		<structure>
       			<member name="synset_id"><cdata format="any"/></member>
       			<member name="hyperchain"><cdata format="any"/></member>
       		</structure>
      </member>
      
      <!-- knowledgebase stuff (ptacek 16.2.2010)-->
      <member name="kb">
       		<structure>
       			<member name="id"><cdata format="any"/></member>
       			<member name="type"><cdata format="any"/></member>
       		</structure>
       </member>
       

      <!-- dott to tmt (ptacek 3.8.08)-->
	  <member name="dott">
	  	<structure>
	  		<member name="pos.str"><cdata format="any"/></member>
	  		<member name="tag"><cdata format="any"/></member>
	  	</structure>
	  </member>
	<!-- ********* DEPRECATED / QUESTIONABLE ATTRIBUTES  ********* -->
	
	<!-- Named entities should be stored in n-trees - see treex_subschema_n_layer.xml
	     <member name="named_entity" type="t-named_entity.type"/>

	     merging NE recognition results into t-tree for pmltq querying
	     <member name="ne"><structure><member name="type"><cdata format="any"/></member></structure></member>-->

        <!-- There is (or should be for other languages) API in Treex for converting numerals to numbers and vice-versa -->
        <!-- t_lemma == 'dva' => numeric_t_lemma == '2' (ptacek 1.6.2010)-->
        <!-- <member name="numeric_t_lemma"><cdata format="any"/></member>-->

        <member name="wild_dump"><cdata format="any"/></member>
    </structure>
  </type>

<!-- *************** Types of t-layer attributes *******************  -->
  <!-- Unordered list of free-form strings; type of the `anot_error` member
       of t-root.type and t-node.type. -->
  <type name="t-anot_error.type">
    <list ordered="0">
	  <cdata format="any"/>
	</list>
  </type>

  <!-- One annotator comment: a required free-form `type` and a `text`.
       Item type of the `annot_comment` lists in the t-pcedt_coref types. -->
  <type name="t-annot_comment.type">
      <structure>
          <member name="type" required="1">
            <cdata format="any"/>
          </member>
          <member name="text">
            <cdata format="any"/>
          </member>
      </structure>
  </type>

  <!-- One textual-coreference link: a required PMLREF to the target node and a
       `type` restricted to SPEC or GEN (required="0"). Item type of the
       `coref_text` list in t-node.type. -->
  <type name="t-coref_text-link.type">
    <structure>
      <member name="target_node.rf" required="1">
        <cdata format="PMLREF"/></member>
      <member name="type" required="0">
        <choice>
          <value>SPEC</value>
          <value>GEN</value>
        </choice>
      </member>
    </structure>
  </type>
  
  <!-- Type of the `pcedt_coref` member of t-node.type: an unordered list of
       annotator comments, an ordered list of free-form `functor_change`
       entries, and two boolean flags. -->
  <type name="t-pcedt_coref.type">
      <structure>
          <member name="annot_comment">
              <list ordered="0" type="t-annot_comment.type"/>
          </member>
          <member name="highlite" type="bool.type"/>
          <member name="functor_change">
              <list ordered="1">
                  <cdata format="any"/>
              </list>
          </member>
          <member name="is_unchecked" type="bool.type"/>          
      </structure>
  </type>

  <type name="t-pcedt_coref-root.type">
      <structure>
          <member name="annot_comment">
              <list ordered="0" type="t-annot_comment.type"/>

xt/author/treebanks/treex_test/resources/treex_subschema_t_layer.xml  view on Meta::CPAN

      <member name="politeness" type="t-politeness.type"/>
      <member name="negation" type="t-negation.type"/>
      <member name="definiteness" type="t-definiteness.type"/>
      <member name="diathesis" type="t-diathesis.type"/>
    </structure>
  </type>

  <!-- Type of the `pcedt` member of t-node.type. All members are declared
       with required="0"; `pattern` is a non-negative integer and `alt_pattern`
       is an unordered list of pcedt-alt_pattern.type items. -->
  <type name="t-pcedt.type">
	<structure>
		<member name="cz_verb" required="0">
			<cdata format="any"/>
		</member>
		<member name="translation_type" required="0">
			<cdata format="any"/>
		</member>
		<member name="pattern" required="0">
			<cdata format="nonNegativeInteger"/>
		</member>
		<member name="pattern_mode" required="0" type="pcedt-pattern_mode.type"/>
		<member name="alt_pattern" required="0">
			<list ordered="0" type="pcedt-alt_pattern.type"/>
		</member>
	</structure>
  </type>

  <!-- Closed set of one-letter pattern-mode codes used by the `pattern_mode`
       members of t-pcedt.type and pcedt-alt_pattern.type.
       NOTE(review): the meaning of each letter is not stated in this schema. -->
  <type name="pcedt-pattern_mode.type">
    <choice>
		<value>f</value>
		<value>a</value>
		<value>u</value>
		<value>x</value>
    </choice>
  </type>

  <!-- One alternative pattern: a non-negative integer `pattern` and its
       `pattern_mode`. Item type of the `alt_pattern` list in t-pcedt.type. -->
  <type name="pcedt-alt_pattern.type">
	  <structure>
		  <member name="pattern" required="0">
			  <cdata format="nonNegativeInteger"/>
		  </member>
		  <member name="pattern_mode" required="0" type="pcedt-pattern_mode.type"/>
	  </structure>
  </type>

  <!-- Named-entity record: a free-form `number` and a `type` of
       t-ne-type.type. The only reference to this type visible in t-node.type
       (member `named_entity`) is commented out. -->
  <type name="t-named_entity.type">
    <structure>
      <member name="number"><cdata format="any"/></member>
      <member name="type"  type="t-ne-type.type"/>
    </structure>
  </type>

  <type name="t-ne-type.type">
    <choice>
      <value>person</value>
      <value>organization</value>
      <value>location</value>
    </choice>

xt/author/treebanks/treex_test/resources/treex_subschema_t_layer.xml  view on Meta::CPAN

      <value>dphr</value>
      <value>fphr</value>
      <value>list</value>
      <value>qcomplex</value>
    </choice>
  </type>

  <!-- Type of the `a` member of t-node.type: a single PMLREF `lex.rf` and an
       unordered list of PMLREFs `aux.rf`
       (presumably links to a-layer nodes; TODO confirm). -->
  <type name="t-a.type">
    <structure>
      <member name="lex.rf">
        <cdata format="PMLREF"/>
      </member>
      <member name="aux.rf">
        <list ordered="0">
          <cdata format="PMLREF"/>
        </list>
      </member>
    </structure>
  </type>

  <type name="coref_special.type">
    <choice>
      <value>segm</value>
      <value>exoph</value>
    </choice>

xt/author/treebanks/treex_test/resources/treex_subschema_t_layer.xml  view on Meta::CPAN

    </choice>
  </type>


   <!-- Type of the `translation_model` member of t-node.type: two unordered
        lists of variant records, one for t_lemma and one for formeme. Each
        record stores the variant with its logprob, backward_logprob and origin. -->
   <type name="translation_model.type">
      <structure>

         <member name="t_lemma_variants">
           <list ordered="0">
             <structure>
               <member name="t_lemma"> <cdata format="any"/> </member>
               <member name="logprob"> <cdata format="any"/> </member> <!-- Changed from prop_Lt_given_Ls, popel 13.12.2008 -->
               <member name="backward_logprob"> <cdata format="any"/> </member> <!-- if logprob is (cs|en) then backward means (en|cs). -->
               <member name="origin"> <cdata format="any"/> </member>  <!-- Changed from source, because we use term source in source/head.rf -->
               <member name="pos"> <cdata format="any"/> </member>
               <member name="feat_weights"> <list ordered="0"> <cdata format="any"/> </list> </member>
             </structure>
           </list>
         </member>

         <member name="formeme_variants">
           <list ordered="0">
             <structure>
               <member name="formeme"> <cdata format="any"/> </member>
               <member name="logprob"> <cdata format="any"/> </member> <!-- Changed from prop_Ft_given_Fs, popel 13.12.2008 -->
               <member name="backward_logprob"> <cdata format="any"/> </member>
               <member name="origin"> <cdata format="any"/> </member>  <!-- Symmetric to t_lemma_variants, odusek 02.03.2012 -->
             </structure>
           </list>
         </member>
      </structure>

   </type>

   <!-- language_model.type: structure with four members (gfd, gf, fd, d),
        each of type logcount_table.type.
        NOTE(review): the meaning of the member-name abbreviations is not
        stated anywhere in this schema; confirm with the model's authors. -->
   <type name="language_model.type">
      <structure>
         <member name="gfd" type="logcount_table.type" />
         <member name="gf" type="logcount_table.type" />
         <member name="fd" type="logcount_table.type" />
         <member name="d" type="logcount_table.type" />
      </structure>
   </type>

   <!-- logcount_table.type: list (declared ordered="0") of key/logcount pairs.
        Both members are cdata format "any". Used as the type of every member
        of language_model.type. -->
   <type name="logcount_table.type">
      <list ordered="0">
        <structure>
           <member name="key"> <cdata format="any"/> </member>
           <member name="logcount" > <cdata format="any"/> </member>
        </structure>
      </list>
   </type>


   <!-- transition_scores.type: list (declared ordered="0") of structures with
        the members hint, score, my_lexeme_index, my_formeme_index and
        eparent_lexeme_index. All members are cdata format "any", i.e. the
        index and score fields are not constrained to be numeric by the schema. -->
   <type name="transition_scores.type">
      <list ordered="0">
        <structure>
           <member name="hint"> <cdata format="any"/> </member>
           <member name="score"> <cdata format="any"/> </member>
           <member name="my_lexeme_index"> <cdata format="any"/>  </member>
           <member name="my_formeme_index"> <cdata format="any"/> </member>
           <member name="eparent_lexeme_index"> <cdata format="any"/> </member>
        </structure>
      </list>
   </type>

   <!-- subtree_scores.type: list (declared ordered="0") of structures with the
        members hint, score, my_lexeme_index and transitions_to_echildren.
        transitions_to_echildren is a nested list (also ordered="0") of
        structures carrying echild_id, echild_lexeme_index and
        echild_formeme_index. All leaf values are cdata format "any". -->
   <type name="subtree_scores.type">
      <list ordered="0">
        <structure>
           <member name="hint"> <cdata format="any"/> </member>
           <member name="score"> <cdata format="any"/> </member>
           <member name="my_lexeme_index"> <cdata format="any"/>  </member>
           <!-- One entry per referenced child: its id plus the lexeme/formeme indices. -->
           <member name="transitions_to_echildren">
             <list ordered="0">
               <structure>
                 <member name="echild_id"> <cdata format="any"/>   </member>
                 <member name="echild_lexeme_index"> <cdata format="any"/> </member>
                 <member name="echild_formeme_index"> <cdata format="any"/> </member>
               </structure>
             </list>
           </member>
        </structure>
      </list>
   </type>

</pml_schema>

xt/author/treebanks/treex_test/resources/treex_subschema_w_layer.xml  view on Meta::CPAN


  <!-- w-para.type: sequence whose elements may be
         othermarkup - of type w-othermarkup.type
         w           - of type w-node.type -->
  <type name="w-para.type">
    <sequence>
      <element name="othermarkup" type="w-othermarkup.type"/>
      <element name="w" type="w-node.type"/>
    </sequence>
  </type>

  <!-- w-othermarkup.type: container with one attribute, origin (cdata format
       "any"), and free-form cdata content (format "any"). -->
  <type name="w-othermarkup.type">
    <container>
      <attribute name="origin"><cdata format="any"/></attribute>
      <cdata format="any"/>
    </container>
  </type>

  <!-- w-node.type: structure (named "w-node") describing a single w element.
       Members:
         id             - required, role #ID, cdata format "ID", declared
                          with as_attribute="1"
         token          - required, cdata format "any"
         no_space_after - optional flag of type bool.type -->
  <type name="w-node.type">
    <structure name="w-node">
      <member as_attribute="1" name="id" role="#ID" required="1"><cdata format="ID"/></member>
      <member name="token" required="1"><cdata format="any"/></member>
      <member name="no_space_after" type="bool.type"/>
    </structure>
  </type>

<!-- TODO: this type would be better placed in the shared "common" schema -->
  <type name="bool.type">
    <choice>
      <value>0</value>
      <value>1</value>
    </choice>



( run in 0.824 second using v1.01-cache-2.11-cpan-454fe037f31 )