folia_edbo.xml 5.95 KB
<?xml version="1.0" encoding="UTF-8" ?>
<mtas>

  <!-- START MTAS INDEX CONFIGURATION -->
  <index>
    <!-- START GENERAL SETTINGS MTAS INDEX PROCESS -->
    <payload index="false" />
    <offset index="false" />
    <realoffset index="false" />
    <parent index="true" />
    <!-- END GENERAL SETTINGS MTAS INDEX PROCESS -->
  </index>
  <!-- END MTAS INDEX CONFIGURATION -->

  <!-- START CONFIGURATION MTAS FOLIA PARSER -->
  <parser name="mtas.analysis.parser.MtasFoliaParser">

    <!-- START GENERAL SETTINGS MTAS FOLIA PARSER -->
    <autorepair value="true" />
    <makeunique value="true" />
    <!-- END GENERAL SETTINGS MTAS FOLIA PARSER -->

    <!-- START REFERENCES -->
    <references>
    </references>
    <!-- END REFERENCES -->

    <!-- START MAPPINGS -->
    <mappings>

      <!-- START WORDS -->
      <mapping type="word" name="str">
      </mapping>      
      <!-- END WORDS -->

      <!-- START WORD ANNOTATIONS -->
      <mapping type="wordAnnotation" name="t">
        <token type="string" offset="false">
          <pre>
            <item type="name" />
          </pre>
          <post>
            <item type="text" />
          </post>
        </token>
        <token type="string" offset="false" realoffset="false" parent="false">
          <pre>
            <item type="name" />
            <item type="string" value="_lc" />
          </pre>
          <post>
            <item type="text" filter="ascii,lowercase" />
          </post>
        </token>
        <condition>
          <item type="ancestor" number="0" />
          <item type="ancestorWord" number="1" />
          <item type="unknownAncestor" number="0" />
          <item type="attribute" name="class" condition="Ticcl"/>
        </condition>
      </mapping>
      <mapping type="wordAnnotation" name="correction">
      </mapping>
      <mapping type="wordAnnotation" name="new">
      </mapping>
      <mapping type="wordAnnotation" name="original">
      </mapping>
      <mapping type="wordAnnotation" name="suggestion">
      </mapping>
      <mapping type="wordAnnotation" name="t">
        <token type="string" offset="false">
          <pre>
            <item type="name" />
          </pre>
          <post>
            <item type="text" />
          </post>
        </token>
        <token type="string" offset="false" realoffset="false" parent="false">
          <pre>
            <item type="name" />
            <item type="string" value="_lc" />
          </pre>
          <post>
            <item type="text" filter="ascii,lowercase" />
          </post>
        </token>
        <condition>
          <item type="ancestor" number="2" />
          <item type="ancestorName" condition="new" />
          <item type="unknownAncestor" number="0" />
          <item type="attribute" name="class" condition="Ticcl"/>
        </condition>
      </mapping>
      <mapping type="wordAnnotation" name="t">
        <token type="string" offset="false">
          <pre>
            <item type="name" />
            <item type="ancestorName" prefix="."/>
          </pre>
          <post>
            <item type="text" />
          </post>
        </token>
        <token type="string" offset="false" realoffset="false" parent="false">
          <pre>
            <item type="name" />
            <item type="string" value="_lc" />
            <item type="ancestorName" prefix="."/>
          </pre>
          <post>
            <item type="text" filter="ascii,lowercase" />
          </post>
        </token>
        <condition>
          <item type="ancestor" number="2" />
          <item type="ancestorName" condition="original" />
          <item type="unknownAncestor" number="0" />          
        </condition>
      </mapping>
      <mapping type="wordAnnotation" name="t">
        <token type="string" offset="false">
          <pre>
            <item type="name" />
            <item type="ancestorName" prefix="."/>
          </pre>
          <post>
            <item type="text" />
          </post>
        </token>
        <token type="string" offset="false" realoffset="false" parent="false">
          <pre>
            <item type="name" />
            <item type="string" value="_lc" />
            <item type="ancestorName" prefix="."/>
          </pre>
          <post>
            <item type="text" filter="ascii,lowercase" />
          </post>
        </token>
        <condition>
          <item type="ancestor" number="2" />
          <item type="ancestorName" condition="suggestion" />
          <item type="unknownAncestor" number="0" />          
        </condition>
      </mapping>
      <!-- END WORD ANNOTATIONS -->

      <!-- START RELATIONS -->
      <!-- END RELATIONS -->

      <!-- START GROUPS -->
      <mapping type="group" name="p">
        <token type="string" offset="false">
          <pre>
            <item type="name" />
          </pre>
          <post>
            <item type="attribute" name="class" />
          </post>
        </token>
      </mapping>
      <mapping type="group" name="div">
        <token type="string" offset="false">
          <pre>
            <item type="name" />
          </pre>
          <post>
            <item type="attribute" name="class" />
          </post>
        </token>
      </mapping>
      <mapping type="group" name="head">
        <token type="string" offset="false">
          <pre>
            <item type="name" />
          </pre>
          <post>
            <item type="attribute" name="class" />
          </post>
        </token>
      </mapping>
      <!-- END GROUPS -->

      <!-- START GROUP ANNOTATIONS -->
      <mapping type="groupAnnotation" name="lang">
        <token type="string" offset="false" realoffset="false" parent="false">
          <pre>
            <item type="name" />
          </pre>
          <post>
            <item type="attribute" name="class" />
          </post>
        </token>
      </mapping>
      <!-- END GROUP ANNOTATIONS -->

    </mappings>
    <!-- END MAPPINGS -->

  </parser>
  <!-- END CONFIGURATION MTAS FOLIA PARSER -->
  
</mtas>