XStandoff Examples

Simple sentences

Two XStandoff instances, each containing a single sentence annotated on different levels.

The text

[TXT]

This is a sentence.

The annotation levels

First annotation level: phrase structure

<?xml version="1.0" encoding="UTF-8"?>
<!-- Inline phrase-structure annotation of the sentence "This is a sentence.".
     The root <s> holds an <np> followed by a <vp>; the sentence-final period
     is direct text content of <s>, outside both phrases. -->
<s xmlns="http://www.xstandoff.net/phrase"
  xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
  xsi:schemaLocation="http://www.xstandoff.net/phrase ../xsd/phrase.xsd">
  <np>
    <pron>This</pron>
  </np><vp>
    <v>is</v>
    <np>
      <det>a</det>
      <n>sentence</n>
    </np>
  </vp>.</s>

Second annotation level: syllables

<?xml version="1.0" encoding="UTF-8"?>
<!-- Inline syllable annotation of the sentence "This is a sentence.".
     Each <syllable> wraps one syllable ("sentence" is split into "sen" and
     "tence"); the final period is plain text inside <syllables>. -->
<syllables xmlns="http://www.xstandoff.net/syllables"
 xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
 xsi:schemaLocation="http://www.xstandoff.net/syllables ../xsd/syllables.xsd">
  <syllable>This</syllable>
  <syllable>is</syllable>
  <syllable>a</syllable>
  <syllable>sen</syllable>
  <syllable>tence</syllable>.
</syllables>

The XStandoff instance

[XML] [SVG]

The resulting XStandoff instance.

<?xml version="1.0" encoding="UTF-8"?>
<!-- XStandoff instance combining the phrase-structure and syllable levels of
     "This is a sentence." as standoff annotation: the text is referenced once,
     character spans are declared once in xsf:segmentation, and every
     annotation element points to a span through its xsf:segment attribute. -->
<xsf:corpus xmlns:xsf="http://www.xstandoff.net/2009/xstandoff/1.1"
  xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
  xsi:schemaLocation="http://www.xstandoff.net/2009/xstandoff/1.1 
  http://www.xstandoff.net/2009/xstandoff/1.1/xsf.xsd">
   <xsf:corpusData xml:id="c1">
      <!-- The primary data (19 characters) lives in an external text file. -->
      <xsf:primaryData start="0" end="19">
         <xsf:primaryDataRef uri="../pd/sentence1.txt"/>
      </xsf:primaryData>
      <!-- Character spans shared by both levels. Offsets index into the
           primary data: seg2 (0-4) is "This", seg5 (5-7) is "is",
           seg8 (8-9) is "a", seg10 (10-18) is "sentence", which the syllable
           level splits into seg11 (10-13, "sen") and seg12 (13-18, "tence").
           Segments of type "ws" mark the single spaces between words;
           charRef="32" is presumably the code point of the space character. -->
      <xsf:segmentation>
         <xsf:segment xml:id="seg1" type="char" start="0" end="19"/>
         <xsf:segment xml:id="seg2" type="char" start="0" end="4"/>
         <xsf:segment xml:id="seg3" charRef="32" type="ws" start="4" end="5"/>
         <xsf:segment xml:id="seg4" type="char" start="5" end="18"/>
         <xsf:segment xml:id="seg5" type="char" start="5" end="7"/>
         <xsf:segment xml:id="seg6" charRef="32" type="ws" start="7" end="8"/>
         <xsf:segment xml:id="seg7" type="char" start="8" end="18"/>
         <xsf:segment xml:id="seg8" type="char" start="8" end="9"/>
         <xsf:segment xml:id="seg9" charRef="32" type="ws" start="9" end="10"/>
         <xsf:segment xml:id="seg10" type="char" start="10" end="18"/>
         <xsf:segment xml:id="seg11" type="char" start="10" end="13"/>
         <xsf:segment xml:id="seg12" type="char" start="13" end="18"/>
      </xsf:segmentation>
      <xsf:annotation>
         <!-- Phrase-structure level: same element hierarchy as the inline
              annotation, with text content replaced by segment references. -->
         <xsf:level xml:id="phrase">
            <xsf:layer xmlns:phrase="http://www.xstandoff.net/phrase"
              xsi:schemaLocation="http://www.xstandoff.net/phrase 
              ../xsd/phrase.xsd" priority="0">
               <phrase:s xsf:segment="seg1">
                  <phrase:np xsf:segment="seg2">
                     <phrase:pron xsf:segment="seg2"/>
                  </phrase:np>
                  <phrase:vp xsf:segment="seg4">
                     <phrase:v xsf:segment="seg5"/>
                     <phrase:np xsf:segment="seg7">
                        <phrase:det xsf:segment="seg8"/>
                        <phrase:n xsf:segment="seg10"/>
                     </phrase:np>
                  </phrase:vp>
               </phrase:s>
            </xsf:layer>
         </xsf:level>
         <!-- Syllable level: the layer uses the namespace and schema of the
              inline syllable annotation, so its elements are the same
              <syllables>/<syllable> vocabulary. -->
         <xsf:level xml:id="syll">
            <xsf:layer xmlns:syll="http://www.xstandoff.net/syllables"
              xsi:schemaLocation="http://www.xstandoff.net/syllables 
              ../xsd/syllables.xsd" priority="1">
               <syll:syllables xsf:segment="seg1">
                  <syll:syllable xsf:segment="seg2"/>
                  <syll:syllable xsf:segment="seg5"/>
                  <syll:syllable xsf:segment="seg8"/>
                  <syll:syllable xsf:segment="seg11"/>
                  <syll:syllable xsf:segment="seg12"/>
               </syll:syllables>
            </xsf:layer>
         </xsf:level>
      </xsf:annotation>
   </xsf:corpusData>
</xsf:corpus>

The text

[TXT]
The sun shines brighter.

The annotation levels

First annotation level: morphemes

<?xml version="1.0" encoding="UTF-8"?>
<!-- Inline morpheme annotation of the sentence "The sun shines brighter.".
     "shines" is split into "shine" + "s" and "brighter" into "bright" + "er";
     the final period is plain text inside <morphemes>. -->
<morphemes xmlns="http://www.xstandoff.net/morphemes"
 xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
 xsi:schemaLocation="http://www.xstandoff.net/morphemes ../xsd/morphemes.xsd">
  <morpheme>The</morpheme>
  <morpheme>sun</morpheme>
  <morpheme>shine</morpheme>
  <morpheme>s</morpheme>
  <morpheme>bright</morpheme>
  <morpheme>er</morpheme>.
</morphemes>

Second annotation level: syllables

<?xml version="1.0" encoding="UTF-8"?>
<!-- Inline syllable annotation of the sentence "The sun shines brighter.".
     "brighter" is split into "brigh" + "ter", a boundary that differs from
     the morpheme split "bright" + "er"; the final period is plain text
     inside <syllables>. -->
<syllables xmlns="http://www.xstandoff.net/syllables"
 xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
 xsi:schemaLocation="http://www.xstandoff.net/syllables ../xsd/syllables.xsd">
  <syllable>The</syllable>
  <syllable>sun</syllable>
  <syllable>shines</syllable>
  <syllable>brigh</syllable>
  <syllable>ter</syllable>.
</syllables>

The XStandoff instance

[XML] [SVG] [X3D]

The resulting XStandoff instance containing embedded OLAC metadata.

<?xml version="1.0" encoding="UTF-8"?>
<!-- XStandoff instance combining the morpheme and syllable levels of
     "The sun shines brighter." as standoff annotation. The primary data is
     embedded as text, and OLAC/Dublin Core metadata is attached both to the
     whole instance and to each annotation level. -->
<xsf:corpusData xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
  xsi:schemaLocation="http://www.xstandoff.net/2009/xstandoff/1.1 
  http://www.xstandoff.net/2009/xstandoff/1.1/xsf.xsd"
  xmlns:xsf="http://www.xstandoff.net/2009/xstandoff/1.1" xml:id="c1" xsfVersion="1.1">
   <!-- Instance-wide metadata. The default namespace declared here is Dublin
        Core, so the unprefixed creator/date/description elements belong to
        it. -->
   <xsf:meta xmlns:olac="http://www.language-archives.org/OLAC/1.0/" 
   xmlns="http://purl.org/dc/elements/1.1/"
      xmlns:dcterms="http://purl.org/dc/terms/"
      xsi:schemaLocation="http://www.language-archives.org/OLAC/1.0/ ../xsd/meta/olac.xsd">
      <olac:olac>
         <creator>Maik Stührenberg</creator>
         <date>2009-02-19</date>
         <description>Example sentence "The sun shines brighter" 
          annotated with morphemes and syllables.</description>
      </olac:olac>
   </xsf:meta>
   <!-- The primary data (24 characters) is embedded directly. -->
   <xsf:primaryData start="0" end="24" xml:lang="en">
      <xsf:textualContent>The sun shines brighter.</xsf:textualContent>
   </xsf:primaryData>
   <!-- Character spans shared by both levels. Offsets index into the primary
        data: seg2 (0-3) is "The", seg3 (4-7) is "sun", seg4 (8-14) is
        "shines", split for the morpheme level into seg5 (8-13, "shine") and
        seg6 (13-14, "s"). "brighter" is cut differently per level:
        seg7 (15-21, "bright") + seg10 (21-23, "er") for morphemes,
        seg8 (15-20, "brigh") + seg9 (20-23, "ter") for syllables, so seg7
        and seg9 overlap. No segments are declared for the spaces or the
        final period. -->
   <xsf:segmentation>
      <xsf:segment xml:id="seg1" type="char" start="0" end="24"/>
      <xsf:segment xml:id="seg2" type="char" start="0" end="3"/>
      <xsf:segment xml:id="seg3" type="char" start="4" end="7"/>
      <xsf:segment xml:id="seg4" type="char" start="8" end="14"/>
      <xsf:segment xml:id="seg5" type="char" start="8" end="13"/>
      <xsf:segment xml:id="seg6" type="char" start="13" end="14"/>
      <xsf:segment xml:id="seg7" type="char" start="15" end="21"/>
      <xsf:segment xml:id="seg8" type="char" start="15" end="20"/>
      <xsf:segment xml:id="seg9" type="char" start="20" end="23"/>
      <xsf:segment xml:id="seg10" type="char" start="21" end="23"/>
   </xsf:segmentation>
   <xsf:annotation>
      <!-- Morpheme level: one morph:morpheme per morpheme, each pointing to
           its character span. -->
      <xsf:level xml:id="l_morph">
         <xsf:meta xmlns:olac="http://www.language-archives.org/OLAC/1.0/" 
            xmlns="http://purl.org/dc/elements/1.1/"
            xmlns:dcterms="http://purl.org/dc/terms/"
            xsi:schemaLocation="http://www.language-archives.org/OLAC/1.0/ ../xsd/meta/olac.xsd">
            <olac:olac>
               <creator>Maik Stührenberg</creator>
               <date>2009-02-19</date>
               <description>Morpheme annotation. Manually annotated.</description>
            </olac:olac>
         </xsf:meta>
         <xsf:layer xmlns:morph="http://www.xstandoff.net/morphemes"
           xsi:schemaLocation="http://www.xstandoff.net/morphemes 
           ../xsd/morphemes.xsd" priority="0">
            <morph:morphemes xsf:segment="seg1">
               <morph:morpheme xsf:segment="seg2"/>
               <morph:morpheme xsf:segment="seg3"/>
               <morph:morpheme xsf:segment="seg5"/>
               <morph:morpheme xsf:segment="seg6"/>
               <morph:morpheme xsf:segment="seg7"/>
               <morph:morpheme xsf:segment="seg10"/>
            </morph:morphemes>
         </xsf:layer>
      </xsf:level>
      <!-- Syllable level: one syll:syllable per syllable; "shines" is a
           single syllable (seg4) here although it is two morphemes. -->
      <xsf:level xml:id="l_syll">
         <xsf:meta xmlns:olac="http://www.language-archives.org/OLAC/1.0/" 
            xmlns="http://purl.org/dc/elements/1.1/"
            xmlns:dcterms="http://purl.org/dc/terms/"
            xsi:schemaLocation="http://www.language-archives.org/OLAC/1.0/ ../xsd/meta/olac.xsd">
            <olac:olac>
               <creator>Maik Stührenberg</creator>
               <date>2009-02-19</date>
               <description>Syllables annotation. Manually annotated.</description>
            </olac:olac>
         </xsf:meta>
         <xsf:layer xmlns:syll="http://www.xstandoff.net/syllables"
           xsi:schemaLocation="http://www.xstandoff.net/syllables 
           ../xsd/syllables.xsd" priority="1">
            <syll:syllables xsf:segment="seg1">
               <syll:syllable xsf:segment="seg2"/>
               <syll:syllable xsf:segment="seg3"/>
               <syll:syllable xsf:segment="seg4"/>
               <syll:syllable xsf:segment="seg8"/>
               <syll:syllable xsf:segment="seg9"/>
            </syll:syllables>
         </xsf:layer>
      </xsf:level>
   </xsf:annotation>
</xsf:corpusData>