276 | | <!-- Put your XML code here --> |
277 | | }}} |
278 | | * Issues/Discussion: |
279 | | * ... |
280 | | |
281 | | |
| 276 | #!xml |
| 277 | <fcs> |
| 278 | <layers time-unit="millis" audio-file-ref="http://hdl.handle.net/8015/1234567890"> |
| 279 | <layer id="http://endpoint.example.org/layers/orth1" type="orth"> |
| 280 | <span start="1" end="1" time-start="0" time-end="173">t</span> |
| 281 | <span start="3" end="4" time-start="173" time-end="304">da</span> |
| 282 | <span start="6" end="7" time-start="173" time-end="304">'s</span> |
| 283 | <span start="9" end="10" time-start="304" time-end="480">de</span> |
| 284 | <span start="12" end="16" time-start="480" time-end="1119">enige</span> |
| 285 | <span start="18" end="22" time-start="1339" time-end="1901">echte</span> |
| 286 | <span start="24" end="27" time-start="1901" time-end="2427">hoop</span> |
| 287 | <span start="29" end="32" time-start="3084" time-end="3493">voor</span> |
| 288 | <span start="34" end="36" time-start="3493" time-end="3754">ons</span> |
| 289 | <span start="38" end="43" time-start="3754" time-end="4274">mensen</span> |
| 290 | </layer> |
| 291 | <layer id="http://endpoint.example.org/layers/words1" type="words"> |
| 292 | <span start="1" end="1" time-start="0" time-end="173">word</span> |
| 293 | <span start="3" end="4" time-start="173" time-end="304">word</span> |
| 294 | <span start="6" end="7" time-start="173" time-end="304">word</span> |
| 295 | <span start="9" end="10" time-start="304" time-end="480">word</span> |
| 296 | <span start="12" end="16" time-start="480" time-end="1119">word</span> |
| 297 | <span start="18" end="22" time-start="1339" time-end="1901">word</span> |
| 298 | <span start="24" end="27" time-start="1901" time-end="2427">word</span> |
| 299 | <span start="29" end="32" time-start="3084" time-end="3493">word</span> |
| 300 | <span start="34" end="36" time-start="3493" time-end="3754">word</span> |
| 301 | <span start="38" end="43" time-start="3754" time-end="4274">word</span> |
| 302 | </layer> |
| 303 | <layer id="http://endpoint.example.org/layers/pos1" type="pos" alt-value-info="CGN POS tagset"> |
| 304 | <span start="1" end="1" time-start="0" time-end="173" alt-value="SPEC(afgebr)">X</span> |
| 305 | <span start="3" end="4" time-start="173" time-end="304" alt-value="VNW(aanw,pron,stan,vol,3o,ev)">PRON</span> |
| 306 | <span start="6" end="7" time-start="173" time-end="304" alt-value="WW(pv,tgw,ev)">VERB</span> |
| 307 | <span start="9" end="10" time-start="304" time-end="480" alt-value="LID(bep,stan,rest)">DET</span> |
| 308 | <span start="12" end="16" time-start="480" time-end="1119" alt-value="VNW(onbep,det,stan,prenom,met-e,rest)">DET</span> |
| 309 | <span start="18" end="22" time-start="1339" time-end="1901" alt-value="ADJ(prenom,basis,met-e,stan)">ADJ</span> |
| 310 | <span start="24" end="27" time-start="1901" time-end="2427" alt-value="N(soort,ev,basis,zijd,stan)">NOUN</span> |
| 311 | <span start="29" end="32" time-start="3084" time-end="3493" alt-value="VZ(init)">ADP</span> |
| 312 | <span start="34" end="36" time-start="3493" time-end="3754" alt-value="VNW(pr,pron,obl,vol,1,mv)">PRON</span> |
| 313 | <span start="38" end="43" time-start="3754" time-end="4274" alt-value="N(soort,mv,basis)">NOUN</span> |
| 314 | </layer> |
| 315 | <layer id="http://endpoint.example.org/layers/lemma1" type="lemma"> |
| 316 | <span start="1" end="1" time-start="0" time-end="173">_</span> |
| 317 | <span start="3" end="4" time-start="173" time-end="304">dat</span> |
| 318 | <span start="6" end="7" time-start="173" time-end="304">zijn</span> |
| 319 | <span start="9" end="10" time-start="304" time-end="480">de</span> |
| 320 | <span start="12" end="16" time-start="480" time-end="1119">enig</span> |
| 321 | <span start="18" end="22" time-start="1339" time-end="1901">echt</span> |
| 322 | <span start="24" end="27" time-start="1901" time-end="2427">hoop</span> |
| 323 | <span start="29" end="32" time-start="3084" time-end="3493">voor</span> |
| 324 | <span start="34" end="36" time-start="3493" time-end="3754">ons</span> |
| 325 | <span start="38" end="43" time-start="3754" time-end="4274">mens</span> |
| 326 | </layer> |
| 327 | <layer id="http://endpoint.example.org/layers/phonetics1" type="phonetics"> |
| 328 | <span start="1" end="1" time-start="0" time-end="173">t@</span> |
| 329 | <span start="3" end="4" time-start="173" time-end="304">dAz</span> |
| 330 | <span start="6" end="7" time-start="173" time-end="304">dAz</span> |
| 331 | <span start="9" end="10" time-start="304" time-end="480">d@</span> |
| 332 | <span start="12" end="16" time-start="480" time-end="1119">en@G@</span> |
| 333 | <span start="18" end="22" time-start="1339" time-end="1901">Ext@</span> |
| 334 | <span start="24" end="27" time-start="1901" time-end="2427">hop</span> |
| 335 | <span start="29" end="32" time-start="3084" time-end="3493">for</span> |
| 336 | <span start="34" end="36" time-start="3493" time-end="3754">Ons</span> |
| 337 | <span start="38" end="43" time-start="3754" time-end="4274">mEns@</span> |
| 338 | </layer> |
| 339 | </layers> |
| 340 | </fcs> |
| 341 | }}} |
| 342 | * Discussion: |
| 343 | * No preferred/primary layer, all layers are equal |
| 344 | * Each {{{<layer>}}} has a {{{@type}}}, which denotes the type of the layer (closed controlled vocabulary) |
| 345 | * If more than one layer of a certain type is available, the Aggregator would initially display the first. |
| 346 | * Each {{{<layer>}}} has an {{{@id}}}, which uniquely identifies the layer (with regard to the XML snippet); URIs are used to foster uniqueness |
| 347 | * Each {{{<span>}}} has {{{@start}}} and {{{@end}}} offsets, which establish how it relates to other spans |
| 348 | * The actual "content" is stored as PCDATA in {{{<span>}}}. Additional data, e.g. the original tags in case of pos, can be supplied in the {{{@alt-value}}} attribute. Information about what is contained there must be present in {{{@alt-value-info}}} on {{{<layer>}}}. |
| 349 | * Optionally, a {{{<span>}}} may carry {{{@time-start}}} and {{{@time-end}}} attributes; the unit of their values is denoted by {{{@time-unit}}} on {{{<layers>}}}. Additionally, a reference to an audio file can be supplied by {{{@audio-file-ref}}} on {{{<layers>}}}; this can be used to generate links for playback |
| 350 | * Issues: |
| 351 | * Quite a lot of redundancy (especially when all segments are more or less the same across layers) |
| 352 | * Time info adds even more redundancy. Furthermore, it's unclear how this information is supposed to be combined for a direct playback link. |
| 353 | * Possible solution: endpoints need to provide a complete and valid playback link? |
| 354 | * "Marker layers" (e.g. "words") only mark intervals but contain useless PCDATA |
| 355 | * Possible solution: allow empty PCDATA (or, better, empty {{{<span>}}} elements) in that case? |
| 356 | * What is the Aggregator supposed to display if it wants/needs to display offsets? The artificial character offsets make no real sense in the spoken data example. Human-readable start/end time offsets (e.g. 00:01:12.22/00:01:23.42) would probably be nicer. |
| 357 | * Possible solution: add a display label? |