Appendix A

18-JUN-04

TGORG Table structure 1

TABLE_NAME COLUMN_NAME DATA_TYPE DATA_LENGTH

------

ACCOUNT NAME VARCHAR2 40

ACCOUNT VARCHAR2 10

ACCOUNTING ACC_ID NUMBER 22

NAME VARCHAR2 30

HOURS NUMBER 22

INPUT_DATE DATE 7

ACCOUNT_KEY VARCHAR2 80

ACCOUNT_VALUE VARCHAR2 80

WORK_TYPE VARCHAR2 80

COMM VARCHAR2 255

ADDRESS_BOOK_GROUP CN VARCHAR2 255

DN VARCHAR2 255

GROUP_CODE VARCHAR2 5

ADDRESS_BOOK_GROUP_MEMBER CN VARCHAR2 255

MEMBER VARCHAR2 255

DEALER DEALER VARCHAR2 20

EMAIL NAME VARCHAR2 40

EMAIL VARCHAR2 50

EQUIPMENT INV_NR VARCHAR2 25

PARENT_INV_NR VARCHAR2 25

EQUIP_TYPE VARCHAR2 10

USER_NAME VARCHAR2 30

IP_NR VARCHAR2 16

SERIAL_NR VARCHAR2 20

SELL_DATE DATE 7

GUARANTEE DATE 7

MAINT_CODE VARCHAR2 8

ORDER_NR NUMBER 22

MANUFACTURER VARCHAR2 20

DEALER VARCHAR2 20

ROOM_NR NUMBER 22

CONN_NR NUMBER 22

LAST_CHANGE DATE 7

NEXT_CHANGE DATE 7

STATUS VARCHAR2 8

NET_TYPE VARCHAR2 3

OS VARCHAR2 64

ETHERNET_NR VARCHAR2 18

CPU VARCHAR2 12

RAM VARCHAR2 32

DISK_INTERNAL VARCHAR2 32

DISK_EXTERNAL VARCHAR2 32

VIDEO_CARD VARCHAR2 12

AUDIO_CARD VARCHAR2 10

MONITOR_TYPE VARCHAR2 10

RESOLUTION VARCHAR2 10

ADD_ON VARCHAR2 255

STICKER VARCHAR2 1

LAST_UPDATE DATE 7

LAST_USER VARCHAR2 30

PS VARCHAR2 255

UPDATE_ID NUMBER 22

UPDATE_ID2 NUMBER 22

UPDATE_ID3 NUMBER 22

UPDATE_ID4 NUMBER 22

UPDATE_ID5 NUMBER 22

UPDATE_ID6 NUMBER 22

EQUIP_MODEL VARCHAR2 15

INTERNAL VARCHAR2 1

UPDATE_ID7 NUMBER 22

UPDATE_ID8 NUMBER 22

UPDATE_ID8B NUMBER 22

FLAG VARCHAR2 1

GUARANTEE_NR VARCHAR2 25

BACKUP_CLIENT VARCHAR2 1

CONN_NR2 NUMBER 22

EQUIP_CHECK VARCHAR2 1

EQUIPMENT_HISTORY INV_NR VARCHAR2 25

PARENT_INV_NR VARCHAR2 25

EQUIP_TYPE VARCHAR2 10

USER_NAME VARCHAR2 30

IP_NR VARCHAR2 16

SERIAL_NR VARCHAR2 20

SELL_DATE DATE 7

GUARANTEE DATE 7

MAINT_CODE VARCHAR2 8

ORDER_NR NUMBER 22

MANUFACTURER VARCHAR2 20

DEALER VARCHAR2 20

ROOM_NR NUMBER 22

CONN_NR NUMBER 22

LAST_CHANGE DATE 7

NEXT_CHANGE DATE 7

STATUS VARCHAR2 8

NET_TYPE VARCHAR2 3

OS VARCHAR2 64

ETHERNET_NR VARCHAR2 18

CPU VARCHAR2 12

RAM VARCHAR2 32

DISK_INTERNAL VARCHAR2 32

DISK_EXTERNAL VARCHAR2 32

VIDEO_CARD VARCHAR2 12

AUDIO_CARD VARCHAR2 10

MONITOR_TYPE VARCHAR2 10

RESOLUTION VARCHAR2 10

ADD_ON VARCHAR2 255

STICKER VARCHAR2 1

LAST_UPDATE DATE 7

LAST_USER VARCHAR2 30

PS VARCHAR2 255

UPDATE_ID NUMBER 22

UPDATE_ID2 NUMBER 22

UPDATE_ID3 NUMBER 22

UPDATE_ID4 NUMBER 22

UPDATE_ID5 NUMBER 22

UPDATE_ID6 NUMBER 22

EQUIP_MODEL VARCHAR2 15

INTERNAL VARCHAR2 1

UPDATE_ID7 NUMBER 22

UPDATE_ID8 NUMBER 22

UPDATE_ID8B NUMBER 22

FLAG VARCHAR2 1

GUARANTEE_NR VARCHAR2 25

BACKUP_CLIENT VARCHAR2 1

CONN_NR2 NUMBER 22

EQUIP_CHECK VARCHAR2 1

EQUIP_MODEL EQUIP_TYPE VARCHAR2 10

EQUIP_MODEL VARCHAR2 15

CAPACITY VARCHAR2 10

PS VARCHAR2 20

EQUIP_NET NET_TYPE VARCHAR2 3

PS VARCHAR2 20

EQUIP_STATUS STATUS VARCHAR2 8

PS VARCHAR2 20

EQUIP_TYPE EQUIP_TYPE VARCHAR2 10

PS VARCHAR2 20

FUNCTION FUNCTION VARCHAR2 50

HUB HUB_NR VARCHAR2 15

PORT_NR NUMBER 22

STATUS VARCHAR2 2

ROOM_NR NUMBER 22

CONN_NR NUMBER 22

HUB_NR_LINK VARCHAR2 5

PORT_NR_LINK NUMBER 22

PS VARCHAR2 255

UPDATE_ID NUMBER 22

SPEED NUMBER 22

HUB_STATUS STATUS VARCHAR2 2

PS VARCHAR2 20

IP IP_NR VARCHAR2 16

HOSTNAME VARCHAR2 12

PS VARCHAR2 255

IP_GROUP VARCHAR2 15

STATUS VARCHAR2 10

UPDATE_ID NUMBER 22

UPDATE_ID2 NUMBER 22

IP_ET HOSTNAME VARCHAR2 10

IP_NR VARCHAR2 16

ETHERNET_NR VARCHAR2 18

IP_GROUP IP_GROUP VARCHAR2 15

IP_STATUS STATUS VARCHAR2 10

MAINTENANCE MAINT_CODE VARCHAR2 8

PS VARCHAR2 20

MPI_BOOK_GROUP CN VARCHAR2 255

DN VARCHAR2 255

GROUP_CODE VARCHAR2 5

MPI_BOOK_GROUP_MEMBER CN VARCHAR2 255

MEMBER VARCHAR2 255

NATIONALITY NATIONALITY VARCHAR2 50

NV N_TYPE VARCHAR2 12

N_CODE VARCHAR2 8

N_NAAM VARCHAR2 10

N_INST VARCHAR2 2

N_OPMERKING VARCHAR2 40

INVENTNR VARCHAR2 12

STATUSCODE VARCHAR2 1

LONDERHOUD DATE 7

USER_NAME VARCHAR2 30

P_NAAM VARCHAR2 30

VAN DATE 7

TOT DATE 7

COMMENTAAR VARCHAR2 40

UPDATE_ID5 NUMBER 22

PATCH_ROOM ROOM_NR NUMBER 22

PATCH_NR NUMBER 22

TYPE VARCHAR2 5

TEL_NR VARCHAR2 25

TEL_PANEL NUMBER 22

PANEL_NR NUMBER 22

UPDATE_ID NUMBER 22

PATCH_ROOM_TYPE TYPE VARCHAR2 5

PS VARCHAR2 20

PERS USER_NAME VARCHAR2 30

USER_STATUS VARCHAR2 2

ACCOUNT VARCHAR2 10

EXPIRATION DATE 7

ROOM_NR VARCHAR2 10

OLD_ROOM_NR VARCHAR2 10

GROUP_CODE VARCHAR2 2

FROM_DATE DATE 7

TO_DATE DATE 7

SA_OF VARCHAR2 30

LEND_STATUS VARCHAR2 1

WISHES VARCHAR2 255

PHONE VARCHAR2 25

TEL_LIST VARCHAR2 1

ABSENCE_LIST VARCHAR2 1

SHARED VARCHAR2 1

FLOOR NUMBER 22

ROOM_GROUP VARCHAR2 40

WEB_AGREE VARCHAR2 1

PRIV_PAGE VARCHAR2 1

EMAIL VARCHAR2 50

PS VARCHAR2 255

PHONE2 VARCHAR2 25

ROOM_GROUP2 VARCHAR2 40

UPDATE_ID NUMBER 22

NATIONALITY VARCHAR2 50

UNIV_DEGREE VARCHAR2 50

FUNCTION VARCHAR2 50

PHOTO_FILE VARCHAR2 128

SPONSOR VARCHAR2 50

INTRODUCTION VARCHAR2 4000

USER_ID NUMBER 22

PERS_GROUP GROUP_CODE VARCHAR2 2

PS VARCHAR2 20

SPONSOR SPONSOR VARCHAR2 50

UNIV_DEGREE UNIV_DEGREE VARCHAR2 50

1

Appendix B1: Logical Structure of the core of the Dutch CELEX Database

Appendix B2: Extended Overview of the Dutch CELEX Database

1

Appendix C

<?xml version="1.0" encoding="UTF-8"?>

<!--W3C Schema generated by XML Spy v4.1 (http://www.xmlspy.com)-->

<xs:schema xmlns:xs="http://www.w3.org/2001/XMLSchema" xmlns:xdb="http://xmlns.oracle.com/xdb" elementFormDefault="qualified">

<!-- Empty element carrying a single required string attribute "item".
     Referenced as an optional child of <analysis>. -->
<xs:element name="accomodation">
  <xs:complexType>
    <xs:attribute name="item" type="xs:string" use="required"/>
  </xs:complexType>
</xs:element>

<!-- Empty flag element with a required string attribute "value".
     Referenced as an optional child of <interpretation>. -->
<xs:element name="ambiguous">
  <xs:complexType>
    <xs:attribute name="value" type="xs:string" use="required"/>
  </xs:complexType>
</xs:element>

<!-- One analysis inside an <errorGroup>, identified by the required "aid" attribute.
     Children must appear in the order listed. All are optional except
     <process> (1 to 2 occurrences) and <itemProperties> (1 to 3 occurrences). -->
<xs:element name="analysis">
  <xs:complexType>
    <xs:sequence>
      <xs:element ref="errorType" minOccurs="0"/>
      <xs:element ref="comments" minOccurs="0"/>
      <xs:element ref="targetUnit" minOccurs="0"/>
      <xs:element ref="errorUnit" minOccurs="0"/>
      <xs:element ref="sourceLocation" minOccurs="0"/>
      <xs:element ref="rule" minOccurs="0"/>
      <xs:element ref="accomodation" minOccurs="0"/>
      <xs:element ref="wellformedness" minOccurs="0"/>
      <xs:element ref="process" maxOccurs="2"/>
      <xs:element ref="itemProperties" maxOccurs="3"/>
    </xs:sequence>
    <xs:attribute name="aid" type="xs:short" use="required"/>
  </xs:complexType>
</xs:element>

<!-- Plain string elements: <channel> and <coder> are optional children of <se>;
     <comments> is an optional child of <analysis>. -->
<xs:element name="channel" type="xs:string"/>

<xs:element name="coder" type="xs:string"/>

<xs:element name="comments" type="xs:string"/>

<!-- Empty flag element with a required string attribute "value".
     Referenced as an optional child of <se>. -->
<xs:element name="complete">
  <xs:complexType>
    <xs:attribute name="value" type="xs:string" use="required"/>
  </xs:complexType>
</xs:element>

<!-- Plain string elements: <corpus> is an optional child of <se>;
     <corpusdescription> is an optional child of <subcorpus>. -->
<xs:element name="corpus" type="xs:string"/>

<xs:element name="corpusdescription" type="xs:string"/>

<!-- Empty flag element with a required string attribute "value".
     Referenced as an optional child of <se>. -->
<xs:element name="corrected">
  <xs:complexType>
    <xs:attribute name="value" type="xs:string" use="required"/>
  </xs:complexType>
</xs:element>

<!-- Optional child of <se>. Typed as xs:string, so no date format is enforced. -->
<xs:element name="date" type="xs:string"/>

<!-- Container for the domain descriptions of an <errorGroup>.
     Each domain kind is optional and may occur up to three times,
     in the fixed order syntactic, prosodic, stress, word, syllabic. -->
<xs:element name="domainProperties">
  <xs:complexType>
    <xs:sequence>
      <xs:element ref="syntacticDomain" minOccurs="0" maxOccurs="3"/>
      <xs:element ref="prosodicDomain" minOccurs="0" maxOccurs="3"/>
      <xs:element ref="stressDomain" minOccurs="0" maxOccurs="3"/>
      <xs:element ref="wordDomain" minOccurs="0" maxOccurs="3"/>
      <xs:element ref="syllabicDomain" minOccurs="0" maxOccurs="3"/>
    </xs:sequence>
  </xs:complexType>
</xs:element>

<!-- Groups up to ten <analysis> elements followed by an optional <domainProperties>.
     Identified by the required "eid" attribute; optional child of <interpretation>. -->
<xs:element name="errorGroup">
  <xs:complexType>
    <xs:sequence>
      <xs:element ref="analysis" minOccurs="0" maxOccurs="10"/>
      <xs:element ref="domainProperties" minOccurs="0"/>
    </xs:sequence>
    <xs:attribute name="eid" type="xs:short" use="required"/>
  </xs:complexType>
</xs:element>

<!-- String content plus a required string attribute "language".
     Optional child of <interpretation>; same shape as <targetTranslation>. -->
<xs:element name="errorTranslation">
  <xs:complexType>
    <xs:simpleContent>
      <xs:extension base="xs:string">
        <xs:attribute name="language" type="xs:string" use="required"/>
      </xs:extension>
    </xs:simpleContent>
  </xs:complexType>
</xs:element>

<!-- Closed vocabulary for the error type of an <analysis>.
     The empty string is an allowed value, so <errorType/> validates. -->
<xs:element name="errorType">
  <xs:simpleType>
    <xs:restriction base="xs:string">
      <xs:enumeration value=""/>
      <xs:enumeration value="lexical"/>
      <xs:enumeration value="morphological"/>
      <xs:enumeration value="morphosyntactic"/>
      <xs:enumeration value="phonological"/>
      <xs:enumeration value="phonological/lexical"/>
      <xs:enumeration value="phonological/morphologic"/>
      <xs:enumeration value="phrasal"/>
      <xs:enumeration value="syntactic"/>
      <xs:enumeration value="syntactic/morphological"/>
      <xs:enumeration value="tip-of-the-tongue"/>
    </xs:restriction>
  </xs:simpleType>
</xs:element>

<!-- Plain string elements: <errorUnit> is an optional child of <analysis>;
     <errorUtterance> is the one required child of <interpretation>;
     <extraInfo> is an optional child of <interpretation>. -->
<xs:element name="errorUnit" type="xs:string"/>

<xs:element name="errorUtterance" type="xs:string"/>

<xs:element name="extraInfo" type="xs:string"/>

<!-- Empty element describing one feature through two required string attributes,
     "class" and "value". Optional child of <itemProperties>. -->
<xs:element name="feature">
  <xs:complexType>
    <xs:attribute name="class" type="xs:string" use="required"/>
    <xs:attribute name="value" type="xs:string" use="required"/>
  </xs:complexType>
</xs:element>

<!-- Closed vocabulary of grammatical word classes.
     Optional child of <itemProperties>. -->
<xs:element name="grammaticalWord">
  <xs:simpleType>
    <xs:restriction base="xs:string">
      <xs:enumeration value="WH"/>
      <xs:enumeration value="aux/modal"/>
      <xs:enumeration value="modifier"/>
      <xs:enumeration value="other"/>
      <xs:enumeration value="preposition"/>
      <xs:enumeration value="pronoun"/>
      <xs:enumeration value="quantifier"/>
      <xs:enumeration value="clitic"/>
      <xs:enumeration value="copula"/>
    </xs:restriction>
  </xs:simpleType>
</xs:element>

<!-- One interpretation of a speech error, identified by the required "iid" attribute.
     Children must appear in the order listed; only <errorUtterance> is mandatory.
     Optional child of <se>. -->
<xs:element name="interpretation">
  <xs:complexType>
    <xs:sequence>
      <xs:element ref="targetUtterance" minOccurs="0"/>
      <xs:element ref="errorUtterance"/>
      <xs:element ref="phonetics" minOccurs="0"/>
      <xs:element ref="targetTranslation" minOccurs="0"/>
      <xs:element ref="errorTranslation" minOccurs="0"/>
      <xs:element ref="ambiguous" minOccurs="0"/>
      <xs:element ref="errorGroup" minOccurs="0"/>
      <xs:element ref="issues" minOccurs="0"/>
      <xs:element ref="issues2" minOccurs="0"/>
      <xs:element ref="extraInfo" minOccurs="0"/>
    </xs:sequence>
    <xs:attribute name="iid" type="xs:short" use="required"/>
  </xs:complexType>
</xs:element>

<!-- Plain string elements; both are optional children of <interpretation>. -->
<xs:element name="issues" type="xs:string"/>

<xs:element name="issues2" type="xs:string"/>

<!-- Properties of one item of an <analysis>. The required "item" attribute
     must be 1, 2 or 3. Because the content model is xs:all, each child is
     optional, may appear at most once, and may appear in any order. -->
<xs:element name="itemProperties">
  <xs:complexType>
    <xs:all>
      <xs:element ref="syllable" minOccurs="0"/>
      <xs:element ref="feature" minOccurs="0"/>
      <xs:element ref="segment" minOccurs="0"/>
      <xs:element ref="supraSegment" minOccurs="0"/>
      <xs:element ref="phrase" minOccurs="0"/>
      <xs:element ref="lexicalWord" minOccurs="0"/>
      <xs:element ref="morpheme" minOccurs="0"/>
      <xs:element ref="grammaticalWord" minOccurs="0"/>
    </xs:all>
    <xs:attribute name="item" use="required">
      <xs:simpleType>
        <xs:restriction base="xs:NMTOKEN">
          <xs:enumeration value="1"/>
          <xs:enumeration value="2"/>
          <xs:enumeration value="3"/>
        </xs:restriction>
      </xs:simpleType>
    </xs:attribute>
  </xs:complexType>
</xs:element>

<!-- Plain string elements; both are optional children of <itemProperties>. -->
<xs:element name="lexicalWord" type="xs:string"/>

<xs:element name="morpheme" type="xs:string"/>

<!-- Empty flag element with a required string attribute "value".
     Referenced as an optional child of <se>. -->
<xs:element name="multipleTrials">
  <xs:complexType>
    <xs:attribute name="value" type="xs:string" use="required"/>
  </xs:complexType>
</xs:element>

<!-- Plain string element; optional child of <interpretation>. -->
<xs:element name="phonetics" type="xs:string"/>

<!-- Closed vocabulary for the phrase property of an item.
     Optional child of <itemProperties>. The list holds both short and long
     spellings (c/cliche, i/idiom, s/sentence, Y/Yes) as separate values. -->
<xs:element name="phrase">
  <xs:simpleType>
    <xs:restriction base="xs:string">
      <xs:enumeration value="X"/>
      <xs:enumeration value="XP"/>
      <xs:enumeration value="c"/>
      <xs:enumeration value="cliche"/>
      <xs:enumeration value="i"/>
      <xs:enumeration value="idiom"/>
      <xs:enumeration value="s"/>
      <xs:enumeration value="sentence"/>
      <xs:enumeration value="Yes"/>
      <xs:enumeration value="Y"/>
    </xs:restriction>
  </xs:simpleType>
</xs:element>

<!-- Empty element describing a process of an <analysis> (1 to 2 per analysis).
     "pid" is required and must be 1 or 2; "procedure" and "direction"
     are optional free-text attributes. -->
<xs:element name="process">
  <xs:complexType>
    <xs:attribute name="pid" use="required">
      <xs:simpleType>
        <xs:restriction base="xs:NMTOKEN">
          <xs:enumeration value="1"/>
          <xs:enumeration value="2"/>
        </xs:restriction>
      </xs:simpleType>
    </xs:attribute>
    <xs:attribute name="procedure" type="xs:string" use="optional"/>
    <xs:attribute name="direction" type="xs:string" use="optional"/>
  </xs:complexType>
</xs:element>

<!-- String content plus a required "item" attribute restricted to
     error, source or target. Optional child of <domainProperties>. -->
<xs:element name="prosodicDomain">
  <xs:complexType>
    <xs:simpleContent>
      <xs:extension base="xs:string">
        <xs:attribute name="item" use="required">
          <xs:simpleType>
            <xs:restriction base="xs:NMTOKEN">
              <xs:enumeration value="error"/>
              <xs:enumeration value="source"/>
              <xs:enumeration value="target"/>
            </xs:restriction>
          </xs:simpleType>
        </xs:attribute>
      </xs:extension>
    </xs:simpleContent>
  </xs:complexType>
</xs:element>

<!-- Plain string element; optional child of <se>. -->
<xs:element name="reporter" type="xs:string"/>

<!-- String content plus a required string attribute "ruleType".
     Optional child of <analysis>. -->
<xs:element name="rule">
  <xs:complexType>
    <xs:simpleContent>
      <xs:extension base="xs:string">
        <xs:attribute name="ruleType" type="xs:string" use="required"/>
      </xs:extension>
    </xs:simpleContent>
  </xs:complexType>
</xs:element>

<!-- One record of a <subcorpus>, with an optional "errorid" attribute.
     Every child is optional and occurs at most once, but the children
     that are present must follow the order listed here. -->
<xs:element name="se">
  <xs:complexType>
    <xs:sequence>
      <xs:element ref="corpus" minOccurs="0"/>
      <xs:element ref="targetlanguage" minOccurs="0"/>
      <xs:element ref="coder" minOccurs="0"/>
      <xs:element ref="speaker" minOccurs="0"/>
      <xs:element ref="speakerData" minOccurs="0"/>
      <xs:element ref="speakerState" minOccurs="0"/>
      <xs:element ref="reporter" minOccurs="0"/>
      <xs:element ref="witnesses" minOccurs="0"/>
      <xs:element ref="date" minOccurs="0"/>
      <xs:element ref="channel" minOccurs="0"/>
      <xs:element ref="situation" minOccurs="0"/>
      <xs:element ref="complete" minOccurs="0"/>
      <xs:element ref="corrected" minOccurs="0"/>
      <xs:element ref="multipleTrials" minOccurs="0"/>
      <xs:element ref="interpretation" minOccurs="0"/>
    </xs:sequence>
    <xs:attribute name="errorid" type="xs:short" use="optional"/>
  </xs:complexType>
</xs:element>

<!-- A sub-corpus of <sedb>: an optional <corpusdescription> followed by
     one or more <se> records. All three attributes are optional strings. -->
<xs:element name="subcorpus">
  <xs:complexType>
    <xs:sequence>
      <xs:element ref="corpusdescription" minOccurs="0"/>
      <xs:element ref="se" maxOccurs="unbounded"/>
    </xs:sequence>
    <xs:attribute name="corpusname" type="xs:string" use="optional"/>
    <xs:attribute name="normality" type="xs:string" use="optional"/>
    <xs:attribute name="errortypes" type="xs:string" use="optional"/>
  </xs:complexType>
</xs:element>

<!-- Document element: no other declaration in this schema references it.
     Holds any number of <subcorpus> children. The xdb:defaultTable annotation
     names the table XML_SEDB3 for this element. -->
<xs:element name="sedb" xdb:defaultTable="XML_SEDB3">
  <xs:complexType>
    <xs:sequence>
      <xs:element ref="subcorpus" minOccurs="0" maxOccurs="unbounded"/>
    </xs:sequence>
    <xs:attribute name="corpus" type="xs:string" use="optional"/>
    <xs:attribute name="status" type="xs:string" use="optional"/>
    <xs:attribute name="version" type="xs:string" use="optional"/>
  </xs:complexType>
</xs:element>

<!-- Closed vocabulary for the segment property of an item.
     Optional child of <itemProperties>. -->
<xs:element name="segment">
  <xs:simpleType>
    <xs:restriction base="xs:string">
      <xs:enumeration value="C"/>
      <xs:enumeration value="C-string"/>
      <xs:enumeration value="CV"/>
      <xs:enumeration value="V"/>
      <xs:enumeration value="VC"/>
      <xs:enumeration value="CC"/>
      <xs:enumeration value="diphthong"/>
      <xs:enumeration value="syllable+"/>
      <xs:enumeration value="complex-V"/>
    </xs:restriction>
  </xs:simpleType>
</xs:element>

<!-- Plain string elements. <sourceLocation> is an optional child of <analysis>;
     the other four are optional children of <se>. -->
<xs:element name="situation" type="xs:string"/>

<xs:element name="sourceLocation" type="xs:string"/>

<xs:element name="speaker" type="xs:string"/>

<xs:element name="speakerData" type="xs:string"/>

<xs:element name="speakerState" type="xs:string"/>

<!-- String content plus a required "item" attribute restricted to
     error, source or target. Optional child of <domainProperties>. -->
<xs:element name="stressDomain">
  <xs:complexType>
    <xs:simpleContent>
      <xs:extension base="xs:string">
        <xs:attribute name="item" use="required">
          <xs:simpleType>
            <xs:restriction base="xs:NMTOKEN">
              <xs:enumeration value="error"/>
              <xs:enumeration value="source"/>
              <xs:enumeration value="target"/>
            </xs:restriction>
          </xs:simpleType>
        </xs:attribute>
      </xs:extension>
    </xs:simpleContent>
  </xs:complexType>
</xs:element>

<!-- Two-value vocabulary (stress or intonation).
     Optional child of <itemProperties>. -->
<xs:element name="supraSegment">
  <xs:simpleType>
    <xs:restriction base="xs:string">
      <xs:enumeration value="stress"/>
      <xs:enumeration value="intonation"/>
    </xs:restriction>
  </xs:simpleType>
</xs:element>

<!-- String content plus a required "item" attribute restricted to
     source, error or target. Optional child of <domainProperties>.
     The content is an unrestricted xs:string: it does not use the
     syllabicDomainSimpleType enumeration declared in this schema. -->
<xs:element name="syllabicDomain">
  <xs:complexType>
    <xs:simpleContent>
      <xs:extension base="xs:string">
        <xs:attribute name="item" use="required">
          <xs:simpleType>
            <xs:restriction base="xs:NMTOKEN">
              <xs:enumeration value="source"/>
              <xs:enumeration value="error"/>
              <xs:enumeration value="target"/>
            </xs:restriction>
          </xs:simpleType>
        </xs:attribute>
      </xs:extension>
    </xs:simpleContent>
  </xs:complexType>
</xs:element>

<!-- Named vocabulary of syllable positions.
     NOTE(review): no element or attribute in this schema references this type,
     so these values are not enforced anywhere; confirm whether <syllabicDomain>
     was meant to use it. -->
<xs:simpleType name="syllabicDomainSimpleType">
  <xs:restriction base="xs:string">
    <xs:enumeration value="Coda"/>
    <xs:enumeration value="Nucleus"/>
    <xs:enumeration value="Onset"/>
    <xs:enumeration value="Rhyme"/>
  </xs:restriction>
</xs:simpleType>

<!-- Closed vocabulary of syllable shapes written with C and V symbols.
     Optional child of <itemProperties>. -->
<xs:element name="syllable">
  <xs:simpleType>
    <xs:restriction base="xs:string">
      <xs:enumeration value="$C"/>
      <xs:enumeration value="C*V"/>
      <xs:enumeration value="C*VC*"/>
      <xs:enumeration value="CV"/>
      <xs:enumeration value="CVV"/>
      <xs:enumeration value="V"/>
      <xs:enumeration value="VC"/>
      <xs:enumeration value="VC*"/>
      <xs:enumeration value="CCV"/>
      <xs:enumeration value="CVC"/>
      <xs:enumeration value="CC"/>
      <xs:enumeration value="CVC-CV"/>
      <xs:enumeration value="C-CVC"/>
      <xs:enumeration value="CCVC"/>
    </xs:restriction>
  </xs:simpleType>
</xs:element>

<!-- String content plus a required "item" attribute.
     Optional child of <domainProperties>. Unlike the other domain elements,
     "item" is a free xs:string here, not an error/source/target enumeration,
     and the content does not use syntacticDomainSimpleType. -->
<xs:element name="syntacticDomain">
  <xs:complexType>
    <xs:simpleContent>
      <xs:extension base="xs:string">
        <xs:attribute name="item" type="xs:string" use="required"/>
      </xs:extension>
    </xs:simpleContent>
  </xs:complexType>
</xs:element>

<!-- Named vocabulary of syntactic category labels.
     NOTE(review): no element or attribute in this schema references this type,
     so these values are not enforced anywhere; confirm whether <syntacticDomain>
     was meant to use it. -->
<xs:simpleType name="syntacticDomainSimpleType">
  <xs:restriction base="xs:string">
    <xs:enumeration value="AP"/>
    <xs:enumeration value="AdjP"/>
    <xs:enumeration value="AdvP"/>
    <xs:enumeration value="Adv"/>
    <xs:enumeration value="Adj"/>
    <xs:enumeration value="N"/>
    <xs:enumeration value="NP"/>
    <xs:enumeration value="PP"/>
    <xs:enumeration value="S"/>
    <xs:enumeration value="V"/>
    <xs:enumeration value="VP"/>
    <xs:enumeration value="Word"/>
  </xs:restriction>
</xs:simpleType>

<!-- String content plus a required string attribute "language".
     Optional child of <interpretation>; same shape as <errorTranslation>. -->
<xs:element name="targetTranslation">
  <xs:complexType>
    <xs:simpleContent>
      <xs:extension base="xs:string">
        <xs:attribute name="language" type="xs:string" use="required"/>
      </xs:extension>
    </xs:simpleContent>
  </xs:complexType>
</xs:element>

<!-- Plain string elements: <targetUnit> is an optional child of <analysis>,
     <targetUtterance> of <interpretation>, and <targetlanguage> of <se>. -->
<xs:element name="targetUnit" type="xs:string"/>

<xs:element name="targetUtterance" type="xs:string"/>

<xs:element name="targetlanguage" type="xs:string"/>

<!-- Empty element with four well-formedness judgements as attributes.
     None declares "use", so all four are optional. "syntax", "lexical" and
     "phonology" accept no/yes; "semantics" additionally accepts anomalous.
     Optional child of <analysis>. -->
<xs:element name="wellformedness">
  <xs:complexType>
    <xs:attribute name="syntax">
      <xs:simpleType>
        <xs:restriction base="xs:NMTOKEN">
          <xs:enumeration value="no"/>
          <xs:enumeration value="yes"/>
        </xs:restriction>
      </xs:simpleType>
    </xs:attribute>
    <xs:attribute name="lexical">
      <xs:simpleType>
        <xs:restriction base="xs:NMTOKEN">
          <xs:enumeration value="no"/>
          <xs:enumeration value="yes"/>
        </xs:restriction>
      </xs:simpleType>
    </xs:attribute>
    <xs:attribute name="phonology">
      <xs:simpleType>
        <xs:restriction base="xs:NMTOKEN">
          <xs:enumeration value="no"/>
          <xs:enumeration value="yes"/>
        </xs:restriction>
      </xs:simpleType>
    </xs:attribute>
    <xs:attribute name="semantics">
      <xs:simpleType>
        <xs:restriction base="xs:NMTOKEN">
          <xs:enumeration value="anomalous"/>
          <xs:enumeration value="no"/>
          <xs:enumeration value="yes"/>
        </xs:restriction>
      </xs:simpleType>
    </xs:attribute>
  </xs:complexType>
</xs:element>

<!-- Optional child of <se>. Declared as xs:string, like the sibling <reporter>
     and <speaker> elements, so that the element can carry text. The previous
     empty complex type forbade any content. An empty <witnesses/> is still
     valid, so existing documents are unaffected. -->
<xs:element name="witnesses" type="xs:string"/>

<!-- String content plus a required "item" attribute restricted to
     error, target or source. Optional child of <domainProperties>.
     The content is an unrestricted xs:string: it does not use the
     wordDomainSimpleType enumeration declared in this schema. -->
<xs:element name="wordDomain">
  <xs:complexType>
    <xs:simpleContent>
      <xs:extension base="xs:string">
        <xs:attribute name="item" use="required">
          <xs:simpleType>
            <xs:restriction base="xs:NMTOKEN">
              <xs:enumeration value="error"/>
              <xs:enumeration value="target"/>
              <xs:enumeration value="source"/>
            </xs:restriction>
          </xs:simpleType>
        </xs:attribute>
      </xs:extension>
    </xs:simpleContent>
  </xs:complexType>
</xs:element>

<!-- Named vocabulary of positions within a word.
     NOTE(review): no element or attribute in this schema references this type,
     so these values are not enforced anywhere; confirm whether <wordDomain>
     was meant to use it. -->
<xs:simpleType name="wordDomainSimpleType">
  <xs:restriction base="xs:string">
    <xs:enumeration value="Word-Final"/>
    <xs:enumeration value="Word-Initial"/>
    <xs:enumeration value="Word-Medial"/>
  </xs:restriction>
</xs:simpleType>

</xs:schema>

Appendix D

<?xml version="1.0" encoding="UTF-8"?>

<sedb corpus="uclasec" status="final" version="1.2-28-06-2002" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:noNamespaceSchemaLocation="sedb.xsd">

<subcorpus corpusname="Uclasec.English.Fromkin" normality="normal" errortypes="mixed">

<corpusdescription>

This corpus was compiled by Victoria A. Fromkin, UCLA, Los Angeles, USA.

The errors were collected during 1970ff.

See xxxxxx for further details.

</corpusdescription>

<se errorid="3111">

<corpus>UCLA</corpus>

<targetlanguage>Eng</targetlanguage>

<coder/>

<speaker>Viv W</speaker>

<reporter>Vicki Fromkin</reporter>

<date>11/76</date>

<!--sound-->

<!--video-->

<channel/>

<situation/>

<complete value="yes"/>

<corrected value="yes"/>

<multipleTrials value="no"/>

<interpretation iid="1">

<targetUtterance>taste the MEAT to see if there's too much salt</targetUtterance>

<errorUtterance>taste the NEAT to see if there's too much salt</errorUtterance>

<ambiguous value="yes"/>

<errorGroup eid="1">

<analysis aid="1">

<errorType>phonological</errorType>

<comments>perseveration of the place of articualation of [t] from 'taste' OR

anticipation of the place of articulation of [s] in 'see' OR

anticipation of the place of articulation of [t] in 'meat'</comments>

<targetUnit>meat</targetUnit>

<errorUnit>neat</errorUnit>

<sourceLocation>utterance internal</sourceLocation>

<rule ruleType=""/>

<wellformedness syntax="yes" lexical="yes" phonology="yes" semantics="no"/>

<process pid="1" procedure="substitution" direction="perseveration"/>

<!--distance-->

<itemProperties item="1">

<feature class="coronal" value="-"/>

</itemProperties>

<itemProperties item="2">

<feature class="coronal" value="+"/>

</itemProperties>

<itemProperties item="3">

<feature class="coronal" value="-/+"/>

</itemProperties>

</analysis>

<analysis aid="2">

<errorType>phonological</errorType>

<comments>perseveration of the place of articualation of [t] from 'taste' OR

anticipation of the place of articulation of [s] in 'see' OR

anticipation of the place of articulation of [t] in 'meat'</comments>

<targetUnit>meat</targetUnit>

<errorUnit>neat</errorUnit>

<sourceLocation>utterance internal</sourceLocation>

<rule ruleType=""/>

<wellformedness syntax="yes" lexical="yes" phonology="yes" semantics="no"/>

<process pid="1" procedure="substitution" direction="anticipation"/>

<!--distance-->

<itemProperties item="1">

<feature class="coronal" value="-"/>

</itemProperties>

<itemProperties item="2">

<feature class="coronal" value="+"/>

</itemProperties>

<itemProperties item="3">

<feature class="coronal" value="-/+"/>

</itemProperties>

</analysis>

<analysis aid="3">

<errorType>phonological</errorType>

<comments>perseveration of the place of articualation of [t] from 'taste' OR

anticipation of the place of articulation of [s] in 'see' OR

anticipation of the place of articulation of [t] in 'meat'</comments>

<targetUnit>meat</targetUnit>

<errorUnit>neat</errorUnit>

<sourceLocation>utterance internal</sourceLocation>

<rule ruleType=""/>

<wellformedness syntax="yes" lexical="yes" phonology="yes" semantics="no"/>

<process pid="1" procedure="substitution" direction="anticipation"/>

<!--distance-->

<itemProperties item="1">

<feature class="coronal" value="-"/>

</itemProperties>

<itemProperties item="2">

<feature class="coronal" value="+"/>

</itemProperties>

<itemProperties item="3">

<feature class="coronal" value="-/+"/>

</itemProperties>

</analysis>

<domainProperties>

<syntacticDomain item="target">VP</syntacticDomain>

<wordDomain item="source">Word-Initial</wordDomain>

<wordDomain item="error">Word-Initial</wordDomain>

<syllabicDomain item="target">Onset</syllabicDomain>

<syllabicDomain item="source">Onset</syllabicDomain>

</domainProperties>

</errorGroup>

</interpretation>

</se>

</subcorpus>

</sedb>

Appendix E

18-JUN-04 SCD Table structure 1

TABLE_NAME COLUMN_NAME DATA_TYPE DATA_LENGTH

------

DOWNLOAD DOWNLOAD_ID NUMBER 22

DOWNLOAD_DATE DATE 7

DOWNLOAD_FILE VARCHAR2 128

ERROR ERROR_ID NUMBER 22

MAIN_CORPUS VARCHAR2 2048

CORPUS VARCHAR2 2048

TARGETLANGUAGE VARCHAR2 2048

SPEAKER VARCHAR2 2048

CORRECTED VARCHAR2 2048

ERRORTYPE ERROR_ID NUMBER 22

INTERPRETATION_ID NUMBER 22

ERRORGROUP_ID NUMBER 22

ANALYSIS_ID NUMBER 22

ERRORTYPE VARCHAR2 128

ERROR_HTML ERROR_ID NUMBER 22

ERROR_SEQ NUMBER 22

ERROR_HTML VARCHAR2 4000

ERROR_XML ERROR_ID NUMBER 22

ERROR_SEQ NUMBER 22

ERROR_XML VARCHAR2 4000

LANGUAGE LANG_ID VARCHAR2 20

LANGUAGE VARCHAR2 128

PROCESS ERROR_ID NUMBER 22

INTERPRETATION_ID NUMBER 22

ERRORGROUP_ID NUMBER 22

ANALYSIS_ID NUMBER 22

PROCESS_ID NUMBER 22

PROCEDURE VARCHAR2 128

DIRECTION VARCHAR2 128

PROSODICDOMAIN ERROR_ID NUMBER 22

INTERPRETATION_ID NUMBER 22

ERRORGROUP_ID NUMBER 22

ITEM VARCHAR2 15

PROSODICDOMAIN VARCHAR2 128

STRESSDOMAIN ERROR_ID NUMBER 22

INTERPRETATION_ID NUMBER 22

ERRORGROUP_ID NUMBER 22

ITEM VARCHAR2 15

STRESSDOMAIN VARCHAR2 128

SYLLABICDOMAIN ERROR_ID NUMBER 22

INTERPRETATION_ID NUMBER 22

ERRORGROUP_ID NUMBER 22

ITEM VARCHAR2 15

SYLLABICDOMAIN VARCHAR2 128

SYNTACTICDOMAIN ERROR_ID NUMBER 22

INTERPRETATION_ID NUMBER 22

ERRORGROUP_ID NUMBER 22

ITEM VARCHAR2 15

SYNTACTICDOMAIN VARCHAR2 128

WORDDOMAIN ERROR_ID NUMBER 22

INTERPRETATION_ID NUMBER 22

ERRORGROUP_ID NUMBER 22

ITEM VARCHAR2 15

WORDDOMAIN VARCHAR2 128

Appendix F

<?xml version="1.0" encoding="UTF-8"?>

<!-- edited with XML Spy v4.2 U (http://www.xmlspy.com) by Daan Broeder (Max-Planck Institute for Psycholinguistics) -->

<!--

VERSION 3.0.4

DATE 15-06-2004

Double extension of ProfileAttributes removed from elements with a Vocabulary and from elements with a DateType

Added minOccurs="0" to Project.Description

Added minOccurs="0" to References.Description

DATE 14-06-2004

LanguageId can be Unspecified or Unknown

MediaFile can have both CounterPosition and TimePosition to accommodate Profile(s)

Source can have Profile attributes

LexiconResourceBundle: NoHeadEntries, NoSubEntries to IntegerType (also Unknown & Unspecified)

DATE 13-06-2004

introduced IntegerType for [0-9]+ | Unknown | Unspecified

this can replace CounterPositionType

and also serves for ValidationLevel

DATE 03-06-2004

Some changes: to legalise existing profile practice and regularize things

(BUG)AgeValueType ';' to '.' (See CHILDES)

made LanguageId element in WrittenResource of type Vocabulary

Age and BirthDate can now have ProfileAttributes

Anonyms.ResourceLink can have profileAttributes

Removed VocabularyDef and VocabularyDefType - these were not used

Added FollowUpDepend to profile attribute group

VERSION 3.0.3

DATE 17-05-2004

Added minOccurs="0" to History element

Added required attribute "Name" to NamedLinkType (for CorpusLink)

VERSION 3.0.2

DATE 05-11-2003

History element introduced

Profile attribute of Metatranscript element introduced

VERSION 3.0.1

DATE 20-10-2003

Actor.Age can now also be a range

Added BirthDate to Actor

VERSION 3.0.1

DATE 15-10-2003

Corrected TimepositionType, last occurrence of ':' should be optional

VERSION 3.0

DATE 26-8-2003

Error ContentrEncoding -> ContentEncoding

same as version 2.9 but now we keep in sync with the documentation

versions that are 3.0 (0-..)

VERSION 2.9

DATE 3-7-2003

- Added maxOccurs="unbounded" to Content.SubGenre

- Added maxOccurs="unbounded" to Content.Task

- Added maxOccurs="unbounded" to Content.Modalities

- Added minOccurs="0" to Session.Description

- Added minOccurs="0" to Actor.Description

- Added minOccurs="0" to MediaFile.Description

- Added minOccurs="0" to WrittenResource.Description

- Added minOccurs="0" to Source.Description

- Added minOccurs="0" to Validation.Description

- Added minOccurs="0" to Access.Description

FollowUp attribute in CVTypeDef introduced

VERSION 2.8

DATE 23-6-2003

- Added content encoding to written resource

DATE 18-6-2003

- Added attribute group to cater for Session profiles

- Added encoding attribute to Content.Subject

- changed multiplicity restrictions for some elements

VERSION 2.7

DATE 17-6-2003

Changed structure of TimePositionType and CounterPositionType

to complex types. No information in attributes only in subelements

VERSION 2.6

DATE 30-5-2003

imdi:boolean had typo, MotherTongue & PrimaryLanguage type to imdi:boolean

corresponds to document version 3.02, in final version synchronise version numbers!

VERSION 2.5

DATE 21-5-2003

Added imdi:boolean type

Added ResourceRef attribute to Source

corresponds to document version 3.02, in final version synchronise version numbers!

VERSION 2.4

DATE 13-5-2003

Added Lexicon resource

corresponds to document version 3.02, in final version synchronise version numbers!

VERSION: 2.3

DATE: 2003-04-16

Checked cardinalities

Only one Location (was unbounded)

At least one Description in (optional) References

DATE 2003-04-08.

Corresponds to document version 3.02, in final version synchronise version numbers!

VERSION: 2.2

DATE: 2003-03-06

-->

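<xsd:schema targetNamespace="http://www.mpi.nl/IMDI/Schema/IMDI"

xmlns:xsd="http://www.w3.org/2001/XMLSchema" xmlns:imdi="http://www.mpi.nl/IMDI/Schema/IMDI"

elementFormDefault="qualified" attributeFormDefault="unqualified" version="1">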

<xsd:element name="METATRANSCRIPT">

<xsd:annotation>

<xsd:documentation> The outer element with administrative data of all metadata

description files. Version 1.0 is based on Session description version 2.5 and

Catalogue description 2.1 Version 3.0 is based on Session description version 3.03,

Catalogue description 2.1, Lexicon description 1.1 </xsd:documentation>

</xsd:annotation>

<xsd:complexType mixed="false">

<xsd:sequence>

<xsd:element name="History" type="xsd:string" minOccurs="0">

<xsd:annotation>

<xsd:documentation>Creation history of this metadata descriptionfile</xsd:documentation>

</xsd:annotation>

</xsd:element>

<xsd:choice>

<xsd:element name="Session" type="imdi:SessionType" maxOccurs="unbounded"/>

<xsd:element name="Corpus" type="imdi:CorpusType" maxOccurs="unbounded"/>

<xsd:element name="Catalogue" type="imdi:CatalogueType"/>

</xsd:choice>

</xsd:sequence>

<xsd:attribute name="Profile" type="xsd:string" use="optional"/>

<xsd:attribute name="Date" type="xsd:date" use="required"/>

<xsd:attribute name="Originator" type="xsd:string" use="optional"/>

<xsd:attribute name="Version" type="xsd:string" use="required"/>