More example output from LEXPARSE

Mark Huckvale (mark@phonetics.ucl.ac.uk)
Mon, 16 Mar 1998 10:08:56 +0000

Dear All

I have been working further on LEXPARSE: the program that takes
Alex's pronunciation lexicon and adds syllable structure to it.

I think I have taken into account Richard's comments on my last
attempt, and I have done a lot more 'copying' of features
throughout the structure.

There are still some things I am not sure of: how far should
I distribute VOI attributes, and how do I set the CHECKED
attribute?

I am not convinced I have made the right choices about putting
CNS units directly below ONSET and about putting ACODA at the
same level as the CNS units of CODA.

The output below is a deliberate copy of the words that Richard
used to demonstrate YorkTalk output.

I will put the complete lexicon on the Web site this week. I also
aim to set up an FTP address soon so that you can all download
the recordings.

Mark
---------------------------------------------------------------
<?xml version='1.0' encoding='UTF-8'?>
<!-- Pronunciation lexicon with syllable structure.
     Hierarchy: LEXICON > ENTRY > PRONSEQ > PRON > SYLSEQ > SYL > ONSET / RHYME,
     RHYME > NUC / CODA, with VOC units under NUC and CNS units under ONSET,
     CODA and ACODA. -->
<!DOCTYPE LEXICON [
<!-- Lexicon skeleton: headword, optional parts of speech, optional pronunciations. -->
<!ELEMENT LEXICON (ENTRY)* >
<!ELEMENT ENTRY (HW, POSSEQ?, PRONSEQ?) >
<!ELEMENT HW (#PCDATA) >
<!ELEMENT POSSEQ (POS)* >
<!ELEMENT POS (#PCDATA) >
<!ELEMENT PRONSEQ (PRON)* >
<!ELEMENT PRON (IPA?, SYLSEQ?) >
<!ELEMENT IPA (#PCDATA) >
<!-- Syllable structure: the onset is optional, the rhyme is mandatory. -->
<!ELEMENT SYLSEQ (SYL)* >
<!ELEMENT SYL (ONSET? ,RHYME) >
<!ELEMENT ONSET (CNS)* >
<!ELEMENT RHYME (NUC, CODA?) >
<!ELEMENT NUC (VOC)* >
<!-- ACODA, when present, follows the CNS units of the CODA as their sibling. -->
<!ELEMENT CODA (CNS*, ACODA?) >
<!ELEMENT ACODA (CNS) >
<!ELEMENT VOC (#PCDATA) >
<!ELEMENT CNS (#PCDATA) >
<!-- Attribute-default keywords are case-sensitive in XML 1.0 (#REQUIRED, #IMPLIED).
     HREF is optional because entries may omit it. -->
<!ATTLIST ENTRY
  ID ID #REQUIRED
  HREF CDATA #IMPLIED >
<!-- PRON and IPA carry a per-entry sequence number such as '1'. It repeats from
     entry to entry and starts with a digit, so it is declared CDATA rather than ID. -->
<!ATTLIST PRON
  ID CDATA #IMPLIED >
<!ATTLIST IPA
  ID CDATA #IMPLIED >
<!-- Both SYLSEQ attributes are optional: a SYLSEQ may appear with neither. -->
<!ATTLIST SYLSEQ
  ID ID #IMPLIED
  HREF CDATA #IMPLIED >
<!-- Prosodic attributes. An attribute that is omitted takes the quoted default. -->
<!ATTLIST SYL
  STRENGTH (STRONG|WEAK) 'WEAK'
  WEIGHT (HEAVY|LIGHT) 'LIGHT' >
<!ATTLIST ONSET
  STRENGTH (STRONG|WEAK) 'WEAK' >
<!ATTLIST RHYME
  STRENGTH (STRONG|WEAK) 'WEAK'
  WEIGHT (HEAVY|LIGHT) 'LIGHT'
  CHECKED (Y|N) 'N'
  VOI (Y|N) 'N' >
<!ATTLIST NUC
  STRENGTH (STRONG|WEAK) 'WEAK'
  WEIGHT (HEAVY|LIGHT) 'LIGHT'
  CHECKED (Y|N) 'N'
  VOI (Y|N) 'N'
  LONG (Y|N) 'N' >
<!ATTLIST CODA
  VOI (Y|N) 'N' >
<!-- Features of a consonantal unit. NOTE(review): the names look like
     abbreviations of phonological features (e.g. VOI, NAS); confirm their
     exact meaning against the LEXPARSE documentation. The VOC-prefixed
     attributes mirror the three attributes declared on VOC. -->
<!ATTLIST CNS
  CNT (Y|N) 'N'
  VOI (Y|N) 'N'
  NAS (Y|N) 'N'
  STR (Y|N) 'N'
  SON (Y|N) 'N'
  RHO (Y|N) 'N'
  CNSGRV (Y|N) 'N'
  CNSCMP (Y|N) 'N'
  VOCGRV (Y|N) 'N'
  VOCHEIGHT (CLOSE|MID|OPEN) 'MID'
  VOCRND (Y|N) 'N'
  AMBI (Y|N) 'N' >
<!-- Features of a vocalic unit. -->
<!ATTLIST VOC
  GRV (Y|N) 'N'
  HEIGHT (CLOSE|MID|OPEN) 'MID'
  RND (Y|N) 'N' >
]>
<LEXICON>
<!-- "ray" ('reI): one STRONG, HEAVY syllable; onset r, long nucleus e + I, no coda. -->
<ENTRY ID='RAY'>
  <HW>ray</HW>
  <PRONSEQ>
    <PRON ID='1'>
      <IPA ID='1'>'reI</IPA>
      <SYLSEQ>
        <SYL STRENGTH='STRONG' WEIGHT='HEAVY'>
          <ONSET>
            <CNS CNT='Y' VOI='Y' NAS='N' STR='N' SON='Y' RHO='Y'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N'>r</CNS>
          </ONSET>
          <RHYME WEIGHT='HEAVY'>
            <NUC WEIGHT='HEAVY' LONG='Y'>
              <VOC GRV='N' HEIGHT='MID' RND='N'>e</VOC>
              <VOC GRV='N' HEIGHT='CLOSE' RND='N'>I</VOC>
            </NUC>
          </RHYME>
        </SYL>
      </SYLSEQ>
    </PRON>
  </PRONSEQ>
</ENTRY>
<!-- "tay" ('teI): one STRONG, HEAVY syllable; onset t, long nucleus e + I, no coda. -->
<ENTRY ID='TAY'>
  <HW>tay</HW>
  <PRONSEQ>
    <PRON ID='1'>
      <IPA ID='1'>'teI</IPA>
      <SYLSEQ>
        <SYL STRENGTH='STRONG' WEIGHT='HEAVY'>
          <ONSET>
            <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='MID' VOCRND='N'>t</CNS>
          </ONSET>
          <RHYME WEIGHT='HEAVY'>
            <NUC WEIGHT='HEAVY' LONG='Y'>
              <VOC GRV='N' HEIGHT='MID' RND='N'>e</VOC>
              <VOC GRV='N' HEIGHT='CLOSE' RND='N'>I</VOC>
            </NUC>
          </RHYME>
        </SYL>
      </SYLSEQ>
    </PRON>
  </PRONSEQ>
</ENTRY>
<!-- "set" ('set): one STRONG syllable with no WEIGHT given; onset s, nucleus e
     written as two identical VOC units, coda t. -->
<ENTRY ID='SET'>
  <HW>set</HW>
  <PRONSEQ>
    <PRON ID='1'>
      <IPA ID='1'>'set</IPA>
      <SYLSEQ>
        <SYL STRENGTH='STRONG'>
          <ONSET>
            <CNS CNT='Y' VOI='N' NAS='N' STR='Y' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='MID' VOCRND='N'>s</CNS>
          </ONSET>
          <RHYME VOI='N'>
            <NUC VOI='N'>
              <VOC GRV='N' HEIGHT='MID' RND='N'>e</VOC>
              <VOC GRV='N' HEIGHT='MID' RND='N'>e</VOC>
            </NUC>
            <CODA>
              <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                   CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='MID' VOCRND='N'>t</CNS>
            </CODA>
          </RHYME>
        </SYL>
      </SYLSEQ>
    </PRON>
  </PRONSEQ>
</ENTRY>
<!-- "tray" ('treI): one STRONG, HEAVY syllable; onset cluster t + r, long
     nucleus e + I, no coda. -->
<ENTRY ID='TRAY'>
  <HW>tray</HW>
  <PRONSEQ>
    <PRON ID='1'>
      <IPA ID='1'>'treI</IPA>
      <SYLSEQ>
        <SYL STRENGTH='STRONG' WEIGHT='HEAVY'>
          <ONSET>
            <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N'>t</CNS>
            <CNS CNT='Y' VOI='Y' NAS='N' STR='N' SON='Y' RHO='Y'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N'>r</CNS>
          </ONSET>
          <RHYME WEIGHT='HEAVY'>
            <NUC WEIGHT='HEAVY' LONG='Y'>
              <VOC GRV='N' HEIGHT='MID' RND='N'>e</VOC>
              <VOC GRV='N' HEIGHT='CLOSE' RND='N'>I</VOC>
            </NUC>
          </RHYME>
        </SYL>
      </SYLSEQ>
    </PRON>
  </PRONSEQ>
</ENTRY>
<!-- "stay" ('steI): one STRONG, HEAVY syllable; onset cluster s + t, long
     nucleus e + I, no coda. The primary-stress mark in the IPA string and
     STRENGTH='STRONG' on SYL are both given explicitly; without STRENGTH the
     syllable would fall back to the DTD default 'WEAK'. -->
<ENTRY ID='STAY'>
  <HW>stay</HW>
  <PRONSEQ>
    <PRON ID='1'>
      <IPA ID='1'>'steI</IPA>
      <SYLSEQ>
        <SYL STRENGTH='STRONG' WEIGHT='HEAVY'>
          <ONSET>
            <CNS CNT='Y' VOI='N' NAS='N' STR='Y' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='MID' VOCRND='N'>s</CNS>
            <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='MID' VOCRND='N'>t</CNS>
          </ONSET>
          <RHYME WEIGHT='HEAVY'>
            <NUC WEIGHT='HEAVY' LONG='Y'>
              <VOC GRV='N' HEIGHT='MID' RND='N'>e</VOC>
              <VOC GRV='N' HEIGHT='CLOSE' RND='N'>I</VOC>
            </NUC>
          </RHYME>
        </SYL>
      </SYLSEQ>
    </PRON>
  </PRONSEQ>
</ENTRY>
<!-- "stray" ('streI): one STRONG, HEAVY syllable; onset cluster s + t + r,
     long nucleus e + I, no coda. -->
<ENTRY ID='STRAY'>
  <HW>stray</HW>
  <PRONSEQ>
    <PRON ID='1'>
      <IPA ID='1'>'streI</IPA>
      <SYLSEQ>
        <SYL STRENGTH='STRONG' WEIGHT='HEAVY'>
          <ONSET>
            <CNS CNT='Y' VOI='N' NAS='N' STR='Y' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N'>s</CNS>
            <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N'>t</CNS>
            <CNS CNT='Y' VOI='Y' NAS='N' STR='N' SON='Y' RHO='Y'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N'>r</CNS>
          </ONSET>
          <RHYME WEIGHT='HEAVY'>
            <NUC WEIGHT='HEAVY' LONG='Y'>
              <VOC GRV='N' HEIGHT='MID' RND='N'>e</VOC>
              <VOC GRV='N' HEIGHT='CLOSE' RND='N'>I</VOC>
            </NUC>
          </RHYME>
        </SYL>
      </SYLSEQ>
    </PRON>
  </PRONSEQ>
</ENTRY>
<!-- "letter" ('let@): two syllables. The first is STRONG (onset l, nucleus e,
     coda t); the second has no attributes (onset t, nucleus @). The t is
     listed in both syllables and carries AMBI='Y' each time. -->
<ENTRY ID='LETTER'>
  <HW>letter</HW>
  <PRONSEQ>
    <PRON ID='1'>
      <IPA ID='1'>'let@</IPA>
      <SYLSEQ>
        <SYL STRENGTH='STRONG'>
          <ONSET>
            <CNS CNT='Y' VOI='Y' NAS='N' STR='N' SON='Y' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='CLOSE' VOCRND='N'>l</CNS>
          </ONSET>
          <RHYME VOI='N'>
            <NUC VOI='N'>
              <VOC GRV='N' HEIGHT='MID' RND='N'>e</VOC>
              <VOC GRV='N' HEIGHT='MID' RND='N'>e</VOC>
            </NUC>
            <CODA>
              <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                   CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='MID' VOCRND='N' AMBI='Y'>t</CNS>
            </CODA>
          </RHYME>
        </SYL>
        <SYL>
          <ONSET>
            <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N' AMBI='Y'>t</CNS>
          </ONSET>
          <RHYME>
            <NUC>
              <VOC GRV='Y' HEIGHT='MID' RND='N'>@</VOC>
              <VOC GRV='Y' HEIGHT='MID' RND='N'>@</VOC>
            </NUC>
          </RHYME>
        </SYL>
      </SYLSEQ>
    </PRON>
  </PRONSEQ>
</ENTRY>
<!-- "actor" ('{kt@): two syllables. The first is STRONG and has no onset
     (nucleus {, coda k); the second has no attributes (onset t, nucleus @).
     Neither consonant carries AMBI. -->
<ENTRY ID='ACTOR'>
  <HW>actor</HW>
  <PRONSEQ>
    <PRON ID='1'>
      <IPA ID='1'>'{kt@</IPA>
      <SYLSEQ>
        <SYL STRENGTH='STRONG'>
          <RHYME>
            <NUC>
              <VOC GRV='N' HEIGHT='OPEN' RND='N'>{</VOC>
              <VOC GRV='N' HEIGHT='OPEN' RND='N'>{</VOC>
            </NUC>
            <CODA>
              <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                   CNSGRV='Y' CNSCMP='Y' VOCGRV='N' VOCHEIGHT='OPEN' VOCRND='N'>k</CNS>
            </CODA>
          </RHYME>
        </SYL>
        <SYL>
          <ONSET>
            <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N'>t</CNS>
          </ONSET>
          <RHYME>
            <NUC>
              <VOC GRV='Y' HEIGHT='MID' RND='N'>@</VOC>
              <VOC GRV='Y' HEIGHT='MID' RND='N'>@</VOC>
            </NUC>
          </RHYME>
        </SYL>
      </SYLSEQ>
    </PRON>
  </PRONSEQ>
</ENTRY>
<!-- "random" ('r{nd@m): two syllables. The first is STRONG and HEAVY (onset r,
     nucleus {, coda n + d); the second has no SYL attributes (onset d,
     nucleus @, coda m). The d is listed in both syllables with AMBI='Y'. -->
<ENTRY ID='RANDOM'>
  <HW>random</HW>
  <PRONSEQ>
    <PRON ID='1'>
      <IPA ID='1'>'r{nd@m</IPA>
      <SYLSEQ>
        <SYL STRENGTH='STRONG' WEIGHT='HEAVY'>
          <ONSET>
            <CNS CNT='Y' VOI='Y' NAS='N' STR='N' SON='Y' RHO='Y'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N'>r</CNS>
          </ONSET>
          <RHYME WEIGHT='HEAVY' VOI='Y'>
            <NUC VOI='Y'>
              <VOC GRV='N' HEIGHT='OPEN' RND='N'>{</VOC>
              <VOC GRV='N' HEIGHT='OPEN' RND='N'>{</VOC>
            </NUC>
            <CODA>
              <CNS CNT='N' VOI='Y' NAS='Y' STR='N' SON='Y' RHO='N'
                   CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='OPEN' VOCRND='N'>n</CNS>
              <CNS CNT='N' VOI='Y' NAS='N' STR='N' SON='N' RHO='N'
                   CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='OPEN' VOCRND='N' AMBI='Y'>d</CNS>
            </CODA>
          </RHYME>
        </SYL>
        <SYL>
          <ONSET>
            <CNS CNT='N' VOI='Y' NAS='N' STR='N' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N' AMBI='Y'>d</CNS>
          </ONSET>
          <RHYME VOI='Y'>
            <NUC VOI='Y'>
              <VOC GRV='Y' HEIGHT='MID' RND='N'>@</VOC>
              <VOC GRV='Y' HEIGHT='MID' RND='N'>@</VOC>
            </NUC>
            <CODA>
              <CNS CNT='N' VOI='Y' NAS='Y' STR='N' SON='Y' RHO='N'
                   CNSGRV='Y' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N'>m</CNS>
            </CODA>
          </RHYME>
        </SYL>
      </SYLSEQ>
    </PRON>
  </PRONSEQ>
</ENTRY>
<!-- "hospital" ('hQspIt@l): three syllables. The first is STRONG and HEAVY
     (onset h, nucleus Q, coda s + p); the second (onset s + p, nucleus I,
     coda t) and the third (onset t, nucleus @, coda l) have no SYL attributes.
     The s, p and t are each listed in two adjacent syllables with AMBI='Y'. -->
<ENTRY ID='HOSPITAL'>
  <HW>hospital</HW>
  <PRONSEQ>
    <PRON ID='1'>
      <IPA ID='1'>'hQspIt@l</IPA>
      <SYLSEQ>
        <SYL STRENGTH='STRONG' WEIGHT='HEAVY'>
          <ONSET>
            <CNS CNT='Y' VOI='N' NAS='N' STR='Y' SON='N' RHO='N'
                 CNSGRV='Y' CNSCMP='Y' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='Y'>h</CNS>
          </ONSET>
          <RHYME WEIGHT='HEAVY' VOI='N'>
            <NUC VOI='N'>
              <VOC GRV='Y' HEIGHT='MID' RND='Y'>Q</VOC>
              <VOC GRV='Y' HEIGHT='MID' RND='Y'>Q</VOC>
            </NUC>
            <CODA>
              <CNS CNT='Y' VOI='N' NAS='N' STR='Y' SON='N' RHO='N'
                   CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='Y' AMBI='Y'>s</CNS>
              <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                   CNSGRV='Y' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='Y' AMBI='Y'>p</CNS>
            </CODA>
          </RHYME>
        </SYL>
        <SYL>
          <ONSET>
            <CNS CNT='Y' VOI='N' NAS='N' STR='Y' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='CLOSE' VOCRND='N' AMBI='Y'>s</CNS>
            <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                 CNSGRV='Y' CNSCMP='N' VOCGRV='N' VOCHEIGHT='CLOSE' VOCRND='N' AMBI='Y'>p</CNS>
          </ONSET>
          <RHYME VOI='N'>
            <NUC VOI='N'>
              <VOC GRV='N' HEIGHT='CLOSE' RND='N'>I</VOC>
              <VOC GRV='N' HEIGHT='CLOSE' RND='N'>I</VOC>
            </NUC>
            <CODA>
              <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                   CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='CLOSE' VOCRND='N' AMBI='Y'>t</CNS>
            </CODA>
          </RHYME>
        </SYL>
        <SYL>
          <ONSET>
            <CNS CNT='N' VOI='N' NAS='N' STR='N' SON='N' RHO='N'
                 CNSGRV='N' CNSCMP='N' VOCGRV='Y' VOCHEIGHT='MID' VOCRND='N' AMBI='Y'>t</CNS>
          </ONSET>
          <RHYME VOI='Y'>
            <NUC VOI='Y'>
              <VOC GRV='Y' HEIGHT='MID' RND='N'>@</VOC>
              <VOC GRV='Y' HEIGHT='MID' RND='N'>@</VOC>
            </NUC>
            <CODA>
              <CNS CNT='Y' VOI='Y' NAS='N' STR='N' SON='Y' RHO='N'
                   CNSGRV='N' CNSCMP='N' VOCGRV='N' VOCHEIGHT='CLOSE' VOCRND='N'>l</CNS>
            </CODA>
          </RHYME>
        </SYL>
      </SYLSEQ>
    </PRON>
  </PRONSEQ>
</ENTRY>
</LEXICON>