;[1y[6{[2;4x
                                              [5y   [1y131


[5y[1y[3;1xCHAPTER 7

                         [5y      [1yDETAIL OF THE EDITCOST AND PHONCODE PROGRAMS


                 [5y      [1y[2;4x7.1. Introduction

[48{


[6{[5y[1yIn [5y  [1ythis [5y  [1ychapter [5y  [1ythe [5y  [1yeditcost [5y   [1yand [5y  [1yphoncode [5y  [1yspelling [5y  [1ycorrection [5y   [1yprograms
[48{


[6{                 [5y      [1yare described in detail.


[48{


[6{                 [5y      [1y7.2. Calculating the minimum cost repair: the editcost program


[48{


[6{                 [5y      [1y7.2.1. General overview

[48{


[6{[5y[1yA shortlist of dictionary words is selected from the session dictionary as
[48{


[6{                 [5y      [1ypossible [5y    [1ycandidates [5y     [1yfor [5y     [1ythe [5y     [1ymisspelling.  [5y         [1yIf [5y     [1yall [5y     [1ywords [5y    [1yin [5y     [1ythe [5y     [1ydictionary
[48{


[6{                 [5y      [1ywere [5y       [1yconsidered [5y       [1ythen [5y        [1ya [5y       [1yvery [5y       [1ylarge [5y        [1ynumber [5y       [1yof [5y        [1ycomparisons [5y       [1yusing [5y        [1ythe
[48{


[6{                 [5y      [1ycosting [5y [1yalgorithm [5y [1ywould [5y [1yhave [5y [1yto [5y [1ybe [5y [1ymade. [5y [1yThe [5y [1yobject [5y [1yof [5y [1yshortlisting [5y [1yis [5y [1yto
[48{


[6{                 [5y      [1yreduce [5y   [1ythis [5y   [1ynumber [5y    [1ywhilst [5y   [1yretaining [5y    [1ythe [5y   [1ycorrection [5y    [1yof [5y   [1ythe [5y    [1ymisspelling [5y    [1yin
[48{


[6{                 [5y      [1ythe shortlist. [5y [1yThe [5y [1yselection [5y [1ydepends [5y [1yupon [5y [1ythe first [5y [1ytwo [5y [1ycharacters [5y [1yof [5y [1ythe
[48{


[6{                 [5y      [1ymisspelling and its length.

[48{


[6{[5y[1yThe [5y     [1ymisspelling [5y      [1y(termed [5y      [1ythe [5y      [1y'inpw') [5y     [1yis [5y      [1ycompared [5y      [1ywith [5y      [1yeach [5y      [1ydictionary
[48{


[6{                 [5y      [1yword (termed [5y [1ythe 'dictw') [5y [1yon the shortlist.  [5y [1yThe [5y [1ycost of [5y [1yediting the [5y [1yinpw
[48{


[6{                 [5y      [1yto [5y  [1ymatch [5y   [1ythe [5y  [1ydictw [5y   [1yis [5y  [1ycalculated [5y   [1y(see [5y  [1ysection [5y   [1y7.2.5).  [5y     [1yThose [5y   [1ydictws [5y   [1ywith
[48{


[6{                 [5y      [1ylowest [5y      [1yedit [5y       [1ycost [5y       [1yare [5y      [1ysaved.   [5y  [1yThe [5y      [1yfour [5y       [1ydictws [5y       [1ywith [5y      [1ylowest [5y       [1ycost [5y       [1yare
[48{


[6{                 [5y      [1yoffered to [5y [1ythe [5y [1yuser as [5y [1yoptions [5y [1yfor [5y [1ythe correction [5y [1yof [5y [1ythe [5y [1ymisspelling [5y [1y(the
[48{


[6{                 [5y      [1yinpw).[1y[6{[2;4x
                                              [5y   [1y132
[48{


[6{                 [5y      [1y7.2.2. Shortlisting candidates from the dictionary: 'shortlist'

[48{


[6{                   [5y  [1yFrom [5y  [1ythe [5y  [1ymisspellings [5y   [1ymade [5y  [1yby [5y  [1ythe [5y  [1yobserved [5y   [1ygroup [5y  [1y(see [5y  [1ychapter [5y  [1y4) [5y   [1yand
[48{


[6{                 [5y      [1ythe group in study 1 (see chapter 6), the following were noted:

                   [5y          [1y- the [5y     [1yinitial [5y     [1ytwo [5y     [1yletters [5y     [1yof [5y     [1ythe [5y      [1yword [5y     [1yand [5y     [1ymisspelling [5y     [1yand [5y      [1ythe
                     [5y        [1yfrequency [5y  [1yof [5y  [1yeach, [5y  [1yin [5y  [1ycases [5y   [1ywhere [5y  [1ythe [5y  [1yfirst [5y  [1yletter [5y  [1yof [5y  [1ya [5y   [1yword
                     [5y        [1ywas misspelt;

[5y[1y- the [5y      [1yrange [5y      [1yof [5y      [1ydifferences [5y      [1yin [5y       [1ylength [5y      [1ybetween [5y      [1ymisspellings [5y       [1yand
                     [5y        [1ycorrections.

[2;2xInitial Characters

[48{


[6{[2;4xThere [5y  [1ywere [5y  [1y'first [5y  [1yletter' [5y  [1yerrors [5y   [1yfound [5y  [1yin [5y  [1yapproximately [5y  [1y8% [5y  [1yof [5y   [1ymisspell-
[48{


[6{                 [5y      [1yings [5y    [1ymade [5y    [1yby [5y    [1ychildren [5y    [1yin [5y    [1ythe [5y    [1ystudy [5y    [1y1.  [5y        [1yFor [5y    [1ythese [5y    [1ycases, [5y    [1ytherefore, [5y    [1yit
[48{


[6{                 [5y      [1ycould [5y   [1ynot [5y   [1ybe [5y    [1yassumed [5y   [1ythat [5y    [1ythe [5y   [1yfirst [5y    [1yletter [5y   [1ywas [5y    [1yspelt [5y   [1ycorrectly.  [5y       [1yFirst
[48{


[6{                 [5y      [1yletter [5y    [1yconfusions [5y    [1yfound [5y    [1ywere [5y    [1yused [5y    [1yto [5y    [1yconstruct [5y    [1ya [5y    [1ytable [5y    [1yof [5y    [1y'alternative
[48{


[6{                 [5y      [1yfirst [5y  [1yletters'.  [5y      [1yFor [5y   [1yany [5y  [1yinpw [5y   [1yonly [5y   [1ythose [5y   [1ywords [5y   [1yfrom [5y  [1ythe [5y   [1ydictionary [5y   [1ywith
[48{


[6{                 [5y      [1ythe [5y      [1ysame [5y      [1yinitial [5y       [1yletter, [5y      [1yor [5y       [1yan [5y      [1yalternative [5y       [1yfound [5y      [1yfrom [5y       [1ythe [5y      [1ytable, [5y       [1yare
[48{


[6{                 [5y      [1yconsidered as candidate misspellings.

[48{


[6{                   [5y  [1yIn [5y [1ysome [5y [1ycases [5y [1ythe [5y [1y'alternative [5y [1yfirst [5y [1yletter' [5y [1yis [5y [1yextended [5y  [1yto [5y [1yconsider [5y [1ythe
[48{


[6{                 [5y      [1yfirst two characters [5y [1yof [5y [1ythe inpw [5y [1yand dictw.  [5y [1yIn [5y [1ydoing so [5y [1ythe [5y [1yalternatives
[48{


[6{                 [5y      [1yfor [5y   [1ythe [5y   [1yinpw [5y  [1yare [5y   [1ymade [5y   [1ymore [5y   [1yspecific [5y   [1yand [5y   [1ythe [5y   [1yshortlist [5y   [1yfurther [5y   [1yreduced
[48{


[6{                 [5y      [1y(though the risk [5y [1yof omission of [5y [1ythe correction [5y [1yis increased).  [5y [1yFor [5y [1yexample,
[48{


[6{                 [5y      [1yif the [5y [1ymisspelling [5y [1yis 'rite' [5y [1yfor [5y [1y'write' then [5y [1yall the [5y [1ywords in [5y [1ythe [5y [1ydictionary
[48{


[6{                 [5y      [1ywith [5y   [1yinitial [5y   [1yletters [5y    [1y'r' [5y   [1yor [5y   [1y'wr' [5y    [1ywould [5y   [1ybe [5y   [1yincluded [5y    [1yin [5y   [1ythe [5y   [1yshortlist [5y    [1ywhilst
[48{


[6{                 [5y      [1ythose others beginning with 'w' would not.

[48{


[6{                   [5y  [1yThe [5y   [1ydictionary [5y   [1yis [5y   [1yindexed [5y   [1yby [5y    [1y'first [5y   [1ycharacter', [5y   [1ywhere [5y   [1ythis [5y   [1ymay [5y    [1yactually
[48{


[6{                 [5y      [1ybe [5y  [1yindicated [5y  [1yby [5y  [1ythe [5y  [1yinitial [5y  [1ytwo [5y  [1ycharacters [5y  [1yof [5y  [1ythe [5y  [1yword, [5y  [1yor [5y  [1yby [5y  [1ythe [5y  [1yfirst
[48{


[6{                 [5y      [1ycharacter only.  In cases where two letters are used they are represented
[48{


[6{                 [5y      [1yby [5y   [1ya [5y    [1ysingle [5y    [1ycharacter [5y   [1yin [5y    [1ythe [5y    [1yrange [5y   [1yA-Z.  [5y        [1yThese [5y   [1y'special [5y    [1ycases' [5y    [1yof [5y    [1yfirst
[48{


[6{                 [5y      [1ycharacter are shown in figure 7-1

[48{


[6{                   [5y  [1yThe [5y     [1yfirst [5y     [1ytwo [5y     [1ycharacters [5y     [1yof [5y     [1ythe [5y     [1yinpw [5y     [1yare [5y     [1yread.  [5y           [1yIf [5y     [1ythey [5y     [1ymatch [5y     [1ya
[48{


[6{                 [5y      [1yspecial case [5y [1ythe [5y [1yfirst [5y [1ycharacters [5y [1yare [5y [1ythen [5y [1yrepresented [5y [1yby [5y [1ythe [5y [1yappropriate
[48{


[6{                 [5y      [1yletter; [5y       [1yotherwise [5y       [1ythey [5y       [1yare [5y       [1yrepresented [5y       [1yby [5y       [1ythe [5y       [1yfirst [5y       [1yletter [5y       [1yof [5y       [1yinpw.
[48{


[6{                 [5y      [1yAlternatives for the first character are found by [5y [1ytable look-up.  They [5y [1yare
[48{


[6{                 [5y      [1ygiven in figure 7-1.  All words in the section of the dictionary indexed by
[48{


[6{                 [5y      [1ythe [5y  [1yfirst [5y   [1ycharacter, [5y   [1yand [5y  [1yby [5y   [1ythe [5y   [1yalternatives [5y   [1yfor [5y  [1yit, [5y   [1yare [5y   [1yincluded [5y   [1yin [5y   [1ythe[1y[6{[2;4x
                                              [5y   [1y133
[48{


[6{                       [5y    [1y[2;2xinitial      represented     alternatives
                           letter(s)         by
                               a             a              auoei
                               b             b              bdp
                               c             c              ckgsqCK
                              ch             C              Ccjsk
                               d             d              db
                               e             e              eaiy
                               f             f              fPTv
                               g             g              gcjG
                              gn             G              GKgn
                               h             h              hHWo
                              ho             H              Hho
                               i             i              iuea
                               j             j              jCg
                               k             k              kKcq
                              kn             K              KGnkc
                               l             l              lL
                               m             m              mn
                               n             n              nGKNm
                               o             o              oaHWO
                               p             p              pbPN
                              pn             N              Npn
                              ph             P              Ppfv
                              ps             S              Sps
                               q             q              qkc
                               r             r              rR
                               s             s              sSc
                               t             t              tT
                              th             T              TfvtP
                               u             u              uoy
                               v             v              vTf
                               w             w              wWO
                              wo             O              Oow
                              wr             R              Rwr
                              wh             W              WwhOR
                               x             x              xe
                               y             y              yui
                               z             z              zs


                             [5y      [1y[2;4xFigure 7-1:   First character alternatives for shortlisting


                 [5y      [1yshortlist [5y  [1y(subject [5y  [1yto [5y   [1ylength [5y  [1yconstraints).  [5y    [1yFor [5y   [1yexample, [5y  [1yif [5y  [1ythe [5y  [1yinpw [5y   [1ywere
[48{


[6{                 [5y      [1y'foto' [5y [1ythe [5y [1yfirst [5y  [1ycharacter [5y [1ywould [5y [1ybe [5y  [1y'f' [5y [1yand [5y  [1ythe [5y [1yalternatives [5y  [1yfor [5y [1yit [5y  [1ywould
[48{


[6{                 [5y      [1ybe [5y [1yP(=ph), [5y  [1yT(=th) [5y [1yand [5y  [1yv; [5y [1yso [5y [1yall [5y  [1ywords [5y [1yin [5y  [1ythe [5y [1ydictionary [5y  [1ywith [5y [1yinitial [5y  [1yletters
[48{


[6{                 [5y      [1y'ph', 'th', 'v' and 'f' would be considered for the shortlist of candidates.

                 [5y      [1y[2;2xLength constraints

[48{


[6{[2;4xAny [5y [1ydictionary [5y [1yword [5y [1yconsidered [5y  [1yto [5y [1ybe [5y [1ytoo [5y  [1ylong [5y [1yor [5y [1ytoo [5y  [1yshort [5y [1yto [5y [1ybe [5y  [1ythe
[48{


[6{                 [5y      [1ycorrection [5y    [1yof [5y     [1ythe [5y     [1yinpw [5y     [1yis [5y     [1yomitted [5y     [1yfrom [5y    [1ythe [5y     [1yalternative [5y     [1ywords [5y     [1yon [5y     [1ythe[1y[6{[2;4x
                                              [5y   [1y134
[48{


[6{                 [5y      [1yshortlist.  [5y      [1yThe [5y   [1yrange [5y   [1yof [5y   [1ylength [5y   [1ypermitted [5y   [1ywas [5y   [1ydetermined [5y   [1yby [5y    [1ycomparison
[48{


[6{                 [5y      [1yof misspelling [5y [1yand [5y [1ycorrections [5y [1ylengths for [5y [1ythe [5y [1yobserved [5y [1ygroup and [5y [1ystudy [5y [1y1
[48{


[6{                 [5y      [1ygroup.  The dictw is shortlisted if:

                   [5y          [1y- the [5y  [1ydifference [5y   [1ybetween [5y  [1ythe [5y   [1ylength [5y  [1yof [5y   [1ythe [5y   [1yinpw [5y  [1y(=inl) [5y   [1yand [5y   [1ythe
                     [5y        [1ylength [5y   [1yof [5y   [1ythe [5y    [1ydictw [5y   [1y(=dwl) [5y   [1yis [5y   [1yless [5y   [1ythan [5y    [1y4, [5y   [1ywhen [5y   [1yboth [5y   [1yinl [5y    [1yand
                     [5y        [1ydwl are less than 10, or

                   [5y          [1y- the [5y   [1ydifference [5y    [1ybetween [5y    [1yinl [5y    [1yand [5y    [1ydwl [5y    [1yis [5y    [1yless [5y    [1ythan [5y    [1yor [5y    [1yequal [5y    [1yto
                     [5y        [1y(dwl/3)+1, when inl or dwl is 10 or greater.

[48{


[6{                   [5y  [1yThose candidates on [5y [1ythe shortlist, to be [5y [1ypassed to the costing [5y [1yalgorithm
[48{


[6{                 [5y      [1yare, [5y     [1ytherefore, [5y     [1ythose [5y      [1ywords [5y     [1yfrom [5y     [1ythe [5y      [1ysession [5y     [1ydictionary [5y     [1ysatisfying [5y      [1ytwo
[48{


[6{                 [5y      [1yconditions:

[5y[1y1. with [5y [1ythe [5y  [1ysame [5y [1yinitial [5y  [1yletter, [5y [1yor [5y  [1ywith [5y [1yalternative [5y  [1yinitial [5y  [1yletters,
                      [5y      [1yas that of the input word;

                    [5y   [1y2. with length within the range specified above.


[48{


[6{                 [5y      [1y7.2.3. The editcost algorithm

[48{


[6{                   [5y  [1yAt [5y  [1ythe [5y  [1yformat [5y  [1ylevel [5y  [1yof [5y  [1yclassification, [5y  [1yerrors [5y  [1yare [5y  [1ydescribed [5y  [1yin [5y  [1yterms [5y   [1yof
[48{


[6{                 [5y      [1ythe [5y       [1yediting [5y       [1yoperation [5y       [1ythat [5y       [1yis [5y       [1yapplied [5y       [1yto [5y       [1ythe [5y       [1ymisspelling [5y        [1yto [5y       [1yget [5y       [1ythe
[48{


[6{                 [5y      [1ycorrect word (see [5y [1ychapter [5y [1y4).  [5y [1yFor example, [5y [1yto correct [5y [1y'kat' to [5y [1y'cat', [5y [1y'k'
[48{


[6{                 [5y      [1ymust be changed to [5y [1y'c':  the error is [5y [1yreversed to produce the [5y [1ycorrection
[48{


[6{                 [5y      [1yby the application of the edit operation 'change' to 'k' to produce 'c'.

[48{


[6{                   [5y  [1yThe [5y    [1ybasic [5y     [1yediting [5y     [1ycorrection [5y    [1ymethod [5y     [1yis [5y     [1yused [5y    [1yin [5y     [1ya [5y     [1ynumber [5y     [1yof [5y     [1yspelling
[48{


[6{                 [5y      [1ycorrection programs, [5y [1yas [5y [1ydescribed in [5y [1ychapter 3.  [5y [1yWhilst [5y [1yin most [5y [1ycases [5y [1ythis
[48{


[6{                 [5y      [1ymethod [5y    [1yhas [5y     [1ybeen [5y     [1yused [5y    [1yfor [5y     [1ysingle [5y     [1yerror [5y    [1ymisspellings, [5y     [1yBackhouse [5y     [1ydescribes
[48{


[6{                 [5y      [1yhow [5y   [1yit [5y    [1ywould [5y   [1ybe [5y   [1yused [5y    [1yfor [5y   [1ycorrection [5y    [1yof [5y   [1ymultiple [5y    [1yerror [5y   [1ymisspellings: [5y    [1yfor
[48{


[6{                 [5y      [1ydetail of his [5y [1yalgorithm and [5y [1yPascal implementation [5y [1ysee chapter [5y [1y5 [5y [1y(Backhouse,
[48{


[6{                 [5y      [1y1979).  His method will be described here, in less detail.

[48{


[6{                   [5y  [1yThe [5y  [1ytask [5y   [1yis [5y   [1yto [5y   [1yfind [5y  [1ythe [5y   [1ybest [5y   [1yrepair [5y   [1yfor [5y   [1ytransforming [5y  [1ya [5y   [1ystring [5y   [1yE [5y   [1y(the
[48{


[6{                 [5y      [1yerror) into string C (the correction). The edit [5y [1yoperations that are used [5y [1yto
[48{


[6{                 [5y      [1ydo the transformation are:

[5y[1y- insert a character

[5y[1y- delete a character

[5y[1y- change a character[1y[6{[2;4x
                                              [5y   [1y135
[48{


[6{[4;3x1[48{


[6{                             [5y      [1y[2;4x- transpose two adjacent characters

                 [5y      [1yAdditionally, [5y     [1yleaving [5y     [1ya [5y      [1yletter [5y     [1yunchanged [5y     [1ycan [5y      [1ybe [5y     [1yconsidered [5y     [1yan [5y      [1yoperation
[48{


[6{                 [5y      [1ywith no effect.

[48{


[6{[5y[1yThe edit operations will be indicated as follows:

                    [5y          [1y[2;2xb -> 0              delete 'b' from the error string
                         0 -> d              insert 'd' in the error string
                         b -> d              change 'b' to 'd'
                        ei -> ie             transpose 'ei' to 'ie'
                         a -> a              leave 'a' unchanged

                     [2;4xThere are [5y [1yvarious ways [5y [1yin which any [5y [1ymisspelling can [5y [1ybe edited [5y [1yto form [5y [1ythe
[48{


[6{                 [5y      [1ycorrection. [5y        [1yFor [5y        [1yexample, [5y        [1ysome [5y         [1yof [5y        [1ythe [5y        [1yways [5y         [1yto [5y        [1ytransform [5y        [1y'ricev' [5y         [1yto
[48{


[6{                 [5y      [1y'receive' are:

[5y[1y[2;2x1. r -> r    2. r -> r    3. r -> r    4. r -> 0
                          i -> e       i -> 0       i -> e       i -> 0
                          c -> c       0 -> e       c -> c       c -> 0
                          e -> e       c -> c       e -> e       e -> 0
                          0 -> i       0 -> e       v -> i       v -> 0
                          v -> v       0 -> i       0 -> v       0 -> r
                          0 -> e      ev -> ve      0 -> e       0 -> e
                                                                 0 -> c
                                                                 0 -> e
                                                                 0 -> i
                                                                 0 -> v
                                                                 0 -> e

                     [2;4xIn [5y [1ythe [5y [1yfourth [5y [1yexample [5y [1yall [5y [1ythe [5y [1ycharacters [5y [1yin [5y [1ythe [5y  [1yE [5y [1ystring [5y [1yare [5y [1ydeleted [5y [1yand
[48{


[6{                 [5y      [1yall those in the C string are inserted.

[48{


[6{                   [5y  [1yThese [5y  [1ydifferent [5y   [1ytransformations [5y   [1ymay [5y  [1ybe [5y   [1yrepresented [5y   [1yas [5y  [1ya [5y   [1ygraph, [5y   [1ywhere
[48{


[6{                 [5y      [1yeach node corresponds to a position in E string and a position in C string,
[48{


[6{                 [5y      [1yand each arc corresponds to an edit operation.

[48{


[6{                   [5y  [1yThe [5y  [1ygraph [5y   [1yin [5y  [1yfigure [5y   [1y7-2 [5y  [1yrepresents [5y   [1ythe [5y  [1ytranformations [5y   [1y1. [5y  [1yto [5y   [1y4. [5y   [1yabove.
[48{


[6{                 [5y      [1yIt can be seen that [5y [1ythere are many possible [5y [1ypaths through the graph.  [5y [1yIn
[48{


[6{                 [5y      [1yfact, [5y  [1yany [5y  [1yone [5y  [1yword [5y  [1ycan [5y  [1ybe [5y  [1ytransformed [5y  [1yinto [5y  [1yany [5y  [1yother [5y  [1yword [5y  [1yby [5y  [1ydeletion
[48{


[6{                 [5y      [1yof [5y     [1yall [5y     [1ythe [5y     [1yerror [5y     [1ystring [5y      [1ycharacters [5y     [1yand [5y     [1yinsertion [5y     [1yof [5y     [1yall [5y     [1ythe [5y      [1ycorrection
[48{


[6{                 [5y      [1ystring [5y   [1ycharacters.  [5y       [1yIf [5y   [1ywe [5y   [1yassign [5y    [1ycosts [5y   [1yto [5y   [1yeach [5y    [1yedit [5y   [1yoperation [5y   [1ythen [5y    [1ythe


[48{

[6{                 [5y      [1y[4m               [0m

[48{


[6{[5y[1y[4;3x1[48{


[6{Transposition [5y  [1ycan [5y  [1yonly [5y   [1ybe [5y  [1ymade [5y   [1ybetween [5y  [1yadjacent [5y   [1yletters: [5y  [1yrepeated [5y  [1ytranspositions [5y   [1yare
                          [5y  [1ynot permitted.[1y[6{[2;4x
                                              [5y   [1y136
[48{


[6{[5y[1y[2;2xC string

                                r      e      c      e      i      v      e
                            A.      .      .      .      .      .      .      .

                      E   r
                             .      .      .      .      .      .      .      .

                      s   i
                      t      .      .      .      .      .      .      .      .
                      r
                      i   c
                      n      .      .      .      .      .      .      .      .
                      g
                          e
                             .      .      .      .      .      .      .      .

                          v
                             .      .      .      .      .      .      .      .B


                            .       .          .                 .
.      .       .
                                .       .      .                         .
                             ok    change    delete    insert    transpose


                          [5y      [1y[2;4xFigure 7-2:   Graph representing edit operation transformations


                 [5y      [1ycost [5y     [1yof [5y      [1yany [5y      [1ypath [5y     [1ythrough [5y      [1ythe [5y      [1ygraph [5y     [1y(i.e. [5y      [1ythe [5y      [1ycost [5y     [1yof [5y      [1yany [5y      [1yparticular
[48{


[6{                 [5y      [1ytransformation [5y  [1yor [5y   [1ysequence [5y   [1yof [5y  [1yedit [5y   [1yoperations) [5y   [1yis [5y  [1ythe [5y   [1ysum [5y   [1yof [5y   [1yall [5y   [1yopera-
[48{


[6{                 [5y      [1ytions [5y  [1yon [5y  [1ythat [5y  [1ypath.  [5y    [1yThe [5y  [1y'best [5y  [1yrepair' [5y  [1yis [5y   [1ytaken [5y  [1yto [5y  [1ybe [5y  [1ythe [5y  [1ypath [5y  [1ythrough
[48{


[6{                 [5y      [1ythe graph, from [5y [1yA to [5y [1yB, with [5y [1yleast total [5y [1ycost.  For [5y [1yexample, if [5y [1yunit [5y [1ycost
[48{


[6{                 [5y      [1ywere assigned [5y [1yto all [5y [1yedit operations, [5y [1yand zero [5y [1ycost to [5y [1yok(no change), [5y [1ythen
[48{


[6{                 [5y      [1ythe [5y  [1yleast [5y  [1ycost [5y  [1ypath [5y  [1yin [5y  [1ythe [5y  [1yabove [5y  [1yexample [5y  [1ywould [5y  [1ybe [5y  [1ypath [5y  [1y1. [5y  [1ywith [5y  [1ya [5y   [1ycost
[48{


[6{                 [5y      [1yof 3 units.

[5y[1y[2;2xTo calculate the least cost path

[48{


[6{                       [2;4xConsider [5y  [1ytwo [5y  [1ystrings [5y  [1yE [5y  [1yand [5y  [1yC, [5y  [1ywith [5y  [1ylengths [5y  [1ym [5y  [1yand [5y  [1yn [5y  [1yrespectively.  [5y    [1yThe
[48{


[6{                 [5y      [1ygraph [5y     [1yrepresenting [5y     [1ythe [5y      [1ytransformations [5y     [1ybetween [5y      [1ythese [5y     [1ystrings [5y      [1ywill [5y      [1yhave
[48{


[6{                 [5y      [1ydimensions [5y  [1y(0 [5y   [1yto [5y  [1ym) [5y   [1yby [5y   [1y(0 [5y  [1yto [5y   [1yn) [5y  [1ywhere [5y   [1ythe [5y  [1yfirst [5y   [1yletters [5y  [1yof [5y   [1yeach [5y   [1ystring
[48{


[6{                 [5y      [1yE(1) and C(1) are associated with the node (1,1) (see figure 7-3).

[48{


[6{                   [5y  [1yThe least [5y [1ycost [5y [1ypath [5y [1yfrom [5y [1ythe [5y [1ynode [5y [1y(0,0) [5y [1yto [5y [1yany [5y [1ypoint [5y [1yin [5y [1ythe [5y [1ygraph [5y [1ycan
[48{


[6{                 [5y      [1ybe calculated.  [5y [1yFor points (0,1), [5y [1y(0,2)...(0,n) the least [5y [1ycost will be the [5y [1ycost
[48{


[6{                 [5y      [1yof [5y  [1yinserting [5y  [1yletters [5y  [1yC(1), [5y  [1yC(2), [5y  [1yC(3)...C(n).  [5y    [1yThe [5y   [1yleast [5y  [1ycost [5y  [1ypath [5y  [1yfrom [5y   [1y(0,0)
[48{


[6{                 [5y      [1yto (0,1) will be:[1y[6{[2;4x
                                              [5y   [1y137
[48{


[6{                        [5y  [1y[2;2x----> j         C string
                     |
                     |          r      e      c      e      i      v      e
                     |
                     V     (0,0)  (0,1)  (0,2)          (0,j)               (0,n)
                     i       .      .      .      .      .      .      .      .
                         r
                           (1,0)  (1,1)  (1,2)          (1,j)               (1,n)
                      E      .      .      .      .      .      .      .      .
                         i
                      s
                      t      .      .      .      .      .      .      .      .
                      r  c
                      i    (i,0)  (i,1)  (i,2)         (i,j)                (i,n)
                      n      .      .      .      .      .      .      .      .
                      g  e

                             .      .      .      .      .      .      .      .
                         v
                           (m,0)  (m,1)  (m,2)         (m,j)                (m,n)
                             .      .      .      .      .      .      .      .


                                 [2;4xFigure 7-3:   Costgraph showing the node labelling


                  [5y    [1ycost(ins(C(1)))

[48{


[6{[5y[1ywhich [5y [1yis [5y [1ythe [5y  [1ycost [5y [1yof [5y  [1yinserting [5y [1ythe [5y [1ycharacter [5y  [1ythat [5y [1yis [5y [1yin [5y  [1yposition [5y [1y1 [5y [1yin [5y  [1ythe
[48{


[6{                 [5y      [1yC string (inserted in the E string).

[48{


[6{                   [5y  [1ySimilarly the least cost path to (0,2) will be:

[48{


[6{                  [5y    [1ycost(ins(C(1))) + cost(ins(C(2)))

[48{


[6{                 [5y      [1yThis [5y [1ywill [5y [1ybe [5y  [1yreferred [5y [1yto [5y  [1yas [5y [1ythe [5y  [1yminimum [5y [1ycost [5y  [1ypath [5y [1yto [5y  [1ythe [5y [1ynode [5y  [1y(0,2), [5y  [1yor
[48{


[6{                 [5y      [1ymincost(0,2). Thus:

[48{


[6{mincost(0,1) = cost(ins(C(1)))
                  [5y    [1ymincost(0,2) = cost(ins(C(1))) + cost(ins(C(2)))
[5y[1y= mincost(0,1) + cost(ins(C(2)))

[48{


[6{                 [5y      [1ySo for any node (0,j) in the path (0,0) to (0,n):

[48{


[6{                  [5y    [1ymincost(0,j) = mincost(0,j-1) + cost(ins(C(j)))

[48{


[6{                   [5y  [1yFor any node (i,0) in the path (0,0) to (m,0):

[48{


[6{                  [5y    [1ymincost(i,0) = mincost(i-1,0) + cost(del(E(i)))[1y[6{[2;4x
                                              [5y   [1y138
[48{


[6{                 [5y      [1ywhere [5y   [1ycost(del(E(i))) [5y   [1yis [5y   [1ythe [5y   [1ycost [5y   [1yof [5y   [1ydeleting [5y   [1ythe [5y   [1yith [5y   [1ycharacter [5y   [1yof [5y   [1ythe [5y   [1yE
[48{


[6{                 [5y      [1ystring, the error string.

[48{


[6{[5y[1yConsidering the node (1,1) there are four possible paths to this node:

[48{


[6{                    [5y   [1y1. delete(E(1)) and insert(C(1))

                       [5y    [1yinsert(C(1)) and delete(E(1))

                       [5y    [1ychange E(1) to C(1)

                       [5y    [1yif E(1) and C(1) are the same leave them unchanged

[48{


[6{                   [5y  [1yThe respective costs for each of these will be:

[48{


[6{                    [5y [1y(i) mincost(0,1) + cost(del(E(1)))

                       [5y    [1ymincost(1,0) + cost(ins(C(1)))

                       [5y    [1ymincost(0,0) + cost(change(E(1),C(1)))

                       [5y    [1ymincost(0,0) + cost(ok(E(1),C(1)))

[48{


[6{                 [5y      [1yThe mincost(1,1) will be the mininum of these four costs.

[48{


[6{                   [5y  [1yThe [5y       [1yleast [5y        [1ycost [5y        [1yfor [5y       [1yany [5y        [1ynode [5y        [1y(1,j) [5y       [1yin [5y        [1ythe [5y        [1ypath [5y       [1y(1,0) [5y        [1yto [5y        [1y(1,n) [5y        [1yis,
[48{


[6{                 [5y      [1ytherefore:

[48{


[6{mincost(1,j) = minimum of
(mincost(0,j) + cost(del(E(1))),
[5y[1ymincost(1,j-1) + cost(ins(C(j))),
[5y[1ymincost(0,j-1) + cost(change(E(1),C(j))),
[5y[1ymincost(0,j-1) + cost(ok(E(1),C(j)))).

[48{


[6{                 [5y      [1yand similarly for any node (j,1) in the path (0,1) to (m,1)

[48{


[6{                  [5y    [1ymincost(i,1) = minimum of
[5y[1y(mincost(i-1,1) + cost(del(E(i))),
[5y[1ymincost(i,0) + cost(ins(C(1))),
[5y[1ymincost(i-1,0) + cost(change(E(i),C(1))),
[5y[1ymincost(i-1,0) + cost(ok(E(i),C(1)))).

[48{


[6{                   [5y  [1yFor [5y       [1yother [5y       [1ynodes [5y       [1yin [5y       [1ythe [5y       [1ygraph, [5y       [1ywhere [5y       [1yi>=2 [5y       [1yand [5y       [1yj>=2, [5y       [1ythe [5y       [1ycost [5y       [1yof
[48{


[6{                 [5y      [1ytransposition must also be considered:

[48{


[6{                  [5y    [1ymincost(i,j), where 1>=2 and j>=2,
[5y[1y= minimum of
[5y[1y(mincost(i-1,j) + cost(del(E(i))),[1y[6{[2;4x
                                              [5y   [1y139
[48{


[6{[5y[1ymincost(i,j-1) + cost(ins(C(j))),
[5y[1ymincost(i-1,j-1) + cost(change(E(i),C(j))),
[5y[1ymincost(i-1,j-1) + cost(ok(E(i),C(j))),
[5y[1ymincost(i-2,j-2) + cost(transp(E(i-1),E(i)))).

[48{


[6{                   [5y  [1yThe [5y   [1ycost [5y   [1yof [5y   [1ythe [5y   [1yleast [5y   [1ycost [5y   [1ypath [5y   [1ythrough [5y   [1ythe [5y   [1ygraph [5y   [1y(i.e. [5y   [1ythe [5y    [1yminimum
[48{


[6{                 [5y      [1ycost repair [5y [1yof [5y [1ythe [5y [1ytwo strings) [5y [1yis [5y [1ythe minimum [5y [1ycost [5y [1ypath from [5y [1ynode [5y [1y(0,0)
[48{


[6{                 [5y      [1yto node (m,n), mincost(m,n):

[48{


[6{                  [5y    [1ymincost(m,n) = minimum of
[5y[1y(mincost(m-1,n) + cost(del(E(m))),
[5y[1ymincost(m,n-1) + cost(ins(C(n))),
[5y[1ymincost(m-1,n-1) + cost(change(E(m),C(n))),
mincost(m-1,n-1) + cost(ok(E(m),C(n))),
[5y[1ymincost(m-2,n-2) + cost(transp(E(m-1),E(m)))).

[48{


[6{                   [5y  [1yBackhouse [5y     [1ydiscusses [5y     [1ythe [5y     [1yuse [5y     [1yof [5y     [1ythe [5y     [1yalgorithm [5y     [1yfor [5y     [1yspelling [5y     [1ycorrection,
[48{


[6{                 [5y      [1yassigning [5y   [1yunit [5y   [1ycost [5y    [1yto [5y   [1yeach [5y    [1yedit [5y   [1y(Backhouse, [5y   [1y1979).  [5y       [1yHere, [5y   [1yhowever, [5y    [1ydif-
[48{


[6{                 [5y      [1yferent [5y  [1ycosts [5y  [1yhave [5y  [1ybeen [5y  [1yassigned [5y   [1yto [5y  [1yeach [5y  [1yedit [5y   [1yoperation, [5y  [1yand [5y  [1yalso [5y   [1yvarying
[48{


[6{                 [5y      [1ycosts [5y  [1yare [5y   [1yassigned [5y   [1yaccording [5y  [1yto [5y   [1ythe [5y  [1yparticular [5y   [1ycharacters [5y  [1yinvolved [5y   [1yin [5y   [1ythe
[48{


[6{                 [5y      [1yedit.  [5y    [1yWeightings [5y   [1yare [5y  [1yassigned [5y   [1yaccording [5y  [1yto [5y   [1ythe [5y  [1yparticular [5y   [1yedit [5y   [1yoperation
[48{


[6{                 [5y      [1yand [5y        [1ycharacter, [5y         [1yand [5y         [1yfrom [5y         [1ythese [5y         [1yweightings [5y         [1ythe [5y         [1ycosts [5y         [1yare [5y         [1ycalculated.
[48{


[6{                 [5y      [1y(Details [5y [1yof [5y [1ythe [5y [1ycalculations [5y [1yand [5y [1yweightings [5y [1yare [5y [1ygiven [5y  [1ybelow).  [5y  [1yThus [5y [1yfor [5y  [1yany
[48{


[6{                 [5y      [1yerror [5y    [1ythe [5y    [1yminimum [5y     [1ycost [5y    [1yof [5y    [1ytransforming [5y    [1yit [5y    [1yto [5y     [1ymatch [5y    [1yany [5y    [1yword [5y    [1yin [5y     [1ythe
[48{


[6{                 [5y      [1ydictionary [5y    [1ycan [5y     [1ybe [5y     [1ycalculated.  [5y         [1yFor [5y     [1yany [5y     [1yword [5y    [1yinput [5y     [1yby [5y     [1ythe [5y     [1yuser, [5y     [1ythose
[48{


[6{                 [5y      [1ywords [5y  [1yfrom [5y  [1ythe [5y   [1yshortlist [5y  [1ywith [5y   [1ylowest [5y  [1y'minimum [5y   [1ycost [5y  [1yrepair' [5y  [1yare [5y   [1yselected,
[48{


[6{                 [5y      [1yand [5y  [1yoffered [5y   [1yas [5y   [1yoptions [5y   [1yfor [5y   [1ycorrection [5y   [1yto [5y   [1ythe [5y   [1yuser.  [5y      [1yThree [5y   [1yexamples [5y   [1yof
[48{


[6{                 [5y      [1ythe editcost program in use are given in figure 7-4.


[48{


[6{                 [5y      [1y7.2.4. Relation of the children's errors

[48{


[6{                   [5y  [1yA major [5y [1yobjective of [5y [1ythe first [5y [1ystudy was [5y [1yto [5y [1ycollect data [5y [1yon the [5y [1yerrors
[48{


[6{                 [5y      [1ymade [5y        [1yby [5y         [1ychildren [5y         [1yfrom [5y        [1ythe [5y         [1yReading [5y         [1yUnit, [5y        [1ywhen [5y         [1ywriting [5y         [1ycompositions.
[48{


[6{                 [5y      [1yDetails [5y       [1yof [5y       [1ythis [5y        [1ystudy [5y       [1yare [5y        [1ygiven [5y       [1yin [5y        [1ychapter [5y       [1y6.   [5y   [1yDepending [5y       [1yupon [5y        [1ythe
[48{


[6{                 [5y      [1yfrequency [5y      [1yof [5y      [1yparticular [5y       [1yerrors [5y      [1ymade [5y       [1yby [5y      [1ythe [5y       [1ychildren, [5y      [1yweightings [5y       [1ywere
[48{


[6{                 [5y      [1yassigned [5y  [1yto [5y  [1yedit [5y   [1yoperations [5y  [1yin [5y   [1ythe [5y  [1yeditcost [5y  [1yprogram.  [5y     [1yThose [5y  [1yerrors [5y   [1ymade
[48{


[6{                 [5y      [1ymost [5y      [1yfrequently [5y      [1ywere [5y      [1yassigned [5y      [1yhighest [5y      [1yweighting, [5y      [1yand [5y      [1ytherefore [5y       [1ylowest
[48{


[6{                 [5y      [1ycost, [5y     [1ywhich [5y     [1yinfluenced [5y     [1ythe [5y     [1yselection [5y     [1yof [5y     [1ythe [5y     [1yminimum [5y     [1ycost [5y     [1yrepair [5y     [1yof [5y     [1ya
[48{


[6{                 [5y      [1ymisspelling.

[48{


[6{[5y[1yFor [5y   [1yeach [5y   [1ychild, [5y    [1yacross [5y   [1ysessions, [5y    [1ythe [5y   [1yfrequency [5y    [1yof [5y   [1yincorrect [5y    [1ywords [5y    [1ywas[1y[6{[2;4x
                                              [5y   [1y140
[48{


[6{[5y[1y[2;2xw:check
What word do you want to check?
                               w:berayd
Wait a minute while I check it
I have nearly finished checking it
                               It could be
     buried

                                               bed

                                               bad

                                               board

                               w:check
What word do you want to check?
                               w:houes
Wait a minute while I check it
I have nearly finished checking it
                               It could be
     house

                                               hours

                                               horses

                                               hour

                               w:check
What word do you want to check?
                               w:wen
Wait a minute while I check it
It could be
     when

                                               went

                                               win

                                               we

[5y[1y[2;4xFigure 7-4:   Example of the spelling corrector in use


                 [5y      [1ynoted, [5y [1ytogether [5y [1ywith [5y [1ythe [5y [1ymisspelling [5y  [1yand [5y [1ycorrection.  [5y  [1yFor [5y [1yeach [5y  [1ymisspelling,
[48{


[6{                 [5y      [1yall [5y     [1yerrors [5y     [1ywithin [5y     [1ythe [5y     [1ymisspelt [5y     [1yword [5y     [1ywere [5y     [1ytreated [5y     [1yseparately, [5y     [1yand [5y     [1ywere
[48{


[6{                 [5y      [1yclassified [5y     [1yaccording [5y     [1yto [5y      [1ywhether [5y     [1ythey [5y      [1yinvolved [5y     [1ydeletion, [5y     [1yinsertion, [5y      [1ytrans-
[48{


[6{                 [5y      [1yposition, [5y  [1yor [5y  [1ythe [5y  [1ychanging [5y  [1yof [5y  [1ya [5y  [1ycharacter.  [5y    [1yThe [5y  [1ytransformation [5y  [1yof [5y   [1yspelling
[48{


[6{                 [5y      [1yto [5y [1ycorrection [5y [1yinvolving [5y [1ythe [5y [1yminimum [5y  [1ynumber [5y [1yof [5y [1yedit [5y [1yoperations [5y [1ywas [5y  [1ychosen
[48{


[6{                 [5y      [1yin [5y   [1ymost [5y   [1ycases, [5y    [1yusing [5y   [1ythe [5y    [1ysubjective [5y   [1yjudgement [5y    [1yof [5y   [1ythe [5y    [1yauthor [5y   [1yto [5y    [1ydecide
[48{


[6{                 [5y      [1ythe most likely error in [5y [1ycases where a number of interpretations might [5y [1ybe
[48{


[6{                 [5y      [1ymade.[1y[6{[2;4x
                                              [5y   [1y141
[48{


[6{                   [5y  [1yThese [5y  [1yjudgements [5y   [1ywere [5y   [1ybased [5y   [1yon [5y  [1yprevious [5y   [1yobservation [5y   [1yof [5y   [1ythe [5y   [1ychildren's
[48{


[6{                 [5y      [1yerrors, [5y [1yand [5y  [1yreported [5y [1y'frequent [5y  [1yerrors' [5y [1yof [5y  [1yother [5y [1yresearchers. [5y  [1yFor [5y  [1yexample,
[48{


[6{                 [5y      [1ya preferance in [5y [1ycertain cases for [5y [1yphonetic over non-phonetic [5y [1ysubstitutions.
[48{


[6{                 [5y      [1yThree [5y  [1yexamples [5y  [1yof [5y  [1ythe [5y  [1ychoices [5y  [1ymade [5y  [1ywill [5y  [1ybe [5y  [1ygiven [5y  [1yhere.  [5y    [1yIn [5y  [1ythe [5y  [1ycase [5y  [1yof
[48{


[6{                 [5y      [1y'panes' [5y [1ymisspelt [5y  [1yas [5y  [1y'pains' [5y  [1ytwo [5y [1ypossible [5y  [1ytransformations, [5y  [1yeach [5y  [1yinvolving [5y  [1ytwo
[48{


[6{                 [5y      [1yedit operations, are:

[5y[1y[2;2x1. p -> p       2. p -> p
   a -> a          a -> a
   i -> n          i -> 0
   n -> e          n -> n
   s -> s          0 -> e
                   s -> s

                     [2;4xThe second is [5y [1ychosen as the [5y [1yinterpretation: the confusion [5y [1yof 'ai' for [5y [1y'a_e'
[48{


[6{                 [5y      [1ywas [5y  [1yconsidered [5y  [1ya [5y  [1ymore [5y  [1ylikely [5y  [1yerror [5y  [1ythan [5y  [1ythe [5y  [1yconfusion [5y  [1yof [5y  [1y'i' [5y  [1yand [5y  [1y'n' [5y  [1yand
[48{


[6{                 [5y      [1yof 'n' and 'e'.

[48{


[6{[5y[1ySimilarly, in 'wigule' for 'wiggled' the second example is chosen:

                     [5y        [1y[2;2x1. w -> w       2. w -> w
   i -> i          i -> i
   g -> g          g -> g
   u -> g          0 -> g
   l -> l          u -> 0
   e -> e          l -> l
   0 -> d          e -> e
                   0 -> d

                     [2;4xIn this [5y [1ycase it [5y [1yseemed more [5y [1ylikely that [5y [1ythe [5y [1ysecond 'g' [5y [1yhad been [5y [1yomitted
[48{


[6{                 [5y      [1yand [5y   [1ythat [5y   [1ythe [5y   [1y'u' [5y   [1ywas [5y   [1ypart [5y   [1yof [5y   [1ythe [5y   [1y'ule' [5y    [1ygrapheme, [5y   [1yrather [5y   [1ythan [5y   [1ythat [5y    [1y'u'
[48{


[6{                 [5y      [1yand [5y [1y'g' [5y [1yhad [5y [1ybeen [5y [1yconfused.  [5y   [1yIn [5y [1ysome [5y [1ycases, [5y [1ywhere [5y [1ythe [5y [1ytransformation [5y  [1ywas
[48{


[6{                 [5y      [1ynot clear, both sets of errors were counted:

                        [5y  [1y[2;2x'lifet' for 'left'

1. l -> l       2. l -> l
   i -> e          i -> 0
   f -> f         fe -> ef
   e -> 0          t -> t
   t -> t

[48{


[6{[2;4xA frequency count [5y [1ywas made of [5y [1yeach operation involved [5y [1yin an error, [5y [1yand
[48{


[6{                 [5y      [1ythe [5y [1yparticular [5y [1yletter(s) [5y [1yinvolved.  [5y  [1yTotals [5y [1yfor [5y [1yerrors, [5y [1yaccording [5y [1yto [5y [1ythe [5y [1yedit
[48{


[6{                 [5y      [1yoperation involved, are given in figure 7-5.

[48{


[6{                   [5y  [1yIt can be [5y [1yseen that [5y [1ythe most [5y [1yfrequent errors [5y [1ywere those [5y [1yrequiring [5y [1ythe
[48{


[6{                 [5y      [1yinsert operation for correction i.e. [5y [1yletters were omitted from the [5y [1ycorrect[1y[6{[2;4x
                                              [5y   [1y142
[48{


[6{                        [5y  [1y[2;2x1. INSERT.            159      (43%)

                             2. DELETE.             78      (21%)

                             3. TRANSPOSE.          24       (7%)

                             4. CHANGE.            109      (29%)

                             5. TOTAL.             370

                     Operations:
                     insert - insertion of a letter into error to get correction.
                     delete - deletion of a letter from error to give correction.
                     change - change of letter in error into corresponding letter
                              in correction, error/correction.
                     transpose - transposition of letters AB in error to BA in correction.

                                 [5y      [1y[2;4xFigure 7-5:   Study 1: frequency of error types


                 [5y      [1yword.  The change operation accounted for the next highest proportion of
[48{


[6{                 [5y      [1yerrors, with deletions [5y [1yhaving slightly [5y [1ylower percentage [5y [1yoccurrence.  A [5y [1ymuch
[48{


[6{                 [5y      [1ysmaller [5y  [1ypercentage [5y  [1yof [5y  [1yerrors [5y  [1ymade [5y   [1yinvolved [5y  [1ytranspositions.  [5y    [1yThese [5y   [1yfindings
[48{


[6{                 [5y      [1yare [5y      [1yin [5y       [1yaccord [5y       [1ywith [5y       [1ythose [5y      [1yof [5y       [1yMasters [5y       [1y(Masters, [5y       [1y1927) [5y      [1ywho [5y       [1yalso [5y       [1yfound
[48{


[6{                 [5y      [1yinsertions most frequent and transpositions the least frequent.

[48{


[6{                   [5y  [1yFrequencies of [5y [1yerrors [5y [1yfor [5y [1yspecific characters, [5y [1yfor [5y [1yall [5y [1ychildren, [5y [1yare [5y [1ygiven
[48{


[6{                 [5y      [1yin [5y [1yfigure [5y  [1y7-6.  [5y   [1yThe [5y  [1ynumber [5y  [1yof [5y [1ychildren [5y  [1ymaking [5y [1yeach [5y  [1yerror [5y [1y(maximum [5y  [1y7) [5y  [1yis
[48{


[6{                 [5y      [1yalso given.  [5y [1yIt should be [5y [1ynoted that, as [5y [1ywell as [5y [1yconsidering the [5y [1yapplication
[48{


[6{                 [5y      [1yof [5y  [1yedit [5y  [1yoperations [5y  [1yto [5y  [1yindividual [5y   [1ycharacters [5y  [1y(a [5y  [1yto [5y  [1yz), [5y  [1ya [5y  [1ynumber [5y  [1yof [5y   [1yspecial
[48{


[6{                 [5y      [1ycases [5y  [1ywere [5y  [1yalso [5y   [1yconsidered [5y  [1ye.g. [5y   [1yeach [5y  [1y'l' [5y   [1yof [5y  [1y'll' [5y   [1y(double [5y  [1y'l' [5y   [1yin [5y  [1yerror [5y   [1yor [5y   [1yin
[48{


[6{                 [5y      [1ycorrection); [5y   [1ysilent [5y    [1yinitial [5y   [1y'k' [5y    [1yor [5y   [1y'w' [5y    [1y('know' [5y   [1yor [5y    [1y'write'); [5y    [1yfinal [5y   [1y'e' [5y    [1y('cane');
[48{


[6{                 [5y      [1ysilent second 'h' ('when'); the 'c' or 'k' of 'ck' ('back').

[48{


[6{                   [5y  [1yThe most frequent errors were those involving vowels, 'e' in particular is
[48{


[6{                 [5y      [1yinvolved in some 100 of the 370 errors.


[48{


[6{                 [5y      [1y7.2.5. Detail of the editcost program

[48{


[6{                   [5y  [1yThe word [5y [1yto [5y [1ybe [5y [1ychecked, [5y [1ythe [5y [1yinpw, [5y [1yis [5y [1ycompared with [5y [1yeach [5y [1yword [5y [1yon [5y [1ythe
[48{


[6{                 [5y      [1yshortlist, [5y  [1ydictw, [5y   [1yin [5y   [1yturn.  [5y     [1yFor [5y   [1yeach [5y  [1ypair, [5y   [1yinpw [5y   [1yand [5y  [1ydictw, [5y   [1ythe [5y   [1ystring [5y   [1yto
[48{


[6{                 [5y      [1ystring [5y  [1yrepair [5y   [1ygraph [5y   [1yis [5y   [1yconstructed [5y  [1yand [5y   [1yall [5y   [1ycost [5y   [1ypaths [5y  [1ythrough [5y   [1ythe [5y   [1ygraph
[48{


[6{                 [5y      [1yare calculated, [5y [1yusing [5y [1ythe [5y [1yalgorithm [5y [1ydescribed [5y [1yabove.  [5y  [1yCosts [5y [1yare [5y [1ydetermined
[48{


[6{                 [5y      [1yby [5y  [1yweightings [5y  [1yassigned [5y  [1yby [5y  [1ythe [5y  [1yprogram [5y  [1yat [5y  [1ythe [5y  [1ystart [5y   [1yof [5y  [1yeach [5y  [1ysession [5y  [1y(see
[48{


[6{                 [5y      [1ybelow for details [5y [1yof the weightings [5y [1yand calculations).  [5y [1yThe five words [5y [1ywith[1y[6{[2;4x
                                              [5y   [1y143
[48{


[6{                    [5y          [1y[2;2xInsert         Delete         Change       Transpose
                      letter freq.   letter freq.  letters  freq.  letters freq.
                         e   20/7       a   15/6      e/a   8/5     ae/ea   5/4
                     fnl e   20/6   fnl e   14/6      o/a   8/4     hg/gh   2/2
                         i   14/6       i   10/4      u/o   6/4     se/es   3/1
                         a   12/5       e    7/5      e/u   4/4     de/ed   2/1
                         r   12/5       o    5/3      a/e   4/4     ed/de   1/1
                         w    5/5       u    4/3      a/o   4/3     el/le   1/1
                     dbl l    7/4       r    4/3      s/c   3/3     le/el   1/1
                     scd h    7/4   scd h    4/2      m/n   3/3     er/re   1/1
                         g    7/3       g    2/2      d/b   3/2     en/ne   1/1
                         u    5/3       t    2/1      c/k   2/2     ol/lo   1/1
                         l    4/3       y    1/1      i/e   2/2     ye/ey   1/1
                         d    4/3   dbl r    1/1      a/u   2/2     uo/ou   1/1
                         o    4/3   dbl p    1/1      i/y   2/2     nh/hn   1/1
                         y    3/3   dbl g    1/1      t/p   2/2     fe/ef   1/1
                         t    5/2   dbl o    1/1      u/e   2/2     oh/ho   1/1
                         n    5/2       h    1/1      h/i   2/2     th/ht   1/1
                         c    3/2    kn k    1/1      k/c   3/1
                     dbl s    2/2       n    1/1      f/v   3/1
                         f    2/2       l    1/1      o/u   3/1
                     dbl t    2/2   dbl n    1/1      c/g   2/1
                      ck c    2/2       d    1/1      g/c   2/1
                         s    2/2                     s/k   2/1
                     dbl r    2/2                     o/e   1/1
                     dbl e    1/1                     u/w   1/1
                     dbl d    1/1                     t/r   1/1

                     Frequency of errors: frequencies given as the number of
                     errors made/number of the students making the error.
                     (Only 25 most frequent given for insert and change)

                     Abbreviations:
                     fnl = final (fnl e in make)    dbl = double (dbl l in bell)
                     scd = second (scd h in when)   kn = silent k (knit)
                     ck = c or k of pair ck


[5y[1y[2;4xFigure 7-6:   Study 1: frequency of types of spelling errors


                 [5y      [1yminimum [5y     [1yrepair [5y      [1ycosts [5y      [1yare [5y      [1yalways [5y      [1ysaved.   When [5y     [1yall [5y      [1ythe [5y      [1ydictws [5y      [1yon [5y      [1ythe
[48{


[6{                 [5y      [1yshortlist have been [5y [1ycompared with [5y [1ythe inpw, [5y [1ythe four [5y [1ywith minimum [5y [1yrepair
[48{


[6{                 [5y      [1ycost [5y [1yare [5y [1yoffered [5y  [1yto [5y [1ythe [5y  [1yuser.  [5y   [1yExamples [5y [1yof [5y  [1ythe [5y [1ycosts [5y [1yof [5y  [1ythe [5y [1yfive [5y  [1ysaved
[48{


[6{                 [5y      [1ydictws for [5y [1yeach [5y [1yof four [5y [1yinpws [5y [1yare given [5y [1yin [5y [1yfigure 7-7, [5y [1ytogether [5y [1ywith [5y [1ythe
[48{


[6{                 [5y      [1yintended word.

[48{


[6{[5y[1yCosts [5y      [1ywere [5y       [1yassigned [5y       [1yaccording [5y      [1yto [5y       [1ythe [5y       [1yparticular [5y      [1ycharacter [5y       [1yand [5y       [1yedit
[48{


[6{                 [5y      [1yoperation [5y [1yinvolved.  [5y    [1yAs [5y  [1ywell [5y [1yas [5y  [1yconsidering [5y  [1ythe [5y  [1ycharacters [5y [1y'a' [5y  [1yto [5y  [1y'z', [5y  [1yin [5y  [1ya
[48{


[6{                 [5y      [1ynumber [5y  [1yof [5y  [1ycases [5y   [1ythe [5y  [1yposition [5y  [1yof [5y   [1ythe [5y  [1ycharacter, [5y  [1yand [5y  [1yadjacent [5y   [1ycharacters,
[48{


[6{                 [5y      [1ywere [5y [1yalso [5y [1yconsidered.  [5y   [1yThese [5y [1ycases [5y  [1yare [5y [1yreferred [5y [1yto [5y  [1yas [5y [1y'special [5y [1ycases', [5y  [1yand
[48{


[6{                 [5y      [1ywere [5y       [1yassigned [5y        [1yweightings [5y        [1yindependent [5y        [1yof [5y       [1ythose [5y        [1yassigned [5y        [1yto [5y        [1ythe [5y        [1ysame[1y[6{[2;4x
                                              [5y   [1y144
[48{


[6{                        [5y  [1y[2;2xinpw=reck                           wreck
                             Options were
                             wreck   cost=  0.362
                             rock    cost=  0.883
                             reach   cost=  1.211
                             rocks   cost=  1.433
                             recall  cost=  1.573

                             inpw=roack                          rock
                             Options were
                             rock    cost=  0.466
                             rocks   cost=  1.016
                             wreck   cost=  1.319
                             reach   cost=  1.733
                             road    cost=  1.766

                             inpw=kuver                          cover
                             Options were
                             cover   cost=  1.082
                             curve   cost=  1.677
                             keeper  cost=  1.733
                             corner  cost=  2.293
                             keep    cost=  2.316

                             inpw=bilt                           built
                             Options were
                             built   cost=  0.407
                             belt    cost=  0.550
                             bit     cost=  0.764
                             belts   cost=  1.100
                             build   cost=  1.290


                             [5y    [1y[2;4xFigure 7-7:   Example of candidates and mininum editcost


                 [5y      [1ycharacters [5y [1yin [5y [1yother [5y  [1ycontexts.  [5y   [1yFor [5y  [1yexample, [5y [1y'e' [5y  [1yin [5y [1ythe [5y  [1yfinal [5y [1yposition [5y  [1yin [5y  [1ya
[48{


[6{                 [5y      [1ystring [5y  [1y(error [5y   [1yor [5y   [1ycorrection) [5y  [1yhad [5y   [1ya [5y   [1ydifferent [5y  [1yweighting [5y   [1yfrom [5y  [1y'e' [5y   [1yin [5y   [1yother
[48{


[6{                 [5y      [1ypositions.  A list of [5y [1yspecial cases is [5y [1ygiven in figure [5y [1y7-8.  When [5y [1yconsidering
[48{


[6{                 [5y      [1yany character [5y [1yin [5y [1ythe E [5y [1yor [5y [1yC strings, [5y [1yit [5y [1ywas first [5y [1ytested to [5y [1ysee if [5y [1yit [5y [1ywas
[48{


[6{                 [5y      [1yone of these [5y [1y'special cases'. If [5y [1yit was, it [5y [1ywas recoded with [5y [1yan upper [5y [1ycase
[48{


[6{                 [5y      [1ycharacter, as shown in the [5y [1yfigure 7-8.  For example, the 'k' in 'know' [5y [1ywas
[48{


[6{                 [5y      [1yrecoded as 'B'.

[48{


[6{[5y[1yWeightings assigned were represented as array values [5y [1yin the range 2.5 [5y [1yto
[48{


[6{                 [5y      [1y10.  [5y   [1yFour [5y  [1yarrays [5y [1yof [5y  [1yweightings [5y  [1ywere [5y [1yset [5y  [1yup, [5y [1yone [5y  [1yfor [5y [1yeach [5y  [1yedit [5y  [1yoperation
[48{


[6{                 [5y      [1y(no [5y      [1yweighting [5y      [1ywas [5y      [1yrecorded [5y      [1yfor [5y      [1ythe [5y      [1yok [5y      [1yedit).   A [5y      [1ylist [5y      [1yof [5y      [1ythe [5y      [1yactual
[48{


[6{                 [5y      [1yweightings [5y [1yassigned [5y  [1yis [5y  [1ygiven [5y  [1yin [5y [1yfigure [5y  [1y7-9.  [5y    [1yThe [5y  [1yweighting [5y [1yfor [5y  [1ydeleting [5y  [1yor
[48{


[6{                 [5y      [1yinserting [5y    [1yany [5y    [1ycharacter [5y    [1yis [5y    [1ystored [5y    [1yin [5y    [1ythe [5y    [1yone-dimensional [5y    [1yarrays [5y    [1ydeletew-
[48{


[6{                 [5y      [1ytarray [5y [1yand [5y [1yinsertwtarray, [5y  [1yrespectively, [5y [1yindexed [5y  [1yby [5y [1ythe [5y  [1ycharacter [5y [1yitself [5y  [1y(or[1y[6{[2;4x
                                              [5y   [1y145
[48{


[6{                   [5y  [1y[2;2xRepresentation     Letter(adjacent letter)

                             A               final e
                             B               k(n) at start of word
                             C               w(r) or w(h)
                             D               h in second position
                             E               t(t)
                             F               r(r)
                             G               o(o)
                             H               e(e)
                             I               p(p)
                             J               b(b)
                             K               k(k)
                             L               m(m)
                             M               l(l)
                             N               s(s)
                             O               f(f)
                             P               n(n)
                             Q               d(d)
                             R               z(z)
                             S               c(k)
                             T               (c)k
                             U               g(h)

[5y[1y[2;4xFigure 7-8:   Representation of 'special cases'


                 [5y      [1ycharacter [5y  [1yrepresentation [5y   [1yin [5y  [1yspecial [5y   [1ycases).  [5y     [1yThe [5y  [1ychangewtarray [5y   [1yand [5y   [1ytrans-
[48{


[6{                 [5y      [1yposewtarray are [5y [1ytwo-dimensional.  Weightings [5y [1yare given [5y [1yin the [5y [1yfigure for [5y [1ya
[48{


[6{                 [5y      [1ynumber of [5y [1ychange [5y [1yand [5y [1ytranspose combinations.  [5y  [1yThe [5y [1ycost [5y [1yof [5y [1ychanging [5y [1ypairs
[48{


[6{                 [5y      [1yof characters [5y [1yis [5y [1yconsidered separately [5y [1yin [5y [1ya number [5y [1yof [5y [1ycases: e.g. [5y [1ythe [5y [1ycost
[48{


[6{                 [5y      [1yof changing [5y [1y'f' [5y [1yto 'th', [5y [1yor [5y [1y'ff' to [5y [1y'gh' [5y [1yare indexed [5y [1yseparately. [5y [1y(see [5y [1yfigure
[48{


[6{                 [5y      [1y7-9).

[48{


[6{[5y[1yFor [5y  [1yeach [5y   [1ypair [5y   [1yof [5y  [1ynodes [5y   [1yto [5y   [1ybe [5y  [1ycompared [5y   [1ythe [5y  [1ycostgraph [5y   [1yis [5y   [1yconstructed.
[48{


[6{                 [5y      [1yAt each node [5y [1ythe pair [5y [1yof characters [5y [1yE(i) and [5y [1yC(j) is [5y [1yconsidered:  [5y [1ythey [5y [1yare
[48{


[6{                 [5y      [1ytested [5y [1yfirst [5y [1yto [5y [1ysee [5y [1yif [5y  [1ythey [5y [1yare [5y [1y'special [5y [1ycases'.  [5y  [1yWeightings [5y [1yfor [5y [1yeach [5y  [1yedit
[48{


[6{                 [5y      [1yoperation [5y      [1yat [5y      [1ythe [5y      [1ynode [5y      [1y(i,j) [5y      [1yare [5y      [1yfound.   [5y [1yInsert [5y      [1yweightings [5y      [1yand [5y       [1ydelete
[48{


[6{                 [5y      [1yweightings are the values of the array elements indexed by the characters.
[48{


[6{                 [5y      [1yIf [5y       [1ythere [5y        [1yis [5y        [1ya [5y       [1ymatch [5y        [1yfor [5y        [1ya [5y        [1ytransposition, [5y       [1ythat [5y        [1yis [5y        [1yif [5y        [1yE(i-1)=C(j) [5y        [1yand
[48{


[6{                 [5y      [1yE(i)=C(j-1), [5y  [1ythen [5y   [1ythe [5y   [1ytranspose [5y   [1yedit [5y  [1yweighting [5y   [1yis [5y   [1ygiven [5y  [1yby [5y   [1ythe [5y   [1ytranposew-
[48{


[6{                 [5y      [1ytarray [5y  [1yelement [5y   [1y(E(i-1),E(i)).  [5y     [1yIf [5y  [1yE(i)=C(j), [5y   [1ythat [5y  [1yis [5y   [1yif [5y  [1ythe [5y   [1ycharacters [5y   [1ymatch,
[48{


[6{                 [5y      [1ythen [5y [1ythe [5y [1yedit [5y [1ycost [5y [1yis [5y [1yzero, [5y [1yotherwise [5y [1ythe [5y [1ychange [5y [1yedit [5y [1yweighting [5y [1yis [5y [1yfound.
[48{


[6{                 [5y      [1yCharacters preceding [5y [1yand [5y [1yfollowing [5y [1yE(i) and [5y [1yC(j) [5y [1yare [5y [1ynoted.  [5y  [1yAdjacent [5y [1ypairs
[48{


[6{                 [5y      [1yof [5y     [1ycharacters, [5y      [1yE(i),E(i+1)/E(i-1),E(i)/C(j),C(j+1)/C(j-1),C(j), [5y     [1yare [5y      [1ycompared [5y      [1ywith
[48{


[6{                 [5y      [1ythe [5y   [1ycharacters [5y    [1ypairs [5y    [1ylisted [5y    [1yunder [5y    [1y'changewts' [5y    [1y(see [5y    [1yfigure [5y    [1y7-9) [5y    [1yand [5y    [1yif [5y    [1ya
[48{


[6{                 [5y      [1ymatch [5y    [1yis [5y     [1yfound [5y     [1yweightings [5y     [1yare [5y    [1yassigned [5y     [1yaccordingly: [5y     [1yotherwise [5y     [1ythe [5y     [1yvalue[1y[6{[2;4x
                                              [5y   [1y146
[48{


[6{                 [5y      [1y[2;2xinsertwt       deletewt       changewt      transwt
                     a  9.0         a  6.0         a/e  7.0      ae  9.0
                     b  4.0         b  2.5         a/o  7.0      au  8.0
                     c  5.0         c  2.5         a/u  5.0      de  8.0
                     d  7.0         d  3.5         b/d  4.0      ea  9.0
                     e 10.0         e  5.0         c/k  5.0      ei  9.0
                     f  5.0         f  2.5         e/a  8.0      el  9.0
                     g  7.0         g  4.0         e/i  4.0      es  9.0
                     h  8.0         h  3.5         e/u  7.0      er  9.0
                     i  9.0         i  5.0         h/i  5.0      ed  8.0
                     j  4.0         j  2.5         i/e  5.0      ey  8.0
                     k  4.0         k  2.5         i/y  6.0      ef  8.0
                     l  7.0         l  3.5         k/c  4.0      fe  8.0
                     m  4.0         m  2.5         m/n  6.0      gh  8.0
                     n  5.0         n  3.5         n/m  4.0      hg  8.0
                     o  7.0         o  5.0         o/u  4.0      hn  8.0
                     p  4.0         p  2.5         p/b  6.0      ht  8.0
                     q  4.0         q  2.5         s/c  6.0      ie  9.0
                     r  9.0         r  4.0         t/p  5.0      le  9.0
                     s  5.0         s  3.5         u/a  4.0      nh  8.0
                     t  5.0         t  3.5         u/e  5.0      re  9.0
                     u  7.0         u  5.0         u/o  7.0      se  9.0
                     v  4.0         v  2.5         y/i  4.0      th  8.0
                     w  8.0         w  2.5         f/gh 4.0      ua  8.0
                     x  4.0         x  2.5         f/th 6.0      ye  8.0
                     y  7.0         y  4.0         f/ph 6.0   all others=7.0
                     z  4.0         z  2.5         g/ch 4.0
                     A 10.0         A  6.0         j/ch 4.0
                     B  8.0         B  3.5         v/th 4.0
                     C  8.0         C  2.5         w/gh 4.0
                     D  8.0         D  4.0         y/gh 4.0
                     E  7.0         E  3.5         y/ie 5.0
                     F  9.0         F  4.0        ch/j  4.0
                     G  7.0         G  5.0        ch/t  4.0
                     H 10.0         H  5.0        ff/gh 4.0
                     I  6.0         I  3.5        gh/ff 3.5
                     J  6.0         J  3.0        oo/ue 4.5
                     K  7.0         K  4.0        ow/ue 4.5
                     L  6.0         L  3.0        th/f  4.5
                     M  8.0         M  3.5      all others=3.0
                     N  7.0         N  3.5
                     O  6.0         O  3.0
                     P  7.0         P  4.0
                     Q  7.0         Q  3.5
                     R  6.0         R  3.0
                     S  7.0         S  3.0
                     T  6.0         T  3.0
                     U  4.0         U  4.0


[5y[1y[2;4xFigure 7-9:   Weightings assigned to edit functions[1y[6{[2;4x
                                              [5y   [1y147
[48{


[6{                 [5y      [1ystored in the [5y [1ychangewtarray element [5y [1y(E(i),C(j)) is [5y [1ythe change [5y [1yedit [5y [1yweighting
[48{


[6{                 [5y      [1yfor the [5y [1ycurrent [5y [1ynode.  [5y [1yThe [5y [1yweightings are [5y [1yused to [5y [1ycalculate the [5y [1ycost [5y [1yfor
[48{


[6{                 [5y      [1yeach edit operation at each node, where

[48{


[6{                  [5y    [1ycost = 0.05 + (2.5/weighting)

[48{


[6{                 [5y      [1yThe maximum [5y [1ycost [5y [1yof [5y [1ya single [5y [1yedit [5y [1yis [5y [1y1.05 [5y [1y(weighting=2.5) [5y [1yand [5y [1ythe [5y [1yminimum
[48{


[6{                 [5y      [1ycost [5y       [1yis [5y       [1y0.3 [5y       [1y(weighting=10).   [5y  [1yUsing [5y       [1ythe [5y       [1yalgorithm [5y       [1ydescribed [5y       [1yabove, [5y       [1ythe
[48{


[6{                 [5y      [1yminimum cost of each node [5y [1yis calculated, for all [5y [1ynodes, and the least [5y [1ycost
[48{


[6{                 [5y      [1ypath through the graph determined.

[48{


[6{                   [5y  [1yThe [5y [1yweightings [5y  [1ywere [5y [1ychosen [5y  [1yby [5y [1yconsidering [5y  [1ythose [5y [1yerrors [5y  [1ymost [5y  [1yfrequently
[48{


[6{                 [5y      [1ymade [5y    [1yby [5y    [1ythe [5y    [1ychildren [5y    [1yin [5y    [1yStudy [5y    [1y1, [5y     [1yand [5y    [1yby [5y    [1yexperimenting [5y    [1ywith [5y     [1ydifferent
[48{


[6{                 [5y      [1ycosts [5y   [1yand [5y   [1yweighting [5y    [1yfunctions, [5y   [1ytesting [5y    [1ythem [5y   [1yon [5y   [1ya [5y    [1ysubset [5y   [1yof [5y   [1ythe [5y    [1yerrors.
[48{


[6{                 [5y      [1yThey [5y   [1ywere [5y    [1yset [5y   [1yup [5y    [1ysuch [5y   [1ythat [5y    [1y2 [5y   [1yvery [5y    [1yfrequent [5y    [1yerrors, [5y   [1ythat [5y    [1ymight [5y    [1yoften
[48{


[6{                 [5y      [1yoccur together, would [5y [1yhave lower cost [5y [1ythan a single [5y [1y(less likely error), [5y [1yand
[48{


[6{                 [5y      [1yhence [5y   [1ythe [5y   [1ymatched [5y   [1ydictw [5y   [1yinvolving [5y   [1y2 [5y   [1yedit [5y   [1yoperations [5y   [1ycould [5y   [1ybe [5y   [1ychosen [5y    [1yin
[48{


[6{                 [5y      [1ypreference to [5y [1yanother dictw [5y [1yinvolving only [5y [1y1 edit [5y [1yoperation.  [5y [1yFor [5y [1yexample,
[48{


[6{                 [5y      [1yif [5y [1ythe [5y [1ymisspelling [5y  [1yis [5y [1y"wud" [5y [1yit [5y  [1ycould [5y [1ybe [5y [1yedited [5y  [1yto [5y [1y"would" [5y  [1yby [5y [1yinserting [5y  [1y"o"
[48{


[6{                 [5y      [1yand [5y [1y"l" [5y [1y(2 [5y  [1yoperations, [5y [1ycost=.814). [5y [1yIt [5y [1ycould [5y [1ybe [5y  [1yedited [5y [1yto [5y [1ymatch [5y [1y"mud" [5y  [1ywith
[48{


[6{                 [5y      [1y1 [5y      [1yoperation, [5y      [1ychange [5y       [1y"w" [5y      [1yto [5y      [1y"m" [5y       [1y(cost=.838). [5y      [1yThe [5y      [1ymatch [5y       [1yto [5y      [1y"would" [5y       [1yis
[48{


[6{                 [5y      [1ycheaper.  [5y  [1yIn [5y [1ytheory, [5y [1y3 [5y [1yof [5y [1ythe [5y [1y'cheapest' [5y [1yedits [5y [1y(minimum [5y [1ycost [5y [1y0.3, [5y [1yweight-
[48{


[6{                 [5y      [1ying [5y [1y10) [5y [1ywould [5y [1ybe [5y [1yless [5y  [1ycostly [5y [1ythan [5y [1y1 [5y [1yof [5y  [1ythe [5y [1ymost [5y [1yexpensive [5y [1y(maximum [5y  [1ycost
[48{


[6{                 [5y      [1y1.05, [5y   [1yweighting=2.5): [5y    [1yit [5y   [1yis [5y    [1yvery [5y   [1ydifficult, [5y    [1yhowever, [5y   [1yto [5y    [1yimagine [5y   [1ycases [5y    [1ywhen
[48{


[6{                 [5y      [1ythis [5y       [1ywould [5y        [1yhappen.   [5y    [1yThough [5y       [1ythe [5y        [1ytransposition [5y        [1yerrors [5y        [1ywere [5y        [1ythe [5y        [1yleast
[48{


[6{                 [5y      [1yfrequent [5y [1yof [5y [1ythe [5y [1yerror types [5y [1ythey [5y [1ywere [5y [1ygiven [5y [1yhigh [5y [1yweightings: [5y [1ythis [5y [1ywas [5y [1yto
[48{


[6{                 [5y      [1yincrease [5y [1ythe [5y [1ylikelihood [5y [1yof [5y [1yany [5y  [1yerror [5y [1ybeing [5y [1yclassed [5y [1yas [5y  [1ya [5y [1ytransposition, [5y [1yif [5y  [1yit
[48{


[6{                 [5y      [1ycould be considered as such.

[48{


[6{                   [5y  [1yAn [5y [1yexample [5y [1ywill [5y  [1ybe [5y [1ygiven [5y [1yto [5y [1yillustrate [5y [1ythe [5y  [1ymethod [5y [1yof [5y [1ycalculation [5y [1yof [5y  [1ythe
[48{


[6{                 [5y      [1yminimum [5y [1ycost [5y  [1yrepair.  [5y   [1yFor [5y  [1ythe [5y  [1yfour [5y [1ypaths [5y  [1ygiven [5y  [1yin [5y [1yfigure [5y  [1y7-2, [5y  [1ythe [5y  [1ygraph
[48{


[6{                 [5y      [1yshowing [5y      [1ythe [5y      [1yweightings, [5y      [1yfour [5y      [1yof [5y      [1ythe [5y      [1ypossible [5y      [1ytransformations, [5y      [1yand [5y       [1ythe
[48{


[6{                 [5y      [1ycosts [5y  [1yfor [5y   [1yeach [5y  [1ytransformation [5y   [1yare [5y  [1ygiven.  [5y     [1yThe [5y   [1yweightings [5y  [1yfor [5y   [1ythe [5y   [1ytrans-
[48{


[6{                 [5y      [1yformations are given in figure 7-10.

[48{


[6{                   [5y  [1yThe transformations are:[1y[6{[2;4x
                                              [5y   [1y148
[48{


[6{[5y[1y[2;2xricev -> receive

C string

                                r      e      c      e      i      v      e
                             .      .      .      .      .      .      .      .
                          r
E     4     ok
.      .      .      .      .      .      .      .
                          i
s     5      5     5
t      .      .      .      .      .      .      .      .
                      r   c
i    2.5          10       ok
                      n      .      .      .      .  10  .  9   .      .      .
                      g   e
 5                           ok
                             .      .      .      .      .  9   .      . 7    .
                          v
2.5                                3       ok
                             .      .      .      .      .      .      .      .
                                9      10     5      10     9      4      10


                                  [2;4xFigure 7-10:   Graph showing example weightings


                   [5y  [1y[2;2x1. r -> r    2. r -> r    3. r -> r    4. r -> 0
                          i -> e       i -> 0       i -> e       i -> 0
                          c -> c       0 -> e       c -> c       c -> 0
                          e -> e       c -> c       e -> e       e -> 0
                          0 -> i       0 -> e       v -> i       v -> 0
                          v -> v       0 -> i       0 -> v       0 -> r
                          0 -> e      ev -> ve      0 -> e       0 -> e
                                                                 0 -> c
                                                                 0 -> e
                                                                 0 -> i
                                                                 0 -> v
                                                                 0 -> e

                     [2;4xThe costs for each transformation will be:

                    [5y   [1y1. 0 + .55 + 0 + 0 + .327 + 0 + .3 = 1.177

                    [5y   [1y2. 0 + .55 + .3 + 0 + .3 + .327 + .407 = 1.884

                    [5y   [1y3. 0 + .55 + 0 + 0 + .883 + .675 + .3 = 2.408

                    [5y   [1y4. .675 + .55 + 1.05 + .55 + 1.05 [5y [1y+ .327 + .3 + .55 + .3 + [5y [1y.327 +
                      [5y      [1y.675 + .3 = 6.654

[48{


[6{[5y[1yThe [5y  [1yperformance [5y   [1yof [5y   [1ythe [5y  [1yeditcost [5y   [1yalgorithm, [5y   [1ytogether [5y  [1ywith [5y   [1ypossible [5y   [1yim-
[48{


[6{                 [5y      [1yprovements and extensions, is discussed in chapter 8.[1y[6{[2;4x
                                              [5y   [1y149
[48{


[6{                 [5y      [1y7.3. Phonemic coding of words: the phoncode program


[48{


[6{                 [5y      [1y7.3.1. General overview

[48{


[6{[5y[1yWhen [5y        [1yphoneme-grapheme [5y        [1ycorrespondence [5y        [1yrules [5y        [1yare [5y        [1yused [5y        [1yto [5y         [1ygenerate
[48{


[6{                 [5y      [1yspellings, [5y   [1ymisspellings [5y    [1ymay [5y    [1yoccur [5y    [1ywhen [5y    [1yincorrect [5y    [1yrules [5y    [1yare [5y    [1yused, [5y    [1yor [5y    [1ywhen
[48{


[6{                 [5y      [1ythe [5y [1yrules [5y  [1yare [5y  [1yinappropriate [5y [1y(for [5y  [1yexample [5y  [1yan [5y [1yirregularly [5y  [1yspelt [5y  [1yword).  [5y   [1yIf [5y  [1ya
[48{


[6{                 [5y      [1yword is misspelt in this way, it might be corrected as follows:

                    [5y   [1y1. isolate the graphemes in the word

                    [5y   [1y2. infer [5y    [1ywhich [5y     [1yphoneme-grapheme [5y     [1ycorrespondence [5y    [1yrules [5y     [1ymay [5y     [1yhave
                      [5y      [1ybeen used to produce the graphemes

                    [5y   [1y3. select [5y     [1ya [5y     [1yset [5y      [1yof [5y     [1yphonemes [5y      [1ythat [5y     [1ycould [5y      [1yhave [5y     [1ygenerated [5y      [1ythese
                      [5y      [1ygraphemes

[5y[1y4. use the set of phonemes to generate the correct spelling

[48{


[6{                   [5y  [1yIn [5y  [1ythe [5y  [1yfirst [5y  [1ythree [5y  [1ysteps, [5y  [1ythe [5y  [1yphoneme-grapheme [5y  [1ycorrespondence [5y  [1yrule [5y  [1yis
[48{


[6{                 [5y      [1ybeing [5y       [1yused [5y       [1yin [5y       [1yreverse. [5y       [1yThis [5y       [1yis [5y       [1ynot [5y       [1yequivalent, [5y       [1yhowever, [5y       [1yto [5y       [1yusing [5y       [1ythe
[48{


[6{                 [5y      [1ygrapheme-phoneme [5y  [1yrules [5y  [1yas [5y  [1yin [5y  [1yreading.  [5y    [1yThis [5y  [1ymethod [5y  [1yof [5y  [1ycorrection [5y  [1yis [5y   [1ythe
[48{


[6{                 [5y      [1ybasis of the phoncode program, to be described here.


[48{


[6{                 [5y      [1y7.3.2. Related work

[48{


[6{Research [5y   [1yon [5y    [1ygrapheme [5y    [1yto [5y   [1yphoneme [5y    [1ycorrespondence [5y    [1yrules [5y   [1yis [5y    [1yof [5y    [1yinterest
[48{


[6{                 [5y      [1yhere, [5y     [1yin [5y     [1ythat [5y      [1yit [5y     [1ygives [5y     [1ysome [5y      [1yguide [5y     [1yto [5y     [1ypronunciation [5y      [1yof [5y     [1ycorrectly [5y      [1yspelt
[48{


[6{                 [5y      [1ywords, [5y         [1yand [5y          [1yalso [5y         [1yfor [5y          [1yregular [5y         [1ynon-words. [5y          [1yAs [5y         [1ydiscussed [5y          [1yin [5y         [1ychapter [5y          [1y2,
[48{


[6{                 [5y      [1ygrapheme-phoneme [5y        [1yrules [5y         [1ycan [5y         [1ybe [5y         [1yspecified [5y         [1ymore [5y         [1yeasily [5y         [1ythan [5y         [1yphoneme-
[48{


[6{                 [5y      [1ygrapheme [5y [1yrules. [5y [1yWork [5y  [1yby [5y [1yVenezky [5y  [1yis [5y [1yof [5y  [1yparticular [5y [1yrelevance [5y [1yhere [5y  [1y(Venezky,
[48{


[6{                 [5y      [1y1966).  [5y         [1yThe [5y     [1ygrapheme-phoneme [5y    [1yrules [5y     [1yare [5y     [1yof [5y    [1ylimited [5y     [1yuse, [5y     [1yhowever, [5y     [1ysince
[48{


[6{                 [5y      [1ythey do not provide information [5y [1yabout all possible phonemes that might [5y [1ybe
[48{


[6{                 [5y      [1ygenerated; [5y  [1yor [5y  [1ywhich [5y  [1yalternative [5y  [1ygraphemes [5y  [1ycould [5y  [1ybe [5y  [1yused [5y  [1yin [5y  [1yplace [5y  [1yof [5y   [1ythe
[48{


[6{                 [5y      [1ygiven one, in order to produce the same phoneme.

[48{


[6{                   [5y  [1yWork [5y           [1yon [5y           [1ycomputer [5y           [1ytext-to-speech [5y           [1yproduction [5y           [1ysystems [5y           [1yis [5y           [1yalso [5y           [1yof
[48{


[6{                 [5y      [1yrelevance (Ellovitz [5y [1yet al, [5y [1y1976), (Ciarcia, [5y [1y1982), (Allen, [5y [1y1981), but [5y [1yhas [5y [1ysimilar
[48{


[6{                 [5y      [1ylimitations. [5y   [1yThe [5y   [1yfocus [5y   [1yis [5y   [1yon [5y    [1yspecifying [5y   [1ygrapheme-phoneme [5y   [1yrules [5y   [1yin [5y    [1ycertain
[48{


[6{                 [5y      [1ygraphemic contexts, and most difficulties are encountered in these [5y [1ysystems
[48{


[6{                 [5y      [1ywith pronunciations of irregularly spelt words.[1y[6{[2;4x
                                              [5y   [1y150
[48{


[6{                   [5y  [1yResearch [5y        [1yon [5y        [1yphoneme-grapheme [5y        [1ycorrespondence [5y        [1yis [5y        [1yof [5y        [1ymore [5y        [1yrelevance
[48{


[6{                 [5y      [1yhere, [5y [1yin [5y [1yparticular [5y [1ythe [5y [1ystudies [5y [1yby [5y [1yHanna [5y [1yet [5y [1yal [5y [1y(Hanna [5y [1yet [5y [1yal, [5y [1y1966), [5y [1yand [5y  [1yby
[48{


[6{                 [5y      [1ySimon [5y  [1yand [5y  [1ySimon [5y  [1y(Simon [5y [1yand [5y  [1ySimon, [5y  [1y1973).  [5y    [1yThese [5y  [1ystudies [5y  [1yare [5y  [1ydiscussed [5y  [1yin
[48{


[6{                 [5y      [1yChapter [5y    [1y2.  [5y          [1yInformation [5y     [1yabout [5y     [1ythe [5y     [1ycorrect [5y     [1ygraphemes [5y     [1yfor [5y     [1yrepresenting
[48{


[6{                 [5y      [1yphonemes [5y [1yin [5y  [1yspecific [5y  [1ywords [5y  [1ywas [5y [1yobtained [5y  [1yin [5y  [1ythese [5y  [1ystudies.  [5y   [1yThe [5y  [1yphoneme-
[48{


[6{                 [5y      [1ygrapheme [5y     [1ycorrespondences [5y      [1ythat [5y     [1ywere [5y      [1ygenerated, [5y      [1yused [5y     [1yin [5y      [1yreverse, [5y      [1ywould
[48{


[6{                 [5y      [1yprovide [5y      [1ysome [5y       [1yof [5y       [1ythe [5y      [1yinformation [5y       [1yrequired [5y       [1yfor [5y      [1ythe [5y       [1yphoncode [5y       [1yprogram.
[48{


[6{                 [5y      [1yHowever, [5y          [1yas [5y          [1ywith [5y          [1yVenezky's [5y          [1ywork, [5y          [1yand [5y          [1ythe [5y          [1ytext-to-speech [5y           [1yresearch,
[48{


[6{                 [5y      [1ylegitimate [5y      [1ycorrespondences [5y       [1y(phoneme-grapheme [5y      [1yand [5y       [1ygrapheme-phoneme) [5y       [1yin
[48{


[6{                 [5y      [1yspecific [5y    [1ycontexts [5y     [1ywere [5y     [1ybeing [5y    [1ystudied: [5y     [1ythe [5y     [1yaim [5y    [1ywas [5y     [1yto [5y     [1yproduce [5y     [1ycorrect
[48{


[6{                 [5y      [1ypronunciation [5y   [1yor [5y    [1yspelling, [5y    [1yusing [5y   [1ycontext-specific [5y    [1yrules. [5y    [1yAs [5y   [1ythe [5y    [1yconcern [5y    [1yin
[48{


[6{                 [5y      [1ythis [5y   [1ythesis [5y   [1yis [5y   [1ymisspellings, [5y   [1ythe [5y   [1ycorrespondence [5y   [1yrules [5y   [1yto [5y   [1ybe [5y   [1yused [5y   [1ymust [5y   [1ybe
[48{


[6{                 [5y      [1ylargely [5y     [1ycontext-free. [5y      [1yA [5y      [1ymisspelling [5y      [1ymight [5y      [1ywell [5y      [1ybe [5y      [1ya [5y      [1y'correct' [5y      [1yphoneme-
[48{


[6{                 [5y      [1ygrapheme [5y [1ycorrespondence [5y [1yused [5y  [1yin [5y [1yan [5y  [1y'incorrect' [5y [1ycontext. [5y  [1yTherefore, [5y  [1yinfor-
[48{


[6{                 [5y      [1ymation from these studies is useful, but not sufficient.


[48{


[6{                 [5y      [1y7.3.3. Design of the phoncode program

[48{


[6{                   [5y  [1yThe [5y     [1yphoncode [5y     [1yprogram [5y     [1ytakes [5y     [1yan [5y     [1yinput [5y     [1yword [5y     [1y(inpw) [5y     [1yand [5y      [1yselects [5y     [1ythose
[48{


[6{                 [5y      [1ywords [5y  [1yfrom [5y  [1ythe [5y  [1ydictionary [5y  [1ythat [5y   [1ycan [5y  [1ybe [5y  [1yconsidered [5y  [1yphonemically [5y   [1yequivalent
[48{


[6{                 [5y      [1yto [5y  [1yit. [5y  [1yThe [5y  [1ydictionary [5y [1ywords [5y  [1ymatched [5y  [1yare [5y  [1yoffered [5y  [1yto [5y  [1ythe [5y  [1yuser [5y  [1yas [5y  [1ypossible
[48{


[6{                 [5y      [1ycorrections for the inpw. See figure 7-11 for some examples.


                        [5y  [1y[2;2x:[7;4xwear
[5y[1y[2;2xIs it one of these?
wear
where
were

                             :[7;4xturtul
[5y[1y[2;2xIs it one of these?
turtle

                             :[7;4xthiar
[5y[1y[2;2xIs it one of these?
their
there

                             :[7;4xsomb
[5y[1y[2;2xIs it one of these?
some
sum

[5y[1y[2;4xFigure 7-11:   Examples of use of the phoncode program[1y[6{[2;4x
                                              [5y   [1y151
[48{


[6{                   [5y  [1yThe [5y    [1yphoncode [5y    [1yprogram [5y     [1yworks [5y    [1yby [5y     [1ysegmenting [5y    [1ythe [5y     [1yinpw [5y    [1yinto [5y     [1ygraphemes;
[48{


[6{                 [5y      [1yfinding [5y  [1yphonemes [5y   [1ythat [5y  [1ythese [5y   [1ygraphemes [5y  [1ymight [5y   [1yrepresent [5y  [1y(in [5y   [1yany [5y   [1ycontext);
[48{


[6{                 [5y      [1yusing a set [5y [1yof these [5y [1yphonemes to [5y [1ysearch for [5y [1ylegitimate words [5y [1yrepresented
[48{


[6{                 [5y      [1yby matching phonemes. Decisions were [5y [1ymade concerning selection of the [5y [1yset
[48{


[6{                 [5y      [1yof [5y    [1ygraphemes [5y    [1y(into [5y    [1ywhich [5y    [1ywords [5y    [1ywere [5y    [1ysegmented), [5y    [1ythe [5y    [1yset [5y    [1yof [5y     [1yphonemes
[48{


[6{                 [5y      [1y(used [5y [1yto [5y [1yrepresent [5y  [1yall [5y [1ywords), [5y  [1yand [5y [1ythe [5y [1ygrapheme-phoneme [5y  [1ycorrespondences.
[48{


[6{                 [5y      [1yInformation from four sources was used in making these decisions:

                   [5y          [1y- errors made by children in both studies;

                   [5y          [1y- related work by Hanna et al (Hanna et al, 1966);

                   [5y          [1y- related work by Simon and Simon (Simon and Simon, 1973);

                   [5y          [1y- additional examples generated by the author.


[48{


[6{                 [5y      [1y7.3.4. Defining the set of phonemes

[48{


[6{                   [5y  [1yIn [5y  [1ythe [5y   [1yHanna [5y   [1ystudy [5y  [1ywords [5y   [1ywere [5y   [1yphonemically [5y  [1ycoded [5y   [1yusing [5y   [1ya [5y   [1y62-phoneme
[48{


[6{                 [5y      [1yclassification [5y      [1yscheme, [5y      [1ybased [5y       [1yon [5y      [1ythe [5y       [1yMerriam-Webster [5y      [1ydictionary [5y       [1ypronun-
[48{


[6{                 [5y      [1yciation code (Hanna [5y [1yet al, 1966).  [5y [1yThis scheme [5y [1yused 32 [5y [1yvowel phonemes [5y [1yand
[48{


[6{                 [5y      [1y30 [5y        [1yconsonant [5y         [1yphonemes.   [5y     [1yLater [5y         [1ythey [5y        [1yreduced [5y         [1ythe [5y        [1ynumber [5y         [1yof [5y         [1yvowel
[48{


[6{                 [5y      [1yphonemes [5y  [1yin [5y  [1ythe [5y  [1yclassification [5y  [1yscheme, [5y  [1ycombining [5y  [1ythe [5y  [1yweakest [5y  [1yvowel [5y   [1yforms
[48{
[6{                            [5y    [1y[4;3x2[48{


[6{[5y[1y[2;4xto [5y   [1ythe [5y   [1yschwa[5y        [1y, [5y   [1yand [5y   [1ycombining [5y    [1yseveral [5y   [1yother [5y   [1ycategories [5y   [1ywhere [5y    [1ydistinctions
[48{


[6{                 [5y      [1ybetween [5y   [1yphonemes [5y    [1ywere [5y    [1ynot [5y   [1yclear, [5y    [1ye.g. [5y    [1yreducing [5y   [1ythe [5y    [1ytwo [5y    [1ycategories [5y    [1y/A/
[48{


[6{                 [5y      [1yand [5y [1y/A1/ [5y  [1y(ale [5y [1yand [5y  [1ychaotic) [5y [1yto [5y [1ya [5y  [1ysingle [5y [1ycategory, [5y  [1y/A/. [5y [1yThe [5y  [1ytotal [5y [1ynumber [5y  [1yof
[48{


[6{                 [5y      [1yvowel phoneme categories [5y [1ywas reduced to [5y [1y22. Ellovitz et [5y [1yal. (Ellovitz et [5y [1yal,
[48{


[6{                 [5y      [1y1976) [5y      [1yadopted [5y      [1ya [5y       [1yscheme [5y      [1yof [5y       [1y41 [5y      [1yphonemes, [5y      [1y16 [5y       [1yvowel [5y      [1yphonemes [5y      [1yand [5y       [1y25
[48{


[6{                 [5y      [1yconsonant [5y  [1yphonemes, [5y  [1yin [5y  [1ytheir [5y  [1ytext-to-speech [5y   [1yprogram. [5y  [1yThe [5y  [1yphonemes [5y   [1ywere
[48{
[6{[5y[1y[4;3x3[48{


[6{                          [5y  [1y[2;4xused [5y    [1yin [5y     [1yconverting [5y    [1yenglish [5y     [1ytext [5y    [1yto [5y     [1yIPA [5y    [1yrepresentation  [5y [1y, [5y     [1ywhich [5y    [1yis [5y     [1ythen
[48{


[6{                 [5y      [1ypassed to the Votrax synthesizer (Ellovitz et [5y [1yal, 1976). Morris-Wilson, in [5y [1yhis
[48{


[6{                 [5y      [1yphonemic transcription textbook, used a representation of 44 phonemes, [5y [1y24
[48{


[6{                 [5y      [1yconsonantal and 20 [5y [1yvowel phonemes, [5y [1ytaken from [5y [1y'Gimson's Set' [5y [1y(see [5y [1y(Morris-
[48{


[6{                 [5y      [1yWilson, 1984) for details and references).


[48{


[6{                 [5y      [1y[4m               [0m

[48{


[6{[5y[1y[4;3x2[48{


[6{the vowel sound occurring in unstressed syllables e.g. about, vowel, mother

[48{


[6{                            [5y  [1y3[48{


[6{International Phonetic Alphabet[1y[6{[2;4x
                                              [5y   [1y152
[48{


[6{                   [5y  [1yThe [5y     [1yset [5y     [1yused [5y      [1yin [5y     [1ythis [5y      [1ystudy [5y     [1ycomprised [5y      [1y46 [5y     [1yphonemes [5y      [1yin [5y     [1yall, [5y     [1y20 [5y      [1yvowel
[48{


[6{                 [5y      [1yphonemes [5y   [1yand [5y   [1y26 [5y    [1yconsonantal [5y   [1yphonemes. [5y    [1yFigures [5y   [1y7-12 [5y    [1yand [5y   [1y7-13 [5y    [1yshow [5y    [1ythe
[48{
[6{[5y[1y[4;3x4[48{


[6{                          [5y  [1y[2;4xphonemes used, with examples[5y        [1y.


[5y[1y[2;2xMorris-   IPA   Hanna   Notation here
                      Examples         Wilson         et al   (text)  (code)
                     late, day           eI     eI     A/A1    eI      10
                     air, care           e              A2     eE      12
                     bat, add                        A3/A4/A6  ae      13
                     car, aunt            :      a      A5     a:      15
                     about, silent                   A7/E4/I4   E      57
                                                     O4/U4
                     beat, keep          i:      i     E/E1     i      50
                     here, ear           I      I       E2     IE      52
                     end, let             e             E3      e      53
                     maker, urn           :           E5/U2    e:      55
                     ice, high           aI     aI      I      aI      90
                     ill, bit             I      I      I3      I      93
                     boat, know           U     o      O/O1    EU     150
                     port, saw            :             O2     o:     152
                     pot, soft                        O3/O5     O     153
                     food, rude          u:      u      O6      u     156
                     foot, book           U             O7      U     157
                     cube, unite          -     ju     U/U1    ju     200
                     up, son              ^      ^      U3      ^     203
                     oil, boy             I      I      OI     oI     158
                     out, cow            aU     a       OU     aU     159
                     honest               -      -      H9     -      -
                     late                 -      -      E9     -      -

                                 [5y       [1y[2;4xFigure 7-12:   Representation of vowel phonemes


                   [5y  [1yThe [5y   [1y20 [5y   [1yvowel [5y    [1yphonemes [5y   [1ywere [5y   [1yequivalent [5y    [1yto [5y   [1y20 [5y   [1yof [5y    [1ythe [5y   [1yvowel [5y    [1yphonemes
[48{


[6{                 [5y      [1yused [5y    [1yby [5y     [1yHanna, [5y    [1ycombining [5y     [1ythe [5y    [1y/E5/ [5y     [1yand [5y    [1y/U2/ [5y     [1ycategories [5y     [1yto [5y    [1ymatch [5y     [1ycom-
[48{


[6{                 [5y      [1ypletely. [5y [1yOf [5y [1ythe [5y  [1yvowel [5y [1yphonemes, [5y [1y19 [5y  [1yof [5y [1ythe [5y  [1y20 [5y [1yused [5y  [1yby [5y [1yMorris-Wilson [5y  [1ywere
[48{


[6{                 [5y      [1yused [5y        [1yhere. [5y         [1yThe [5y         [1y/U2/ [5y         [1ycategory [5y        [1ywas [5y         [1yomitted [5y         [1y(combined [5y        [1ywith [5y         [1ythe [5y         [1y/o:/
[48{


[6{                 [5y      [1ycategory), and [5y [1ya [5y [1yseparate [5y [1yvowel phoneme [5y [1y/ju/ [5y [1ywas [5y [1yadded: [5y [1yMorris-Wilson [5y [1yhas
[48{


[6{                 [5y      [1ya [5y       [1yconsonant [5y        [1ycategory [5y        [1y/j/, [5y       [1ybut [5y        [1yno [5y       [1yindependent [5y        [1yvowel [5y       [1ycategory.   [5y    [1yTwo
[48{


[6{                 [5y      [1yconsonantal [5y  [1ycategories [5y   [1ywere [5y  [1yadded [5y   [1yto [5y  [1ythe [5y   [1yMorris-Wilson [5y   [1yset [5y  [1yto [5y   [1ymake [5y   [1ythe
[48{


[6{                 [5y      [1yset [5y [1yhere: [5y  [1y/ks/ [5y  [1yand [5y [1y/kw/ [5y  [1yare [5y  [1yadded, [5y [1yas [5y  [1ythey [5y [1ywere [5y  [1yconsidered [5y [1yto [5y  [1ybe [5y  [1ysingle
[48{


[6{                 [5y      [1yphonemes [5y   [1yin [5y    [1ycertain [5y   [1ycontexts.  [5y       [1yThis [5y    [1yset [5y   [1yis [5y    [1yequivalent [5y    [1yto [5y   [1ythe [5y    [1yHanna [5y    [1yset
[48{


[6{                 [5y      [1ywith [5y   [1ycategory [5y    [1ypairs [5y   [1y/L/ [5y    [1yand [5y   [1y/L1/, [5y   [1y/M/ [5y    [1yand [5y   [1y/M1/, [5y    [1y/N/ [5y   [1yand [5y    [1y/N1/, [5y   [1y/W/ [5y    [1yand


[48{


[6{                 [5y      [1y[4m               [0m

[48{


[6{[5y[1y[4;3x4[48{


[6{The [5y     [1ycode [5y     [1ycolumn [5y     [1yindicates [5y     [1ythe [5y    [1yinteger [5y     [1ycode [5y     [1yused [5y     [1yin [5y     [1ythe [5y     [1yactual [5y     [1yprogram: [5y     [1ythe [5y     [1ytext
                          [5y  [1ynotation will generally be used in this thesis for ease of reading.[1y[6{[2;4x
                                              [5y   [1y153
[48{


[6{                  [5y    [1y[2;2xExamples        Morris-   IPA   Hanna   Notation here
                                     Wilson         et al   (text)  (code)
                     bad, rub             b      b      B      b      20
                     bad, day             d      d      D      d      40
                     fat, rough           f      f      F      f      60
                     go, big              g      g      G      g      70
                     hit, behind          h      h      H      h      80
                     gin, joke           dz     dz      J     dz     100
                     keep, cock           k      k      K      k     110
                     loud, kill           l      l     L,L1    l     120
                     mad, jam             m      m     M,M1    m     130
                     man, no              n      n     N,N1    n     140
                     pit, top             p      p      P      p     160
                     run, bread           r      r      R      r     170
                     sit, loss            s      s      S      s     180
                     trap, step           t      t      T      t     190
                     very, love           v      v      V      v     210
                     wash, when           w      w     W,HW    w     220
                     yellow, yet          j      j      Y      y     230
                     zoo, beds            z      z      Z      z     240
                     chair, lunch        t      t      CH     ch      31
                     ethics, accent       -      -     KS     ks     111
                     quick, aqua          -     kw     KW     kw     112
                     sing, along                       NG     ng     142
                     sugar, bush                       SH     sh     181
                     theatre, thank                    T1     th     191
                     that, with                        T2     tv     192
                     garage,pleasure                   ZH     zh     241
                     honest               -      -     H9     -     -


                               [5y       [1y[2;4xFigure 7-13:   Representation of consonant phonemes


                 [5y      [1y/HW/ [5y [1yeach [5y [1ybeing [5y [1yconsidered [5y [1yas [5y  [1yone [5y [1ycategory. [5y [1yThe [5y  [1ybasis [5y [1yfor [5y [1ycombination [5y  [1yof
[48{


[6{                 [5y      [1yphoneme [5y [1ycategories, [5y  [1yconsidered [5y  [1ydistinct [5y  [1yby [5y [1yHanna [5y  [1yet [5y  [1yal, [5y  [1ywas [5y [1ythat [5y  [1yin [5y  [1ymany
[48{


[6{                 [5y      [1ycontexts [5y      [1ythe [5y       [1ypronunciations [5y       [1ywould [5y      [1ybe [5y       [1yconsidered [5y       [1yindistinguishable [5y       [1yto [5y       [1ya
[48{


[6{                 [5y      [1ynon-linguist, [5y     [1yboth [5y     [1ywhen [5y      [1ypronounced [5y     [1yby [5y     [1ythe [5y      [1yauthor, [5y     [1yor [5y     [1yby [5y     [1ythe [5y      [1ychildren
[48{


[6{                 [5y      [1yfrom the reading unit.


[48{


[6{                 [5y      [1y7.3.5. Phoneme-grapheme correspondences

[48{


[6{                   [5y  [1yWhen [5y   [1yconsidering [5y    [1ya [5y    [1yword [5y   [1yand [5y    [1yits [5y    [1yphonemic [5y   [1yrepresentation, [5y    [1yhow [5y    [1ydo [5y    [1ywe
[48{
[6{[5y[1y[4;3x5[48{


[6{                          [5y  [1y[2;4xdecide [5y [1ywhich [5y  [1ycharacter [5y [1yor [5y  [1ycharacters [5y [1yrepresent [5y  [1yeach [5y [1yphoneme?  [5y           [1yIn [5y  [1ycases
[48{


[6{                 [5y      [1ysuch as the following the relationship is clear:


[48{


[6{                 [5y      [1y[4m               [0m

[48{


[6{[5y[1y[4;3x5[48{


[6{Note that the convention here will be grapheme = /phoneme/.[1y[6{[2;4x
                                              [5y   [1y154
[48{


[6{                        [5y  [1y[2;2xcat      = /k/ /ae/ /t/
dog      = /d/ /O/ /g/
biting   = /b/ /aI/ /t/ /I/ /ng/

                             c = /k/         d = /d/         b = /b/
                             a = /ae/        o = /O/         i = /aI/
                             t = /t/         g = /g/         t = /t/
                                                             i = /I/
                                                            ng = /ng/

                     [2;4xIn [5y [1ysome [5y [1yother [5y  [1ywords [5y [1yit [5y [1ymay [5y  [1ybe [5y [1ya [5y [1ylittle [5y  [1ymore [5y [1ydifficult [5y [1yto [5y  [1ydecide, [5y [1ybut [5y  [1yan
[48{


[6{                 [5y      [1yinterpretation can be given:

[5y[1y[2;2xabbey   = /ae/ /b/ /i/
nation  = /n/ /eI/ /sh/ /E/ /n/
                             science = /s/ /aI/ /E/ /n/ /s/

                             a  = /ae/       n  = /n/        sc = /s/
                             bb = /b/        a  = /eI/       i  = /aI/
                             ey = /i/        ti = /sh/       e  = /E/
                                             o  = /E/        n  = /n/
                                             n  = /n/        ce = /s/

                     [2;4xWith [5y [1ythe [5y [1yfollowing [5y [1yexamples, [5y [1yhowever, [5y [1yit [5y [1yis [5y [1ymuch [5y [1ymore [5y [1ydifficult [5y [1yto [5y [1ydecide
[48{


[6{                 [5y      [1ywhich graphemes correspond to each phoneme:

                        [5y  [1y[2;2xlamb = /l/ /ae/ /m/

l = /l/         l = /l/
a = /ae/        a = /ae/
m = /m/        mb = /m/
b = ?


receive =  /r/ /E/ /s/ /i/ /v/

                             r = /r/         r = /r/         r = /r/
                             e =  /E/        e =  /E/        e =  /E/
                             c =  /s/       ce = /s/        ce = /s/
                             e =  /i/        i =  /i/      i+e =  /i/
                             i =   ?        ve =  /v/        v =  /v/
                             v =  /v/
                             e =  ?


vague   =  /v/ /eI/ /g/

v =  /v/        v =  /v/        v =  /v/
                             a =  /eI/       a =  /eI/       a =  /eI/
                             g =  /g/       gu =  /g/      gue =  /g/
                            ue =  ?          e =  ?


[48{


[6{                       [2;4xIt is necessary to specify the full set of graphemes such that each [5y [1ymay[1y[6{[2;4x
                                              [5y   [1y155
[48{


[6{                 [5y      [1ybe [5y       [1yconsidered [5y        [1yto [5y        [1ycorrespond [5y        [1yto [5y       [1ya [5y        [1ysingle [5y        [1yphoneme [5y        [1y(or [5y       [1ya [5y        [1ynumber [5y        [1yof
[48{


[6{                 [5y      [1yalternative single phonemes). Hanna et al. (Hanna et [5y [1yal, 1966) and Simon [5y [1yand
[48{


[6{                 [5y      [1ySimon [5y      [1y(Simon [5y       [1yand [5y       [1ySimon, [5y       [1y1973) [5y      [1yeach [5y       [1ygive [5y       [1ya [5y      [1yset [5y       [1yof [5y       [1yphoneme-grapheme
[48{


[6{                 [5y      [1ycorrespondences, [5y        [1ythe [5y        [1ylatter's [5y        [1yset [5y        [1ybeing [5y        [1ya [5y        [1yslight [5y        [1ymodification [5y        [1yof [5y         [1ythe
[48{


[6{                 [5y      [1yformer's.  [5y  [1yHanna [5y  [1yet [5y [1yal [5y [1ylist [5y [1y107 [5y [1ydifferent [5y  [1ygraphemes, [5y [1yand [5y [1ySimon [5y [1yand [5y  [1ySimon
[48{


[6{                 [5y      [1ylist  [5y [1y104.  [5y  [1yYannakoudakis  [5y [1yand  [5y  [1yFawthrop  [5y [1y(Yannakoudakis  [5y  [1yand  [5y  [1yFawthrop,
[48{


[6{                 [5y      [1y1983b) divide words into vowel and consonant elements, using 267 elements.

[48{


[6{                   [5y  [1yA [5y    [1ynumber [5y    [1yof [5y    [1yspecific [5y    [1yproblems [5y    [1ywere [5y    [1yencountered [5y    [1ywhen [5y    [1yattempting [5y     [1yto
[48{


[6{                 [5y      [1ysegment [5y  [1ywords [5y  [1yinto [5y  [1ygraphemes, [5y  [1ysome [5y  [1yof [5y   [1ythe [5y  [1yproblems [5y  [1ybeing [5y  [1yillustrated [5y   [1yin
[48{


[6{                 [5y      [1ythe examples above.

[48{


[6{[5y[1yFor [5y    [1yexample, [5y    [1yconsider [5y     [1y'silent [5y    [1yletters', [5y    [1ythat [5y     [1yis, [5y    [1ysingle [5y    [1ycharacters [5y     [1ywhich
[48{


[6{                 [5y      [1yapparently do not represent a [5y [1yphoneme.  The [5y [1yfinal 'e' is [5y [1ya special case [5y [1yof
[48{


[6{                 [5y      [1ythis [5y      [1yin [5y       [1ywords [5y       [1ywhere [5y      [1yit [5y       [1yis [5y       [1yused [5y      [1yto [5y       [1ymodify [5y       [1ythe [5y      [1ypronunciation [5y       [1yof [5y       [1ythe
[48{


[6{                 [5y      [1ypreceding [5y    [1yvowel [5y     [1y(often [5y    [1yreferred [5y     [1yto [5y    [1yas [5y     [1ythe [5y    [1y'magic [5y     [1ye' [5y     [1yin [5y    [1yteaching).  [5y          [1yIt
[48{


[6{                 [5y      [1ymodifies the vowel, changing a soft vowel into a hard one:

                         [2;2xcan  =  /k/ /ae/ /n/    cane  =  /k/ /eI/ /n/
                              fin  =  /f/ /I/ /n/     fine  =  /f/ /aI/ /n/
                              cut  =  /k/ /^/ /t/     cute  =  /k/ /ju/ /t/

                     [2;4xThe [5y     [1y'e' [5y     [1ymay [5y     [1ybe [5y     [1ytreated [5y    [1yas [5y     [1ya [5y     [1yseparate [5y     [1ysilent [5y     [1ygrapheme, [5y     [1yor [5y     [1yit [5y     [1ymay [5y     [1ybe
[48{


[6{                 [5y      [1yconsidered [5y [1ypart [5y [1yof [5y  [1ythe [5y [1yprececeding [5y  [1yvowel [5y [1ygrapheme, [5y  [1yrepresented [5y [1yin [5y  [1y'cane'
[48{


[6{                 [5y      [1yas [5y     [1y'a_e'. [5y      [1yHanna [5y     [1yet [5y      [1yal [5y     [1y(Hanna [5y     [1yet [5y      [1yal, [5y     [1y1966) [5y      [1ydealt [5y     [1ywith [5y      [1ythis [5y     [1yproblem [5y      [1yby
[48{


[6{                 [5y      [1yinventing a separate /E9/ phoneme category to represent the grapheme [5y [1y'e'.
[48{


[6{                 [5y      [1yIf [5y [1yit [5y  [1yis [5y  [1yrepresented [5y  [1yin [5y  [1ythis [5y [1yway, [5y  [1yit [5y  [1yis [5y  [1yno [5y [1ylonger [5y  [1ylinked [5y  [1yto [5y  [1ythe [5y  [1ypreceding
[48{


[6{                 [5y      [1yvowel.  [5y           [1yHowever, [5y      [1yin [5y      [1ysome [5y      [1ycases, [5y      [1ywhere [5y      [1ythe [5y      [1y'e' [5y      [1yis [5y      [1ynot [5y      [1yfinal [5y      [1ybut [5y      [1ystill
[48{


[6{                 [5y      [1ymodifies the preceding vowel, the 'e' is sounded:

                         [2;2xcases  =  /k/ /eI/ /s/ /I/ /z/

                     [2;4xThe [5y   [1y'e' [5y   [1ycorresponds [5y    [1yto [5y   [1y/I/. [5y    [1yThe [5y   [1ygraphemic [5y   [1yconstruction [5y    [1yin [5y   [1ywhich [5y   [1ythe [5y    [1y'e'
[48{


[6{                 [5y      [1yoccurs [5y [1ywill [5y  [1ybe [5y [1ydescribed [5y  [1yas [5y [1ya [5y  [1y'vc+e' [5y [1ygrapheme [5y  [1y(vowel, [5y  [1yconsonant [5y [1y+ [5y  [1y'e'). [5y  [1yIn
[48{


[6{                 [5y      [1ysome [5y    [1ycases [5y    [1ythe [5y    [1yvowel [5y     [1yand [5y    [1y'e' [5y    [1ywill [5y    [1ybe [5y    [1ytaken [5y     [1yto [5y    [1ycorrespond [5y    [1yto [5y    [1ya [5y     [1ysingle
[48{


[6{                 [5y      [1yphoneme, [5y [1y'a_e' [5y  [1yin [5y  [1y'cane'; [5y  [1yin [5y [1yothers [5y  [1ythey [5y  [1yrepresent [5y  [1ytwo [5y  [1yphonemes [5y  [1yand [5y  [1yare
[48{


[6{                 [5y      [1ytreated as separate graphemes.

[48{


[6{                   [5y  [1yOther silent letters [5y [1ycause difficulties, [5y [1yfor example the [5y [1y'b' in 'lamb', [5y [1ythe
[48{


[6{                 [5y      [1y'k' [5y   [1yin [5y   [1y'know', [5y   [1y'g' [5y   [1yand [5y   [1y'h' [5y   [1yin [5y   [1y'high', [5y   [1y'u' [5y   [1yin [5y   [1y'guard'.  [5y      [1ySimilarly [5y   [1yin [5y   [1ycases [5y    [1yof
[48{


[6{                 [5y      [1ydouble [5y  [1yletters [5y   [1yonly [5y  [1yone [5y   [1yis [5y  [1ypronounced:  [5y     [1y'cotton', [5y   [1y'tell', [5y   [1y'pass'. [5y  [1yThe [5y   [1ysilent
[48{


[6{                 [5y      [1yletter [5y [1ymay [5y  [1ybe [5y [1ygiven [5y  [1yno [5y [1ycorresponding [5y  [1yphoneme, [5y [1yor [5y  [1ymay [5y  [1ybe [5y [1yassigned [5y  [1yto [5y  [1yan[1y[6{[2;4x
                                              [5y   [1y156
[48{


[6{                 [5y      [1yadjacent [5y  [1ygrapheme [5y  [1ywith [5y  [1ya [5y  [1ycorresponding [5y  [1yphoneme.  [5y    [1yIn [5y  [1ythe [5y   [1yformer [5y  [1ycase [5y  [1ya
[48{


[6{                 [5y      [1yletter [5y [1ythat [5y [1ymight [5y [1ybe [5y [1ysilent [5y [1yin [5y [1ysome [5y [1ycontexts [5y [1ycould [5y [1ybe [5y [1yplaced [5y [1yanywhere [5y [1yin
[48{


[6{                 [5y      [1ya [5y [1yword [5y [1yand [5y [1ynot [5y [1yaffect [5y [1yits [5y [1ypronunciation:  [5y  [1yif [5y  [1ya [5y [1yphoneme [5y [1y/b0/ [5y [1yrepresented
[48{


[6{                 [5y      [1ya silent 'b' then 'at' [5y [1ywould be a [5y [1ypossible misspelling of [5y [1y'bat', or 'brubn' [5y [1ya
[48{


[6{                 [5y      [1ymisspelling [5y  [1yof [5y   [1y'run'.  [5y     [1yIf [5y  [1ythe [5y  [1ysilent [5y   [1yletter [5y  [1yis [5y   [1ytreated [5y  [1yas [5y   [1ypart [5y  [1yof [5y   [1yanother
[48{


[6{                 [5y      [1ygrapheme, [5y    [1ythen [5y    [1ythe [5y    [1ycases [5y    [1yin [5y    [1ywhich [5y    [1yit [5y    [1ywould [5y    [1ybe [5y    [1yconsidered [5y    [1ya [5y     [1ylegitimate
[48{


[6{                 [5y      [1yphonetic [5y  [1ymisspelling [5y  [1yare [5y   [1yless [5y  [1yarbitrary.  [5y     [1yIf [5y  [1y'k' [5y  [1yis [5y   [1ysilent [5y  [1ywhen [5y  [1yfollowed [5y   [1yby
[48{


[6{                 [5y      [1y'n', [5y       [1yin [5y        [1ythe [5y        [1yinitial [5y        [1yposition [5y        [1yof [5y        [1ya [5y        [1yword, [5y        [1ythe [5y        [1ygrapheme [5y        [1y'kn' [5y        [1ycould [5y        [1ybe
[48{


[6{                 [5y      [1yconsidered [5y    [1yas [5y    [1ya [5y     [1ypossible [5y    [1ycorrespondence [5y     [1yto [5y    [1y/n/, [5y     [1yproducing [5y    [1ythe [5y     [1yfollowing
[48{


[6{                 [5y      [1y'phonetic equivalents':

[5y[1y[2;2xknot =  /n/ /O/ /t/     not =  /n/ /O/ /t/
                               kn =  /n/               n =  /n/
o =  /O/               o =  /O/
t =  /t/               t =  /t/

[48{


[6{                       [2;4xIn [5y     [1ydiscussing [5y      [1ythe [5y     [1ysilent [5y      [1yletter [5y     [1ygraphemes, [5y      [1yHanna [5y     [1yet [5y      [1yal [5y     [1y(Hanna [5y      [1yet [5y      [1yal,
[48{


[6{                 [5y      [1y1966) state that:

[48{


[6{[5y[1y"Considerable [5y   [1ydisagreement [5y   [1yoccurs [5y   [1yamong [5y   [1ylinguists [5y   [1yregarding [5y    [1yhow
                    [5y          [1ysuch graphemes should be classified."  p. 14

[48{


[6{                 [5y      [1yThey were all considered in this study to be part of a grapheme that [5y [1yhad
[48{


[6{                 [5y      [1ya corresponding phoneme: [5y [1yexamples of [5y [1ygraphemes incorporating these [5y [1y'silent
[48{


[6{                 [5y      [1ygraphemes' are

[5y[1y[2;2x'ce'  since      'gh'  ghost     'wh'  what
                        'wr'  write      'kn'  know      'bt'  debt

                     [2;4xA [5y    [1ycomplete [5y     [1ylist [5y     [1yof [5y     [1ythe [5y    [1ygrapheme-phoneme [5y     [1ycorrespondences [5y     [1yused [5y     [1yin [5y     [1ythis
[48{


[6{                 [5y      [1ythesis is given in appendix B.

[48{


[6{                   [5y  [1yThe [5y  [1yschwa [5y   [1y/E/ [5y   [1yalso [5y  [1ypresents [5y   [1yproblems, [5y   [1yparticularly [5y  [1yin [5y   [1ycases [5y  [1ywhere [5y   [1yit [5y   [1yis
[48{


[6{                 [5y      [1yfollowed by /n/:

[5y[1y[2;2xopening =  /EU/ /p/ /E/ /n/ /I/ /ng/

                     [2;4xThe [5y      [1y'en' [5y      [1yis [5y       [1yrepresented [5y      [1yby [5y       [1ytwo [5y      [1yphonemes, [5y       [1y/E/ [5y      [1yand [5y       [1y/n/.   [5y [1yHowever, [5y       [1ya
[48{


[6{                 [5y      [1ypossible [5y  [1ymisspelling [5y  [1yof [5y   [1y'opening', [5y  [1ywhere [5y   [1ythe [5y  [1y'e' [5y  [1yis [5y   [1yomitted, [5y  [1yis [5y  [1y'opning'. [5y   [1yTo
[48{


[6{                 [5y      [1ycater [5y         [1yfor [5y         [1ythis [5y         [1yand [5y         [1ysimilar [5y          [1ycases, [5y         [1y'en' [5y         [1ywas [5y          [1ytreated [5y         [1yas [5y         [1ya [5y          [1ygrapheme
[48{


[6{                 [5y      [1yrepresenting a single phoneme, as was 'on' and 'an'.

[48{


[6{                   [5y  [1yIn [5y [1ysome [5y [1ydialects [5y [1ythe [5y [1y'r' [5y [1yin [5y [1y'er' [5y [1yin [5y [1ynot [5y  [1ypronounced: [5y [1ythe [5y [1y'er' [5y [1ycorresponds
[48{


[6{                 [5y      [1yto a single phoneme, /e:/ or /E/.  In [5y [1yother dialects the 'r' is sounded [5y [1yand[1y[6{[2;4x
                                              [5y   [1y157
[48{


[6{                 [5y      [1ythe [5y  [1y'er' [5y   [1ycorresponds [5y   [1yto [5y   [1ytwo [5y   [1yphonemes, [5y   [1y/E/ [5y   [1yand [5y   [1y/r/.  [5y     [1yTo [5y   [1yallow [5y   [1yfor [5y   [1yboth
[48{


[6{                 [5y      [1ycases [5y     [1y'er' [5y     [1ywas [5y     [1ytaken [5y     [1yas [5y     [1ya [5y     [1ygrapheme [5y     [1yrepresenting [5y     [1ya [5y     [1ysingle [5y     [1yphoneme, [5y     [1yor
[48{


[6{                 [5y      [1ycould [5y [1ybe [5y  [1ysplit [5y  [1yto [5y  [1yrepresent [5y  [1ytwo [5y  [1yphonemes.  [5y   [1yOther [5y  [1ygraphemes [5y  [1yinvolving [5y  [1y'r'
[48{


[6{                 [5y      [1ywere treated in the same way:

[5y[1y[2;2xayor    oar     air     aer     are     ar
                             ear     re      er      ier     ir      our
                             oor     ore     or      ure     ur

                     [2;4xEach corresponds [5y [1yto [5y [1ya [5y [1ysingle vowel [5y [1yphoneme, [5y [1yor [5y [1yto [5y [1ya [5y [1ysingle [5y [1yvowel [5y [1yand [5y [1y/r/.
[48{


[6{                 [5y      [1ySome [5y [1yalso [5y  [1ycorrespond [5y  [1yto [5y [1ythe [5y  [1ysingle [5y [1yphoneme [5y  [1y/r/, [5y [1yor [5y  [1ymay [5y [1ybe [5y  [1ysplit [5y  [1yfurther
[48{


[6{                 [5y      [1yinto [5y  [1ymore [5y  [1ythan [5y  [1ytwo [5y  [1yphonemes, [5y   [1ye.g. [5y  [1y'ier' [5y  [1yin [5y  [1y'carrier'.  [5y     [1yA [5y  [1ylarge [5y  [1ynumber [5y   [1yof
[48{


[6{                 [5y      [1ythese correspondences were derived from the children's errors.

[48{


[6{                   [5y  [1yThe phoneme /sh/ is spelt in a variety of different ways:

                    [2;2x'ssi'   mission      'ss'    reassure     'ti'    nation
                        'si'    mansion      'ch'    machine      'sh'    show
                        'ci'    special

[2;4xAll these were represented as individual graphemes.

[48{


[6{                   [5y  [1yA [5y   [1ylarge [5y   [1ynumber [5y   [1yof [5y   [1ygraphemes [5y   [1ycorrespond [5y   [1yto [5y   [1ya [5y   [1ysingle [5y   [1yphoneme [5y   [1yin [5y   [1ysome
[48{


[6{                 [5y      [1ycases, [5y   [1ybut [5y   [1yto [5y   [1ymore [5y   [1ythan [5y   [1yone [5y   [1yphoneme [5y   [1yin [5y   [1yothers.  [5y      [1yBecause [5y   [1yof [5y   [1ythis [5y   [1ythey
[48{


[6{                 [5y      [1ymust be taken [5y [1yto correspond [5y [1yto single [5y [1yphonemes but also [5y [1yable to be [5y [1ysplit
[48{


[6{                 [5y      [1yinto [5y    [1ysmaller [5y    [1ygraphemes, [5y    [1ycorresponding [5y    [1yto [5y    [1yother [5y    [1yphonemes.  [5y        [1yFor [5y    [1yexample,
[48{


[6{                 [5y      [1ythe grapheme 'ough':

[5y[1y[2;2xcough  =  /k/ /O/ /f/
though =  /tv/ /EU/

                     [2;4xIn [5y [1y'cough' [5y  [1yit [5y  [1ycorresponds [5y  [1yto [5y [1ytwo [5y  [1yphonemes; [5y  [1yin [5y  [1y'though' [5y  [1yonly [5y [1ya [5y  [1ysingle [5y  [1yone.
[48{


[6{                 [5y      [1yDoubled [5y [1ycharacters, [5y [1yhowever, [5y [1yand [5y [1ya [5y [1ynumber [5y [1yof [5y [1yother [5y [1ygraphemes [5y [1yoccur [5y [1yonly
[48{


[6{                 [5y      [1yas single phonemes in the majority of cases:

                        [5y  [1y[2;2x'igh'    high =  /h/ /aI/
'll'     will =  /w/ /I/ /l/
'ch'     chip =  /ch/ /I/ /p/
                             'ph'    phone =  /f/ /EU/ /n/

                     [2;4xThese graphemes, [5y [1ycorresponding [5y [1yto one [5y [1ysingle phoneme, [5y [1ywill be [5y [1yreferred [5y [1yto
[48{


[6{                 [5y      [1yas 'tied' graphemes.  If [5y [1ya tied grapheme occurs in [5y [1ya word or a [5y [1ymisspelling
[48{


[6{                 [5y      [1ythe [5y [1ycorresponding [5y [1yphonemes [5y [1ywere [5y [1yfound, [5y  [1yand [5y [1ythe [5y [1ygrapheme [5y [1ywas [5y  [1ysegmented
[48{


[6{                 [5y      [1yno [5y   [1yfurther.  [5y        [1yGraphemes [5y    [1ythat [5y    [1yare [5y    [1ynot [5y    [1ytied [5y    [1ywere [5y    [1yfurther [5y    [1ysegmented [5y    [1y(or
[48{


[6{                 [5y      [1ysplit) [5y    [1yto [5y    [1yfind [5y     [1yconstituent [5y    [1ygraphemes [5y     [1yand [5y    [1ycorresponding [5y     [1yphonemes.  [5y         [1yTied
[48{


[6{                 [5y      [1ygraphemes are indicated by a "1" [5y [1ypreceding them in the [5y [1ygrapheme-phoneme[1y[6{[2;4x
                                              [5y   [1y158
[48{


[6{                 [5y      [1ycorrespondence [5y  [1ytable [5y  [1y(figure [5y  [1yB-1, [5y   [1yappendix [5y  [1yB), [5y  [1yand [5y  [1ysegmentable [5y   [1ygraphemes
[48{


[6{                 [5y      [1yby a 0. All 'vc+e' graphemes are segmentable, and are indicated by *.


[48{


[6{                 [5y      [1y7.3.6. Phonemic coding of the dictionary

[48{


[6{                   [5y  [1yThe [5y  [1yinpw [5y  [1ywas [5y   [1ysegmented [5y  [1yinto [5y   [1yall [5y  [1ypossible [5y   [1ygraphemes, [5y  [1yand [5y   [1yphoneme [5y   [1ycor-
[48{


[6{                 [5y      [1yrespondences [5y [1ywere [5y  [1yfound [5y  [1yfor [5y [1yeach [5y  [1ygrapheme.  [5y   [1yAll [5y  [1ywords [5y [1yin [5y  [1ythe [5y  [1ydictionary
[48{


[6{                 [5y      [1ywere [5y     [1ycoded [5y     [1yphonemically.  [5y          [1yThe [5y     [1yset [5y     [1yof [5y     [1yphonemes [5y     [1yrepresenting [5y     [1ythe [5y      [1yinpw
[48{


[6{                 [5y      [1ywere [5y   [1ycompared [5y   [1ywith [5y   [1ythose [5y   [1yrepresenting [5y   [1ythe [5y   [1ydictionary [5y   [1ywords: [5y   [1yif [5y   [1ymatches
[48{


[6{                 [5y      [1ywere found they were taken to be "possible phonemic equivalents".

[48{


[6{                   [5y  [1yEach [5y [1yword [5y [1yin [5y  [1ythe [5y [1ydictionary [5y  [1ywas [5y [1yhand [5y  [1ycoded [5y [1yby [5y  [1ythe [5y [1yauthor [5y  [1yin [5y  [1yconjunc-
[48{


[6{                 [5y      [1ytion [5y [1ywith [5y [1ya [5y [1ylinguist [5y [1yspecializing [5y [1yin [5y [1yspeech [5y [1ysynthesis.  [5y  [1yThe [5y [1ygeneral [5y [1yguidelines
[48{


[6{                 [5y      [1ysuggested [5y         [1yin [5y         [1ythe [5y          [1ytext [5y         [1y"English [5y          [1yPhonemic [5y         [1yTranscription" [5y          [1y(Morris-Wilson,
[48{


[6{                 [5y      [1y1984) [5y [1ywere [5y  [1yused [5y  [1yin [5y  [1ycoding.  [5y   [1y'Strong [5y  [1yforms' [5y [1ywere [5y  [1yused [5y  [1yin [5y [1ymost [5y  [1ycases [5y  [1y(see
[48{


[6{                 [5y      [1yp [5y   [1y76-82, [5y   [1y(Morris-Wilson, [5y    [1y1984)) [5y   [1ythough [5y    [1ythe [5y   [1y'weak [5y    [1yform' [5y   [1yalternatives [5y    [1ywere
[48{


[6{                 [5y      [1yalso used in a few cases.

[48{


[6{[5y[1yFor [5y       [1ya [5y       [1ynumber [5y        [1yof [5y       [1ythe [5y        [1ywords, [5y       [1ythe [5y        [1yambiguity [5y       [1yof [5y       [1ypossible [5y        [1yalternative
[48{


[6{                 [5y      [1ypronunciations [5y [1ymeant [5y  [1ythat [5y  [1ymore [5y [1ythan [5y  [1yone [5y  [1yphonemic [5y [1ycoding [5y  [1yof [5y  [1ya [5y  [1yword [5y  [1ywas
[48{


[6{                 [5y      [1yincluded [5y    [1yin [5y    [1ythe [5y    [1ycoded [5y    [1ydictionary.  [5y        [1yIn [5y    [1yparticular, [5y    [1y'er' [5y    [1yat [5y    [1ythe [5y    [1yend [5y    [1yof [5y    [1ya
[48{


[6{                 [5y      [1yword [5y   [1ywas [5y    [1ycoded [5y    [1yboth [5y    [1yas [5y    [1y/E/ [5y    [1yand [5y    [1yas [5y    [1y/E/ [5y    [1y/r/ [5y    [1yto [5y    [1yallow [5y    [1yfor [5y    [1yvariations [5y    [1yin
[48{


[6{                 [5y      [1ydialect.   'er' [5y      [1yoccurring [5y     [1yelsewhere [5y      [1yin [5y      [1ya [5y      [1yword [5y      [1ywas [5y      [1ycoded [5y      [1yas [5y      [1y/e:/ [5y      [1ywhen
[48{


[6{                 [5y      [1yrepresenting [5y      [1y'r-less' [5y      [1ydialects.   Other [5y      [1y'vowel [5y      [1y+ [5y      [1yr' [5y      [1ygraphemes [5y      [1ywere [5y       [1yalso
[48{


[6{                 [5y      [1ycoded with and without the 'r'.

[5y[1y[2;2xboard =  /b/ /o:/ /r/ /d/
& =  /b/ /o:/ /d/
car =  /k/ /a:/
& =  /k/ /a:/ /r/
error =  /e/ /r/ /E/ /r/
& =  /e/ /r/ /E/

[48{


[6{                       [2;4xThe 'd' [5y [1yin [5y [1y'procedure', [5y [1y'produce' [5y [1yand [5y [1y'soldier' may [5y [1ybe [5y [1ypronounced [5y [1y/d/ [5y [1yor
[48{


[6{                 [5y      [1y/dz/, so both are represented:

[5y[1y[2;2xproduce =  /p/ /r/ /O/ /d/ /ju/ /s/
&  =  /p/ /r/ /O/ /dz/ /u/ /s/

[48{


[6{                       [2;4xUnstressed [5y  [1yvowels [5y  [1ywere [5y   [1ycoded [5y  [1yas [5y  [1yschwa, [5y   [1y/E/.  [5y    [1yIn [5y   [1ysome [5y  [1ywords [5y  [1yboth [5y   [1ythe
[48{


[6{                 [5y      [1ystrong and the weak forms of vowels were coded:[1y[6{[2;4x
                                              [5y   [1y159
[48{


[6{                        [5y  [1y[2;2xaround =  /eI/ /r/ /aU/ /n/ /d/
                             around =  /E/ /r/ /aU/ /n/ /d/

                     [2;4xIn [5y [1ygeneral [5y  [1ywhen [5y  [1ythere [5y  [1ywas [5y  [1yuncertainty [5y  [1yabout [5y [1ythe [5y  [1yvowel [5y  [1yphoneme, [5y  [1ythe [5y  [1y/E/
[48{


[6{                 [5y      [1ywas used and matched to all single vowel graphemes.

[48{


[6{                   [5y  [1yIn some [5y [1ywords, the [5y [1yschwa [5y [1ywas omitted, [5y [1yand [5y [1ythe following [5y [1yconsonant [5y [1yonly
[48{


[6{                 [5y      [1ywas coded. The schwa is unpronounced in some dialects.

                        [5y  [1y[2;2xdifference =  /d/ /I/ /f/ /E/ /r/ /E/ /n/ /s/
                                     &  =  /d/ /I/ /f/ /r/ /E/ /n/ /s/
                             edinburgh  =  /e/ /d/ /I/ /n/ /b/ /r/ /E/
&  =  /e/ /d/ /I/ /n/ /b/ /E/ /r/ /E/
                               factory  =  /f/ /ae/ /k/ /t/ /r/ /I/
&  =  /f/ /ae/ /k/ /t/ /E/ /r/ /I/

[48{


[6{                       [2;4xThe [5y    [1ygraphemes [5y     [1y'el' [5y     [1y'le [5y    [1y' [5y     [1yand [5y     [1y'en' [5y    [1yalso [5y     [1ypresented [5y     [1ysome [5y    [1yproblems.  [5y          [1yIn
[48{


[6{                 [5y      [1ycases where they were clearly [5y [1ypronounced with a [5y [1yschwa the vowel [5y [1yphoneme
[48{


[6{                 [5y      [1ywas coded separately, e.g.

[5y[1y[2;2xkitchen =  /k/ /I/ /ch/ /E/ /n/
pixel =  /p/ /I/ /ks/ /E/ /l/

                     [2;4xIn [5y [1yother [5y [1ycases [5y  [1ythe [5y [1yrepresentation [5y [1ywas [5y  [1ynot [5y [1yclear [5y [1yand [5y  [1ythe [5y [1yword [5y [1ywas [5y  [1ycoded
[48{


[6{                 [5y      [1ywith and without the schwa:

[5y[1y[2;2xjewels =  /dz/ /ju/ /w/ /E/ /l/ /z/
& =  /dz/ /ju/ /w/ /l/ /z/
open =  /EU/ /p/ /n/
& =  /EU/ /p/ /E/ /n/
simple =  /s/ /I/ /m/ /p/ /l/
& =  /s/ /I/ /m/ /p/ /E/ /l/

                     [2;4xIn coding some other words the schwa was omitted:

                        [5y  [1y[2;2xpeople =  /p/ /i/ /p/ /l/
little =  /l/ /I/ /t/ /l/

[48{


[6{                       [2;4xThe graphemes 'lm' 'ld' and 'lk' also present coding difficulties:

                        [5y  [1y[2;2xcalmly =  /k/ /a:/ /m/ /l/ /I/
milk =  /m/ /I/ /l/ /k/
could =  /k/ /u/ /d/
shoulder =  /sh/ /EU/ /l/ /d/ /E/
&  =  /sh/ /EU/ /l/ /d/ /E/ /r/
&  =  /sh/ /EU/ /d/ /E/
&  =  /sh/ /EU/ /d/ /E/ /r/
talk =  /t/ /o:/ /k/
&  =  /t/ /o:/ /l/ /k/

                     [2;4xThe [5y   [1ycoding [5y   [1yhere [5y    [1yis [5y   [1ynot [5y   [1yconsistent. [5y    [1yThe [5y   [1ydifficulties [5y   [1ythat [5y    [1yit [5y   [1ypresents [5y    [1yare[1y[6{[2;4x
                                              [5y   [1y160
[48{


[6{                 [5y      [1ydiscussed [5y  [1yin [5y   [1ychapter [5y   [1y8.  [5y     [1yOther [5y   [1yambiguities [5y   [1yand [5y   [1yproblems [5y  [1ywith [5y   [1ythe [5y   [1ycoding
[48{


[6{                 [5y      [1yare also discussed in that chapter.


[48{


[6{                 [5y      [1y7.3.7. Detail of the phoncode program

[48{


[6{                   [5y  [1yThe [5y [1yphonetic [5y  [1ycoding [5y  [1yprogram [5y  [1ytakes [5y  [1ythe [5y  [1yinput [5y  [1yword, [5y  [1yinpw, [5y  [1yand [5y  [1ysegments
[48{


[6{                 [5y      [1yit [5y        [1yinto [5y        [1yall [5y        [1ycombinations [5y        [1yof [5y        [1ygraphemes.   [5y    [1yThe [5y        [1yphonemes [5y         [1ythat [5y        [1ycan [5y        [1ybe
[48{


[6{                 [5y      [1yrepresented [5y  [1yby [5y   [1yeach [5y   [1ygrapheme [5y   [1yare [5y  [1yfound [5y   [1yby [5y   [1ytable [5y   [1ylook-up. [5y   [1yAll [5y   [1ysequences
[48{


[6{                 [5y      [1yof [5y [1yphonemes [5y [1ythat [5y [1ymay [5y [1ybe [5y [1yconsidered [5y [1yto [5y [1yrepresent [5y [1ythe [5y [1yinpw [5y [1yare [5y [1ycompared
[48{


[6{                 [5y      [1ywith [5y  [1ythe [5y  [1ydictionary. [5y   [1yThe [5y  [1ydictionary [5y  [1yis [5y   [1yrepresented [5y  [1yas [5y  [1ya [5y   [1ytree, [5y  [1ywhere [5y   [1yeach
[48{


[6{                 [5y      [1ynode represents a phoneme, and also stores information about [5y [1yactual words
[48{


[6{                 [5y      [1y(see figure [5y [1y7-19).  [5y [1yIf [5y [1ya sequence [5y [1yof [5y [1yphonemes (representing [5y [1yinpw) [5y [1ymatches
[48{


[6{                 [5y      [1ya [5y [1ypath [5y [1yin [5y  [1ythe [5y [1ytree, [5y [1yand [5y  [1ythe [5y [1yfinal [5y [1ynode [5y  [1yin [5y [1ythe [5y [1ypath [5y  [1yalso [5y [1ycontains [5y [1ya [5y  [1yword
[48{


[6{                 [5y      [1y(stored [5y  [1yas [5y  [1ya [5y  [1ystring), [5y   [1ythen [5y  [1ythat [5y  [1yword [5y   [1yis [5y  [1yoffered [5y  [1yas [5y   [1ya [5y  [1yphonetic [5y  [1ymatch [5y   [1yto
[48{


[6{                 [5y      [1yinpw.


[48{


[6{[5y[1y7.3.8. Segmenting the word

[48{


[6{                   [5y  [1y. [5y   [1yEach [5y   [1ygrapheme [5y   [1yin [5y   [1ythe [5y   [1ygrapheme-phoneme [5y   [1ytable [5y   [1yis [5y   [1ycompared [5y   [1ywith [5y   [1ythe
[48{


[6{                 [5y      [1yinpw [5y     [1ystring. [5y     [1yIf [5y      [1ythere [5y     [1yis [5y     [1ya [5y      [1ymatch, [5y     [1ythe [5y     [1yphonemes [5y      [1ycorresponding [5y     [1yto [5y      [1ythe
[48{


[6{                 [5y      [1ygrapheme, [5y  [1yand [5y   [1ythe [5y  [1yposition [5y   [1yof [5y  [1ythe [5y   [1ygrapheme [5y  [1yin [5y   [1ythe [5y  [1yword, [5y   [1yare [5y  [1ynoted. [5y   [1yIf
[48{


[6{                 [5y      [1ythe [5y   [1ycharacter [5y    [1yis [5y    [1ymarked [5y   [1yas [5y    [1ya [5y    [1y'tied' [5y    [1ygrapheme [5y   [1ythe [5y    [1ycharacters [5y    [1yin [5y    [1yit [5y    [1yare
[48{


[6{                 [5y      [1ysegmented [5y [1yno [5y [1yfurther: [5y [1ythese [5y [1ycharacters [5y [1yin [5y [1ythe [5y [1yword [5y [1yare [5y  [1yno [5y [1ylonger [5y [1yacces-
[48{


[6{                 [5y      [1ysible. If the [5y [1ygrapheme [5y [1yis not [5y [1ytied it [5y [1ymay be [5y [1ysegmented further. [5y [1yThe [5y [1ynext
[48{


[6{                 [5y      [1ygrapheme [5y   [1yis [5y   [1ycompared [5y    [1ywith [5y   [1ythose [5y    [1yremaining [5y   [1yin [5y   [1ythe [5y    [1yinpw [5y   [1ystring [5y   [1ythat [5y    [1yare
[48{


[6{                 [5y      [1ystill accessible.  [5y  [1yAgain, [5y [1yif [5y [1ythe [5y [1ymatch [5y [1ysucceeds, [5y [1ycorresponding [5y [1yphonemes [5y [1yand
[48{


[6{                 [5y      [1yposition in the [5y [1ystring are [5y [1ynoted: tied phonemes [5y [1yare marked as [5y [1yinaccessible.
[48{


[6{                 [5y      [1yThe [5y      [1yprocess [5y       [1yis [5y       [1ycontinued [5y      [1yuntil [5y       [1yall [5y       [1ygraphemes [5y      [1yin [5y       [1ythe [5y       [1ytable [5y       [1yhave [5y       [1ybeen
[48{


[6{                 [5y      [1ycompared, or until there are no accessible characters left in the string.

[48{


[6{                   [5y  [1yFor [5y      [1yexample, [5y      [1yif [5y      [1ythe [5y      [1yinpw [5y      [1ywere [5y      [1y'caught', [5y      [1ythe [5y      [1ygrapheme [5y      [1y'augh' [5y      [1ywould
[48{


[6{                 [5y      [1ymatch [5y    [1yto [5y     [1ycharacters [5y     [1y2 [5y     [1yto [5y     [1y5 [5y     [1yin [5y     [1ythe [5y     [1yinpw [5y     [1ystring.  [5y          [1yThe [5y     [1yphonemes [5y     [1ycor-
[48{


[6{                 [5y      [1yresponding [5y [1yto [5y [1ythis [5y [1ygrapheme [5y [1yare [5y [1y/o:/ [5y [1yand [5y [1y/a:/. [5y [1yThe [5y  [1ygrapheme [5y [1y'augh' [5y [1yis [5y [1ynot
[48{


[6{                 [5y      [1ytied, [5y [1yand [5y [1ymay [5y  [1ybe [5y [1yfurther [5y  [1ysplit. [5y [1yThe [5y  [1ynext [5y [1ymatching [5y  [1ygrapheme [5y [1yin [5y  [1ythe [5y  [1ytable
[48{


[6{                 [5y      [1yis 'gh', with [5y [1yphonemes /f/ and [5y [1y/g/. This grapheme is [5y [1ymarked as tied, so [5y [1yno
[48{


[6{                 [5y      [1yfurther [5y   [1ysegmentation [5y    [1yof [5y    [1ythe [5y    [1ygrapheme [5y    [1y'gh' [5y    [1yis [5y    [1yrequired.  [5y        [1yThese [5y    [1ymatches
[48{


[6{                 [5y      [1ymay be represented in the following format:[1y[6{[2;4x
                                              [5y   [1y161
[48{


[6{                    [5y          [1y[2;2xgrapheme => alternative phonemes
augh => /o:/ /a:/
gh   => /f/ /g/

                     [2;4xThe remaining matches found are:

[5y[1y[2;2xau   =>  /EU/ /aU/ /o:/ /a:/ /o/
                             c    =>  /k/ /s/ /sh/
t    =>  /t/ /ch/ /sh/ /d/ /th/

[48{


[6{                       [2;4xThe [5y [1yset [5y  [1yof [5y [1yphonemes [5y [1yrepresenting [5y  [1ythe [5y [1yinpw [5y  [1ymay [5y [1yalso [5y  [1ybe [5y [1yrepresented [5y  [1yas
[48{


[6{                 [5y      [1ya finite state grammar, as in figure 7-14.


[5y[1y[2;2x/o/
/EU/                            /d/
                             /k/             /aU/            /f/             /t/
                     1       /s/     2       3       4       5       6       /ch/    end
                             /sh/            /o:/            /g/             /sh/
/a:/                            /th/
/o:/
/a:/

                          [5y        [1y[2;4xFigure 7-14:   Finite State Grammar representation of 'caught'


                   [5y  [1yIf [5y [1yn [5y  [1yis [5y  [1ythe [5y  [1ylength [5y [1yof [5y  [1ythe [5y  [1yinpw, [5y  [1ythere [5y  [1ywill [5y [1ybe [5y  [1y(n+1) [5y  [1ynodes, [5y  [1ythe [5y  [1y(n+1)th
[48{


[6{                 [5y      [1ybeing [5y   [1ythe [5y   [1yend [5y   [1ynode. [5y   [1yEach [5y   [1ynode [5y   [1yindicates [5y   [1ythe [5y   [1yposition [5y   [1yof [5y   [1ya [5y   [1ycharacter [5y   [1yin
[48{


[6{                 [5y      [1ythe inpw: [5y [1yarcs [5y [1yleaving [5y [1ythe [5y [1ynodes [5y [1yrepresent [5y [1yphonemes [5y [1ycorresponding [5y [1yto [5y [1ythe
[48{


[6{                 [5y      [1ygraphemes [5y   [1ycommencing [5y   [1ywith [5y   [1ythat [5y   [1ycharacter, [5y   [1yin [5y   [1ythat [5y   [1yposition. [5y   [1ySome [5y    [1ynodes
[48{


[6{                 [5y      [1yhave [5y [1yno [5y [1yarc [5y [1yconnected [5y [1yto [5y [1ythem: [5y [1ythese [5y [1yrepresent [5y [1ythe [5y [1ycharacters [5y  [1yoccurring
[48{


[6{                 [5y      [1yin [5y [1ytied [5y [1ygraphemes. [5y [1yIn [5y [1yfigure [5y [1y7-14 [5y [1ythe [5y [1ycharacter [5y [1y'h' [5y [1yin [5y [1ythe [5y [1ystring [5y [1y'caught'
[48{


[6{                 [5y      [1ycorresponds [5y [1yto [5y  [1ynode [5y [1y5. [5y  [1yThe [5y  [1ygrapheme [5y [1y'gh' [5y  [1yis [5y  [1ymarked [5y [1yas [5y  [1ytied, [5y  [1yrepresented
[48{


[6{                 [5y      [1yby [5y     [1yphonemes [5y     [1y/f/ [5y     [1yand [5y     [1y/g/. [5y     [1yThe [5y     [1yarcs [5y     [1yleaving [5y     [1ythe [5y      [1y'g' [5y     [1ynode, [5y     [1ynode [5y     [1y4, [5y     [1yare
[48{


[6{                 [5y      [1ylabelled /f/ and [5y [1y/g/. No [5y [1yarc goes [5y [1yto or [5y [1yfrom the [5y [1y'h' node, [5y [1ynode 5: [5y [1yit [5y [1yhas
[48{


[6{                 [5y      [1yno corresponding phoneme in this case.

[48{


[6{                   [5y  [1yThe [5y  [1yrepresentation [5y   [1yof [5y   [1ythe [5y   [1yphonemes [5y  [1ycorresponding [5y   [1yto [5y   [1ya [5y  [1yword [5y   [1ymay [5y   [1yalso
[48{


[6{                 [5y      [1ybe given in a slightly different form, as in figure 7-15.

[48{


[6{                   [5y  [1yIn this format, the nodes [5y [1yare numbered, and [5y [1ythe phonemes labelling [5y [1yarcs
[48{


[6{                 [5y      [1yfrom [5y    [1ythe [5y    [1ynode [5y    [1yare [5y   [1ygiven, [5y    [1yas [5y    [1ybefore. [5y    [1yThe [5y    [1yarcs [5y    [1yare [5y    [1yreplaced [5y    [1yby [5y    [1yexplicit
[48{


[6{                 [5y      [1yvalues [5y [1yof [5y [1ythe [5y  [1y'next [5y [1ynode', [5y [1yfrom [5y  [1yeach [5y [1ynode.  [5y   [1yIn [5y [1ythe [5y  [1yfinite [5y [1ystate [5y  [1ygrammar
[48{


[6{                 [5y      [1yrepresentation, [5y  [1ya [5y   [1ysequence [5y   [1yof [5y   [1yphonemes [5y   [1yrepresenting [5y   [1ythe [5y   [1ystring [5y   [1yis [5y   [1yfound
[48{


[6{                 [5y      [1yby traversing [5y [1ythe arcs [5y [1yin the [5y [1ydirection [5y [1yindicated from [5y [1ynode [5y [1y1 to [5y [1ythe [5y [1yend
[48{


[6{                 [5y      [1ynode, [5y    [1yselecting [5y    [1yany [5y    [1yone [5y    [1yarc [5y    [1yfrom [5y    [1yeach [5y    [1ynode, [5y    [1yand [5y    [1ymoving [5y    [1yto [5y    [1yeach [5y    [1ynode[1y[6{[2;4x
                                              [5y   [1y162
[48{


[6{                 [5y      [1y[2;2xinpw='caught'
node = 1
phon = /k/ , next = 2
phon = /s/ , next = 2
phon = /sh/, next = 2
                     node = 2
phon = /o:/, next = 6
phon = /a:/, next = 6
phon = /o/ , next = 4
phon = /EU/, next = 4
phon = /aU/, next = 4
phon = /o:/, next = 4
phon = /a:/, next = 4
                     node = 3
node = 4
phon = /f/ , next = 6
phon = /g/ , next = 6
                     node = 5
node = 6
phon = /d/ , next = end
phon = /t/ , next = end
phon = /ch/, next = end
phon = /sh/, next = end
phon = /th/, next = end
                     node = end

[5y        [1y[2;4xFigure 7-15:   Alternative representation of 'caught'


                 [5y      [1yconnected [5y [1yby [5y [1ythe [5y [1yarcs, [5y [1yin [5y [1yturn. [5y [1yThe [5y [1ylabels [5y [1yof [5y [1yeach [5y [1yarc [5y [1ytraversed [5y [1yare [5y  [1ythe
[48{


[6{                 [5y      [1yphonemes [5y      [1yrepresenting [5y      [1ythe [5y      [1ystring. [5y      [1yAll [5y       [1ypossible [5y      [1ysequences [5y      [1yare [5y      [1yfound [5y       [1yby
[48{


[6{                 [5y      [1yfollowing [5y [1yeach [5y [1yarc [5y [1yfrom [5y [1ya [5y [1ynode, [5y [1yin [5y [1yorder, [5y [1yand [5y [1ybacktracking [5y [1yuntil [5y [1yall [5y [1ypaths
[48{


[6{                 [5y      [1ybetween node [5y [1y1 [5y [1yand the [5y [1yend node [5y [1yhave been [5y [1ytraversed. In [5y [1ythe [5y [1yalternative
[48{


[6{                 [5y      [1yrepresentation, [5y  [1ya [5y   [1ysequence [5y  [1yof [5y   [1yphonemes [5y   [1yis [5y  [1yfound [5y   [1yby [5y   [1ystarting [5y  [1yat [5y   [1ynode [5y   [1y1,
[48{


[6{                 [5y      [1yselecting [5y   [1yany [5y   [1yphoneme [5y    [1yfrom [5y   [1ythe [5y    [1ylist [5y   [1yfor [5y    [1ythat [5y   [1ynode, [5y    [1yand [5y   [1ymoving [5y   [1yto [5y    [1ythe
[48{


[6{                 [5y      [1y'next node' as indicated. Further phonemes are [5y [1yselected, and moves to [5y [1ythe
[48{


[6{                 [5y      [1y'next node' made, until the end node is encountered. All possible sequences
[48{


[6{                 [5y      [1yare [5y    [1yfound [5y    [1yby [5y     [1yselection [5y    [1yof [5y     [1yeach [5y    [1yphoneme [5y     [1yfrom [5y    [1yeach [5y     [1ynode [5y    [1ylist [5y     [1yin [5y     [1yturn,
[48{


[6{                 [5y      [1ybacktracking to cover all possible combinations.

[48{


[6{                   [5y  [1yWe might consider listing all [5y [1ypossible sequences of phonemes [5y [1yrepresenting
[48{


[6{                 [5y      [1ythe [5y  [1yinpw: [5y   [1yhowever, [5y   [1yeven [5y   [1yfor [5y   [1ythis [5y   [1ysimple [5y   [1yexample, [5y   [1ythere [5y   [1yare [5y   [1y180 [5y   [1ypossible
[48{


[6{                 [5y      [1ysequences, [5y     [1yor [5y     [1ypaths. [5y     [1yThis [5y     [1yis [5y      [1ycalculated [5y     [1yas [5y     [1yfollows.  [5y          [1yIf [5y     [1ythe [5y     [1ynumber [5y      [1yof
[48{


[6{                 [5y      [1ypossible [5y [1ypaths [5y  [1ybetween [5y [1ynodes [5y  [1y1 [5y [1yand [5y  [1y2 [5y [1yis [5y  [1yrewritten [5y  [1yas [5y [1ypaths(1,2), [5y  [1yand [5y  [1ythe
[48{


[6{                 [5y      [1ypath [5y [1yfrom [5y [1ynode [5y [1y1 [5y [1yto [5y  [1yend [5y [1yvia [5y [1ynodes [5y [1y2,4, [5y  [1yand [5y [1y6 [5y [1yis [5y [1ywritten [5y [1yas [5y  [1y[1,2,4,6,end]
[48{


[6{                 [5y      [1y:[1y[6{[2;4x
                                              [5y   [1y163
[48{


[6{                        [5y  [1y[2;2xpaths(1,2)   = 3
paths(2,4)   = 5
paths(2,6)   = 2
paths(4,6)   = 2
paths(6,end) = 5

total paths(1,end) = (3 x 5 x 2 x 5)  [1,2,4,6,end]
+ (3 x 2 x 5)    [1,2,6,end]
= 150 + 30
= 180 possible paths

[48{


[6{                       [2;4xThe set of graphemes [5y [1yand corresponding phonemes, [5y [1yused in the [5y [1yphoncode
[48{


[6{                 [5y      [1yprogram is given in figure [5y [1yB-1 in appendix B.  [5y [1yA "1" preceding a [5y [1ygrapheme
[48{


[6{                 [5y      [1yindicates [5y      [1ythat [5y      [1yit [5y       [1yis [5y      [1ytied; [5y      [1ya [5y       [1y"0" [5y      [1yindicates [5y      [1ythat [5y       [1yit [5y      [1ymay [5y      [1ybe [5y       [1ysegmented
[48{


[6{                 [5y      [1yfurther; a [5y [1y"*" [5y [1yrepresents [5y [1ythe 'vc+e' [5y [1yconstruction.  [5y  [1ySo, [5y [1yin the [5y [1yword [5y [1y'cane'
[48{


[6{                 [5y      [1ythe [5y    [1y'a_e' [5y     [1yis [5y     [1yrepresented [5y    [1yin [5y     [1ythe [5y     [1ygrammar [5y    [1yby [5y     [1y'*a'.  [5y         [1ySimilarly, [5y     [1yin [5y     [1y'raise',
[48{


[6{                 [5y      [1y'ai_e' [5y   [1yis [5y   [1yrepresented [5y   [1yby [5y  [1y'*ai'.  [5y      [1yThe [5y   [1y* [5y   [1ymarked [5y   [1ygraphemes [5y   [1yare [5y   [1ymatched [5y   [1yif
[48{


[6{                 [5y      [1ythe [5y     [1yvowel [5y     [1yor [5y     [1yvowel [5y     [1ydigraph [5y     [1ymatches, [5y     [1yand [5y     [1ythe [5y     [1ynext [5y     [1ybut [5y     [1yone [5y      [1ycharacter
[48{


[6{                 [5y      [1yafter [5y   [1yit [5y   [1yis [5y   [1y'e'. [5y   [1yThere [5y   [1yare [5y   [1ytwo [5y   [1ysets [5y   [1yof [5y   [1yrepresentation [5y   [1yfor [5y   [1ythe [5y   [1y'vc [5y   [1y+ [5y   [1ye'
[48{


[6{                 [5y      [1ygrapheme. [5y  [1yIn [5y  [1ythe [5y  [1yfirst, [5y  [1ythe [5y  [1ysegmentation [5y  [1yis [5y  [1y'v' [5y  [1yand [5y   [1y'c+e': [5y  [1ythe [5y  [1y'e' [5y  [1yis [5y   [1ynot
[48{


[6{                 [5y      [1yrepresented [5y       [1yby [5y       [1yany [5y       [1yseparate [5y       [1yphoneme.   [5y  [1yIn [5y       [1ythe [5y       [1yfinite [5y       [1ystate [5y       [1ygrammar
[48{


[6{                 [5y      [1yrepresentation, [5y       [1ythe [5y        [1yarc [5y        [1yrepresenting [5y       [1ythe [5y        [1yconsonant [5y        [1ypreceding [5y        [1ythe [5y        [1y'e'
[48{


[6{                 [5y      [1ypasses [5y  [1ydirectly [5y [1yto [5y  [1ythe [5y  [1ynode [5y  [1ycorresponding [5y  [1yto [5y  [1ythe [5y  [1ycharacter [5y  [1yfollowing [5y  [1ythe
[48{


[6{                 [5y      [1y'e'. For example, the grapheme-phoneme correspondences for 'rime' are:

                        [5y  [1y[2;2xi_e => /i/ /aI/ /I/ /e/ /E/
m   => /m/
r   => /r/ /e:/ /E/

                     [2;4xIn [5y [1ythe [5y  [1ysecond [5y  [1yrepresentation [5y [1yof [5y  [1y'vc+e', [5y  [1ythe [5y  [1ystructure [5y [1yis [5y  [1ysplit [5y  [1y'v' [5y  [1yand [5y  [1y'c'
[48{


[6{                 [5y      [1yand [5y [1y'e', [5y  [1ythe [5y  [1yvowel [5y  [1yor [5y [1yvowel [5y  [1ydigraph, [5y  [1ythe [5y [1yconsonant, [5y  [1yand [5y  [1ythe [5y [1y'e' [5y  [1yall [5y  [1ybeing
[48{


[6{                 [5y      [1yrepresented independently:

[2;2xe => /i/ /IE/ /e/ /e:/ /E/ /I/ /eI/ /eE/ /ae/
                             i => /e:/ /E/ /aI/ /I/ /y/ /i/ /e/ /^/
                             m => /m/
r => /r/ /e:/ /E/

                     [2;4xThe corresponding finite state grammars for each are shown in figure 7-16
[48{


[6{                 [5y      [1yand figure 7-17.

[48{


[6{[5y[1yThese [5y   [1ytwo [5y    [1ysets [5y    [1yof [5y    [1yphoneme [5y    [1yrepresentation [5y   [1yfor [5y    [1y'rime' [5y    [1ycannot [5y    [1ybe [5y    [1ycon-
[48{


[6{                 [5y      [1ysidered [5y [1yin [5y [1yone [5y  [1yfinite [5y [1ystate [5y  [1ygrammar [5y [1yform: [5y  [1ythe [5y [1yarcs [5y  [1ybetween [5y [1ynodes [5y  [1y2 [5y  [1yand
[48{


[6{                 [5y      [1y3 [5y   [1yin [5y   [1ythe [5y   [1yfirst [5y   [1ycase [5y   [1y( [5y   [1ywith [5y   [1y4 [5y   [1ypassed [5y   [1yover) [5y   [1yare [5y   [1ynot [5y   [1yalternatives [5y   [1yfor [5y   [1ythe
[48{


[6{                 [5y      [1yarcs [5y   [1ybetween [5y   [1ynodes [5y   [1y2 [5y   [1yand [5y   [1y3 [5y   [1yin [5y   [1ythe [5y   [1ysecond [5y   [1ycase. [5y   [1yThere [5y   [1yis [5y   [1yno [5y   [1ylegitimate[1y[6{[2;4x
                                              [5y   [1y164
[48{


[6{[5y[1y[2;2x/i/
/r/             /aI/            /m/
                     1       /e:/    2       /I/     3       4       end
                             /E/             /e/
/E/

[5y[1y[2;4xFigure 7-16:   Finite state grammar representation of 'rime': v, c+e


[5y[1y[2;2x/e:/                            /i/
/E/                             /IE/
/aI/                            /e/
                             /r/             /I/                             /e:/
                     1       /e:/    2       /y/     3       /m/     4       /E/     end
                             /E/             /i/                             /I/
/e/                             /eI/
/^/                             /eE/
/ae/


                       [5y        [1y[2;4xFigure 7-17:   Finite state grammar representation of 'rime': v, c, e


                 [5y      [1ypath [5y [1yfollowing [5y [1ythe [5y [1yarcs [5y  [1ybetween [5y [1ynodes [5y [1y2 [5y [1yand [5y [1y3 [5y  [1yin [5y [1ythe [5y [1ysecond [5y [1ycase, [5y  [1yalong
[48{


[6{                 [5y      [1yarc labelled [5y [1y/aI/, [5y [1yand then [5y [1yfollowing [5y [1yarcs between [5y [1ynodes [5y [1y3 and [5y [1ythe [5y [1yend [5y [1yin
[48{


[6{                 [5y      [1ythe first case, along arc labelled /m/.

[48{


[6{                   [5y  [1yThe [5y  [1ytwo [5y   [1ysets [5y   [1yof [5y  [1yrepresentation [5y   [1yfor [5y  [1y'vc+e' [5y   [1ygraphemes [5y  [1ycan, [5y   [1yhowever, [5y   [1ybe
[48{


[6{                 [5y      [1ycombined [5y  [1yin [5y   [1ythe [5y   [1y'alternative [5y  [1yrepresentation' [5y   [1yformat.  [5y     [1yIn [5y   [1yfigure [5y   [1y7-18 [5y   [1ythe
[48{


[6{                 [5y      [1yfull [5y [1yrepresentation [5y  [1yof [5y  [1y'rime' [5y  [1yis [5y [1ygiven.  [5y    [1yTo [5y  [1yindicate [5y  [1ythe [5y [1yform [5y  [1yin [5y  [1ywhich [5y  [1y'e'
[48{


[6{                 [5y      [1yis [5y       [1ypassed [5y        [1yover, [5y        [1ythe [5y        [1y'next [5y       [1ynode' [5y        [1yof [5y        [1ythe [5y        [1yvowel [5y       [1yhas [5y        [1ya [5y        [1yvalue [5y        [1yof [5y        [1ythe
[48{


[6{                 [5y      [1ycorresponding [5y  [1y(following) [5y  [1yconsonant [5y   [1ynode, [5y  [1yplus [5y  [1y100. [5y   [1yIf [5y  [1ya [5y  [1yvowel [5y  [1yphoneme [5y   [1yis
[48{


[6{                 [5y      [1yselected, [5y     [1ywith [5y      [1ya [5y      [1ynextnode [5y      [1yvalue [5y      [1ygreater [5y      [1ythan [5y      [1y100, [5y      [1ythe [5y      [1ynode [5y      [1yfor [5y      [1ythe
[48{


[6{                 [5y      [1yconsonant [5y  [1yis [5y   [1ytaken [5y   [1y(i.e. [5y   [1ythe [5y  [1ynext [5y   [1ynode [5y   [1yless [5y   [1y100) [5y   [1yand [5y  [1ya [5y   [1yphoneme [5y   [1yvalue [5y   [1yis
[48{


[6{                 [5y      [1yobtained: the [5y [1yvalue [5y [1yof the [5y [1yconsonant [5y [1ynextnode [5y [1yis increased [5y [1yby [5y [1y1, [5y [1yand [5y [1ythis
[48{


[6{                 [5y      [1ynew value becomes the following node, i.e.  the 'e' node is passed over. In
[48{


[6{                 [5y      [1ythis example if at node [5y [1y2 the phoneme /^/ [5y [1ywere selected (next=103), [5y [1ythen
[48{


[6{                 [5y      [1yat [5y    [1ynode [5y    [1y3 [5y     [1ythe [5y    [1yphoneme [5y    [1y/m/, [5y    [1ynext=end, [5y    [1ywould [5y     [1ybe [5y    [1ychosen, [5y    [1yand [5y    [1yany [5y     [1yarcs
[48{


[6{                 [5y      [1yfrom node 4 would be skipped over.

[48{


[6{                   [5y  [1yFurther examples of 'parses' of input words are given in appendix B.[1y[6{[2;4x
                                              [5y   [1y165
[48{


[6{                 [5y      [1y[2;2xinpw = 'rime'
node = 1
phon = /r/      next = 2
phon = /e:/     next = 2
phon = /E/      next = 2
                     node = 2
phon = /i/      next = 3
phon = /aI/     next = 3
phon = /I/      next = 3
phon = /e/      next = 3
phon = /E/      next = 3
phon = /e:/     next = 3
phon = /^/      next = 3
phon = /y/      next = 3
phon = /E/      next = 103
phon = /aI/     next = 103
phon = /I/      next = 103
phon = /i/      next = 103
phon = /e/      next = 103
                     node = 3
phon = /m/      next = 4
phon = /m/      next = end
                     node = 4
phon = /i/      next = end
phon = /IE/     next = end
phon = /e/      next = end
phon = /e:/     next = end
phon = /E/      next = end
phon = /I/      next = end
phon = /eI/     next = end
phon = /eE/     next = end
phon = /ae/     next = end
                     node = end

[5y         [1y[2;4xFigure 7-18:   Representation of 'vc + e' graphemes


[48{


[6{                 [5y      [1y7.3.9. Representing the dictionary

[48{


[6{                   [5y  [1yGiven [5y    [1ya [5y    [1yfile [5y    [1yof [5y    [1ywords [5y    [1ycoded [5y     [1yphonemically, [5y    [1ya [5y    [1ydictionary [5y    [1yis [5y     [1yconstructed
[48{


[6{                 [5y      [1yrepresenting [5y      [1ythe [5y      [1yset [5y      [1yof [5y      [1ywords [5y       [1yas [5y      [1ya [5y      [1ytree [5y      [1ywhere [5y      [1yeach [5y      [1ynode [5y      [1ystores [5y       [1ya
[48{


[6{                 [5y      [1yphoneme value.  The phoneme [5y [1yrepresentation used is [5y [1ythe integer one, [5y [1ygiven
[48{


[6{                 [5y      [1yin [5y        [1yfigures [5y         [1y7-12 [5y        [1yand [5y         [1y7-13.   [5y     [1yExamples [5y        [1yof [5y         [1ywords [5y         [1yand [5y        [1ytheir [5y         [1yphonemic
[48{


[6{                 [5y      [1yrepresentation are:

[5y[1y[2;2xhe      /h/ /i/               80 50
                       help    /h/ /e/ /l/ /p/       80 53 120 160
                       helped  /h/ /e/ /l/ /p/ /d/   80 53 120 160 40
                       nine    /n/ /aI/ /n/          140 90 140
                       air     /eE/ /r/              12 170

                     [2;4xThese are represented in tree form in figure 7-19.[1y[6{[2;4x
                                              [5y   [1y166
[48{


[6{[5y[1y[2;2xstart of
tree

    > 12 . . /
         >"air"
> 170 / / .

                                      > 80 . . /
          >"he"
> 50 . / .

> 53 / . /

                          > 140 / . /          > 120 / . /
      >"help"
                              > 90 / . /             > 160 / . .
>"nine"                 >"helped"
                                 > 140 / / .              > 40 / / .

                       Key to nodes:  1 2 3 4
                       1 = integer representing phoneme
                       2 = pointer to alternative phoneme at same level
                       3 = pointer to next phoneme in word
                       4 = pointer to word

[5y[1y[2;4xFigure 7-19:   Tree representation of part of the
[5y[1yphoncode dictionary


                   [5y  [1yThe dictionary [5y [1ytree [5y [1yto [5y [1yrepresent these [5y [1yfive [5y [1ywords [5y [1ywould [5y [1ybe [5y [1ybuilt [5y [1yup [5y [1yas
[48{


[6{                 [5y      [1yfollows.  The [5y [1yfirst phoneme [5y [1yin each of [5y [1ythe words 'he, [5y [1y'help' and ' [5y [1yhelped'
[48{


[6{                 [5y      [1yis [5y    [1ythe [5y    [1ysame, [5y     [1y80, [5y    [1yand [5y     [1yso [5y    [1ywould [5y     [1yall [5y    [1ybe [5y     [1ystored [5y    [1yin [5y    [1ythe [5y     [1ysame [5y    [1ynode.  [5y          [1yThe
[48{


[6{                 [5y      [1ysecond [5y   [1yphoneme [5y   [1yis [5y    [1y50 [5y   [1yin [5y    [1y'he' [5y   [1yand [5y   [1y53 [5y    [1yin [5y   [1y'help' [5y   [1yand [5y    [1y'helped'.  [5y      [1yThe [5y    [1yright
[48{


[6{                 [5y      [1yoffspring of the [5y [1ynode storing [5y [1y80 will [5y [1ystore 50: [5y [1ythe left offspring [5y [1yof [5y [1ythis
[48{


[6{                 [5y      [1ynode [5y    [1y(50) [5y     [1ystores [5y    [1ythe [5y    [1y'alternative [5y     [1yphoneme', [5y    [1y53.  [5y         [1yFor [5y     [1yother [5y    [1ywords [5y     [1ywith
[48{


[6{                 [5y      [1yfirst phoneme [5y [1y80 [5y [1yand [5y [1yan [5y [1yalternative [5y [1ysecond [5y [1yphoneme, [5y [1ye.g. [5y [1y'hill' [5y [1y80 [5y [1y93 [5y [1y120,
[48{


[6{                 [5y      [1ythe [5y  [1ysecond [5y   [1yphoneme [5y   [1yis [5y  [1yadded [5y   [1yin [5y  [1ythe [5y   [1yleft [5y  [1yoffspring [5y   [1yof [5y  [1ythe [5y   [1ynode [5y   [1ystoring
[48{


[6{                 [5y      [1y53.  The word 'he' [5y [1yis represented by two [5y [1yphonemes, both now stored: [5y [1ythe
[48{


[6{                 [5y      [1ystring 'he' [5y [1yis [5y [1yalso [5y [1ystored in [5y [1ythe [5y [1ynode [5y [1ywith the [5y [1ylast [5y [1yphoneme in [5y [1ythe [5y [1yword,
[48{


[6{                 [5y      [1y50.  [5y [1yThe third [5y [1yphoneme [5y [1yin 'help', [5y [1y120, [5y [1yis stored [5y [1yin [5y [1ythe right [5y [1yoffspring [5y [1yof
[48{


[6{                 [5y      [1ythat [5y  [1ywith [5y  [1y53.  [5y    [1yThis [5y   [1yalso [5y  [1ymatches [5y  [1ythe [5y  [1ynext [5y  [1yphoneme [5y  [1yin [5y  [1y'helped' [5y  [1yand [5y   [1ydoes
[48{


[6{                 [5y      [1ynot [5y    [1yneed [5y    [1yto [5y     [1ybe [5y    [1yrepresented [5y    [1ytwice.  [5y         [1yThe [5y    [1yright [5y     [1yoffspring [5y    [1yof [5y    [1ythis [5y     [1ynode
[48{


[6{                 [5y      [1y(storing 120) stores the fourth [5y [1yphoneme, 160.  This is the last phoneme [5y [1yin
[48{


[6{                 [5y      [1y'help', so [5y [1ythe string [5y [1y'help' [5y [1yis also [5y [1ystored [5y [1yin this [5y [1ynode.  [5y [1yThe [5y [1yfinal [5y [1yphoneme
[48{


[6{                 [5y      [1yin [5y    [1y'helped' [5y    [1yis [5y     [1yadded [5y    [1yas [5y     [1ythe [5y    [1yright [5y     [1yoffspring, [5y    [1ystoring [5y     [1y40 [5y    [1yand [5y    [1ythe [5y     [1ystring
[48{


[6{                 [5y      [1y'helped'.

[48{


[6{[5y[1yThe [5y      [1yword [5y      [1y'nine' [5y      [1yhas [5y      [1yfirst [5y      [1yphoneme [5y      [1y140, [5y      [1yand [5y      [1yis [5y      [1ystored [5y      [1yas [5y      [1ythe [5y       [1yleft[1y[6{[2;4x
                                              [5y   [1y167
[48{


[6{                 [5y      [1yoffspring [5y     [1y(alternative [5y      [1yfirst [5y      [1yphoneme) [5y      [1yto [5y     [1ythe [5y      [1ynode [5y      [1ycontaining [5y     [1y80.   The
[48{


[6{                 [5y      [1yremaining [5y  [1yphonemes [5y   [1yin [5y   [1ythe [5y  [1yword [5y   [1y'nine' [5y   [1yare [5y  [1ystored [5y   [1yin [5y   [1ythe [5y   [1yright [5y   [1yoffspring
[48{


[6{                 [5y      [1yof this [5y [1ynode [5y [1y(storing [5y [1y140).  [5y [1yThe [5y [1ystring [5y [1y'nine' is [5y [1ystored [5y [1yalso with [5y [1ythe [5y [1yfinal
[48{


[6{                 [5y      [1yphoneme.

[48{


[6{The [5y   [1yword [5y   [1y'air' [5y   [1yis [5y   [1ycoded [5y   [1y12 [5y    [1y170.  [5y      [1yIt [5y   [1ydoes [5y   [1ynot [5y    [1ymatch [5y   [1y80 [5y   [1yor [5y   [1y140, [5y    [1ythe
[48{


[6{                 [5y      [1yalternative [5y     [1yinitial [5y     [1yphonemes.  [5y           [1yIt [5y      [1ymust [5y     [1ybe [5y      [1yadded [5y     [1yas [5y     [1yanother [5y      [1yalternative
[48{


[6{                 [5y      [1yinitial [5y    [1yphoneme, [5y    [1yas [5y     [1ya [5y    [1yleft [5y    [1yoffspring.  [5y         [1yHowever, [5y    [1ythe [5y     [1yleft [5y    [1yoffsprings [5y     [1yare
[48{


[6{                 [5y      [1yordered [5y [1yin [5y [1yincreasing [5y  [1yorder.  [5y  [1yThe [5y [1ynode [5y [1ystoring [5y  [1y12 [5y [1ybecomes [5y [1ythe [5y [1yroot [5y  [1ynode
[48{


[6{                 [5y      [1yand the parent of the node storing 80, this latter node becoming its [5y [1yleft
[48{


[6{                 [5y      [1yoffspring:  [5y [1ythe new [5y [1ynode is [5y [1yinserted in [5y [1ythe tree.  [5y [1yThe [5y [1ysecond phoneme [5y [1yis
[48{


[6{                 [5y      [1yadded as the [5y [1yright offspring [5y [1yof this [5y [1ynew node [5y [1yand the string [5y [1y'air' [5y [1ystored
[48{


[6{                 [5y      [1yalso.

[48{


[6{[5y[1yFurther [5y [1ywords [5y [1ymay [5y [1ybe [5y [1yadded. [5y [1yThe [5y [1yinitial [5y [1yphoneme [5y [1yis [5y [1ycompared [5y [1ywith [5y [1yeach
[48{


[6{                 [5y      [1yleft offspring node, starting [5y [1ywith the current [5y [1yroot node.  [5y [1yIf no match [5y [1yis
[48{


[6{                 [5y      [1yfound [5y [1ythe [5y [1yfirst [5y  [1yphoneme [5y [1yof [5y  [1ythe [5y [1yword [5y  [1yis [5y [1yinserted [5y  [1yin [5y [1ythe [5y [1ycorrect [5y  [1yposition
[48{


[6{                 [5y      [1yin [5y  [1ythe [5y  [1yordering; [5y  [1ythe [5y  [1yremaining [5y   [1yphonemes [5y  [1yin [5y  [1ythe [5y  [1yword [5y   [1yare [5y  [1yadded [5y  [1yas [5y   [1yright
[48{


[6{                 [5y      [1ydescendants.  [5y          [1yIf [5y     [1ya [5y     [1ymatch [5y      [1yis [5y     [1yfound [5y     [1ythe [5y     [1ynext [5y     [1yphoneme [5y     [1y(the [5y     [1ysecond) [5y      [1yis
[48{


[6{                 [5y      [1ycompared [5y [1yfirstly [5y  [1ywith [5y  [1ythe [5y  [1yright [5y  [1yoffspring [5y  [1yof [5y  [1ythe [5y  [1ymatched [5y  [1yphoneme [5y  [1ynode,
[48{


[6{                 [5y      [1yand [5y      [1ythen [5y     [1ywith [5y      [1yits [5y      [1yoffsprings, [5y      [1yand [5y      [1yleft [5y      [1ydescendants [5y      [1yof [5y      [1ythis [5y      [1yoffspring.
[48{


[6{                 [5y      [1yAgain, [5y     [1yif [5y      [1yno [5y      [1ymatch [5y     [1yis [5y      [1yfound, [5y      [1ya [5y     [1ynew [5y      [1ynode [5y      [1yis [5y     [1yinserted [5y      [1yin [5y      [1ythe [5y      [1ycorrect
[48{


[6{                 [5y      [1yposition, [5y      [1yand [5y      [1ythe [5y      [1yremaining [5y      [1yphonemes [5y      [1yadded; [5y      [1yotherwise, [5y      [1yif [5y      [1ya [5y       [1ymatch [5y      [1yis
[48{


[6{                 [5y      [1yfound, the [5y [1ynext [5y [1yphoneme is [5y [1ycompared [5y [1ywith firstly [5y [1ythe [5y [1yright [5y [1yoffspring [5y [1yand
[48{


[6{                 [5y      [1ythen [5y        [1ywith [5y        [1yits [5y         [1yleft [5y        [1ydescendants.   [5y     [1yThe [5y        [1yprocess [5y         [1yis [5y        [1yrepeated [5y        [1yuntil [5y         [1yall
[48{


[6{                 [5y      [1yphonemes [5y   [1yin [5y    [1ythe [5y    [1yword [5y    [1yare [5y    [1ymatched, [5y    [1yor [5y    [1yhave [5y    [1ybeen [5y    [1yadded/inserted.  [5y        [1yThe
[48{


[6{                 [5y      [1yword string [5y [1yis [5y [1ystored [5y [1yin [5y [1ythe [5y [1ysame [5y [1ynode [5y [1yas [5y [1ythe last [5y [1yphoneme [5y [1yin [5y [1ythe [5y [1yword.
[48{


[6{                 [5y      [1yIn [5y [1ythis [5y  [1yway [5y  [1ya [5y  [1yfile [5y [1yof [5y  [1yphonemically [5y  [1ycoded [5y  [1ywords [5y  [1ymay [5y [1ybe [5y  [1ystored [5y  [1yas [5y  [1ya [5y  [1ytree
[48{


[6{                 [5y      [1ystructured dictionary.


[48{


[6{[5y[1y7.3.10. Matching the word and dictionary

[48{


[6{                   [5y  [1yThe [5y  [1ycomparison [5y   [1ypart [5y   [1yof [5y  [1ythe [5y   [1yphoncode [5y  [1yprogram [5y   [1ytakes [5y  [1ythe [5y   [1ydictionary [5y   [1yof
[48{


[6{                 [5y      [1yphonemically [5y [1ycoded [5y  [1ywords, [5y  [1yrepresented [5y  [1yas [5y [1ya [5y  [1ytree, [5y  [1yand [5y  [1yan [5y  [1yinpw, [5y  [1yparsed [5y  [1yto
[48{


[6{                 [5y      [1yshow [5y       [1yall [5y        [1ysequences [5y       [1yof [5y        [1yphonemes [5y       [1ythat [5y        [1ycould [5y       [1yhave [5y        [1yproduced [5y        [1yit.   [5y   [1yThe
[48{


[6{                 [5y      [1yalternative [5y  [1yrepresentation [5y  [1yof [5y   [1ythe [5y  [1yparsed [5y   [1yinpw [5y  [1y(as [5y   [1yin [5y  [1yfigure [5y   [1y7-15) [5y  [1ywill [5y   [1ybe
[48{


[6{                 [5y      [1yused [5y  [1yhere [5y   [1yto [5y  [1ydescribe [5y   [1ythe [5y  [1ymatching [5y   [1yprocess:  [5y     [1yit [5y   [1ywill [5y  [1ybe [5y   [1yreferred [5y  [1yto [5y   [1yas
[48{


[6{                 [5y      [1ythe inpw network.  In the program the integer phonemic coding is used,[1y[6{[2;4x
                                              [5y   [1y168
[48{


[6{                   [5y  [1yStarting at the [5y [1yroot [5y [1yof the [5y [1ydictionary tree, [5y [1yand the [5y [1yfirst node [5y [1yof [5y [1ythe
[48{


[6{                 [5y      [1yinpw [5y  [1ynetwork, [5y  [1ythe [5y   [1yfirst [5y  [1yphoneme [5y  [1ylisted [5y  [1yat [5y  [1ythe [5y   [1yinpw [5y  [1ynode [5y  [1y1 [5y  [1yis [5y   [1ycompared
[48{


[6{                 [5y      [1ywith the [5y [1ydictionary [5y [1yroot [5y [1ynode phoneme.  [5y  [1yThe [5y [1yphonemes [5y [1ylisted [5y [1yat [5y [1ythe [5y [1yinpw
[48{


[6{                 [5y      [1ynodes are in [5y [1yincreasing order, [5y [1yas are the [5y [1yleft descendant dictionary [5y [1ynodes.
[48{


[6{                 [5y      [1yIf [5y     [1ythe [5y      [1ycompared [5y     [1yphonemes [5y      [1ymatch, [5y     [1ythen [5y      [1ythe [5y     [1ynext [5y      [1yinpw [5y     [1ynode [5y      [1yis [5y      [1yfound
[48{


[6{                 [5y      [1y(numbered [5y    [1yas [5y     [1y'next') [5y    [1yand [5y     [1ythe [5y    [1yfirst [5y     [1yphoneme [5y    [1yof [5y     [1ythis [5y    [1ynew [5y     [1yinpw [5y    [1ynode [5y     [1yis
[48{


[6{                 [5y      [1ycompared [5y     [1ywith [5y     [1ythe [5y     [1yright [5y     [1yoffspring [5y     [1yphoneme [5y     [1yof [5y     [1ythe [5y     [1ymatched [5y      [1ydictionary
[48{


[6{                 [5y      [1ynode.  [5y      [1yIf [5y   [1ythe [5y   [1ymatch [5y    [1ysucceeds [5y   [1ythen [5y   [1ythe [5y   [1ycomparison [5y   [1yprocess [5y   [1yis [5y    [1yrepeated.
[48{


[6{                 [5y      [1yIf [5y    [1ythe [5y    [1ymatch [5y    [1yfails, [5y    [1ythe [5y    [1yinpw [5y    [1ynode [5y    [1yphoneme [5y    [1yis [5y    [1ycompared [5y    [1ywith [5y    [1ythe [5y    [1yleft
[48{


[6{                 [5y      [1yoffspring [5y     [1ydictionary [5y      [1ynode [5y      [1yphoneme.  [5y           [1yTaking [5y      [1yaccount [5y      [1yof [5y     [1ythe [5y      [1yfact [5y      [1ythat
[48{


[6{                 [5y      [1ydictionary [5y  [1yand [5y   [1yinpw [5y  [1ynodes [5y   [1yare [5y  [1yordered, [5y   [1ywhenever [5y  [1ya [5y   [1ymatch [5y  [1yfails [5y   [1ythe [5y   [1ynext
[48{


[6{                 [5y      [1yinpw [5y  [1ynode [5y  [1yor [5y  [1ydictionary [5y  [1yword [5y [1ynode [5y  [1yis [5y  [1ytried.  [5y    [1yFor [5y  [1yexample, [5y  [1ywhen [5y  [1yan [5y  [1yinpw
[48{


[6{                 [5y      [1yphoneme 80 fails to match a dictionary node phoneme 60, and also fails [5y [1yto
[48{


[6{                 [5y      [1ymatch [5y  [1yits [5y  [1yleft [5y  [1yoffspring [5y  [1y90, [5y   [1yit [5y  [1yis [5y  [1ypointless [5y  [1yto [5y  [1ycompare [5y  [1yit [5y  [1ywith [5y  [1ythe [5y   [1yleft
[48{


[6{                 [5y      [1ydescendants of the [5y [1ynode storing 90, [5y [1yas the [5y [1yphonemes will [5y [1ybe greater [5y [1ythan
[48{


[6{                 [5y      [1y90.  [5y [1yInstead [5y [1ythe next [5y [1yinpw [5y [1yphoneme is [5y [1ycompared [5y [1ywith the [5y [1ydictionary [5y [1ynode
[48{


[6{                 [5y      [1ystoring 90.  [5y [1yIf [5y [1ythis inpw [5y [1yphoneme is [5y [1y120 [5y [1ythen the [5y [1ymatch would [5y [1yagain [5y [1yfail,
[48{


[6{                 [5y      [1yand [5y [1ythe [5y [1ynext left [5y [1yoffspring [5y [1yof [5y [1ythe [5y [1ydictionary [5y [1ywould [5y [1ybe [5y [1ycompared [5y [1yinstead.
[48{


[6{                 [5y      [1yIf [5y [1yat [5y [1yany [5y [1ypoint [5y [1ythere [5y [1yare [5y [1yno [5y [1ymore [5y [1yphonemes [5y  [1ylisted [5y [1yat [5y [1ythe [5y [1yinpw [5y [1ynode, [5y  [1yor
[48{


[6{                 [5y      [1yno [5y    [1ymore [5y     [1yleft [5y    [1yoffspring [5y     [1yphonemes [5y    [1yto [5y     [1ycompare, [5y    [1ythen [5y     [1ythe [5y    [1yprogram [5y     [1yback-
[48{


[6{                 [5y      [1ytracks to the last pair of nodes matched, [5y [1yfails that match, and [5y [1ycontinues.
[48{


[6{                 [5y      [1yIf [5y    [1ymatching [5y    [1ysucceeds [5y     [1ysuch [5y    [1ythat [5y    [1ythe [5y    [1yend [5y    [1ynode [5y     [1yof [5y    [1ythe [5y    [1yinpw [5y    [1ynetwork [5y     [1yis
[48{


[6{                 [5y      [1yreached then [5y [1yany [5y [1yword [5y [1ystrings [5y [1ystored [5y [1yin [5y [1ythe [5y [1ylast [5y [1ymatched [5y [1ydictionary [5y [1ynode
[48{


[6{                 [5y      [1yare [5y      [1ysaved [5y      [1yas [5y      [1y'possible [5y      [1yphonemic [5y       [1yequivalents' [5y      [1yfor [5y      [1ythe [5y      [1yinpw.   All [5y       [1ypaths
[48{


[6{                 [5y      [1ythrough [5y       [1ythe [5y        [1yinpw [5y        [1ynetwork [5y        [1yare [5y        [1ytried [5y        [1yand [5y        [1ythe [5y        [1ydictionary [5y        [1yis [5y        [1ysearched
[48{


[6{                 [5y      [1yexhaustively.  All possible matches are found.

[48{


[6{                   [5y  [1yIn [5y  [1yappendix [5y   [1yB [5y   [1ya [5y   [1yset [5y   [1yof [5y   [1yexamples [5y   [1yis [5y   [1ygiven:  [5y     [1ythe [5y   [1yphonetic [5y   [1ycoding [5y   [1yof [5y   [1ya
[48{


[6{                 [5y      [1ysmall example dictionary is shown; examples of [5y [1yinpws, parsed to produce [5y [1yall
[48{


[6{                 [5y      [1ysets of [5y [1yphonemes, are [5y [1ygiven.  [5y [1ySuccessful matches [5y [1yfor each [5y [1yinpw, from [5y [1ythe
[48{


[6{                 [5y      [1yexample dictionary, are given.

[48{


[6{                   [5y  [1yThe [5y     [1yeditcost [5y      [1yand [5y      [1yphoncode [5y      [1yprograms [5y     [1ydescribed [5y      [1yin [5y      [1ythis [5y      [1ychapter [5y      [1ywere
[48{


[6{                 [5y      [1ytested [5y     [1yon [5y     [1ya [5y      [1ycorpus [5y     [1yof [5y      [1yerrors [5y     [1yproduced [5y     [1yby [5y      [1ychildren [5y     [1ywith [5y     [1yspelling [5y      [1ydis-
[48{


[6{                 [5y      [1yabilities. Additionally, the [5y [1yeditcost program [5y [1ywas used [5y [1yand tested [5y [1yby a [5y [1ysmall
[48{


[6{                 [5y      [1ygroup [5y [1yof [5y  [1ychildren [5y  [1y(see [5y  [1yStudy [5y  [1y2 [5y  [1yin [5y  [1ychapter [5y  [1y6).  [5y   [1yThe [5y  [1yperformance [5y  [1yof [5y  [1yeach
[48{


[6{                 [5y      [1yof the programs is discussed in chapter 8.[1y[6{[2;4x
                                               [5y  [1yI


[5y[1y[3;1xTABLE OF CONTENTS


                 [5y      [1y[2;4x7. Detail of the editcost and phoncode programs                  [5y          [1y131
[48{


[6{                    [5y      [1y[3;1x7.1. Introduction                                     131
                    [5y      [1y7.2. Calculating [5y  [1ythe [5y  [1yminimum [5y  [1ycost [5y  [1yrepair: [5y  [1ythe [5y  [1yedit-  131
                         [5y      [1ycost program
7.2.1. General overview                           131
                        [5y      [1y7.2.2. Shortlisting candidates from the diction-  132
                               [5y      [1yary: 'shortlist'
7.2.3. The editcost algorithm                     134
                        [5y      [1y7.2.4. Relation of the children's errors          139
                        [5y      [1y7.2.5. Detail of the editcost program             142
                    [5y      [1y7.3. Phonemic coding of words: the phoncode program   149
                        [5y      [1y7.3.1. General overview                           149
                        [5y      [1y7.3.2. Related work                               149
                        [5y      [1y7.3.3. Design of the phoncode program             150
                        [5y      [1y7.3.4. Defining the set of phonemes               151
                        [5y      [1y7.3.5. Phoneme-grapheme correspondences           153
                        [5y      [1y7.3.6. Phonemic coding of the dictionary          158
                        [5y      [1y7.3.7. Detail of the phoncode program             160
                        [5y      [1y7.3.8. Segmenting the word                        160
                        [5y      [1y7.3.9. Representing the dictionary                165
                        [5y      [1y7.3.10. Matching the word and dictionary          167[1y[6{[2;4x
                                              [5y           [1yII


[5y[1y[3;1xLIST OF FIGURES


                    [5y      [1yFigure 7-1:   First   character   alternatives   for  133
                                  [5y      [1yshortlisting
                    [5y      [1yFigure 7-2:   Graph  [5y        [1yrepresenting  [5y        [1yedit  [5y        [1yoperation  136
                                  [5y      [1ytransformations
                    [5y      [1yFigure 7-3:   Costgraph showing the node labelling    137
                    [5y      [1yFigure 7-4:   Example [5y    [1yof [5y     [1ythe [5y     [1yspelling [5y     [1ycorrector [5y     [1yin  140
                                  [5y      [1yuse
Figure 7-5:   Study 1: frequency of error types       142
                    [5y      [1yFigure 7-6:   Study [5y  [1y1: [5y  [1yfrequency [5y  [1yof [5y  [1ytypes [5y  [1yof [5y  [1yspell-  143
                                  [5y      [1ying errors
                    [5y      [1yFigure 7-7:   Example  [5y   [1yof  [5y   [1ycandidates  [5y   [1yand  [5y   [1ymininum  144
                                  [5y      [1yeditcost
                    [5y      [1yFigure 7-8:   Representation of 'special cases'       145
                    [5y      [1yFigure 7-9:   Weightings assigned to edit functions   146
                    [5y      [1yFigure 7-10:   Graph showing example weightings       148
                    [5y      [1yFigure 7-11:   Examples  [5y  [1yof  [5y  [1yuse  [5y   [1yof  [5y  [1ythe  [5y   [1yphoncode  150
                                   [5y      [1yprogram
                    [5y      [1yFigure 7-12:   Representation of vowel phonemes       152
                    [5y      [1yFigure 7-13:   Representation of consonant phonemes   153
                    [5y      [1yFigure 7-14:   Finite [5y        [1yState [5y        [1yGrammar [5y        [1yrepresentation  161
                                   [5y      [1yof 'caught'
                    [5y      [1yFigure 7-15:   Alternative     representation     of  162
                                   [5y      [1y'caught'
                    [5y      [1yFigure 7-16:   Finite [5y        [1ystate [5y        [1ygrammar [5y        [1yrepresentation  164
                                   [5y      [1yof 'rime': v, c+e
                    [5y      [1yFigure 7-17:   Finite [5y        [1ystate [5y        [1ygrammar [5y        [1yrepresentation  164
                                   [5y      [1yof 'rime': v, c, e
                    [5y      [1yFigure 7-18:   Representation of 'vc + e' graphemes   165
                    [5y      [1yFigure 7-19:   Tree [5y       [1yrepresentation [5y       [1yof [5y       [1ypart [5y       [1yof [5y        [1ythe  166
                                   [5y      [1yphoncode dictionary