ESpeakEngine - Objective-C speech synthesizer

Jozef Bozek

Rate me:

4.80/5 (3 votes)

23 Jan 2012 · BSD · 2 min read

74.8K

ESpeakEngine - Objective-C speech synthesizer

ESpeakTest.zip
- __MACOSX
  - ESpeakTest
    - ._.DS_Store
    - .git
      - info
        
        ._exclude
    - ESpeakTest
      - ._AppDelegate.h
      - ._AppDelegate.m
      - ._ESpeakTest-Prefix.pch
      - ._main.m
      - ._ViewController.h
      - ._ViewController.m
      - en.lproj
        
        ._InfoPlist.strings
        
        ._ViewController_iPad.xib
    - ESpeakTestTests
      - ._ESpeakTestTests.h
      - ._ESpeakTestTests.m
      - en.lproj
        
        ._InfoPlist.strings
- ESpeakTest
  - .DS_Store
  - .git
    - branches
    - COMMIT_EDITMSG
    - config
    - description
    - HEAD
    - hooks
      - applypatch-msg.sample
      - commit-msg.sample
      - post-commit.sample
      - post-receive.sample
      - post-update.sample
      - pre-applypatch.sample
      - pre-commit.sample
      - prepare-commit-msg.sample
      - pre-rebase.sample
      - update.sample
    - index
    - info
      - exclude
    - logs
      - HEAD
      - refs
        
        heads
        
        master
    - objects
      - 00
        
        e88867c94b8f6728422a4ad099a53a9f392cb7
      - 01
        
        477be5465c04d4cfd46ab95003f17445731d74
      - 02
        
        37597b848a1890bb30ba0ff4102f8107cafdcb
        
        6363f6a3bb9fe78b03b09f4d0fdce472b95e20
        
        69a98a29eb1baf79dd1f6f2bbc9370b9c4c9cb
        
        78ea2136d97866104e3789d7950d39632b5046
      - 03
        
        7b0f820ace631b85715dfb13cc21fe26daa44d
        
        dac4f6baff6f5a2b06f5a68b6daa265c16e0a2
        
        edde41daf54530ac1fe426e9349a5544b48ccc
      - 05
        
        b2d0d21b687b4190600f6ea0206972c960dd1c
      - 06
        
        23379b22e1417ed806ff4c48337afbe9457cdf
      - 0c
        
        2d13a65548266d9c8a6758599c9a86faf53b28
      - 0d
        
        51695daffab058d065e942018f5c56067942fe
        
        6fa2a91273ee3271fb1d3202d7f6ad86379ef7
      - 10
        
        e91b22ea1e6c67962cd858e8d03de74e7abf6f
      - 11
        
        8095eb5859b9c2ee14be00adeb87ee66eaec94
      - 12
        
        83826f9250bed7326aed2542a0e3c5b47edbec
        
        ce1096a4ef6c4538a43ebd951dcaf2b624b717
      - 13
        
        664a34fe6a3b585603e00df15b17bcef3591e0
        
        93b3551c88468dccede7550726aae27a931555
      - 14
        
        1160885f6955ee4855933ce984bc117649d220
        
        417c1fdfdb3af16ef717d90a078f5c9b8468c3
      - 15
        
        96e3c77205e1688ad5968359106b5ea92d322a
      - 17
        
        004519410f433308228397abc30d2b69e55b26
      - 19
        
        3700525eaa0aa02256a4211c820007bb005995
        
        da34a5b9b6e585ece12d4a6ec24341fa98f50c
        
        fd69d3bec6857b0d4b29f4f26c03ac0dc727e3
      - 1a
        
        61238c5c772724cb12490eb555630bcc0e7870
        
        9e53b6e584bd1e8245f3fc69751211b7d4e86a
      - 1c
        
        2992dd5455746aef85905cc0293031e3e9ceaa
        
        a6f6abadb2e86be2baf2f823a27d16c43d2528
      - 1e
        
        9a757f891fd7ece2ff350dc9225837cb7e70f7
      - 1f
        
        2eb929019174a9b4c2654c1398ed26aca50e2c
      - 20
        
        5e59c21f973ea13de6deab139efee2f171027a
      - 21
        
        4d6f9d708a7691c1abf13b0801ee9a54a44ae6
      - 22
        
        a3b80f6954fd663b59f66210e7b658c5db3a3f
        
        a95d18a3ead5d0274abab7986121dccafc1842
      - 23
        
        8c69126e18387f9c2b3d059db6d7df1cd91a6f
      - 25
        
        55d5d8bec5ee0524034d96ea5aa95eeb1a90dd
        
        5fe35ca3bf7c8743abf0f95518aae822aac4f0
        
        bfdbf47ea384bd8118ed197a8842cb2104eb2a
        
        d78c05ca841d2019f204184927282dc69ebd61
      - 28
        
        59e093f75f1f88ca412e0bde9345afc01f15ac
      - 29
        
        91e99d136fe8e13f7c0c99eaa27c8ca397186d
      - 2a
        
        736d4d3f3c3ffe36bea620d6c28b672efc5867
        
        fb1adc71b7f4e90bd02355dd8cdb75e8d23870
      - 2e
        
        1534872410e5819a69396cdbb57225baa3a888
        
        9dd1f58881b69e931f3b5a73fef461eb9b838b
      - 30
        
        441d7e239ccd9169d15b04efc59be7a158a4a5
        
        dea89200864b8e84dc0fec67850491d460a78d
      - 31
        
        02c9a1a9a5db99cadf90502de610f69c994913
        
        bd479a3d5873c8a970de821a84d2addc864839
      - 32
        
        49dd4f8012e94af03784f043478ebab38fd0b7
      - 33
        
        00c360065de4a18e093dd02df3f6419b656f74
        
        430a22c186f11e5cf838e81dacb386a7e4c8d0
        
        8b8c450f3027ea5d3751fc1e0b4bf969cc1afc
      - 35
        
        a4a3fc517a71ec8bad8f9d0c71bd9da960c494
      - 36
        
        665314753a98e11162485805608fe1aca7bc1e
        
        669d3f0592eaeb8465b81341b486a4c9c1eb11
        
        a4bff6503dfb82fcdc7a160cc36f4cdd9e333d
      - 3a
        
        f2aa1af75587b7a29685fa2dbbebbd2b3592c2
      - 3b
        
        105a7fb0f9b3bb28a87a7212dfcef08daf53c0
      - 3d
        
        d75260a68d0fb7b88fe70d0e3e73c916b963e5
      - 3e
        
        520ec5c8b88db8f95f6a230273278fd39bfbd6
      - 41
        
        22d96b39bf2bc1025a1c57ef01b8b03936773d
      - 42
        
        dbdc5586bc89d681d23851f4a5aafd79b414cb
        
        de58882d0c80e94597b575893afc8e99bd431e
      - 46
        
        07dd079dd2748f8e9cde034268e6cd68278644
        
        317618d912082d6070e4e3972809824bd35395
      - 47
        
        7b28ff8f86a3158a71c4934fbd3a2456717d7a
      - 4b
        
        6a9ae550599ea85d77fea7c0f71b4d5aaf1ba8
      - 4c
        
        6239268d21312d311a504ad0d8aeb0e4f1030b
      - 4d
        
        ec15997c4e00c7a764156687431ac8c47676a5
      - 4e
        
        2b9d23e84059b93883e1a0c0f7a859a23b087e
      - 4f
        
        1904e5164410f93689beb55d46901b214271fe
        
        8f5e88f436d478b126c5c4eccf3568e398c26f
        
        e4188e53b10cc21b50c3bf47e9ef3b2fc4c641
      - 50
        
        1b5a4a8620d5bd9a545c8941cdcbd565fca1c6
      - 52
        
        1be164ce6c87e1d6df58fd82ab160c8f6255db
        
        692c38546eb82aee2a7550c93798f70f02dc9a
        
        c5ac93561331143a9caea14d6c0f008216b4e9
      - 53
        
        6957cb8fe03bde580784e6f97537ec3444e9c3
        
        7beb3ba82da8af147f028685e61fc839cad713
        
        c2a70482993f53d6df321687b5cc4d9e95abc1
        
        cb31446e077a5f159c831e126a0e3f9a2d0ed2
      - 56
        
        9f9d05432267a13b75ca2562beb85e1e1c17db
      - 58
        
        1cd883fed6aa3b84b580a543b6ec8998f4d327
      - 5a
        
        24e11ad4dc2842c79033ad323f02e2e6c2f566
        
        85640ee385afef9b9dc9b7d2889d47b81aa1bd
      - 5c
        
        3583da4700ab6982766d187d1195b37f9a3fb5
      - 5e
        
        bb6a35716f489f249db8bb0e9df7dde150eba4
      - 5f
        
        3297d3a2009a6051a8ebc606bc674056ea03fc
      - 61
        
        124ff298a7d392b816cb1a71095ed1ec8ffe6b
      - 65
        
        3c3f5c4a2d2e44b8a188b88b64278085ebde27
      - 68
        
        1cad9627cb3af687a30507f05114c89ef9340f
      - 69
        
        cceefb779a5236074db6871d7523d92f8a709f
      - 6a
        
        8d5efd87553a3f0e977636c6b819cddf3a99e7
        
        cadba6aea97cd920745428a1c4ccd998581cc7
      - 6c
        
        65e3c6851f204d9c4cd9b616b46a9ff425b3c2
      - 6d
        
        826477b6ee1ecb3e502ffe3c26387d1bce3961
      - 6e
        
        11c93121ab5d535e4f2d50253ee4a527694a9f
      - 71
        
        99341c34f93f5fa5219ff479e82edaee5d7936
        
        ecab7197ec9646efdae05bb02b465f5b5e361a
      - 73
        
        ac62a4ab12374bbf6f72539b2e104d10d7d394
      - 74
        
        00c07a5c17fbbead0d252a22f1fcdb6e5f15c4
        
        0601d129aa08fd59be839301c923b684361dbe
      - 79
        
        2d8a9f9ef248c4358c36000722ba0c53a76497
      - 7c
        
        bdab338114c51e83e0b54c67280b91872211d5
      - 7d
        
        276eb2b779d73c46d8ed97e4be287bec96c828
      - 7e
        
        6c16a2c28e97392d20d4f4c243ecd6f6f40a91
        
        f93a5edd61fddc97d982242d7654e5ab07a09e
      - 7f
        
        4631899e208f50b855ad579b726eadea70f67d
        
        fccbe6dd68c968e78da5b6265a13c62c1fc639
      - 82
        
        2c9a312addee71797811c17690f2be8746bea4
        
        98f98722e5f5f405e9631eb4a5064d87114424
      - 83
        
        71a46410d32c3f000db4c7b11254f48a3d6055
      - 84
        
        79e658ebe74cdd0b9525a41dededf8b9839858
        
        ccc3a6d4681e19dbe6b982ddcee2e760944d55
      - 85
        
        ebb03e3089c5055e4f76d272866738a90a7842
      - 88
        
        1634035cad7fbc213a9def0b5e5ef7f15dffa2
        
        48d6820e826b907349234a642535725247f837
      - 89
        
        28f0ff69aa677f7c5f96053ca70589552e17b0
        
        e6c82914aa9457a644d5a498fa643f98b9ade3
      - 8f
        
        c65d4bab0f132f34e70868a961188deabc55dc
        
        d4a63a1a24c8b25eab5ed28c135457a8332e6b
      - 92
        
        3d517415d489cc9b3f91638c14264dd0df55a3
        
        a1582817dc2f8256db5a02bed320a05f6e5e43
      - 95
        
        8799c61770d05ba341183cd2d6a107a1ec093c
      - 96
        
        35ac150af1804b398d67cf4703d718a16806a7
      - 97
        
        8ec49ed00c46862d89580efe68f7efd98c93c3
        
        a337d34bb9ab89812b5e79c3bc2bb784d48953
      - 98
        
        9f9eab7b5ee98f4b6acf35fe8b4ef86db3a62e
      - 9b
        
        06e0bd24aa4658ed8009be3e2fe7e32ccee54e
        
        280bf8bc106ca904c9b33a90d0822c4c9b03fd
        
        2d891f12030afadc1e737914a1759ab59ef01f
        
        a872a49ab896e3d7c6203bedfd2502d8cb6521
        
        c60c7cbd38db3307551ae17ef2a8a5d623b3a0
      - 9d
        
        e1630d90e22bf6df53a0093c212e9e1d7da9b6
        
        eba8432350a07d0ab15189bb124d48b836fb62
      - 9e
        
        9c4e7476f3dce3b6808b0c8ea917a4d8503d7f
      - a3
        
        72fb170d6218ccc7298335f1ea55ff674fb3cc
      - a5
        
        4cb02cd26c7ecc2bd08debb1cfe85c3546c039
        
        504505ef08ce6040091e48eb5c1653a34574b0
      - a6
        
        56d2c7f2e9509fef687b3174282f6ec9b61498
        
        e0f46bb57f876255cdb5767729aefccbe3a33e
      - a7
        
        a8223dbda4d4cd47ae8796ad2be9bc70e46754
      - a9
        
        09e1af21f9dc9dccf095d02920266ea11fe7f5
        
        0c7b72565da6e015014e343f10ae50197587c9
      - aa
        
        80edaad05f0f16c6195e72a0130d803b58bcbc
      - ae
        
        76a4c4deb77d53e7ee512c3e85f45ba802dd08
        
        9247d41055f6721d3500645539ee00ae29d7e4
        
        a3d895c09d5eae5411aec5fb5ecbe82451bd50
      - b0
        
        d4979c857d151ef5cd27248926fb112c0c3cee
      - b1
        
        a874be65ad7df189c933f4c576475f29d15f67
      - b2
        
        7a8114a03ed27348a40f37428107e02f67acc8
        
        fd9d084c6df70da314916ee674421872f9ef50
      - b3
        
        2b6a6660b12a14fc5e8749eff9ba696b7f6061
      - b4
        
        8b1788b979853cdd57bb6cec6b9cc4dd7925bc
      - b7
        
        39a86e488eeec6f5693b7ee2590f84d6c95191
      - b8
        
        519559d3db834193518d4f4c4fed777734c8ee
        
        6f59306a576f4548ff3bd62e344570cc538932
        
        f782946f4728a629eda8038e82dd165dadee1d
      - ba
        
        7c42cc48ae095ccfffeb03cf36d519d7cbe5a3
      - bc
        
        bb2a0058b7866064b779ae246244c5342a0ccb
      - bd
        
        336a9884877889e2f85ee1849f8a068d2c6279
      - be
        
        1b6246a01d3d9c01dac0f888454369e0b32892
      - c0
        
        a5475ece89c3274e62f9132560ec8afdd569d4
      - c2
        
        34f46877a761d5c98fda2cbbeb172dc2efc81a
        
        76bec0dd56b68a8e0ed0062b38dd149422b45d
      - c3
        
        2db3968df0779b3c3a47899085625a7b86339b
      - c6
        
        32e263c2a639311be4ca1512aadee97a91bc9a
      - cb
        
        c4fb3a5d3dcc07f26b5ca02eb53a52b897aa80
      - cd
        
        02abedb89d8975a792d73de536d2ce82260553
      - ce
        
        800f70be34d9fba11f7d09b0c329b3f259507b
      - cf
        
        584b7dd3f005be3cffb47d27f1bfe980a6e53b
        
        f13bac9dd46f2c2a2fb66db64ce78caffd5b5a
      - d0
        
        2b035cae9b12c66a5e0d5ae9cf57433041ed40
        
        864f3d6209ad6f3e8ab51dc880836e67c96fc5
        
        b729579de2537a63cebdb809e8bdfb5a897a33
      - d2
        
        5865608d7d973e77c77d13bbdbe3ae454d864d
      - d3
        
        d7720074a2fc7e3bfbc18cc1bacad0f9ea61d2
      - d5
        
        06e7f9f85667d054794f808f9098b2a1625372
        
        9fe79529970f627e83857f9bd516f5474bf685
      - d6
        
        737d787752a799349095b49cf81024dfd00fb6
        
        811d3ae4f710d3eb8a16c690cd42bebc4faf4e
      - d7
        
        59cfdf018f8814d995588d176dadde0820b5ca
      - d8
        
        ecd252c04bc00a6dcc6d0b84d64285726b65d4
        
        f35efaa2dc2293277365d811c9b6222cfe59b8
      - da
        
        c1e4d0643b01e99052f575b5f6add2e10a2143
        
        ef5160c9c1500d3a9f6b0eadf434ef702a009f
      - db
        
        63d6ca3d87629e693327a2ba4a719e79847b6c
        
        de212341a0b131224b3e123f91d154348070ba
      - dc
        
        51396ce24aad46d1c761e2c96f8aee68d4b622
      - de
        
        4786c94cfa90c84982ca06a2a9623035993dfc
      - df
        
        70f4387ca97d30c66d7dc87d5abca9b0ffa820
        
        7fa77bc23477530674f05f4f619803983d5eb0
      - e0
        
        783ec3b1e38ce0f77b5b018d9b8641a7b924c3
        
        ea6d6394ab8409463adfeb753f1632ef09a47f
      - e4
        
        16c6dc5e784243ad8d33000139178fa178de87
        
        1d3105c048e789fe605c780efe2881df833ea8
      - e7
        
        178e4d5666a3b75aa48de33b966f0590665a8e
      - e8
        
        5978c76abd7430436356cd2a126018642d6a2d
      - ea
        
        dd707322e08d90e3a2208aef9060706c340799
      - eb
        
        d92ffb3ec9499292d1faa7ca60adcc5edac74f
      - ed
        
        05f4240da98a569e3c9f9a5b9e2301d7caa79e
      - ee
        
        3bd233e2bc458aab63eb36f613f853f72e6bf7
      - f2
        
        033dc11fee0a1db4a2cae358c1a808149a5aa2
        
        130ba4f980783f8605eb50387ffc2e54f66b3c
      - f3
        
        10f868efea6408fc49fd4e6d6c293db2098114
        
        e97b52355ea6f5384790bb3cda677222be900c
      - f4
        
        3ef84fa6caf08bc6e9e442e15d71eaa8c6962a
        
        ede3296c4fb294a58715e61ecef26f74ed898a
      - f5
        
        0e89c905a3e8dd519f415585283757fc85d2d6
      - f9
        
        624b31623b500b57b74e9765ac7a2d9f039c65
      - fa
        
        4eece0b1cc7dababed3d09d560f38e00ea8755
      - fc
        
        377156b487a559efb384ec2b6e551d6c2085c6
        
        60f41672c8fb6fc69c1548552988f046a2aa14
      - fe
        
        7c4d8d002499fbaff530adfaa0543d626536dd
      - ff
        
        a94206372e46914dcadeb10c212a9674daf62e
      - info
      - pack
    - refs
      - heads
        
        master
      - tags
  - ESpeakTest.xcodeproj
    - project.pbxproj
    - project.xcworkspace
      - contents.xcworkspacedata
      - xcuserdata
        
        jozefbozek.xcuserdatad
        
        UserInterfaceState.xcuserstate
    - xcuserdata
      - jozefbozek.xcuserdatad
        
        xcdebugger
        
        Breakpoints.xcbkptlist
        
        xcschemes
        
        ESpeakTest.xcscheme
        
        xcschememanagement.plist
  - ESpeakTest
    - AppDelegate.h
    - AppDelegate.m
    - en.lproj
      - InfoPlist.strings
      - ViewController_iPad.xib
      - ViewController_iPhone.xib
    - ESpeakTest-Info.plist
    - ESpeakTest-Prefix.pch
    - main.m
    - ViewController.h
    - ViewController.m
  - ESpeakTestTests
    - en.lproj
      - InfoPlist.strings
    - ESpeakTestTests.h
    - ESpeakTestTests.m
    - ESpeakTestTests-Info.plist
eSpeak_1.0.zip
- eSpeak_1.0
  - ._eSpeak_Prefix.pch
  - ._TestApp-Info.plist
  - Classes
    - ._ESpeakEngine.h
    - ._ESpeakEngine.m
    - Libraries
      - ._compiledict.cpp
      - ._debug.cpp
      - ._debug.h
      - ._dictionary.cpp
      - ._espeak_command.cpp
      - ._espeak_command.h
      - ._espeak-data
      - ._event.cpp
      - ._event.h
      - ._fifo.cpp
      - ._fifo.h
      - ._intonation.cpp
      - ._klatt.cpp
      - ._klatt.h
      - ._mbrowrap.cpp
      - ._mbrowrap.h
      - ._numbers.cpp
      - ._phoneme.h
      - ._phonemelist.cpp
      - ._portaudio.h
      - ._portaudio18.h
      - ._portaudio19.h
      - ._readclause.cpp
      - ._setlengths.cpp
      - ._sintab.h
      - ._speak_lib.cpp
      - ._speak_lib.h
      - ._speech.h
      - ._StdAfx.h
      - ._synth_mbrola.cpp
      - ._synthdata.cpp
      - ._synthesize.cpp
      - ._synthesize.h
      - ._tr_languages.cpp
      - ._translate.cpp
      - ._translate.h
      - ._voice.h
      - ._voices.cpp
      - ._wave.cpp
      - ._wave.h
      - ._wave_pulse.cpp
      - ._wave_sada.cpp
      - ._wavegen.cpp
      - espeak-data
        
        ._af_dict
        
        ._ca_dict
        
        ._config
        
        ._cs_dict
        
        ._cy_dict
        
        ._da_dict
        
        ._de_dict
        
        ._el_dict
        
        ._en_dict
        
        ._eo_dict
        
        ._es_dict
        
        ._fi_dict
        
        ._fr_dict
        
        ._grc_dict
        
        ._hbs_dict
        
        ._hi_dict
        
        ._hu_dict
        
        ._hy_dict
        
        ._id_dict
        
        ._intonations
        
        ._is_dict
        
        ._it_dict
        
        ._jbo_dict
        
        ._ku_dict
        
        ._la_dict
        
        ._lv_dict
        
        ._mbrola
        
        ._mbrola_ph
        
        ._mk_dict
        
        ._nci_dict
        
        ._nl_dict
        
        ._no_dict
        
        ._pap_dict
        
        ._phondata
        
        ._phonindex
        
        ._phontab
        
        ._pl_dict
        
        ._pt_dict
        
        ._ro_dict
        
        ._ru_dict
        
        ._sk_dict
        
        ._soundicons
        
        ._sq_dict
        
        ._sv_dict
        
        ._sw_dict
        
        ._ta_dict
        
        ._tr_dict
        
        ._vi_dict
        
        ._voices
        
        ._zh_dict
        
        ._zhy_dict
        
        mbrola_ph
        
        ._af1_phtrans
        
        ._ca1_phtrans
        
        ._cr1_phtrans
        
        ._cs_phtrans
        
        ._de2_phtrans
        
        ._de4_phtrans
        
        ._de6_phtrans
        
        ._en1_phtrans
        
        ._es_phtrans
        
        ._fr1_phtrans
        
        ._gr2_phtrans
        
        ._grc-de6_phtrans
        
        ._hu1_phtrans
        
        ._ic1_phtrans
        
        ._id1_phtrans
        
        ._in1_phtrans
        
        ._it3_phtrans
        
        ._la1_phtrans
        
        ._nl_phtrans
        
        ._pl1_phtrans
        
        ._pt_phtrans
        
        ._pt1_phtrans
        
        ._ptbr_phtrans
        
        ._ptbr4_phtrans
        
        ._ro1_phtrans
        
        ._sv_phtrans
        
        ._sv2_phtrans
        
        ._tr1_phtrans
        
        ._us_phtrans
        
        ._us3_phtrans
        
        voices
        
        !v
        
        ._croak
        
        ._f1
        
        ._f2
        
        ._f3
        
        ._f4
        
        ._f5
        
        ._fast
        
        ._klatt
        
        ._klatt2
        
        ._klatt3
        
        ._m1
        
        ._m2
        
        ._m3
        
        ._m4
        
        ._m5
        
        ._m6
        
        ._m7
        
        ._whisper
        
        ._whisperf
        
        ._!v
        
        ._af
        
        ._bs
        
        ._ca
        
        ._cs
        
        ._cy
        
        ._da
        
        ._de
        
        ._default
        
        ._el
        
        ._en
        
        ._eo
        
        ._es
        
        ._es-la
        
        ._fi
        
        ._fr
        
        ._fr-be
        
        ._hi
        
        ._hr
        
        ._hu
        
        ._hy
        
        ._hy-west
        
        ._id
        
        ._is
        
        ._it
        
        ._ku
        
        ._la
        
        ._lv
        
        ._mb
        
        ._mk
        
        ._nl
        
        ._no
        
        ._pl
        
        ._pt
        
        ._pt-pt
        
        ._ro
        
        ._ru
        
        ._sk
        
        ._sq
        
        ._sr
        
        ._sv
        
        ._sw
        
        ._ta
        
        ._test
        
        ._tr
        
        ._vi
        
        ._zh
        
        ._zh-yue
        
        en
        
        ._en
        
        ._en-n
        
        ._en-rp
        
        ._en-sc
        
        ._en-us
        
        ._en-wi
        
        ._en-wm
        
        mb
        
        ._mb-af1
        
        ._mb-af1-en
        
        ._mb-br1
        
        ._mb-br3
        
        ._mb-br4
        
        ._mb-cr1
        
        ._mb-cz2
        
        ._mb-de2
        
        ._mb-de4
        
        ._mb-de4-en
        
        ._mb-de5
        
        ._mb-de5-en
        
        ._mb-de6
        
        ._mb-de6-grc
        
        ._mb-de7
        
        ._mb-en1
        
        ._mb-es1
        
        ._mb-es2
        
        ._mb-fr1
        
        ._mb-fr1-en
        
        ._mb-fr4
        
        ._mb-fr4-en
        
        ._mb-gr2
        
        ._mb-gr2-en
        
        ._mb-hu1
        
        ._mb-hu1-en
        
        ._mb-ic1
        
        ._mb-id1
        
        ._mb-it3
        
        ._mb-it4
        
        ._mb-la1
        
        ._mb-nl2
        
        ._mb-nl2-en
        
        ._mb-pl1
        
        ._mb-pl1-en
        
        ._mb-pt1
        
        ._mb-ro1
        
        ._mb-ro1-en
        
        ._mb-sw1
        
        ._mb-sw1-en
        
        ._mb-sw2
        
        ._mb-sw2-en
        
        ._mb-tr1
        
        ._mb-tr2
        
        ._mb-us1
        
        ._mb-us2
        
        ._mb-us3
        
        test
        
        ._grc
        
        ._jbo
        
        ._nci
        
        ._pap
    - Tests
- eSpeak_1.0
  - Classes
    - ESpeakEngine.h
    - ESpeakEngine.m
  - eSpeak.xcodeproj
    - jBozEk.mode1v3
    - jBozEk.pbxuser
    - project.pbxproj
    - project.xcworkspace
      - contents.xcworkspacedata
      - xcuserdata
        
        jBozEk.xcuserdatad
        
        UserInterfaceState.xcuserstate
        
        jozefbozek.xcuserdatad
        
        UserInterfaceState.xcuserstate
        
        WorkspaceSettings.xcsettings
    - xcuserdata
      - jBozEk.xcuserdatad
        
        xcschemes
        
        xcschememanagement.plist
      - jozefbozek.xcuserdatad
        
        xcdebugger
        
        Breakpoints.xcbkptlist
        
        xcschemes
        
        eSpeak.xcscheme
        
        TestApp.xcscheme
        
        xcschememanagement.plist
  - eSpeak_Prefix.pch
  - Libraries
    - compiledict.cpp
    - debug.cpp
    - debug.h
    - dictionary.cpp
    - espeak_command.cpp
    - espeak_command.h
    - espeak-data
      - af_dict
      - ca_dict
      - config
      - cs_dict
      - cy_dict
      - da_dict
      - de_dict
      - el_dict
      - en_dict
      - eo_dict
      - es_dict
      - fi_dict
      - fr_dict
      - grc_dict
      - hbs_dict
      - hi_dict
      - hu_dict
      - hy_dict
      - id_dict
      - intonations
      - is_dict
      - it_dict
      - jbo_dict
      - ku_dict
      - la_dict
      - lv_dict
      - mbrola
      - mbrola_ph
        
        af1_phtrans
        
        ca1_phtrans
        
        cr1_phtrans
        
        cs_phtrans
        
        de2_phtrans
        
        de4_phtrans
        
        de6_phtrans
        
        en1_phtrans
        
        es_phtrans
        
        fr1_phtrans
        
        gr2_phtrans
        
        grc-de6_phtrans
        
        hu1_phtrans
        
        ic1_phtrans
        
        id1_phtrans
        
        in1_phtrans
        
        it3_phtrans
        
        la1_phtrans
        
        nl_phtrans
        
        pl1_phtrans
        
        pt_phtrans
        
        pt1_phtrans
        
        ptbr_phtrans
        
        ptbr4_phtrans
        
        ro1_phtrans
        
        sv_phtrans
        
        sv2_phtrans
        
        tr1_phtrans
        
        us_phtrans
        
        us3_phtrans
      - mk_dict
      - nci_dict
      - nl_dict
      - no_dict
      - pap_dict
      - phondata
      - phonindex
      - phontab
      - pl_dict
      - pt_dict
      - ro_dict
      - ru_dict
      - sk_dict
      - soundicons
      - sq_dict
      - sv_dict
      - sw_dict
      - ta_dict
      - tr_dict
      - vi_dict
      - voices
        
        !v
        
        croak
        
        f1
        
        f2
        
        f3
        
        f4
        
        f5
        
        fast
        
        klatt
        
        klatt2
        
        klatt3
        
        m1
        
        m2
        
        m3
        
        m4
        
        m5
        
        m6
        
        m7
        
        whisper
        
        whisperf
        
        af
        
        bs
        
        ca
        
        cs
        
        cy
        
        da
        
        de
        
        default
        
        el
        
        en
        
        en
        
        en-n
        
        en-rp
        
        en-sc
        
        en-us
        
        en-wi
        
        en-wm
        
        eo
        
        es
        
        es-la
        
        fi
        
        fr
        
        fr-be
        
        hi
        
        hr
        
        hu
        
        hy
        
        hy-west
        
        id
        
        is
        
        it
        
        ku
        
        la
        
        lv
        
        mb
        
        mb-af1
        
        mb-af1-en
        
        mb-br1
        
        mb-br3
        
        mb-br4
        
        mb-cr1
        
        mb-cz2
        
        mb-de2
        
        mb-de4
        
        mb-de4-en
        
        mb-de5
        
        mb-de5-en
        
        mb-de6
        
        mb-de6-grc
        
        mb-de7
        
        mb-en1
        
        mb-es1
        
        mb-es2
        
        mb-fr1
        
        mb-fr1-en
        
        mb-fr4
        
        mb-fr4-en
        
        mb-gr2
        
        mb-gr2-en
        
        mb-hu1
        
        mb-hu1-en
        
        mb-ic1
        
        mb-id1
        
        mb-it3
        
        mb-it4
        
        mb-la1
        
        mb-nl2
        
        mb-nl2-en
        
        mb-pl1
        
        mb-pl1-en
        
        mb-pt1
        
        mb-ro1
        
        mb-ro1-en
        
        mb-sw1
        
        mb-sw1-en
        
        mb-sw2
        
        mb-sw2-en
        
        mb-tr1
        
        mb-tr2
        
        mb-us1
        
        mb-us2
        
        mb-us3
        
        mk
        
        nl
        
        no
        
        pl
        
        pt
        
        pt-pt
        
        ro
        
        ru
        
        sk
        
        sq
        
        sr
        
        sv
        
        sw
        
        ta
        
        test
        
        grc
        
        jbo
        
        nci
        
        pap
        
        tr
        
        vi
        
        zh
        
        zh-yue
      - zh_dict
      - zhy_dict
    - event.cpp
    - event.h
    - fifo.cpp
    - fifo.h
    - intonation.cpp
    - klatt.cpp
    - klatt.h
    - mbrowrap.cpp
    - mbrowrap.h
    - numbers.cpp
    - phoneme.h
    - phonemelist.cpp
    - portaudio.h
    - portaudio18.h
    - portaudio19.h
    - readclause.cpp
    - setlengths.cpp
    - sintab.h
    - speak_lib.cpp
    - speak_lib.h
    - speech.h
    - StdAfx.h
    - synth_mbrola.cpp
    - synthdata.cpp
    - synthesize.cpp
    - synthesize.h
    - tr_languages.cpp
    - translate.cpp
    - translate.h
    - voice.h
    - voices.cpp
    - wave.cpp
    - wave.h
    - wave_pulse.cpp
    - wave_sada.cpp
    - wavegen.cpp
  - TestApp-Info.plist
  - Tests

/***************************************************************************
 *   Copyright (C) 2005 to 2010 by Jonathan Duddington                     *
 *   email: jonsd@users.sourceforge.net                                    *
 *                                                                         *
 *   This program is free software; you can redistribute it and/or modify  *
 *   it under the terms of the GNU General Public License as published by  *
 *   the Free Software Foundation; either version 3 of the License, or     *
 *   (at your option) any later version.                                   *
 *                                                                         *
 *   This program is distributed in the hope that it will be useful,       *
 *   but WITHOUT ANY WARRANTY; without even the implied warranty of        *
 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the         *
 *   GNU General Public License for more details.                          *
 *                                                                         *
 *   You should have received a copy of the GNU General Public License     *
 *   along with this program; if not, see:                                 *
 *               <http://www.gnu.org/licenses/>.                           *
 ***************************************************************************/

#include "StdAfx.h"

#include <stdio.h>
#include <ctype.h>
#include <wctype.h>
#include <stdlib.h>
#include <string.h>
#include <locale.h>

#include <wctype.h>

#include "speak_lib.h"
#include "speech.h"
#include "phoneme.h"
#include "synthesize.h"
#include "translate.h"



// Language codes packed into an integer: each byte is the ASCII value of one
// letter of the code (e.g. 0x677263 = 'g','r','c').  L_qa holds the two letters
// 'q','a' followed by a zero byte.
#define L_qa   0x716100
#define L_grc  0x677263   // grc  Ancient Greek
#define L_jbo  0x6a626f   // jbo  Lojban
#define L_pap  0x706170   // pap  Papiamento
#define L_shs  0x736873   // shs  Shuswap / Secwepemctsin
#define L_zhy  0x7a6879   // zhy  (presumably Cantonese, cf. the zh-yue voice - TODO confirm)

// start of unicode pages for character sets
#define OFFSET_GREEK  0x380
#define OFFSET_CYRILLIC 0x420
#define OFFSET_ARMENIAN 0x530
#define OFFSET_ARABIC 0x600
#define OFFSET_DEVANAGARI  0x900
#define OFFSET_BENGALI 0x980
#define OFFSET_GURMUKHI 0xa00
#define OFFSET_TAMIL  0xb80
#define OFFSET_KANNADA 0xc80
#define OFFSET_MALAYALAM 0xd00
#define OFFSET_KOREAN 0x1100

static void Translator_Russian(Translator *tr);



static void SetLetterVowel(Translator *tr, int c)
{//==============================================
// Mark letter 'c' as a vowel in tr->letter_bits.
// The entry is overwritten with bits 0 and 7 set (mask 0x81); the only bit
// carried over from the previous value is 0x40 (group 6, front vowels e,i,y).
// Every other group bit of the entry is cleared.
	const int front_vowel = tr->letter_bits[c] & 0x40;

	tr->letter_bits[c] = front_vowel | 0x81;
}

static void ResetLetterBits(Translator *tr, int groups)
{//====================================================
// Clear, in every entry of tr->letter_bits, each bit that is set in 'groups'.
// 'groups' is a bit mask (one bit per letter group), not a group index.
	const unsigned int keep = ~groups;   // bits that survive the reset
	unsigned int ix = 0;

	// NOTE(review): the bound is sizeof(), i.e. a byte count - this visits every
	// entry only if letter_bits elements are one byte wide; confirm in translate.h
	while(ix < sizeof(tr->letter_bits))
	{
		tr->letter_bits[ix] &= keep;
		ix++;
	}
}

static void SetLetterBits(Translator *tr, int group, const char *string)
{//=====================================================================
// Add every character of the NUL-terminated 'string' to letter group 'group'
// by setting bit number 'group' in that character's tr->letter_bits entry.
// Characters are read as unsigned bytes so that values >= 0x80 index correctly.
	const unsigned char *p;
	const int bits = (1L << group);

	for(p = (const unsigned char *)string; *p != 0; p++)
	{
		tr->letter_bits[*p] |= bits;
	}
}

static void SetLetterBitsRange(Translator *tr, int group, int first, int last)
{
	// Add every letter code from 'first' to 'last' (both inclusive) to letter
	// group number 'group'.  Nothing is changed when first > last.
	const int group_flag = (1L << group);
	int code = first;

	while(code <= last)
	{
		tr->letter_bits[code] |= group_flag;
		code++;
	}
}


static Translator* NewTranslator(void)
{
	// Allocate a Translator and load it with the default settings.
	// SelectTranslator() calls this first and then overrides individual values
	// for the requested language.  Returns NULL when Alloc() fails.
	static const unsigned char default_amps[] = {17,17, 20,20, 20,22, 22,20 };
	static const short default_lengths[8] = {182,140, 220,220, 220,240, 260,280};
	static const wchar_t no_chars[1] = {0};
	static const wchar_t apostrophe_only[2] = {'\'', 0};  // apostrophe is allowed within words
	static const unsigned char initial_tunes[6] = {0, 1, 2, 3, 0, 0};
	Translator *tr;
	int level;

	tr = (Translator *)Alloc(sizeof(Translator));
	if(!tr)
	{
		return NULL;
	}

	// --- character set and dictionary state ---
	tr->charset_a0 = charsets[1];   // ISO-8859-1, used when the input is not utf8
	dictionary_name[0] = 0;
	tr->dict_condition = 0;
	tr->data_dictrules = NULL;      // language_1   translation rules file
	tr->data_dictlist = NULL;       // language_2   dictionary lookup file

	tr->transpose_min = 'a';
	tr->transpose_max = 'z';
	tr->frequent_pairs = NULL;

	// --- letter groups: only lower case letters are needed ---
	tr->letter_bits_offset = 0;
	memset(tr->letter_bits, 0, sizeof(tr->letter_bits));
	memset(tr->letter_groups, 0, sizeof(tr->letter_groups));

	// Groups 0-6 are the character sets matched by A B C H F G Y in the
	// pronunciation rules; individual languages may redefine them.
	SetLetterBits(tr, 0, "aeiou");                 // A  vowels, except y
	SetLetterBits(tr, 1, "bcdfgjklmnpqstvxz");     // B  hard consonants, excluding h,r,w
	SetLetterBits(tr, 2, "bcdfghjklmnpqrstvwxz");  // C  all consonants
	SetLetterBits(tr, 3, "hlmnr");                 // H  'soft' consonants
	SetLetterBits(tr, 4, "cfhkpqstx");             // F  voiceless consonants
	SetLetterBits(tr, 5, "bdgjlmnrvwyz");          // G  voiced
	SetLetterBits(tr, 6, "eiy");                   // Y  front vowels
	SetLetterBits(tr, 7, "aeiouy");                // vowels, including y

	tr->char_plus_apostrophe = no_chars;
	tr->punct_within_word = apostrophe_only;

	// --- stress tables (stress_amps_r is one less than stress_amps) ---
	level = 0;
	while(level < 8)
	{
		tr->stress_amps[level] = default_amps[level];
		tr->stress_amps_r[level] = default_amps[level] - 1;
		tr->stress_lengths[level] = default_lengths[level];
		level++;
	}

	// --- language options: start from all-zero, then set the non-zero defaults ---
	memset(&(tr->langopts), 0, sizeof(tr->langopts));
	tr->langopts.max_lengthmod = 500;

	tr->langopts.stress_rule = STRESSPOSN_2R;
	tr->langopts.unstressed_wd1 = 1;
	tr->langopts.unstressed_wd2 = 3;
	tr->langopts.param[LOPT_SONORANT_MIN] = 95;
	tr->langopts.param[LOPT_LONG_VOWEL_THRESHOLD] = 190/2;
	tr->langopts.param[LOPT_MAXAMP_EOC] = 19;
	tr->langopts.param[LOPT_UNPRONOUNCABLE] = 's';   // don't count this character at start of word
	tr->langopts.param[LOPT_BRACKET_PAUSE] = 4;      // pause at bracket
	tr->langopts.param2[LOPT_BRACKET_PAUSE] = 2;     // pauses when announcing bracket names
	tr->langopts.max_initial_consonants = 3;
	tr->langopts.replace_chars = NULL;
	tr->langopts.ascii_language = "";   // non-Latin alphabet languages use this language to speak Latin words; default is English

	SetLengthMods(tr, 201);

	tr->langopts.long_stop = 100;

	// --- number handling ---
	tr->langopts.max_roman = 49;
	tr->langopts.min_roman = 2;
	tr->langopts.thousands_sep = ',';
	tr->langopts.decimal_sep = '.';
	tr->langopts.break_numbers = BREAK_THOUSANDS;   // 1000, 1000,000  1,000,000 etc
	tr->langopts.max_digits = 14;

	// --- intonation ---
	memcpy(tr->punct_to_tone, punctuation_to_tone, sizeof(tr->punct_to_tone));
	memcpy(tr->langopts.tunes, initial_tunes, sizeof(tr->langopts.tunes));

	return tr;
}

// Common Russian letter pairs; each pair is encoded as a single byte.
// Every entry is 2 bytes, using the transposed character codes
// (SetCyrillicLetters() sets the transpose range to start at 0x430).
// In each value the low byte is the first letter of the pair and the high
// byte is the second letter, e.g. 0x010c = 0x0c,0x01 = "ла".
// The number in each comment is presumably the pair's frequency count, and the
// 0x23 / 0x30 notes appear to be the single-byte code given to that entry
// (0x23 + index) - TODO confirm against the code that reads frequent_pairs.
static const short pairs_ru[] = { 
0x010c, //  ла   21052  0x23
0x010e, //  на   18400
0x0113, //  та   14254
0x0301, //  ав   31083
0x030f, //  ов   13420
0x060e, //  не   21798
0x0611, //  ре   19458
0x0903, //  ви   16226
0x0b01, //  ак   14456
0x0b0f, //  ок   17836
0x0c01, //  ал   13324
0x0c09, //  ил   16877
0x0e01, //  ан   15359
0x0e06, //  ен   13543  0x30
0x0e09, //  ин   17168
0x0e0e, //  нн   15973
0x0e0f, //  он   22373
0x0e1c, //  ын   15052
0x0f03, //  во   24947
0x0f11, //  ро   13552
0x0f12, //  со   16368
0x100f, //  оп   19054
0x1011, //  рп   17067
0x1101, //  ар   23967
0x1106, //  ер   18795
0x1109, //  ир   13797
0x110f, //  ор   21737
0x1213, //  тс   25076
0x1220, //  яс   14310
0x7fff};  // 0x7fff presumably marks the end of the list - verify against the reader
// Pairs not included in the table:
//0x040f  ог   12976
//0x1306  ет   12826
//0x0f0d  мо   12688



// Character replacement list, installed as langopts.replace_chars for
// Croatian, Bosnian and Serbian in SelectTranslator().
// The entries are pairs: a Cyrillic Unicode code point followed by its Latin
// replacement.  Where the replacement is two letters, the first letter is in
// the low 16 bits and the second letter is in the high 16 bits
// (e.g. 'l'+('j'<<16)).  The list ends with a single 0.
static const unsigned int replace_cyrillic_latin[] = 
	{0x430,'a',
	0x431,'b',
	0x446,'c',
	0x45b,0x107,
	0x447,0x10d,
	0x45f,'d'+(0x17e<<16),
	0x455,'d'+('z'<<16),
	0x434,'d',
	0x452,0x111,
	0x435,'e',
	0x444,'f',
	0x433,'g',
	0x445,'h',
	0x438,'i',
	0x458,'j',
	0x43a,'k',
	0x459,'l'+('j'<<16),
	0x43b,'l',
	0x43c,'m',
	0x45a,'n'+('j'<<16),
	0x43d,'n',
	0x43e,'o',
	0x43f,'p',
	0x440,'r',
	0x441,'s',
	0x448,0x161,
	0x442,'t',
	0x443,'u',
	0x432,'v',
	0x437,'z',
	0x436,0x17e,
	0x453,0x111,
	0x45c,0x107,
0};  // end of list.  The table also covers the letters ѓ (0x453), ѕ (0x455) and ќ (0x45c)

static void SetCyrillicLetters(Translator *tr)
{
	// Configure a translator for a Cyrillic alphabet: 8-bit charset, the
	// transpose range, the frequent-pairs table and the letter groups.
	// All letter codes in the lists below are offsets from 0x420 (OFFSET_CYRILLIC)
	// and every list is terminated by 0.
	static const char vowels[] = {
		0x10,0x15,0x31,0x18,0x1e,0x23,0x2b,0x2d,0x2e,0x2f,0};
	static const char consonants[] = {
		0x11,0x12,0x13,0x14,0x16,0x17,0x19,0x1a,0x1b,0x1c,0x1d,0x1f,
		0x20,0x21,0x22,0x24,0x25,0x26,0x27,0x28,0x29,0x2a,0x2c,0};
	static const char soft[] = {
		0x2c,0x19,0x27,0x29,0};            // letter group B  [k ts; s;]
	static const char hard[] = {
		0x2a,0x16,0x26,0x28,0};            // letter group H  [S Z ts]
	static const char not_hard[] = {
		0x11,0x12,0x13,0x14,0x17,0x19,0x1a,0x1b,0x1c,0x1d,0x1f,
		0x20,0x21,0x22,0x24,0x25,0x27,0x29,0x2c,0};
	static const char voiced[] = {
		0x11,0x12,0x13,0x14,0x16,0x17,0};  // letter group G  (voiced obstruents)
	static const char iotated[] = {
		0x2c,0x2e,0x2f,0x31,0};            // letter group Y  (iotated vowels & soft-sign)

	tr->charset_a0 = charsets[18];   // KOI8-R

	// Cyrillic letters 0x430..0x451 are transposed into the range 0x01 to 0x22
	tr->transpose_min = 0x430;
	tr->transpose_max = 0x451;
	tr->frequent_pairs = pairs_ru;

	// Discard the Latin letter groups and install the Cyrillic ones
	tr->letter_bits_offset = OFFSET_CYRILLIC;
	memset(tr->letter_bits, 0, sizeof(tr->letter_bits));

	SetLetterBits(tr, LETTERGP_A, vowels);
	SetLetterBits(tr, 1, soft);
	SetLetterBits(tr, 2, consonants);
	SetLetterBits(tr, 3, hard);
	SetLetterBits(tr, 4, not_hard);
	SetLetterBits(tr, 5, voiced);
	SetLetterBits(tr, 6, iotated);
	SetLetterBits(tr, LETTERGP_VOWEL2, vowels);
}  // end of SetCyrillicLetters


void SetIndicLetters(Translator *tr)
{//=================================
	// Set letter types for Indic scripts: Devanagari, Tamil, etc.
	//
	// tr->letter_bits_offset must already be set to the start of the script's
	// Unicode page before this is called; the letter codes used here are offsets
	// from that value.  All existing letter groups are cleared first.

	// Additional consonants outside the main consonant range.
	// The list MUST end with 0: SetLetterBits() scans until it reads a 0 byte,
	// so without the terminator it would read past the end of this array.
	static const char dev_consonants2[] = {0x02,0x03,0x58,0x59,0x5a,0x5b,0x5c,0x5d,0x5e,0x5f,0};

	memset(tr->letter_bits,0,sizeof(tr->letter_bits));
	SetLetterBitsRange(tr,LETTERGP_A,0x04,0x14);   // vowel letters
	SetLetterBitsRange(tr,LETTERGP_A,0x3e,0x4d);   // + vowel signs, and virama

	SetLetterBitsRange(tr,LETTERGP_B,0x3e,0x4d);   // vowel signs, and virama

	SetLetterBitsRange(tr,LETTERGP_C,0x15,0x39);   // the main consonant range
	SetLetterBits(tr,LETTERGP_C,dev_consonants2);  // + additional consonants

	SetLetterBitsRange(tr,LETTERGP_Y,0x04,0x14);   // vowel letters
	SetLetterBitsRange(tr,LETTERGP_Y,0x3e,0x4c);   // + vowel signs

	tr->langopts.param[LOPT_UNPRONOUNCABLE] = 1;   // disable check for unpronouncable words
	tr->langopts.suffix_add_e = tr->letter_bits_offset + 0x4d;   // virama
}


void SetupTranslator(Translator *tr, const short *lengths, const unsigned char *amps)
{
	// Replace the translator's stress length and/or stress amplitude tables.
	// A NULL argument leaves the corresponding table unchanged.  Each source
	// array must provide at least as many bytes as the table it overwrites.
	if(lengths)
	{
		memcpy(tr->stress_lengths, lengths, sizeof(tr->stress_lengths));
	}

	if(amps)
	{
		memcpy(tr->stress_amps, amps, sizeof(tr->stress_amps));
	}
}


Translator *SelectTranslator(const char *name)
{//===========================================
	int name2 = 0;
	Translator *tr;

	static const unsigned char stress_amps_sk[8] = {17,17, 20,20, 20,22, 22,21 };
	static const short stress_lengths_sk[8] = {190,190, 210,210, 0,0, 210,210};

	// convert name string into a word of up to 4 characters, for the switch()
	while(*name != 0)
		name2 = (name2 << 8) + *name++;

	tr = NewTranslator();

	switch(name2)
	{
	case L('a','f'):
		{
			static const short stress_lengths_af[8] = {170,140, 220,220,  0, 0, 250,270};
			SetupTranslator(tr,stress_lengths_af,NULL);

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.vowel_pause = 0x30;
			tr->langopts.param[LOPT_DIERESES] = 1;
			tr->langopts.param[LOPT_PREFIXES] = 1;
			SetLetterVowel(tr,'y');  // add 'y' to vowels
		
			tr->langopts.numbers = NUM_SWAP_TENS | NUM_HUNDRED_AND | NUM_SINGLE_AND | NUM_ROMAN | NUM_1900;
			tr->langopts.accents = 1;
		}
		break;

	case L('a','r'):   // Arabic
			tr->letter_bits_offset = OFFSET_ARABIC;
			tr->langopts.param[LOPT_UNPRONOUNCABLE] = 1;   // disable check for unpronouncable words
		break;

	case L('b','g'):  //Bulgarian
		{
			SetCyrillicLetters(tr);
			SetLetterVowel(tr,0x2a);
			tr->langopts.param[LOPT_UNPRONOUNCABLE] = 0x432;    // [v]  don't count this character at start of word
			tr->langopts.param[LOPT_REGRESSIVE_VOICING] = 0x10;  // devoice at end of word
			tr->langopts.param[LOPT_REDUCE] = 2;
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_ALLOW_SPACE | NUM_OMIT_1_HUNDRED | NUM_HUNDRED_AND | NUM_AND_UNITS | NUM_SINGLE_AND | NUM_ROMAN | NUM_ROMAN_ORDINAL | NUM_ROMAN_CAPITALS ;
			tr->langopts.thousands_sep = ' ';   // don't allow dot as thousands separator
		}
		break;

	case L('b','n'):  // Bengali
		{
			static const short stress_lengths_bn[8] = {180, 180,  210, 210,  0, 0,  230, 240};
			static const unsigned char stress_amps_bn[8] = {18,18, 18,18, 20,20, 22,22 };

			SetupTranslator(tr,stress_lengths_bn,stress_amps_bn);
			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.stress_flags =  0x10004;   // use 'diminished' for unstressed final syllable
			tr->letter_bits_offset = OFFSET_BENGALI;
			SetIndicLetters(tr);   // call this after setting OFFSET_BENGALI
			SetLetterBitsRange(tr,LETTERGP_F,0x3e,0x4c);   // vowel signs, but not virama

			tr->langopts.numbers = 0x1;
			tr->langopts.break_numbers = 0x24924aa8;  // for languages which have numbers for 100,000 and 100,00,000, eg Hindi
		}
		break;

	case L('c','y'):   // Welsh
		{
			static const short stress_lengths_cy[8] = {170,220, 180,180, 0, 0, 250,270};
			static const unsigned char stress_amps_cy[8] = {17,15, 18,18, 0,0, 22,20 };    // 'diminished' is used to mark a quieter, final unstressed syllable

			SetupTranslator(tr,stress_lengths_cy,stress_amps_cy);

			tr->charset_a0 = charsets[14];   // ISO-8859-14
//			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable
			tr->langopts.stress_rule = STRESSPOSN_2R;
//			tr->langopts.intonation_group = 4;

			// 'diminished' is an unstressed final syllable
			tr->langopts.stress_flags =  0x6 | 0x10; 
			tr->langopts.unstressed_wd1 = 0;
			tr->langopts.unstressed_wd2 = 2;
			tr->langopts.param[LOPT_SONORANT_MIN] = 120;  // limit the shortening of sonorants before short vowels

			tr->langopts.numbers = NUM_OMIT_1_HUNDRED;

			SetLetterVowel(tr,'w');  // add letter to vowels and remove from consonants
			SetLetterVowel(tr,'y');
		}
		break;

	case L('d','a'):  // Danish
		{
			static const short stress_lengths_da[8] = {160,140, 200,200, 0,0, 220,230};
			SetupTranslator(tr,stress_lengths_da,NULL);

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.param[LOPT_PREFIXES] = 1;
			SetLetterVowel(tr,'y');
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_SWAP_TENS | NUM_HUNDRED_AND | NUM_OMIT_1_HUNDRED | NUM_ORDINAL_DOT | NUM_1900 | NUM_ROMAN | NUM_ROMAN_CAPITALS | NUM_ROMAN_ORDINAL;
		}
		break;


	case L('d','e'):
		{
			static const short stress_lengths_de[8] = {150,130, 200,200,  0, 0, 250,260};
			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.word_gap = 0x8;   // don't use linking phonemes
			tr->langopts.vowel_pause = 0x30;
			tr->langopts.param[LOPT_PREFIXES] = 1;
			tr->langopts.param[LOPT_REGRESSIVE_VOICING] = 0x10;  // devoice at end of word
			tr->langopts.param[LOPT_LONG_VOWEL_THRESHOLD] = 175/2;
			memcpy(tr->stress_lengths,stress_lengths_de,sizeof(tr->stress_lengths));
		
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_SWAP_TENS | NUM_OMIT_1_HUNDRED | NUM_OMIT_1_THOUSAND | NUM_ALLOW_SPACE | NUM_ORDINAL_DOT | NUM_ROMAN;
			SetLetterVowel(tr,'y');
			tr->langopts.param[LOPT_UNPRONOUNCABLE] = 2;   // use de_rules for unpronouncable rules
		}
		break;

	case L('e','n'):
		{
			static const short stress_lengths_en[8] = {182,140, 220,220, 0,0, 248,275};
			SetupTranslator(tr,stress_lengths_en,NULL);

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.stress_flags = 0x08;
			tr->langopts.numbers = NUM_HUNDRED_AND | NUM_ROMAN | NUM_1900;
			tr->langopts.param[LOPT_COMBINE_WORDS] = 2;       // allow "mc" to cmbine with the following word
			tr->langopts.suffix_add_e = 'e';
			tr->langopts.param[LOPT_UNPRONOUNCABLE] = 2;   // use en_rules for unpronouncable rules
			SetLetterBits(tr,6,"aeiouy");  // Group Y: vowels, including y
		}
		break;

	case L('e','l'):   // Greek
	case L_grc:        // Ancient Greek
		{
			static const short stress_lengths_el[8] = {155, 180,  210, 210,  0, 0,  270, 300};
			static const unsigned char stress_amps_el[8] = {15,12, 20,20, 20,22, 22,21 };    // 'diminished' is used to mark a quieter, final unstressed syllable

			// character codes offset by 0x380
			static const char el_vowels[] = {0x10,0x2c,0x2d,0x2e,0x2f,0x30,0x31,0x35,0x37,0x39,0x3f,0x45,0x49,0x4a,0x4b,0x4c,0x4d,0x4e,0x4f,0};
			static const char el_fvowels[] = {0x2d,0x2e,0x2f,0x35,0x37,0x39,0x45,0x4d,0}; // ε η ι υ  έ ή ί ύ
			static const char el_voiceless[]= {0x38,0x3a,0x3e,0x40,0x42,0x43,0x44,0x46,0x47,0};  // θ κ ξ π ς σ τ φ χ 
			static const char el_consonants[]={0x32,0x33,0x34,0x36,0x38,0x3a,0x3b,0x3c,0x3d,0x3e,0x40,0x41,0x42,0x43,0x44,0x46,0x47,0x48,0};
			static const wchar_t el_char_apostrophe[] = {0x3c3,0};  // σ

			SetupTranslator(tr,stress_lengths_el,stress_amps_el);

			tr->charset_a0 = charsets[7];   // ISO-8859-7
			tr->char_plus_apostrophe = el_char_apostrophe;

			tr->letter_bits_offset = OFFSET_GREEK;
			memset(tr->letter_bits,0,sizeof(tr->letter_bits));
			SetLetterBits(tr,LETTERGP_A,el_vowels);
			SetLetterBits(tr,LETTERGP_VOWEL2,el_vowels);
			SetLetterBits(tr,LETTERGP_B,el_voiceless);
			SetLetterBits(tr,LETTERGP_C,el_consonants);
			SetLetterBits(tr,LETTERGP_Y,el_fvowels);    // front vowels: ε η ι υ

			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.stress_flags = 0x6;  // mark unstressed final syllables as diminished
			tr->langopts.unstressed_wd1 = 0;
			tr->langopts.unstressed_wd2 = 2;
			tr->langopts.param[LOPT_SONORANT_MIN] = 130;  // limit the shortening of sonorants before short vowels

			tr->langopts.numbers = NUM_SINGLE_STRESS | NUM_DECIMAL_COMMA; 
			tr->langopts.numbers2 = 0x2;   // variant form of numbers before thousands

			if(name2 == L_grc)
			{
				// ancient greek
				tr->langopts.param[LOPT_UNPRONOUNCABLE] = 1;
			}
		}
		break;

	case L('e','o'):
		{
			static const short stress_lengths_eo[8] = {145, 145,  230, 170,    0,   0,  360, 370};
			static const unsigned char stress_amps_eo[] = {16,14, 20,20, 20,22, 22,21 };
			static const wchar_t eo_char_apostrophe[2] = {'l',0};
		
			SetupTranslator(tr,stress_lengths_eo,stress_amps_eo);

			tr->charset_a0 = charsets[3];  // ISO-8859-3
			tr->char_plus_apostrophe = eo_char_apostrophe;

			tr->langopts.word_gap = 1;
			tr->langopts.vowel_pause = 2;
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.stress_flags =  0x6 | 0x10; 
			tr->langopts.unstressed_wd1 = 3;
			tr->langopts.unstressed_wd2 = 2;

			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_OMIT_1_HUNDRED | NUM_ALLOW_SPACE | NUM_ROMAN;
		}
		break;

	case L('e','s'):   // Spanish
	case L('c','a'):   // Catalan
	case L_pap:        // Papiamento
		{
			static const short stress_lengths_es[8] = {180, 210,  190, 190,  0, 0,  230, 260};
//			static const short stress_lengths_es[8] = {170, 200,  180, 180,  0, 0,  220, 250};
			static const unsigned char stress_amps_es[8] = {16,12, 18,18, 20,20, 20,20 };    // 'diminished' is used to mark a quieter, final unstressed syllable
			static const wchar_t ca_punct_within_word[] = {'\'',0xb7,0};   // ca: allow middle-dot within word

			SetupTranslator(tr,stress_lengths_es,stress_amps_es);

			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable
			tr->langopts.stress_rule = STRESSPOSN_2R;

			// stress last syllable if it doesn't end in vowel or "s" or "n"
			// 'diminished' is an unstressed final syllable
			tr->langopts.stress_flags = 0x200 | 0x6 | 0x10; 
			tr->langopts.unstressed_wd1 = 0;
			tr->langopts.unstressed_wd2 = 2;
			tr->langopts.param[LOPT_SONORANT_MIN] = 120;  // limit the shortening of sonorants before short vowels

			tr->langopts.numbers = NUM_SINGLE_STRESS | NUM_DECIMAL_COMMA | NUM_AND_UNITS | NUM_OMIT_1_HUNDRED | NUM_OMIT_1_THOUSAND | NUM_ROMAN | NUM_ROMAN_AFTER;

			if(name2 == L('c','a'))
			{
				tr->punct_within_word = ca_punct_within_word;
				tr->langopts.stress_flags = 0x200 | 0x6 | 0x30;  // stress last syllable unless word ends with a vowel
			}
			else
			if(name2 == L_pap)
			{
				tr->langopts.stress_flags = 0x100 | 0x6 | 0x30;  // stress last syllable unless word ends with a vowel
			}
			else
			{
				tr->langopts.param[LOPT_UNPRONOUNCABLE] = 2;   // use es_rules for unpronouncable rules
			}
		}
		break;


	case L('e','u'):  // basque
		{
			static const short stress_lengths_eu[8] = {200, 200,  200, 200,  0, 0,  210, 230};  // very weak stress
			static const unsigned char stress_amps_eu[8] = {16,16, 18,18, 18,18, 18,18 };
			SetupTranslator(tr,stress_lengths_eu,stress_amps_eu);
			tr->langopts.stress_rule = STRESSPOSN_2L;  // ?? second syllable ??
			tr->langopts.numbers = NUM_SINGLE_STRESS | NUM_DECIMAL_COMMA | NUM_AND_UNITS | NUM_HUNDRED_AND | NUM_OMIT_1_HUNDRED | NUM_VIGESIMAL;
		}
		break;


	case L('f','a'):   // Farsi
		{
			tr->letter_bits_offset = OFFSET_ARABIC;
			tr->langopts.numbers = NUM_AND_UNITS | NUM_HUNDRED_AND;
			tr->langopts.param[LOPT_UNPRONOUNCABLE] = 1;   // disable check for unpronouncable words
		}
		break;


	case L('f','i'):   // Finnish
		{
			static const unsigned char stress_amps_fi[8] = {18,16, 22,22, 20,22, 22,22 };
			static const short stress_lengths_fi[8] = {150,180, 200,200, 0,0, 210,250};

			SetupTranslator(tr,stress_lengths_fi,stress_amps_fi);

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.stress_flags = 0x56;  // move secondary stress from light to a following heavy syllable
			tr->langopts.param[LOPT_IT_DOUBLING] = 1;
			tr->langopts.long_stop = 130;

			tr->langopts.numbers = NUM_DECIMAL_COMMA + NUM_ALLOW_SPACE;
			SetLetterVowel(tr,'y');
//			tr->langopts.max_initial_consonants = 2;  // BUT foreign words may have 3
			tr->langopts.spelling_stress = 1;
			tr->langopts.intonation_group = 3;  // less intonation, don't raise pitch at comma
		}
		break;

	case L('f','r'):  // french
		{
			static const short stress_lengths_fr[8] = {190, 170,  190, 200,  0, 0,  190, 240};
			static const unsigned char stress_amps_fr[8] = {18,16, 20,20, 20,22, 18,18 };

			SetupTranslator(tr,stress_lengths_fr,stress_amps_fr);
			tr->langopts.stress_rule = STRESSPOSN_1R;      // stress on final syllable
			tr->langopts.stress_flags = 0x0024;  // don't use secondary stress
			tr->langopts.param[LOPT_IT_LENGTHEN] = 1;    // remove lengthen indicator from unstressed syllables
			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable
			tr->langopts.accents = 2;   // Say "Capital" after the letter.
			tr->langopts.vowel_pause = 0;

			tr->langopts.numbers = NUM_SINGLE_STRESS | NUM_DECIMAL_COMMA | NUM_ALLOW_SPACE | NUM_OMIT_1_HUNDRED | NUM_NOPAUSE | NUM_ROMAN | NUM_ROMAN_CAPITALS | NUM_ROMAN_AFTER | NUM_VIGESIMAL | NUM_DFRACTION_4;
			SetLetterVowel(tr,'y');
		}
		break;

	case L('h','i'):    // Hindi
	case L('n','e'):    // Nepali
	case L('p','a'):    // Punjabi
		{
			static const short stress_lengths_hi[8] = {190, 190,  210, 210,  0, 0,  230, 250};
			static const unsigned char stress_amps_hi[8] = {17,14, 20,19, 20,22, 22,21 };

			SetupTranslator(tr,stress_lengths_hi,stress_amps_hi);
			tr->charset_a0 = charsets[19];   // ISCII
			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable

			tr->langopts.stress_rule = 6;      // stress on last heaviest syllable, excluding final syllable
			tr->langopts.stress_flags =  0x10004;   // use 'diminished' for unstressed final syllable
			tr->langopts.numbers = NUM_SWAP_TENS;
			tr->langopts.break_numbers = 0x14aa8;  // for languages which have numbers for 100,000 and 100,00,000, eg Hindi
			tr->letter_bits_offset = OFFSET_DEVANAGARI;

			if(name2 == L('p','a'))
			{
				tr->letter_bits_offset = OFFSET_GURMUKHI;
			}
			SetIndicLetters(tr);
		}
		break;


	case L('h','r'):   // Croatian
	case L('b','s'):   // Bosnian
	case L('s','r'):   // Serbian
		{
			static const unsigned char stress_amps_hr[8] = {17,17, 20,20, 20,22, 22,21 };
			static const short stress_lengths_hr[8] = {180,160, 200,200, 0,0, 220,230};
			static const short stress_lengths_sr[8] = {160,150, 200,200, 0,0, 250,260};

			if(name2 == L('s','r'))
				SetupTranslator(tr,stress_lengths_sr,stress_amps_hr);
			else
				SetupTranslator(tr,stress_lengths_hr,stress_amps_hr);
			tr->charset_a0 = charsets[2];   // ISO-8859-2

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.stress_flags = 0x10;  
			tr->langopts.param[LOPT_REGRESSIVE_VOICING] = 0x3;
 			tr->langopts.max_initial_consonants = 5;
			tr->langopts.spelling_stress = 1;
			tr->langopts.accents = 1;

			tr->langopts.numbers = NUM_SINGLE_STRESS | NUM_HUNDRED_AND | NUM_OMIT_1_HUNDRED | NUM_DECIMAL_COMMA | NUM_THOUS_SPACE | NUM_DFRACTION_2 | NUM_ROMAN_CAPITALS;
			tr->langopts.numbers2 = 0x4a;  // variant numbers before thousands,milliards
			tr->langopts.replace_chars = replace_cyrillic_latin;

			SetLetterVowel(tr,'y');
			SetLetterVowel(tr,'r');
		}
		break;


	case L('h','t'):  // Haitian Creole
//			static const short stress_lengths_fr[8] = {190, 170,  190, 200,  0, 0,  235, 240};
//			memcpy(tr->stress_lengths,stress_lengths_fr,sizeof(tr->stress_lengths));
			tr->langopts.stress_rule = STRESSPOSN_1R;      // stress on final syllable
			tr->langopts.stress_flags = 0x0024;  // don't use secondary stress
			tr->langopts.numbers = NUM_SINGLE_STRESS | NUM_OMIT_1_HUNDRED | NUM_NOPAUSE | NUM_ROMAN | NUM_VIGESIMAL | NUM_DFRACTION_4;
		break;


	case L('h','u'):   // Hungarian
		{
			static const unsigned char stress_amps_hu[8] = {17,17, 19,19, 20,22, 22,21 };
			static const short stress_lengths_hu[8] = {185,195, 195,190, 0,0, 210,220};

			SetupTranslator(tr,stress_lengths_hu,stress_amps_hu);
			tr->charset_a0 = charsets[2];   // ISO-8859-2

			tr->langopts.vowel_pause = 0x20;
			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.stress_flags = 0x8036 | S_HYPEN_UNSTRESS;
			tr->langopts.unstressed_wd1 = 2;
			tr->langopts.param[LOPT_IT_DOUBLING] = 1;
			tr->langopts.param[LOPT_ANNOUNCE_PUNCT] = 2;  // don't break clause before announcing . ? !

			tr->langopts.numbers = NUM_DFRACTION_5 | NUM_ALLOW_SPACE | NUM_ROMAN | NUM_ROMAN_ORDINAL | NUM_ROMAN_CAPITALS | NUM_ORDINAL_DOT | NUM_OMIT_1_HUNDRED | NUM_OMIT_1_THOUSAND;
			tr->langopts.thousands_sep = ' ';   // don't allow dot as thousands separator
			tr->langopts.decimal_sep = ',';
			tr->langopts.max_roman = 899;
			tr->langopts.min_roman = 1;
			SetLetterVowel(tr,'y');
			tr->langopts.spelling_stress = 1;
SetLengthMods(tr,3);  // all equal
		}
		break;

	case L('h','y'):   // Armenian
		{
			static const short stress_lengths_hy[8] = {250, 200,  250, 250,  0, 0,  250, 250};
			static const char hy_vowels[] = {0x31, 0x35, 0x37, 0x38, 0x3b, 0x48, 0x55, 0};
			static const char hy_consonants[] = {0x32,0x33,0x34,0x36,0x39,0x3a,0x3c,0x3d,0x3e,0x3f,
				0x40,0x41,0x42,0x43,0x44,0x45,0x46,0x47,0x49,0x4a,0x4b,0x4c,0x4d,0x4e,0x4f,0x50,0x51,0x52,0x53,0x54,0x56,0};

			SetupTranslator(tr,stress_lengths_hy,NULL);
			tr->langopts.stress_rule = STRESSPOSN_1R;  // default stress on final syllable

			tr->letter_bits_offset = OFFSET_ARMENIAN;
			memset(tr->letter_bits,0,sizeof(tr->letter_bits));
			SetLetterBits(tr,LETTERGP_A,hy_vowels);
			SetLetterBits(tr,LETTERGP_VOWEL2,hy_vowels);
			SetLetterBits(tr,LETTERGP_C,hy_consonants);
			tr->langopts.max_initial_consonants = 6;
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_OMIT_1_HUNDRED;
//	tr->langopts.param[LOPT_UNPRONOUNCABLE] = 1;   // disable check for unpronouncable words
		}
		break;

	case L('i','d'):   // Indonesian
		{
			static const short stress_lengths_id[8] = {160, 200,  180, 180,  0, 0,  220, 240};
			static const unsigned char stress_amps_id[8] = {16,18, 18,18, 20,22, 22,21 };

			SetupTranslator(tr,stress_lengths_id,stress_amps_id);
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_ALLOW_SPACE | NUM_ROMAN;
			tr->langopts.stress_flags =  0x6 | 0x10; 
			tr->langopts.accents = 2;  // "capital" after letter name
		}
		break;

	case L('i','s'):   // Icelandic
		{
			static const short stress_lengths_is[8] = {180,160, 200,200, 0,0, 240,250};
			static const wchar_t is_lettergroup_B[] = {'c','f','h','k','p','t','x',0xfe,0};  // voiceless conants, including 'þ'  ?? 's'

			SetupTranslator(tr,stress_lengths_is,NULL);
			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.stress_flags = 0x10;
			tr->langopts.param[LOPT_IT_LENGTHEN] = 0x11;    // remove lengthen indicator from unstressed vowels
			tr->langopts.param[LOPT_REDUCE] = 2;

			ResetLetterBits(tr,0x18);
			SetLetterBits(tr,4,"kpst");   // Letter group F
			SetLetterBits(tr,3,"jvr");    // Letter group H
			tr->letter_groups[1] = is_lettergroup_B;
			SetLetterVowel(tr,'y');
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_SINGLE_AND | NUM_HUNDRED_AND | NUM_AND_UNITS | NUM_1900;
			tr->langopts.numbers2 = 0x2;
		}
		break;

	case L('i','t'):   // Italian
		{
			static const short stress_lengths_it[8] = {150, 140,  170, 170,  0, 0,  300, 330};
			static const unsigned char stress_amps_it[8] = {15,14, 19,19, 20,22, 22,20 };

			SetupTranslator(tr,stress_lengths_it,stress_amps_it);

			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.stress_flags = 0x10 | 0x20000; 
			tr->langopts.vowel_pause = 1;
			tr->langopts.unstressed_wd1 = 2;
			tr->langopts.unstressed_wd2 = 2;
			tr->langopts.param[LOPT_IT_LENGTHEN] = 2;    // remove lengthen indicator from unstressed or non-penultimate syllables
			tr->langopts.param[LOPT_IT_DOUBLING] = 2;    // double the first consonant if the previous word ends in a stressed vowel
			tr->langopts.param[LOPT_SONORANT_MIN] = 130;  // limit the shortening of sonorants before short vowels
			tr->langopts.param[LOPT_REDUCE] = 1;        // reduce vowels even if phonemes are specified in it_list
			tr->langopts.param[LOPT_ALT] = 2;      // call ApplySpecialAttributes2() if a word has $alt or $alt2
			tr->langopts.numbers = NUM_SINGLE_VOWEL | NUM_OMIT_1_HUNDRED |NUM_DECIMAL_COMMA | NUM_ROMAN | NUM_DFRACTION_1;
			tr->langopts.accents = 2;   // Say "Capital" after the letter.
			SetLetterVowel(tr,'y');
		}
		break;

	case L_jbo:   // Lojban
		{
			static const short stress_lengths_jbo[8] = {145,145, 170,160, 0,0, 330,350};
			static const wchar_t jbo_punct_within_word[] = {'.',',','\'',0x2c8,0};  // allow period and comma within a word, also stress marker (from LOPT_CAPS_IN_WORD)

			SetupTranslator(tr,stress_lengths_jbo,NULL);
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.vowel_pause = 0x20c;  // pause before a word which starts with a vowel, or after a word which ends in a consonant
//			tr->langopts.word_gap = 1;
			tr->punct_within_word = jbo_punct_within_word;
			tr->langopts.param[LOPT_CAPS_IN_WORD] = 2;  // capitals indicate stressed syllables
			SetLetterVowel(tr,'y');
			tr->langopts.max_lengthmod = 368;
		}
		break;

	case L('k','o'):   // Korean, TEST
		{
			static const char ko_ivowels[] = {0x63,0x64,0x67,0x68,0x6d,0x72,0x74,0x75,0};  // y and i vowels
			static const unsigned char ko_voiced[] = {0x02,0x05,0x06,0xab,0xaf,0xb7,0xbc,0};  // voiced consonants, l,m,n,N

			tr->letter_bits_offset = OFFSET_KOREAN;
			memset(tr->letter_bits,0,sizeof(tr->letter_bits));
			SetLetterBitsRange(tr,LETTERGP_A,0x61,0x75);
			SetLetterBits(tr,LETTERGP_Y,ko_ivowels);
			SetLetterBits(tr,LETTERGP_G,(const char *)ko_voiced);

			tr->langopts.stress_rule = 8;   // ?? 1st syllable if it is heavy, else 2nd syllable
			tr->langopts.param[LOPT_UNPRONOUNCABLE] = 1;   // disable check for unpronouncable words
			tr->langopts.numbers = NUM_OMIT_1_HUNDRED;
		}
		break;

	case L('k','u'):   // Kurdish
		{
			static const unsigned char stress_amps_ku[8] = {18,18, 20,20, 20,22, 22,21 };
			static const short stress_lengths_ku[8] = {180,180, 190,180, 0,0, 230,240};

			SetupTranslator(tr,stress_lengths_ku,stress_amps_ku);
			tr->charset_a0 = charsets[9];   // ISO-8859-9 - Latin5

			tr->langopts.stress_rule = 7;   // stress on the last syllable, before any explicitly unstressed syllable

			tr->langopts.numbers = NUM_HUNDRED_AND | NUM_AND_UNITS | NUM_OMIT_1_HUNDRED | NUM_AND_HUNDRED;
			tr->langopts.max_initial_consonants = 2;
		}
		break;

	case L('l','a'):  //Latin
		{
			tr->charset_a0 = charsets[4];   // ISO-8859-4, includes a,e,i,o,u-macron
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.stress_flags = 0x20;
			tr->langopts.unstressed_wd1 = 0;
			tr->langopts.unstressed_wd2 = 2;
			tr->langopts.param[LOPT_DIERESES] = 1;
			tr->langopts.numbers = NUM_ROMAN;
			tr->langopts.max_roman = 5000;
		}
		break;

	case L('l','v'):  // latvian
		{
			static const unsigned char stress_amps_lv[8] = {17,13, 20,20, 20,22, 22,21 };
			static const short stress_lengths_lv[8] = {180,130, 210,210, 0,0, 210,210};

			SetupTranslator(tr,stress_lengths_lv,stress_amps_lv);

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.spelling_stress = 1;
			tr->charset_a0 = charsets[4];   // ISO-8859-4
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_OMIT_1_HUNDRED | NUM_DFRACTION_4 | NUM_ORDINAL_DOT;
			tr->langopts.stress_flags = 0x16 + 0x40000;
		}
		break;

	case L('m','k'):   // Macedonian
		{
			static wchar_t vowels_cyrillic[] = {0x440,  // also include 'р' [R]
				 0x430,0x435,0x438,0x439,0x43e,0x443,0x44b,0x44d,0x44e,0x44f,0x450,0x451,0x456,0x457,0x45d,0x45e,0};
			static const unsigned char stress_amps_mk[8] = {17,17, 20,20, 20,22, 22,21 };
			static const short stress_lengths_mk[8] = {180,160, 200,200, 0,0, 220,230};

			SetupTranslator(tr,stress_lengths_mk,stress_amps_mk);
			tr->charset_a0 = charsets[5];   // ISO-8859-5
			tr->letter_groups[0] = tr->letter_groups[7] = vowels_cyrillic;

			tr->langopts.stress_rule = STRESSPOSN_3R;   // antipenultimate
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_AND_UNITS | NUM_OMIT_1_HUNDRED | NUM_OMIT_1_THOUSAND | NUM_DFRACTION_2;
			tr->langopts.numbers2 = 0x8a;  // variant numbers before thousands,milliards
		}
		break;


	case L('n','l'):  // Dutch
		{
			static const short stress_lengths_nl[8] = {160,135, 210,210,  0, 0, 260,280};

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.vowel_pause = 0x30;  // ??
			tr->langopts.param[LOPT_DIERESES] = 1;
			tr->langopts.param[LOPT_PREFIXES] = 1;
			tr->langopts.param[LOPT_REGRESSIVE_VOICING] = 0x10;  // devoice at end of word
			SetLetterVowel(tr,'y');

			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_SWAP_TENS | NUM_OMIT_1_HUNDRED | NUM_ALLOW_SPACE | NUM_1900 | NUM_ORDINAL_DOT;
			tr->langopts.ordinal_indicator = "e";
			memcpy(tr->stress_lengths,stress_lengths_nl,sizeof(tr->stress_lengths));
		}
		break;

	case L('n','o'):  // Norwegian
		{
			static const short stress_lengths_no[8] = {160,140, 200,200, 0,0, 220,230};

			SetupTranslator(tr,stress_lengths_no,NULL);
			tr->langopts.stress_rule = STRESSPOSN_1L;
			SetLetterVowel(tr,'y');
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_HUNDRED_AND | NUM_ALLOW_SPACE | NUM_1900 | NUM_ORDINAL_DOT;
		}
		break;

	case L('o','m'):
		{
			static const unsigned char stress_amps_om[] = {18,15, 20,20, 20,22, 22,22 };
			static const short stress_lengths_om[8] = {200,200, 200,200, 0,0, 200,200};

			SetupTranslator(tr,stress_lengths_om,stress_amps_om);
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.stress_flags = 0x16 + 0x80000;
		}
		break;

	case L('p','l'):   // Polish
		{
			static const short stress_lengths_pl[8] = {160, 190,  175, 175,  0, 0,  200, 210};
			static const unsigned char stress_amps_pl[8] = {17,13, 19,19, 20,22, 22,21 };    // 'diminished' is used to mark a quieter, final unstressed syllable

			SetupTranslator(tr,stress_lengths_pl,stress_amps_pl);

			tr->charset_a0 = charsets[2];   // ISO-8859-2
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.stress_flags = 0x6;  // mark unstressed final syllables as diminished
			tr->langopts.param[LOPT_REGRESSIVE_VOICING] = 0x8;
 			tr->langopts.max_initial_consonants = 7; // for example: wchrzczony :)
 			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_ALLOW_SPACE | NUM_DFRACTION_2;
			tr->langopts.numbers2 = 0x40;
			tr->langopts.param[LOPT_COMBINE_WORDS] = 4 + 0x100;  // combine 'nie' (marked with $alt2) with some 1-syllable (and 2-syllable) words (marked with $alt)
			SetLetterVowel(tr,'y');
		}
		break;

	case L('p','t'):  // Portuguese
		{
			static const short stress_lengths_pt[8] = {170, 115,  210, 240,  0, 0,  260, 280};
			static const unsigned char stress_amps_pt[8] = {16,11, 19,21, 20,22, 22,21 };    // 'diminished' is used to mark a quieter, final unstressed syllable

			SetupTranslator(tr,stress_lengths_pt,stress_amps_pt);
			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable

			tr->langopts.stress_rule = STRESSPOSN_1R;        // stress on final syllable
			tr->langopts.stress_flags =  0x6 | 0x10 | 0x2000 | 0x20000; 
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_DFRACTION_2 | NUM_HUNDRED_AND | NUM_AND_UNITS | NUM_ROMAN;
			SetLetterVowel(tr,'y');
			ResetLetterBits(tr,0x2);
			SetLetterBits(tr,1,"bcdfgjkmnpqstvxz");      // B  hard consonants, excluding h,l,r,w,y
			tr->langopts.param[LOPT_ALT] = 2;      // call ApplySpecialAttributes2() if a word has $alt or $alt2
		}
		break;

	case L('r','o'):  // Romanian
		{
			static const short stress_lengths_ro[8] = {170, 170,  180, 180,  0, 0,  240, 260};
			static const unsigned char stress_amps_ro[8] = {15,13, 18,18, 20,22, 22,21 };

			SetupTranslator(tr,stress_lengths_ro,stress_amps_ro);

			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.stress_flags = 0x100 + 0x6;

			tr->charset_a0 = charsets[2];   // ISO-8859-2
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_ALLOW_SPACE | NUM_DFRACTION_3 | NUM_AND_UNITS | NUM_ROMAN;
			tr->langopts.numbers2 = 0x1e;  // variant numbers before all thousandplex
		}
		break;

	case L('r','u'):  // Russian
			Translator_Russian(tr);
		break;

	case L('r','w'):   // Kiryarwanda
		{
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.stress_flags = 0x16;
			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable

			tr->langopts.numbers = NUM_HUNDRED_AND | NUM_AND_UNITS | NUM_DFRACTION_2 | NUM_AND_HUNDRED;
			tr->langopts.numbers2 = 0x200;  // say "thousands" before its number
		}
		break;

	case L('s','k'):   // Slovak
	case L('c','s'):   // Czech
		{
			static const char *sk_voiced = "bdgjlmnrvwzaeiouy";

			SetupTranslator(tr,stress_lengths_sk,stress_amps_sk);
			tr->charset_a0 = charsets[2];   // ISO-8859-2

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.stress_flags = 0x16;  
			tr->langopts.param[LOPT_REGRESSIVE_VOICING] = 0x3;
 			tr->langopts.max_initial_consonants = 5;
			tr->langopts.spelling_stress = 1;
			tr->langopts.param[LOPT_COMBINE_WORDS] = 4;  // combine some prepositions with the following word

			tr->langopts.numbers = NUM_OMIT_1_HUNDRED | NUM_DFRACTION_2 | NUM_ROMAN;
			tr->langopts.numbers2 = 0x100;
			tr->langopts.thousands_sep = STRESSPOSN_1L;   //no thousands separator
			tr->langopts.decimal_sep = ',';

			if(name2 == L('c','s'))
			{
				tr->langopts.numbers2 = 0x108;  // variant numbers before milliards
			}

			SetLetterVowel(tr,'y');
			SetLetterVowel(tr,'r');
			ResetLetterBits(tr,0x20);
			SetLetterBits(tr,5,sk_voiced);
		}
		break;

	case L('s','l'):  // Slovenian
			tr->charset_a0 = charsets[2];   // ISO-8859-2
			tr->langopts.stress_rule = STRESSPOSN_2R;   // Temporary
			tr->langopts.stress_flags = 0x20;
			tr->langopts.param[LOPT_REGRESSIVE_VOICING] = 0x13;
			tr->langopts.numbers =  NUM_DECIMAL_COMMA | NUM_ALLOW_SPACE | NUM_SWAP_TENS | NUM_OMIT_1_HUNDRED | NUM_DFRACTION_2 | NUM_ORDINAL_DOT | NUM_ROMAN;
			tr->langopts.numbers2 = 0x100;   // plural forms of millions etc
			tr->langopts.thousands_sep = ' ';   // don't allow dot as thousands separator
			SetLetterVowel(tr,'r');
		break;

	case L('s','q'):  // Albanian
		{
			static const short stress_lengths_sq[8] = {150, 150,  180, 180,  0, 0,  300, 300};
			static const unsigned char stress_amps_sq[8] = {16,12, 16,16, 20,20, 21,19 };

			SetupTranslator(tr,stress_lengths_sq,stress_amps_sq);

			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.stress_flags =  0x16 + 0x100; 
			SetLetterVowel(tr,'y');
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_HUNDRED_AND | NUM_AND_UNITS | NUM_DFRACTION_4;
			tr->langopts.accents = 2;  // "capital" after letter name
		}
		break;


	case L('s','v'):  // Swedish
		{
			static const unsigned char stress_amps_sv[] = {16,16, 20,20, 20,22, 22,21 };
			static const short stress_lengths_sv[8] = {160,135, 220,220, 0,0, 250,280};
			SetupTranslator(tr,stress_lengths_sv,stress_amps_sv);

			tr->langopts.stress_rule = STRESSPOSN_1L;
			SetLetterVowel(tr,'y');
			tr->langopts.numbers = NUM_SINGLE_STRESS | NUM_DECIMAL_COMMA | NUM_ALLOW_SPACE | NUM_1900;
			tr->langopts.accents = 1;
		}
		break;

	case L('s','w'):  // Swahili
		{
			static const short stress_lengths_sw[8] = {160, 170,  200, 200,    0,   0,  320, 340};
			static const unsigned char stress_amps_sw[] = {16,12, 19,19, 20,22, 22,21 };

			SetupTranslator(tr,stress_lengths_sw,stress_amps_sw);
			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable

			tr->langopts.vowel_pause = 1;
			tr->langopts.stress_rule = STRESSPOSN_2R;
			tr->langopts.stress_flags =  0x6 | 0x10; 

			tr->langopts.numbers = NUM_AND_UNITS | NUM_HUNDRED_AND | NUM_SINGLE_AND | NUM_OMIT_1_HUNDRED;
			tr->langopts.break_numbers = 0x49249268;  // for languages which have numbers for 100,000 and 1,000,000
		}
		break;

	case L('t','a'):  // Tamil
	case L('m','l'):  // Malayalam
	case L('k','n'):  // Kannada
	case L('m','r'):  // Marathi
		{
			static const short stress_lengths_ta[8] = {200, 200,  210, 210,  0, 0,  230, 230};
			static const unsigned char stress_amps_ta[8] = {18,18, 18,18, 20,20, 22,22 };

			SetupTranslator(tr,stress_lengths_ta,stress_amps_ta);
			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.stress_flags =  0x10004;   // use 'diminished' for unstressed final syllable
			tr->langopts.break_numbers = 0x14a8;  // 1000, 100,000  10,000,000 

			if(name2 == L('t','a'))
			{
				tr->letter_bits_offset = OFFSET_TAMIL;
				tr->langopts.numbers =  NUM_OMIT_1_THOUSAND ;
			}
			if(name2 == L('m','r'))
			{
				tr->letter_bits_offset = OFFSET_DEVANAGARI;
			}
			else
			if(name2 == L('m','l'))
			{
				tr->letter_bits_offset = OFFSET_MALAYALAM;
			}
			else
			if(name2 == L('k','n'))
			{
				tr->letter_bits_offset = OFFSET_KANNADA;
				tr->langopts.numbers = 0x1;
			}
			tr->langopts.param[LOPT_WORD_MERGE] = 1;   // don't break vowels betwen words
			SetIndicLetters(tr);   // call this after setting OFFSET_
		}
		break;

#ifdef deleted
	case L('t','h'):  // Thai
		{
			static const short stress_lengths_th[8] = {230,150, 230,230, 230,0, 230,250};
			static const unsigned char stress_amps_th[] = {22,16, 22,22, 22,22, 22,22 };

			SetupTranslator(tr,stress_lengths_th,stress_amps_th);

			tr->langopts.stress_rule = 0;   // stress on final syllable of a "word"
			tr->langopts.stress_flags = 2;          // don't automatically set diminished stress (may be set in the intonation module)
			tr->langopts.tone_language = 1;   // Tone language, use  CalcPitches_Tone() rather than CalcPitches()
			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable
//			tr->langopts.tone_numbers = 1;   // a number after letters indicates a tone number (eg. pinyin or jyutping)
			tr->langopts.word_gap = 0x21;   // length of a final vowel is less dependent on the next consonant, don't merge consonant with next word
		}
		break;
#endif

	case L('t','r'):   // Turkish
		{
			static const unsigned char stress_amps_tr[8] = {18,16, 20,21, 20,21, 21,20 };
			static const short stress_lengths_tr[8] = {190,180, 200,230, 0,0, 240,250};

			SetupTranslator(tr,stress_lengths_tr,stress_amps_tr);
			tr->charset_a0 = charsets[9];   // ISO-8859-9 - Latin5

			tr->langopts.stress_rule = 7;   // stress on the last syllable, before any explicitly unstressed syllable
			tr->langopts.stress_flags = 0x20;  //no automatic secondary stress

			tr->langopts.numbers = NUM_SINGLE_STRESS | NUM_DECIMAL_COMMA | NUM_ALLOW_SPACE | NUM_OMIT_1_HUNDRED | NUM_OMIT_1_THOUSAND | NUM_DFRACTION_2;
			tr->langopts.max_initial_consonants = 2;
		}
		break;

	case L('u','r'):   // Urdu
			tr->letter_bits_offset = OFFSET_ARABIC;
			tr->langopts.param[LOPT_UNPRONOUNCABLE] = 1;   // disable check for unpronouncable words
			tr->langopts.numbers = NUM_SWAP_TENS;
			tr->langopts.break_numbers = 0x52a8;  // for languages which have numbers for 100,000 and 100,00,000, eg Hindi
		break;

	case L('v','i'):  // Vietnamese
		{
			static const short stress_lengths_vi[8] = {150, 150,  180, 180,  210, 230,  230, 240};
			static const unsigned char stress_amps_vi[] = {16,16, 16,16, 22,22, 22,22 };
			static wchar_t vowels_vi[] = {
				0x61, 0xe0, 0xe1, 0x1ea3, 0xe3, 0x1ea1,			// a
				0x103, 0x1eb1, 0x1eaf, 0x1eb3, 0x1eb5, 0x1eb7,	// ă
				0xe2, 0x1ea7, 0x1ea5, 0x1ea9, 0x1eab, 0x1ead,	// â
				0x65, 0xe8, 0xe9, 0x1ebb, 0x1ebd, 0x1eb9,			// e
				0xea, 0x1ec1, 0x1ebf, 0x1ec3, 0x1ec5, 0x1ec7,	// i
				0x69, 0xec, 0xed, 0x1ec9, 0x129, 0x1ecb,			// i
				0x6f, 0xf2, 0xf3, 0x1ecf, 0xf5, 0x1ecd,			// o
				0xf4, 0x1ed3, 0x1ed1, 0x1ed5, 0x1ed7, 0x1ed9, 	// ô
				0x1a1, 0x1edd, 0x1edb, 0x1edf, 0x1ee1, 0x1ee3,	// ơ
				0x75, 0xf9, 0xfa, 0x1ee7, 0x169, 0x1ee5,			// u
				0x1b0, 0x1eeb, 0x1ee9, 0x1eed, 0x1eef, 0x1ef1,	// ư
				0x79, 0x1ef3, 0xfd, 0x1ef7, 0x1ef9, 0x1e, 0 };	// y

			SetupTranslator(tr,stress_lengths_vi,stress_amps_vi);
			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable

			tr->langopts.stress_rule = STRESSPOSN_1L;
			tr->langopts.word_gap = 0x21;   // length of a final vowel is less dependent on the next consonant, don't merge consonant with next word
//			tr->langopts.vowel_pause = 4;
			tr->letter_groups[0] = tr->letter_groups[7] = vowels_vi;
			tr->langopts.tone_language = 1;   // Tone language, use  CalcPitches_Tone() rather than CalcPitches()
			tr->langopts.unstressed_wd1 = 2;
			tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_HUNDRED_AND | NUM_DFRACTION_4;

		}
		break;

	case L('z','h'):
	case L_zhy:
		{
			static const short stress_lengths_zh[8] = {230,150, 230,230, 230,0, 240,250};  // 1=tone5. end-of-sentence, 6=tone 1&4, 7=tone 2&3
			static const unsigned char stress_amps_zh[] = {22,16, 22,22, 22,22, 22,22 };

			SetupTranslator(tr,stress_lengths_zh,stress_amps_zh);

			tr->langopts.stress_rule = STRESSPOSN_1R;   // stress on final syllable of a "word"
			tr->langopts.stress_flags = 2;          // don't automatically set diminished stress (may be set in the intonation module)
			tr->langopts.vowel_pause = 0;
			tr->langopts.tone_language = 1;   // Tone language, use  CalcPitches_Tone() rather than CalcPitches()
			tr->langopts.length_mods0 = tr->langopts.length_mods;  // don't lengthen vowels in the last syllable
			tr->langopts.tone_numbers = 1;   // a number after letters indicates a tone number (eg. pinyin or jyutping)
			tr->langopts.ideographs = 1;
			tr->langopts.word_gap = 0x21;   // length of a final vowel is less dependent on the next consonant, don't merge consonant with next word
			if(name2 == L('z','h'))
			{
				tr->langopts.textmode = 1;
				tr->langopts.listx = 1;    // compile zh_listx after zh_list
			}
		}
		break;

	default:
		tr->langopts.param[LOPT_UNPRONOUNCABLE] = 1;   // disable check for unpronouncable words
		break;
	}

	tr->translator_name = name2;

	if(tr->langopts.numbers & NUM_DECIMAL_COMMA)
	{
		// use . and ; for thousands and decimal separators
		tr->langopts.thousands_sep = '.';
		tr->langopts.decimal_sep = ',';
	}
	if(tr->langopts.numbers & NUM_THOUS_SPACE)
	{
		tr->langopts.thousands_sep = 0;   // don't allow thousands separator, except space
	}

	return(tr);
}  // end of SelectTranslator



//**********************************************************************************************************




// Set up the translator 'tr' for Russian: install the stress tables, call
// SetCyrillicLetters(), then fill in the Russian language options.
static void Translator_Russian(Translator *tr)
{//===========================================
	static const short ru_lengths[8] = {150, 140, 220, 220, 0, 0, 260, 280};
	static const unsigned char ru_amps[8] = {16, 16, 18, 18, 20, 24, 24, 22};
	// add more vowels to letter group Y  (iotated vowels & soft-sign)
	static const char ru_soft_vowels[] = {0x2c, 0x15, 0x18, 0x2e, 0x2f, 0};

	SetupTranslator(tr, ru_lengths, ru_amps);
	SetCyrillicLetters(tr);
	SetLetterBits(tr, 6, ru_soft_vowels);

	// language parameters
	tr->langopts.param[LOPT_UNPRONOUNCABLE] = 0x432;    // [v]  don't count this character at start of word
	tr->langopts.param[LOPT_REGRESSIVE_VOICING] = 1;
	tr->langopts.param[LOPT_REDUCE] = 2;

	// stress placement
	tr->langopts.stress_flags = 0x0020;  // was 0x1010
	tr->langopts.stress_rule = 5;

	// numbers
	tr->langopts.numbers2 = 0xc2;  // variant numbers before thousands
	tr->langopts.numbers = NUM_DECIMAL_COMMA | NUM_OMIT_1_HUNDRED;

	// remaining options
	tr->langopts.testing = 2;
	tr->langopts.phoneme_change = 1;

}  // end of Translator_Russian



/*
typedef struct {
	int flags;
	unsigned char stress;          // stress level of this vowel
	unsigned char stress_highest;  // the highest stress level of a vowel in this word
	unsigned char n_vowels;        // number of vowels in the word
	unsigned char vowel_this;      // syllable number of this vowel (counting from 1)
	unsigned char vowel_stressed;  // syllable number of the highest stressed vowel
} CHANGEPH;
*/



#ifdef RUSSIAN2
// This is now done in the phoneme data, ph_russian

int ChangePhonemes_ru(Translator *tr, PHONEME_LIST2 *phlist, int n_ph, int index, PHONEME_TAB *ph, CHANGEPH *ch)
{//=============================================================================================================
// Called for each phoneme in the phoneme list, to allow a language to make changes.
// Applies the Russian vowel softening and reduction rules to the phoneme at phlist[index].
//
// tr      not used by this function
// phlist  the phoneme list; phlist[index-1].phcode is read and phlist[index].phcode may be rewritten
// n_ph    not used by this function (presumably the number of entries in phlist - confirm with the caller)
// index   position of the current phoneme in phlist
// ph      The current phoneme
// ch      information about the current vowel; flags, vowel_this and vowel_stressed are read
//
// Returns 0 in every case.

	#define N_VOWELS_RU   11
	// Vowels handled here. The position of a vowel in this list is its row in vowel_replace[].
	static const unsigned int vowels_ru[N_VOWELS_RU] = {'a','V','O','I',PH('I','#'),PH('E','#'),PH('E','2'),
		PH('V','#'),PH('I','3'),PH('I','2'),PH('E','3')};

	// Replacement vowel for each row, selected by 'variant' (the column).
	static const unsigned int vowel_replace[N_VOWELS_RU][6] = {
		// stressed, soft, soft-stressed, j+stressed, j+soft, j+soft-stressed
		/*0*/        {'A', 'I', PH('j','a'),         'a', 'a', 'a'},                // a   Uses 3,4,5 columns.
		/*1*/        {'A', 'V', PH('j','a'),         'a', 'V', 'a'},                // V   Uses 3,4,5 columns.
		/*2*/        {'o', '8', '8',                 'o', '8', '8'},                // O
		/*3*/        {'i', 'I', 'i',                 'a', 'I', 'a'},                // I  Uses 3,4,5 columns.
		/*4*/        {'i', PH('I','#'), 'i',         'i', PH('I','#'), 'i'},        // I#
		/*5*/        {'E', PH('E','#'), 'E',         'e', PH('E','#'), 'e'},        // E#
		/*6*/        {'E', PH('E','2'), 'E',         'e', PH('E','2'), 'e'},        // E2  Uses 3,4,5 columns.
		/*7*/        {PH('j','a'), 'V', PH('j','a'), 'A', 'V', 'A'},                // V#
		/*8*/        {PH('j','a'), 'I', PH('j','a'), 'e', 'I', 'e'},                // I3 Uses 3,4,5 columns.
		/*9*/        {'e', 'I', 'e',                 'e', 'I', 'e'},                // I2
		/*10*/       {'e', PH('E', '2'), 'e',        'e', PH('E','2'), 'e'}         // E3
	};

	int variant;
	int vowelix;
	int prestressed;
	int stressed;
	int soft;
	int after_j;
	PHONEME_TAB *prev;

	(void)tr;
	(void)n_ph;

	if(ch->flags & 8)
		return(0);    // full phoneme translation has already been given

	if(ph->type != phVOWEL)
		return(0);    // the rules below only apply to vowels

	// lookup the vowel name to get an index into the vowel_replace[] table
	for(vowelix=0; vowelix<N_VOWELS_RU; vowelix++)
	{
		if(vowels_ru[vowelix] == ph->mnemonic)
			break;
	}
	if(vowelix == N_VOWELS_RU)
		return(0);

	// The previous phoneme decides softening. There is none when this is the first
	// entry of the list, so don't read before the start of phlist in that case;
	// the vowel is then treated as neither soft nor following [j].
	prev = (index > 0) ? phoneme_tab[phlist[index-1].phcode] : NULL;
	after_j = (prev != NULL) && (prev->mnemonic == 'j');
	soft = (prev != NULL) && ((prev->phflags & phPALATAL) != 0);

	// the next vowel after this has the main stress
	prestressed = (ch->vowel_stressed == ch->vowel_this+1);
	if(prestressed)
	{
		// switch to a different row of the table for some vowels
		switch(vowelix)
		{
		case 1:   // V  -> a
			vowelix = 0;
			break;
		case 4:   // I# -> I
			vowelix = 3;
			break;
		case 6:   // E2 -> I3 after [j], otherwise E#
			vowelix = after_j ? 8 : 5;
			break;
		case 7:   // V# -> I3
			vowelix = 8;
			break;
		case 10:  // E3 -> I2
			vowelix = 9;
			break;
		default:
			break;
		}
	}

	// do we need a variant of this vowel, depending on the stress and adjacent phonemes ?
	stressed = ch->flags & 2;
	if(stressed)
		variant = soft ? 2 : 0;
	else
		variant = soft ? 1 : -1;

	if(variant >= 0)
	{
		if(after_j)
			variant += 3;   // use the "j+" columns

		phlist[index].phcode = PhonemeCode(vowel_replace[vowelix][variant]);
	}
	else
	{
		// unstressed and not soft: use the vowel of the (possibly changed) row itself
		phlist[index].phcode = PhonemeCode(vowels_ru[vowelix]);
	}

	return(0);
}

#endif

By viewing downloads associated with this article you agree to the Terms of Service and the article's licence.

If a file you wish to view isn't highlighted, and is a text file (not binary), please let us know and we'll add colourisation support for it.

License

This article, along with any associated source code and files, is licensed under The BSD License

Written By

Jozef Bozek

CEO bring-it-together s.r.o.

Slovakia

Jozef Božek is currently a software engineer at bring-it-together s.r.o. in the area of large-scale information systems and mobile application development.
He has been developing in C++ nearly full time since 2000, in Java since 2004 and in Objective-C since 2009. He programs using the Java EE SDK, iOS SDK, COM/DCOM, MFC, ATL, STL and so on :)

ESpeakEngine - Objective-C speech synthesizer

License

Comments and Discussions