<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">inform</journal-id><journal-title-group><journal-title xml:lang="ru">Информатика</journal-title><trans-title-group xml:lang="en"><trans-title>Informatics</trans-title></trans-title-group></journal-title-group><issn pub-type="ppub">1816-0301</issn><issn pub-type="epub">2617-6963</issn><publisher><publisher-name>UIIP NASB</publisher-name></publisher></journal-meta><article-meta><article-id custom-type="elpub" pub-id-type="custom">inform-597</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>ОБРАБОТКА СИГНАЛОВ, ИЗОБРАЖЕНИЙ, РЕЧИ, ТЕКСТА И РАСПОЗНАВАНИЕ ОБРАЗОВ</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>SIGNAL, IMAGE, SPEECH, TEXT PROCESSING AND PATTERN RECOGNITION</subject></subj-group></article-categories><title-group><article-title>СИСТЕМА АУДИОВИЗУАЛЬНОГО СИНТЕЗА РУССКОЙ РЕЧИ</article-title><trans-title-group xml:lang="en"><trans-title></trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Лобанов</surname><given-names>Б. М.</given-names></name></name-alternatives><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Цирульник</surname><given-names>Л. 
И.</given-names></name></name-alternatives><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Железны</surname><given-names>М.</given-names></name></name-alternatives><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Крноул</surname><given-names>З.</given-names></name></name-alternatives><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Ронжин</surname><given-names>А.</given-names></name></name-alternatives><xref ref-type="aff" rid="aff-3"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Карпов</surname><given-names>А.</given-names></name></name-alternatives><xref ref-type="aff" rid="aff-3"/></contrib></contrib-group><aff xml:lang="ru" id="aff-1"><institution>Объединенный институт проблем информатики НАН Беларуси</institution><country>Belarus</country></aff><aff xml:lang="ru" id="aff-2"><institution>University of West Bohemia in Pilsen</institution><country>Czech Republic</country></aff><aff xml:lang="ru" id="aff-3"><institution>Санкт-Петербургский институт информатики и автоматизации РАН</institution><country>Russian Federation</country></aff><pub-date pub-type="collection"><year>2008</year></pub-date><pub-date pub-type="epub"><day>09</day><month>11</month><year>2018</year></pub-date><volume>0</volume><issue>4(20)</issue><fpage>67</fpage><lpage>78</lpage><permissions><copyright-statement>Copyright © Лобанов Б.М., Цирульник Л.И., Железны М., Крноул З., Ронжин А., Карпов А., 2018</copyright-statement><copyright-year>2018</copyright-year><copyright-holder xml:lang="ru">Лобанов Б.М., Цирульник Л.И., Железны М., Крноул З., Ронжин А., Карпов 
А.</copyright-holder><copyright-holder xml:lang="en">Лобанов Б.М., Цирульник Л.И., Железны М., Крноул З., Ронжин А., Карпов А.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://inf.grid.by/jour/article/view/597">https://inf.grid.by/jour/article/view/597</self-uri><abstract><p>Описываются имитационная и компиляционная модели аудиовизуального синтеза русской речи и созданный на их основе аудиовизуальный синтезатор речи. Рассматриваются преимущества и недостатки каждой из моделей, а также особенности их построения для русской речи.</p></abstract></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Issues in Visual and Audio-Visual Speech Processing. – Cambridge : MIT Press, 2004. – 478 p.</mixed-citation><mixed-citation xml:lang="en">Issues in Visual and Audio-Visual Speech Processing. – Cambridge : MIT Press, 2004. – 478 p.</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Tekalp, A.M. Face and 2-D Mesh Animation in MPEG-4 / A.M. Tekalp, J. Ostermann // Signal Processing: Image Communication, Special Issue on MPEG-4. – 2000. – Vol. 15. – P. 387–421.</mixed-citation><mixed-citation xml:lang="en">Tekalp, A.M. Face and 2-D Mesh Animation in MPEG-4 / A.M. Tekalp, J. Ostermann // Signal Processing: Image Communication, Special Issue on MPEG-4. – 2000. – Vol. 15. – P. 
387–421.</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Animated Talking Head with Personalized 3D Head Model / L.S. Chen [et al.] // IEEE First Workshop on Multimedia Signal Processing. – 1997. – P. 274–279.</mixed-citation><mixed-citation xml:lang="en">Animated Talking Head with Personalized 3D Head Model / L.S. Chen [et al.] // IEEE First Workshop on Multimedia Signal Processing. – 1997. – P. 274–279.</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Video Rewrite: Driving Visual Speech with Audio / C. Bregler [et al.] // Proc. of 24 Int. conf. on Computer Graphics and Interactive Techniques «SIGGRAPH97». – Los Angeles, USA, 1997. – P. 353–360.</mixed-citation><mixed-citation xml:lang="en">Video Rewrite: Driving Visual Speech with Audio / C. Bregler [et al.] // Proc. of 24 Int. conf. on Computer Graphics and Interactive Techniques «SIGGRAPH97». – Los Angeles, USA, 1997. – P. 353–360.</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Cosatto, E. Photo-Realistic Talking-Heads from Image Samples / E. Cosatto, H.P. Graf // IEEE Transactions on Multimedia. – Sept. 2000. – Vol. 2. – P. 152–163.</mixed-citation><mixed-citation xml:lang="en">Cosatto, E. Photo-Realistic Talking-Heads from Image Samples / E. Cosatto, H.P. Graf // IEEE Transactions on Multimedia. – Sept. 2000. – Vol. 2. – P. 152–163.</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Лобанов, Б.М. Компьютерное клонирование персонального голоса и речи / Б.М. Лобанов // Новости искусственного интеллекта. – 2002. – № 5(55). – С. 35–39.</mixed-citation><mixed-citation xml:lang="en">Лобанов, Б.М. Компьютерное клонирование персонального голоса и речи / Б.М. 
Лобанов // Новости искусственного интеллекта. – 2002. – № 5(55). – С. 35–39.</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Lobanov, B. TTS-Synthesizer as a Computer Means for Personal Voice Cloning (On the example of Russian) / B. Lobanov, H. Karnevskaya // Phonetics and its Applications. – Stuttgart : Steiner, 2002. – P. 445–452.</mixed-citation><mixed-citation xml:lang="en">Lobanov, B. TTS-Synthesizer as a Computer Means for Personal Voice Cloning (On the example of Russian) / B. Lobanov, H. Karnevskaya // Phonetics and its Applications. – Stuttgart : Steiner, 2002. – P. 445–452.</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Лобанов, Б.М. Персональные особенности синтагматического членения речи телеведущего Ю. Сенкевича / Б.М. Лобанов, Л.И. Цирульник // Тр. Междунар. конф. «Диалог-2004». – М. : Наука, 2004. – С. 419–423.</mixed-citation><mixed-citation xml:lang="en">Лобанов, Б.М. Персональные особенности синтагматического членения речи телеведущего Ю. Сенкевича / Б.М. Лобанов, Л.И. Цирульник // Тр. Междунар. конф. «Диалог-2004». – М. : Наука, 2004. – С. 419–423.</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Lobanov, B. Phonetic-Acoustical Problems of Personal Voice Cloning by TTS / B. Lobanov, L. Tsirulnik // Proc. of 9th Int. conf. «Speech and Computer» (SPECOM’2004). – SPb. : Anatolia, 2004. – P. 17–21.</mixed-citation><mixed-citation xml:lang="en">Lobanov, B. Phonetic-Acoustical Problems of Personal Voice Cloning by TTS / B. Lobanov, L. Tsirulnik // Proc. of 9th Int. conf. «Speech and Computer» (SPECOM’2004). – SPb. : Anatolia, 2004. – P. 17–21.</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Embodied Conversational Agents / Eds. 
: J. Cassell, J. Sullivan, S. Prevost, E. Churchill. – Cambridge : MIT Press, 2000. – 420 p.</mixed-citation><mixed-citation xml:lang="en">Embodied Conversational Agents / Eds. : J. Cassell, J. Sullivan, S. Prevost, E. Churchill. – Cambridge : MIT Press, 2000. – 420 p.</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Лобанов, Б.М. Микроволновой синтез речи по тексту / Б.М. Лобанов // Анализ и синтез речи : сб. науч. тр. – Минск : Ин-т техн. кибернетики АН БССР, 1991. – С. 21–38.</mixed-citation><mixed-citation xml:lang="en">Лобанов, Б.М. Микроволновой синтез речи по тексту / Б.М. Лобанов // Анализ и синтез речи : сб. науч. тр. – Минск : Ин-т техн. кибернетики АН БССР, 1991. – С. 21–38.</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Lobanov, B. MW-Speech Synthesis from Text / B. Lobanov // Proc. of the XII International Congress of Phonetic Sciences ICPhS’91. – Aix-en-Provence, France, 1991. – P. 128–132.</mixed-citation><mixed-citation xml:lang="en">Lobanov, B. MW-Speech Synthesis from Text / B. Lobanov // Proc. of the XII International Congress of Phonetic Sciences ICPhS’91. – Aix-en-Provence, France, 1991. – P. 128–132.</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Lobanov, B. Development of Multi-Voice and Multi-Language TTS Synthesizer (languages: Belarussian, Polish, Russian) / B. Lobanov, L. Tsirulnik // Proc. of 11th Int. conf. «Speech and Computer» (SPECOM’2006). – SPb. : Anatolia, 2006. – P. 274–283.</mixed-citation><mixed-citation xml:lang="en">Lobanov, B. Development of Multi-Voice and Multi-Language TTS Synthesizer (languages: Belarussian, Polish, Russian) / B. Lobanov, L. Tsirulnik // Proc. of 11th Int. conf. «Speech and Computer» (SPECOM’2006). – SPb. : Anatolia, 2006. – P. 
274–283.</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Лобанов, Б.М. Компьютерный синтез и клонирование речи / Б.М. Лобанов, Л.И. Цирульник. – Минск : Белорусская наука, 2008. – 344 с.</mixed-citation><mixed-citation xml:lang="en">Лобанов, Б.М. Компьютерный синтез и клонирование речи / Б.М. Лобанов, Л.И. Цирульник. – Минск : Белорусская наука, 2008. – 344 с.</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">Porter, Th. Compositing Digital Images / Th. Porter, T. Duff // Computer Graphics. – July 1984. – № 18(3). – P. 253–259.</mixed-citation><mixed-citation xml:lang="en">Porter, Th. Compositing Digital Images / Th. Porter, T. Duff // Computer Graphics. – July 1984. – № 18(3). – P. 253–259.</mixed-citation></citation-alternatives></ref><ref id="cit16"><label>16</label><citation-alternatives><mixed-citation xml:lang="ru">Design, Implementation and Evaluation of the Czech Realistic Audio-Visual Speech Synthesis / M. Železný [et al.] // Signal Processing. – 2006. – № 86. – V. 12. – P. 3657–3673.</mixed-citation><mixed-citation xml:lang="en">Design, Implementation and Evaluation of the Czech Realistic Audio-Visual Speech Synthesis / M. Železný [et al.] // Signal Processing. – 2006. – № 86. – V. 12. – P. 3657–3673.</mixed-citation></citation-alternatives></ref><ref id="cit17"><label>17</label><citation-alternatives><mixed-citation xml:lang="ru">Krňoul Z. Innovations in Czech Audio-Visual Speech Synthesis for Precise Articulation / Z. Krňoul, M. Železný // Proc. of the workshop on Audio-Visual Speech Processing. – 2007. – P. 172–175.</mixed-citation><mixed-citation xml:lang="en">Krňoul Z. Innovations in Czech Audio-Visual Speech Synthesis for Precise Articulation / Z. Krňoul, M. Železný // Proc. of the workshop on Audio-Visual Speech Processing. – 2007. – P. 
172–175.</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
