<?xml version="1.0" encoding="UTF-8"?>
<collection xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.loc.gov/MARC21/slim http://www.loc.gov/standards/marcxml/schema/MARC21slim.xsd" xmlns="http://www.loc.gov/MARC21/slim">
 <record>
  <leader>00000ctm a22000004a 4500</leader>
  <controlfield tag="001">UP-99796217603116358</controlfield>
  <controlfield tag="003">Buklod</controlfield>
  <controlfield tag="005">20230503092542.0</controlfield>
  <controlfield tag="006">m    |o  d |      </controlfield>
  <controlfield tag="007">ta</controlfield>
  <controlfield tag="008">070718s2000    xx      r    |||| u|eng d</controlfield>
  <datafield tag="035" ind1=" " ind2=" ">
   <subfield code="a">(iLib)UPD-00000179802</subfield>
  </datafield>
  <datafield tag="040" ind1=" " ind2=" ">
   <subfield code="a">DENGII</subfield>
  </datafield>
  <datafield tag="090" ind1=" " ind2=" ">
   <subfield code="a">LG 993.5 2000 C65</subfield>
   <subfield code="b">B45</subfield>
  </datafield>
  <datafield tag="100" ind1="1" ind2=" ">
   <subfield code="a">Baquiran, Eric P.</subfield>
  </datafield>
  <datafield tag="245" ind1="1" ind2="0">
   <subfield code="a">The Applicability of linear predictive coding and vector quantization to Filipino speech recognition</subfield>
   <subfield code="c">Eric P. Baquiran ... [et al.].</subfield>
  </datafield>
  <datafield tag="264" ind1=" " ind2="1">
   <subfield code="c">2000.</subfield>
  </datafield>
  <datafield tag="300" ind1=" " ind2=" ">
   <subfield code="a">vi, 41 leaves</subfield>
   <subfield code="b">col. ill.</subfield>
  </datafield>
  <datafield tag="502" ind1=" " ind2=" ">
   <subfield code="a">Thesis (B.S. Computer Science)--University of the Philippines Diliman.</subfield>
  </datafield>
  <datafield tag="520" ind1=" " ind2=" ">
   <subfield code="a">This thesis examines how Linear Predictive Coding and Vector Quantization can benefit a small vocabulary, speaker independent, isolated Filipino speech recognition system. It uses a template-based approach, in which an unknown word sample is compared against a number of stored word templates to find the best match. A speaker independent isolated speech database of 10 words was created using a training set consisting of 160 training words (16 utterances per digit sample). Voices of Filipino males between the ages of 15 to 25 were recorded in low-noise environments. The samples were preprocessed using FIR filtering. Excess leading and trailing silences were then removed. Finally, each sample was linearly time warped. Individual codebooks for each digit were created using the K-means clustering algorithm applied to the spectral coefficients derived from each training word using LPC Analysis. The codebooks were then concatenated to form the global codebook. Preliminary testing showed that this approach performed with good recognition accuracy (over 85%). However, when the approach was extended to a vocabulary of 101 words (the English words for the numbers 0 to 100), accuracy fell greatly (below 15%). It is recommended that improvements be done to the quality of the training set and the preprocessing steps (endpoint detection, time warping) to increase the accuracy when applied to larger vocabularies.</subfield>
  </datafield>
  <datafield tag="650" ind1=" " ind2="0">
   <subfield code="a">Automatic speech recognition.</subfield>
  </datafield>
  <datafield tag="650" ind1=" " ind2="0">
   <subfield code="a">Speech processing systems.</subfield>
  </datafield>
  <datafield tag="650" ind1=" " ind2="0">
   <subfield code="a">Speech processing</subfield>
   <subfield code="x">Digital techniques.</subfield>
  </datafield>
  <datafield tag="650" ind1=" " ind2="0">
   <subfield code="a">Speech synthesis.</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
   <subfield code="a">Filipino speech recognition.</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
   <subfield code="a">Linear Predictive Coding and Vector Quantization.</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
   <subfield code="a">Speech recognition system.</subfield>
  </datafield>
  <datafield tag="700" ind1="1" ind2=" ">
   <subfield code="a">Belleza, Liberty Irene A.</subfield>
  </datafield>
  <datafield tag="700" ind1="1" ind2=" ">
   <subfield code="a">Catoy, Marvin N.</subfield>
  </datafield>
  <datafield tag="700" ind1="1" ind2=" ">
   <subfield code="a">Dideles, Myra Colina B.</subfield>
  </datafield>
  <datafield tag="842" ind1=" " ind2=" ">
   <subfield code="a">Thesis</subfield>
  </datafield>
  <datafield tag="905" ind1=" " ind2=" ">
   <subfield code="a">FI</subfield>
  </datafield>
  <datafield tag="905" ind1=" " ind2=" ">
   <subfield code="a">UP</subfield>
  </datafield>
  <datafield tag="852" ind1="0" ind2=" ">
   <subfield code="a">UPD</subfield>
   <subfield code="b">DENG-II</subfield>
   <subfield code="h">LG 993.5 2000 C65 B45</subfield>
  </datafield>
  <datafield tag="942" ind1=" " ind2=" ">
   <subfield code="a">Thesis</subfield>
  </datafield>
 </record>
</collection>
