<?xml version="1.0" encoding="UTF-8"?>
<collection xmlns="http://www.loc.gov/MARC21/slim">
 <!-- Single MARCXML bibliographic record describing one English-language
      conference paper that is available online as a PDF. -->
 <record>
  <!-- The leader and controlfield 008 are fixed-length, position-dependent
       strings: the runs of spaces inside them are data. Do not trim,
       collapse, or re-indent their content. -->
  <leader>01378naa a2200205 i 4500</leader>
  <controlfield tag="001">acta58962</controlfield>
  <controlfield tag="005">20260224081030.0</controlfield>
  <controlfield tag="008">190701s2016    hu      o     100   eng d</controlfield>
  <!-- ISBN -->
  <datafield tag="020" ind1=" " ind2=" ">
   <subfield code="a">978-963-306-450-4</subfield>
  </datafield>
  <!-- Cataloguing source; the language of cataloguing is Hungarian. -->
  <datafield tag="040" ind1=" " ind2=" ">
   <subfield code="a">SZTE Egyetemi Kiadványok Repozitórium</subfield>
   <subfield code="b">hun</subfield>
  </datafield>
  <!-- Language of the text -->
  <datafield tag="041" ind1=" " ind2=" ">
   <subfield code="a">eng</subfield>
  </datafield>
  <!-- Main entry: personal name.
       NOTE(review): ind1="1" marks a surname-first heading, yet $a carries
       no comma between family name and given name. Confirm the intended
       form before changing the value. -->
  <datafield tag="100" ind1="1" ind2=" ">
   <subfield code="a">Berend Gábor</subfield>
  </datafield>
  <!-- Title statement. The value of $c no longer starts with a space: the
       padding was part of the data and produced a double space whenever the
       subfields were joined for display. -->
  <datafield tag="245" ind1="1" ind2="0">
   <subfield code="a">Utilizing word embeddings for part-of-speech tagging</subfield>
   <subfield code="h">[elektronikus dokumentum] /</subfield>
   <subfield code="c">Berend Gábor</subfield>
  </datafield>
  <!-- Publication date -->
  <datafield tag="260" ind1=" " ind2=" ">
   <subfield code="c">2016</subfield>
  </datafield>
  <!-- Extent: page range of the paper within the proceedings volume. -->
  <datafield tag="300" ind1=" " ind2=" ">
   <subfield code="a">59-67</subfield>
  </datafield>
  <!-- Series statement (not traced) and volume number. -->
  <datafield tag="490" ind1="0" ind2=" ">
   <subfield code="a">Magyar Számítógépes Nyelvészeti Konferencia</subfield>
   <subfield code="v">12</subfield>
  </datafield>
  <!-- Abstract (ind1="3"). Keep the text on a single line: line breaks or
       indentation inside the subfield would become part of the value. -->
  <datafield tag="520" ind1="3" ind2=" ">
   <subfield code="a">In this paper, we illustrate the power of distributed word representations for the part-of-speech tagging of Hungarian texts. We trained CRF models for POS-tagging that made use of features derived from the sparse coding of the word embeddings of Hungarian words as signals. We show that relying on such a representation, it is possible to avoid the creation of language specific features for achieving reliable performance. We evaluated our models on all the subsections of the Szeged Treebank both using MSD and universal morphology tag sets. Furthermore, we also report results for inter-subcorpora experiments.</subfield>
  </datafield>
  <!-- Locally defined subject heading (69X range). -->
  <datafield tag="695" ind1=" " ind2=" ">
   <subfield code="a">Nyelvészet - számítógép alkalmazása</subfield>
  </datafield>
  <!-- NOTE(review): this heading names a conference. MARC 21 reserves 711
       for meeting names, and 710 expects a non-blank first indicator.
       The tag is left unchanged here because downstream consumers may key
       on it; confirm before retagging. -->
  <datafield tag="710" ind1=" " ind2=" ">
   <subfield code="a">Magyar Számítógépes Nyelvészeti Konferencia (12.) (2016) (Szeged)</subfield>
  </datafield>
  <!-- Electronic location (HTTP, the resource itself). The value of $z no
       longer ends with a space, so the public note renders cleanly as a
       link label. -->
  <datafield tag="856" ind1="4" ind2="0">
   <subfield code="u">http://acta.bibl.u-szeged.hu/58962/1/msznykonf_012_059-067.pdf</subfield>
   <subfield code="z">Dokumentum-elérés</subfield>
  </datafield>
 </record>
</collection>
