@@ -300,7 +300,7 @@ void CGNTagger::add_tags( const vector<folia::Word*>& wv,
300300 for ( const auto & word : fd.units ){
301301 folia::KWargs u_args;
302302 u_args[" set" ] = getTagset ();
303- u_args[" class" ] = TiCC::UnicodeToUTF8 (word.tag );
303+ u_args[" class" ] = TiCC::UnicodeToUTF8 (word.tag ,_normalizer );
304304 if ( textclass != " current" ){
305305 u_args[" textclass" ] = textclass;
306306 }
@@ -312,7 +312,7 @@ void CGNTagger::add_tags( const vector<folia::Word*>& wv,
312312 }
313313 vector<UnicodeString> hv = TiCC::split_at_first_of ( word.tag , " ()" );
314314 UnicodeString head = hv[0 ];
315- u_args[" class" ] = TiCC::UnicodeToUTF8 (head);
315+ u_args[" class" ] = TiCC::UnicodeToUTF8 (head,_normalizer );
316316#pragma omp critical (foliaupdate)
317317 {
318318 postag->add_child <folia::HeadFeature>( u_args );
@@ -325,10 +325,10 @@ void CGNTagger::add_tags( const vector<folia::Word*>& wv,
325325 for ( const auto & f : feats ){
326326 folia::KWargs f_args;
327327 f_args[" set" ] = getTagset ();
328- f_args[" subset" ] = getSubSet ( TiCC::UnicodeToUTF8 (f),
329- TiCC::UnicodeToUTF8 (head),
330- TiCC::UnicodeToUTF8 (word.tag ) );
331- f_args[" class" ] = TiCC::UnicodeToUTF8 (f);
328+ f_args[" subset" ] = getSubSet ( TiCC::UnicodeToUTF8 (f,_normalizer ),
329+ TiCC::UnicodeToUTF8 (head,_normalizer ),
330+ TiCC::UnicodeToUTF8 (word.tag ,_normalizer ) );
331+ f_args[" class" ] = TiCC::UnicodeToUTF8 (f,_normalizer );
332332#pragma omp critical (foliaupdate)
333333 {
334334 postag->add_child <folia::Feature>( f_args );
0 commit comments