@@ -242,8 +242,9 @@ ostream& operator<<( ostream& os, const Status& st ){
242242
243243BracketLeaf::BracketLeaf ( const RulePart& p,
244244 int debug_flag,
245- TiCC::LogStream& l ):
246- BaseBracket(p.ResultClass, p.RightHand, debug_flag, l ),
245+ TiCC::LogStream& l,
246+ TiCC::UnicodeNormalizer& norm ):
247+ BaseBracket(p.ResultClass, p.RightHand, debug_flag, l, norm ),
247248 _glue(false ),
248249 _morph(p.morpheme )
249250{
@@ -300,8 +301,9 @@ BracketLeaf::BracketLeaf( const RulePart& p,
300301BracketLeaf::BracketLeaf ( CLEX::Type t,
301302 const icu::UnicodeString& morpheme,
302303 int debug_flag,
303- TiCC::LogStream& l ):
304- BaseBracket( t, vector<CLEX::Type>(), debug_flag, l ),
304+ TiCC::LogStream& l,
305+ TiCC::UnicodeNormalizer& norm ):
306+ BaseBracket( t, vector<CLEX::Type>(), debug_flag, l, norm ),
305307 _glue(false ),
306308 _orig( toUnicodeString( t ) ),
307309 _morph( morpheme )
@@ -320,8 +322,9 @@ BracketLeaf::BracketLeaf( CLEX::Type t,
320322BracketNest::BracketNest ( CLEX::Type t,
321323 Compound::Type c,
322324 int debug_flag,
323- TiCC::LogStream& l ):
324- BaseBracket( t, debug_flag, l ),
325+ TiCC::LogStream& l,
326+ TiCC::UnicodeNormalizer& norm ):
327+ BaseBracket( t, debug_flag, l, norm ),
325328 _compound( c )
326329{
327330 // / create a BracketNest object from a CLEX::Type and a CompoundType
@@ -799,7 +802,6 @@ folia::Morpheme *BracketLeaf::createMorpheme( folia::Document *doc,
799802 */
800803 folia::Morpheme *result = 0 ;
801804 desc.remove ();
802- TiCC::UnicodeNormalizer UN;
803805 int pos = _orig.indexOf ( " ^" );
804806 bool glue = ( pos != -1 );
805807 string m_class = toString ( _status );
@@ -862,22 +864,22 @@ folia::Morpheme *BracketLeaf::createMorpheme( folia::Document *doc,
862864 args[" set" ] = Mbma::clex_tagset;
863865 if ( glue ){
864866 UnicodeString next_tag = _orig[pos+1 ];
865- args[" class" ] = TiCC::UnicodeToUTF8 (next_tag,UN );
867+ args[" class" ] = TiCC::UnicodeToUTF8 (next_tag,_normalizer );
866868 desc = " [" + _morph + " ]" + CLEX::get_tag_descr ( CLEX::toCLEX (next_tag) );
867869 // spread the word upwards!
868870 }
869871 else {
870- args[" class" ] = TiCC::UnicodeToUTF8 (toString (tag ()), UN );
872+ args[" class" ] = TiCC::UnicodeToUTF8 (toString (tag ()), _normalizer );
871873 desc = " [" + _morph + " ]" + CLEX::get_tag_descr ( tag () );
872874 // spread the word upwards!
873875 folia::KWargs fargs;
874876 fargs[" subset" ] = " structure" ;
875877 if ( tag () == CLEX::SPEC
876878 || tag () == CLEX::LET ){
877- fargs[" class" ] = TiCC::UnicodeToUTF8 (" [" + _morph + " ]" ,UN );
879+ fargs[" class" ] = TiCC::UnicodeToUTF8 (" [" + _morph + " ]" ,_normalizer );
878880 }
879881 else {
880- fargs[" class" ] = TiCC::UnicodeToUTF8 (desc,UN );
882+ fargs[" class" ] = TiCC::UnicodeToUTF8 (desc,_normalizer );
881883 }
882884#pragma omp critical (foliaupdate)
883885 {
@@ -892,7 +894,7 @@ folia::Morpheme *BracketLeaf::createMorpheme( folia::Document *doc,
892894 else if ( _status == Status::PARTICLE ){
893895 folia::KWargs args;
894896 args[" set" ] = Mbma::clex_tagset;
895- args[" class" ] = TiCC::UnicodeToUTF8 (toString ( tag () ), UN );
897+ args[" class" ] = TiCC::UnicodeToUTF8 (toString ( tag () ), _normalizer );
896898#pragma omp critical (foliaupdate)
897899 {
898900 result->addPosAnnotation ( args );
@@ -917,7 +919,7 @@ folia::Morpheme *BracketLeaf::createMorpheme( folia::Document *doc,
917919 UnicodeString d = CLEX::get_inflect_descr (inf);
918920 if ( !d.isEmpty () ){
919921 // happens sometimes when there is fawlty data
920- args[" class" ] = TiCC::UnicodeToUTF8 (d,UN );
922+ args[" class" ] = TiCC::UnicodeToUTF8 (d,_normalizer );
921923 desc += " /" + d;
922924#pragma omp critical (foliaupdate)
923925 {
@@ -946,7 +948,7 @@ folia::Morpheme *BracketLeaf::createMorpheme( folia::Document *doc,
946948 // now we add the description as a feature
947949 folia::KWargs args;
948950 args[" subset" ] = " structure" ;
949- args[" class" ] = TiCC::UnicodeToUTF8 (desc,UN );
951+ args[" class" ] = TiCC::UnicodeToUTF8 (desc,_normalizer );
950952#pragma omp critical (foliaupdate)
951953 {
952954 result->add_child <folia::Feature>( args );
@@ -979,7 +981,6 @@ folia::Morpheme *BracketNest::createMorpheme( folia::Document *doc,
979981 \param cnt a counter for the number of handled morphemes
980982 */
981983 folia::Morpheme *result = 0 ;
982- TiCC::UnicodeNormalizer UN;
983984 folia::KWargs args;
984985 args[" class" ] = " complex" ;
985986 args[" set" ] = Mbma::mbma_tagset;
@@ -1002,7 +1003,7 @@ folia::Morpheme *BracketNest::createMorpheme( folia::Document *doc,
10021003 if ( !it->original ().isEmpty () ){
10031004 args.clear ();
10041005 args[" subset" ] = " applied_rule" ;
1005- args[" class" ] = TiCC::UnicodeToUTF8 (it->original (),UN );
1006+ args[" class" ] = TiCC::UnicodeToUTF8 (it->original (),_normalizer );
10061007#pragma omp critical (foliaupdate)
10071008 {
10081009 result->add_child <folia::Feature>( args );
@@ -1024,14 +1025,14 @@ folia::Morpheme *BracketNest::createMorpheme( folia::Document *doc,
10241025 if ( desc.isEmpty () ){
10251026 desc = " XYZ" ;
10261027 }
1027- args[" class" ] = TiCC::UnicodeToUTF8 (desc,UN );
1028+ args[" class" ] = TiCC::UnicodeToUTF8 (desc,_normalizer );
10281029#pragma omp critical (foliaupdate)
10291030 {
10301031 result->add_child <folia::Feature>( args );
10311032 }
10321033 args.clear ();
10331034 args[" set" ] = Mbma::clex_tagset;
1034- args[" class" ] = TiCC::UnicodeToUTF8 (toString ( tag () ), UN );
1035+ args[" class" ] = TiCC::UnicodeToUTF8 (toString ( tag () ), _normalizer );
10351036 folia::PosAnnotation *pos = 0 ;
10361037#pragma omp critical (foliaupdate)
10371038 {
@@ -1098,7 +1099,8 @@ list<BaseBracket*>::const_iterator BracketNest::resolveAffix( list<BaseBracket*>
10981099 BracketNest *tmp = new BracketNest ( (*rpos)->tag (),
10991100 Compound::Type::NONE,
11001101 debugFlag,
1101- myLog );
1102+ myLog,
1103+ _normalizer );
11021104 for ( size_t j = 0 ; j < len; ++j ){
11031105 tmp->append ( *it );
11041106 if ( debugFlag > 5 ){
@@ -1137,7 +1139,8 @@ void BracketNest::resolveNouns( ){
11371139 if ( (*prev)->compound () == Compound::Type::NN ){
11381140 newt = Compound::Type::NNN;
11391141 }
1140- BaseBracket *tmp = new BracketNest ( CLEX::N, newt, debugFlag, myLog );
1142+ BaseBracket *tmp = new BracketNest ( CLEX::N, newt, debugFlag,
1143+ myLog, _normalizer );
11411144 tmp->append ( *prev );
11421145 tmp->append ( *it );
11431146 if ( debugFlag > 5 ){
@@ -1213,7 +1216,8 @@ list<BaseBracket*>::iterator BracketNest::glue( list<BaseBracket*>& result,
12131216 }
12141217 list<BaseBracket*>::iterator it = bit--;
12151218 BracketNest *tmp
1216- = new BracketNest ( (*rpos)->tag (), Compound::Type::NONE, debugFlag, myLog );
1219+ = new BracketNest ( (*rpos)->tag (), Compound::Type::NONE,
1220+ debugFlag, myLog, _normalizer );
12171221 for ( size_t j = 0 ; j < len-1 ; ++j ){
12181222 tmp->append ( *it );
12191223 if ( debugFlag > 5 ){
0 commit comments