machine_learning.h ソースファイル

説明を見る。
 // 
 // Copyright (c) 2003-2011, MIST Project, Nagoya University
 // All rights reserved.
 // 
 // Redistribution and use in source and binary forms, with or without modification,
 // are permitted provided that the following conditions are met:
 // 
 // 1. Redistributions of source code must retain the above copyright notice,
 // this list of conditions and the following disclaimer.
 // 
 // 2. Redistributions in binary form must reproduce the above copyright notice,
 // this list of conditions and the following disclaimer in the documentation
 // and/or other materials provided with the distribution.
 // 
 // 3. Neither the name of the Nagoya University nor the names of its contributors
 // may be used to endorse or promote products derived from this software
 // without specific prior written permission.
 // 
 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR
 // IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
 // FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 // DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
 // IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF
 // THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 // 
 
 #ifndef __INCLUDE_MACHINE_LEARNING__
 #define __INCLUDE_MACHINE_LEARNING__
 
 
 #ifndef __INCLUDE_MIST_H__
     #include "mist.h"
 #endif
 
 #ifndef __INCLUDE_MIST_RANDOM__
     #include "random.h"
 #endif
 
 
 #include <ctime>
 #include <vector>
 #include <map>
 #include <algorithm>
 
 #ifdef _OPENMP
     #include <omp.h>
 #endif
 
 
 // mist名前空間の始まり
 _MIST_BEGIN
 
 
 // Compile-time configuration constants for this header.
 // NOTE(review): none of these macros is referenced in the part of the file
 // visible here, so the per-macro notes below are inferred from the names only
 // and must be confirmed against the code that consumes them.
 #define __ASYMMETRIC_WEIGHTING__        0       // presumably enables asymmetric sample weighting when non-zero -- TODO confirm
 #define __ONE_PER_CLASS_CODE_WORD__     0       // presumably selects a one-per-class code word layout when non-zero -- TODO confirm
 #define __RANDOM_CODE_WORD__            0       // presumably selects randomly generated code words when non-zero -- TODO confirm
 #define __DEBUG_OUTPUT_LEVEL__          0       // presumably the verbosity of diagnostic output (0 looks like "silent") -- TODO confirm
 #define __NUMBER_OF_INNER_LOOPS__       10      // presumably an iteration count for an inner optimisation loop -- TODO confirm
 
 
 namespace machine_learning
 {
     // Scalar type of one feature component: the element type of `feature`
     // and the type of feature_one::value.
     typedef double feature_value_type;      
     // Scalar type of the per-sample weight stored in feature_one::weight and
     // feature::weight.
     typedef double feature_weight_type;     
 
     struct feature_one
     {
         typedef size_t size_type;           
         typedef ptrdiff_t difference_type;  
 
         feature_value_type  value;      
         bool                category;   
         feature_weight_type weight;     
 
         feature_one( ) : value( 0.0 ), category( true ), weight( 0.0 )
         {
         }
 
         feature_one( feature_value_type val, bool cate, feature_weight_type wei ) : value( val ), category( cate ), weight( wei )
         {
         }
 
         feature_one( const feature_one &f ): value( f.value ), category( f.category ), weight( f.weight )
         {
         }
 
         feature_one &operator =( const feature_one &f )
         {
             if( &f != this )
             {
                 value  = f.value;
                 category = f.category;
                 weight = f.weight;
             }
 
             return( *this );
         }
 
         bool operator <( const feature_one &f ) const
         {
             return( value < f.value );
         }
     };
 
     struct feature : public std::vector< feature_value_type >
     {
         typedef std::vector< feature_value_type > base;
         typedef base::value_type value_type;            
         typedef base::size_type size_type;              
         typedef base::difference_type difference_type;  
 
         std::string         category;   
         feature_weight_type weight;     
         bool                valid;      
 
         feature( ) : base( ), category( "unknown" ), weight( 0.0 ), valid( true )
         {
         }
 
         feature( size_type dimension ) : base( dimension ), category( "unknown" ), weight( 0.0 ), valid( true )
         {
         }
 
         feature( const std::string &cate ) : base( ), category( cate ), weight( 0.0 ), valid( true )
         {
         }
 
         feature( size_type dimension, const std::string &cate ) : base( dimension, 0.0 ), category( cate ), weight( 0.0 ), valid( true )
         {
         }
 
         feature( const feature &f ): base( f ), category( f.category ), weight( f.weight ), valid( f.valid )
         {
         }
 
         feature &operator =( const feature &f )
         {
             if( &f != this )
             {
                 base::operator =( f );
                 category = f.category;
                 weight = f.weight;
                 valid  = f.valid;
             }
 
             return( *this );
         }
     };
 
     template < class KEY, class VALUE >
     struct pair
     {
         KEY   key;
         VALUE value;
 
         pair( ){ }
 
         pair( const KEY &k, const VALUE &val ) : key( k ), value( val ){ }
 
         bool operator <( const pair &f ) const
         {
             return( key < f.key );
         }
 
         static bool greater( const pair &f1, const pair &f2 )
         {
             return( f2 < f1 );
         }
     };
 
 
 
     namespace adaboost
     {
         inline size_t __power_of_two__( size_t x )
         {
             size_t val = 1;
             for( size_t i = 0 ; i < x ; i++ )
             {
                 val *= 2;
             }
             return( val );
         }
 
         class threshold_classifier
         {
         public:
             typedef feature feature_type;
             typedef feature_type::value_type value_type;            
             typedef feature_type::size_type size_type;              
             typedef feature_type::difference_type difference_type;  
 
         private:
             double sign_;       
             double threshold_;  
             size_type index_;   
 
         public:
             threshold_classifier( ) : sign_( 1.0 ), threshold_( 0.0 ), index_( 0 )
             {
             }
 
             threshold_classifier( const threshold_classifier& w ) : sign_( w.sign_ ), threshold_( w.threshold_ ), index_( w.index_ )
             {
             }
 
             threshold_classifier& operator =( const threshold_classifier& other )
             {
                 if( this != &other )
                 {
                     sign_      = other.sign_;
                     threshold_ = other.threshold_;
                     index_     = other.index_;
                 }
 
                 return( *this );
             }
 
         public:
             template < template < typename, typename > class FEATURE_LIST, template < typename, typename > class CATEGORY_LIST, class Allocator1, class Allocator2 >
             bool learn( const FEATURE_LIST< feature_type, Allocator1 > & features, const CATEGORY_LIST< bool, Allocator2 > &categories )
             {
                 if( features.empty( ) )
                 {
                     return( false );
                 }
 
                 double _minimum_classification_error_ = 1.0e100;
 
                 // Positive と Negative それぞれの重みの合計を計算する
                 double overall_sum_of_positive_weights = 0.0;
                 double overall_sum_of_negative_weights = 0.0;
                 for( size_type i = 0 ; i < features.size( ) ; i++ )
                 {
                     const feature_type &f = features[ i ];
                     if( categories[ i ] )
                     {
                         overall_sum_of_positive_weights += f.weight;
                     }
                     else
                     {
                         overall_sum_of_negative_weights += f.weight;
                     }
                 }
 
                 if( overall_sum_of_positive_weights == 0.0 || overall_sum_of_negative_weights == 0.0 )
                 {
                     return( false );
                 }
 
                 double max_sigma = -1.0;
                 int nfeatures = static_cast< int >( features[ 0 ].size( ) );
 
                 // 特徴量のリストを作成する
                 #pragma omp parallel for firstprivate( nfeatures ) schedule( guided )
                 for( int index = 0 ; index < nfeatures ; index++ )
                 {
                     std::vector< feature_one > flist;
                     flist.reserve( features.size( ) );
                     for( size_type i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( f.valid )
                         {
                             flist.push_back( feature_one( f[ index ], categories[ i ], f.weight ) );
                         }
                     }
 
                     // 特徴量をソートする
                     std::sort( flist.begin( ), flist.end( ) );
 
                     // 各しきい値での重み付き誤差を計算し，誤差最小のしきい値を求める
                     double min_error = 1.0e100, sgn = 1.0, th = 0.0;
                     double sum_of_positive_weights = 0.0;
                     double sum_of_negative_weights = 0.0;
 
                     for( size_type i = 0 ; i < flist.size( ) ; i++ )
                     {
                         const feature_one &f = flist[ i ];
                         if( f.category )
                         {
                             sum_of_positive_weights += f.weight;
                         }
                         else
                         {
                             sum_of_negative_weights += f.weight;
                         }
 
                         double e1 = sum_of_positive_weights + overall_sum_of_negative_weights - sum_of_negative_weights;
                         double e2 = sum_of_negative_weights + overall_sum_of_positive_weights - sum_of_positive_weights;
                         double error = e1 < e2 ? e1 : e2;
 
                         if( error <= min_error )
                         {
                             min_error = error;
                             th        = f.value;
                             sgn       = e1 < e2 ? -1.0 : 1.0;
 
                             if( 0 < i && i < flist.size( ) - 2 )
                             {
                                 double v1 = std::abs( flist[ i - 1 ].value - flist[ i + 0 ].value );
                                 double v2 = std::abs( flist[ i + 1 ].value - flist[ i + 2 ].value );
                                 if( std::abs( v1 + v2 ) > 0 )
                                 {
                                     double t1 = flist[ i + 0 ].value;
                                     double t2 = flist[ i + 1 ].value;
                                     th = ( t1 * v1 + t2 * v2 ) / ( v1 + v2 );
                                 }
                             }
                             else if( i < flist.size( ) - 1 )
                             {
                                 th = ( th + flist[ i + 1 ].value ) * 0.5;
                             }
                         }
                     }
 
                     double e = 0.0;
                     for( size_t i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( f.valid )
                         {
                             if( evaluate( f, index, sgn, th ) != categories[ i ] )
                             {
                                 e += f.weight;
                             }
                         }
                     }
 
                     double sigma = 0.0;
                     {
                         double M1 = 0.0;
                         double M2 = 0.0;
                         double S1 = 0.0;
                         double S2 = 0.0;
 
                         for( size_type i = 0 ; i < flist.size( ) ; i++ )
                         {
                             const feature_type &f = features[ i ];
                             if( categories[ i ] )
                             {
                                 M1 += f.weight * f[ index ];
                             }
                             else
                             {
                                 M2 += f.weight * f[ index ];
                             }
                         }
 
                         M1 /= overall_sum_of_positive_weights;
                         M2 /= overall_sum_of_negative_weights;
 
                         for( size_type i = 0 ; i < features.size( ) ; i++ )
                         {
                             const feature_type &f = features[ i ];
                             if( categories[ i ] )
                             {
                                 S1 += f.weight * ( f[ index ] - M1 ) * ( f[ index ] - M1 );
                             }
                             else
                             {
                                 S2 += f.weight * ( f[ index ] - M2 ) * ( f[ index ] - M2 );
                             }
                         }
 
                         S1 /= overall_sum_of_positive_weights;
                         S2 /= overall_sum_of_negative_weights;
                         double V1 = overall_sum_of_positive_weights * overall_sum_of_negative_weights * ( M1 - M2 ) * ( M1 - M2 );
                         double V2 = ( overall_sum_of_positive_weights + overall_sum_of_negative_weights ) * ( overall_sum_of_positive_weights * S1 + overall_sum_of_negative_weights * S2 );
                         sigma = V1 / ( 1.0 + V2 );
                     }
 
                     #pragma omp critical
                     {
                         if( _minimum_classification_error_ > e )
                         {
                             _minimum_classification_error_ = e;
                             index_ = index;
                             sign_ = sgn;
                             threshold_ = th;
                             max_sigma = sigma;
                         }
                         else if( _minimum_classification_error_ == e && sigma > max_sigma )
                         {
                             _minimum_classification_error_ = e;
                             index_ = index;
                             sign_ = sgn;
                             threshold_ = th;
                             max_sigma = sigma;
                         }
                     }
                 }
 
                 return( true );
             }
 
         public:
             template < class FEATURE >
             bool operator ()( const FEATURE &f ) const
             {
                 return( evaluate( f ) );
             }
 
             template < class FEATURE >
             bool evaluate( const FEATURE &f ) const
             {
                 return( evaluate( f, index_, sign_, threshold_ ) );
             }
 
             template < class FEATURE >
             bool evaluate( const FEATURE &f, size_type indx, double sgn, double th ) const
             {
                 return( sgn * f[ indx ] <= sgn * th );
             }
 
             const std::string serialize( ) const
             {
                 char buff[ 1024 ];
                 sprintf( buff, "%ld,%f,%f", index_, sign_, threshold_ );
                 return( buff );
             }
 
             void deserialize( const std::string &data )
             {
                 sscanf( data.c_str( ), "%ld,%lf,%lf", &index_, &sign_, &threshold_ );
             }
         };
 
         class mahalanobis_classifier
         {
         public:
             typedef feature feature_type;
             typedef feature_type::value_type value_type;            
             typedef feature_type::size_type size_type;              
             typedef feature_type::difference_type difference_type;  
 
         private:
             double ave_[ 2 ];   
             double sig_[ 2 ];   
             size_type index_;   
 
         public:
             mahalanobis_classifier( ) : index_( 0 )
             {
                 ave_[ 0 ] = ave_[ 1 ] = 0.0;
                 sig_[ 0 ] = sig_[ 1 ] = 1.0;
             }
 
             mahalanobis_classifier( const mahalanobis_classifier& w ) : index_( w.index_ )
             {
                 memcpy( ave_, w.ave_, sizeof( double ) * 2 );
                 memcpy( sig_, w.sig_, sizeof( double ) * 2 );
             }
 
             mahalanobis_classifier& operator =( const mahalanobis_classifier& other )
             {
                 if( this != &other )
                 {
                     memcpy( ave_, other.ave_, sizeof( double ) * 2 );
                     memcpy( sig_, other.sig_, sizeof( double ) * 2 );
                     index_   = other.index_;
                 }
 
                 return( *this );
             }
 
         public:
             template < template < typename, typename > class FEATURE_LIST, template < typename, typename > class CATEGORY_LIST, class Allocator1, class Allocator2 >
             bool learn( const FEATURE_LIST< feature_type, Allocator1 > & features, const CATEGORY_LIST< bool, Allocator2 > &categories )
             {
                 if( features.empty( ) )
                 {
                     return( false );
                 }
 
                 double _minimum_classification_error_ = 1.0e100;
 
                 // Positive と Negative それぞれの重みの合計を計算する
                 double overall_sum_of_positive_weights = 0.0;
                 double overall_sum_of_negative_weights = 0.0;
                 for( size_type i = 0 ; i < features.size( ) ; i++ )
                 {
                     const feature_type &f = features[ i ];
                     if( categories[ i ] )
                     {
                         overall_sum_of_positive_weights += f.weight;
                     }
                     else
                     {
                         overall_sum_of_negative_weights += f.weight;
                     }
                 }
 
                 double max_sigma = -1.0;
                 int nfeatures = static_cast< int >( features[ 0 ].size( ) );
 
                 // 特徴量のリストを作成する
                 #pragma omp parallel for firstprivate( nfeatures ) schedule( guided )
                 for( int index = 0 ; index < nfeatures ; index++ )
                 {
                     double ave[ 2 ] = { 0.0, 0.0 };
                     double sig[ 2 ] = { 0.0, 0.0 };
 
                     for( size_type i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( categories[ i ] )
                         {
                             ave[ 0 ] += f.weight * f[ index ];
                         }
                         else
                         {
                             ave[ 1 ] += f.weight * f[ index ];
                         }
                     }
 
                     ave[ 0 ] /= overall_sum_of_positive_weights;
                     ave[ 1 ] /= overall_sum_of_negative_weights;
 
                     for( size_type i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( categories[ i ] )
                         {
                             sig[ 0 ] += f.weight * ( f[ index ] - ave[ 0 ] ) * ( f[ index ] - ave[ 0 ] );
                         }
                         else
                         {
                             sig[ 1 ] += f.weight * ( f[ index ] - ave[ 1 ] ) * ( f[ index ] - ave[ 1 ] );
                         }
                     }
 
                     sig[ 0 ] /= overall_sum_of_positive_weights;
                     sig[ 1 ] /= overall_sum_of_negative_weights;
 
                     double e = 0.0;
                     for( size_t i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( f.valid )
                         {
                             if( evaluate( f, index, ave, sig ) != categories[ i ] )
                             {
                                 e += f.weight;
                             }
                         }
                     }
 
                     double sigma = 0.0;
                     {
                         double V1 = overall_sum_of_positive_weights * overall_sum_of_negative_weights * ( ave[ 0 ] - ave[ 1 ] ) * ( ave[ 0 ] - ave[ 1 ] );
                         double V2 = ( overall_sum_of_positive_weights + overall_sum_of_negative_weights ) * ( overall_sum_of_positive_weights * sig[ 0 ] + overall_sum_of_negative_weights * sig[ 1 ] );
                         sigma = V1 / V2;
                     }
 
                     #pragma omp critical
                     {
                         if( _minimum_classification_error_ >= e && sigma > max_sigma )
                         {
                             _minimum_classification_error_ = e;
                             index_ = index;
                             memcpy( ave_, ave, sizeof( double ) * 2 );
                             memcpy( sig_, sig, sizeof( double ) * 2 );
                         }
                     }
                 }
 
                 return( true );
             }
 
         public:
             template < class FEATURE >
             bool operator ()( const FEATURE &f ) const
             {
                 return( evaluate( f ) );
             }
 
             template < class FEATURE >
             bool evaluate( const FEATURE &f ) const
             {
                 return( evaluate( f, index_, ave_, sig_ ) );
             }
 
             template < class FEATURE >
             bool evaluate( const FEATURE &f, size_type indx, const double ave[ 2 ], const double sig[ 2 ] ) const
             {
                 double v0 = f[ indx ] - ave[ 0 ];
                 double v1 = f[ indx ] - ave[ 1 ];
                 return( v0 * v0 * sig[ 1 ] <= v1 * v1 * sig[ 0 ] );
             }
 
             const std::string serialize( ) const
             {
                 char buff[ 1024 ];
                 sprintf( buff, "%ld,%f,%f,%f,%f", index_, ave_[ 0 ], ave_[ 1 ], sig_[ 0 ], sig_[ 1 ] );
                 return( buff );
             }
 
             void deserialize( const std::string &data )
             {
                 sscanf( data.c_str( ), "%ld,%lf,%lf,%lf,%lf", &index_, &ave_[ 0 ], &ave_[ 1 ], &sig_[ 0 ], &sig_[ 1 ] );
             }
         };
 
         class confidence_rating_classifier
         {
         public:
             typedef feature feature_type;
             typedef feature_type::value_type value_type;            
             typedef feature_type::size_type size_type;              
             typedef feature_type::difference_type difference_type;  
 
             _MIST_CONST( size_type, __number_of_bins__, 100 );
 
         private:
             double hist1_[ __number_of_bins__ ];    
             double hist2_[ __number_of_bins__ ];    
             double min_;    
             double max_;    
             size_type index_;   
 
         public:
             confidence_rating_classifier( ) : min_( 0 ), max_( 0 ), index_( 0 )
             {
                 memset( hist1_, 0, sizeof( double ) * __number_of_bins__ );
                 memset( hist2_, 0, sizeof( double ) * __number_of_bins__ );
             }
 
             confidence_rating_classifier( const confidence_rating_classifier& w ) : min_( w.min_ ), max_( w.max_ ), index_( w.index_ )
             {
                 memcpy( hist1_, w.hist1_, sizeof( double ) * __number_of_bins__ );
                 memcpy( hist2_, w.hist2_, sizeof( double ) * __number_of_bins__ );
             }
 
             confidence_rating_classifier& operator =( const confidence_rating_classifier& other )
             {
                 if( this != &other )
                 {
                     memcpy( hist1_, other.hist1_, sizeof( double ) * __number_of_bins__ );
                     memcpy( hist2_, other.hist2_, sizeof( double ) * __number_of_bins__ );
                     index_  = other.index_;
                     min_    = other.min_;
                     max_    = other.max_;
                 }
 
                 return( *this );
             }
 
         public:
             template < template < typename, typename > class FEATURE_LIST, template < typename, typename > class CATEGORY_LIST, class Allocator1, class Allocator2 >
             bool learn( const FEATURE_LIST< feature_type, Allocator1 > & features, const CATEGORY_LIST< bool, Allocator2 > &categories )
             {
                 if( features.empty( ) )
                 {
                     return( false );
                 }
 
                 double _minimum_classification_error_ = 1.0e100;
                 int nfeatures = static_cast< int >( features[ 0 ].size( ) );
 
                 // 特徴量のリストを作成する
                 #pragma omp parallel for firstprivate( nfeatures ) schedule( guided )
                 for( int index = 0 ; index < nfeatures ; index++ )
                 {
                     double min = features[ 0 ][ index ];
                     double max = min;
 
                     for( size_type i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( min > f[ index ] )
                         {
                             min = f[ index ];
                         }
                         else if( max < f[ index ] )
                         {
                             max = f[ index ];
                         }
                     }
 
                     double hist1[ __number_of_bins__ ];
                     double hist2[ __number_of_bins__ ];
                     for( size_type i = 0 ; i < __number_of_bins__ ; i++ )
                     {
                         hist1[ i ] = hist2[ i ] = 0.0;
                     }
 
                     for( size_type i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         int bin = ( int )( ( f[ index ] - min ) * __number_of_bins__ / ( max - min + 1 ) + 0.5 );
                         if( bin < 0 )
                         {
                             bin = 0;
                         }
                         else if( bin >= __number_of_bins__ )
                         {
                             bin = __number_of_bins__ - 1;
                         }
 
                         if( categories[ i ] )
                         {
                             hist1[ bin ] += f.weight;
                         }
                         else
                         {
                             hist2[ bin ] += f.weight;
                         }
                     }
 
                     double e = 0.0;
                     for( size_t i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( f.valid )
                         {
                             if( evaluate( f, index, hist1, hist2, min, max ) != categories[ i ] )
                             {
                                 e += f.weight;
                             }
                         }
                     }
 
                     #pragma omp critical
                     {
                         if( _minimum_classification_error_ >= e )
                         {
                             _minimum_classification_error_ = e;
                             index_ = index;
                             min_ = min;
                             max_ = max;
                             memcpy( hist1_, hist1, sizeof( double ) * __number_of_bins__ );
                             memcpy( hist2_, hist2, sizeof( double ) * __number_of_bins__ );
                         }
                     }
                 }
 
                 return( true );
             }
 
         public:
             template < class FEATURE >
             bool operator ()( const FEATURE &f ) const
             {
                 return( evaluate( f ) );
             }
 
             template < class FEATURE >
             bool evaluate( const FEATURE &f ) const
             {
                 return( evaluate( f, index_, hist1_, hist2_, min_, max_ ) );
             }
 
             template < class FEATURE >
             bool evaluate( const FEATURE &f, size_type indx, const double hist1[ ], const double hist2[ ], double min, double max ) const
             {
                 int bin = ( int )( ( f[ indx ] - min ) * __number_of_bins__ / ( max - min + 1 ) + 0.5 );
                 if( bin < 0 )
                 {
                     bin = 0;
                 }
                 else if( bin >= __number_of_bins__ )
                 {
                     bin = __number_of_bins__ - 1;
                 }
                 return( hist1[ bin ] <= hist2[ bin ] );
             }
 
             const std::string serialize( ) const
             {
                 //char buff[ 1024 ];
                 //sprintf( buff, "%d,%f,%f,%f,%f", index_, ave_[ 0 ], ave_[ 1 ], sig_[ 0 ], sig_[ 1 ] );
                 //return( buff );
                 return( "" );
             }
 
             void deserialize( const std::string & /* data */ )
             {
                 //sscanf( data.c_str( ), "%d,%lf,%lf,%lf,%lf", &index_, &ave_[ 0 ], &ave_[ 1 ], &sig_[ 0 ], &sig_[ 1 ] );
             }
         };
 
         template < typename __WEAK_CLASSIFIER__ = threshold_classifier >
         class classifier
         {
         public:
             typedef __WEAK_CLASSIFIER__ weak_classifier_type;       
             typedef feature feature_type;                           
             typedef feature_type::value_type value_type;            
             typedef feature_type::size_type size_type;              
             typedef feature_type::difference_type difference_type;  
 
         private:
             std::vector< std::string >          categories_;        
             std::vector< weak_classifier_type > weak_classifiers_;  
             std::vector< std::vector< bool > >  code_word_;         
             std::vector< double >               alpha_;             
             std::vector< double >               beta_;              
 
         public:
             classifier( )
             {
             }
 
             classifier( const classifier &cls ) : categories_( cls.categories_ ), weak_classifiers_( cls.weak_classifiers_ ), code_word_( cls.code_word_ ), alpha_( cls.alpha_ ), beta_( cls.beta_ )
             {
             }
 
             classifier& operator =( const classifier& other )
             {
                 if( this != &other )
                 {
                     categories_        = other.categories_;
                     weak_classifiers_  = other.weak_classifiers_;
                     code_word_         = other.code_word_;
                     alpha_             = other.alpha_;
                     beta_              = other.beta_;
                 }
 
                 return( *this );
             }
 
         public:
             const std::vector< weak_classifier_type > &weak_classifiers( ) const
             {
                 return( weak_classifiers_ );
             }
 
             std::vector< weak_classifier_type > &weak_classifiers( )
             {
                 return( weak_classifiers_ );
             }
 
             const std::vector< std::string > &categories( ) const
             {
                 return( categories_ );
             }
 
             std::vector< std::string > &categories( )
             {
                 return( categories_ );
             }
 
             const std::vector< std::vector< bool > > &code_word( ) const
             {
                 return( code_word_ );
             }
 
             std::vector< std::vector< bool > > &code_word( )
             {
                 return( code_word_ );
             }
 
             const std::vector< double > &alpha( ) const
             {
                 return( alpha_ );
             }
 
             std::vector< double > &alpha( )
             {
                 return( alpha_ );
             }
 
             const std::vector< double > &beta( ) const
             {
                 return( beta_ );
             }
 
             std::vector< double > &beta( )
             {
                 return( beta_ );
             }
 
         public:
             /// @brief Trains the strong classifier by boosting weak classifiers over binary code words.
             ///
             /// All previously learned state is discarded first. The distinct category names found in
             /// @p features are registered (in std::map key order), a weight matrix D( sample, category )
             /// is initialised, and up to @p number_of_iterations boosting rounds are run. Each round
             /// chooses a code word (one bool per category), trains one weak classifier on the resulting
             /// two-class problem, stores the alpha/beta vote weights and re-weights D. After every fifth
             /// round the training error is measured with error_rate() and training stops when it is 0.
             ///
             /// @param[in,out] features              training samples; the weight member of every valid sample is overwritten
             /// @param[in]     number_of_iterations  maximum number of boosting rounds (0 is treated as 1)
             /// @return false when @p features is empty, true otherwise
             template < template < typename, typename > class FEATURE_LIST, class Allocator >
             bool learn( FEATURE_LIST< feature_type, Allocator > & features, size_type number_of_iterations )
             {
                 if( features.empty( ) )
                 {
                     std::cerr << "特徴データが指定されていません．" << std::endl;
                     return( false );
                 }
                 else if( number_of_iterations == 0 )
                 {
                     // Run at least one iteration
                     number_of_iterations++;
                 }

                 // Reset the strong classifier
                 weak_classifiers_.clear( );
                 categories_.clear( );
                 code_word_.clear( );
                 alpha_.clear( );
                 beta_.clear( );


                 // Collect the distinct category names
                 std::map< std::string, size_type > category_map;
                 for( size_type i = 0 ; i < features.size( ) ; i++ )
                 {
                     category_map[ features[ i ].category ] = 0;
                 }

                 // The number of categories is now known
                 categories_.reserve( category_map.size( ) );

                 // Register the category list and remember the index assigned to each name
                 std::map< std::string, size_type >::iterator ite = category_map.begin( );
                 for( ; ite != category_map.end( ) ; ++ite )
                 {
                     ite->second = categories_.size( );
                     categories_.push_back( ite->first );
                 }

                 // Initialise the weights: uniform over every ( sample, wrong category ) pair,
                 // zero for the sample's own category
                 mist::matrix< double > D( features.size( ), categories_.size( ) );
                 for( size_type i = 0 ; i < features.size( ) ; i++ )
                 {
                     const feature_type &f = features[ i ];
                     size_type category_index = category_map[ f.category ];
                     for( size_type l = 0 ; l < categories_.size( ) ; l++ )
                     {
                         if( l != category_index )
                         {
                             D( i, l ) = 1.0 / static_cast< double >( features.size( ) * ( categories_.size( ) - 1 ) );
                         }
                         else
                         {
                             D( i, l ) = 0.0;
                         }
                     }
                 }

                 // fcatemap[ i ]    : category index of sample i
                 // fcategories[ i ] : binary label of sample i under the current code word
                 // rpweight[ l ]    : per-category score used to re-derive the code word in the inner loop
                 std::vector< size_type > fcatemap( features.size( ) );
                 std::vector< bool > fcategories( features.size( ) );
                 std::vector< double > rpweight( categories_.size( ) );
                 for( size_type i = 0 ; i < fcatemap.size( ) ; i++ )
                 {
                     fcatemap[ i ] = static_cast< typename std::vector< size_type >::value_type >( category_map[ features[ i ].category ] );
                 }

 #if defined( __ONE_PER_CLASS_CODE_WORD__ ) && __ONE_PER_CLASS_CODE_WORD__ == 1
                 // Build one code word per class
                 size_type nhypothesis = categories_.size( );
 #elif defined( __RANDOM_CODE_WORD__ ) && __RANDOM_CODE_WORD__ == 1
                 uniform::random rnd( std::clock( ) );
                 // Build the code words on an ECC basis (original comment; this branch draws a random split below)
                 size_type nhypothesis = categories_.size( );
 #else
                 // Build the code words on an ECC basis
                 size_type nhypothesis = 0;
 #endif

                 // Learn the strong classifier with AdaBoost
                 for( size_type t = 0 ; t < number_of_iterations ; t++ )
                 {
                     // Decide the coloring (code word) for this round
                     code_word_.push_back( std::vector< bool >( categories_.size( ) ) );
                     std::vector< bool > &myu = code_word_.back( );

 #if defined( __ONE_PER_CLASS_CODE_WORD__ ) && __ONE_PER_CLASS_CODE_WORD__ == 1
                     myu[ t % nhypothesis ] = true;
 #elif defined( __RANDOM_CODE_WORD__ ) && __RANDOM_CODE_WORD__ == 1
                     {
                         // Sort the categories by a random key and mark the first half as true
                         std::vector< pair< double, size_type > > list( nhypothesis );
                         for( size_type i = 0 ; i < list.size( ) ; i++ )
                         {
                             list[ i ].key = rnd.real1( );
                             list[ i ].value = i;
                         }
                         std::sort( list.begin( ), list.end( ) );
                         for( size_type i = 0 ; i < list.size( ) ; i++ )
                         {
                             myu[ list[ i ].value ] = i < list.size( ) / 2;
                         }
                     }
 #else
                     if( categories_.size( ) == 2 )
                     {
                         // Two categories: alternate the two possible labelings
                         myu[ 0 ] = ( t % 2 ) == 0;
                         myu[ 1 ] = !myu[ 0 ];
                     }
                     else
                     {
                         // Category 0 is always true; the remaining bits are taken from the binary
                         // representation of a running counter
                         myu[ 0 ] = true;
                         size_type val = nhypothesis++;
                         bool flag = true;
                         for( size_type r = categories_.size( ) - 1 ; r > 0 ; r-- )
                         {
                             bool b = ( val & 1 ) != 0;
                             flag = flag && b;
                             myu[ r ] = b;
                             val >>= 1;
                         }

                         // flag is still true when every bit was set (all categories true):
                         // take the next counter value instead
                         if( flag )
                         {
                             val = nhypothesis++;
                             for( size_type r = categories_.size( ) - 1 ; r > 0 ; r-- )
                             {
                                 myu[ r ] = ( val & 1 ) != 0;
                                 val >>= 1;
                             }
                         }
                     }
 #endif

 #if defined( __DEBUG_OUTPUT_LEVEL__ ) && __DEBUG_OUTPUT_LEVEL__ >= 3
                     // Print the binary label each sample receives under this code word
                     for( size_type i = 0 ; i < fcategories.size( ) ; i++ )
                     {
                         std::cout << myu[ fcatemap[ i ] ];
                     }
                     std::cout << std::endl;
 #endif

                     // Prepare the weak classifier that will be trained in this round
                     weak_classifiers_.push_back( weak_classifier_type( ) );
                     weak_classifier_type &weak = weak_classifiers_.back( );

                     for( size_type m = 0 ; m < __NUMBER_OF_INNER_LOOPS__ ; m++ )
                     {
                         // Build the binary labels used to train the weak classifier
                         for( size_type i = 0 ; i < fcategories.size( ) ; i++ )
                         {
                             fcategories[ i ] = myu[ fcatemap[ i ] ];
                         }

                         // Normalise the weights: Ut is the total weight over valid samples of the
                         // categories whose label differs from the sample's own label
                         double Ut = 0.0;
                         for( size_type i = 0 ; i < features.size( ) ; i++ )
                         {
                             const feature_type &f = features[ i ];
                             if( f.valid )
                             {
                                 bool myuY = fcategories[ i ];
                                 for( size_type l = 0 ; l < categories_.size( ) ; l++ )
                                 {
                                     if( myuY != myu[ l ] )
                                     {
                                         Ut += D( i, l );
                                     }
                                 }
                             }
                         }

                         for( size_type i = 0 ; i < D.rows( ) ; i++ )
                         {
                             feature_type &f = features[ i ];
                             if( f.valid )
                             {
                                 bool myuY = fcategories[ i ];
                                 double sum = 0.0;
                                 for( size_type l = 0 ; l < categories_.size( ) ; l++ )
                                 {
                                     if( myuY != myu[ l ] )
                                     {
                                         sum += D( i, l );
                                     }
                                 }

                                 // NOTE(review): Ut stays 0 when no valid sample contributes weight (e.g. only one
                                 // category is present), which makes this division 0/0 - confirm callers avoid that case
                                 f.weight = static_cast< feature_value_type >( sum / Ut );
                             }
                         }

                         // Train the weak classifier
                         weak.learn( features, fcategories );
                         //std::cout << "threshold: " << weak.threshold( ) << ", sign: " << ( weak.sign( ) < 0.0 ? "-" : "+" ) << ", index: " << weak.index( ) << std::endl;

                         // Except on the last inner pass, re-derive the code word from the weak classifier's answers
                         if( m < __NUMBER_OF_INNER_LOOPS__ - 1 )
                         {
                             for( size_type i = 0 ; i < rpweight.size( ) ; i++ )
                             {
                                 rpweight[ i ] = 0.0;
                             }

                             for( size_type i = 0 ; i < features.size( ) ; i++ )
                             {
                                 feature_type &f = features[ i ];
                                 if( f.valid )
                                 {
                                     // +1 / -1 answer of the weak classifier for this sample
                                     double val = weak( f ) ? 1.0 : -1.0;

                                     double tmp = 0.0;
                                     for( size_type l = 0 ; l < D.cols( ) ; l++ )
                                     {
                                         tmp += D( i, l ) * val;
                                     }

                                     // The sample's own category gains its whole row weight ...
                                     rpweight[ fcatemap[ i ] ] += tmp;

                                     // ... and every category loses its own entry
                                     for( size_type l = 0 ; l < D.cols( ) ; l++ )
                                     {
                                         rpweight[ l ] -= D( i, l ) * val;
                                     }
                                 }
                             }

                             // Candidate code word: a category is true when its score is non-negative
                             std::vector< bool > tmyu( myu );
                             bool isChanged = false;
                             for( size_type i = 0 ; i < rpweight.size( ) ; i++ )
                             {
                                 bool nmyu = rpweight[ i ] >= 0.0;
                                 isChanged = isChanged || nmyu != tmyu[ i ];
                                 tmyu[ i ] = nmyu;
                             }

                             if( !isChanged )
                             {
                                 // Identical to the previous code word, so stop
                                 break;
                             }

                             // Check that the candidate code word does not give every category the same label
                             {
                                 size_type idx = 1;
                                 for( ; idx < tmyu.size( ) ; idx++ )
                                 {
                                     if( tmyu[ 0 ] != tmyu[ idx ] )
                                     {
                                         break;
                                     }
                                 }

                                 if( idx < tmyu.size( ) )
                                 {
                                     // At least two categories differ: adopt the candidate and retrain
                                     myu = tmyu;
                                 }
                                 else
                                 {
                                     // Degenerate candidate: keep the current code word and weak classifier
                                     break;
                                 }
                             }
                         }
                     }


 #if defined( __DEBUG_OUTPUT_LEVEL__ ) && __DEBUG_OUTPUT_LEVEL__ >= 3
                     // Print the classification results of the trained weak classifier
                     for( size_type i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( f.valid )
                         {
                             std::cout << weak.evaluate( f );
                         }
                     }
                     std::cout << std::endl;
 #endif

 #if defined( __ASYMMETRIC_WEIGHTING__ ) && __ASYMMETRIC_WEIGHTING__ == 1
                     // Update the weights asymmetrically: accumulate the sample weight of each
                     // ( weak answer, binary label ) combination; eps keeps the ratios finite
                     const double eps = 1.0e-16;
                     double h1u1 = eps;
                     double h1u0 = eps;
                     double h0u0 = eps;
                     double h0u1 = eps;

                     for( size_type i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( f.valid )
                         {
                             bool uY = fcategories[ i ];
                             bool hX = weak( f );
                             if( hX && uY )
                             {
                                 h1u1 += f.weight;
                             }
                             else if( hX && !uY )
                             {
                                 h1u0 += f.weight;
                             }
                             else if( !hX && !uY )
                             {
                                 h0u0 += f.weight;
                             }
                             else
                             {
                                 h0u1 += f.weight;
                             }
                         }
                     }

                     double alpha = 0.5 * std::log( h1u1 / h1u0 );
                     double beta = -0.5 * std::log( h0u0 / h0u1 );
 #else
                     // Update the weights symmetrically: accumulate the weight of agreeing (positives)
                     // and disagreeing (negatives) samples; eps keeps the ratio finite
                     const double eps = 1.0e-16;
                     double positives = eps;
                     double negatives = eps;

                     for( size_type i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( f.valid )
                         {
                             bool uY = fcategories[ i ];
                             bool hX = weak( f );
                             if( hX == uY )
                             {
                                 positives += f.weight;
                             }
                             else
                             {
                                 negatives += f.weight;
                             }
                         }
                     }

                     double alpha = 0.5 * std::log( positives / negatives );
                     double beta = -alpha;
 #endif

                     alpha_.push_back( alpha );
                     beta_.push_back( beta );

                     // Re-weight D for the valid samples and accumulate the normaliser Zt
                     double Zt = 0.0;
                     for( size_type i = 0 ; i < features.size( ) ; i++ )
                     {
                         const feature_type &f = features[ i ];
                         if( f.valid )
                         {
                             bool myuY = fcategories[ i ];
                             for( size_type l = 0 ; l < categories_.size( ) ; l++ )
                             {
                                 // -0.5, 0 or +0.5 depending on how category l's label compares with the sample's label
                                 double v = ( myu[ l ] - myuY ) * 0.5;
                                 if( weak( f ) )
                                 {
                                     v *= alpha;
                                 }
                                 else
                                 {
                                     v *= beta;
                                 }

                                 D( i, l ) *= std::exp( v );
                                 Zt += D( i, l );
                             }
                         }
                     }

                     // Every entry of D is divided by Zt, including rows of samples that are not valid
                     for( size_type i = 0 ; i < D.size( ) ; i++ )
                     {
                         D[ i ] /= Zt;
                     }

                     // Measure the training error after every fifth round
                     if( ( ( t + 1 ) % 5 ) == 0 )
                     {
                         double __classification_error__ = error_rate( features );

 #if defined( __DEBUG_OUTPUT_LEVEL__ ) && __DEBUG_OUTPUT_LEVEL__ >= 1
                         // One loop finished
                         std::cout << "識別器の学習ループ " << t + 1 << " / " << number_of_iterations << " が終了しました。";
                         std::cout << "分類誤差: " << __classification_error__ << std::endl;
 #endif

                         if( __classification_error__ == 0.0 )
                         {
                             // Stop: the original comment says "performance did not change, or everything was
                             // classified"; the code only tests for a training error of exactly zero
                             break;
                         }
                     }
                 }

                 return( true );
             }
 
         public:
             template < class FEATURE >
             const std::string operator ()( const FEATURE &f ) const
             {
                 return( evaluate( f ) );
             }
 
             template < class FEATURE >
             const std::string evaluate( const FEATURE &f ) const
             {
 #if 1
                 std::vector< double > values( categories_.size( ), 0.0 );
                 for( size_type t = 0 ; t < weak_classifiers_.size( ) ; t++ )
                 {
                     const std::vector< bool > &code = code_word_[ t ];
                     double weight = weak_classifiers_[ t ]( f ) ? alpha_[ t ] : beta_[ t ];
 
                     for( size_type l = 0 ; l < categories_.size( ) ; l++ )
                     {
                         values[ l ] += code[ l ] * weight;
                     }
                 }
 
                 size_type category = 0;
                 for( size_type l = 1 ; l < categories_.size( ) ; l++ )
                 {
                     if( values[ category ] < values[ l ] )
                     {
                         category = l;
                     }
                 }
 #else
                 double max = 0.0;
                 size_type category = 0;
                 for( size_type l = 0 ; l < categories_.size( ) ; l++ )
                 {
                     double sum = 0.0;
                     for( size_type t = 0 ; t < weak_classifiers_.size( ) ; t++ )
                     {
                         double val = code_word_[ t ][ l ];
                         if( weak_classifiers_[ t ]( f ) )
                         {
                             val *= alpha_[ t ];
                         }
                         else
                         {
                             val *= beta_[ t ];
                         }
 
                         sum += val;
                     }
 
                     if( sum > max )
                     {
                         max = sum;
                         category = l;
                     }
                 }
 #endif
 
                 return( categories_[ category ] );
             }
 
             template < class FEATURE >
             void compute_category_ranks( const FEATURE &f, std::vector< pair< double, std::string > > &ranks ) const
             {
                 std::vector< double > values( categories_.size( ), 0.0 );
                 for( size_type t = 0 ; t < weak_classifiers_.size( ) ; t++ )
                 {
                     const std::vector< bool > &code = code_word_[ t ];
                     double weight = weak_classifiers_[ t ]( f ) ? alpha_[ t ] : beta_[ t ];
 
                     for( size_type l = 0 ; l < categories_.size( ) ; l++ )
                     {
                         values[ l ] += code[ l ] * weight;
                     }
                 }
 
                 ranks.clear( );
                 ranks.reserve( values.size( ) );
 
                 for( size_type l = 0 ; l < values.size( ) ; l++ )
                 {
                     ranks.push_back( pair< double, std::string >( values[ l ], categories_[ l ] ) );
                 }
 
                 std::sort( ranks.begin( ), ranks.end( ), pair< double, std::string >::greater );
             }
 
             template < template < typename, typename > class FEATURE_LIST, class Allocator >
             double error_rate( const FEATURE_LIST< feature_type, Allocator > & features ) const
             {
                 if( features.empty( ) )
                 {
                     return( 0.0 );
                 }
 
                 size_type error = 0;
                 int nfeatures = static_cast< int >( features.size( ) );
 
                 #pragma omp parallel for firstprivate( nfeatures ) reduction( +: error ) schedule( guided )
                 for( int i = 0 ; i < nfeatures ; i++ )
                 {
                     const feature_type &f = features[ i ];
                     if( f.valid )
                     {
                         std::string ret = evaluate( f );
 #if defined( __DEBUG_OUTPUT_LEVEL__ ) && __DEBUG_OUTPUT_LEVEL__ >= 3
                         std::cout << ret;
 #endif
                         if( f.category != ret )
                         {
                             error++;
                         }
                     }
                 }
 
 #if defined( __DEBUG_OUTPUT_LEVEL__ ) && __DEBUG_OUTPUT_LEVEL__ >= 3
                 std::cout << std::endl;
 #endif
 
                 return( static_cast< double >( error ) / static_cast< double >( nfeatures ) );
             }
 
         public:
             static const char *get_value( const char *s, const char *e, std::string &val )
             {
                 // 先頭の空白（改行やタブを含む）を飛ばす
                 while( s < e )
                 {
                     if( s[ 0 ] == '\r' )
                     {
                         if( s + 1 != e && s[ 1 ] == '\n' )
                         {
                             s = s + 2;
                         }
                         else
                         {
                             s++;
                         }
                     }
                     else if( s[ 0 ] == '\n' )
                     {
                         s++;
                     }
                     else if( s[ 0 ] == ' ' || s[ 0 ] == '\t' )
                     {
                         s++;
                     }
                     else
                     {
                         break;
                     }
                 }
 
                 const char *sp = s;
                 const char *ep = sp;
 
                 // 次にコンマが来る前まで進める
                 while( s < e )
                 {
                     if( s[ 0 ] == '\r' )
                     {
                         if( s + 1 != e && s[ 1 ] == '\n' )
                         {
                             s = s + 2;
                         }
                         else
                         {
                             s++;
                         }
                         break;
                     }
                     else if( s[ 0 ] == '\n' )
                     {
                         s++;
                         break;
                     }
                     else if( s[ 0 ] == ',' )
                     {
                         s++;
                         break;
                     }
 
                     ep++;
                     s++;
                 }
 
                 if( sp < ep )
                 {
                     val = std::string( sp, ep );
                 }
 
                 return( s > e ? e : s );
             }
 
         public:
             bool save( const std::string &filename ) const
             {
                 FILE *fp = fopen( filename.c_str( ), "wt" );
 
                 if( fp == NULL )
                 {
                     return( false );
                 }
 
                 // クラス数等の基本情報を書き込む
                 fprintf( fp, "Category = %ld\n", categories_.size( ) );
                 fprintf( fp, "Stage    = %ld\n", weak_classifiers_.size( ) );
 
                 // クラス名を列挙する
                 for( size_type i = 0 ; i < categories_.size( ) ; i++ )
                 {
                     fprintf( fp, "Class[%ld] : %s\n", i + 1, categories_[ i ].c_str( ) );
                 }
 
                 // Code Word を列挙する
                 for( size_type i = 0 ; i < code_word_.size( ) ; i++ )
                 {
                     const std::vector< bool > &code = code_word_[ i ];
                     fprintf( fp, "%d", code[ 0 ] ? 1: 0 );
                     for( size_type l = 1 ; l < code.size( ) ; l++ )
                     {
                         fprintf( fp, ",%d", code[ l ] ? 1: 0 );
                     }
                     fprintf( fp, "\n" );
                 }
 
                 // 弱識別器と Alpha と Beta を列挙する
                 for( size_type i = 0 ; i < weak_classifiers_.size( ) ; i++ )
                 {
                     const weak_classifier_type &weak = weak_classifiers_[ i ];
                     fprintf( fp, "%s\n", weak.serialize( ).c_str( ) );
                     fprintf( fp, "%f,%f\n", alpha_[ i ], beta_[ i ] );
                 }
 
                 fclose( fp );
 
                 return( true );
             }
 
             bool load( const std::string &filename )
             {
                 FILE *fp = fopen( filename.c_str( ), "rt" );
 
                 if( fp == NULL )
                 {
                     return( false );
                 }
 
                 int numClasses = 0, numStages = 0, dmy;
                 char line[ 4096 ], buff[ 4096 ];
 
                 // クラス数等の基本情報を書き込む
                 if( fgets( line, 4096, fp ) != NULL )
                 {
                     sscanf( line, "Category  = %d", &numClasses );
                 }
                 if( fgets( line, 4096, fp ) != NULL )
                 {
                     sscanf( line, "Stage     = %d", &numStages );
                 }
 
                 // 強識別器を初期化する
                 weak_classifiers_.resize( numStages );
                 alpha_.resize( numStages );
                 beta_.resize( numStages );
                 code_word_.resize( numStages );
                 categories_.resize( numClasses );
 
                 // クラス名を読み込む
                 for( size_type i = 0 ; i < categories_.size( ) ; i++ )
                 {
                     if( fgets( line, 4096, fp ) != NULL )
                     {
                         memset( buff, '\0', 4096 );
                         sscanf( line, "Class[%d] : %s", &dmy, buff );
                         categories_[ i ] = buff;
                     }
                 }
 
                 // Code Word を読み込む
                 for( size_type i = 0 ; i < code_word_.size( ) ; i++ )
                 {
                     std::vector< bool > &code = code_word_[ i ];
                     code.resize( numClasses );
 
                     if( fgets( line, 4096, fp ) == NULL )
                     {
                         break;
                     }
 
                     const char *p = line, *ep = line + 4096;
 
                     for( size_type l = 0 ; l < code.size( ) ; l++ )
                     {
                         std::string val;
                         p = get_value( p, ep, val );
                         code[ l ] = val == "1" ? true : false;
                     }
                 }
 
                 // 弱識別器と Alpha と Beta を列挙する
                 for( size_type i = 0 ; i < weak_classifiers_.size( ) ; i++ )
                 {
                     if( fgets( line, 4096, fp ) != NULL )
                     {
                         weak_classifiers_[ i ].deserialize( line );
                     }
 
                     if( fgets( line, 4096, fp ) != NULL )
                     {
                         double alpha, beta;
                         sscanf( line, "%lf,%lf", &alpha, &beta );
                         alpha_[ i ] = alpha;
                         beta_[ i ] = beta;
                     }
                 }
 
                 fclose( fp );
 
                 return( true );
             }
         };
     }
 
 
     //  機械学習グループの終わり
 }
 
 
 // mist名前空間の終わり
 _MIST_END
 
 
 
 #endif // __INCLUDE_MACHINE_LEARNING__