OpenCV的softcascade代碼解讀

最後更新：2018-12-04 來源：互聯網
上載者：User
創建阿里雲帳戶，並獲得超過 40 款產品的免費試用版；而企業帳戶則可以享有總值 $1200 的免費試用版。立即註冊！
//標頭檔為softcascade.hpp、core.hpp//實現檔案為octave.cpp//但是還涉及到了ml.hpp和Dtree.cpp等檔案//softcascade檢測器訓練函數的代碼如下：bool BoostedSoftCascadeOctave::train(const Dataset* dataset, const FeaturePool* pool, int weaks, int treeDepth){//第1個參數dataset是一個可以與訓練集通訊的執行個體，第2個參數表示特徵集，第3個參數是需要訓練的弱分類器樹數量，第4個參數是分類器樹的深度    CV_Assert(treeDepth == 2);//？要求弱分類樹的深度只能為2嗎？    CV_Assert(weaks > 0);    params.max_depth  = treeDepth;    params.weak_count = weaks;    // 1. fill integrals and classes，？這裡計算了每個樣本的所有積分圖和標定了標籤嗎？是的，對於正樣本，response向量中響應的元素值設定為了1，負樣本設定為了0    processPositives(dataset);    generateNegatives(dataset);    // 2. only simple case (all features used)//使用所有的特徵    int nfeatures = pool->size();    cv::Mat varIdx(1, nfeatures, CV_32SC1);    int* ptr = varIdx.ptr<int>(0);    for (int x = 0; x < nfeatures; ++x)        ptr[x] = x;    // 3. only simple case (all samples used)//使用所有訓練樣本    int nsamples = npositives + nnegatives;    cv::Mat sampleIdx(1, nsamples, CV_32SC1);    ptr = sampleIdx.ptr<int>(0);    for (int x = 0; x < nsamples; ++x)        ptr[x] = x;    // 4. ICF has an ordered response.    cv::Mat varType(1, nfeatures + 1, CV_8UC1);//指定按特徵響應排序？最後多的一個元素表示什麼意思？是不是表示將要輸入訓練函數train()（在倒數第3行）中的response向量儲存的是類標籤    uchar* uptr = varType.ptr<uchar>(0);    for (int x = 0; x < nfeatures; ++x)        uptr[x] = CV_VAR_ORDERED;//這個排序無法理解！    uptr[nfeatures] = CV_VAR_CATEGORICAL;    trainData.create(nfeatures, nsamples, CV_32FC1);//產生用來訓練用的資料矩陣，看下面的雙重迴圈就知道，其中每行對應到一個特徵，每列對應到一個樣本，該矩陣每個元素儲存的是某樣本某特徵的積分圖。    for (int fi = 0; fi < nfeatures; ++fi)    {        float* dptr = trainData.ptr<float>(fi);        for (int si = 0; si < nsamples; ++si)        {            dptr[si] = pool->apply(fi, si, integrals);        }    }    cv::Mat missingMask;    bool ok = train(trainData, responses, varIdx, sampleIdx, varType, missingMask); //？主要的訓練函數，trainData是用特徵表示的訓練集矩陣，responses是樣本對應的類標籤，varIdx是所學習的特徵的所有索引，sampleIdx是訓練樣本的索引，？varType表示是否對特徵響應排序？，missingMask用來儲存錯誤的分類。    if (!ok)        CV_Error(CV_StsInternal, "ERROR: tree can not be trained");    return ok;}//其中用到的訓練函數如下，可見它調用了boost類的train()函數，並且推測得到的檢測器儲存在params中。//它調用了CvBoostTree::train()函數來,並加入了params參數，看來在BoostedSoftCascadeOctave類中沒有params成員，但是最終的檢測器時儲存在該成員中的，到現在為止還是訓練整個的檢測器:bool BoostedSoftCascadeOctave::train( const cv::Mat& _trainData, const cv::Mat& _responses, const cv::Mat& varIdx,       const cv::Mat& sampleIdx, const cv::Mat& varType, const cv::Mat& missingDataMask){    bool update = false;    return cv::Boost::train(_trainData, CV_COL_SAMPLE, _responses, varIdx, sampleIdx, varType, missingDataMask, params,    update);}//boost類的train()函數定義如下（在boost.cpp中）：boolCvBoost::train( const CvMat* _train_data, int _tflag,              const CvMat* _responses, const CvMat* _var_idx,              const CvMat* _sample_idx, const CvMat* _var_type,              const CvMat* _missing_mask,              CvBoostParams _params, bool _update ){//順著來，到了這裡，_train_data是訓練資料，每行對應到一個特徵每列對應到一個樣本；_tflag表明了訓練資料矩陣的每列對應到一個樣本；//_responsens是各樣本對應的類標籤；_var_idx是特徵索引（序號），_sample_idx是樣本索引，_var_type在這裡表示按特徵響應排序；_missing_mask不知何意；//_params儲存訓練得到的檢測器；_update為false。這裡使用CvBoost.tree->train()函數訓練每一個弱分類器//    bool ok = false;    CvMemStorage* storage = 0;    CV_FUNCNAME( "CvBoost::train" );    __BEGIN__;    int i;    set_params( _params );//初始化檢測器參數    cvReleaseMat( &active_vars );    cvReleaseMat( &active_vars_abs );    if( !_update || !data )//準備好訓練用的資料，並確定只包含正負樣本兩類，分配儲存弱分類器的儲存空間    {        clear();        data = new CvDTreeTrainData( _train_data, _tflag, _responses, _var_idx,//準備訓練資料，但是這裡怎麼還要用到boost的參數_params呢?            _sample_idx, _var_type, _missing_mask, _params, true, true );        if( data->get_num_classes() != 2 )            CV_ERROR( CV_StsNotImplemented,            "Boosted trees can only be used for 2-class classification." );        CV_CALL( storage = cvCreateMemStorage() );        weak = cvCreateSeq( 0, sizeof(CvSeq), sizeof(CvBoostTree*), storage );//這是CvBoost類中儲存弱分類器的向量？        storage = 0;    }    else    {        data->set_data( _train_data, _tflag, _responses, _var_idx,            _sample_idx, _var_type, _missing_mask, _params, true, true, true );    }    if ( (_params.boost_type == LOGIT) || (_params.boost_type == GENTLE) )        data->do_responses_copy();    update_weights( 0 );//將各樣本權重平均分配    for( i = 0; i < params.weak_count; i++ )//訓練weak_count個弱分類器    {        CvBoostTree* tree = new CvBoostTree;        if( !tree->train( data, subsample_mask, this ) )//主要的訓練函數,subsample_mask似乎是一個輸出參數，查了其初始值是值為0的指標，記錄弱分類器正確分類的樣本，也許初始值是全0的向量？//第三個參數是訓練出的弱分類器要串連的‘宿主’分類器        {            delete tree;            break;        }        //cvCheckArr( get_weak_response());        cvSeqPush( weak, &tree );        update_weights( tree );//這裡是不是根據訓練出的弱分類器的分類情況調整各樣本的權重？        trim_weights();        if( cvCountNonZero(subsample_mask) == 0 )            break;    }    if(weak->total > 0)//釋放儲存空間    {        get_active_vars(); // recompute active_vars* maps and condensed_idx's in the splits.        data->is_classifier = true;        data->free_train_data();        ok = true;    }    else        clear();    __END__;    return ok;}//CvBoostTree::train()函數定義如下，它用來訓練單個弱分類器，它進一步調用了CvDTree::do_train()函數：CvBoostTree::train( CvDTreeTrainData* _train_data,                    const CvMat* _subsample_idx, CvBoost* _ensemble ){    clear();    ensemble = _ensemble;    data = _train_data;    data->shared = true;    return do_train( _subsample_idx );}//CvDTree::do_train()函數定義如下(在檔案tree.cpp中，標頭檔為ml.hpp）：bool CvDTree::do_train( const CvMat* _subsample_idx ){    bool result = false;    CV_FUNCNAME( "CvDTree::do_train" );    __BEGIN__;    root = data->subsample_data( _subsample_idx );//明顯是選擇參與訓練的樣本    CV_CALL( try_split_node(root));    if( root->split )    {        CV_Assert( root->left );        CV_Assert( root->right );        if( data->params.cv_folds > 0 )            CV_CALL( prune_cv() );        if( !data->shared )            data->free_train_data();        result = true;    }    __END__;    return result;}//do_train()的核心函數如下：CvDTreeNode* CvDTreeTrainData::subsample_data( const CvMat* _subsample_idx ){    CvDTreeNode* root = 0;    CvMat* isubsample_idx = 0;    CvMat* subsample_co = 0;    bool isMakeRootCopy = true;    CV_FUNCNAME( "CvDTreeTrainData::subsample_data" );    __BEGIN__;    if( !data_root )        CV_ERROR( CV_StsError, "No training data has been set" );    if( _subsample_idx )    {        CV_CALL( isubsample_idx = cvPreprocessIndexArray( _subsample_idx, sample_count ));//如果已訓練出了一些弱分類器，則在這裡進行一定的處理。_subsample_idx只能是一個行向量或者是列向量//_subsample_idx中儲存的可能是選中的樣本的索引，也可能長度為sample_count的表明選擇的'0''1'掩膜，但//輸出只包含了選擇的樣本的編號，並且進行了排序。        if( isubsample_idx->cols + isubsample_idx->rows - 1 == sample_count )//isubsample_idx是一個指向行向量或者列向量的指標，這裡驗證元素個數與樣本數是否相等。        {            const int* sidx = isubsample_idx->data.i;            for( int i = 0; i < sample_count; i++ )            {                if( sidx[i] != i )                {                    isMakeRootCopy = false;//若尚無任何弱分類器，則'isMakeRootCopy = true'，                    break;                }            }        }        else            isMakeRootCopy = false;    }    if( isMakeRootCopy )    {        // make a copy of the root node        CvDTreeNode temp;        int i;        root = new_node( 0, 1, 0, 0 );        temp = *root;        *root = *data_root;        root->num_valid = temp.num_valid;        if( root->num_valid )        {            for( i = 0; i < var_count; i++ )                root->num_valid[i] = data_root->num_valid[i];        }        root->cv_Tn = temp.cv_Tn;        root->cv_node_risk = temp.cv_node_risk;        root->cv_node_error = temp.cv_node_error;    }    else    {        int* sidx = isubsample_idx->data.i;        // co - array of count/offset pairs (to handle duplicated values in _subsample_idx)        int* co, cur_ofs = 0;        int vi, i;        int workVarCount = get_work_var_count();//得到已使用的特徵個數？        int count = isubsample_idx->rows + isubsample_idx->cols - 1;//該弱分類器判斷為正的樣本個數        root = new_node( 0, count, 1, 0 );        CV_CALL( subsample_co = cvCreateMat( 1, sample_count*2, CV_32SC1 ));        cvZero( subsample_co );        co = subsample_co->data.i;        for( i = 0; i < count; i++ )            co[sidx[i]*2]++;        for( i = 0; i < sample_count; i++ )        {            if( co[i*2] )            {                co[i*2+1] = cur_ofs;                cur_ofs += co[i*2];            }            else                co[i*2+1] = -1;        }        cv::AutoBuffer<uchar> inn_buf(sample_count*(2*sizeof(int) + sizeof(float)));        for( vi = 0; vi < workVarCount; vi++ )        {            int ci = get_var_type(vi);            if( ci >= 0 || vi >= var_count )            {                int num_valid = 0;                const int* src = CvDTreeTrainData::get_cat_var_data( data_root, vi, (int*)(uchar*)inn_buf );                if (is_buf_16u)                {                    unsigned short* udst = (unsigned short*)(buf->data.s + root->buf_idx*get_length_subbuf() +                        vi*sample_count + root->offset);                    for( i = 0; i < count; i++ )                    {                        int val = src[sidx[i]];                        udst[i] = (unsigned short)val;                        num_valid += val >= 0;                    }                }                else                {                    int* idst = buf->data.i + root->buf_idx*get_length_subbuf() +                        vi*sample_count + root->offset;                    for( i = 0; i < count; i++ )                    {                        int val = src[sidx[i]];                        idst[i] = val;                        num_valid += val >= 0;                    }                }                if( vi < var_count )                    root->set_num_valid(vi, num_valid);            }            else            {                int *src_idx_buf = (int*)(uchar*)inn_buf;                float *src_val_buf = (float*)(src_idx_buf + sample_count);                int* sample_indices_buf = (int*)(src_val_buf + sample_count);                const int* src_idx = 0;                const float* src_val = 0;                get_ord_var_data( data_root, vi, src_val_buf, src_idx_buf, &src_val, &src_idx, sample_indices_buf );                int j = 0, idx, count_i;                int num_valid = data_root->get_num_valid(vi);                if (is_buf_16u)                {                    unsigned short* udst_idx = (unsigned short*)(buf->data.s + root->buf_idx*get_length_subbuf() +                        vi*sample_count + data_root->offset);                    for( i = 0; i < num_valid; i++ )                    {                        idx = src_idx[i];                        count_i = co[idx*2];                        if( count_i )                            for( cur_ofs = co[idx*2+1]; count_i > 0; count_i--, j++, cur_ofs++ )                                udst_idx[j] = (unsigned short)cur_ofs;                    }                    root->set_num_valid(vi, j);                    for( ; i < sample_count; i++ )                    {                        idx = src_idx[i];                        count_i = co[idx*2];                        if( count_i )                            for( cur_ofs = co[idx*2+1]; count_i > 0; count_i--, j++, cur_ofs++ )                                udst_idx[j] = (unsigned short)cur_ofs;                    }                }                else                {                    int* idst_idx = buf->data.i + root->buf_idx*get_length_subbuf() +                        vi*sample_count + root->offset;                    for( i = 0; i < num_valid; i++ )                    {                        idx = src_idx[i];                        count_i = co[idx*2];                        if( count_i )                            for( cur_ofs = co[idx*2+1]; count_i > 0; count_i--, j++, cur_ofs++ )                                idst_idx[j] = cur_ofs;                    }                    root->set_num_valid(vi, j);                    for( ; i < sample_count; i++ )                    {                        idx = src_idx[i];                        count_i = co[idx*2];                        if( count_i )                            for( cur_ofs = co[idx*2+1]; count_i > 0; count_i--, j++, cur_ofs++ )                                idst_idx[j] = cur_ofs;                    }                }            }        }        // sample indices subsampling        const int* sample_idx_src = get_sample_indices(data_root, (int*)(uchar*)inn_buf);        if (is_buf_16u)        {            unsigned short* sample_idx_dst = (unsigned short*)(buf->data.s + root->buf_idx*get_length_subbuf() +                workVarCount*sample_count + root->offset);            for (i = 0; i < count; i++)                sample_idx_dst[i] = (unsigned short)sample_idx_src[sidx[i]];        }        else        {            int* sample_idx_dst = buf->data.i + root->buf_idx*get_length_subbuf() +                workVarCount*sample_count + root->offset;            for (i = 0; i < count; i++)                sample_idx_dst[i] = sample_idx_src[sidx[i]];        }    }    __END__;    cvReleaseMat( &isubsample_idx );    cvReleaseMat( &subsample_co );    return root;}//do_train()另一個核心函數如下：void CvDTree::try_split_node( CvDTreeNode* node ){    CvDTreeSplit* best_split = 0;    int i, n = node->sample_count, vi;    bool can_split = true;    double quality_scale;    calc_node_value( node );    if( node->sample_count <= data->params.min_sample_count ||        node->depth >= data->params.max_depth )        can_split = false;    if( can_split && data->is_classifier )    {        // check if we have a "pure" node,        // we assume that cls_count is filled by calc_node_value()        int* cls_count = data->counts->data.i;        int nz = 0, m = data->get_num_classes();        for( i = 0; i < m; i++ )            nz += cls_count[i] != 0;        if( nz == 1 ) // there is only one class            can_split = false;    }    else if( can_split )    {        if( sqrt(node->node_risk)/n < data->params.regression_accuracy )            can_split = false;    }    if( can_split )    {        best_split = find_best_split(node);        // TODO: check the split quality ...        node->split = best_split;    }    if( !can_split || !best_split )    {        data->free_node_data(node);        return;    }    quality_scale = calc_node_dir( node );    if( data->params.use_surrogates )    {        // find all the surrogate splits        // and sort them by their similarity to the primary one        for( vi = 0; vi < data->var_count; vi++ )        {            CvDTreeSplit* split;            int ci = data->get_var_type(vi);            if( vi == best_split->var_idx )                continue;            if( ci >= 0 )                split = find_surrogate_split_cat( node, vi );            else                split = find_surrogate_split_ord( node, vi );            if( split )            {                // insert the split                CvDTreeSplit* prev_split = node->split;                split->quality = (float)(split->quality*quality_scale);                while( prev_split->next &&                       prev_split->next->quality > split->quality )                    prev_split = prev_split->next;                split->next = prev_split->next;                prev_split->next = split;            }        }    }    split_node_data( node );    try_split_node( node->left );    try_split_node( node->right );}
本文章原先以中文撰寫並發佈於 aliyun.com，亦設英文版本，僅作資訊用途。本網站不對文章的準確性，完整性或可靠性或其任何翻譯作出任何明示或暗示的陳述或保證。如對該文章有任何疑慮或投訴，請傳送電郵至 info-contact@alibabacloud.com 並提供相關疑慮或投訴的詳細說明。職員會於 5 個工作天內與您聯絡，一經驗證之後，即會刪除該侵權內容。
A Free Trial That Lets You Build Big!

Start building with 50+ products and up to 12 months usage for Elastic Compute Service
Get Started for Free
Sales Support

1 on 1 presale consultation

Chat Contact Sales
After-Sales Support

24/7 Technical Support 6 Free Tickets per Quarter Faster Response

Open a Ticket
Alibaba Cloud offers highly flexible support services tailored to meet your exact needs.

Learn More
OpenCV的softcascade代碼解讀

聯繫我們

A Free Trial That Lets You Build Big!

Sales Support

After-Sales Support