"""Driver routines that exercise the ILSVRC data pipeline.

Each function wires together a ``DataILSVRC`` (table import/export) and/or
a ``DataILSVRC_S`` (extract / embed / feature / analysis steps selected by a
``mode`` string such as ``'hbase'``, ``'spark'`` or ``'analysis'``) and wraps
the stages in ``Timer.mark()`` / ``Timer.report()`` pairs.

``Timer`` is expected to come from the ``..common`` star import.
"""
__author__ = 'chunk'

from ..common import *
from ..mdata import ILSVRC, ILSVRC_S
from ..mmodel.svm import SVM2

# Dataset location used by every DataILSVRC instance below, and the short
# name the Spark-mode DataILSVRC_S instances are given instead.
_ILSVRC_BASE_DIR = '/data/hadoop/ImageNet/ILSVRC/ILSVRC2013_DET_val'
_ILSVRC_BASE_NAME = 'ILSVRC2013_DET_val'


def test_ILSVRC(category='Train_100'):
    """Run format, embed, feature extraction and all store steps, timing each.

    :param category: category name forwarded to ``DataILSVRC``.
    """
    timer = Timer()

    # dil = ILSVRC.DataILSVRC(base='/data/hadoop/ImageNet/ILSVRC/ILSVRC2013_DET_val', category='Train')
    dil = ILSVRC.DataILSVRC(base_dir=_ILSVRC_BASE_DIR, category=category,
                            host='master')
    # dil = ILSVRC.DataILSVRC(base='/media/chunk/Elements/D/data/ImageNet/img/ILSVRC2013_DET_val', category='Train_1')

    # Single-argument parenthesised prints emit the same text as the former
    # Python 2 print statements and also parse under Python 3.
    print('[time]category: %s' % category)

    timer.mark()
    print('[time]formatting...')
    dil.format()
    timer.report()

    timer.mark()
    print('[time]embedding...')
    dil.embed(rate=0.2)
    timer.report()

    timer.mark()
    print('[time]extracting...')
    dil.extract_feat(feattype='ibd')
    timer.report()
    # dil.extract_feat(feattype='hog')

    timer.mark()
    dil.store_img()
    timer.report()

    timer.mark()
    dil.store_tag()
    timer.report()

    timer.mark()
    dil.store_info()
    timer.report()

    timer.mark()
    dil.store_feat()
    timer.report()


def train_embed_and_feat_local(category='Train_100', feat_type='ibd'):
    """Re-import images, then extract/embed/extract-features in 'hbase' mode.

    :param category: category name forwarded to both data objects.
    :param feat_type: feature type forwarded to ``_extract_feat``.
    """
    timer = Timer()

    timer.mark()
    dil = ILSVRC.DataILSVRC(base_dir=_ILSVRC_BASE_DIR, category=category,
                            host='master')
    dil.delete_table()
    dil.format()
    dil.store_img()
    timer.report()

    dils = ILSVRC_S.DataILSVRC_S(base=_ILSVRC_BASE_DIR, category=category,
                                 host='master')

    # dils._extract_data(mode='hbase', writeback=True)
    # dils._embed_data(mode='hbase', rate=0.1, readforward=True, writeback=True)
    # dils._extract_feat( mode='hbase', feattype='ibd', readforward=True, writeback=True)

    # NOTE(review): unlike the Spark variant there is no timer.mark() before
    # this stage, so the final report is relative to the earlier mark --
    # confirm whether that is intended.
    dils._extract_data(mode='hbase', writeback=False)
    dils._embed_data(mode='hbase', rate=0.1, readforward=False,
                     writeback=False)
    dils._extract_feat(mode='hbase', feattype=feat_type, readforward=False,
                       writeback=True)
    timer.report()


def train_embed_and_feat_spark(category='Train_100', feat_type='ibd'):
    """Re-import images, then extract/embed/extract-features in 'spark' mode.

    :param category: category name forwarded to both data objects.
    :param feat_type: feature type forwarded to ``_extract_feat``.
    """
    timer = Timer()

    timer.mark()
    # Fixed: this previously passed the undefined name ``categor``, which
    # raised NameError as soon as the function was called.
    dil = ILSVRC.DataILSVRC(base_dir=_ILSVRC_BASE_DIR, category=category,
                            host='master')
    dil.delete_table()
    dil.format()
    dil.store_img()
    timer.report()
    # return

    dils = ILSVRC_S.DataILSVRC_S(base=_ILSVRC_BASE_NAME, category=category,
                                 host='master')

    timer.mark()
    dils._extract_data(mode='spark', writeback=False)
    dils._embed_data(mode='spark', rate=0.2, readforward=False,
                     writeback=False)
    dils._extract_feat(mode='spark', feattype=feat_type, readforward=False,
                       writeback=True, withdata=True)
    timer.report()


def train_feat_label_spark(category='Train_100', label_file='',
                           feat_type='ibd'):
    """Re-import images, tags and info, then run ``_extract_feat_1`` in 'spark' mode.

    :param category: category name forwarded to both data objects.
    :param label_file: forwarded to ``DataILSVRC`` as ``label_file``.
    :param feat_type: feature type forwarded to ``_extract_feat_1``.
    """
    timer = Timer()

    timer.mark()
    dil = ILSVRC.DataILSVRC(base_dir=_ILSVRC_BASE_DIR, category=category,
                            host='master', label_file=label_file)
    dil.delete_table()
    dil.format()
    dil.store_img()
    dil.store_tag()
    dil.store_info()
    timer.report()
    # return

    dils = ILSVRC_S.DataILSVRC_S(base=_ILSVRC_BASE_NAME, category=category,
                                 host='master')

    timer.mark()
    dils._extract_feat_1(mode='spark', feattype=feat_type, readforward=True,
                         writeback=True, withdata=False)
    timer.report()


def train_new_model(table_name='', model_path='res/svm_sklearn1.model',
                    feat_type='ibd'):
    """Load features and class tags from a table and train an sklearn-toolset SVM.

    :param table_name: forwarded to ``DataILSVRC`` as ``tablename``.
    :param model_path: third argument given to ``ModelSVM.train``.
    :param feat_type: feature type forwarded to ``load_data``.
    """
    timer = Timer()

    timer.mark()
    dil = ILSVRC.DataILSVRC(tablename=table_name, host='master')

    # Marked a second time after construction, as in the original;
    # presumably report() measures from the latest mark -- confirm against Timer.
    timer.mark()
    X, Y = dil.load_data(mode='hbase', feattype=feat_type, tagtype='class')
    classifer = SVM2.ModelSVM(toolset='sklearn')
    classifer.train(X, Y, model_path)
    timer.report()


def analysis_local_data_spark(category='Train_100', table_name='',
                              model_path='res/svm_sklearn.model',
                              feat_type='ibd'):
    """Re-import images, tags and info, then extract and analyse in 'analysis' mode.

    :param category: category name forwarded to both data objects.
    :param table_name: accepted for interface compatibility; not used here.
    :param model_path: forwarded to ``_analysis`` as ``model_path``.
    :param feat_type: forwarded to ``_analysis`` as ``feattype``.
    """
    timer = Timer()

    timer.mark()
    dil = ILSVRC.DataILSVRC(base_dir=_ILSVRC_BASE_DIR, category=category,
                            host='master')
    dil.delete_table()
    dil.format()
    dil.store_img()
    dil.store_tag()
    dil.store_info()
    timer.report()
    # return

    dils = ILSVRC_S.DataILSVRC_S(base=_ILSVRC_BASE_NAME, category=category,
                                 host='master')

    timer.mark()
    dils._extract_data(mode='analysis', writeback=False, withdata=False)
    timer.report()

    timer.mark()
    # Fixed: model_path and feat_type used to be ignored in favour of
    # hard-coded literals equal to their defaults; they are now forwarded,
    # as analysis_hbase_data_spark already does.
    dils._analysis(mode='analysis', model_path=model_path,
                   feattype=feat_type, readforward=False, writeback=True,
                   withdata=False)
    timer.report()


def analysis_hbase_data_spark(table_name='MSPIDER',
                              model_path='res/svm_sklearn.model',
                              feat_type='ibd'):
    """Extract and analyse the rows of an existing table in 'analysis' mode.

    :param table_name: forwarded to ``DataILSVRC_S`` as ``tablename``.
    :param model_path: forwarded to ``_analysis`` as ``model_path``.
    :param feat_type: forwarded to ``_analysis`` as ``feattype``.
    """
    timer = Timer()

    # timer.mark()
    # dil = ILSVRC.DataILSVRC(base_dir='/data/hadoop/ImageNet/ILSVRC/ILSVRC2013_DET_val', category=category,host='master')
    # dil.delete_table()
    #
    # dil.format()
    # dil.store_img()
    # timer.report()
    #
    # return

    dils = ILSVRC_S.DataILSVRC_S(tablename=table_name, host='master')

    timer.mark()
    dils._extract_data(mode='analysis', writeback=False)
    timer.report()

    timer.mark()
    dils._analysis(mode='analysis', model_path=model_path,
                   feattype=feat_type, readforward=False, writeback=True,
                   withdata=False)
    timer.report()


def export_hbase_to_dir(type_name='tagged', table_name='MSPIDER', dst_dir=''):
    """Export table data via ``DataILSVRC.export_data`` and time the export.

    :param type_name: forwarded to ``export_data`` as ``type_name``.
    :param table_name: forwarded to ``DataILSVRC`` as ``tablename``.
    :param dst_dir: forwarded to ``export_data`` as ``dst_dir``.
    """
    timer = Timer()
    dil = ILSVRC.DataILSVRC(base_dir=_ILSVRC_BASE_DIR, tablename=table_name,
                            host='master')

    # Fixed: mark() used to run after the export, immediately before
    # report(), so the measured interval never covered the export itself.
    timer.mark()
    dil.export_data(mode='hbase', tagtype='class', type_name=type_name,
                    dst_dir=dst_dir)
    timer.report()


def test_ILSVRC_S():
    """Run the Spark-flavoured DataILSVRC_S test."""
    # test_ILSVRC_S_LOCAL()
    # NOTE(review): test_ILSVRC_S_SPARK is not defined in this module; unless
    # the ``..common`` star import provides it this call raises NameError.
    test_ILSVRC_S_SPARK()


def test_ILSVRC_IMPORT(category='Train_1000'):
    """Drop the table and store the images of ``category`` again.

    :param category: category name forwarded to ``DataILSVRC``.
    """
    dil = ILSVRC.DataILSVRC(base_dir=_ILSVRC_BASE_DIR, category=category,
                            host='master')
    dil.delete_table()
    # dil.format()
    dil.store_img()


def test_ILSVRC_EXPORT(category='Train_1000'):
    """Placeholder; intentionally does nothing."""
    pass


def test_pipeline():
    """Run extract, embed and feature extraction in 'spark' mode on base 'MSPIDER'."""
    timer = Timer()
    timer.mark()
    dils = ILSVRC_S.DataILSVRC_S(base='MSPIDER', category=None)
    dils._extract_data(mode='spark', writeback=False)
    dils._embed_data(mode='spark', rate=0.1, readforward=False,
                     writeback=False)
    dils._extract_feat(mode='spark', feattype='ibd', readforward=False,
                       writeback=True, withdata=True)
    timer.report()


if __name__ == '__main__':
    # test_MSR()
    # test_CV()
    # test_ILSVRC()
    # test_ILSVRC_S()
    test_pipeline()
    print('helllo')