# test_data.py 3.4 KB
__author__ = 'chunk'

from ..common import *

from ..mdata import ILSVRC, ILSVRC_S


def test_ILSVRC(category='Train_100'):
    """Run format, embed and feature extraction on an ``ILSVRC.DataILSVRC``.

    A ``DataILSVRC`` is created over the ILSVRC2013_DET_val directory for
    ``category``; then ``format()``, ``embed(rate=0.2)`` and
    ``extract_feat(feattype='ibd')`` are called in that order.  Each call is
    bracketed by ``timer.mark()`` / ``timer.report()`` and preceded by a
    ``[time]`` progress line on stdout.

    Args:
        category: category name handed unchanged to ``DataILSVRC``.
    """
    timer = Timer()

    dil = ILSVRC.DataILSVRC(base_dir='/data/hadoop/ImageNet/ILSVRC/ILSVRC2013_DET_val',
                            category=category)

    # Single-argument print(...) produces the same output whether ``print`` is
    # the Python 2 statement or the Python 3 function, so the module no longer
    # fails to parse on Python 3.
    print('[time]category: %s' % (category,))

    # (progress line, step) pairs, executed strictly in this order.
    phases = (
        ('[time]formatting...', lambda: dil.format()),
        ('[time]embedding...', lambda: dil.embed(rate=0.2)),
        ('[time]extracting...', lambda: dil.extract_feat(feattype='ibd')),
    )
    for banner, run_phase in phases:
        timer.mark()
        print(banner)
        run_phase()
        timer.report()

    # The 'hog' feature extraction and the store_img / store_tag / store_info /
    # store_feat steps are intentionally not exercised by this test.


def test_ILSVRC_S_LOCAL():
    """Drive the ``mode='hbase'`` stages of ``ILSVRC_S.DataILSVRC_S`` on ``Train_2``.

    First an ``ILSVRC.DataILSVRC`` for the same directory and category has
    ``delete_table()``, ``format()`` and ``store_img()`` called on it.  Then a
    ``DataILSVRC_S`` runs ``_extract_data``, ``_embed_data`` (rate 0.1) and
    ``_extract_feat`` (feattype ``'ibd'``); only the last call is made with
    ``writeback=True``.
    """
    stopwatch = Timer()
    data_root = '/data/hadoop/ImageNet/ILSVRC/ILSVRC2013_DET_val'
    subset = 'Train_2'

    # Phase 1: reset the table and store the images.
    stopwatch.mark()
    source = ILSVRC.DataILSVRC(base_dir=data_root, category=subset)
    source.delete_table()
    source.format()
    source.store_img()
    stopwatch.report()

    # Phase 2: the three hbase-mode stages.
    # NOTE(review): no mark() is issued before the final report(), unlike
    # test_ILSVRC_S_SPARK -- presumably the second report is measured from the
    # mark() above; confirm against Timer whether that is intended.
    staged = ILSVRC_S.DataILSVRC_S(base=data_root, category=subset)

    hbase = 'hbase'
    staged._extract_data(mode=hbase, writeback=False)
    staged._embed_data(mode=hbase, rate=0.1, readforward=False, writeback=False)
    staged._extract_feat(mode=hbase, feattype='ibd', readforward=False, writeback=True)

    stopwatch.report()


def test_ILSVRC_S_SPARK(category='Train_1000'):
    """Drive the ``mode='spark'`` stages of ``ILSVRC_S.DataILSVRC_S``.

    An ``ILSVRC.DataILSVRC`` for ``category`` first has ``delete_table()``,
    ``format()`` and ``store_img()`` called on it inside one mark/report
    window.  A ``DataILSVRC_S`` then runs ``_extract_data``, ``_embed_data``
    (rate 0.2) and ``_extract_feat`` (feattype ``'ibd'``, ``withdata=True``),
    each inside its own ``mark()`` / ``report()`` window.

    Args:
        category: category name passed to both dataset constructors.
    """
    clock = Timer()

    # Preparation window: table reset plus image storage.
    clock.mark()
    raw = ILSVRC.DataILSVRC(base_dir='/data/hadoop/ImageNet/ILSVRC/ILSVRC2013_DET_val',
                            category=category)
    raw.delete_table()
    raw.format()
    raw.store_img()
    clock.report()

    spark_set = ILSVRC_S.DataILSVRC_S(base='ILSVRC2013_DET_val', category=category)

    # The stages run in order; only the last one is called with writeback=True.
    stages = (
        lambda: spark_set._extract_data(mode='spark', writeback=False),
        lambda: spark_set._embed_data(mode='spark', rate=0.2, readforward=False,
                                      writeback=False),
        lambda: spark_set._extract_feat(mode='spark', feattype='ibd', readforward=False,
                                        writeback=True, withdata=True),
    )
    for stage in stages:
        clock.mark()
        stage()
        clock.report()


def test_ILSVRC_S():
    """Run the ``DataILSVRC_S`` test; currently only the Spark variant."""
    # The hbase variant (test_ILSVRC_S_LOCAL) is deliberately not invoked here.
    test_ILSVRC_S_SPARK()


def test_pipeline():
    """Run the three Spark-mode ``DataILSVRC_S`` stages for base ``'MSPIDER'``.

    ``_extract_data``, ``_embed_data`` (rate 0.1) and ``_extract_feat``
    (feattype ``'ibd'``, ``withdata=True``) are called back to back inside a
    single ``mark()`` / ``report()`` window; only the last call is made with
    ``writeback=True``.
    """
    clock = Timer()
    clock.mark()

    spider = ILSVRC_S.DataILSVRC_S(base='MSPIDER', category=None)

    engine = 'spark'
    spider._extract_data(mode=engine, writeback=False)
    spider._embed_data(mode=engine, rate=0.1, readforward=False, writeback=False)
    spider._extract_feat(mode=engine, feattype='ibd', readforward=False,
                         writeback=True, withdata=True)

    clock.report()


if __name__ == '__main__':
    # Script entry point: only the pipeline run is enabled.  The other runs
    # (test_ILSVRC, test_ILSVRC_S) stay disabled.
    test_pipeline()

    # Parenthesised single-argument form prints the same text as the bare
    # print statement.
    print('helllo')