# test_spark.py (1.04 KB)
__author__ = 'chunk'

from common import *

from mdata import MSR, CV
from mmodel import SVM
from mspark import SC


# Module-level timer instance. `Timer` is not imported by name in this file;
# presumably it is provided by `from common import *` -- TODO confirm.
# NOTE(review): `timer` is not referenced by any function visible in this file.
timer = Timer()


def test_spark_io():
    """Placeholder for a Spark I/O test; currently does nothing.

    Returns:
        None.
    """
    return None


def test_spark_ml():
    """Train an SVM through the Spark wrapper and print one prediction per file.

    Builds an ``SC.Sparker`` pointed at the ``spark://HPC-server:7077``
    master, trains it on the ``(X, Y)`` pair returned by
    ``CV.DataCV().load_data()``, then walks ``data/467/`` and, for every file
    found, prints the file name followed by the prediction for its ``'hog'``
    feature.

    Returns:
        None. Results are written to stdout.
    """
    # `os` is not imported explicitly at the top of this file; import it here
    # rather than relying on `from common import *` to provide it.
    import os

    sparker = SC.Sparker(host='HPC-server', appname='ImageCV',
                         master='spark://HPC-server:7077')
    dcv = CV.DataCV()
    X, Y = dcv.load_data()
    sparker.train_svm(X, Y)

    for path, _subdirs, files in os.walk('data/467/'):
        for name in files:
            imgpath = os.path.join(path, name)
            feat = dcv.get_feat(imgpath, 'hog')
            # A single pre-formatted argument prints "name prediction" under
            # both the Python 2 print statement and the Python 3 print
            # function (the original `print a, b` is Python-2-only syntax).
            print('%s %s' % (name, sparker.predict(feat)))


def test_SVM_CV():
    """Train a local ``SVM.ModelSVM`` and print predictions and a test score.

    Loads ``(X, Y)`` via ``CV.DataCV().load_data()``, trains the model on it,
    then walks ``data/467/`` and, for every file found, prints the file name
    followed by the model's prediction for its ``'hog'`` feature. Finally
    prints the result of ``msvm.test(X, Y)``.

    Returns:
        None. Results are written to stdout.
    """
    # `os` is not imported explicitly at the top of this file; import it here
    # rather than relying on `from common import *` to provide it.
    import os

    dcv = CV.DataCV()
    X, Y = dcv.load_data()
    msvm = SVM.ModelSVM()
    msvm.train(X, Y)

    for path, _subdirs, files in os.walk('data/467/'):
        for name in files:
            imgpath = os.path.join(path, name)
            feat = dcv.get_feat(imgpath, 'hog')
            # A single pre-formatted argument prints "name prediction" under
            # both the Python 2 print statement and the Python 3 print
            # function (the original `print a, b` is Python-2-only syntax).
            print('%s %s' % (name, msvm.predict(feat)))

    # NOTE: the model is scored on the same (X, Y) it was trained on, so this
    # is a training-set figure, not a held-out one.
    # Previously observed: 0.948892561983 for svm_cv, 0.989024793388 for svm_sk
    print(msvm.test(X, Y))


# Script entry point: run the local SVM check, then print a marker line.
if __name__ == '__main__':
    test_SVM_CV()
    # Parenthesised single argument works as both the Python 2 print
    # statement and the Python 3 print function.
    print('helllo')