24 from daal.algorithms
import classifier
25 from daal.algorithms.stump
import training, prediction
26 from daal.data_management
import (
27 FileDataSource, DataSourceIface, HomogenNumericTable, MergedNumericTable, NumericTableIface
# Put the parent of this script's directory on sys.path so that the ``utils``
# module imported below can be resolved when the example is run directly.
# Relies on ``os`` and ``sys`` being imported above the visible portion of
# the file.
utils_folder = os.path.realpath(os.path.abspath(os.path.dirname(os.path.dirname(__file__))))
if utils_folder not in sys.path:
    sys.path.insert(0, utils_folder)
from utils import printNumericTables
# Relative location of the example data sets.
DAAL_PREFIX = os.path.join('..', 'data')

# Input data set parameters: CSV files used for training and for testing.
trainDatasetFileName = os.path.join(DAAL_PREFIX, 'batch', 'stump_train.csv')
testDatasetFileName = os.path.join(DAAL_PREFIX, 'batch', 'stump_test.csv')

# Module-level placeholders; both are rebound by the prediction steps
# further down (see the ``global predictionResult, testGroundTruth`` line).
predictionResult = None
testGroundTruth = None
# Training steps: load the training CSV, then fit the stump model.
#
# NOTE(review): in the visible text this FileDataSource call had neither a
# file-name argument nor a closing parenthesis. trainDatasetFileName is
# assumed to be the intended first argument -- confirm against the upstream
# example before merging.
# NOTE(review): nFeatures is not defined in the visible portion of the file;
# it must be provided elsewhere.
trainDataSource = FileDataSource(
    trainDatasetFileName,
    DataSourceIface.notAllocateNumericTable,
    DataSourceIface.doDictionaryFromContext
)

# Separate tables for the features and for the single label column, both
# created with doNotAllocate, combined into one merged table for loading.
trainData = HomogenNumericTable(nFeatures, 0, NumericTableIface.doNotAllocate)
trainGroundTruth = HomogenNumericTable(1, 0, NumericTableIface.doNotAllocate)
mergedData = MergedNumericTable(trainData, trainGroundTruth)

# Load the data source into the merged table.
trainDataSource.loadDataBlock(mergedData)

# Batch training algorithm from daal.algorithms.stump.training.
algorithm = training.Batch()

# Hand the feature table and the label table to the algorithm.
algorithm.input.set(classifier.training.data, trainData)
algorithm.input.set(classifier.training.labels, trainGroundTruth)

# Run training; the result is read later via
# trainingResult.get(classifier.training.model).
trainingResult = algorithm.compute()
# Prediction steps: load the test CSV and classify it with the trained model.
#
# NOTE(review): the ``global`` statement implies these steps belong inside a
# function whose ``def`` line is not visible here; restore the header (and
# indent this body accordingly) if it is missing from the real file.
global predictionResult, testGroundTruth

# NOTE(review): in the visible text this FileDataSource call had neither a
# file-name argument nor a closing parenthesis. testDatasetFileName is
# assumed to be the intended first argument -- confirm against the upstream
# example before merging.
testDataSource = FileDataSource(
    testDatasetFileName,
    DataSourceIface.notAllocateNumericTable,
    DataSourceIface.doDictionaryFromContext
)

# Separate tables for the features and for the single ground-truth column,
# both created with doNotAllocate, combined into one merged table for loading.
testData = HomogenNumericTable(nFeatures, 0, NumericTableIface.doNotAllocate)
testGroundTruth = HomogenNumericTable(1, 0, NumericTableIface.doNotAllocate)
mergedData = MergedNumericTable(testData, testGroundTruth)

# Load the data source into the merged table.
testDataSource.loadDataBlock(mergedData)

# Batch prediction algorithm from daal.algorithms.stump.prediction.
algorithm = prediction.Batch()

# Supply the test features and the model taken from the training result.
algorithm.input.setTable(classifier.prediction.data, testData)
algorithm.input.setModel(classifier.prediction.model,
                         trainingResult.get(classifier.training.model))

# Run prediction; the result is stored in the module-level predictionResult.
predictionResult = algorithm.compute()
# NOTE(review): these lines are the tail of a call whose opening line(s) are
# not visible here (the callee and any leading argument are missing).
# Presumably this is the printNumericTables call imported from utils, with
# the ground-truth table as the first argument -- confirm before repairing.
# The visible arguments are the prediction table, two captions, a title,
# the number 20 and flt64=False.
108 predictionResult.get(classifier.prediction.prediction),
109 "Ground truth",
"Classification results",
110 "Stump classification results (first 20 observations):", 20, flt64=
False)
112 if __name__ ==
"__main__":