47 from daal.algorithms
import classifier
48 from daal.algorithms.stump
import training, prediction
49 from daal.data_management
import (
50 FileDataSource, DataSourceIface, HomogenNumericTable, MergedNumericTable, NumericTableIface
# Put the parent of this script's directory on sys.path so the `utils` module
# imported right after this block can be found.
# The path is made absolute BEFORE taking dirname twice: with a relative
# __file__ such as "stump_batch.py", dirname(dirname(...)) collapses to "" and
# would otherwise resolve to the current working directory instead.
utils_folder = os.path.realpath(
    os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
)
if utils_folder not in sys.path:
    # Insert at the front so this folder takes precedence over later entries.
    sys.path.insert(0, utils_folder)
56 from utils
import printNumericTables
# Root folder of the example data sets, given as a relative path.
DAAL_PREFIX = os.path.join('..', 'data')

# CSV files used by this batch-mode stump example: one for training, one for testing.
trainDatasetFileName = os.path.join(DAAL_PREFIX, 'batch', 'stump_train.csv')
testDatasetFileName = os.path.join(DAAL_PREFIX, 'batch', 'stump_test.csv')
# Module-level slots for the prediction output and the test labels. A later
# section of this file declares both names `global` and assigns them; until
# then they are None.
predictionResult = None
testGroundTruth = None
# Training section: loads the training data, configures the stump training
# algorithm and stores its result in `trainingResult`.
# NOTE(review): the header of the enclosing definition is not visible in this view.
#
# Data source for the training set, created with the notAllocateNumericTable and
# doDictionaryFromContext options.
# NOTE(review): the first argument and the closing parenthesis of this call are
# not visible here -- presumably the training CSV file name; confirm.
73 trainDataSource = FileDataSource(
75 DataSourceIface.notAllocateNumericTable,
76 DataSourceIface.doDictionaryFromContext
# Separate tables for the feature columns and for the single label column, both
# created with doNotAllocate, then wrapped in one merged table.
# NOTE(review): `nFeatures` is defined outside the visible lines; the arguments
# are presumably (columns, rows, allocation flag) -- confirm against the DAAL API.
80 trainData = HomogenNumericTable(nFeatures, 0, NumericTableIface.doNotAllocate)
81 trainGroundTruth = HomogenNumericTable(1, 0, NumericTableIface.doNotAllocate)
82 mergedData = MergedNumericTable(trainData, trainGroundTruth)
# Load from the data source into the merged table (which wraps trainData and
# trainGroundTruth).
85 trainDataSource.loadDataBlock(mergedData)
# Batch-mode stump training algorithm.
88 algorithm = training.Batch()
# Register the feature table and the label table as the algorithm's inputs.
91 algorithm.input.set(classifier.training.data, trainData)
92 algorithm.input.set(classifier.training.labels, trainGroundTruth)
# Run training; the result is read later via trainingResult.get(classifier.training.model).
95 trainingResult = algorithm.compute()
# Prediction section: loads the test data, runs the stump prediction algorithm
# with the trained model, and publishes the outputs through module-level names.
# NOTE(review): the header of the enclosing definition is not visible in this view.
#
# Both names are rebound below, so they must be declared global to update the
# module-level variables rather than create locals.
99 global predictionResult, testGroundTruth
# Data source for the test set, created with the same two options as the
# training data source.
# NOTE(review): the first argument and the closing parenthesis of this call are
# not visible here -- presumably the test CSV file name; confirm.
102 testDataSource = FileDataSource(
104 DataSourceIface.notAllocateNumericTable,
105 DataSourceIface.doDictionaryFromContext
# Separate tables for the feature columns and the single label column, wrapped
# in one merged table.
# NOTE(review): `nFeatures` is defined outside the visible lines.
109 testData = HomogenNumericTable(nFeatures, 0, NumericTableIface.doNotAllocate)
110 testGroundTruth = HomogenNumericTable(1, 0, NumericTableIface.doNotAllocate)
111 mergedData = MergedNumericTable(testData, testGroundTruth)
# Load from the data source into the merged table (which wraps testData and
# testGroundTruth).
114 testDataSource.loadDataBlock(mergedData)
# Batch-mode stump prediction algorithm.
117 algorithm = prediction.Batch()
# Inputs: the test feature table and the model taken from the training result.
120 algorithm.input.setTable(classifier.prediction.data, testData)
121 algorithm.input.setModel(classifier.prediction.model,
122 trainingResult.get(classifier.training.model))
# Run prediction and keep the result in the module-level variable.
125 predictionResult = algorithm.compute()
# Tail of a call's argument list: the prediction table taken from
# predictionResult, two captions, a heading, the value 20 and flt64=False.
# NOTE(review): the opening of this call (callee and any earlier arguments) is
# not visible in this view -- presumably printNumericTables, with 20 as the
# number of rows to print; confirm.
131 predictionResult.get(classifier.prediction.prediction),
132 "Ground truth",
"Classification results",
133 "Stump classification results (first 20 observations):", 20, flt64=
False)
135 if __name__ ==
"__main__":