import os
import sys

from daal import step1Local, step2Master
from daal.algorithms import pca
from daal.data_management import FileDataSource, DataSourceIface
# Resolve the parent of the directory that contains this file and put it at the
# front of sys.path (only if it is not already listed), so that modules living
# there can be imported by the statements that follow.
utils_folder = os.path.realpath(os.path.abspath(os.path.dirname(os.path.dirname(__file__))))
if utils_folder not in sys.path:
    sys.path.insert(0, utils_folder)
# Imported here rather than at the top of the file: this statement sits after
# the sys.path adjustment that precedes it.
from utils import printNumericTable
# Relative path to the directory that holds the example data sets.
DAAL_PREFIX = os.path.join('..', 'data')

# Input CSV files, indexed by block number in the __main__ section.
# NOTE(review): the assignment target and the enclosing brackets were missing
# from this excerpt; the name `dataFileNames` is inferred from the
# `dataFileNames[i]` lookup in the __main__ section -- confirm.
dataFileNames = [
    os.path.join(DAAL_PREFIX, 'distributed', 'pca_normalized_1.csv'),
    os.path.join(DAAL_PREFIX, 'distributed', 'pca_normalized_2.csv'),
    os.path.join(DAAL_PREFIX, 'distributed', 'pca_normalized_3.csv'),
    os.path.join(DAAL_PREFIX, 'distributed', 'pca_normalized_4.csv'),
]
# Script entry point: run the local PCA step on each input block, feed every
# partial result to the master-step algorithm, then finalize and print.
#
# NOTE(review): `nBlocks`, `nVectorsInBlock` and `dataFileNames` are read from
# module scope; not all of their definitions are visible in this excerpt --
# confirm they are defined before this guard.
if __name__ == "__main__":

    # Master-step algorithm object that collects the partial results.
    masterAlgorithm = pca.Distributed(step2Master)

    for i in range(nBlocks):
        # Data source for the i-th input file.
        dataSource = FileDataSource(
            dataFileNames[i], DataSourceIface.doAllocateNumericTable,
            DataSourceIface.doDictionaryFromContext
        )

        # Load a block from the file; nVectorsInBlock is passed as the
        # block-size argument.
        dataSource.loadDataBlock(nVectorsInBlock)

        # Local-step algorithm object for this block.
        localAlgorithm = pca.Distributed(step1Local)

        # Use the loaded numeric table as the local algorithm's input data.
        localAlgorithm.input.setDataset(pca.data, dataSource.getNumericTable())

        # Run the local step and register its result with the master algorithm.
        masterAlgorithm.input.add(pca.partialResults, localAlgorithm.compute())

    # Run the master step over the collected partial results and finalize.
    masterAlgorithm.compute()
    result = masterAlgorithm.finalizeCompute()

    # Print the results.
    printNumericTable(result.get(pca.eigenvalues), "Eigenvalues:")
    printNumericTable(result.get(pca.eigenvectors), "Eigenvectors:")