26 from daal
import step1Local, step2Master
27 from daal.algorithms
import pca
28 from daal.data_management
import FileDataSource, DataSourceIface
# Put the parent of this script's directory on sys.path so that the `utils`
# helper module imported just below can be found.
# __file__ is made absolute *before* taking the directory names: with a
# relative __file__ such as 'script.py' or '../script.py' the double dirname()
# would otherwise collapse to '' and resolve to the current working directory
# instead of the intended parent folder.
utils_folder = os.path.realpath(
    os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
)
if utils_folder not in sys.path:
    sys.path.insert(0, utils_folder)
33 from utils
import printNumericTable
# Directory holding the example data sets, given as a relative path.
DAAL_PREFIX = os.path.join('..', 'data')

# One CSV input file per data block; the driver loop reads dataFileNames[i]
# for block i.
dataFileNames = [
    os.path.join(DAAL_PREFIX, 'distributed', 'pca_normalized_1.csv'),
    os.path.join(DAAL_PREFIX, 'distributed', 'pca_normalized_2.csv'),
    os.path.join(DAAL_PREFIX, 'distributed', 'pca_normalized_3.csv'),
    os.path.join(DAAL_PREFIX, 'distributed', 'pca_normalized_4.csv'),
]
if __name__ == "__main__":
    # NOTE(review): nBlocks, nVectorsInBlock and the `np` (numpy) alias are
    # not defined in the visible part of this file; they are expected to be
    # provided at module level -- confirm before running.

    # Step-2 (master) PCA algorithm: it receives the partial result computed
    # for every data block and produces the final result from them.
    masterAlgorithm = pca.Distributed(step2Master, fptype=np.float64)

    for i in range(nBlocks):
        # Data source for block i, backed by the i-th input CSV file.
        dataSource = FileDataSource(
            dataFileNames[i],
            DataSourceIface.doAllocateNumericTable,
            DataSourceIface.doDictionaryFromContext
        )

        # Load up to nVectorsInBlock rows from the file into the numeric table.
        dataSource.loadDataBlock(nVectorsInBlock)

        # Step-1 (local) PCA algorithm, created afresh for each block.
        localAlgorithm = pca.Distributed(step1Local, fptype=np.float64)

        # Feed the block's numeric table to the local algorithm.
        localAlgorithm.input.setDataset(pca.data, dataSource.getNumericTable())

        # Compute the block's partial result and register it with the master.
        masterAlgorithm.input.add(pca.partialResults, localAlgorithm.compute())

    # Merge the collected partial results, then build the final PCA result.
    masterAlgorithm.compute()
    result = masterAlgorithm.finalizeCompute()

    # Print the results.
    printNumericTable(result.get(pca.eigenvalues), "Eigenvalues:")
    printNumericTable(result.get(pca.eigenvectors), "Eigenvectors:")