27 from daal.data_management
import FileDataSource, CsvDataSourceOptions, modifiers, features
28 from daal.data_management.modifiers
import csv
# Put the directory one level above this file's directory on sys.path so that
# the sibling ``utils`` module can be imported below.
utils_folder = os.path.realpath(
    os.path.abspath(os.path.dirname(os.path.dirname(__file__)))
)
if utils_folder not in sys.path:
    sys.path.insert(0, utils_folder)
from utils import printNumericTable
# Relative path of the CSV file used by every data source in this file.
csvFileName = "../data/batch/mixed_text_and_numbers.csv"

# Data source options: the allocateNumericTable, createDictionaryFromContext
# and parseHeader flags combined with bitwise OR.
csvOptions = CsvDataSourceOptions(
    CsvDataSourceOptions.allocateNumericTable
    | CsvDataSourceOptions.createDictionaryFromContext
    | CsvDataSourceOptions.parseHeader
)
# Default read: a data source with no feature modifiers registered.
# NOTE(review): these statements run at module level (on import); the message
# text suggests they once lived in a ``readDefault`` function -- confirm.
ds = FileDataSource(csvFileName, csvOptions)

# The data source's numeric table is filled by loadDataBlock(); it must run
# before getNumericTable() is asked for the result.
ds.loadDataBlock()

printNumericTable(ds.getNumericTable(), "readDefault function result:")
def readOnlySpecifiedColumnIndices():
    """Load the CSV with an automatic modifier on column indices 0, 1 and 5.

    Creates a data source for ``csvFileName`` with ``csvOptions``, registers
    ``modifiers.csv.automatic()`` for the index list ``[0, 1, 5]``, loads the
    data and prints the resulting numeric table.
    """
    source = FileDataSource(csvFileName, csvOptions)

    # Diagnostic output kept from the original: prints the modifier object.
    print(modifiers.csv.automatic())

    # Modifiers have to be registered before the data is loaded.
    source.getFeatureManager().addModifier([0, 1, 5], modifiers.csv.automatic())

    # Fill the numeric table; without this call getNumericTable() has no
    # loaded data to return.
    source.loadDataBlock()

    printNumericTable(
        source.getNumericTable(),
        "readOnlySpecifiedColumnIndices function result:",
    )
def readOnlySpecifiedColumnNames():
    """Load the CSV with an automatic modifier on two columns chosen by name.

    Creates a data source for ``csvFileName`` with ``csvOptions``, registers
    ``modifiers.csv.automatic()`` for the columns ``"Numeric1"`` and
    ``"Categorical0"``, loads the data and prints the resulting numeric table.
    """
    source = FileDataSource(csvFileName, csvOptions)

    # Modifiers have to be registered before the data is loaded.
    selected_columns = ["Numeric1", "Categorical0"]
    source.getFeatureManager().addModifier(selected_columns, modifiers.csv.automatic())

    # Fill the numeric table; without this call getNumericTable() has no
    # loaded data to return.
    source.loadDataBlock()

    printNumericTable(
        source.getNumericTable(),
        "readOnlySpecifiedColumnNames function result:",
    )
def readUsingMultipleModifiers():
    """Load the CSV with two different modifiers registered on the same source.

    ``"Numeric1"`` gets ``modifiers.csv.continuous()``; column index 6 and
    ``"Categorical1"`` get ``modifiers.csv.categorical()``. The data is then
    loaded and the resulting numeric table is printed.
    """
    source = FileDataSource(csvFileName, csvOptions)

    # Register both modifiers, in this order, before the data is loaded.
    manager = source.getFeatureManager()
    manager.addModifier(["Numeric1"], modifiers.csv.continuous())
    manager.addModifier([6, "Categorical1"], modifiers.csv.categorical())

    # Fill the numeric table; without this call getNumericTable() has no
    # loaded data to return.
    source.loadDataBlock()

    printNumericTable(
        source.getNumericTable(),
        "readUsingMultipleModifiers function result:",
    )
if __name__ == "__main__":
    # Run the column-selection examples one after another, in the same order
    # as before: by index, by name, then with multiple modifiers.
    for example in (
        readOnlySpecifiedColumnIndices,
        readOnlySpecifiedColumnNames,
        readUsingMultipleModifiers,
    ):
        example()