25 from daal.data_management
import FileDataSource, CsvDataSourceOptions, modifiers, features
26 from daal.data_management.modifiers
import csv
# Resolve the directory one level above this script's own directory and make
# sure it is on the import path (presumably this is where the ``utils`` module
# imported below lives -- confirm against the examples layout).
utils_folder = os.path.realpath(
    os.path.abspath(os.path.dirname(os.path.dirname(__file__)))
)
if utils_folder not in sys.path:
    # Prepend so that this folder is searched before the existing entries.
    sys.path.insert(0, utils_folder)
from utils import printNumericTable
# Path of the CSV file read by every example below.
csvFileName = "../data/batch/mixed_text_and_numbers.csv"

# Options shared by every FileDataSource created in this file: the three
# CsvDataSourceOptions flags are combined with bitwise OR.
csvOptions = CsvDataSourceOptions(
    CsvDataSourceOptions.allocateNumericTable
    | CsvDataSourceOptions.createDictionaryFromContext
    | CsvDataSourceOptions.parseHeader
)
# NOTE(review): the label printed below suggests these statements belong to a
# ``readDefault`` function, but no such ``def`` is visible in this part of the
# file, so they are kept as module-level statements -- confirm.
ds = FileDataSource(csvFileName, csvOptions)

# No modifiers are registered here. The data has to be loaded explicitly;
# without this call the numeric table is printed before anything was read.
ds.loadDataBlock()

printNumericTable(ds.getNumericTable(), "readDefault function result:")
def readOnlySpecifiedColumnIndices():
    """Read the CSV with the automatic modifier bound to column indices.

    Creates a ``FileDataSource`` over ``csvFileName`` with ``csvOptions``,
    registers ``modifiers.csv.automatic()`` for the columns with indices
    0, 1 and 5, loads the data and prints the resulting numeric table.

    NOTE(review): judging by the function name, only the listed columns are
    expected to appear in the output table -- confirm against the DAAL docs.
    """
    ds = FileDataSource(csvFileName, csvOptions)

    # Modifiers must be registered before the data is loaded.
    ds.getFeatureManager().addModifier([0, 1, 5], modifiers.csv.automatic())

    # Actually read the file; without this the table below is never filled.
    ds.loadDataBlock()

    printNumericTable(ds.getNumericTable(),
                      "readOnlySpecifiedColumnIndices function result:")
def readOnlySpecifiedColumnNames():
    """Read the CSV with the automatic modifier bound to column names.

    Creates a ``FileDataSource`` over ``csvFileName`` with ``csvOptions``,
    registers ``modifiers.csv.automatic()`` for the columns named
    "Numeric1" and "Categorical0", loads the data and prints the resulting
    numeric table.

    NOTE(review): judging by the function name, only the listed columns are
    expected to appear in the output table -- confirm against the DAAL docs.
    """
    ds = FileDataSource(csvFileName, csvOptions)

    # Columns are addressed by header name here; modifiers must be registered
    # before the data is loaded.
    ds.getFeatureManager().addModifier(["Numeric1", "Categorical0"],
                                       modifiers.csv.automatic())

    # Actually read the file; without this the table below is never filled.
    ds.loadDataBlock()

    printNumericTable(ds.getNumericTable(),
                      "readOnlySpecifiedColumnNames function result:")
def readUsingMultipleModifiers():
    """Read the CSV with two different modifiers registered.

    Creates a ``FileDataSource`` over ``csvFileName`` with ``csvOptions`` and
    registers, on its feature manager:

    * ``modifiers.csv.continuous()`` for the column named "Numeric1";
    * ``modifiers.csv.categorical()`` for the column with index 6 and the
      column named "Categorical1" (indices and names are mixed in one list).

    The data is then loaded and the resulting numeric table is printed.
    """
    ds = FileDataSource(csvFileName, csvOptions)

    # Both modifiers must be registered before the data is loaded.
    fm = ds.getFeatureManager()
    fm.addModifier(["Numeric1"], modifiers.csv.continuous())
    fm.addModifier([6, "Categorical1"], modifiers.csv.categorical())

    # Actually read the file; without this the table below is never filled.
    ds.loadDataBlock()

    printNumericTable(ds.getNumericTable(),
                      "readUsingMultipleModifiers function result:")
if __name__ == "__main__":
    # Run every example in turn, in the order they are defined above.
    for example in (
        readOnlySpecifiedColumnIndices,
        readOnlySpecifiedColumnNames,
        readUsingMultipleModifiers,
    ):
        example()