noctis.data_transformation.preprocessing.data_preprocessing.PreprocessorConfig

class noctis.data_transformation.preprocessing.data_preprocessing.PreprocessorConfig(inp_chem_format: str | None = 'smiles', out_chem_format: str | None = None, validation: bool | None = True, output_folder: str | None = 'output', tmp_folder: str | None = None, delete_tmp: bool | None = True, prefix: str | None = None, delimiter: str | None = ',', lineterminator: str | None = None, quotechar: str | None = '"', blocksize: int | None = 600000, chunksize: int | None = 10000, nrows: int | None = None)[source]

Configuration for preprocessing chemical data.

__init__(inp_chem_format: str | None = 'smiles', out_chem_format: str | None = None, validation: bool | None = True, output_folder: str | None = 'output', tmp_folder: str | None = None, delete_tmp: bool | None = True, prefix: str | None = None, delimiter: str | None = ',', lineterminator: str | None = None, quotechar: str | None = '"', blocksize: int | None = 600000, chunksize: int | None = 10000, nrows: int | None = None) → None

Methods

__init__([inp_chem_format, out_chem_format, ...])

build_from_yaml(file_path)

save_to_yaml(file_path)

Attributes

blocksize

chunksize

delete_tmp

delimiter

inp_chem_format

lineterminator

nrows

out_chem_format

output_folder

prefix

quotechar

tmp_folder

validation