merlin namespace
Subpackages
- merlin.dag package
BaseOperator
BaseOperator.compute_selector()
BaseOperator.compute_input_schema()
BaseOperator.compute_output_schema()
BaseOperator.validate_schemas()
BaseOperator.transform()
BaseOperator.column_mapping()
BaseOperator.compute_column_schema()
BaseOperator.dynamic_dtypes
BaseOperator.output_column_names()
BaseOperator.dependencies
BaseOperator.output_dtype
BaseOperator.output_tags
BaseOperator.output_properties
BaseOperator.label
BaseOperator.create_node()
BaseOperator.supports
BaseOperator.supported_formats
Graph
Node
Node.selector
Node.add_dependency()
Node.add_parent()
Node.add_child()
Node.remove_child()
Node.compute_schemas()
Node.validate_schemas()
Node.remove_inputs()
Node.exportable()
Node.parents_with_dependencies
Node.grouped_parents_with_dependencies
Node.input_columns
Node.output_columns
Node.column_mapping
Node.dependency_columns
Node.label
Node.graph
Node.Nodable
Node.construct_from()
ColumnSelector
- merlin.io package
Dataset
Dataset.to_ddf()
Dataset.file_partition_map
Dataset.partition_lens
Dataset.to_cpu()
Dataset.to_gpu()
Dataset.shuffle_by_keys()
Dataset.repartition()
Dataset.merge()
Dataset.to_iter()
Dataset.to_parquet()
Dataset.compute()
Dataset.head()
Dataset.persist()
Dataset.tail()
Dataset.to_hugectr()
Dataset.num_rows
Dataset.npartitions
Dataset.validate_dataset()
Dataset.regenerate_dataset()
Dataset.infer_schema()
Dataset.sample_dtypes()
- merlin.schema package
Schema
Schema.column_names
Schema.select()
Schema.apply()
Schema.excluding()
Schema.apply_inverse()
Schema.select_by_tag()
Schema.excluding_by_tag()
Schema.remove_by_tag()
Schema.select_by_name()
Schema.excluding_by_name()
Schema.remove_col()
Schema.without()
Schema.get()
Schema.first
Schema.to_pandas()
Schema.copy()
ColumnSchema
ColumnSchema.name
ColumnSchema.tags
ColumnSchema.properties
ColumnSchema.dtype
ColumnSchema.is_list
ColumnSchema.is_ragged
ColumnSchema.dims
ColumnSchema.shape
ColumnSchema.with_name()
ColumnSchema.with_tags()
ColumnSchema.with_properties()
ColumnSchema.with_dtype()
ColumnSchema.with_shape()
ColumnSchema.int_domain
ColumnSchema.float_domain
ColumnSchema.value_count
Tags
Tags.CATEGORICAL
Tags.CONTINUOUS
Tags.LIST
Tags.SEQUENCE
Tags.TEXT
Tags.TOKENIZED
Tags.TIME
Tags.EMBEDDING
Tags.ID
Tags.USER
Tags.ITEM
Tags.SESSION
Tags.CONTEXT
Tags.TARGET
Tags.REGRESSION
Tags.CLASSIFICATION
Tags.BINARY
Tags.MULTI_CLASS
Tags.USER_ID
Tags.ITEM_ID
Tags.SESSION_ID
Tags.TEXT_TOKENIZED
Tags.BINARY_CLASSIFICATION
Tags.MULTI_CLASS_CLASSIFICATION