Fill NA

Example

>>> # Copies the example database into the processed data folder
>>> import shutil
>>> shutil.copy("examples/fintech/database.csv.zip", "examples/fintech/data/processed/database.csv.zip")
'examples/fintech/data/processed/database.csv.zip'
>>> import pandas as pd
>>> from techminer2.database.operators import TransformOperator
>>> TransformOperator(
...     field="index_keywords_raw",
...     other_field="na_field",
...     root_directory="examples/fintech/",
...     transformation_function=lambda x: pd.NA,
... ).run()
>>> # Queries the database to count the NA values in the new field
>>> from techminer2.io import Query
>>> query = (
...     Query()
...     .with_query_expression("SELECT na_field FROM database;")
...     .where_root_directory("examples/fintech/")
...     .where_database("main")
...     .where_record_years_range(None, None)
...     .where_record_citations_range(None, None)
... )
>>> df = query.run()
>>> int(df.na_field.isna().sum())
50
>>> # Creates, configures, and runs the operator
>>> from techminer2.database.operators import FillNAOperator
>>> fillna_operator = (
...     FillNAOperator()
...     #
...     # FIELDS:
...     .with_field("na_field")
...     .with_other_field("index_keywords_raw")
...     #
...     # DATABASE:
...     .where_root_directory("examples/fintech/")
... )
>>> fillna_operator.run()
>>> # Queries the database again to check how many NA values remain after filling
>>> from techminer2.io import Query
>>> query = (
...     Query()
...     .with_query_expression("SELECT na_field FROM database;")
...     .where_root_directory("examples/fintech/")
...     .where_database("main")
...     .where_record_years_range(None, None)
...     .where_record_citations_range(None, None)
... )
>>> df = query.run()
>>> int(df.na_field.isna().sum())
31
>>> # Deletes the field
>>> from techminer2.database.operators import DeleteOperator
>>> DeleteOperator(
...     field="na_field",
...     root_directory="examples/fintech/",
... ).run()
class techminer2.operations.coalesce_column.CoalesceColumn(**kwargs)[source]

Bases: ParamsMixin

run()[source]