Source code for econuy.transform

import warnings
from datetime import datetime
from os import PathLike, getcwd, path
from pathlib import Path
from typing import Union, Optional, Tuple, Dict

import numpy as np
import pandas as pd
from statsmodels.tools.sm_exceptions import X13Error, X13Warning
from statsmodels.tsa import x13
from statsmodels.tsa.x13 import x13_arima_analysis as x13a
from statsmodels.tsa.seasonal import STL, seasonal_decompose

from econuy.utils import metadata, x13util


def convert_usd(df: pd.DataFrame, pipeline=None, errors: str = "raise") -> pd.DataFrame:
    """Convert from Uruguayan pesos to US dollars.

    See Also
    --------
    :meth:`~econuy.core.Pipeline.convert`.

    """
    if errors not in ["raise", "coerce", "ignore"]:
        raise ValueError("'errors' must be one of 'raise', 'coerce' or 'ignore'.")
    if "Moneda" not in df.columns.names:
        raise ValueError("Input dataframe's multiindex requires the 'Moneda' level.")
    if pipeline is None:
        from econuy.core import Pipeline

        pipeline = Pipeline()

    checks = [x == "UYU" for x in df.columns.get_level_values("Moneda")]
    if any(checks):
        if not all(checks) and errors == "raise":
            error_df = df.loc[:, [not check for check in checks]]
            msg = f"{error_df.columns[0][0]} does not have the appropriate metadata."
            return error_handler(df=df, errors=errors, msg=msg)
        pipeline.get(name="nxr_monthly")
        nxr_data = pipeline.dataset
        all_metadata = df.columns.droplevel("Indicador")
        if all(x == all_metadata[0] for x in all_metadata):
            return _convert_usd(df=df, nxr=nxr_data)
        else:
            columns = []
            for column_name, check in zip(df.columns, checks):
                df_column = df[[column_name]]
                if check is False:
                    msg = f"{column_name[0]} does not have the appropriate metadata."
                    columns.append(error_handler(df=df_column, errors=errors, msg=msg))
                else:
                    converted = _convert_usd(df=df_column, nxr=nxr_data)
                    columns.append(converted)
            return pd.concat(columns, axis=1)
    else:
        return error_handler(df=df, errors=errors)

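# Hedged usage sketch (editor's addition, not part of the original module):
# converting a peso-denominated dataset to US dollars. The dataset name
# "fiscal_balance" is hypothetical; any peso-denominated econuy dataset works.
#
# >>> from econuy.core import Pipeline
# >>> p = Pipeline()
# >>> p.get("fiscal_balance")  # hypothetical dataset name
# >>> in_usd = convert_usd(p.dataset, errors="coerce")
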
def _convert_usd(df: pd.DataFrame, nxr: Optional[pd.DataFrame] = None) -> pd.DataFrame:
    if nxr is None:
        from econuy.core import Pipeline

        pipeline = Pipeline()
        pipeline.get("nxr_monthly")
        nxr = pipeline.dataset

    inferred_freq = pd.infer_freq(df.index)
    if inferred_freq in ["D", "B", "C", "W", "W-SUN", None]:
        if df.columns.get_level_values("Tipo")[0] == "Flujo":
            df = df.resample("M").sum()
        else:
            df = df.resample("M").last()
        inferred_freq = pd.infer_freq(df.index)

    if df.columns.get_level_values("Tipo")[0] == "Stock":
        metadata._set(nxr, ts_type="Stock")
        nxr_freq = resample(nxr, rule=inferred_freq, operation="last").iloc[:, [1]]
    else:
        metadata._set(nxr, ts_type="Flujo")
        nxr_freq = resample(nxr, rule=inferred_freq, operation="mean").iloc[:, [0]]
        cum_periods = int(df.columns.get_level_values("Acum. períodos")[0])
        nxr_freq = rolling(nxr_freq, window=cum_periods, operation="mean")

    nxr_to_use = nxr_freq.reindex(df.index).iloc[:, 0]
    converted_df = df.div(nxr_to_use, axis=0)
    metadata._set(converted_df, currency="USD")
    return converted_df

def convert_real(
    df: pd.DataFrame,
    start_date: Union[str, datetime, None] = None,
    end_date: Union[str, datetime, None] = None,
    pipeline=None,
    errors: str = "raise",
) -> pd.DataFrame:
    """Convert to constant prices.

    See Also
    --------
    :meth:`~econuy.core.Pipeline.convert`.

    """
    if errors not in ["raise", "coerce", "ignore"]:
        raise ValueError("'errors' must be one of 'raise', 'coerce' or 'ignore'.")
    if "Inf. adj." not in df.columns.names:
        raise ValueError("Input dataframe's multiindex requires the 'Inf. adj.' level.")
    if pipeline is None:
        from econuy.core import Pipeline

        pipeline = Pipeline()

    checks = [
        x == "UYU" and "Const." not in y
        for x, y in zip(
            df.columns.get_level_values("Moneda"),
            df.columns.get_level_values("Inf. adj."),
        )
    ]
    if any(checks):
        if not all(checks) and errors == "raise":
            error_df = df.loc[:, [not check for check in checks]]
            msg = f"{error_df.columns[0][0]} does not have the appropriate metadata."
            return error_handler(df=df, errors=errors, msg=msg)
        pipeline.get(name="cpi")
        cpi_data = pipeline.dataset
        all_metadata = df.columns.droplevel("Indicador")
        if all(x == all_metadata[0] for x in all_metadata):
            return _convert_real(df=df, start_date=start_date, end_date=end_date, cpi=cpi_data)
        else:
            columns = []
            for column_name, check in zip(df.columns, checks):
                df_column = df[[column_name]]
                if check is False:
                    msg = f"{column_name[0]} does not have the appropriate metadata."
                    columns.append(error_handler(df=df_column, errors=errors, msg=msg))
                else:
                    converted = _convert_real(
                        df=df_column, start_date=start_date, end_date=end_date, cpi=cpi_data
                    )
                    columns.append(converted)
            return pd.concat(columns, axis=1)
    else:
        return error_handler(df=df, errors=errors)

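# Hedged usage sketch (editor's addition): deflating a nominal peso series to
# constant prices of a reference year. "wages" is a hypothetical dataset name.
#
# >>> from econuy.core import Pipeline
# >>> p = Pipeline()
# >>> p.get("wages")  # hypothetical dataset name
# >>> real = convert_real(p.dataset, start_date="2010-01-01",
# ...                     end_date="2010-12-31", errors="coerce")
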
def _convert_real(
    df: pd.DataFrame,
    start_date: Union[str, datetime, None] = None,
    end_date: Union[str, datetime, None] = None,
    cpi: Optional[pd.DataFrame] = None,
) -> pd.DataFrame:
    if cpi is None:
        from econuy.core import Pipeline

        pipeline = Pipeline()
        pipeline.get("cpi")
        cpi = pipeline.dataset

    inferred_freq = pd.infer_freq(df.index)
    if inferred_freq in ["D", "B", "C", "W", "W-SUN", None]:
        if df.columns.get_level_values("Tipo")[0] == "Flujo":
            df = df.resample("M").sum()
        else:
            df = df.resample("M").mean()
        inferred_freq = pd.infer_freq(df.index)

    metadata._set(cpi, ts_type="Flujo")
    cpi_freq = resample(cpi, rule=inferred_freq, operation="mean").iloc[:, [0]]
    cum_periods = int(df.columns.get_level_values("Acum. períodos")[0])
    cpi_to_use = rolling(cpi_freq, window=cum_periods, operation="mean").squeeze()

    if start_date is None:
        converted_df = df.div(cpi_to_use, axis=0)
        col_text = "Const."
    elif end_date is None:
        month = df.iloc[df.index.get_loc(start_date, method="nearest")].name
        converted_df = df.div(cpi_to_use, axis=0) * cpi_to_use.loc[month]
        m_start = datetime.strptime(start_date, "%Y-%m-%d").strftime("%Y-%m")
        col_text = f"Const. {m_start}"
    else:
        converted_df = df.div(cpi_to_use, axis=0) * cpi_to_use[start_date:end_date].mean()
        m_start = datetime.strptime(start_date, "%Y-%m-%d").strftime("%Y-%m")
        m_end = datetime.strptime(end_date, "%Y-%m-%d").strftime("%Y-%m")
        if m_start == m_end:
            col_text = f"Const. {m_start}"
        else:
            col_text = f"Const. {m_start}_{m_end}"

    converted_df = converted_df.reindex(df.index)
    metadata._set(converted_df, inf_adj=col_text)
    return converted_df

def convert_gdp(df: pd.DataFrame, pipeline=None, errors: str = "raise") -> pd.DataFrame:
    """Convert to percentage of GDP.

    See Also
    --------
    :meth:`~econuy.core.Pipeline.convert`.

    """
    if errors not in ["raise", "coerce", "ignore"]:
        raise ValueError("'errors' must be one of 'raise', 'coerce' or 'ignore'.")
    if any(x not in df.columns.names for x in ["Área", "Unidad"]):
        raise ValueError(
            "Input dataframe's multiindex requires the 'Área' and 'Unidad' levels."
        )
    if pipeline is None:
        from econuy.core import Pipeline

        pipeline = Pipeline()

    checks = [
        x not in ["Regional", "Global"] and "%PBI" not in y
        for x, y in zip(
            df.columns.get_level_values("Área"),
            df.columns.get_level_values("Unidad"),
        )
    ]
    if any(checks):
        if not all(checks) and errors == "raise":
            error_df = df.loc[:, [not check for check in checks]]
            msg = f"{error_df.columns[0][0]} does not have the appropriate metadata."
            return error_handler(df=df, errors=errors, msg=msg)
        pipeline.get(name="_lin_gdp")
        gdp_data = pipeline.dataset
        all_metadata = df.columns.droplevel("Indicador")
        if all(x == all_metadata[0] for x in all_metadata):
            return _convert_gdp(df=df, gdp=gdp_data)
        else:
            columns = []
            for column_name, check in zip(df.columns, checks):
                df_column = df[[column_name]]
                if check is False:
                    msg = f"{column_name[0]} does not have the appropriate metadata."
                    columns.append(error_handler(df=df_column, errors=errors, msg=msg))
                else:
                    converted = _convert_gdp(df=df_column, gdp=gdp_data)
                    columns.append(converted)
            return pd.concat(columns, axis=1)
    else:
        return error_handler(df=df, errors=errors)

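# Hedged usage sketch (editor's addition): expressing a flow series as a
# percentage of GDP. "fiscal_balance" is a hypothetical dataset name; the
# linearized GDP series ("_lin_gdp") is fetched internally.
#
# >>> from econuy.core import Pipeline
# >>> p = Pipeline()
# >>> p.get("fiscal_balance")  # hypothetical dataset name
# >>> as_gdp = convert_gdp(p.dataset, errors="coerce")
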
def _convert_gdp(df: pd.DataFrame, gdp: Optional[pd.DataFrame] = None) -> pd.DataFrame:
    if gdp is None:
        from econuy.core import Pipeline

        pipeline = Pipeline()
        pipeline.get("_lin_gdp")
        gdp = pipeline.dataset

    inferred_freq = pd.infer_freq(df.index)
    cum = int(df.columns.get_level_values("Acum. períodos")[0])
    if inferred_freq in ["M", "MS"]:
        gdp = resample(gdp, rule=inferred_freq, operation="upsample", interpolation="linear")
        if cum != 12 and df.columns.get_level_values("Tipo")[0] == "Flujo":
            converter = int(12 / cum)
            df = rolling(df, window=converter, operation="sum")
    elif inferred_freq in ["Q", "Q-DEC"]:
        gdp = gdp.resample(inferred_freq, convention="end").asfreq()
        if cum != 4 and df.columns.get_level_values("Tipo")[0] == "Flujo":
            converter = int(4 / cum)
            df = rolling(df, window=converter, operation="sum")
    elif inferred_freq in ["A", "A-DEC"]:
        gdp = gdp.resample(inferred_freq, convention="end").asfreq()
    elif inferred_freq in ["D", "B", "C", "W", "W-SUN", None]:
        if df.columns.get_level_values("Tipo")[0] == "Flujo":
            df = df.resample("M").sum()
        else:
            df = df.resample("M").mean()
        gdp = resample(gdp, rule="M", operation="upsample", interpolation="linear")
    else:
        raise ValueError(
            "Frequency of input dataframe not any of 'D', 'C', 'W', 'B', "
            "'M', 'MS', 'Q', 'Q-DEC', 'A' or 'A-DEC'."
        )

    if df.columns.get_level_values("Moneda")[0] == "USD":
        gdp = gdp.iloc[:, 1].to_frame()
    else:
        gdp = gdp.iloc[:, 0].to_frame()

    gdp_to_use = gdp.reindex(df.index).iloc[:, 0]
    converted_df = df.div(gdp_to_use, axis=0).multiply(100)
    metadata._set(converted_df, unit="% PBI")
    return converted_df

def resample(
    df: pd.DataFrame,
    rule: Union[pd.DateOffset, pd.Timedelta, str],
    operation: str = "sum",
    interpolation: str = "linear",
    warn: bool = False,
) -> pd.DataFrame:
    """
    Resample to target frequencies.

    See Also
    --------
    :meth:`~econuy.core.Pipeline.resample`.

    """
    if operation not in ["sum", "mean", "upsample", "last"]:
        raise ValueError("Invalid 'operation' option.")
    if "Acum. períodos" not in df.columns.names:
        raise ValueError("Input dataframe's multiindex requires the 'Acum. períodos' level.")

    all_metadata = df.columns.droplevel("Indicador")
    if all(x == all_metadata[0] for x in all_metadata):
        return _resample(
            df=df, rule=rule, operation=operation, interpolation=interpolation, warn=warn
        )
    else:
        columns = []
        for column_name in df.columns:
            df_column = df[[column_name]]
            converted = _resample(
                df=df_column,
                rule=rule,
                operation=operation,
                interpolation=interpolation,
                warn=warn,
            )
            columns.append(converted)
        return pd.concat(columns, axis=1)

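# Hedged usage sketch (editor's addition): downsampling the monthly CPI
# dataset (a name used elsewhere in this module) to quarterly averages.
#
# >>> from econuy.core import Pipeline
# >>> p = Pipeline()
# >>> p.get("cpi")
# >>> quarterly_cpi = resample(p.dataset, rule="Q-DEC", operation="mean")
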
def _resample(
    df: pd.DataFrame,
    rule: Union[pd.DateOffset, pd.Timedelta, str],
    operation: str = "sum",
    interpolation: str = "linear",
    warn: bool = False,
) -> pd.DataFrame:
    # Approximate number of periods per year for each pandas frequency alias,
    # used below to decide whether a resampling bin is complete.
    pd_frequencies = {
        "A": 1,
        "A-DEC": 1,
        "Q": 4,
        "Q-DEC": 4,
        "M": 12,
        "W": 52.143,
        "W-SUN": 52.143,
        "2W": 26.071,
        "2W-SUN": 26.071,
        "B": 240,
        "D": 365,
    }

    if operation == "sum":
        resampled_df = df.resample(rule).sum()
    elif operation == "mean":
        resampled_df = df.resample(rule).mean()
    elif operation == "last":
        resampled_df = df.resample(rule).last()
    else:
        # "upsample": carry the last observation into the new bins and fill
        # the gaps by interpolation.
        resampled_df = df.resample(rule).last()
        resampled_df = resampled_df.interpolate(method=interpolation)

    cum_periods = int(df.columns.get_level_values("Acum. períodos")[0])
    if cum_periods != 1:
        input_notna = df.iloc[:, 0].count()
        output_notna = resampled_df.iloc[:, 0].count()
        cum_adj = round(output_notna / input_notna)
        metadata._set(resampled_df, cumperiods=int(cum_periods * cum_adj))

    if operation in ["sum", "mean", "last"]:
        infer_base = pd.infer_freq(df.index)
        try:
            base_freq = pd_frequencies[infer_base]
            target_freq = pd_frequencies[rule]
            if target_freq < base_freq:
                # Mask bins built from fewer observations than a full period,
                # e.g. a partial year at the end of the sample.
                count = int(base_freq / target_freq)
                proc = df.resample(rule).count()
                antimask = np.where(proc >= count, False, True)
                resampled_df = resampled_df.mask(antimask, np.nan)
        except KeyError:
            if warn:
                warnings.warn(
                    "No bin trimming performed because frequencies "
                    "could not be assigned a numeric value",
                    UserWarning,
                )

    metadata._set(resampled_df)
    resampled_df = resampled_df.dropna(how="all")
    return resampled_df

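# Illustration of the bin-trimming step in _resample (editor's addition):
# when downsampling, bins with fewer observations than a full period are
# masked. With 18 monthly observations, the second year only covers 6 months
# and would be set to NaN rather than reported as a partial sum.
#
# >>> idx = pd.date_range("2019-01-31", periods=18, freq="M")
# >>> monthly = pd.DataFrame({"x": range(18)}, index=idx)
# >>> monthly.resample("A").count()  # 2019 -> 12 obs (kept), 2020 -> 6 (trimmed)
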
def rolling(
    df: pd.DataFrame, window: Optional[int] = None, operation: str = "sum"
) -> pd.DataFrame:
    """
    Calculate rolling averages or sums.

    See Also
    --------
    :meth:`~econuy.core.Pipeline.rolling`.

    """
    if operation not in ["sum", "mean"]:
        raise ValueError("Invalid 'operation' option.")
    if "Tipo" not in df.columns.names:
        raise ValueError("Input dataframe's multiindex requires the 'Tipo' level.")

    all_metadata = df.columns.droplevel("Indicador")
    if all(x == all_metadata[0] for x in all_metadata):
        return _rolling(df=df, window=window, operation=operation)
    else:
        columns = []
        for column_name in df.columns:
            df_column = df[[column_name]]
            converted = _rolling(df=df_column, window=window, operation=operation)
            columns.append(converted)
        return pd.concat(columns, axis=1)

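# Hedged usage sketch (editor's addition): a 12-period rolling mean of the
# monthly CPI dataset. Passing window=None instead would infer a one-year
# window from the dataframe's frequency.
#
# >>> from econuy.core import Pipeline
# >>> p = Pipeline()
# >>> p.get("cpi")
# >>> smooth = rolling(p.dataset, window=12, operation="mean")
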
def _rolling(
    df: pd.DataFrame, window: Optional[int] = None, operation: str = "sum"
) -> pd.DataFrame:
    # Periods per year for each pandas frequency alias, used to pick a
    # default window of one year when none is given.
    pd_frequencies = {
        "A": 1,
        "A-DEC": 1,
        "Q": 4,
        "Q-DEC": 4,
        "M": 12,
        "MS": 12,
        "W": 52,
        "W-SUN": 52,
        "2W": 26,
        "2W-SUN": 26,
        "B": 260,
        "D": 365,
    }

    window_operation = {
        "sum": lambda x: x.rolling(window=window, min_periods=window).sum(),
        "mean": lambda x: x.rolling(window=window, min_periods=window).mean(),
    }

    if df.columns.get_level_values("Tipo")[0] == "Stock":
        warnings.warn(
            "Rolling operations should not be calculated on stock variables",
            UserWarning,
        )

    if window is None:
        inferred_freq = pd.infer_freq(df.index)
        window = pd_frequencies[inferred_freq]

    rolling_df = df.apply(window_operation[operation])
    metadata._set(rolling_df, cumperiods=window)
    return rolling_df

def rebase(
    df: pd.DataFrame,
    start_date: Union[str, datetime],
    end_date: Union[str, datetime, None] = None,
    base: Union[int, float] = 100.0,
) -> pd.DataFrame:
    """
    Scale to a period or range of periods.

    See Also
    --------
    :meth:`~econuy.core.Pipeline.rebase`.

    """
    all_metadata = df.columns.droplevel("Indicador")
    if all(x == all_metadata[0] for x in all_metadata):
        return _rebase(df=df, start_date=start_date, end_date=end_date, base=base)
    else:
        columns = []
        for column_name in df.columns:
            df_column = df[[column_name]]
            converted = _rebase(
                df=df_column, start_date=start_date, end_date=end_date, base=base
            )
            columns.append(converted)
        return pd.concat(columns, axis=1)

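# Hedged usage sketch (editor's addition): rebasing the CPI dataset so that
# its 2010 average equals 100.
#
# >>> from econuy.core import Pipeline
# >>> p = Pipeline()
# >>> p.get("cpi")
# >>> rebased = rebase(p.dataset, start_date="2010-01-01",
# ...                  end_date="2010-12-31", base=100)
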
def _rebase(
    df: pd.DataFrame,
    start_date: Union[str, datetime],
    end_date: Union[str, datetime, None] = None,
    base: float = 100.0,
) -> pd.DataFrame:
    if end_date is None:
        start_date = df.iloc[df.index.get_loc(start_date, method="nearest")].name
        indexed = df.apply(lambda x: x / x.loc[start_date] * base)
        if isinstance(start_date, str):
            start_date = datetime.strptime(start_date, "%Y-%m-%d")
        if not isinstance(base, int) and base.is_integer():
            base = int(base)
        m_start = start_date.strftime("%Y-%m")
        metadata._set(indexed, unit=f"{m_start}={base}")
    else:
        indexed = df.apply(lambda x: x / x[start_date:end_date].mean() * base)
        if isinstance(start_date, str):
            start_date = datetime.strptime(start_date, "%Y-%m-%d")
        if isinstance(end_date, str):
            end_date = datetime.strptime(end_date, "%Y-%m-%d")
        m_start = start_date.strftime("%Y-%m")
        m_end = end_date.strftime("%Y-%m")
        if not isinstance(base, int) and base.is_integer():
            base = int(base)
        if m_start == m_end:
            metadata._set(indexed, unit=f"{m_start}={base}")
        else:
            metadata._set(indexed, unit=f"{m_start}_{m_end}={base}")
    return indexed


# The `_open_and_read` function needs to be monkey-patched to specify the
# encoding, or decomposition will fail on Windows.
def _new_open_and_read(fname):
    with open(fname, "r", encoding="utf8") as fin:
        fout = fin.read()
    return fout


x13._open_and_read = _new_open_and_read

def decompose(
    df: pd.DataFrame,
    component: str = "both",
    method: str = "x13",
    force_x13: bool = False,
    fallback: str = "loess",
    outlier: bool = True,
    trading: bool = True,
    x13_binary: Union[str, PathLike, None] = "search",
    search_parents: int = 0,
    ignore_warnings: bool = True,
    errors: str = "raise",
    **kwargs,
) -> Union[Dict[str, pd.DataFrame], pd.DataFrame]:
    """
    Apply seasonal decomposition.

    By default returns both trend and seasonally adjusted components,
    unlike the class method referred to below.

    See Also
    --------
    :meth:`~econuy.core.Pipeline.decompose`.

    """
    if errors not in ["raise", "coerce", "ignore"]:
        raise ValueError("'errors' must be one of 'raise', 'coerce' or 'ignore'.")
    if method not in ["x13", "loess", "ma"]:
        raise ValueError("method can only be 'x13', 'loess' or 'ma'.")
    if fallback not in ["loess", "ma"]:
        raise ValueError("fallback can only be 'loess' or 'ma'.")
    if component not in ["trend", "seas", "both"]:
        raise ValueError("component can only be 'trend', 'seas' or 'both'.")
    if "Seas. Adj." not in df.columns.names:
        raise ValueError("Input dataframe's multiindex requires the 'Seas. Adj.' level.")

    binary_path = None
    if method == "x13":
        if x13_binary == "search":
            binary_path = x13util._search_binary(
                start_path=getcwd(), n=search_parents, download_path=getcwd()
            )
        elif isinstance(x13_binary, str):
            binary_path = x13_binary
        elif isinstance(x13_binary, PathLike):
            binary_path = Path(x13_binary).as_posix()
        else:
            binary_path = None
        if isinstance(binary_path, str) and path.isfile(binary_path) is False:
            raise FileNotFoundError("X13 binary missing. Try using 'x13_binary=search'.")

    checks = [x not in ["Tendencia", "SA"] for x in df.columns.get_level_values("Seas. Adj.")]
    passing = df.loc[:, checks]
    not_passing = df.loc[:, [not x for x in checks]]
    if any(checks):
        if not all(checks) and errors == "raise":
            error_df = df.loc[:, [not check for check in checks]]
            msg = f"{error_df.columns[0][0]} does not have the appropriate metadata."
            return error_handler(df=df, errors=errors, msg=msg)
        passing_output = _decompose(
            passing,
            component=component,
            method=method,
            force_x13=force_x13,
            fallback=fallback,
            outlier=outlier,
            trading=trading,
            x13_binary=binary_path,
            ignore_warnings=ignore_warnings,
            errors=errors,
            **kwargs,
        )
        if not_passing.shape[1] != 0:
            not_passing_output = error_handler(df=not_passing, errors=errors)
        else:
            not_passing_output = not_passing
        if isinstance(passing_output, pd.DataFrame):
            output = pd.concat([passing_output, not_passing_output], axis=1)
            output = output[df.columns.get_level_values(0)]
            return output
        elif isinstance(passing_output, Dict):
            output = {}
            for name, data in passing_output.items():
                aux = pd.concat([data, not_passing_output], axis=1)
                output[name] = aux[df.columns.get_level_values(0)]
            return output
    else:
        return error_handler(df=df, errors=errors)

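# Hedged usage sketch (editor's addition): decomposing with the LOESS-based
# STL method, which avoids the X13 binary requirement. With component="both"
# the result is a dict holding the trend and seasonally adjusted frames.
#
# >>> from econuy.core import Pipeline
# >>> p = Pipeline()
# >>> p.get("cpi")
# >>> parts = decompose(p.dataset, component="both", method="loess")
# >>> trend, seas_adj = parts["trend"], parts["seas"]
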
def _decompose(
    df: pd.DataFrame,
    component: str = "both",
    method: str = "x13",
    force_x13: bool = False,
    fallback: str = "loess",
    outlier: bool = True,
    trading: bool = True,
    x13_binary: Union[str, PathLike, None] = None,
    ignore_warnings: bool = True,
    errors: str = "raise",
    **kwargs,
) -> Union[Tuple[pd.DataFrame, pd.DataFrame], pd.DataFrame]:
    if method not in ["x13", "loess", "ma"]:
        raise ValueError("method can only be 'x13', 'loess' or 'ma'.")
    if fallback not in ["loess", "ma"]:
        raise ValueError("fallback can only be 'loess' or 'ma'.")

    df_proc = df.copy()
    old_columns = df_proc.columns
    df_proc.columns = df_proc.columns.get_level_values(level=0)
    df_proc.index = pd.to_datetime(df_proc.index, errors="coerce")

    trends_array = []
    seas_adjs_array = []
    for col in df_proc.columns:
        col_df = df_proc[col].dropna()
        if method == "x13":
            try:
                with warnings.catch_warnings():
                    if ignore_warnings is True:
                        action = "ignore"
                    else:
                        action = "default"
                    warnings.filterwarnings(action=action, category=X13Warning)
                    results = x13a(
                        col_df,
                        outlier=outlier,
                        trading=trading,
                        x12path=x13_binary,
                        prefer_x13=True,
                        **kwargs,
                    )
                    trends = results.trend.reindex(df_proc.index).T
                    seas_adjs = results.seasadj.reindex(df_proc.index).T
            except X13Error:
                if force_x13 is True:
                    if outlier is True:
                        try:
                            warnings.warn(
                                "X13 error found with selected parameters. "
                                "Trying with outlier=False.",
                                UserWarning,
                            )
                            results = x13a(
                                col_df,
                                outlier=False,
                                trading=trading,
                                x12path=x13_binary,
                                prefer_x13=True,
                                **kwargs,
                            )
                            trends = results.trend.reindex(df_proc.index).T
                            seas_adjs = results.seasadj.reindex(df_proc.index).T
                        except X13Error:
                            try:
                                warnings.warn(
                                    "X13 error found with trading=True. "
                                    "Trying with trading=False.",
                                    UserWarning,
                                )
                                results = x13a(
                                    col_df,
                                    outlier=False,
                                    trading=False,
                                    x12path=x13_binary,
                                    prefer_x13=True,
                                    **kwargs,
                                )
                                trends = results.trend.reindex(df_proc.index).T
                                seas_adjs = results.seasadj.reindex(df_proc.index).T
                            except X13Error:
                                warnings.warn(
                                    "No combination of parameters successful. "
                                    "No decomposition performed.",
                                    UserWarning,
                                )
                                trends = error_handler(df=col_df, errors=errors)
                                seas_adjs = trends.copy()
                    elif trading is True:
                        try:
                            warnings.warn(
                                "X13 error found with trading=True. "
                                "Trying with trading=False...",
                                UserWarning,
                            )
                            results = x13a(
                                col_df,
                                trading=False,
                                x12path=x13_binary,
                                prefer_x13=True,
                                **kwargs,
                            )
                            trends = results.trend.reindex(df_proc.index).T
                            seas_adjs = results.seasadj.reindex(df_proc.index).T
                        except X13Error:
                            warnings.warn(
                                "No combination of parameters successful. "
                                "Filling with NaN.",
                                UserWarning,
                            )
                            trends = error_handler(df=col_df, errors=errors)
                            seas_adjs = trends.copy()
                else:
                    # Fall back to a non-X13 decomposition.
                    if fallback == "loess":
                        results = STL(col_df).fit()
                    else:
                        results = seasonal_decompose(col_df, extrapolate_trend="freq")
                    trends = results.trend.reindex(df_proc.index).T
                    seas_adjs = (results.observed - results.seasonal).reindex(df_proc.index).T
        else:
            if method == "loess":
                results = STL(col_df).fit()
            else:
                results = seasonal_decompose(col_df, extrapolate_trend="freq")
            trends = results.trend.reindex(df_proc.index).T
            seas_adjs = (results.observed - results.seasonal).reindex(df_proc.index).T

        trends_array.append(trends)
        seas_adjs_array.append(seas_adjs)

    trends = pd.concat(trends_array, axis=1)
    seas_adjs = pd.concat(seas_adjs_array, axis=1)
    trends.columns = old_columns
    seas_adjs.columns = old_columns
    metadata._set(trends, seas_adj="Tendencia")
    metadata._set(seas_adjs, seas_adj="SA")
    if component == "both":
        output = {"trend": trends, "seas": seas_adjs}
    elif component == "seas":
        output = seas_adjs
    elif component == "trend":
        output = trends
    return output

def chg_diff(df: pd.DataFrame, operation: str = "chg", period: str = "last") -> pd.DataFrame:
    """
    Calculate percent change or difference.

    See Also
    --------
    :meth:`~econuy.core.Pipeline.chg_diff`.

    """
    if operation not in ["chg", "diff"]:
        raise ValueError("Invalid 'operation' option.")
    if period not in ["last", "inter", "annual"]:
        raise ValueError("Invalid 'period' option.")
    if "Tipo" not in df.columns.names:
        raise ValueError("Input dataframe's multiindex requires the 'Tipo' level.")

    all_metadata = df.columns.droplevel("Indicador")
    if all(x == all_metadata[0] for x in all_metadata):
        return _chg_diff(df=df, operation=operation, period=period)
    else:
        columns = []
        for column_name in df.columns:
            df_column = df[[column_name]]
            converted = _chg_diff(df=df_column, operation=operation, period=period)
            columns.append(converted)
        return pd.concat(columns, axis=1)

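# Hedged usage sketch (editor's addition): year-on-year percent change of the
# monthly CPI dataset (period="inter" compares each observation against the
# same month of the previous year).
#
# >>> from econuy.core import Pipeline
# >>> p = Pipeline()
# >>> p.get("cpi")
# >>> yoy = chg_diff(p.dataset, operation="chg", period="inter")
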
def _chg_diff(df: pd.DataFrame, operation: str = "chg", period: str = "last") -> pd.DataFrame:
    inferred_freq = pd.infer_freq(df.index)
    # Number of periods in a year, used for interannual comparisons.
    if inferred_freq == "M":
        last_year = 12
    elif inferred_freq in ["Q", "Q-DEC"]:
        last_year = 4
    elif inferred_freq in ["A", "A-DEC"]:
        last_year = 1
    else:
        raise ValueError(
            "The dataframe needs to have a frequency of M "
            "(month end), Q (quarter end) or A (year end)"
        )

    type_change = {
        "last": {
            "chg": [lambda x: x.pct_change(periods=1), "% variación"],
            "diff": [lambda x: x.diff(periods=1), "Cambio"],
        },
        "inter": {
            "chg": [lambda x: x.pct_change(periods=last_year), "% variación interanual"],
            "diff": [lambda x: x.diff(periods=last_year), "Cambio interanual"],
        },
        "annual": {
            "chg": [lambda x: x.pct_change(periods=last_year), "% variación anual"],
            "diff": [lambda x: x.diff(periods=last_year), "Cambio anual"],
        },
    }

    if period == "annual":
        if df.columns.get_level_values("Tipo")[0] == "Stock":
            output = df.apply(type_change[period][operation][0])
        else:
            # Flows are first accumulated over a year before comparing.
            output = rolling(df, operation="sum")
            output = output.apply(type_change[period][operation][0])
    else:
        output = df.apply(type_change[period][operation][0])
    metadata._set(output, unit=type_change[period][operation][1])

    if operation == "chg":
        output = output.multiply(100)
    return output

def error_handler(df: pd.DataFrame, errors: str, msg: Optional[str] = None) -> pd.DataFrame:
    if errors == "coerce":
        return pd.DataFrame(data=np.nan, index=df.index, columns=df.columns)
    elif errors == "ignore":
        return df
    elif errors == "raise":
        if msg is None:
            msg = ""
        raise ValueError(msg)
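
# Illustration (editor's addition): with errors="coerce" the offending data
# is replaced by an all-NaN frame with the same index and columns, so it can
# still be concatenated with successfully transformed columns.
#
# >>> idx = pd.date_range("2020-01-31", periods=2, freq="M")
# >>> dummy = pd.DataFrame({"a": [1.0, 2.0]}, index=idx)
# >>> error_handler(dummy, errors="coerce")  # same shape, all NaN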