Source code for impyute.util.count_missing

""" impyute.util.count_missing.py """
import numpy as np
from impyute.util import find_null


[docs]def count_missing(data): """ Calculate the total percentage of missing values and also the percentage in each column. Parameters ---------- data: np.array Data to impute. Returns ------- dict Percentage of missing values in total and in each column. """ size = len(data.flatten()) null_xy = find_null(data) np.unique(null_xy) counter = {y: 0. for y in np.unique(null_xy.T[1])} change_in_percentage = 1./size for _, y in null_xy: counter[y] += change_in_percentage total_missing = len(null_xy)/size counter["total"] = total_missing return counter