import os, math, subprocess
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import pandas_profiling
# Pandas display settings so that wide / long frames are printed in full in the notebook.
pd.set_option('display.width', 2000)
pd.set_option('display.max_rows', 500)
pd.set_option('display.max_columns', 500)
pd.set_option('display.precision', 4)
# None disables truncation of cell text. The previous value -1 was deprecated in
# pandas 1.0 and is rejected by newer pandas releases (requires pandas >= 1.0).
pd.set_option('display.max_colwidth', None)
# Read the training applications CSV into a DataFrame.
pdf_data = pd.read_csv(filepath_or_buffer="data/application_train.csv")
# Print the (rows, columns) shape, then preview the first five rows as the cell output.
print(pdf_data.shape)
pdf_data.head(n=5)
(307511, 122)
SK_ID_CURR | TARGET | NAME_CONTRACT_TYPE | CODE_GENDER | FLAG_OWN_CAR | FLAG_OWN_REALTY | CNT_CHILDREN | AMT_INCOME_TOTAL | AMT_CREDIT | AMT_ANNUITY | AMT_GOODS_PRICE | NAME_TYPE_SUITE | NAME_INCOME_TYPE | NAME_EDUCATION_TYPE | NAME_FAMILY_STATUS | NAME_HOUSING_TYPE | REGION_POPULATION_RELATIVE | DAYS_BIRTH | DAYS_EMPLOYED | DAYS_REGISTRATION | DAYS_ID_PUBLISH | OWN_CAR_AGE | FLAG_MOBIL | FLAG_EMP_PHONE | FLAG_WORK_PHONE | FLAG_CONT_MOBILE | FLAG_PHONE | FLAG_EMAIL | OCCUPATION_TYPE | CNT_FAM_MEMBERS | REGION_RATING_CLIENT | REGION_RATING_CLIENT_W_CITY | WEEKDAY_APPR_PROCESS_START | HOUR_APPR_PROCESS_START | REG_REGION_NOT_LIVE_REGION | REG_REGION_NOT_WORK_REGION | LIVE_REGION_NOT_WORK_REGION | REG_CITY_NOT_LIVE_CITY | REG_CITY_NOT_WORK_CITY | LIVE_CITY_NOT_WORK_CITY | ORGANIZATION_TYPE | EXT_SOURCE_1 | EXT_SOURCE_2 | EXT_SOURCE_3 | APARTMENTS_AVG | BASEMENTAREA_AVG | YEARS_BEGINEXPLUATATION_AVG | YEARS_BUILD_AVG | COMMONAREA_AVG | ELEVATORS_AVG | ENTRANCES_AVG | FLOORSMAX_AVG | FLOORSMIN_AVG | LANDAREA_AVG | LIVINGAPARTMENTS_AVG | LIVINGAREA_AVG | NONLIVINGAPARTMENTS_AVG | NONLIVINGAREA_AVG | APARTMENTS_MODE | BASEMENTAREA_MODE | YEARS_BEGINEXPLUATATION_MODE | YEARS_BUILD_MODE | COMMONAREA_MODE | ELEVATORS_MODE | ENTRANCES_MODE | FLOORSMAX_MODE | FLOORSMIN_MODE | LANDAREA_MODE | LIVINGAPARTMENTS_MODE | LIVINGAREA_MODE | NONLIVINGAPARTMENTS_MODE | NONLIVINGAREA_MODE | APARTMENTS_MEDI | BASEMENTAREA_MEDI | YEARS_BEGINEXPLUATATION_MEDI | YEARS_BUILD_MEDI | COMMONAREA_MEDI | ELEVATORS_MEDI | ENTRANCES_MEDI | FLOORSMAX_MEDI | FLOORSMIN_MEDI | LANDAREA_MEDI | LIVINGAPARTMENTS_MEDI | LIVINGAREA_MEDI | NONLIVINGAPARTMENTS_MEDI | NONLIVINGAREA_MEDI | FONDKAPREMONT_MODE | HOUSETYPE_MODE | TOTALAREA_MODE | WALLSMATERIAL_MODE | EMERGENCYSTATE_MODE | OBS_30_CNT_SOCIAL_CIRCLE | DEF_30_CNT_SOCIAL_CIRCLE | OBS_60_CNT_SOCIAL_CIRCLE | DEF_60_CNT_SOCIAL_CIRCLE | DAYS_LAST_PHONE_CHANGE | FLAG_DOCUMENT_2 | FLAG_DOCUMENT_3 | FLAG_DOCUMENT_4 | FLAG_DOCUMENT_5 | FLAG_DOCUMENT_6 | 
FLAG_DOCUMENT_7 | FLAG_DOCUMENT_8 | FLAG_DOCUMENT_9 | FLAG_DOCUMENT_10 | FLAG_DOCUMENT_11 | FLAG_DOCUMENT_12 | FLAG_DOCUMENT_13 | FLAG_DOCUMENT_14 | FLAG_DOCUMENT_15 | FLAG_DOCUMENT_16 | FLAG_DOCUMENT_17 | FLAG_DOCUMENT_18 | FLAG_DOCUMENT_19 | FLAG_DOCUMENT_20 | FLAG_DOCUMENT_21 | AMT_REQ_CREDIT_BUREAU_HOUR | AMT_REQ_CREDIT_BUREAU_DAY | AMT_REQ_CREDIT_BUREAU_WEEK | AMT_REQ_CREDIT_BUREAU_MON | AMT_REQ_CREDIT_BUREAU_QRT | AMT_REQ_CREDIT_BUREAU_YEAR | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 100002 | 1 | Cash loans | M | N | Y | 0 | 202500.0 | 406597.5 | 24700.5 | 351000.0 | Unaccompanied | Working | Secondary / secondary special | Single / not married | House / apartment | 0.0188 | -9461 | -637 | -3648.0 | -2120 | NaN | 1 | 1 | 0 | 1 | 1 | 0 | Laborers | 1.0 | 2 | 2 | WEDNESDAY | 10 | 0 | 0 | 0 | 0 | 0 | 0 | Business Entity Type 3 | 0.0830 | 0.2629 | 0.1394 | 0.0247 | 0.0369 | 0.9722 | 0.6192 | 0.0143 | 0.00 | 0.0690 | 0.0833 | 0.1250 | 0.0369 | 0.0202 | 0.0190 | 0.0000 | 0.0000 | 0.0252 | 0.0383 | 0.9722 | 0.6341 | 0.0144 | 0.0000 | 0.0690 | 0.0833 | 0.1250 | 0.0377 | 0.022 | 0.0198 | 0.0 | 0.0 | 0.0250 | 0.0369 | 0.9722 | 0.6243 | 0.0144 | 0.00 | 0.0690 | 0.0833 | 0.1250 | 0.0375 | 0.0205 | 0.0193 | 0.0000 | 0.00 | reg oper account | block of flats | 0.0149 | Stone, brick | No | 2.0 | 2.0 | 2.0 | 2.0 | -1134.0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 1.0 |
1 | 100003 | 0 | Cash loans | F | N | N | 0 | 270000.0 | 1293502.5 | 35698.5 | 1129500.0 | Family | State servant | Higher education | Married | House / apartment | 0.0035 | -16765 | -1188 | -1186.0 | -291 | NaN | 1 | 1 | 0 | 1 | 1 | 0 | Core staff | 2.0 | 1 | 1 | MONDAY | 11 | 0 | 0 | 0 | 0 | 0 | 0 | School | 0.3113 | 0.6222 | NaN | 0.0959 | 0.0529 | 0.9851 | 0.7960 | 0.0605 | 0.08 | 0.0345 | 0.2917 | 0.3333 | 0.0130 | 0.0773 | 0.0549 | 0.0039 | 0.0098 | 0.0924 | 0.0538 | 0.9851 | 0.8040 | 0.0497 | 0.0806 | 0.0345 | 0.2917 | 0.3333 | 0.0128 | 0.079 | 0.0554 | 0.0 | 0.0 | 0.0968 | 0.0529 | 0.9851 | 0.7987 | 0.0608 | 0.08 | 0.0345 | 0.2917 | 0.3333 | 0.0132 | 0.0787 | 0.0558 | 0.0039 | 0.01 | reg oper account | block of flats | 0.0714 | Block | No | 1.0 | 0.0 | 1.0 | 0.0 | -828.0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
2 | 100004 | 0 | Revolving loans | M | Y | Y | 0 | 67500.0 | 135000.0 | 6750.0 | 135000.0 | Unaccompanied | Working | Secondary / secondary special | Single / not married | House / apartment | 0.0100 | -19046 | -225 | -4260.0 | -2531 | 26.0 | 1 | 1 | 1 | 1 | 1 | 0 | Laborers | 1.0 | 2 | 2 | MONDAY | 9 | 0 | 0 | 0 | 0 | 0 | 0 | Government | NaN | 0.5559 | 0.7296 | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | 0.0 | 0.0 | 0.0 | 0.0 | -815.0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
3 | 100006 | 0 | Cash loans | F | N | Y | 0 | 135000.0 | 312682.5 | 29686.5 | 297000.0 | Unaccompanied | Working | Secondary / secondary special | Civil marriage | House / apartment | 0.0080 | -19005 | -3039 | -9833.0 | -2437 | NaN | 1 | 1 | 0 | 1 | 0 | 0 | Laborers | 2.0 | 2 | 2 | WEDNESDAY | 17 | 0 | 0 | 0 | 0 | 0 | 0 | Business Entity Type 3 | NaN | 0.6504 | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | 2.0 | 0.0 | 2.0 | 0.0 | -617.0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | NaN | NaN | NaN | NaN | NaN | NaN |
4 | 100007 | 0 | Cash loans | M | N | Y | 0 | 121500.0 | 513000.0 | 21865.5 | 513000.0 | Unaccompanied | Working | Secondary / secondary special | Single / not married | House / apartment | 0.0287 | -19932 | -3038 | -4311.0 | -3458 | NaN | 1 | 1 | 0 | 1 | 0 | 0 | Core staff | 1.0 | 2 | 2 | THURSDAY | 11 | 0 | 0 | 0 | 0 | 1 | 1 | Religion | NaN | 0.3227 | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | NaN | 0.0 | 0.0 | 0.0 | 0.0 | -1106.0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 |
%%time
# IPython cell magic above: reports CPU and wall-clock time for the whole cell.
# Build a pandas_profiling report for the loaded DataFrame.
profile = pandas_profiling.ProfileReport(pdf_data)
# Bare expression as the last statement so the notebook displays the report as the cell output.
profile
CPU times: user 4min 2s, sys: 7.74 s, total: 4min 9s Wall time: 2min 59s
Dataset info
Number of variables | 122 |
---|---|
Number of observations | 307511 |
Total Missing (%) | 9.6% |
Total size in memory | 286.2 MiB |
Average record size in memory | 976.0 B |
Variables types
Numeric | 39 |
---|---|
Categorical | 16 |
Boolean | 33 |
Date | 0 |
Text (Unique) | 0 |
Rejected | 34 |
Unsupported | 0 |
Warnings
AMT_GOODS_PRICE is highly correlated with AMT_CREDIT (ρ = 0.98697) Rejected
AMT_INCOME_TOTAL is highly skewed (γ1 = 391.56) Skewed
AMT_REQ_CREDIT_BUREAU_DAY has 41519 / 13.5% missing values Missing
AMT_REQ_CREDIT_BUREAU_DAY is highly skewed (γ1 = 27.044) Skewed
AMT_REQ_CREDIT_BUREAU_DAY has 264503 / 86.0% zeros Zeros
AMT_REQ_CREDIT_BUREAU_HOUR has 41519 / 13.5% missing values Missing
AMT_REQ_CREDIT_BUREAU_HOUR has 264366 / 86.0% zeros Zeros
AMT_REQ_CREDIT_BUREAU_MON has 41519 / 13.5% missing values Missing
AMT_REQ_CREDIT_BUREAU_MON has 222233 / 72.3% zeros Zeros
AMT_REQ_CREDIT_BUREAU_QRT has 41519 / 13.5% missing values Missing
AMT_REQ_CREDIT_BUREAU_QRT is highly skewed (γ1 = 134.37) Skewed
AMT_REQ_CREDIT_BUREAU_QRT has 215417 / 70.1% zeros Zeros
AMT_REQ_CREDIT_BUREAU_WEEK has 41519 / 13.5% missing values Missing
AMT_REQ_CREDIT_BUREAU_WEEK has 257456 / 83.7% zeros Zeros
AMT_REQ_CREDIT_BUREAU_YEAR has 41519 / 13.5% missing values Missing
AMT_REQ_CREDIT_BUREAU_YEAR has 71801 / 23.3% zeros Zeros
APARTMENTS_AVG has 156061 / 50.7% missing values Missing
APARTMENTS_MEDI is highly correlated with LIVINGAPARTMENTS_MODE (ρ = 0.93217) Rejected
APARTMENTS_MODE is highly correlated with LIVINGAPARTMENTS_AVG (ρ = 0.90828) Rejected
BASEMENTAREA_AVG has 179943 / 58.5% missing values Missing
BASEMENTAREA_AVG has 14745 / 4.8% zeros Zeros
BASEMENTAREA_MEDI is highly correlated with BASEMENTAREA_MODE (ρ = 0.97794) Rejected
BASEMENTAREA_MODE is highly correlated with BASEMENTAREA_AVG (ρ = 0.9735) Rejected
CNT_CHILDREN has 215371 / 70.0% zeros Zeros
COMMONAREA_AVG has 214865 / 69.9% missing values Missing
COMMONAREA_AVG has 8442 / 2.7% zeros Zeros
COMMONAREA_MEDI is highly correlated with COMMONAREA_MODE (ρ = 0.97989) Rejected
COMMONAREA_MODE is highly correlated with COMMONAREA_AVG (ρ = 0.97715) Rejected
DAYS_LAST_PHONE_CHANGE has 37672 / 12.3% zeros Zeros
DEF_30_CNT_SOCIAL_CIRCLE has 271324 / 88.2% zeros Zeros
DEF_60_CNT_SOCIAL_CIRCLE has 280721 / 91.3% zeros Zeros
ELEVATORS_AVG has 163891 / 53.3% missing values Missing
ELEVATORS_AVG has 85718 / 27.9% zeros Zeros
ELEVATORS_MEDI is highly correlated with ELEVATORS_MODE (ρ = 0.98283) Rejected
ELEVATORS_MODE is highly correlated with ELEVATORS_AVG (ρ = 0.97884) Rejected
EMERGENCYSTATE_MODE has 145755 / 47.4% missing values Missing
ENTRANCES_AVG has 154828 / 50.3% missing values Missing
ENTRANCES_MEDI is highly correlated with ENTRANCES_MODE (ρ = 0.98068) Rejected
ENTRANCES_MODE is highly correlated with ENTRANCES_AVG (ρ = 0.97774) Rejected
EXT_SOURCE_1 has 173378 / 56.4% missing values Missing
EXT_SOURCE_3 has 60965 / 19.8% missing values Missing
FLOORSMAX_AVG has 153020 / 49.8% missing values Missing
FLOORSMAX_MEDI is highly correlated with FLOORSMAX_MODE (ρ = 0.98824) Rejected
FLOORSMAX_MODE is highly correlated with FLOORSMAX_AVG (ρ = 0.98569) Rejected
FLOORSMIN_AVG has 208642 / 67.8% missing values Missing
FLOORSMIN_MEDI is highly correlated with FLOORSMIN_MODE (ρ = 0.98841) Rejected
FLOORSMIN_MODE is highly correlated with FLOORSMIN_AVG (ρ = 0.98588) Rejected
FONDKAPREMONT_MODE has 210295 / 68.4% missing values Missing
HOUSETYPE_MODE has 154297 / 50.2% missing values Missing
LANDAREA_AVG has 182590 / 59.4% missing values Missing
LANDAREA_AVG has 15600 / 5.1% zeros Zeros
LANDAREA_MEDI is highly correlated with LANDAREA_MODE (ρ = 0.98084) Rejected
LANDAREA_MODE is highly correlated with LANDAREA_AVG (ρ = 0.9737) Rejected
LIVINGAPARTMENTS_AVG is highly correlated with APARTMENTS_AVG (ρ = 0.94395) Rejected
LIVINGAPARTMENTS_MEDI is highly correlated with APARTMENTS_MEDI (ρ = 0.94249) Rejected
LIVINGAPARTMENTS_MODE is highly correlated with APARTMENTS_MODE (ρ = 0.93776) Rejected
LIVINGAREA_AVG is highly correlated with APARTMENTS_AVG (ρ = 0.91362) Rejected
LIVINGAREA_MEDI is highly correlated with APARTMENTS_MEDI (ρ = 0.91595) Rejected
LIVINGAREA_MODE is highly correlated with APARTMENTS_MODE (ρ = 0.91038) Rejected
NONLIVINGAPARTMENTS_AVG has 213514 / 69.4% missing values Missing
NONLIVINGAPARTMENTS_AVG has 54549 / 17.7% zeros Zeros
NONLIVINGAPARTMENTS_MEDI is highly correlated with NONLIVINGAPARTMENTS_MODE (ρ = 0.97857) Rejected
NONLIVINGAPARTMENTS_MODE is highly correlated with NONLIVINGAPARTMENTS_AVG (ρ = 0.96937) Rejected
NONLIVINGAREA_AVG has 169682 / 55.2% missing values Missing
NONLIVINGAREA_AVG has 58735 / 19.1% zeros Zeros
NONLIVINGAREA_MEDI is highly correlated with NONLIVINGAREA_MODE (ρ = 0.97584) Rejected
NONLIVINGAREA_MODE is highly correlated with NONLIVINGAREA_AVG (ρ = 0.96609) Rejected
OBS_30_CNT_SOCIAL_CIRCLE has 163910 / 53.3% zeros Zeros
OBS_60_CNT_SOCIAL_CIRCLE is highly correlated with OBS_30_CNT_SOCIAL_CIRCLE (ρ = 0.99849) Rejected
OCCUPATION_TYPE has 96391 / 31.3% missing values Missing
ORGANIZATION_TYPE has a high cardinality: 58 distinct values Warning
OWN_CAR_AGE has 202929 / 66.0% missing values Missing
REGION_RATING_CLIENT_W_CITY is highly correlated with REGION_RATING_CLIENT (ρ = 0.95084) Rejected
TOTALAREA_MODE is highly correlated with LIVINGAREA_MEDI (ρ = 0.91936) Rejected
WALLSMATERIAL_MODE has 156341 / 50.8% missing values Missing
YEARS_BEGINEXPLUATATION_AVG has 150007 / 48.8% missing values Missing
YEARS_BEGINEXPLUATATION_MEDI is highly correlated with YEARS_BEGINEXPLUATATION_MODE (ρ = 0.96354) Rejected
YEARS_BEGINEXPLUATATION_MODE is highly correlated with YEARS_BEGINEXPLUATATION_AVG (ρ = 0.97189) Rejected
YEARS_BUILD_AVG has 204488 / 66.5% missing values Missing
YEARS_BUILD_MEDI is highly correlated with YEARS_BUILD_MODE (ρ = 0.98946) Rejected
YEARS_BUILD_MODE is highly correlated with YEARS_BUILD_AVG (ρ = 0.98944) Rejected
AMT_ANNUITY
Numeric
Distinct count | 13673 |
---|---|
Unique (%) | 4.4% |
Missing (%) | 0.0% |
Missing (n) | 12 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 27109 |
---|---|
Minimum | 1615.5 |
Maximum | 258030 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1615.5 |
---|---|
5-th percentile | 9000 |
Q1 | 16524 |
Median | 24903 |
Q3 | 34596 |
95-th percentile | 53325 |
Maximum | 258030 |
Range | 256410 |
Interquartile range | 18072 |
Descriptive statistics
Standard deviation | 14494 |
---|---|
Coef of variation | 0.53466 |
Kurtosis | 7.7073 |
Mean | 27109 |
MAD | 10975 |
Skewness | 1.5798 |
Sum | 8335900000 |
Variance | 210070000 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
9000.0 | 6385 | 2.1% | |
13500.0 | 5514 | 1.8% | |
6750.0 | 2279 | 0.7% | |
10125.0 | 2035 | 0.7% | |
37800.0 | 1602 | 0.5% | |
11250.0 | 1459 | 0.5% | |
26217.0 | 1453 | 0.5% | |
20250.0 | 1345 | 0.4% | |
12375.0 | 1339 | 0.4% | |
31653.0 | 1269 | 0.4% | |
Other values (13662) | 282819 | 92.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
1615.5 | 1 | 0.0% | |
1980.0 | 2 | 0.0% | |
1993.5 | 1 | 0.0% | |
2052.0 | 1 | 0.0% | |
2164.5 | 2 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
216589.5 | 1 | 0.0% | |
220297.5 | 1 | 0.0% | |
225000.0 | 23 | 0.0% | |
230161.5 | 1 | 0.0% | |
258025.5 | 1 | 0.0% |
AMT_CREDIT
Numeric
Distinct count | 5603 |
---|---|
Unique (%) | 1.8% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 599030 |
---|---|
Minimum | 45000 |
Maximum | 4050000 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 45000 |
---|---|
5-th percentile | 135000 |
Q1 | 270000 |
Median | 513530 |
Q3 | 808650 |
95-th percentile | 1350000 |
Maximum | 4050000 |
Range | 4005000 |
Interquartile range | 538650 |
Descriptive statistics
Standard deviation | 402490 |
---|---|
Coef of variation | 0.67191 |
Kurtosis | 1.934 |
Mean | 599030 |
MAD | 316580 |
Skewness | 1.2348 |
Sum | 184210000000 |
Variance | 162000000000 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
450000.0 | 9709 | 3.2% | |
675000.0 | 8877 | 2.9% | |
225000.0 | 8162 | 2.7% | |
180000.0 | 7342 | 2.4% | |
270000.0 | 7241 | 2.4% | |
900000.0 | 6246 | 2.0% | |
254700.0 | 4500 | 1.5% | |
545040.0 | 4437 | 1.4% | |
808650.0 | 4152 | 1.4% | |
135000.0 | 3660 | 1.2% | |
Other values (5593) | 243185 | 79.1% |
Minimum 5 values
Value | Count | Frequency (%) | |
45000.0 | 230 | 0.1% | |
47970.0 | 218 | 0.1% | |
48519.0 | 1 | 0.0% | |
49455.0 | 19 | 0.0% | |
49500.0 | 40 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
3860019.0 | 1 | 0.0% | |
3956274.0 | 1 | 0.0% | |
4027680.0 | 1 | 0.0% | |
4031032.5 | 1 | 0.0% | |
4050000.0 | 8 | 0.0% |
AMT_GOODS_PRICE
Highly correlated
This variable is highly correlated with AMT_CREDIT
and should be ignored for analysis
Correlation | 0.98697 |
---|
AMT_INCOME_TOTAL
Numeric
Distinct count | 2548 |
---|---|
Unique (%) | 0.8% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 168800 |
---|---|
Minimum | 25650 |
Maximum | 117000000 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 25650 |
---|---|
5-th percentile | 67500 |
Q1 | 112500 |
Median | 147150 |
Q3 | 202500 |
95-th percentile | 337500 |
Maximum | 117000000 |
Range | 116970000 |
Interquartile range | 90000 |
Descriptive statistics
Standard deviation | 237120 |
---|---|
Coef of variation | 1.4048 |
Kurtosis | 191790 |
Mean | 168800 |
MAD | 66226 |
Skewness | 391.56 |
Sum | 51907000000 |
Variance | 56227000000 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
135000.0 | 35750 | 11.6% | |
112500.0 | 31019 | 10.1% | |
157500.0 | 26556 | 8.6% | |
180000.0 | 24719 | 8.0% | |
90000.0 | 22483 | 7.3% | |
225000.0 | 20698 | 6.7% | |
202500.0 | 16341 | 5.3% | |
67500.0 | 11147 | 3.6% | |
270000.0 | 10827 | 3.5% | |
81000.0 | 6001 | 2.0% | |
Other values (2538) | 101970 | 33.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
25650.0 | 2 | 0.0% | |
26100.0 | 3 | 0.0% | |
26460.0 | 1 | 0.0% | |
26550.0 | 2 | 0.0% | |
27000.0 | 66 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
6750000.0 | 1 | 0.0% | |
9000000.0 | 1 | 0.0% | |
13500000.0 | 1 | 0.0% | |
18000090.0 | 1 | 0.0% | |
117000000.0 | 1 | 0.0% |
AMT_REQ_CREDIT_BUREAU_DAY
Numeric
Distinct count | 10 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 13.5% |
Missing (n) | 41519 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.0070002 |
---|---|
Minimum | 0 |
Maximum | 9 |
Zeros (%) | 86.0% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 0 |
95-th percentile | 0 |
Maximum | 9 |
Range | 9 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.11076 |
---|---|
Coef of variation | 15.822 |
Kurtosis | 1151.9 |
Mean | 0.0070002 |
MAD | 0.013922 |
Skewness | 27.044 |
Sum | 1862 |
Variance | 0.012267 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
0.0 | 264503 | 86.0% | |
1.0 | 1292 | 0.4% | |
2.0 | 106 | 0.0% | |
3.0 | 45 | 0.0% | |
4.0 | 26 | 0.0% | |
5.0 | 9 | 0.0% | |
6.0 | 8 | 0.0% | |
9.0 | 2 | 0.0% | |
8.0 | 1 | 0.0% | |
(Missing) | 41519 | 13.5% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 264503 | 86.0% | |
1.0 | 1292 | 0.4% | |
2.0 | 106 | 0.0% | |
3.0 | 45 | 0.0% | |
4.0 | 26 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
4.0 | 26 | 0.0% | |
5.0 | 9 | 0.0% | |
6.0 | 8 | 0.0% | |
8.0 | 1 | 0.0% | |
9.0 | 2 | 0.0% |
AMT_REQ_CREDIT_BUREAU_HOUR
Numeric
Distinct count | 6 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 13.5% |
Missing (n) | 41519 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.0064024 |
---|---|
Minimum | 0 |
Maximum | 4 |
Zeros (%) | 86.0% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 0 |
95-th percentile | 0 |
Maximum | 4 |
Range | 4 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.083849 |
---|---|
Coef of variation | 13.096 |
Kurtosis | 254.24 |
Mean | 0.0064024 |
MAD | 0.012727 |
Skewness | 14.534 |
Sum | 1703 |
Variance | 0.0070307 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
0.0 | 264366 | 86.0% | |
1.0 | 1560 | 0.5% | |
2.0 | 56 | 0.0% | |
3.0 | 9 | 0.0% | |
4.0 | 1 | 0.0% | |
(Missing) | 41519 | 13.5% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 264366 | 86.0% | |
1.0 | 1560 | 0.5% | |
2.0 | 56 | 0.0% | |
3.0 | 9 | 0.0% | |
4.0 | 1 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
0.0 | 264366 | 86.0% | |
1.0 | 1560 | 0.5% | |
2.0 | 56 | 0.0% | |
3.0 | 9 | 0.0% | |
4.0 | 1 | 0.0% |
AMT_REQ_CREDIT_BUREAU_MON
Numeric
Distinct count | 25 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 13.5% |
Missing (n) | 41519 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.2674 |
---|---|
Minimum | 0 |
Maximum | 27 |
Zeros (%) | 72.3% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 0 |
95-th percentile | 1 |
Maximum | 27 |
Range | 27 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.916 |
---|---|
Coef of variation | 3.4256 |
Kurtosis | 90.435 |
Mean | 0.2674 |
MAD | 0.44681 |
Skewness | 7.8048 |
Sum | 71125 |
Variance | 0.83906 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
0.0 | 222233 | 72.3% | |
1.0 | 33147 | 10.8% | |
2.0 | 5386 | 1.8% | |
3.0 | 1991 | 0.6% | |
4.0 | 1076 | 0.3% | |
5.0 | 602 | 0.2% | |
6.0 | 343 | 0.1% | |
7.0 | 298 | 0.1% | |
9.0 | 206 | 0.1% | |
8.0 | 185 | 0.1% | |
Other values (14) | 525 | 0.2% | |
(Missing) | 41519 | 13.5% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 222233 | 72.3% | |
1.0 | 33147 | 10.8% | |
2.0 | 5386 | 1.8% | |
3.0 | 1991 | 0.6% | |
4.0 | 1076 | 0.3% |
Maximum 5 values
Value | Count | Frequency (%) | |
19.0 | 3 | 0.0% | |
22.0 | 1 | 0.0% | |
23.0 | 1 | 0.0% | |
24.0 | 1 | 0.0% | |
27.0 | 1 | 0.0% |
AMT_REQ_CREDIT_BUREAU_QRT
Numeric
Distinct count | 12 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 13.5% |
Missing (n) | 41519 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.26547 |
---|---|
Minimum | 0 |
Maximum | 261 |
Zeros (%) | 70.1% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 0 |
95-th percentile | 2 |
Maximum | 261 |
Range | 261 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.79406 |
---|---|
Coef of variation | 2.9911 |
Kurtosis | 43707 |
Mean | 0.26547 |
MAD | 0.43 |
Skewness | 134.37 |
Sum | 70614 |
Variance | 0.63052 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
0.0 | 215417 | 70.1% | |
1.0 | 33862 | 11.0% | |
2.0 | 14412 | 4.7% | |
3.0 | 1717 | 0.6% | |
4.0 | 476 | 0.2% | |
5.0 | 64 | 0.0% | |
6.0 | 28 | 0.0% | |
7.0 | 7 | 0.0% | |
8.0 | 7 | 0.0% | |
19.0 | 1 | 0.0% | |
(Missing) | 41519 | 13.5% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 215417 | 70.1% | |
1.0 | 33862 | 11.0% | |
2.0 | 14412 | 4.7% | |
3.0 | 1717 | 0.6% | |
4.0 | 476 | 0.2% |
Maximum 5 values
Value | Count | Frequency (%) | |
6.0 | 28 | 0.0% | |
7.0 | 7 | 0.0% | |
8.0 | 7 | 0.0% | |
19.0 | 1 | 0.0% | |
261.0 | 1 | 0.0% |
AMT_REQ_CREDIT_BUREAU_WEEK
Numeric
Distinct count | 10 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 13.5% |
Missing (n) | 41519 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.034362 |
---|---|
Minimum | 0 |
Maximum | 8 |
Zeros (%) | 83.7% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 0 |
95-th percentile | 0 |
Maximum | 8 |
Range | 8 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.20468 |
---|---|
Coef of variation | 5.9567 |
Kurtosis | 166.75 |
Mean | 0.034362 |
MAD | 0.066518 |
Skewness | 9.2936 |
Sum | 9140 |
Variance | 0.041896 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
0.0 | 257456 | 83.7% | |
1.0 | 8208 | 2.7% | |
2.0 | 199 | 0.1% | |
3.0 | 58 | 0.0% | |
4.0 | 34 | 0.0% | |
6.0 | 20 | 0.0% | |
5.0 | 10 | 0.0% | |
8.0 | 5 | 0.0% | |
7.0 | 2 | 0.0% | |
(Missing) | 41519 | 13.5% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 257456 | 83.7% | |
1.0 | 8208 | 2.7% | |
2.0 | 199 | 0.1% | |
3.0 | 58 | 0.0% | |
4.0 | 34 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
4.0 | 34 | 0.0% | |
5.0 | 10 | 0.0% | |
6.0 | 20 | 0.0% | |
7.0 | 2 | 0.0% | |
8.0 | 5 | 0.0% |
AMT_REQ_CREDIT_BUREAU_YEAR
Numeric
Distinct count | 26 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 13.5% |
Missing (n) | 41519 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.9 |
---|---|
Minimum | 0 |
Maximum | 25 |
Zeros (%) | 23.3% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 1 |
Q3 | 3 |
95-th percentile | 6 |
Maximum | 25 |
Range | 25 |
Interquartile range | 3 |
Descriptive statistics
Standard deviation | 1.8693 |
---|---|
Coef of variation | 0.98385 |
Kurtosis | 1.969 |
Mean | 1.9 |
MAD | 1.4548 |
Skewness | 1.2436 |
Sum | 505380 |
Variance | 3.4943 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
0.0 | 71801 | 23.3% | |
1.0 | 63405 | 20.6% | |
2.0 | 50192 | 16.3% | |
3.0 | 33628 | 10.9% | |
4.0 | 20714 | 6.7% | |
5.0 | 12052 | 3.9% | |
6.0 | 6967 | 2.3% | |
7.0 | 3869 | 1.3% | |
8.0 | 2127 | 0.7% | |
9.0 | 1096 | 0.4% | |
Other values (15) | 141 | 0.0% | |
(Missing) | 41519 | 13.5% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 71801 | 23.3% | |
1.0 | 63405 | 20.6% | |
2.0 | 50192 | 16.3% | |
3.0 | 33628 | 10.9% | |
4.0 | 20714 | 6.7% |
Maximum 5 values
Value | Count | Frequency (%) | |
20.0 | 1 | 0.0% | |
21.0 | 1 | 0.0% | |
22.0 | 1 | 0.0% | |
23.0 | 1 | 0.0% | |
25.0 | 1 | 0.0% |
APARTMENTS_AVG
Numeric
Distinct count | 2340 |
---|---|
Unique (%) | 0.8% |
Missing (%) | 50.7% |
Missing (n) | 156061 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.11744 |
---|---|
Minimum | 0 |
Maximum | 1 |
Zeros (%) | 0.2% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0.0082 |
Q1 | 0.0577 |
Median | 0.0876 |
Q3 | 0.1485 |
95-th percentile | 0.3268 |
Maximum | 1 |
Range | 1 |
Interquartile range | 0.0908 |
Descriptive statistics
Standard deviation | 0.10824 |
---|---|
Coef of variation | 0.92166 |
Kurtosis | 11.394 |
Mean | 0.11744 |
MAD | 0.073286 |
Skewness | 2.6418 |
Sum | 17786 |
Variance | 0.011716 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
0.0825 | 6663 | 2.2% | |
0.0619 | 6332 | 2.1% | |
0.0928 | 4404 | 1.4% | |
0.0722 | 3986 | 1.3% | |
0.0082 | 3507 | 1.1% | |
0.0165 | 3027 | 1.0% | |
0.1031 | 2892 | 0.9% | |
0.1485 | 2769 | 0.9% | |
0.0124 | 2721 | 0.9% | |
0.0742 | 2231 | 0.7% | |
Other values (2329) | 112918 | 36.7% | |
(Missing) | 156061 | 50.7% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 751 | 0.2% | |
0.001 | 197 | 0.1% | |
0.0014 | 1 | 0.0% | |
0.0015 | 6 | 0.0% | |
0.0017 | 1 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
0.9814 | 9 | 0.0% | |
0.9876 | 7 | 0.0% | |
0.9897 | 1 | 0.0% | |
0.9907 | 2 | 0.0% | |
1.0 | 147 | 0.0% |
APARTMENTS_MEDI
Highly correlated
This variable is highly correlated with LIVINGAPARTMENTS_MODE
and should be ignored for analysis
Correlation | 0.93217 |
---|
APARTMENTS_MODE
Highly correlated
This variable is highly correlated with LIVINGAPARTMENTS_AVG
and should be ignored for analysis
Correlation | 0.90828 |
---|
BASEMENTAREA_AVG
Numeric
Distinct count | 3781 |
---|---|
Unique (%) | 1.2% |
Missing (%) | 58.5% |
Missing (n) | 179943 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.088442 |
---|---|
Minimum | 0 |
Maximum | 1 |
Zeros (%) | 4.8% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0.0442 |
Median | 0.0763 |
Q3 | 0.1122 |
95-th percentile | 0.2237 |
Maximum | 1 |
Range | 1 |
Interquartile range | 0.068 |
Descriptive statistics
Standard deviation | 0.082438 |
---|---|
Coef of variation | 0.93211 |
Kurtosis | 25.93 |
Mean | 0.088442 |
MAD | 0.052361 |
Skewness | 3.5663 |
Sum | 11282 |
Variance | 0.0067961 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
0.0 | 14745 | 4.8% | |
0.0545 | 251 | 0.1% | |
0.0818 | 251 | 0.1% | |
0.0727 | 248 | 0.1% | |
0.1091 | 246 | 0.1% | |
0.0796 | 245 | 0.1% | |
0.08 | 239 | 0.1% | |
0.0805 | 230 | 0.1% | |
0.0764 | 220 | 0.1% | |
0.0793 | 211 | 0.1% | |
Other values (3770) | 110682 | 36.0% | |
(Missing) | 179943 | 58.5% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 14745 | 4.8% | |
0.0001 | 99 | 0.0% | |
0.0002 | 38 | 0.0% | |
0.0003 | 8 | 0.0% | |
0.0004 | 33 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
0.9677 | 1 | 0.0% | |
0.9682 | 1 | 0.0% | |
0.9694 | 2 | 0.0% | |
0.9945 | 1 | 0.0% | |
1.0 | 130 | 0.0% |
BASEMENTAREA_MEDI
Highly correlated
This variable is highly correlated with BASEMENTAREA_MODE
and should be ignored for analysis
Correlation | 0.97794 |
---|
BASEMENTAREA_MODE
Highly correlated
This variable is highly correlated with BASEMENTAREA_AVG
and should be ignored for analysis
Correlation | 0.9735 |
---|
CNT_CHILDREN
Numeric
Distinct count | 15 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.41705 |
---|---|
Minimum | 0 |
Maximum | 19 |
Zeros (%) | 70.0% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 1 |
95-th percentile | 2 |
Maximum | 19 |
Range | 19 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.72212 |
---|---|
Coef of variation | 1.7315 |
Kurtosis | 7.9041 |
Mean | 0.41705 |
MAD | 0.58418 |
Skewness | 1.9746 |
Sum | 128248 |
Variance | 0.52146 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
0 | 215371 | 70.0% | |
1 | 61119 | 19.9% | |
2 | 26749 | 8.7% | |
3 | 3717 | 1.2% | |
4 | 429 | 0.1% | |
5 | 84 | 0.0% | |
6 | 21 | 0.0% | |
7 | 7 | 0.0% | |
14 | 3 | 0.0% | |
19 | 2 | 0.0% | |
Other values (5) | 9 | 0.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
0 | 215371 | 70.0% | |
1 | 61119 | 19.9% | |
2 | 26749 | 8.7% | |
3 | 3717 | 1.2% | |
4 | 429 | 0.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
10 | 2 | 0.0% | |
11 | 1 | 0.0% | |
12 | 2 | 0.0% | |
14 | 3 | 0.0% | |
19 | 2 | 0.0% |
CNT_FAM_MEMBERS
Numeric
Distinct count | 18 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 0.0% |
Missing (n) | 2 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 2.1527 |
---|---|
Minimum | 1 |
Maximum | 20 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 2 |
Median | 2 |
Q3 | 3 |
95-th percentile | 4 |
Maximum | 20 |
Range | 19 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.91068 |
---|---|
Coef of variation | 0.42305 |
Kurtosis | 2.802 |
Mean | 2.1527 |
MAD | 0.66587 |
Skewness | 0.98754 |
Sum | 661960 |
Variance | 0.82934 |
Memory size | 2.3 MiB |
Value | Count | Frequency (%) | |
2.0 | 158357 | 51.5% | |
1.0 | 67847 | 22.1% | |
3.0 | 52601 | 17.1% | |
4.0 | 24697 | 8.0% | |
5.0 | 3478 | 1.1% | |
6.0 | 408 | 0.1% | |
7.0 | 81 | 0.0% | |
8.0 | 20 | 0.0% | |
9.0 | 6 | 0.0% | |
10.0 | 3 | 0.0% | |
Other values (7) | 11 | 0.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 67847 | 22.1% | |
2.0 | 158357 | 51.5% | |
3.0 | 52601 | 17.1% | |
4.0 | 24697 | 8.0% | |
5.0 | 3478 | 1.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
13.0 | 1 | 0.0% | |
14.0 | 2 | 0.0% | |
15.0 | 1 | 0.0% | |
16.0 | 2 | 0.0% | |
20.0 | 2 | 0.0% |
CODE_GENDER
Categorical
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 0.0% |
Missing (n) | 0 |
F | |
---|---|
M | |
XNA | 4 |
Value | Count | Frequency (%) | |
F | 202448 | 65.8% | |
M | 105059 | 34.2% | |
XNA | 4 | 0.0% |
COMMONAREA_AVG
Numeric
Distinct count | 3182 |
---|---|
Unique (%) | 1.0% |
Missing (%) | 69.9% |
Missing (n) | 214865 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.044621 |
---|---|
Minimum | 0 |
Maximum | 1 |
Zeros (%) | 2.7% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0.0078 |
Median | 0.0211 |
Q3 | 0.0515 |
95-th percentile | 0.1601 |
Maximum | 1 |
Range | 1 |
Interquartile range | 0.0437 |
Descriptive statistics
Standard deviation | 0.076036 |
---|---|
Coef of variation | 1.704 |
Kurtosis | 45.988 |
Mean | 0.044621 |
MAD | 0.042024 |
Skewness | 5.4573 |
Sum | 4133.9 |
Variance | 0.0057814 |
Memory size | 2.3 MiB |