import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
import matplotlib.ticker as ticker
import os
from sklearn import datasets
%matplotlib inline
# Notebook display configuration.
# `display` and `HTML` come from the public IPython.display module; importing
# `display` from IPython.core.display is deprecated.
from IPython.display import display, HTML

# Do not truncate the column list when a DataFrame is rendered.
pd.options.display.max_columns = None
# Inject CSS so the notebook container spans the full page width.
display(HTML("<style>.container { width:100% !important; }</style>"))
# Render floats with three decimal places.
pd.set_option('display.float_format', lambda x: '%.3f' % x)
# Default figure size for every matplotlib figure created afterwards.
plt.rcParams['figure.figsize'] = 10, 10
import missingno as msno
import pandas_profiling
# Path of the survey extract, relative to the current working directory.
CSV_PATH = os.path.join('data', 'immigration', 'mig161.csv')
# 8888 and 9999 are read as missing values.
# low_memory=False makes pandas infer each column's dtype from the whole file
# rather than chunk by chunk, which is what triggers the mixed-type
# DtypeWarning on this file.
mig_df = pd.read_csv(
    CSV_PATH,
    encoding='latin1',
    na_values=[8888, 9999],
    low_memory=False,
)
C:\Users\mattt\Anaconda3\envs\py36\lib\site-packages\IPython\core\interactiveshell.py:2728: DtypeWarning: Columns (14,15,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,33,42,53,54,55,56,57,58,59,288,289,290,291,294,295,297,298,299,300,303,304,307,308,309,310,313,314,317,318,319,320,323,324,327,328,329,330,333,334,337,338,339,340,343,344,347,348,349,350,353,354,357,358,359,360,363,364,365,366,367,368,369,370,371,372,373,374,375,376,377,378,379,380,381,382,383,384,385,386,387,388,389,390,391,392,393,394,395,396,397,398,399,400,401,402,403,404,405,406,407,408,409,410,411,412,413,414,415,416,417,418,419,420,421,422,423,424,433,434,435,436,439,440,441,442,447,450,451,453,454,455,456,464,465,466,467,468,469,470,471,472,473,474,475,476,478,479,480,500,501,502,503,507,508,509) have mixed types. Specify dtype option on import or set low_memory=False. interactivity=interactivity, compiler=compiler, result=result)
mig_df.head()
country | commun | surveypl | surveyyr | hhnum | weight | sex | yrborn | age | placebrn | statebrn | marstat | edyrs | occ | hhincome | ldowage | @by | height | kgs | smokes | smoked | smokeage | health | healthly | healthnw | hyperten | sugar | heart | brain | lung | nerves | cancer | usyr1 | usmar1 | usdur1 | usdoc1 | usplace1 | usstate1 | usocc1 | uswage1 | usby1 | usyrl | usmarl | usdurl | usdocl | usplacel | usstatel | usoccl | uswagel | usbyl | uscurtrp | ustrips | usexp | ushealth | mxhealth | legyrapp | legyrrec | legspon | cityrapp | cityrrec | dacaapp | dacarec | crsyr1 | crspl1 | crsst1 | crshow1 | crscoy1 | crscst1 | crspay1 | crsdep1 | crsyes1 | crsyr2 | crspl2 | crsst2 | crshow2 | crscoy2 | crscst2 | crspay2 | crsdep2 | crsyes2 | crsyr3 | crspl3 | crsst3 | crshow3 | crscoy3 | crscst3 | crspay3 | crsdep3 | crsyes3 | crsyr4 | crspl4 | crsst4 | crshow4 | crscoy4 | crscst4 | crspay4 | crsdep4 | crsyes4 | crsyr5 | crspl5 | crsst5 | crshow5 | crscoy5 | crscst5 | crspay5 | crsdep5 | crsyes5 | crsyr6 | crspl6 | crsst6 | crshow6 | crscoy6 | crscst6 | crspay6 | crsdep6 | crsyes6 | crsyr7 | crspl7 | crsst7 | crshow7 | crscoy7 | crscst7 | crspay7 | crsdep7 | crsyes7 | crsyr8 | crspl8 | crsst8 | crshow8 | crscoy8 | crscst8 | crspay8 | crsdep8 | crsyes8 | crsyr9 | crspl9 | crsst9 | crshow9 | crscoy9 | crscst9 | crspay9 | crsdep9 | crsyes9 | crsyr10 | crspl10 | crsst10 | crshow10 | crscoy10 | crscst10 | crspay10 | crsdep10 | crsyes10 | crsyr11 | crspl11 | crsst11 | crshow11 | crscoy11 | crscst11 | crspay11 | crsdep11 | crsyes11 | crsyr12 | crspl12 | crsst12 | crshow12 | crscoy12 | crscst12 | crspay12 | crsdep12 | crsyes12 | crsyr13 | crspl13 | crsst13 | crshow13 | crscoy13 | crscst13 | crspay13 | crsdep13 | crsyes13 | crsyr14 | crspl14 | crsst14 | crshow14 | crscoy14 | crscst14 | crspay14 | crsdep14 | crsyes14 | crsyr15 | crspl15 | crsst15 | crshow15 | crscoy15 | crscst15 | crspay15 | crsdep15 | crsyes15 | crsyr16 | crspl16 | crsst16 | crshow16 | crscoy16 | crscst16 
| crspay16 | crsdep16 | crsyes16 | crsyr17 | crspl17 | crsst17 | crshow17 | crscoy17 | crscst17 | crspay17 | crsdep17 | crsyes17 | crsyr18 | crspl18 | crsst18 | crshow18 | crscoy18 | crscst18 | crspay18 | crsdep18 | crsyes18 | crsyr19 | crspl19 | crsst19 | crshow19 | crscoy19 | crscst19 | crspay19 | crsdep19 | crsyes19 | crsyr20 | crspl20 | crsst20 | crshow20 | crscoy20 | crscst20 | crspay20 | crsdep20 | crsyes20 | crsyr21 | crspl21 | crsst21 | crshow21 | crscoy21 | crscst21 | crspay21 | crsdep21 | crsyes21 | crsyr22 | crspl22 | crsst22 | crshow22 | crscoy22 | crscst22 | crspay22 | crsdep22 | crsyes22 | crsyr23 | crspl23 | crsst23 | crshow23 | crscoy23 | crscst23 | crspay23 | crsdep23 | crsyes23 | crsyr24 | crspl24 | crsst24 | crshow24 | crscoy24 | crscst24 | crspay24 | crsdep24 | crsyes24 | crsyr25 | crspl25 | crsst25 | crshow25 | crscoy25 | crscst25 | crspay25 | crsdep25 | crsyes25 | momgyr | mogree | moyrgr | modoc | modoyr | molive | mousnw | mouspl | mousst | famgyr | fagree | fayrgr | fadoc | fadoyr | falive | fausnw | fauspl | fausst | sbsex1 | sbmgyr1 | sbgree1 | sbyrgr1 | sbdoc1 | sbdoyr1 | sblive1 | sbusnw1 | sbuspl1 | sbusst1 | sbsex2 | sbmgyr2 | sbgree2 | sbyrgr2 | sbdoc2 | sbdoyr2 | sblive2 | sbusnw2 | sbuspl2 | sbusst2 | sbsex3 | sbmgyr3 | sbgree3 | sbyrgr3 | sbdoc3 | sbdoyr3 | sblive3 | sbusnw3 | sbuspl3 | sbusst3 | sbsex4 | sbmgyr4 | sbgree4 | sbyrgr4 | sbdoc4 | sbdoyr4 | sblive4 | sbusnw4 | sbuspl4 | sbusst4 | sbsex5 | sbmgyr5 | sbgree5 | sbyrgr5 | sbdoc5 | sbdoyr5 | sblive5 | sbusnw5 | sbuspl5 | sbusst5 | sbsex6 | sbmgyr6 | sbgree6 | sbyrgr6 | sbdoc6 | sbdoyr6 | sblive6 | sbusnw6 | sbuspl6 | sbusst6 | sbsex7 | sbmgyr7 | sbgree7 | sbyrgr7 | sbdoc7 | sbdoyr7 | sblive7 | sbusnw7 | sbuspl7 | sbusst7 | sbsex8 | sbmgyr8 | sbgree8 | sbyrgr8 | sbdoc8 | sbdoyr8 | sblive8 | sbusnw8 | sbuspl8 | sbusst8 | sbsex9 | sbmgyr9 | sbgree9 | sbyrgr9 | sbdoc9 | sbdoyr9 | sblive9 | sbusnw9 | sbuspl9 | sbusst9 | sbsex10 | sbmgyr10 | sbgree10 | sbyrgr10 | sbdoc10 | 
sbdoyr10 | sblive10 | sbusnw10 | sbuspl10 | sbusst10 | sbsex11 | sbmgyr11 | sbgree11 | sbyrgr11 | sbdoc11 | sbdoyr11 | sblive11 | sbusnw11 | sbuspl11 | sbusst11 | sbsex12 | sbmgyr12 | sbgree12 | sbyrgr12 | sbdoc12 | sbdoyr12 | sblive12 | sbusnw12 | sbuspl12 | sbusst12 | uncinus | uncevus | coinus | coevus | neinus | neevus | sbilinus | sbilevus | chilinus | chilevus | pilinus | pilevus | frinus | frevus | reltrip1 | reltrip | paistp1 | paistrip | sport | social | chicanos | blacks | asians | anglos | latinos | lodging1 | lodging | english | enghome | engwork | engfrnd | engneig | howjob | hrwage | hrweek | monsyr | howpaid | sstax | fedtx | rowner | rsuper | howjobs | hrwages | hrweeks | monsyrs | howpaids | sstaxs | fedtxs | rowners | rsupers | finhelp1 | finhelp | bankacct | card | taxes | consular | rent | food | remit | remit1 | remit2 | remit3 | remit4 | remit5 | savings | savretrn | savings1 | savings2 | savings3 | savings4 | savings5 | schools | unemp | foodst | welfare | afdc | wic | ssi | general | doctor | hospital | hlthpmt1 | hlthpmt2 | hlthpmt3 | hlthpmt4 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
---|---|---|---|---|---|---|---|---|---|---|
0 | 1 | 1 | 1 | 1987 | 3 | 3.900 | 1 | 1942.000 | 45.000 | 0.000 | 11.000 | 2.000 | 0.000 | 529.000 | NaN | nan | 1977.000 | 12.000 | nan | 7320.000 | 105 | 529.000 | nan | nan | 1977.000 | 12.000 | nan | 7320.000 | 105 | 529.000 | nan | nan | 2 | 1.000 | 12.000 | NaN | 1977.000 | nan | nan | nan | nan | nan | nan | nan | 1.000 | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | NaN | NaN | NaN | NaN | nan | nan | nan | nan | nan | nan | NaN | NaN | nan | nan | nan | nan | nan | nan | nan 
| nan | NaN | NaN | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | ||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||
1 | 1 | 1 | 1 | 1987 | 9 | 3.900 | 1 | 1933.000 | 54.000 | 0.000 | 11.000 | 2.000 | 0.000 | 410.000 | NaN | nan | 1952.000 | 12.000 | 2.000 | nan | 103 | 410.000 | 0.300 | 1.000 | 1954.000 | 3.000 | 8.000 | nan | 105 | 410.000 | 0.370 | 1.000 | 2 | 2.000 | 15.000 | NaN | 1954.000 | nan | nan | nan | nan | nan | nan | nan | 1.000 | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 2.000 | 1.000 | 2.000 | 2.000 | 2.000 | 2.000 | 2.000 | 1.000 | 3.000 | 0.000 | 6.000 | 0.370 | 40.000 | nan | 
1.000 | 2.000 | 2.000 | 3.000 | 2.000 | 0.000 | 0.000 | 0.000 | nan | nan | nan | nan | nan | 0.000 | 40.000 | 11.000 | nan | nan | nan | nan | 2.000 | 2.000 | 2.000 | 2.000 | 2.000 | 2.000 | nan | ||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||
2 | 1 | 1 | 1 | 1987 | 12 | 3.900 | 1 | 1943.000 | 44.000 | 0.000 | 11.000 | 2.000 | 4.000 | 549.000 | NaN | nan | 1962.000 | 2.000 | 2.000 | 8735.000 | 105 | 410.000 | 1.000 | 1.000 | 1962.000 | 2.000 | 2.000 | 8735.000 | 105 | 410.000 | 1.000 | 1.000 | 2 | 1.000 | 2.000 | NaN | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 2 | 2.000 | 1 | 1.000 | 2.000 | 2.000 | 1.000 | 2.000 | 2.000 | 2.000 | 3 | 3.000 | 0.000 | nan | 1.000 | 
55.000 | 2.000 | 1.000 | 1.000 | nan | 3 | 3.000 | 2.000 | nan | nan | 80.000 | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | 2.000 | 2.000 | 2.000 | 2.000 | 2.000 | 2.000 | nan | ||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||
3 | 1 | 1 | 1 | 1987 | 14 | 3.900 | 1 | 1938.000 | 49.000 | nan | 11.000 | 2.000 | 3.000 | 522.000 | 250000.000 | 5.000 | 1972.000 | 12.000 | 8.000 | 1600.000 | 114 | 810.000 | 3.000 | 1.000 | 1973.000 | 6.000 | 8.000 | 1600.000 | 114 | 810.000 | 3.000 | 1.000 | 2 | 2.000 | 18.000 | NaN | 1972.000 | 4.000 | 2.000 | 1.000 | 1.000 | nan | nan | 1.000 | 1.000 | 1973.000 | nan | 2.000 | 1.000 | 1.000 | nan | nan | 0.000 | 1.000 | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | 1.000 | 1.000 | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 1.000 | 1.000 | 2.000 | 2.000 | 2.000 | 2.000 | 2.000 | 1.000 | 
4.000 | 0.000 | 3.000 | 3.000 | 40.000 | 12.000 | 2.000 | 2.000 | 2.000 | 4.000 | 2.000 | 0.000 | 0.000 | 200.000 | 11.000 | nan | nan | nan | nan | 200.000 | 1000.000 | 11.000 | nan | nan | nan | nan | 2.000 | 2.000 | 2.000 | 2.000 | 2.000 | 2.000 | nan | ||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||||
4 | 1 | 1 | 1 | 1987 | 16 | 3.900 | 1 | 1928.000 | 59.000 | 0.000 | 11.000 | 2.000 | 3.000 | 522.000 | 200000.000 | 5.000 | 1958.000 | 12.000 | 2.000 | 7360.000 | 105 | 410.000 | nan | nan | 1966.000 | 12.000 | 8.000 | 4480.000 | 105 | 410.000 | nan | nan | 2 | 2.000 | 24.000 | NaN | 1966.000 | nan | 2.000 | nan | nan | nan | nan | 0.000 | 1.000 | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | nan | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 0.000 | 2.000 | 1.000 | 2.000 | 2.000 | 2.000 | 2.000 | 1.000 | 1.000 | 3.000 | 0.000 | 6.000 | nan | 
40.000 | 6.000 | 2.000 | 1.000 | 1.000 | 3.000 | 2.000 | 0.000 | nan | 20.000 | 11.000 | nan | nan | nan | nan | nan | 150.000 | 3.000 | nan | nan | nan | nan | 2.000 | 2.000 | 2.000 | 2.000 | 2.000 | 2.000 | nan |
mig_df.info()
<class 'pandas.core.frame.DataFrame'> RangeIndex: 8557 entries, 0 to 8556 Columns: 510 entries, country to hlthpmt4 dtypes: float64(327), int64(9), object(174) memory usage: 33.3+ MB
mig_df.shape
(8557, 510)
# Labels of every object-dtype column in the frame, as a plain Python list.
column_list = mig_df.select_dtypes(include=['object']).columns.tolist()
len(column_list)
174
# Convert string (object) columns to the 'category' dtype when they have low cardinality.
def convert_to_categorical(df, cols, threshold=0.2):
    """Convert low-cardinality columns of ``df`` to the ``category`` dtype.

    A column is converted when the ratio of its distinct values to the number
    of rows is at most ``threshold``. Missing values count as one distinct
    value, matching ``Series.unique``.

    Args:
        df: DataFrame whose columns are converted. It is modified in place.
        cols: Iterable of column labels to examine.
        threshold: Largest unique-values-to-rows ratio that still triggers a
            conversion. Defaults to 0.2.

    Returns:
        The same DataFrame object that was passed in.
    """
    n_rows = len(df)
    if n_rows == 0:
        # The ratio is undefined without rows; return the frame untouched
        # instead of dividing by zero.
        return df

    for col in cols:
        # Ratio of distinct values (NaN included) to total rows.
        unique_ratio = df[col].nunique(dropna=False) / n_rows
        if unique_ratio <= threshold:
            df[col] = df[col].astype('category')
    return df
# Re-type the object columns gathered in column_list. The helper returns the
# frame it was given, so mig_df is simply rebound to it.
mig_df = convert_to_categorical(mig_df, column_list)
After converting every low-cardinality string column to the 'category' dtype, the DataFrame's memory footprint drops by roughly 10 MB (from 33.3+ MB to 23.6 MB).
mig_df.info()
<class 'pandas.core.frame.DataFrame'> RangeIndex: 8557 entries, 0 to 8556 Columns: 510 entries, country to hlthpmt4 dtypes: category(174), float64(327), int64(9) memory usage: 23.6 MB
msno.matrix(mig_df.iloc[:,:50])
<matplotlib.axes._subplots.AxesSubplot at 0x22db17a0fd0>
msno.matrix(mig_df.iloc[:,50:100])
<matplotlib.axes._subplots.AxesSubplot at 0x22db244eb00>
msno.matrix(mig_df.iloc[:,100:150])
<matplotlib.axes._subplots.AxesSubplot at 0x22d90f21c18>
msno.matrix(mig_df.iloc[:,150:200])
<matplotlib.axes._subplots.AxesSubplot at 0x22d9116e1d0>
msno.matrix(mig_df.iloc[:,200:250])
<matplotlib.axes._subplots.AxesSubplot at 0x22d94613748>
msno.matrix(mig_df.iloc[:,250:300])
<matplotlib.axes._subplots.AxesSubplot at 0x22d9e297da0>
msno.matrix(mig_df.iloc[:,300:350])
<matplotlib.axes._subplots.AxesSubplot at 0x22d9f422da0>
msno.matrix(mig_df.iloc[:,350:400])
<matplotlib.axes._subplots.AxesSubplot at 0x22d9f571be0>
msno.matrix(mig_df.iloc[:,400:450])
<matplotlib.axes._subplots.AxesSubplot at 0x22d9f624fd0>
msno.matrix(mig_df.iloc[:,450:500])
# The frame has 510 columns, so the slices up to 500 leave the last ones
# unplotted. The open-ended slice covers whatever remains after column 500.
msno.matrix(mig_df.iloc[:,500:])
<matplotlib.axes._subplots.AxesSubplot at 0x22dab23a5c0>
Looking at these plots of missing data (each column corresponds to a feature in the data set, and white bars indicate missing data), we can quickly see that some features are missing the majority of their values. Imputation could be used to estimate the missing values and fill them in, but when a column contains almost no data, there is too little information to justify any imputation choice. The chart below shows how many features would remain at different missing-value thresholds. For example, if I dropped every feature missing more than 60% of its observations, I'd have about 260 features left; if I dropped every feature missing more than 40%, I'd have about 180 features left. I'll start by dropping any column with more than 60% of its data missing.
# Percentage of missing values per feature, sorted ascending. The feature
# labels are replaced by a positional index so the curve is drawn against
# feature rank rather than feature name.
tmp = (
    mig_df.isnull()
    .sum()
    .sort_values()
    .divide(mig_df.shape[0])
    .multiply(100)
    .reset_index(drop=True)
)

# Draw the curve with seaborn's "darkgrid" style applied only to this figure.
with sns.axes_style("darkgrid"):
    fig, ax = plt.subplots(figsize=(10, 7))
    ax.plot(tmp)
    ax.set(
        title='Percent of Data Missing for Each Feature (Gain Chart)',
        xlabel='Features',
        ylabel='Percent of Data Missing',
    )
mig_df.shape
(8557, 510)
# Drop every column in which more than MAX_MISSING_FRACTION of the rows are
# missing. dropna(thresh=k) keeps a column only if it has at least k non-null
# values, so k is the required non-null share rounded UP. Truncating with
# int() would keep a column that sits just over the limit.
MAX_MISSING_FRACTION = 0.60
min_non_null = int(np.ceil((1 - MAX_MISSING_FRACTION) * len(mig_df.index)))
mig_drop = mig_df.dropna(axis=1, thresh=min_non_null)
mig_drop.shape
(8557, 259)
mig_drop.info()
<class 'pandas.core.frame.DataFrame'> RangeIndex: 8557 entries, 0 to 8556 Columns: 259 entries, country to hlthpmt4 dtypes: category(173), float64(77), int64(9) memory usage: 7.2 MB
We see that we've trimmed the data down to roughly a fifth of the size we started with (7.2 MB, down from the 33.3 MB originally loaded). Calculations would have been quick enough with the 33 MB we were working with before, but we would have been lugging a lot of unnecessary data through the computations.
# Build a pandas-profiling report for the trimmed frame and display it.
# NOTE(review): the info() output for mig_drop lists only category, float64
# and int64 columns, so exclude=['object'] appears to filter nothing here.
# Confirm whether the filter is still needed.
profile = pandas_profiling.ProfileReport(mig_drop.select_dtypes(exclude=['object']))
profile
Dataset info
Number of variables | 259 |
---|---|
Number of observations | 8557 |
Total Missing (%) | 24.0% |
Total size in memory | 7.2 MiB |
Average record size in memory | 883.3 B |
Variables types
Numeric | 75 |
---|---|
Categorical | 173 |
Boolean | 3 |
Date | 0 |
Text (Unique) | 0 |
Rejected | 8 |
Unsupported | 0 |
Warnings
@by
has 3179 / 37.2% missing values Missingafdc
has 4220 / 49.3% missing values Missinganglos
has 927 / 10.8% zeros Zerosanglos
has 591 / 6.9% missing values Missingasians
has 392 / 4.6% missing values Missingbankacct
has 397 / 4.6% missing values Missingblacks
has 2542 / 29.7% zeros Zerosblacks
has 616 / 7.2% missing values Missingcard
has 226 / 2.6% missing values Missingchicanos
has 1673 / 19.6% zeros Zeroschicanos
has 631 / 7.4% missing values Missingcityrapp
has 3597 / 42.0% missing values Missingcityrrec
has 3602 / 42.1% missing values Missingcoevus
is highly correlated with coinus
(ρ = 0.90918) Rejectedcoinus
has 4022 / 47.0% zeros Zeroscoinus
has 241 / 2.8% missing values Missingconsular
has 220 / 2.6% missing values Missingcountry
has constant value 1 Rejectedcrscoy1
has 2449 / 28.6% missing values Missingcrsdep1
has 4193 / 49.0% zeros Zeroscrsdep1
has 2822 / 33.0% missing values Missingcrshow1
has 2466 / 28.8% missing values Missingcrspl1
has 3553 / 41.5% missing values Missingcrspl1
is highly skewed (γ1 = 27.708) Skewedcrsst1
is highly correlated with crspl1
(ρ = 0.92971) Rejectedcrsyes1
has 2149 / 25.1% missing values Missingcrsyr1
is highly correlated with usyr1
(ρ = 0.95644) Rejecteddoctor
has 397 / 4.6% missing values Missingedyrs
has 1056 / 12.3% zeros Zerosengfrnd
has 180 / 2.1% missing values Missingenghome
has 176 / 2.1% missing values Missingenglish
has 3319 / 38.8% zeros Zerosenglish
has 295 / 3.4% missing values Missingengneig
has 196 / 2.3% missing values Missingengwork
has 310 / 3.6% missing values Missingfadoc
has 1534 / 17.9% missing values Missingfadoyr
has 1631 / 19.1% missing values Missingfagree
has 2481 / 29.0% missing values Missingfauspl
has 4388 / 51.3% missing values Missingfausst
has 4291 / 50.1% missing values Missingfayrgr
has 2756 / 32.2% missing values Missingfedtx
has 1801 / 21.0% missing values Missingfedtxs
has 4095 / 47.9% missing values Missingfinhelp
has 457 / 5.3% missing values Missingfinhelp1
has 350 / 4.1% missing values Missingfood
has 1021 / 11.9% zeros Zerosfood
has 2149 / 25.1% missing values Missingfoodst
has 416 / 4.9% missing values Missingfrevus
is highly correlated with frinus
(ρ = 0.90996) Rejectedfrinus
has 4350 / 50.8% zeros Zerosfrinus
has 653 / 7.6% missing values Missinggeneral
has 4224 / 49.4% missing values Missingheight
has a high cardinality: 87 distinct values Warninghhincome
has 1208 / 14.1% missing values Missinghhincome
has a high cardinality: 646 distinct values Warninghhnum
is highly correlated with surveypl
(ρ = 0.96261) Rejectedhlthpmt2
has 4334 / 50.6% missing values Missinghlthpmt3
has 4488 / 52.4% missing values Missinghlthpmt4
has 4506 / 52.7% missing values Missinghospital
has 410 / 4.8% missing values Missinghowjob
has 1212 / 14.2% missing values Missinghowjobs
has 4087 / 47.8% missing values Missinghowpaid
has 1164 / 13.6% missing values Missinghowpaids
has 4086 / 47.8% missing values Missinghrwage
has 2504 / 29.3% missing values Missinghrwages
has 4160 / 48.6% missing values Missinghrwages
has a high cardinality: 95 distinct values Warninghrweek
has 1304 / 15.2% missing values Missinghrweeks
has 4095 / 47.9% missing values Missingkgs
has 90 / 1.1% missing values Missingkgs
has a high cardinality: 139 distinct values Warninglatinos
has 740 / 8.6% zeros Zeroslatinos
has 588 / 6.9% missing values Missingldowage
has 1935 / 22.6% missing values Missingldowage
has a high cardinality: 228 distinct values Warninglegspon
has 3635 / 42.5% missing values Missinglegyrapp
has 3714 / 43.4% missing values Missinglegyrapp
has a high cardinality: 73 distinct values Warninglodging
has 641 / 7.5% missing values Missinglodging1
has 358 / 4.2% missing values Missingmodoc
has 1575 / 18.4% missing values Missingmodoyr
has 1633 / 19.1% missing values Missingmogree
has 2679 / 31.3% missing values Missingmonsyr
has 1051 / 12.3% missing values Missingmonsyrs
has 4087 / 47.8% missing values Missingmouspl
has 4390 / 51.3% missing values Missingmousst
has 4352 / 50.9% missing values Missingmoyrgr
has 2774 / 32.4% missing values Missingmxhealth
has 370 / 4.3% missing values Missingneevus
is highly correlated with neinus
(ρ = 0.92759) Rejectedneinus
has 3906 / 45.6% zeros Zerosneinus
has 173 / 2.0% missing values Missingpaistp1
has 253 / 3.0% missing values Missingpaistrip
has 298 / 3.5% missing values Missingplacebrn
has 6748 / 78.9% zeros Zerosplacebrn
has 186 / 2.2% missing values Missingreltrip
has 615 / 7.2% missing values Missingreltrip1
has 347 / 4.1% missing values Missingremit
has 1940 / 22.7% zeros Zerosremit
has 1256 / 14.7% missing values Missingremit1
has 3379 / 39.5% missing values Missingrent
has 2271 / 26.5% zeros Zerosrent
has 1794 / 21.0% missing values Missingrowner
has 852 / 10.0% missing values Missingrowners
has 4128 / 48.2% missing values Missingrsuper
has 1075 / 12.6% missing values Missingrsupers
has 4146 / 48.5% missing values Missingsavings
has 2897 / 33.9% zeros Zerossavings
has 2604 / 30.4% missing values Missingsavings1
has 3987 / 46.6% missing values Missingsavretrn
has 2527 / 29.5% zeros Zerossavretrn
has 2163 / 25.3% missing values Missingsbdoc1
has 779 / 9.1% missing values Missingsbdoc10
has 1662 / 19.4% missing values Missingsbdoc11
has 1663 / 19.4% missing values Missingsbdoc12
has 1667 / 19.5% missing values Missingsbdoc2
has 1094 / 12.8% missing values Missingsbdoc3
has 1302 / 15.2% missing values Missingsbdoc4
has 1441 / 16.8% missing values Missingsbdoc5
has 1518 / 17.7% missing values Missingsbdoc6
has 1588 / 18.6% missing values Missingsbdoc7
has 1613 / 18.9% missing values Missingsbdoc8
has 1641 / 19.2% missing values Missingsbdoc9
has 1655 / 19.3% missing values Missingsbdoyr1
has 1505 / 17.6% missing values Missingsbdoyr1
has a high cardinality: 56 distinct values Warningsbdoyr10
has 1665 / 19.5% missing values Missingsbdoyr11
has 1665 / 19.5% missing values Missingsbdoyr12
has 1667 / 19.5% missing values Missingsbdoyr2
has 1577 / 18.4% missing values Missingsbdoyr3
has 1611 / 18.8% missing values Missingsbdoyr4
has 1634 / 19.1% missing values Missingsbdoyr5
has 1645 / 19.2% missing values Missingsbdoyr6
has 1654 / 19.3% missing values Missingsbdoyr7
has 1657 / 19.4% missing values Missingsbdoyr8
has 1662 / 19.4% missing values Missingsbdoyr9
has 1662 / 19.4% missing values Missingsbgree1
has 1242 / 14.5% missing values Missingsbgree10
has 2816 / 32.9% missing values Missingsbgree11
has 2826 / 33.0% missing values Missingsbgree12
has 2838 / 33.2% missing values Missingsbgree2
has 1796 / 21.0% missing values Missingsbgree3
has 2202 / 25.7% missing values Missingsbgree4
has 2464 / 28.8% missing values Missingsbgree5
has 2613 / 30.5% missing values Missingsbgree6
has 2705 / 31.6% missing values Missingsbgree7
has 2750 / 32.1% missing values Missingsbgree8
has 2786 / 32.6% missing values Missingsbgree9
has 2805 / 32.8% missing values Missingsbilevus
has 3958 / 46.3% zeros Zerossbilevus
has 460 / 5.4% missing values Missingsbilinus
has 4902 / 57.3% zeros Zerossblive1
has 3235 / 37.8% missing values Missingsblive10
has 4485 / 52.4% missing values Missingsblive11
has 4496 / 52.5% missing values Missingsblive12
has 4512 / 52.7% missing values Missingsblive2
has 4970 / 58.1% missing values Missingsblive7
has 4361 / 51.0% missing values Missingsblive8
has 4429 / 51.8% missing values Missingsblive9
has 4464 / 52.2% missing values Missingsbmgyr1
has 4210 / 49.2% missing values Missingsbmgyr10
has 4493 / 52.5% missing values Missingsbmgyr11
has 4502 / 52.6% missing values Missingsbmgyr12
has 4513 / 52.7% missing values Missingsbmgyr7
has 4415 / 51.6% missing values Missingsbmgyr8
has 4460 / 52.1% missing values Missingsbmgyr9
has 4482 / 52.4% missing values Missingsbsex1
has 3286 / 38.4% missing values Missingsbsex10
has 4485 / 52.4% missing values Missingsbsex11
has 4496 / 52.5% missing values Missingsbsex12
has 4512 / 52.7% missing values Missingsbsex2
has 4979 / 58.2% missing values Missingsbsex7
has 4361 / 51.0% missing values Missingsbsex8
has 4430 / 51.8% missing values Missingsbsex9
has 4464 / 52.2% missing values Missingsbusnw1
has 3511 / 41.0% missing values Missingsbusnw10
has 4487 / 52.4% missing values Missingsbusnw11
has 4498 / 52.6% missing values Missingsbusnw12
has 4514 / 52.8% missing values Missingsbusnw2
has 5104 / 59.6% missing values Missingsbusnw7
has 4364 / 51.0% missing values Missingsbusnw8
has 4432 / 51.8% missing values Missingsbusnw9
has 4466 / 52.2% missing values Missingsbuspl1
has 2714 / 31.7% missing values Missingsbuspl1
has a high cardinality: 111 distinct values Warningsbuspl10
has 4483 / 52.4% missing values Missingsbuspl11
has 4490 / 52.5% missing values Missingsbuspl12
has 4505 / 52.6% missing values Missingsbuspl2
has 3328 / 38.9% missing values Missingsbuspl2
has a high cardinality: 91 distinct values Warningsbuspl3
has 3781 / 44.2% missing values Missingsbuspl3
has a high cardinality: 83 distinct values Warningsbuspl4
has 4075 / 47.6% missing values Missingsbuspl4
has a high cardinality: 65 distinct values Warningsbuspl5
has 4231 / 49.4% missing values Missingsbuspl5
has a high cardinality: 52 distinct values Warningsbuspl6
has 4352 / 50.9% missing values Missingsbuspl7
has 4389 / 51.3% missing values Missingsbuspl8
has 4448 / 52.0% missing values Missingsbuspl9
has 4474 / 52.3% missing values Missingsbusst1
has 2050 / 24.0% missing values Missingsbusst10
has 4479 / 52.3% missing values Missingsbusst11
has 4490 / 52.5% missing values Missingsbusst12
has 4504 / 52.6% missing values Missingsbusst2
has 2916 / 34.1% missing values Missingsbusst3
has 3523 / 41.2% missing values Missingsbusst4
has 3911 / 45.7% missing values Missingsbusst5
has 4134 / 48.3% missing values Missingsbusst6
has 4297 / 50.2% missing values Missingsbusst7
has 4360 / 51.0% missing values Missingsbusst8
has 4430 / 51.8% missing values Missingsbusst9
has 4463 / 52.2% missing values Missingsbyrgr1
has 2443 / 28.5% missing values Missingsbyrgr1
has a high cardinality: 72 distinct values Warningsbyrgr10
has 2830 / 33.1% missing values Missingsbyrgr11
has 2836 / 33.1% missing values Missingsbyrgr12
has 2838 / 33.2% missing values Missingsbyrgr2
has 2603 / 30.4% missing values Missingsbyrgr2
has a high cardinality: 58 distinct values Warningsbyrgr3
has 2684 / 31.4% missing values Missingsbyrgr4
has 2726 / 31.9% missing values Missingsbyrgr5
has 2773 / 32.4% missing values Missingsbyrgr6
has 2796 / 32.7% missing values Missingsbyrgr7
has 2816 / 32.9% missing values Missingsbyrgr8
has 2825 / 33.0% missing values Missingsbyrgr9
has 2828 / 33.0% missing values Missingschools
has 192 / 2.2% missing values Missingsmokeage
has 1203 / 14.1% missing values Missingsmokeage
has a high cardinality: 58 distinct values Warningsocial
has 440 / 5.1% missing values Missingsport
has 427 / 5.0% missing values Missingssi
has 4223 / 49.4% missing values Missingsstax
has 1702 / 19.9% missing values Missingsstaxs
has 4091 / 47.8% missing values Missingsurveyyr
is highly correlated with commun
(ρ = 0.97277) Rejectedtaxes
has 325 / 3.8% missing values Missinguncevus
has 5015 / 58.6% zeros Zerosuncevus
has 533 / 6.2% missing values Missinguncinus
has 6089 / 71.2% zeros Zerosuncinus
has 148 / 1.7% missing values Missingunemp
has 347 / 4.1% missing values Missingusby1
has 3486 / 40.7% missing values Missingusbyl
has 2787 / 32.6% missing values Missingusbyl
is highly skewed (γ1 = 75.61) Skewedusexp
has 319 / 3.7% missing values Missingushealth
has 114 / 1.3% missing values Missingusocc1
has 150 / 1.8% missing values Missingusoccl
has 145 / 1.7% missing values Missingusplace1
has 1490 / 17.4% missing values Missingusplacel
has 1434 / 16.8% missing values Missinguswage1
has 3545 / 41.4% missing values Missinguswage1
is highly skewed (γ1 = 29.428) Skeweduswagel
has 2825 / 33.0% missing values Missinguswagel
is highly skewed (γ1 = 48.345) Skewedwelfare
has 458 / 5.4% missing values Missingwic
has 4219 / 49.3% missing values Missing@by
Numeric
Distinct count | 7 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 37.2% |
Missing (n) | 3179 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 3.6607 |
---|---|
Minimum | 1 |
Maximum | 6 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 2 |
Median | 4 |
Q3 | 5 |
95-th percentile | 5 |
Maximum | 6 |
Range | 5 |
Interquartile range | 3 |
Descriptive statistics
Standard deviation | 1.4719 |
---|---|
Coef of variation | 0.40209 |
Kurtosis | -1.2283 |
Mean | 3.6607 |
MAD | 1.3478 |
Skewness | -0.48007 |
Sum | 19687 |
Variance | 2.1666 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
5.0 | 2599 | 30.4% | |
3.0 | 1186 | 13.9% | |
2.0 | 775 | 9.1% | |
1.0 | 584 | 6.8% | |
4.0 | 202 | 2.4% | |
6.0 | 32 | 0.4% | |
(Missing) | 3179 | 37.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 584 | 6.8% | |
2.0 | 775 | 9.1% | |
3.0 | 1186 | 13.9% | |
4.0 | 202 | 2.4% | |
5.0 | 2599 | 30.4% |
Maximum 5 values
Value | Count | Frequency (%) | |
2.0 | 775 | 9.1% | |
3.0 | 1186 | 13.9% | |
4.0 | 202 | 2.4% | |
5.0 | 2599 | 30.4% | |
6.0 | 32 | 0.4% |
afdc
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 49.3% |
Missing (n) | 4220 |
2.0 | 247 |
---|---|
1.0 | 40 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
2.0 | 247 | 2.9% | |
1.0 | 40 | 0.5% | |
(Missing) | 4220 | 49.3% |
age
Numeric
Distinct count | 82 |
---|---|
Unique (%) | 1.0% |
Missing (%) | 0.0% |
Missing (n) | 3 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 46.432 |
---|---|
Minimum | 17 |
Maximum | 98 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 17 |
---|---|
5-th percentile | 26 |
Q1 | 34 |
Median | 44 |
Q3 | 57 |
95-th percentile | 74 |
Maximum | 98 |
Range | 81 |
Interquartile range | 23 |
Descriptive statistics
Standard deviation | 15.046 |
---|---|
Coef of variation | 0.32404 |
Kurtosis | -0.44176 |
Mean | 46.432 |
MAD | 12.464 |
Skewness | 0.52276 |
Sum | 397180 |
Variance | 226.37 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
36.0 | 244 | 2.9% | |
33.0 | 239 | 2.8% | |
35.0 | 238 | 2.8% | |
32.0 | 234 | 2.7% | |
39.0 | 234 | 2.7% | |
38.0 | 230 | 2.7% | |
42.0 | 225 | 2.6% | |
34.0 | 224 | 2.6% | |
31.0 | 220 | 2.6% | |
40.0 | 219 | 2.6% | |
Other values (71) | 6247 | 73.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
17.0 | 1 | 0.0% | |
18.0 | 5 | 0.1% | |
19.0 | 11 | 0.1% | |
20.0 | 19 | 0.2% | |
21.0 | 27 | 0.3% |
Maximum 5 values
Value | Count | Frequency (%) | |
93.0 | 3 | 0.0% | |
94.0 | 2 | 0.0% | |
95.0 | 1 | 0.0% | |
96.0 | 1 | 0.0% | |
98.0 | 2 | 0.0% |
anglos
Numeric
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 6.9% |
Missing (n) | 591 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.2983 |
---|---|
Minimum | 0 |
Maximum | 4 |
Zeros (%) | 10.8% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 1 |
Median | 1 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 4 |
Range | 4 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.69681 |
---|---|
Coef of variation | 0.53672 |
Kurtosis | -0.3796 |
Mean | 1.2983 |
MAD | 0.59466 |
Skewness | -0.089033 |
Sum | 10342 |
Variance | 0.48554 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 3906 | 45.6% | |
2.0 | 2966 | 34.7% | |
0.0 | 927 | 10.8% | |
3.0 | 164 | 1.9% | |
4.0 | 3 | 0.0% | |
(Missing) | 591 | 6.9% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 927 | 10.8% | |
1.0 | 3906 | 45.6% | |
2.0 | 2966 | 34.7% | |
3.0 | 164 | 1.9% | |
4.0 | 3 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
0.0 | 927 | 10.8% | |
1.0 | 3906 | 45.6% | |
2.0 | 2966 | 34.7% | |
3.0 | 164 | 1.9% | |
4.0 | 3 | 0.0% |
asians
Categorical
Distinct count | 11 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 4.6% |
Missing (n) | 392 |
0.0 | |
---|---|
1.0 | |
Other values (7) | 478 |
(Missing) | 392 |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
0.0 | 2749 | 32.1% | |
1.0 | 888 | 10.4% | |
2.0 | 343 | 4.0% | |
3.0 | 83 | 1.0% | |
0 | 27 | 0.3% | |
1 | 9 | 0.1% | |
2 | 7 | 0.1% | |
4.0 | 7 | 0.1% | |
3 | 2 | 0.0% | |
(Missing) | 392 | 4.6% |
bankacct
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 4.6% |
Missing (n) | 397 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.8496 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 2 |
Median | 2 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.35745 |
---|---|
Coef of variation | 0.19326 |
Kurtosis | 1.8292 |
Mean | 1.8496 |
MAD | 0.25551 |
Skewness | -1.9567 |
Sum | 15093 |
Variance | 0.12777 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 6933 | 81.0% | |
1.0 | 1227 | 14.3% | |
(Missing) | 397 | 4.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 1227 | 14.3% | |
2.0 | 6933 | 81.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 1227 | 14.3% | |
2.0 | 6933 | 81.0% |
blacks
Numeric
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 7.2% |
Missing (n) | 616 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.1376 |
---|---|
Minimum | 0 |
Maximum | 4 |
Zeros (%) | 29.7% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 1 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 4 |
Range | 4 |
Interquartile range | 2 |
Descriptive statistics
Standard deviation | 0.88498 |
---|---|
Coef of variation | 0.77791 |
Kurtosis | -1.4841 |
Mean | 1.1376 |
MAD | 0.79275 |
Skewness | -0.16494 |
Sum | 9034 |
Variance | 0.78319 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 3449 | 40.3% | |
0.0 | 2542 | 29.7% | |
1.0 | 1858 | 21.7% | |
3.0 | 90 | 1.1% | |
4.0 | 2 | 0.0% | |
(Missing) | 616 | 7.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 2542 | 29.7% | |
1.0 | 1858 | 21.7% | |
2.0 | 3449 | 40.3% | |
3.0 | 90 | 1.1% | |
4.0 | 2 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
0.0 | 2542 | 29.7% | |
1.0 | 1858 | 21.7% | |
2.0 | 3449 | 40.3% | |
3.0 | 90 | 1.1% | |
4.0 | 2 | 0.0% |
brain
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 7 |
2 | |
---|---|
2.0 | 361 |
Other values (2) | 10 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
2 | 1464 | 17.1% | |
2.0 | 361 | 4.2% | |
1 | 8 | 0.1% | |
1.0 | 2 | 0.0% | |
(Missing) | 7 | 0.1% |
cancer
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 8 |
2 | |
---|---|
2.0 | 362 |
Other values (2) | 7 |
(Missing) | 8 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
2 | 1465 | 17.1% | |
2.0 | 362 | 4.2% | |
1 | 6 | 0.1% | |
1.0 | 1 | 0.0% | |
(Missing) | 8 | 0.1% |
card
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 2.6% |
Missing (n) | 226 |
2.0 | |
---|---|
1.0 | 416 |
Other values (2) | 45 |
(Missing) | 226 |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
2.0 | 3820 | 44.6% | |
1.0 | 416 | 4.9% | |
2 | 42 | 0.5% | |
1 | 3 | 0.0% | |
(Missing) | 226 | 2.6% |
chicanos
Numeric
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 7.4% |
Missing (n) | 631 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.2272 |
---|---|
Minimum | 0 |
Maximum | 4 |
Zeros (%) | 19.6% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 1 |
Median | 1 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 4 |
Range | 4 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.80595 |
---|---|
Coef of variation | 0.65673 |
Kurtosis | -0.88428 |
Mean | 1.2272 |
MAD | 0.68889 |
Skewness | -0.13046 |
Sum | 9727 |
Variance | 0.64956 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 3079 | 36.0% | |
1.0 | 2979 | 34.8% | |
0.0 | 1673 | 19.6% | |
3.0 | 190 | 2.2% | |
4.0 | 5 | 0.1% | |
(Missing) | 631 | 7.4% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 1673 | 19.6% | |
1.0 | 2979 | 34.8% | |
2.0 | 3079 | 36.0% | |
3.0 | 190 | 2.2% | |
4.0 | 5 | 0.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
0.0 | 1673 | 19.6% | |
1.0 | 2979 | 34.8% | |
2.0 | 3079 | 36.0% | |
3.0 | 190 | 2.2% | |
4.0 | 5 | 0.1% |
chilevus
Categorical
Distinct count | 22 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 0.6% |
Missing (n) | 54 |
0.0 | |
---|---|
1.0 | 174 |
Other values (18) | 399 |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
0.0 | 3880 | 45.3% | |
1.0 | 174 | 2.0% | |
2.0 | 142 | 1.7% | |
3.0 | 68 | 0.8% | |
4.0 | 61 | 0.7% | |
0 | 34 | 0.4% | |
6.0 | 28 | 0.3% | |
5.0 | 24 | 0.3% | |
7.0 | 9 | 0.1% | |
Other values (11) | 33 | 0.4% | |
(Missing) | 54 | 0.6% |
chilinus
Categorical
Distinct count | 17 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 0.3% |
Missing (n) | 22 |
0.0 | |
---|---|
1.0 | 210 |
Other values (13) | 350 |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
0.0 | 3925 | 45.9% | |
1.0 | 210 | 2.5% | |
2.0 | 131 | 1.5% | |
3.0 | 82 | 1.0% | |
4.0 | 37 | 0.4% | |
0 | 34 | 0.4% | |
5.0 | 21 | 0.2% | |
6.0 | 18 | 0.2% | |
7.0 | 9 | 0.1% | |
Other values (6) | 18 | 0.2% | |
(Missing) | 22 | 0.3% |
cityrapp
Categorical
Distinct count | 46 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 42.0% |
Missing (n) | 3597 |
1998 | 6 |
---|---|
1993.0 | 5 |
Other values (42) | 93 |
(Missing) |
Value | Count | Frequency (%) | |
4856 | 56.7% | ||
1998 | 6 | 0.1% | |
1993.0 | 5 | 0.1% | |
1994.0 | 5 | 0.1% | |
2005.0 | 5 | 0.1% | |
2007.0 | 5 | 0.1% | |
1996 | 5 | 0.1% | |
2009.0 | 4 | 0.0% | |
2000.0 | 4 | 0.0% | |
1992.0 | 4 | 0.0% | |
Other values (35) | 61 | 0.7% | |
(Missing) | 3597 | 42.0% |
cityrrec
Categorical
Distinct count | 48 |
---|---|
Unique (%) | 0.6% |
Missing (%) | 42.1% |
Missing (n) | 3602 |
2012.0 | 5 |
---|---|
2008.0 | 5 |
Other values (44) | 89 |
(Missing) |
Value | Count | Frequency (%) | |
4856 | 56.7% | ||
2012.0 | 5 | 0.1% | |
2008.0 | 5 | 0.1% | |
1993.0 | 4 | 0.0% | |
1998 | 4 | 0.0% | |
2000.0 | 4 | 0.0% | |
2001.0 | 4 | 0.0% | |
1996.0 | 4 | 0.0% | |
2004.0 | 4 | 0.0% | |
2005.0 | 4 | 0.0% | |
Other values (37) | 61 | 0.7% | |
(Missing) | 3602 | 42.1% |
coevus
Highly correlated
This variable is highly correlated with coinus
and should be ignored for analysis
Correlation | 0.90918 |
---|
coinus
Numeric
Distinct count | 49 |
---|---|
Unique (%) | 0.6% |
Missing (%) | 2.8% |
Missing (n) | 241 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 4.7704 |
---|---|
Minimum | 0 |
Maximum | 120 |
Zeros (%) | 47.0% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 1 |
Q3 | 6 |
95-th percentile | 20 |
Maximum | 120 |
Range | 120 |
Interquartile range | 6 |
Descriptive statistics
Standard deviation | 8.3749 |
---|---|
Coef of variation | 1.7556 |
Kurtosis | 19.114 |
Mean | 4.7704 |
MAD | 5.5655 |
Skewness | 3.3704 |
Sum | 39671 |
Variance | 70.138 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 4022 | 47.0% | |
10.0 | 498 | 5.8% | |
3.0 | 472 | 5.5% | |
1.0 | 435 | 5.1% | |
2.0 | 434 | 5.1% | |
5.0 | 390 | 4.6% | |
4.0 | 359 | 4.2% | |
20.0 | 301 | 3.5% | |
15.0 | 258 | 3.0% | |
6.0 | 249 | 2.9% | |
Other values (38) | 898 | 10.5% | |
(Missing) | 241 | 2.8% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 4022 | 47.0% | |
1.0 | 435 | 5.1% | |
2.0 | 434 | 5.1% | |
3.0 | 472 | 5.5% | |
4.0 | 359 | 4.2% |
Maximum 5 values
Value | Count | Frequency (%) | |
70.0 | 5 | 0.1% | |
80.0 | 1 | 0.0% | |
90.0 | 1 | 0.0% | |
100.0 | 2 | 0.0% | |
120.0 | 1 | 0.0% |
commun
Numeric
Distinct count | 161 |
---|---|
Unique (%) | 1.9% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 66.314 |
---|---|
Minimum | 1 |
Maximum | 161 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 6 |
Q1 | 22 |
Median | 58 |
Q3 | 107 |
95-th percentile | 151 |
Maximum | 161 |
Range | 160 |
Interquartile range | 85 |
Descriptive statistics
Standard deviation | 48.092 |
---|---|
Coef of variation | 0.72522 |
Kurtosis | -1.1102 |
Mean | 66.314 |
MAD | 41.763 |
Skewness | 0.41461 |
Sum | 567445 |
Variance | 2312.8 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
18 | 228 | 2.7% | |
3 | 164 | 1.9% | |
30 | 154 | 1.8% | |
10 | 142 | 1.7% | |
40 | 142 | 1.7% | |
22 | 142 | 1.7% | |
8 | 141 | 1.6% | |
17 | 119 | 1.4% | |
13 | 117 | 1.4% | |
72 | 112 | 1.3% | |
Other values (151) | 7096 | 82.9% |
Minimum 5 values
Value | Count | Frequency (%) | |
1 | 96 | 1.1% | |
2 | 37 | 0.4% | |
3 | 164 | 1.9% | |
4 | 75 | 0.9% | |
5 | 32 | 0.4% |
Maximum 5 values
Value | Count | Frequency (%) | |
157 | 27 | 0.3% | |
158 | 62 | 0.7% | |
159 | 40 | 0.5% | |
160 | 66 | 0.8% | |
161 | 28 | 0.3% |
consular
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 2.6% |
Missing (n) | 220 |
2 | 898 |
---|---|
1 | 246 |
Other values (2) | 303 |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
2 | 898 | 10.5% | |
1 | 246 | 2.9% | |
2.0 | 222 | 2.6% | |
1.0 | 81 | 0.9% | |
(Missing) | 220 | 2.6% |
country
Constant
This variable is constant and should be ignored for analysis
Constant value | 1 |
---|
crscoy1
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 28.6% |
Missing (n) | 2449 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.2125 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 1 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.40912 |
---|---|
Coef of variation | 0.33741 |
Kurtosis | -0.023482 |
Mean | 1.2125 |
MAD | 0.3347 |
Skewness | 1.4059 |
Sum | 7406 |
Variance | 0.16738 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 4810 | 56.2% | |
2.0 | 1298 | 15.2% | |
(Missing) | 2449 | 28.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 4810 | 56.2% | |
2.0 | 1298 | 15.2% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 4810 | 56.2% | |
2.0 | 1298 | 15.2% |
crsdep1
Numeric
Distinct count | 17 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 33.0% |
Missing (n) | 2822 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.68771 |
---|---|
Minimum | 0 |
Maximum | 30 |
Zeros (%) | 49.0% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 1 |
95-th percentile | 3 |
Maximum | 30 |
Range | 30 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 1.8153 |
---|---|
Coef of variation | 2.6397 |
Kurtosis | 30.449 |
Mean | 0.68771 |
MAD | 1.0056 |
Skewness | 4.5255 |
Sum | 3944 |
Variance | 3.2954 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 4193 | 49.0% | |
1.0 | 878 | 10.3% | |
2.0 | 240 | 2.8% | |
3.0 | 142 | 1.7% | |
8.0 | 138 | 1.6% | |
7.0 | 42 | 0.5% | |
5.0 | 33 | 0.4% | |
4.0 | 17 | 0.2% | |
6.0 | 16 | 0.2% | |
9.0 | 13 | 0.2% | |
Other values (6) | 23 | 0.3% | |
(Missing) | 2822 | 33.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 4193 | 49.0% | |
1.0 | 878 | 10.3% | |
2.0 | 240 | 2.8% | |
3.0 | 142 | 1.7% | |
4.0 | 17 | 0.2% |
Maximum 5 values
Value | Count | Frequency (%) | |
12.0 | 2 | 0.0% | |
14.0 | 3 | 0.0% | |
15.0 | 4 | 0.0% | |
20.0 | 3 | 0.0% | |
30.0 | 1 | 0.0% |
crshow1
Numeric
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 28.8% |
Missing (n) | 2466 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 2.3338 |
---|---|
Minimum | 1 |
Maximum | 5 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 2 |
Q3 | 3 |
95-th percentile | 5 |
Maximum | 5 |
Range | 4 |
Interquartile range | 2 |
Descriptive statistics
Standard deviation | 1.0808 |
---|---|
Coef of variation | 0.46313 |
Kurtosis | -0.21478 |
Mean | 2.3338 |
MAD | 0.91972 |
Skewness | 0.41586 |
Sum | 14215 |
Variance | 1.1682 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
3.0 | 2510 | 29.3% | |
1.0 | 1770 | 20.7% | |
2.0 | 1319 | 15.4% | |
5.0 | 309 | 3.6% | |
4.0 | 183 | 2.1% | |
(Missing) | 2466 | 28.8% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 1770 | 20.7% | |
2.0 | 1319 | 15.4% | |
3.0 | 2510 | 29.3% | |
4.0 | 183 | 2.1% | |
5.0 | 309 | 3.6% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 1770 | 20.7% | |
2.0 | 1319 | 15.4% | |
3.0 | 2510 | 29.3% | |
4.0 | 183 | 2.1% | |
5.0 | 309 | 3.6% |
crspl1
Numeric
Distinct count | 27 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 41.5% |
Missing (n) | 3553 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 12.849 |
---|---|
Minimum | 1 |
Maximum | 1111 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 2 |
Q1 | 4 |
Median | 4 |
Q3 | 22 |
95-th percentile | 43 |
Maximum | 1111 |
Range | 1110 |
Interquartile range | 18 |
Descriptive statistics
Standard deviation | 30.664 |
---|---|
Coef of variation | 2.3865 |
Kurtosis | 984.77 |
Mean | 12.849 |
MAD | 13.188 |
Skewness | 27.708 |
Sum | 64295 |
Variance | 940.27 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
4.0 | 3000 | 35.1% | |
2.0 | 525 | 6.1% | |
37.0 | 357 | 4.2% | |
27.0 | 266 | 3.1% | |
43.0 | 200 | 2.3% | |
25.0 | 162 | 1.9% | |
22.0 | 154 | 1.8% | |
32.0 | 112 | 1.3% | |
3.0 | 61 | 0.7% | |
55.0 | 50 | 0.6% | |
Other values (16) | 117 | 1.4% | |
(Missing) | 3553 | 41.5% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 2 | 0.0% | |
2.0 | 525 | 6.1% | |
3.0 | 61 | 0.7% | |
4.0 | 3000 | 35.1% | |
5.0 | 12 | 0.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
48.0 | 4 | 0.0% | |
52.0 | 15 | 0.2% | |
55.0 | 50 | 0.6% | |
70.0 | 40 | 0.5% | |
1111.0 | 3 | 0.0% |
crsst1
Highly correlated
This variable is highly correlated with crspl1
and should be ignored for analysis
Correlation | 0.92971 |
---|
crsyes1
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 25.1% |
Missing (n) | 2149 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.0097 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 1 |
95-th percentile | 1 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.097894 |
---|---|
Coef of variation | 0.096956 |
Kurtosis | 98.442 |
Mean | 1.0097 |
MAD | 0.019164 |
Skewness | 10.021 |
Sum | 6470 |
Variance | 0.0095833 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 6346 | 74.2% | |
2.0 | 62 | 0.7% | |
(Missing) | 2149 | 25.1% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 6346 | 74.2% | |
2.0 | 62 | 0.7% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 6346 | 74.2% | |
2.0 | 62 | 0.7% |
crsyr1
Highly correlated
This variable is highly correlated with usyr1
and should be ignored for analysis
Correlation | 0.95644 |
---|
dacaapp
Categorical
Distinct count | 2 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 0.8% |
Missing (n) | 67 |
(Missing) | 67 |
---|
Value | Count | Frequency (%) | |
8490 | 99.2% | ||
(Missing) | 67 | 0.8% |
dacarec
Categorical
Distinct count | 2 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 0.8% |
Missing (n) | 67 |
(Missing) | 67 |
---|
Value | Count | Frequency (%) | |
8490 | 99.2% | ||
(Missing) | 67 | 0.8% |
doctor
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 4.6% |
Missing (n) | 397 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.6585 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 2 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.47426 |
---|---|
Coef of variation | 0.28596 |
Kurtosis | -1.5536 |
Mean | 1.6585 |
MAD | 0.44978 |
Skewness | -0.66839 |
Sum | 13533 |
Variance | 0.22492 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 5373 | 62.8% | |
1.0 | 2787 | 32.6% | |
(Missing) | 397 | 4.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 2787 | 32.6% | |
2.0 | 5373 | 62.8% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 2787 | 32.6% | |
2.0 | 5373 | 62.8% |
edyrs
Numeric
Distinct count | 24 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 0.2% |
Missing (n) | 18 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 5.4824 |
---|---|
Minimum | 0 |
Maximum | 28 |
Zeros (%) | 12.3% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 3 |
Median | 6 |
Q3 | 8 |
95-th percentile | 12 |
Maximum | 28 |
Range | 28 |
Interquartile range | 5 |
Descriptive statistics
Standard deviation | 3.9844 |
---|---|
Coef of variation | 0.72676 |
Kurtosis | 0.52912 |
Mean | 5.4824 |
MAD | 3.1189 |
Skewness | 0.73764 |
Sum | 46814 |
Variance | 15.875 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
6.0 | 2149 | 25.1% | |
9.0 | 1109 | 13.0% | |
0.0 | 1056 | 12.3% | |
3.0 | 1009 | 11.8% | |
2.0 | 689 | 8.1% | |
4.0 | 486 | 5.7% | |
12.0 | 420 | 4.9% | |
1.0 | 388 | 4.5% | |
5.0 | 338 | 3.9% | |
8.0 | 192 | 2.2% | |
Other values (13) | 703 | 8.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 1056 | 12.3% | |
1.0 | 388 | 4.5% | |
2.0 | 689 | 8.1% | |
3.0 | 1009 | 11.8% | |
4.0 | 486 | 5.7% |
Maximum 5 values
Value | Count | Frequency (%) | |
18.0 | 19 | 0.2% | |
19.0 | 14 | 0.2% | |
20.0 | 1 | 0.0% | |
24.0 | 2 | 0.0% | |
28.0 | 1 | 0.0% |
engfrnd
Categorical
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 2.1% |
Missing (n) | 180 |
1.0 | |
---|---|
2.0 | 762 |
Other values (5) | 237 |
(Missing) | 180 |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 3328 | 38.9% | |
2.0 | 762 | 8.9% | |
3.0 | 140 | 1.6% | |
4.0 | 53 | 0.6% | |
1 | 37 | 0.4% | |
2 | 6 | 0.1% | |
3 | 1 | 0.0% | |
(Missing) | 180 | 2.1% |
enghome
Categorical
Distinct count | 8 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 2.1% |
Missing (n) | 176 |
1.0 | |
---|---|
2.0 | 623 |
Other values (4) | 210 |
(Missing) | 176 |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 3498 | 40.9% | |
2.0 | 623 | 7.3% | |
3.0 | 120 | 1.4% | |
4.0 | 46 | 0.5% | |
1 | 37 | 0.4% | |
2 | 7 | 0.1% | |
(Missing) | 176 | 2.1% |
english
Numeric
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 3.4% |
Missing (n) | 295 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.295 |
---|---|
Minimum | 0 |
Maximum | 4 |
Zeros (%) | 38.8% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 1 |
Q3 | 3 |
95-th percentile | 4 |
Maximum | 4 |
Range | 4 |
Interquartile range | 3 |
Descriptive statistics
Standard deviation | 1.3517 |
---|---|
Coef of variation | 1.0438 |
Kurtosis | -0.98255 |
Mean | 1.295 |
MAD | 1.1784 |
Skewness | 0.62879 |
Sum | 10699 |
Variance | 1.8272 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 3319 | 38.8% | |
1.0 | 1932 | 22.6% | |
3.0 | 1497 | 17.5% | |
2.0 | 890 | 10.4% | |
4.0 | 624 | 7.3% | |
(Missing) | 295 | 3.4% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 3319 | 38.8% | |
1.0 | 1932 | 22.6% | |
2.0 | 890 | 10.4% | |
3.0 | 1497 | 17.5% | |
4.0 | 624 | 7.3% |
Maximum 5 values
Value | Count | Frequency (%) | |
0.0 | 3319 | 38.8% | |
1.0 | 1932 | 22.6% | |
2.0 | 890 | 10.4% | |
3.0 | 1497 | 17.5% | |
4.0 | 624 | 7.3% |
engneig
Categorical
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 2.3% |
Missing (n) | 196 |
1.0 | |
---|---|
2.0 | |
Other values (5) | 386 |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 2816 | 32.9% | |
2.0 | 1109 | 13.0% | |
3.0 | 226 | 2.6% | |
4.0 | 116 | 1.4% | |
1 | 33 | 0.4% | |
2 | 10 | 0.1% | |
3 | 1 | 0.0% | |
(Missing) | 196 | 2.3% |
engwork
Categorical
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 3.6% |
Missing (n) | 310 |
1.0 | |
---|---|
2.0 | |
Other values (5) | 676 |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 2081 | 24.3% | |
2.0 | 1440 | 16.8% | |
3.0 | 446 | 5.2% | |
4.0 | 192 | 2.2% | |
1 | 23 | 0.3% | |
2 | 14 | 0.2% | |
0.0 | 1 | 0.0% | |
(Missing) | 310 | 3.6% |
fadoc
Categorical
Distinct count | 11 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 17.9% |
Missing (n) | 1534 |
1 | 42 |
---|---|
3 | 37 |
Other values (7) | 54 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 42 | 0.5% | |
3 | 37 | 0.4% | |
4 | 17 | 0.2% | |
2 | 16 | 0.2% | |
1.0 | 10 | 0.1% | |
3.0 | 7 | 0.1% | |
2.0 | 2 | 0.0% | |
8 | 1 | 0.0% | |
4.0 | 1 | 0.0% | |
(Missing) | 1534 | 17.9% |
fadoyr
Categorical
Distinct count | 23 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 19.1% |
Missing (n) | 1631 |
1989.0 | 4 |
---|---|
1980 | 4 |
Other values (19) | 28 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1989.0 | 4 | 0.0% | |
1980 | 4 | 0.0% | |
1999 | 3 | 0.0% | |
1987 | 3 | 0.0% | |
1958 | 2 | 0.0% | |
1987.0 | 2 | 0.0% | |
1990 | 2 | 0.0% | |
1986 | 2 | 0.0% | |
2004 | 2 | 0.0% | |
Other values (12) | 12 | 0.1% | |
(Missing) | 1631 | 19.1% |
fagree
Categorical
Distinct count | 7 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 29.0% |
Missing (n) | 2481 |
2.0 | 208 |
---|---|
1.0 | 124 |
Other values (3) | 27 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
2.0 | 208 | 2.4% | |
1.0 | 124 | 1.4% | |
2 | 14 | 0.2% | |
1 | 10 | 0.1% | |
3.0 | 3 | 0.0% | |
(Missing) | 2481 | 29.0% |
fauspl
Categorical
Distinct count | 34 |
---|---|
Unique (%) | 0.4% |
Missing (%) | 51.3% |
Missing (n) | 4388 |
4480.0 | 27 |
---|---|
7777.0 | 14 |
Other values (30) | 78 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 27 | 0.3% | |
7777.0 | 14 | 0.2% | |
1600.0 | 10 | 0.1% | |
7320.0 | 7 | 0.1% | |
6160.0 | 7 | 0.1% | |
5945.0 | 5 | 0.1% | |
7400.0 | 5 | 0.1% | |
6200.0 | 4 | 0.0% | |
1920.0 | 4 | 0.0% | |
Other values (23) | 36 | 0.4% | |
(Missing) | 4388 | 51.3% |
fausst
Categorical
Distinct count | 26 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 50.1% |
Missing (n) | 4291 |
199.0 | 82 |
---|---|
105.0 | 64 |
Other values (22) | 70 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
199.0 | 82 | 1.0% | |
105.0 | 64 | 0.7% | |
144.0 | 13 | 0.2% | |
114.0 | 11 | 0.1% | |
139.0 | 8 | 0.1% | |
110.0 | 7 | 0.1% | |
103.0 | 5 | 0.1% | |
143.0 | 2 | 0.0% | |
115.0 | 2 | 0.0% | |
Other values (15) | 22 | 0.3% | |
(Missing) | 4291 | 50.1% |
fayrgr
Categorical
Distinct count | 35 |
---|---|
Unique (%) | 0.4% |
Missing (%) | 32.2% |
Missing (n) | 2756 |
1987.0 | 13 |
---|---|
1986.0 | 9 |
Other values (31) | 62 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1987.0 | 13 | 0.2% | |
1986.0 | 9 | 0.1% | |
1999.0 | 6 | 0.1% | |
1988.0 | 4 | 0.0% | |
1973.0 | 3 | 0.0% | |
1985.0 | 3 | 0.0% | |
1978.0 | 3 | 0.0% | |
1956.0 | 3 | 0.0% | |
1955.0 | 3 | 0.0% | |
Other values (24) | 37 | 0.4% | |
(Missing) | 2756 | 32.2% |
fedtx
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 21.0% |
Missing (n) | 1801 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.2848 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.45134 |
---|---|
Coef of variation | 0.3513 |
Kurtosis | -1.0903 |
Mean | 1.2848 |
MAD | 0.40736 |
Skewness | 0.95395 |
Sum | 8680 |
Variance | 0.20371 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 4832 | 56.5% | |
2.0 | 1924 | 22.5% | |
(Missing) | 1801 | 21.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 4832 | 56.5% | |
2.0 | 1924 | 22.5% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 4832 | 56.5% | |
2.0 | 1924 | 22.5% |
fedtxs
Categorical
Distinct count | 5 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 47.9% |
Missing (n) | 4095 |
1.0 | 290 |
---|---|
2.0 | 117 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 290 | 3.4% | |
2.0 | 117 | 1.4% | |
1 | 5 | 0.1% | |
(Missing) | 4095 | 47.9% |
finhelp
Categorical
Distinct count | 16 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 5.3% |
Missing (n) | 457 |
6.0 | |
---|---|
4 | |
4.0 | |
Other values (12) |
Value | Count | Frequency (%) | |
6.0 | 2107 | 24.6% | |
4 | 1171 | 13.7% | |
4.0 | 1074 | 12.6% | |
995 | 11.6% | ||
6 | 922 | 10.8% | |
2.0 | 608 | 7.1% | |
2 | 556 | 6.5% | |
3.0 | 203 | 2.4% | |
3 | 173 | 2.0% | |
1.0 | 99 | 1.2% | |
Other values (5) | 192 | 2.2% | |
(Missing) | 457 | 5.3% |
finhelp1
Categorical
Distinct count | 16 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 4.1% |
Missing (n) | 350 |
6 | |
---|---|
4.0 | |
Other values (12) |
Value | Count | Frequency (%) | |
3354 | 39.2% | ||
6 | 954 | 11.1% | |
4.0 | 938 | 11.0% | |
4 | 913 | 10.7% | |
6.0 | 672 | 7.9% | |
2.0 | 454 | 5.3% | |
2 | 446 | 5.2% | |
3 | 188 | 2.2% | |
3.0 | 85 | 1.0% | |
1 | 82 | 1.0% | |
Other values (5) | 121 | 1.4% | |
(Missing) | 350 | 4.1% |
food
Numeric
Distinct count | 146 |
---|---|
Unique (%) | 1.7% |
Missing (%) | 25.1% |
Missing (n) | 2149 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 164.83 |
---|---|
Minimum | 0 |
Maximum | 2800 |
Zeros (%) | 11.9% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 40 |
Median | 100 |
Q3 | 200 |
95-th percentile | 500 |
Maximum | 2800 |
Range | 2800 |
Interquartile range | 160 |
Descriptive statistics
Standard deviation | 185.04 |
---|---|
Coef of variation | 1.1226 |
Kurtosis | 12.902 |
Mean | 164.83 |
MAD | 130.39 |
Skewness | 2.5371 |
Sum | 1056300 |
Variance | 34239 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 1021 | 11.9% | |
200.0 | 706 | 8.3% | |
100.0 | 666 | 7.8% | |
400.0 | 337 | 3.9% | |
120.0 | 313 | 3.7% | |
80.0 | 297 | 3.5% | |
150.0 | 289 | 3.4% | |
50.0 | 265 | 3.1% | |
300.0 | 261 | 3.1% | |
160.0 | 181 | 2.1% | |
Other values (135) | 2072 | 24.2% | |
(Missing) | 2149 | 25.1% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 1021 | 11.9% | |
1.0 | 2 | 0.0% | |
1.75 | 1 | 0.0% | |
2.0 | 3 | 0.0% | |
3.0 | 4 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
1200.0 | 9 | 0.1% | |
1400.0 | 1 | 0.0% | |
1500.0 | 4 | 0.0% | |
1600.0 | 1 | 0.0% | |
2800.0 | 1 | 0.0% |
foodst
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 4.9% |
Missing (n) | 416 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.9478 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 2 |
Median | 2 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.22245 |
---|---|
Coef of variation | 0.11421 |
Kurtosis | 14.22 |
Mean | 1.9478 |
MAD | 0.098959 |
Skewness | -4.027 |
Sum | 15857 |
Variance | 0.049486 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 7716 | 90.2% | |
1.0 | 425 | 5.0% | |
(Missing) | 416 | 4.9% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 425 | 5.0% | |
2.0 | 7716 | 90.2% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 425 | 5.0% | |
2.0 | 7716 | 90.2% |
frevus
Highly correlated
This variable is highly correlated with frinus
and should be ignored for analysis
Correlation | 0.90996 |
---|
frinus
Numeric
Distinct count | 44 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 7.6% |
Missing (n) | 653 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 5.0659 |
---|---|
Minimum | 0 |
Maximum | 300 |
Zeros (%) | 50.8% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 5 |
95-th percentile | 20 |
Maximum | 300 |
Range | 300 |
Interquartile range | 5 |
Descriptive statistics
Standard deviation | 12.63 |
---|---|
Coef of variation | 2.4931 |
Kurtosis | 110.14 |
Mean | 5.0659 |
MAD | 6.5234 |
Skewness | 7.8374 |
Sum | 40041 |
Variance | 159.51 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 4350 | 50.8% | |
10.0 | 549 | 6.4% | |
5.0 | 406 | 4.7% | |
2.0 | 400 | 4.7% | |
1.0 | 374 | 4.4% | |
3.0 | 355 | 4.1% | |
20.0 | 284 | 3.3% | |
4.0 | 222 | 2.6% | |
15.0 | 180 | 2.1% | |
6.0 | 152 | 1.8% | |
Other values (33) | 632 | 7.4% | |
(Missing) | 653 | 7.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 4350 | 50.8% | |
1.0 | 374 | 4.4% | |
2.0 | 400 | 4.7% | |
3.0 | 355 | 4.1% | |
4.0 | 222 | 2.6% |
Maximum 5 values
Value | Count | Frequency (%) | |
150.0 | 2 | 0.0% | |
190.0 | 1 | 0.0% | |
200.0 | 5 | 0.1% | |
250.0 | 1 | 0.0% | |
300.0 | 1 | 0.0% |
general
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 49.4% |
Missing (n) | 4224 |
2.0 | 230 |
---|---|
1.0 | 53 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
2.0 | 230 | 2.7% | |
1.0 | 53 | 0.6% | |
(Missing) | 4224 | 49.4% |
health
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 8 |
3 | 716 |
---|---|
4 | 713 |
Other values (6) | 405 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
3 | 716 | 8.4% | |
4 | 713 | 8.3% | |
3.0 | 212 | 2.5% | |
4.0 | 140 | 1.6% | |
2 | 38 | 0.4% | |
2.0 | 9 | 0.1% | |
1 | 5 | 0.1% | |
1.0 | 1 | 0.0% | |
(Missing) | 8 | 0.1% |
healthly
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 5 |
3 | 922 |
---|---|
2 | 315 |
Other values (6) | 600 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
3 | 922 | 10.8% | |
2 | 315 | 3.7% | |
3.0 | 233 | 2.7% | |
4 | 171 | 2.0% | |
2.0 | 71 | 0.8% | |
1 | 66 | 0.8% | |
4.0 | 54 | 0.6% | |
1.0 | 5 | 0.1% | |
(Missing) | 5 | 0.1% |
healthnw
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 5 |
3 | 864 |
---|---|
2 | 379 |
Other values (6) | 594 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
3 | 864 | 10.1% | |
2 | 379 | 4.4% | |
3.0 | 220 | 2.6% | |
4 | 163 | 1.9% | |
2.0 | 84 | 1.0% | |
1 | 68 | 0.8% | |
4.0 | 52 | 0.6% | |
1.0 | 7 | 0.1% | |
(Missing) | 5 | 0.1% |
heart
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 8 |
2 | |
---|---|
2.0 | 357 |
Other values (2) | 73 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
2 | 1404 | 16.4% | |
2.0 | 357 | 4.2% | |
1 | 67 | 0.8% | |
1.0 | 6 | 0.1% | |
(Missing) | 8 | 0.1% |
height
Categorical
Distinct count | 87 |
---|---|
Unique (%) | 1.0% |
Missing (%) | 0.5% |
Missing (n) | 39 |
1.7 | 286 |
---|---|
1.65 | 164 |
Other values (83) | 1353 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
1.7 | 286 | 3.3% | |
1.65 | 164 | 1.9% | |
1.6 | 157 | 1.8% | |
1.8 | 96 | 1.1% | |
1.75 | 83 | 1.0% | |
1.7 | 76 | 0.9% | |
1.6 | 60 | 0.7% | |
1.68 | 60 | 0.7% | |
1.55 | 48 | 0.6% | |
Other values (76) | 773 | 9.0% |
hhincome
Categorical
Distinct count | 646 |
---|---|
Unique (%) | 7.5% |
Missing (%) | 14.1% |
Missing (n) | 1208 |
0.0 | 187 |
---|---|
0 | 167 |
Other values (642) | |
(Missing) |
Value | Count | Frequency (%) | |
4507 | 52.7% | ||
0.0 | 187 | 2.2% | |
0 | 167 | 2.0% | |
400000.0 | 88 | 1.0% | |
600000.0 | 70 | 0.8% | |
300000.0 | 63 | 0.7% | |
600 | 60 | 0.7% | |
400 | 57 | 0.7% | |
800000.0 | 55 | 0.6% | |
200000.0 | 54 | 0.6% | |
Other values (635) | 2041 | 23.9% | |
(Missing) | 1208 | 14.1% |
hhnum
Highly correlated
This variable is highly correlated with surveypl
and should be ignored for analysis
Correlation | 0.96261 |
---|
hlthpmt2
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 50.6% |
Missing (n) | 4334 |
4.0 | 64 |
---|---|
3.0 | 34 |
Other values (6) | 75 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4.0 | 64 | 0.7% | |
3.0 | 34 | 0.4% | |
5.0 | 25 | 0.3% | |
1.0 | 25 | 0.3% | |
2.0 | 18 | 0.2% | |
7.0 | 3 | 0.0% | |
2 | 2 | 0.0% | |
6.0 | 2 | 0.0% | |
(Missing) | 4334 | 50.6% |
hlthpmt3
Categorical
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 52.4% |
Missing (n) | 4488 |
3.0 | 6 |
---|---|
4.0 | 5 |
Other values (5) | 8 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
3.0 | 6 | 0.1% | |
4.0 | 5 | 0.1% | |
2.0 | 4 | 0.0% | |
7.0 | 1 | 0.0% | |
6.0 | 1 | 0.0% | |
5.0 | 1 | 0.0% | |
1.0 | 1 | 0.0% | |
(Missing) | 4488 | 52.4% |
hlthpmt4
Categorical
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.7% |
Missing (n) | 4506 |
6.0 | 1 |
---|---|
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
6.0 | 1 | 0.0% | |
(Missing) | 4506 | 52.7% |
hospital
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 4.8% |
Missing (n) | 410 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.6913 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 2 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.46199 |
---|---|
Coef of variation | 0.27316 |
Kurtosis | -1.3142 |
Mean | 1.6913 |
MAD | 0.42681 |
Skewness | -0.82835 |
Sum | 13779 |
Variance | 0.21343 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 5632 | 65.8% | |
1.0 | 2515 | 29.4% | |
(Missing) | 410 | 4.8% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 2515 | 29.4% | |
2.0 | 5632 | 65.8% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 2515 | 29.4% | |
2.0 | 5632 | 65.8% |
howjob
Numeric
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 14.2% |
Missing (n) | 1212 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 2.5673 |
---|---|
Minimum | 1 |
Maximum | 9 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 2 |
Q3 | 3 |
95-th percentile | 6 |
Maximum | 9 |
Range | 8 |
Interquartile range | 2 |
Descriptive statistics
Standard deviation | 1.5723 |
---|---|
Coef of variation | 0.61242 |
Kurtosis | 1.0317 |
Mean | 2.5673 |
MAD | 1.2057 |
Skewness | 1.2569 |
Sum | 18857 |
Variance | 2.4721 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 2260 | 26.4% | |
1.0 | 2007 | 23.5% | |
3.0 | 1889 | 22.1% | |
6.0 | 833 | 9.7% | |
4.0 | 274 | 3.2% | |
8.0 | 39 | 0.5% | |
5.0 | 31 | 0.4% | |
9.0 | 9 | 0.1% | |
7.0 | 3 | 0.0% | |
(Missing) | 1212 | 14.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 2007 | 23.5% | |
2.0 | 2260 | 26.4% | |
3.0 | 1889 | 22.1% | |
4.0 | 274 | 3.2% | |
5.0 | 31 | 0.4% |
Maximum 5 values
Value | Count | Frequency (%) | |
5.0 | 31 | 0.4% | |
6.0 | 833 | 9.7% | |
7.0 | 3 | 0.0% | |
8.0 | 39 | 0.5% | |
9.0 | 9 | 0.1% |
howjobs
Categorical
Distinct count | 11 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 47.8% |
Missing (n) | 4087 |
2.0 | 170 |
---|---|
1.0 | 138 |
Other values (7) | 112 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
2.0 | 170 | 2.0% | |
1.0 | 138 | 1.6% | |
3.0 | 81 | 0.9% | |
4.0 | 11 | 0.1% | |
6.0 | 8 | 0.1% | |
8.0 | 6 | 0.1% | |
2 | 4 | 0.0% | |
1 | 1 | 0.0% | |
7.0 | 1 | 0.0% | |
(Missing) | 4087 | 47.8% |
howpaid
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 13.6% |
Missing (n) | 1164 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.2561 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.43648 |
---|---|
Coef of variation | 0.3475 |
Kurtosis | -0.75007 |
Mean | 1.2561 |
MAD | 0.38098 |
Skewness | 1.1181 |
Sum | 9286 |
Variance | 0.19052 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 5500 | 64.3% | |
2.0 | 1893 | 22.1% | |
(Missing) | 1164 | 13.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 5500 | 64.3% | |
2.0 | 1893 | 22.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 5500 | 64.3% | |
2.0 | 1893 | 22.1% |
howpaids
Categorical
Distinct count | 5 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 47.8% |
Missing (n) | 4086 |
1.0 | 289 |
---|---|
2.0 | 127 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 289 | 3.4% | |
2.0 | 127 | 1.5% | |
1 | 5 | 0.1% | |
(Missing) | 4086 | 47.8% |
hrwage
Numeric
Distinct count | 432 |
---|---|
Unique (%) | 5.0% |
Missing (%) | 29.3% |
Missing (n) | 2504 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 5.9034 |
---|---|
Minimum | 0 |
Maximum | 200 |
Zeros (%) | 0.1% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0.8 |
Q1 | 3 |
Median | 5 |
Q3 | 7.79 |
95-th percentile | 13 |
Maximum | 200 |
Range | 200 |
Interquartile range | 4.79 |
Descriptive statistics
Standard deviation | 5.0759 |
---|---|
Coef of variation | 0.85982 |
Kurtosis | 385.54 |
Mean | 5.9034 |
MAD | 3.0825 |
Skewness | 11.823 |
Sum | 35733 |
Variance | 25.764 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
5.0 | 413 | 4.8% | |
6.0 | 338 | 3.9% | |
7.0 | 284 | 3.3% | |
8.0 | 266 | 3.1% | |
4.0 | 240 | 2.8% | |
3.0 | 239 | 2.8% | |
10.0 | 222 | 2.6% | |
4.5 | 193 | 2.3% | |
2.5 | 166 | 1.9% | |
9.0 | 155 | 1.8% | |
Other values (421) | 3537 | 41.3% | |
(Missing) | 2504 | 29.3% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 7 | 0.1% | |
0.03 | 1 | 0.0% | |
0.07 | 1 | 0.0% | |
0.1 | 5 | 0.1% | |
0.11 | 1 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
37.5 | 1 | 0.0% | |
40.0 | 2 | 0.0% | |
50.0 | 1 | 0.0% | |
110.0 | 1 | 0.0% | |
200.0 | 1 | 0.0% |
hrwages
Categorical
Distinct count | 95 |
---|---|
Unique (%) | 1.1% |
Missing (%) | 48.6% |
Missing (n) | 4160 |
6.0 | 29 |
---|---|
7.0 | 22 |
Other values (91) | 296 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
6.0 | 29 | 0.3% | |
7.0 | 22 | 0.3% | |
8.0 | 21 | 0.2% | |
5.0 | 18 | 0.2% | |
10.0 | 12 | 0.1% | |
4.25 | 10 | 0.1% | |
5.5 | 10 | 0.1% | |
9.0 | 9 | 0.1% | |
12.0 | 9 | 0.1% | |
Other values (84) | 207 | 2.4% | |
(Missing) | 4160 | 48.6% |
hrweek
Numeric
Distinct count | 92 |
---|---|
Unique (%) | 1.1% |
Missing (%) | 15.2% |
Missing (n) | 1304 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 45.771 |
---|---|
Minimum | 1 |
Maximum | 133 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 20 |
Q1 | 40 |
Median | 40 |
Q3 | 50 |
95-th percentile | 72 |
Maximum | 133 |
Range | 132 |
Interquartile range | 10 |
Descriptive statistics
Standard deviation | 14.881 |
---|---|
Coef of variation | 0.32512 |
Kurtosis | 2.9353 |
Mean | 45.771 |
MAD | 10.434 |
Skewness | 0.46688 |
Sum | 331980 |
Variance | 221.45 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
40.0 | 2738 | 32.0% | |
48.0 | 1006 | 11.8% | |
60.0 | 643 | 7.5% | |
50.0 | 512 | 6.0% | |
45.0 | 200 | 2.3% | |
70.0 | 170 | 2.0% | |
30.0 | 170 | 2.0% | |
56.0 | 155 | 1.8% | |
72.0 | 138 | 1.6% | |
8.0 | 110 | 1.3% | |
Other values (81) | 1411 | 16.5% | |
(Missing) | 1304 | 15.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 3 | 0.0% | |
2.0 | 1 | 0.0% | |
3.0 | 4 | 0.0% | |
4.0 | 6 | 0.1% | |
5.0 | 7 | 0.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
120.0 | 4 | 0.0% | |
126.0 | 3 | 0.0% | |
130.0 | 1 | 0.0% | |
132.0 | 1 | 0.0% | |
133.0 | 1 | 0.0% |
hrweeks
Categorical
Distinct count | 45 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 47.9% |
Missing (n) | 4095 |
40.0 | 199 |
---|---|
48.0 | 45 |
Other values (41) | 168 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
40.0 | 199 | 2.3% | |
48.0 | 45 | 0.5% | |
60.0 | 21 | 0.2% | |
35.0 | 19 | 0.2% | |
30.0 | 19 | 0.2% | |
50.0 | 19 | 0.2% | |
20.0 | 8 | 0.1% | |
8.0 | 7 | 0.1% | |
12.0 | 5 | 0.1% | |
Other values (34) | 70 | 0.8% | |
(Missing) | 4095 | 47.9% |
hyperten
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 6 |
2 | 1230 |
---|---|
2.0 | 314 |
Other values (2) | 292 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
2 | 1230 | 14.4% | |
2.0 | 314 | 3.7% | |
1 | 243 | 2.8% | |
1.0 | 49 | 0.6% | |
(Missing) | 6 | 0.1% |
kgs
Categorical
Distinct count | 139 |
---|---|
Unique (%) | 1.6% |
Missing (%) | 1.1% |
Missing (n) | 90 |
80 | 184 |
---|---|
70 | 171 |
Other values (135) |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
80 | 184 | 2.2% | |
70 | 171 | 2.0% | |
75 | 104 | 1.2% | |
90 | 71 | 0.8% | |
60 | 70 | 0.8% | |
85 | 64 | 0.7% | |
65 | 63 | 0.7% | |
80.0 | 53 | 0.6% | |
78 | 51 | 0.6% | |
Other values (128) | 921 | 10.8% | |
(Missing) | 90 | 1.1% |
latinos
Numeric
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 6.9% |
Missing (n) | 588 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.4688 |
---|---|
Minimum | 0 |
Maximum | 4 |
Zeros (%) | 8.6% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 1 |
Median | 2 |
Q3 | 2 |
95-th percentile | 3 |
Maximum | 4 |
Range | 4 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.7379 |
---|---|
Coef of variation | 0.50237 |
Kurtosis | -0.28517 |
Mean | 1.4688 |
MAD | 0.64754 |
Skewness | -0.16716 |
Sum | 11705 |
Variance | 0.54449 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 3617 | 42.3% | |
1.0 | 3185 | 37.2% | |
0.0 | 740 | 8.6% | |
3.0 | 422 | 4.9% | |
4.0 | 5 | 0.1% | |
(Missing) | 588 | 6.9% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 740 | 8.6% | |
1.0 | 3185 | 37.2% | |
2.0 | 3617 | 42.3% | |
3.0 | 422 | 4.9% | |
4.0 | 5 | 0.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
0.0 | 740 | 8.6% | |
1.0 | 3185 | 37.2% | |
2.0 | 3617 | 42.3% | |
3.0 | 422 | 4.9% | |
4.0 | 5 | 0.1% |
ldowage
Categorical
Distinct count | 228 |
---|---|
Unique (%) | 2.7% |
Missing (%) | 22.6% |
Missing (n) | 1935 |
100.0 | 157 |
---|---|
1000.0 | 152 |
Other values (224) | |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
100.0 | 157 | 1.8% | |
1000.0 | 152 | 1.8% | |
800.0 | 126 | 1.5% | |
200.0 | 110 | 1.3% | |
500.0 | 105 | 1.2% | |
600.0 | 98 | 1.1% | |
150.0 | 93 | 1.1% | |
300.0 | 90 | 1.1% | |
120.0 | 83 | 1.0% | |
Other values (217) | 1558 | 18.2% | |
(Missing) | 1935 | 22.6% |
legspon
Categorical
Distinct count | 13 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 42.5% |
Missing (n) | 3635 |
5.0 | 309 |
---|---|
6 | 261 |
Other values (9) | |
(Missing) |
Value | Count | Frequency (%) | |
3583 | 41.9% | ||
5.0 | 309 | 3.6% | |
6 | 261 | 3.1% | |
5 | 209 | 2.4% | |
7.0 | 159 | 1.9% | |
3.0 | 126 | 1.5% | |
6.0 | 71 | 0.8% | |
1.0 | 68 | 0.8% | |
2.0 | 64 | 0.7% | |
4.0 | 45 | 0.5% | |
Other values (2) | 27 | 0.3% | |
(Missing) | 3635 | 42.5% |
legyrapp
Categorical
Distinct count | 73 |
---|---|
Unique (%) | 0.9% |
Missing (%) | 43.4% |
Missing (n) | 3714 |
1987.0 | 175 |
---|---|
1986.0 | 85 |
Other values (69) | 534 |
(Missing) |
Value | Count | Frequency (%) | |
4049 | 47.3% | ||
1987.0 | 175 | 2.0% | |
1986.0 | 85 | 1.0% | |
1988.0 | 74 | 0.9% | |
1985.0 | 29 | 0.3% | |
1989.0 | 27 | 0.3% | |
2001.0 | 20 | 0.2% | |
1996.0 | 18 | 0.2% | |
1991.0 | 16 | 0.2% | |
1990.0 | 15 | 0.2% | |
Other values (62) | 335 | 3.9% | |
(Missing) | 3714 | 43.4% |
lodging
Categorical
Distinct count | 14 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 7.5% |
Missing (n) | 641 |
4.0 | |
---|---|
4 | |
Other values (10) |
Value | Count | Frequency (%) | |
4.0 | 1726 | 20.2% | |
4 | 1489 | 17.4% | |
995 | 11.6% | ||
3.0 | 831 | 9.7% | |
2 | 779 | 9.1% | |
2.0 | 737 | 8.6% | |
3 | 346 | 4.0% | |
6.0 | 279 | 3.3% | |
1.0 | 231 | 2.7% | |
6 | 179 | 2.1% | |
Other values (3) | 324 | 3.8% | |
(Missing) | 641 | 7.5% |
lodging1
Categorical
Distinct count | 14 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 4.2% |
Missing (n) | 358 |
4.0 | |
---|---|
4 | |
Other values (10) |
Value | Count | Frequency (%) | |
3354 | 39.2% | ||
4.0 | 1203 | 14.1% | |
4 | 1160 | 13.6% | |
2 | 594 | 6.9% | |
2.0 | 588 | 6.9% | |
3 | 425 | 5.0% | |
3.0 | 236 | 2.8% | |
1 | 169 | 2.0% | |
1.0 | 166 | 1.9% | |
6 | 140 | 1.6% | |
Other values (3) | 164 | 1.9% | |
(Missing) | 358 | 4.2% |
lung
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 8 |
2 | |
---|---|
2.0 | 358 |
Other values (2) | 47 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
2 | 1429 | 16.7% | |
2.0 | 358 | 4.2% | |
1 | 42 | 0.5% | |
1.0 | 5 | 0.1% | |
(Missing) | 8 | 0.1% |
marstat
Numeric
Distinct count | 7 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.0% |
Missing (n) | 4 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 2.2155 |
---|---|
Minimum | 1 |
Maximum | 6 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 2 |
Q1 | 2 |
Median | 2 |
Q3 | 2 |
95-th percentile | 4 |
Maximum | 6 |
Range | 5 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.75647 |
---|---|
Coef of variation | 0.34145 |
Kurtosis | 11.889 |
Mean | 2.2155 |
MAD | 0.42294 |
Skewness | 3.2659 |
Sum | 18949 |
Variance | 0.57225 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 7277 | 85.0% | |
3.0 | 518 | 6.1% | |
4.0 | 317 | 3.7% | |
1.0 | 198 | 2.3% | |
6.0 | 160 | 1.9% | |
5.0 | 83 | 1.0% | |
(Missing) | 4 | 0.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 198 | 2.3% | |
2.0 | 7277 | 85.0% | |
3.0 | 518 | 6.1% | |
4.0 | 317 | 3.7% | |
5.0 | 83 | 1.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
2.0 | 7277 | 85.0% | |
3.0 | 518 | 6.1% | |
4.0 | 317 | 3.7% | |
5.0 | 83 | 1.0% | |
6.0 | 160 | 1.9% |
modoc
Categorical
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 18.4% |
Missing (n) | 1575 |
1 | 40 |
---|---|
4 | 14 |
Other values (5) | 38 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 40 | 0.5% | |
4 | 14 | 0.2% | |
2 | 12 | 0.1% | |
3 | 10 | 0.1% | |
1.0 | 9 | 0.1% | |
3.0 | 5 | 0.1% | |
2.0 | 2 | 0.0% | |
(Missing) | 1575 | 18.4% |
modoyr
Categorical
Distinct count | 25 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 19.1% |
Missing (n) | 1633 |
1999 | 4 |
---|---|
1987 | 4 |
Other values (21) | 26 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1999 | 4 | 0.0% | |
1987 | 4 | 0.0% | |
1989.0 | 3 | 0.0% | |
1987.0 | 2 | 0.0% | |
1980 | 2 | 0.0% | |
2006 | 2 | 0.0% | |
2003 | 1 | 0.0% | |
1958 | 1 | 0.0% | |
2013 | 1 | 0.0% | |
Other values (14) | 14 | 0.2% | |
(Missing) | 1633 | 19.1% |
mogree
Categorical
Distinct count | 7 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 31.3% |
Missing (n) | 2679 |
1.0 | 94 |
---|---|
2.0 | 54 |
Other values (3) | 14 |
(Missing) |
Value | Count | Frequency (%) | |
5716 | 66.8% | ||
1.0 | 94 | 1.1% | |
2.0 | 54 | 0.6% | |
1 | 6 | 0.1% | |
2 | 4 | 0.0% | |
3.0 | 4 | 0.0% | |
(Missing) | 2679 | 31.3% |
monsyr
Numeric
Distinct count | 20 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 12.3% |
Missing (n) | 1051 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 8.3702 |
---|---|
Minimum | 0 |
Maximum | 12 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 2 |
Q1 | 5 |
Median | 9 |
Q3 | 12 |
95-th percentile | 12 |
Maximum | 12 |
Range | 12 |
Interquartile range | 7 |
Descriptive statistics
Standard deviation | 3.7665 |
---|---|
Coef of variation | 0.44999 |
Kurtosis | -1.2037 |
Mean | 8.3702 |
MAD | 3.3708 |
Skewness | -0.51051 |
Sum | 62827 |
Variance | 14.186 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
12.0 | 3051 | 35.7% | |
6.0 | 802 | 9.4% | |
3.0 | 538 | 6.3% | |
8.0 | 513 | 6.0% | |
2.0 | 451 | 5.3% | |
10.0 | 389 | 4.5% | |
4.0 | 348 | 4.1% | |
9.0 | 306 | 3.6% | |
11.0 | 285 | 3.3% | |
5.0 | 282 | 3.3% | |
Other values (9) | 541 | 6.3% | |
(Missing) | 1051 | 12.3% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 2 | 0.0% | |
0.06 | 1 | 0.0% | |
0.07 | 1 | 0.0% | |
0.1 | 1 | 0.0% | |
0.29998779296875 | 1 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
8.0 | 513 | 6.0% | |
9.0 | 306 | 3.6% | |
10.0 | 389 | 4.5% | |
11.0 | 285 | 3.3% | |
12.0 | 3051 | 35.7% |
monsyrs
Categorical
Distinct count | 15 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 47.8% |
Missing (n) | 4087 |
12.0 | 270 |
---|---|
6.0 | 32 |
Other values (11) | 118 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
12.0 | 270 | 3.2% | |
6.0 | 32 | 0.4% | |
10.0 | 31 | 0.4% | |
11.0 | 22 | 0.3% | |
8.0 | 12 | 0.1% | |
4.0 | 10 | 0.1% | |
9.0 | 9 | 0.1% | |
7.0 | 9 | 0.1% | |
3.0 | 7 | 0.1% | |
Other values (4) | 18 | 0.2% | |
(Missing) | 4087 | 47.8% |
mouspl
Categorical
Distinct count | 30 |
---|---|
Unique (%) | 0.4% |
Missing (%) | 51.3% |
Missing (n) | 4390 |
4480.0 | 25 |
---|---|
7777.0 | 16 |
Other values (26) | 76 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 25 | 0.3% | |
7777.0 | 16 | 0.2% | |
7320.0 | 15 | 0.2% | |
6160.0 | 6 | 0.1% | |
5945.0 | 6 | 0.1% | |
7400.0 | 5 | 0.1% | |
1920.0 | 4 | 0.0% | |
7360.0 | 4 | 0.0% | |
1600.0 | 3 | 0.0% | |
Other values (19) | 33 | 0.4% | |
(Missing) | 4390 | 51.3% |
mousst
Categorical
Distinct count | 22 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 50.9% |
Missing (n) | 4352 |
105.0 | 71 |
---|---|
199.0 | 27 |
Other values (18) | 57 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 71 | 0.8% | |
199.0 | 27 | 0.3% | |
144.0 | 15 | 0.2% | |
110.0 | 7 | 0.1% | |
139.0 | 6 | 0.1% | |
133.0 | 4 | 0.0% | |
114.0 | 4 | 0.0% | |
113.0 | 3 | 0.0% | |
103.0 | 3 | 0.0% | |
Other values (11) | 15 | 0.2% | |
(Missing) | 4352 | 50.9% |
moyrgr
Categorical
Distinct count | 36 |
---|---|
Unique (%) | 0.4% |
Missing (%) | 32.4% |
Missing (n) | 2774 |
1999.0 | 10 |
---|---|
1995.0 | 5 |
Other values (32) | 52 |
(Missing) |
Value | Count | Frequency (%) | |
5716 | 66.8% | ||
1999.0 | 10 | 0.1% | |
1995.0 | 5 | 0.1% | |
1998.0 | 4 | 0.0% | |
1970.0 | 4 | 0.0% | |
1988.0 | 4 | 0.0% | |
1983.0 | 3 | 0.0% | |
1997.0 | 3 | 0.0% | |
1978.0 | 2 | 0.0% | |
1973.0 | 2 | 0.0% | |
Other values (25) | 30 | 0.4% | |
(Missing) | 2774 | 32.4% |
mxhealth
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 4.3% |
Missing (n) | 370 |
3 | 856 |
---|---|
4 | 201 |
Other values (6) | 415 |
(Missing) | 370 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
3 | 856 | 10.0% | |
4 | 201 | 2.3% | |
3.0 | 163 | 1.9% | |
2 | 115 | 1.3% | |
4.0 | 63 | 0.7% | |
1 | 38 | 0.4% | |
2.0 | 31 | 0.4% | |
1.0 | 5 | 0.1% | |
(Missing) | 370 | 4.3% |
neevus
Highly correlated
This variable is highly correlated with neinus
and should be ignored for analysis
Correlation | 0.92759 |
---|
neinus
Numeric
Distinct count | 44 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 2.0% |
Missing (n) | 173 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 4.4645 |
---|---|
Minimum | 0 |
Maximum | 100 |
Zeros (%) | 45.6% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 1 |
Q3 | 6 |
95-th percentile | 20 |
Maximum | 100 |
Range | 100 |
Interquartile range | 6 |
Descriptive statistics
Standard deviation | 7.8352 |
---|---|
Coef of variation | 1.755 |
Kurtosis | 24.569 |
Mean | 4.4645 |
MAD | 5.0671 |
Skewness | 3.8163 |
Sum | 37430 |
Variance | 61.39 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 3906 | 45.6% | |
2.0 | 522 | 6.1% | |
1.0 | 475 | 5.6% | |
4.0 | 460 | 5.4% | |
3.0 | 449 | 5.2% | |
10.0 | 378 | 4.4% | |
5.0 | 373 | 4.4% | |
6.0 | 306 | 3.6% | |
20.0 | 252 | 2.9% | |
8.0 | 232 | 2.7% | |
Other values (33) | 1031 | 12.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 3906 | 45.6% | |
1.0 | 475 | 5.6% | |
2.0 | 522 | 6.1% | |
3.0 | 449 | 5.2% | |
4.0 | 460 | 5.4% |
Maximum 5 values
Value | Count | Frequency (%) | |
60.0 | 7 | 0.1% | |
65.0 | 1 | 0.0% | |
70.0 | 4 | 0.0% | |
80.0 | 4 | 0.0% | |
100.0 | 4 | 0.0% |
nerves
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 8 |
2 | |
---|---|
2.0 | 357 |
Other values (2) | 107 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
2 | 1370 | 16.0% | |
2.0 | 357 | 4.2% | |
1 | 101 | 1.2% | |
1.0 | 6 | 0.1% | |
(Missing) | 8 | 0.1% |
occ
Numeric
Distinct count | 122 |
---|---|
Unique (%) | 1.4% |
Missing (%) | 0.6% |
Missing (n) | 54 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 464.88 |
---|---|
Minimum | 10 |
Maximum | 831 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 10 |
---|---|
5-th percentile | 50 |
Q1 | 410 |
Median | 520 |
Q3 | 549 |
95-th percentile | 810 |
Maximum | 831 |
Range | 821 |
Interquartile range | 139 |
Descriptive statistics
Standard deviation | 206.81 |
---|---|
Coef of variation | 0.44487 |
Kurtosis | 0.044961 |
Mean | 464.88 |
MAD | 156.6 |
Skewness | -0.55691 |
Sum | 3952900 |
Variance | 42771 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
410.0 | 2514 | 29.4% | |
549.0 | 507 | 5.9% | |
529.0 | 403 | 4.7% | |
710.0 | 374 | 4.4% | |
713.0 | 297 | 3.5% | |
526.0 | 276 | 3.2% | |
524.0 | 241 | 2.8% | |
10.0 | 229 | 2.7% | |
546.0 | 214 | 2.5% | |
50.0 | 203 | 2.4% | |
Other values (111) | 3245 | 37.9% |
Minimum 5 values
Value | Count | Frequency (%) | |
10.0 | 229 | 2.7% | |
20.0 | 160 | 1.9% | |
21.0 | 1 | 0.0% | |
30.0 | 17 | 0.2% | |
42.0 | 5 | 0.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
815.0 | 3 | 0.0% | |
819.0 | 76 | 0.9% | |
820.0 | 39 | 0.5% | |
830.0 | 78 | 0.9% | |
831.0 | 3 | 0.0% |
paistp1
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 3.0% |
Missing (n) | 253 |
1 | |
---|---|
1.0 | |
Other values (2) |
Value | Count | Frequency (%) | |
3354 | 39.2% | ||
1 | 1656 | 19.4% | |
1.0 | 1370 | 16.0% | |
2 | 1010 | 11.8% | |
2.0 | 914 | 10.7% | |
(Missing) | 253 | 3.0% |
paistrip
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 3.5% |
Missing (n) | 298 |
1.0 | |
---|---|
1 | |
2.0 | |
Other values (2) |
Value | Count | Frequency (%) | |
1.0 | 2838 | 33.2% | |
1 | 1754 | 20.5% | |
2.0 | 1433 | 16.7% | |
2 | 1239 | 14.5% | |
995 | 11.6% | ||
(Missing) | 298 | 3.5% |
pilevus
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.6% |
Missing (n) | 52 |
0.0 | |
---|---|
1.0 | 236 |
Other values (6) | 201 |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
0.0 | 4018 | 47.0% | |
1.0 | 236 | 2.8% | |
2.0 | 125 | 1.5% | |
0 | 41 | 0.5% | |
4.0 | 21 | 0.2% | |
3.0 | 9 | 0.1% | |
1 | 4 | 0.0% | |
4 | 1 | 0.0% | |
(Missing) | 52 | 0.6% |
pilinus
Categorical
Distinct count | 8 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.2% |
Missing (n) | 20 |
0.0 | |
---|---|
1.0 | 173 |
Other values (4) | 144 |
Value | Count | Frequency (%) | |
0.0 | 4170 | 48.7% | |
4050 | 47.3% | ||
1.0 | 173 | 2.0% | |
2.0 | 98 | 1.1% | |
0 | 43 | 0.5% | |
1 | 2 | 0.0% | |
2 | 1 | 0.0% | |
(Missing) | 20 | 0.2% |
placebrn
Numeric
Distinct count | 150 |
---|---|
Unique (%) | 1.8% |
Missing (%) | 2.2% |
Missing (n) | 186 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 11.639 |
---|---|
Minimum | 0 |
Maximum | 906 |
Zeros (%) | 78.9% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 0 |
95-th percentile | 68 |
Maximum | 906 |
Range | 906 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 46.208 |
---|---|
Coef of variation | 3.97 |
Kurtosis | 96.547 |
Mean | 11.639 |
MAD | 19.238 |
Skewness | 8.4163 |
Sum | 97432 |
Variance | 2135.2 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 6748 | 78.9% | |
401.0 | 61 | 0.7% | |
39.0 | 55 | 0.6% | |
1.0 | 53 | 0.6% | |
19.0 | 47 | 0.5% | |
2.0 | 43 | 0.5% | |
33.0 | 41 | 0.5% | |
6.0 | 36 | 0.4% | |
32.0 | 33 | 0.4% | |
21.0 | 31 | 0.4% | |
Other values (139) | 1223 | 14.3% | |
(Missing) | 186 | 2.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 6748 | 78.9% | |
1.0 | 53 | 0.6% | |
2.0 | 43 | 0.5% | |
3.0 | 20 | 0.2% | |
4.0 | 18 | 0.2% |
Maximum 5 values
Value | Count | Frequency (%) | |
537.0 | 1 | 0.0% | |
546.0 | 1 | 0.0% | |
551.0 | 2 | 0.0% | |
903.0 | 2 | 0.0% | |
906.0 | 1 | 0.0% |
reltrip
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 7.2% |
Missing (n) | 615 |
1.0 | |
---|---|
2.0 | |
1 | |
Other values (2) |
Value | Count | Frequency (%) | |
1.0 | 1993 | 23.3% | |
2.0 | 1950 | 22.8% | |
1 | 1593 | 18.6% | |
2 | 1411 | 16.5% | |
995 | 11.6% | ||
(Missing) | 615 | 7.2% |
reltrip1
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 4.1% |
Missing (n) | 347 |
2 | |
---|---|
1.0 | |
Other values (2) |
Value | Count | Frequency (%) | |
3354 | 39.2% | ||
2 | 1325 | 15.5% | |
1.0 | 1317 | 15.4% | |
1 | 1232 | 14.4% | |
2.0 | 982 | 11.5% | |
(Missing) | 347 | 4.1% |
remit
Numeric
Distinct count | 235 |
---|---|
Unique (%) | 2.7% |
Missing (%) | 14.7% |
Missing (n) | 1256 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 197.29 |
---|---|
Minimum | 0 |
Maximum | 4000 |
Zeros (%) | 22.7% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 104.47 |
Q3 | 300 |
95-th percentile | 600 |
Maximum | 4000 |
Range | 4000 |
Interquartile range | 300 |
Descriptive statistics
Standard deviation | 232.77 |
---|---|
Coef of variation | 1.1799 |
Kurtosis | 18.19 |
Mean | 197.29 |
MAD | 170.67 |
Skewness | 2.5145 |
Sum | 1440400 |
Variance | 54184 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 1940 | 22.7% | |
100.0 | 801 | 9.4% | |
200.0 | 780 | 9.1% | |
300.0 | 549 | 6.4% | |
400.0 | 425 | 5.0% | |
500.0 | 371 | 4.3% | |
150.0 | 359 | 4.2% | |
50.0 | 301 | 3.5% | |
250.0 | 181 | 2.1% | |
600.0 | 177 | 2.1% | |
Other values (224) | 1417 | 16.6% | |
(Missing) | 1256 | 14.7% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 1940 | 22.7% | |
1.0 | 1 | 0.0% | |
2.0 | 2 | 0.0% | |
3.0 | 1 | 0.0% | |
5.0 | 2 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
1500.0 | 1 | 0.0% | |
1800.0 | 1 | 0.0% | |
2000.0 | 2 | 0.0% | |
3500.0 | 1 | 0.0% | |
4000.0 | 1 | 0.0% |
remit1
Numeric
Distinct count | 17 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 39.5% |
Missing (n) | 3379 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 5.1317 |
---|---|
Minimum | 1 |
Maximum | 16 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 11 |
95-th percentile | 12 |
Maximum | 16 |
Range | 15 |
Interquartile range | 10 |
Descriptive statistics
Standard deviation | 4.9842 |
---|---|
Coef of variation | 0.97126 |
Kurtosis | -1.4837 |
Mean | 5.1317 |
MAD | 4.7625 |
Skewness | 0.53945 |
Sum | 26572 |
Variance | 24.843 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 2636 | 30.8% | |
11.0 | 1467 | 17.1% | |
2.0 | 414 | 4.8% | |
12.0 | 199 | 2.3% | |
8.0 | 151 | 1.8% | |
16.0 | 77 | 0.9% | |
15.0 | 71 | 0.8% | |
3.0 | 64 | 0.7% | |
10.0 | 36 | 0.4% | |
9.0 | 15 | 0.2% | |
Other values (6) | 48 | 0.6% | |
(Missing) | 3379 | 39.5% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 2636 | 30.8% | |
2.0 | 414 | 4.8% | |
3.0 | 64 | 0.7% | |
4.0 | 5 | 0.1% | |
5.0 | 2 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
12.0 | 199 | 2.3% | |
13.0 | 4 | 0.0% | |
14.0 | 9 | 0.1% | |
15.0 | 71 | 0.8% | |
16.0 | 77 | 0.9% |
rent
Numeric
Distinct count | 275 |
---|---|
Unique (%) | 3.2% |
Missing (%) | 21.0% |
Missing (n) | 1794 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 178.6 |
---|---|
Minimum | 0 |
Maximum | 6000 |
Zeros (%) | 26.5% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 80 |
Q3 | 200 |
95-th percentile | 720 |
Maximum | 6000 |
Range | 6000 |
Interquartile range | 200 |
Descriptive statistics
Standard deviation | 306.05 |
---|---|
Coef of variation | 1.7136 |
Kurtosis | 47.572 |
Mean | 178.6 |
MAD | 188.06 |
Skewness | 4.8365 |
Sum | 1207900 |
Variance | 93669 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 2271 | 26.5% | |
100.0 | 615 | 7.2% | |
200.0 | 363 | 4.2% | |
150.0 | 280 | 3.3% | |
300.0 | 267 | 3.1% | |
50.0 | 232 | 2.7% | |
80.0 | 185 | 2.2% | |
400.0 | 157 | 1.8% | |
250.0 | 157 | 1.8% | |
120.0 | 131 | 1.5% | |
Other values (264) | 2105 | 24.6% | |
(Missing) | 1794 | 21.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 2271 | 26.5% | |
1.0 | 1 | 0.0% | |
2.0 | 3 | 0.0% | |
2.5 | 1 | 0.0% | |
3.0 | 1 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
3000.0 | 3 | 0.0% | |
3200.0 | 2 | 0.0% | |
4500.0 | 1 | 0.0% | |
5000.0 | 1 | 0.0% | |
6000.0 | 1 | 0.0% |
rowner
Categorical
Distinct count | 15 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 10.0% |
Missing (n) | 852 |
1.0 | |
---|---|
5.0 | 428 |
Other values (11) | 583 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 2644 | 30.9% | |
5.0 | 428 | 5.0% | |
3.0 | 192 | 2.2% | |
6.0 | 120 | 1.4% | |
7.0 | 94 | 1.1% | |
4.0 | 85 | 1.0% | |
8.0 | 36 | 0.4% | |
1 | 23 | 0.3% | |
2.0 | 22 | 0.3% | |
Other values (4) | 11 | 0.1% | |
(Missing) | 852 | 10.0% |
rowners
Categorical
Distinct count | 11 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 48.2% |
Missing (n) | 4128 |
1.0 | 233 |
---|---|
5.0 | 61 |
Other values (7) | 85 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 233 | 2.7% | |
5.0 | 61 | 0.7% | |
3.0 | 31 | 0.4% | |
7.0 | 16 | 0.2% | |
6.0 | 13 | 0.2% | |
8.0 | 9 | 0.1% | |
4.0 | 9 | 0.1% | |
1 | 5 | 0.1% | |
2.0 | 2 | 0.0% | |
(Missing) | 4128 | 48.2% |
rsuper
Categorical
Distinct count | 16 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 12.6% |
Missing (n) | 1075 |
1.0 | |
---|---|
5.0 | |
Other values (12) | 672 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 1492 | 17.4% | |
5.0 | 1268 | 14.8% | |
6.0 | 196 | 2.3% | |
4.0 | 180 | 2.1% | |
3.0 | 125 | 1.5% | |
7.0 | 69 | 0.8% | |
2.0 | 57 | 0.7% | |
5 | 14 | 0.2% | |
1 | 11 | 0.1% | |
Other values (5) | 20 | 0.2% | |
(Missing) | 1075 | 12.6% |
rsupers
Categorical
Distinct count | 12 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 48.5% |
Missing (n) | 4146 |
1.0 | 147 |
---|---|
5.0 | 117 |
Other values (8) | 97 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 147 | 1.7% | |
5.0 | 117 | 1.4% | |
6.0 | 33 | 0.4% | |
3.0 | 21 | 0.2% | |
4.0 | 14 | 0.2% | |
7.0 | 13 | 0.2% | |
2.0 | 9 | 0.1% | |
1 | 4 | 0.0% | |
8.0 | 2 | 0.0% | |
(Missing) | 4146 | 48.5% |
savings
Numeric
Distinct count | 167 |
---|---|
Unique (%) | 2.0% |
Missing (%) | 30.4% |
Missing (n) | 2604 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 132.74 |
---|---|
Minimum | 0 |
Maximum | 3000 |
Zeros (%) | 33.9% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 13 |
Q3 | 200 |
95-th percentile | 600 |
Maximum | 3000 |
Range | 3000 |
Interquartile range | 200 |
Descriptive statistics
Standard deviation | 223.59 |
---|---|
Coef of variation | 1.6844 |
Kurtosis | 15.337 |
Mean | 132.74 |
MAD | 155.8 |
Skewness | 2.9215 |
Sum | 790190 |
Variance | 49991 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 2897 | 33.9% | |
100.0 | 533 | 6.2% | |
200.0 | 409 | 4.8% | |
300.0 | 263 | 3.1% | |
50.0 | 243 | 2.8% | |
500.0 | 241 | 2.8% | |
400.0 | 159 | 1.9% | |
150.0 | 153 | 1.8% | |
1000.0 | 95 | 1.1% | |
600.0 | 84 | 1.0% | |
Other values (156) | 876 | 10.2% | |
(Missing) | 2604 | 30.4% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 2897 | 33.9% | |
1.0 | 5 | 0.1% | |
2.0 | 3 | 0.0% | |
3.0 | 1 | 0.0% | |
4.0 | 2 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
1000.0 | 95 | 1.1% | |
1500.0 | 5 | 0.1% | |
1800.0 | 1 | 0.0% | |
2000.0 | 2 | 0.0% | |
3000.0 | 2 | 0.0% |
savings1
Numeric
Distinct count | 17 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 46.6% |
Missing (n) | 3987 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 5.9681 |
---|---|
Minimum | 1 |
Maximum | 16 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 3 |
Q3 | 11 |
95-th percentile | 15 |
Maximum | 16 |
Range | 15 |
Interquartile range | 10 |
Descriptive statistics
Standard deviation | 5.2864 |
---|---|
Coef of variation | 0.88578 |
Kurtosis | -1.3178 |
Mean | 5.9681 |
MAD | 4.893 |
Skewness | 0.52901 |
Sum | 27274 |
Variance | 27.946 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 1467 | 17.1% | |
2.0 | 798 | 9.3% | |
11.0 | 692 | 8.1% | |
8.0 | 263 | 3.1% | |
15.0 | 261 | 3.1% | |
12.0 | 190 | 2.2% | |
3.0 | 183 | 2.1% | |
16.0 | 167 | 2.0% | |
14.0 | 165 | 1.9% | |
9.0 | 112 | 1.3% | |
Other values (6) | 272 | 3.2% | |
(Missing) | 3987 | 46.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 1467 | 17.1% | |
2.0 | 798 | 9.3% | |
3.0 | 183 | 2.1% | |
4.0 | 85 | 1.0% | |
5.0 | 16 | 0.2% |
Maximum 5 values
Value | Count | Frequency (%) | |
12.0 | 190 | 2.2% | |
13.0 | 27 | 0.3% | |
14.0 | 165 | 1.9% | |
15.0 | 261 | 3.1% | |
16.0 | 167 | 2.0% |
savretrn
Numeric
Distinct count | 247 |
---|---|
Unique (%) | 2.9% |
Missing (%) | 25.3% |
Missing (n) | 2163 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 903.08 |
---|---|
Minimum | 0 |
Maximum | 12000 |
Zeros (%) | 29.5% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 200 |
Q3 | 1000 |
95-th percentile | 4000 |
Maximum | 12000 |
Range | 12000 |
Interquartile range | 1000 |
Descriptive statistics
Standard deviation | 1636.9 |
---|---|
Coef of variation | 1.8126 |
Kurtosis | 11.128 |
Mean | 903.08 |
MAD | 1047.4 |
Skewness | 3.0754 |
Sum | 5774300 |
Variance | 2679600 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 2527 | 29.5% | |
1000.0 | 446 | 5.2% | |
2000.0 | 339 | 4.0% | |
500.0 | 270 | 3.2% | |
200.0 | 233 | 2.7% | |
300.0 | 231 | 2.7% | |
3000.0 | 213 | 2.5% | |
100.0 | 172 | 2.0% | |
1500.0 | 167 | 2.0% | |
600.0 | 158 | 1.8% | |
Other values (236) | 1638 | 19.1% | |
(Missing) | 2163 | 25.3% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 2527 | 29.5% | |
1.0 | 1 | 0.0% | |
6.0 | 2 | 0.0% | |
7.0 | 1 | 0.0% | |
8.0 | 3 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
8768.08 | 1 | 0.0% | |
9000.0 | 7 | 0.1% | |
9443.18 | 1 | 0.0% | |
10000.0 | 54 | 0.6% | |
12000.0 | 1 | 0.0% |
sbdoc1
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 9.1% |
Missing (n) | 779 |
1 | 281 |
---|---|
3 | 277 |
Other values (6) | 330 |
(Missing) | 779 |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 281 | 3.3% | |
3 | 277 | 3.2% | |
2 | 147 | 1.7% | |
3.0 | 80 | 0.9% | |
1.0 | 73 | 0.9% | |
2.0 | 16 | 0.2% | |
4 | 9 | 0.1% | |
4.0 | 5 | 0.1% | |
(Missing) | 779 | 9.1% |
sbdoc10
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 19.4% |
Missing (n) | 1662 |
1 | 4 |
---|---|
2 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 4 | 0.0% | |
2 | 1 | 0.0% | |
(Missing) | 1662 | 19.4% |
sbdoc11
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 19.4% |
Missing (n) | 1663 |
1 | 3 |
---|---|
4 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 3 | 0.0% | |
4 | 1 | 0.0% | |
(Missing) | 1663 | 19.4% |
sbdoc12
Categorical
Distinct count | 2 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 19.5% |
Missing (n) | 1667 |
(Missing) |
---|
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
(Missing) | 1667 | 19.5% |
sbdoc2
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 12.8% |
Missing (n) | 1094 |
1 | 194 |
---|---|
3 | 164 |
Other values (6) | 215 |
(Missing) | 1094 |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 194 | 2.3% | |
3 | 164 | 1.9% | |
2 | 97 | 1.1% | |
3.0 | 53 | 0.6% | |
1.0 | 45 | 0.5% | |
2.0 | 11 | 0.1% | |
4 | 8 | 0.1% | |
4.0 | 1 | 0.0% | |
(Missing) | 1094 | 12.8% |
sbdoc3
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 15.2% |
Missing (n) | 1302 |
1 | 126 |
---|---|
3 | 106 |
Other values (6) | 133 |
(Missing) | 1302 |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 126 | 1.5% | |
3 | 106 | 1.2% | |
2 | 54 | 0.6% | |
3.0 | 40 | 0.5% | |
1.0 | 28 | 0.3% | |
2.0 | 6 | 0.1% | |
4 | 4 | 0.0% | |
4.0 | 1 | 0.0% | |
(Missing) | 1302 | 15.2% |
sbdoc4
Categorical
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 16.8% |
Missing (n) | 1441 |
1 | 92 |
---|---|
3 | 58 |
Other values (5) | 76 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 92 | 1.1% | |
3 | 58 | 0.7% | |
2 | 34 | 0.4% | |
3.0 | 23 | 0.3% | |
1.0 | 11 | 0.1% | |
2.0 | 5 | 0.1% | |
4 | 3 | 0.0% | |
(Missing) | 1441 | 16.8% |
sbdoc5
Categorical
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 17.7% |
Missing (n) | 1518 |
1 | 57 |
---|---|
3 | 44 |
Other values (5) | 48 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 57 | 0.7% | |
3 | 44 | 0.5% | |
2 | 25 | 0.3% | |
3.0 | 11 | 0.1% | |
1.0 | 7 | 0.1% | |
2.0 | 3 | 0.0% | |
4 | 2 | 0.0% | |
(Missing) | 1518 | 17.7% |
sbdoc6
Categorical
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 18.6% |
Missing (n) | 1588 |
1 | 28 |
---|---|
3 | 20 |
Other values (5) | 31 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 28 | 0.3% | |
3 | 20 | 0.2% | |
2 | 14 | 0.2% | |
3.0 | 8 | 0.1% | |
4 | 4 | 0.0% | |
1.0 | 3 | 0.0% | |
2.0 | 2 | 0.0% | |
(Missing) | 1588 | 18.6% |
sbdoc7
Categorical
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 18.9% |
Missing (n) | 1613 |
1 | 21 |
---|---|
3 | 12 |
Other values (5) | 21 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 21 | 0.2% | |
3 | 12 | 0.1% | |
2 | 7 | 0.1% | |
3.0 | 6 | 0.1% | |
1.0 | 4 | 0.0% | |
4 | 3 | 0.0% | |
2.0 | 1 | 0.0% | |
(Missing) | 1613 | 18.9% |
sbdoc8
Categorical
Distinct count | 8 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 19.2% |
Missing (n) | 1641 |
3 | 8 |
---|---|
1 | 8 |
Other values (4) | 10 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
3 | 8 | 0.1% | |
1 | 8 | 0.1% | |
2 | 6 | 0.1% | |
3.0 | 2 | 0.0% | |
4 | 1 | 0.0% | |
1.0 | 1 | 0.0% | |
(Missing) | 1641 | 19.2% |
sbdoc9
Categorical
Distinct count | 5 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 19.3% |
Missing (n) | 1655 |
1 | 7 |
---|---|
2 | 4 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1 | 7 | 0.1% | |
2 | 4 | 0.0% | |
4 | 1 | 0.0% | |
(Missing) | 1655 | 19.3% |
sbdoyr1
Categorical
Distinct count | 56 |
---|---|
Unique (%) | 0.7% |
Missing (%) | 17.6% |
Missing (n) | 1505 |
1987 | 12 |
---|---|
1986 | 12 |
Other values (52) | 138 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1987 | 12 | 0.1% | |
1986 | 12 | 0.1% | |
1988 | 10 | 0.1% | |
2004 | 8 | 0.1% | |
1989 | 8 | 0.1% | |
1990 | 8 | 0.1% | |
1985 | 6 | 0.1% | |
2002 | 5 | 0.1% | |
2007 | 5 | 0.1% | |
Other values (45) | 88 | 1.0% | |
(Missing) | 1505 | 17.6% |
sbdoyr10
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 19.5% |
Missing (n) | 1665 |
1995 | 1 |
---|---|
1987 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1995 | 1 | 0.0% | |
1987 | 1 | 0.0% | |
(Missing) | 1665 | 19.5% |
sbdoyr11
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 19.5% |
Missing (n) | 1665 |
1995 | 1 |
---|---|
1987 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1995 | 1 | 0.0% | |
1987 | 1 | 0.0% | |
(Missing) | 1665 | 19.5% |
sbdoyr12
Categorical
Distinct count | 2 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 19.5% |
Missing (n) | 1667 |
(Missing) |
---|
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
(Missing) | 1667 | 19.5% |
sbdoyr2
Categorical
Distinct count | 40 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 18.4% |
Missing (n) | 1577 |
1987 | 7 |
---|---|
1988 | 6 |
Other values (36) | 77 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1987 | 7 | 0.1% | |
1988 | 6 | 0.1% | |
1986.0 | 5 | 0.1% | |
1989 | 5 | 0.1% | |
1986 | 4 | 0.0% | |
1990 | 4 | 0.0% | |
2004 | 4 | 0.0% | |
1987.0 | 3 | 0.0% | |
1989.0 | 3 | 0.0% | |
Other values (29) | 49 | 0.6% | |
(Missing) | 1577 | 18.4% |
sbdoyr3
Categorical
Distinct count | 33 |
---|---|
Unique (%) | 0.4% |
Missing (%) | 18.8% |
Missing (n) | 1611 |
1987 | 6 |
---|---|
1988 | 5 |
Other values (29) | 45 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1987 | 6 | 0.1% | |
1988 | 5 | 0.1% | |
1989.0 | 4 | 0.0% | |
2004 | 3 | 0.0% | |
1989 | 3 | 0.0% | |
1985 | 3 | 0.0% | |
1986.0 | 3 | 0.0% | |
1980 | 2 | 0.0% | |
1990 | 2 | 0.0% | |
Other values (22) | 25 | 0.3% | |
(Missing) | 1611 | 18.8% |
sbdoyr4
Categorical
Distinct count | 26 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 19.1% |
Missing (n) | 1634 |
1990 | 3 |
---|---|
1988 | 3 |
Other values (22) | 27 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1990 | 3 | 0.0% | |
1988 | 3 | 0.0% | |
1987 | 3 | 0.0% | |
1989 | 2 | 0.0% | |
1985 | 2 | 0.0% | |
2002 | 2 | 0.0% | |
2004 | 1 | 0.0% | |
1980 | 1 | 0.0% | |
1987.0 | 1 | 0.0% | |
Other values (15) | 15 | 0.2% | |
(Missing) | 1634 | 19.1% |
sbdoyr5
Categorical
Distinct count | 21 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 19.2% |
Missing (n) | 1645 |
1988 | 2 |
---|---|
1990 | 2 |
Other values (17) | 18 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1988 | 2 | 0.0% | |
1990 | 2 | 0.0% | |
1987 | 2 | 0.0% | |
1987.0 | 1 | 0.0% | |
1988.0 | 1 | 0.0% | |
2014.0 | 1 | 0.0% | |
1977 | 1 | 0.0% | |
1984 | 1 | 0.0% | |
1985 | 1 | 0.0% | |
Other values (10) | 10 | 0.1% | |
(Missing) | 1645 | 19.2% |
sbdoyr6
Categorical
Distinct count | 13 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 19.3% |
Missing (n) | 1654 |
1990 | 2 |
---|---|
1987 | 2 |
Other values (9) | 9 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1990 | 2 | 0.0% | |
1987 | 2 | 0.0% | |
2009 | 1 | 0.0% | |
2005 | 1 | 0.0% | |
1991 | 1 | 0.0% | |
1989 | 1 | 0.0% | |
1988 | 1 | 0.0% | |
1984 | 1 | 0.0% | |
1988.0 | 1 | 0.0% | |
Other values (2) | 2 | 0.0% | |
(Missing) | 1654 | 19.3% |
sbdoyr7
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 19.4% |
Missing (n) | 1657 |
2005 | 2 |
---|---|
1987 | 2 |
Other values (6) | 6 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
2005 | 2 | 0.0% | |
1987 | 2 | 0.0% | |
1991 | 1 | 0.0% | |
1990 | 1 | 0.0% | |
1988 | 1 | 0.0% | |
1984 | 1 | 0.0% | |
1988.0 | 1 | 0.0% | |
1987.0 | 1 | 0.0% | |
(Missing) | 1657 | 19.4% |
sbdoyr8
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 19.4% |
Missing (n) | 1662 |
1987 | 2 |
---|---|
1991 | 1 |
Other values (2) | 2 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1987 | 2 | 0.0% | |
1991 | 1 | 0.0% | |
1990 | 1 | 0.0% | |
1988 | 1 | 0.0% | |
(Missing) | 1662 | 19.4% |
sbdoyr9
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 19.4% |
Missing (n) | 1662 |
1987 | 2 |
---|---|
1998 | 1 |
Other values (2) | 2 |
(Missing) |
Value | Count | Frequency (%) | |
6890 | 80.5% | ||
1987 | 2 | 0.0% | |
1998 | 1 | 0.0% | |
1990 | 1 | 0.0% | |
1988 | 1 | 0.0% | |
(Missing) | 1662 | 19.4% |
sbgree1
Categorical
Distinct count | 8 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 14.5% |
Missing (n) | 1242 |
1.0 | 638 |
---|---|
2.0 | 492 |
Other values (4) | 468 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 638 | 7.5% | |
2.0 | 492 | 5.7% | |
2 | 229 | 2.7% | |
1 | 175 | 2.0% | |
3.0 | 49 | 0.6% | |
3 | 15 | 0.2% | |
(Missing) | 1242 | 14.5% |
sbgree10
Categorical
Distinct count | 7 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 32.9% |
Missing (n) | 2816 |
1.0 | 14 |
---|---|
2.0 | 6 |
Other values (3) | 4 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 14 | 0.2% | |
2.0 | 6 | 0.1% | |
2 | 2 | 0.0% | |
1 | 1 | 0.0% | |
3.0 | 1 | 0.0% | |
(Missing) | 2816 | 32.9% |
sbgree11
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 33.0% |
Missing (n) | 2826 |
1.0 | 7 |
---|---|
2.0 | 5 |
Other values (2) | 2 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 7 | 0.1% | |
2.0 | 5 | 0.1% | |
2 | 1 | 0.0% | |
3.0 | 1 | 0.0% | |
(Missing) | 2826 | 33.0% |
sbgree12
Categorical
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 33.2% |
Missing (n) | 2838 |
1.0 | 2 |
---|---|
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 2 | 0.0% | |
(Missing) | 2838 | 33.2% |
sbgree2
Categorical
Distinct count | 8 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 21.0% |
Missing (n) | 1796 |
1.0 | 403 |
---|---|
2.0 | 357 |
Other values (4) | 284 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 403 | 4.7% | |
2.0 | 357 | 4.2% | |
2 | 151 | 1.8% | |
1 | 97 | 1.1% | |
3.0 | 26 | 0.3% | |
3 | 10 | 0.1% | |
(Missing) | 1796 | 21.0% |
sbgree3
Categorical
Distinct count | 8 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 25.7% |
Missing (n) | 2202 |
1.0 | 249 |
---|---|
2.0 | 226 |
Other values (4) | 163 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 249 | 2.9% | |
2.0 | 226 | 2.6% | |
2 | 84 | 1.0% | |
1 | 59 | 0.7% | |
3.0 | 14 | 0.2% | |
3 | 6 | 0.1% | |
(Missing) | 2202 | 25.7% |
sbgree4
Categorical
Distinct count | 8 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 28.8% |
Missing (n) | 2464 |
1.0 | 174 |
---|---|
2.0 | 129 |
Other values (4) | 73 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 174 | 2.0% | |
2.0 | 129 | 1.5% | |
1 | 33 | 0.4% | |
2 | 29 | 0.3% | |
3.0 | 8 | 0.1% | |
3 | 3 | 0.0% | |
(Missing) | 2464 | 28.8% |
sbgree5
Categorical
Distinct count | 8 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 30.5% |
Missing (n) | 2613 |
1.0 | 109 |
---|---|
2.0 | 79 |
Other values (4) | 39 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 109 | 1.3% | |
2.0 | 79 | 0.9% | |
2 | 19 | 0.2% | |
1 | 13 | 0.2% | |
3.0 | 5 | 0.1% | |
3 | 2 | 0.0% | |
(Missing) | 2613 | 30.5% |
sbgree6
Categorical
Distinct count | 8 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 31.6% |
Missing (n) | 2705 |
1.0 | 67 |
---|---|
2.0 | 44 |
Other values (4) | 24 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 67 | 0.8% | |
2.0 | 44 | 0.5% | |
2 | 11 | 0.1% | |
1 | 8 | 0.1% | |
3.0 | 3 | 0.0% | |
3 | 2 | 0.0% | |
(Missing) | 2705 | 31.6% |
sbgree7
Categorical
Distinct count | 7 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 32.1% |
Missing (n) | 2750 |
1.0 | 39 |
---|---|
2.0 | 36 |
Other values (3) | 15 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 39 | 0.5% | |
2.0 | 36 | 0.4% | |
2 | 7 | 0.1% | |
1 | 6 | 0.1% | |
3.0 | 2 | 0.0% | |
(Missing) | 2750 | 32.1% |
sbgree8
Categorical
Distinct count | 7 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 32.6% |
Missing (n) | 2786 |
1.0 | 24 |
---|---|
2.0 | 20 |
Other values (3) | 10 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 24 | 0.3% | |
2.0 | 20 | 0.2% | |
2 | 7 | 0.1% | |
1 | 2 | 0.0% | |
3.0 | 1 | 0.0% | |
(Missing) | 2786 | 32.6% |
sbgree9
Categorical
Distinct count | 7 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 32.8% |
Missing (n) | 2805 |
1.0 | 19 |
---|---|
2.0 | 10 |
Other values (3) | 6 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1.0 | 19 | 0.2% | |
2.0 | 10 | 0.1% | |
2 | 3 | 0.0% | |
3.0 | 2 | 0.0% | |
1 | 1 | 0.0% | |
(Missing) | 2805 | 32.8% |
sbilevus
Numeric
Distinct count | 24 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 5.4% |
Missing (n) | 460 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.7369 |
---|---|
Minimum | 0 |
Maximum | 40 |
Zeros (%) | 46.3% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 1 |
Q3 | 2 |
95-th percentile | 7 |
Maximum | 40 |
Range | 40 |
Interquartile range | 2 |
Descriptive statistics
Standard deviation | 2.7765 |
---|---|
Coef of variation | 1.5985 |
Kurtosis | 13.971 |
Mean | 1.7369 |
MAD | 1.9218 |
Skewness | 2.9044 |
Sum | 14064 |
Variance | 7.709 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 3958 | 46.3% | |
1.0 | 1229 | 14.4% | |
2.0 | 948 | 11.1% | |
3.0 | 579 | 6.8% | |
4.0 | 407 | 4.8% | |
5.0 | 257 | 3.0% | |
6.0 | 207 | 2.4% | |
8.0 | 127 | 1.5% | |
7.0 | 114 | 1.3% | |
10.0 | 97 | 1.1% | |
Other values (13) | 174 | 2.0% | |
(Missing) | 460 | 5.4% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 3958 | 46.3% | |
1.0 | 1229 | 14.4% | |
2.0 | 948 | 11.1% | |
3.0 | 579 | 6.8% | |
4.0 | 407 | 4.8% |
Maximum 5 values
Value | Count | Frequency (%) | |
19.0 | 1 | 0.0% | |
20.0 | 12 | 0.1% | |
22.0 | 7 | 0.1% | |
24.0 | 1 | 0.0% | |
40.0 | 1 | 0.0% |
sbilinus
Numeric
Distinct count | 21 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 0.9% |
Missing (n) | 81 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.2203 |
---|---|
Minimum | 0 |
Maximum | 40 |
Zeros (%) | 57.3% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 2 |
95-th percentile | 6 |
Maximum | 40 |
Range | 40 |
Interquartile range | 2 |
Descriptive statistics
Standard deviation | 2.1555 |
---|---|
Coef of variation | 1.7664 |
Kurtosis | 20.691 |
Mean | 1.2203 |
MAD | 1.4776 |
Skewness | 3.1833 |
Sum | 10343 |
Variance | 4.6463 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 4902 | 57.3% | |
1.0 | 1272 | 14.9% | |
2.0 | 824 | 9.6% | |
3.0 | 520 | 6.1% | |
4.0 | 320 | 3.7% | |
5.0 | 197 | 2.3% | |
6.0 | 144 | 1.7% | |
7.0 | 76 | 0.9% | |
10.0 | 70 | 0.8% | |
8.0 | 63 | 0.7% | |
Other values (10) | 88 | 1.0% | |
(Missing) | 81 | 0.9% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 4902 | 57.3% | |
1.0 | 1272 | 14.9% | |
2.0 | 824 | 9.6% | |
3.0 | 520 | 6.1% | |
4.0 | 320 | 3.7% |
Maximum 5 values
Value | Count | Frequency (%) | |
15.0 | 5 | 0.1% | |
16.0 | 1 | 0.0% | |
18.0 | 1 | 0.0% | |
20.0 | 3 | 0.0% | |
40.0 | 1 | 0.0% |
sblive1
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 37.8% |
Missing (n) | 3235 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.0472 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 1 |
95-th percentile | 1 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.21201 |
---|---|
Coef of variation | 0.20246 |
Kurtosis | 16.269 |
Mean | 1.0472 |
MAD | 0.089877 |
Skewness | 4.2735 |
Sum | 5573 |
Variance | 0.044947 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 5071 | 59.3% | |
2.0 | 251 | 2.9% | |
(Missing) | 3235 | 37.8% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 5071 | 59.3% | |
2.0 | 251 | 2.9% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 5071 | 59.3% | |
2.0 | 251 | 2.9% |
sblive10
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.4% |
Missing (n) | 4485 |
1.0 | 29 |
---|---|
2.0 | 2 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 29 | 0.3% | |
2.0 | 2 | 0.0% | |
(Missing) | 4485 | 52.4% |
sblive11
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.5% |
Missing (n) | 4496 |
1.0 | 18 |
---|---|
2.0 | 2 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 18 | 0.2% | |
2.0 | 2 | 0.0% | |
(Missing) | 4496 | 52.5% |
sblive12
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.7% |
Missing (n) | 4512 |
1.0 | 3 |
---|---|
2.0 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 3 | 0.0% | |
2.0 | 1 | 0.0% | |
(Missing) | 4512 | 52.7% |
sblive2
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 58.1% |
Missing (n) | 4970 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.0326 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 1 |
95-th percentile | 1 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.17766 |
---|---|
Coef of variation | 0.17205 |
Kurtosis | 25.729 |
Mean | 1.0326 |
MAD | 0.063108 |
Skewness | 5.2645 |
Sum | 3704 |
Variance | 0.031563 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 3470 | 40.6% | |
2.0 | 117 | 1.4% | |
(Missing) | 4970 | 58.1% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 3470 | 40.6% | |
2.0 | 117 | 1.4% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 3470 | 40.6% | |
2.0 | 117 | 1.4% |
sblive7
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 51.0% |
Missing (n) | 4361 |
1.0 | 154 |
---|---|
1 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 154 | 1.8% | |
1 | 1 | 0.0% | |
(Missing) | 4361 | 51.0% |
sblive8
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 51.8% |
Missing (n) | 4429 |
1.0 | 85 |
---|---|
2.0 | 2 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 85 | 1.0% | |
2.0 | 2 | 0.0% | |
(Missing) | 4429 | 51.8% |
sblive9
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.2% |
Missing (n) | 4464 |
1.0 | 50 |
---|---|
2.0 | 2 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 50 | 0.6% | |
2.0 | 2 | 0.0% | |
(Missing) | 4464 | 52.2% |
sbmgyr1
Numeric
Distinct count | 103 |
---|---|
Unique (%) | 1.2% |
Missing (%) | 49.2% |
Missing (n) | 4210 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1977.7 |
---|---|
Minimum | 1908 |
Maximum | 2016 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1908 |
---|---|
5-th percentile | 1948 |
Q1 | 1970 |
Median | 1980 |
Q3 | 1989 |
95-th percentile | 2000 |
Maximum | 2016 |
Range | 108 |
Interquartile range | 19 |
Descriptive statistics
Standard deviation | 15.771 |
---|---|
Coef of variation | 0.0079747 |
Kurtosis | 0.60759 |
Mean | 1977.7 |
MAD | 12.295 |
Skewness | -0.75148 |
Sum | 8597000 |
Variance | 248.74 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1980.0 | 208 | 2.4% | |
1978.0 | 162 | 1.9% | |
1990.0 | 160 | 1.9% | |
1985.0 | 154 | 1.8% | |
1970.0 | 148 | 1.7% | |
1986.0 | 131 | 1.5% | |
1989.0 | 125 | 1.5% | |
1975.0 | 121 | 1.4% | |
1988.0 | 117 | 1.4% | |
1976.0 | 110 | 1.3% | |
Other values (92) | 2911 | 34.0% | |
(Missing) | 4210 | 49.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
1908.0 | 1 | 0.0% | |
1909.0 | 1 | 0.0% | |
1912.0 | 1 | 0.0% | |
1914.0 | 1 | 0.0% | |
1915.0 | 1 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
2012.0 | 1 | 0.0% | |
2013.0 | 2 | 0.0% | |
2014.0 | 1 | 0.0% | |
2015.0 | 1 | 0.0% | |
2016.0 | 1 | 0.0% |
sbmgyr10
Categorical
Distinct count | 18 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 52.5% |
Missing (n) | 4493 |
1989.0 | 4 |
---|---|
1968.0 | 3 |
Other values (14) | 16 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1989.0 | 4 | 0.0% | |
1968.0 | 3 | 0.0% | |
1973.0 | 3 | 0.0% | |
1987.0 | 1 | 0.0% | |
1969.0 | 1 | 0.0% | |
1974.0 | 1 | 0.0% | |
1979.0 | 1 | 0.0% | |
1981.0 | 1 | 0.0% | |
1988.0 | 1 | 0.0% | |
Other values (7) | 7 | 0.1% | |
(Missing) | 4493 | 52.5% |
sbmgyr11
Categorical
Distinct count | 12 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 52.6% |
Missing (n) | 4502 |
1989.0 | 4 |
---|---|
1974.0 | 2 |
Other values (8) | 8 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1989.0 | 4 | 0.0% | |
1974.0 | 2 | 0.0% | |
2000.0 | 1 | 0.0% | |
1998.0 | 1 | 0.0% | |
1991.0 | 1 | 0.0% | |
1990.0 | 1 | 0.0% | |
1988.0 | 1 | 0.0% | |
1978.0 | 1 | 0.0% | |
1973.0 | 1 | 0.0% | |
(Missing) | 4502 | 52.6% |
sbmgyr12
Categorical
Distinct count | 5 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 52.7% |
Missing (n) | 4513 |
1995.0 | 1 |
---|---|
1980.0 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1995.0 | 1 | 0.0% | |
1980.0 | 1 | 0.0% | |
1979.0 | 1 | 0.0% | |
(Missing) | 4513 | 52.7% |
sbmgyr7
Categorical
Distinct count | 39 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 51.6% |
Missing (n) | 4415 |
1989.0 | 9 |
---|---|
1970.0 | 6 |
Other values (35) | 86 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1989.0 | 9 | 0.1% | |
1970.0 | 6 | 0.1% | |
1995.0 | 5 | 0.1% | |
1978.0 | 5 | 0.1% | |
1980.0 | 5 | 0.1% | |
1990.0 | 5 | 0.1% | |
1991.0 | 5 | 0.1% | |
1986.0 | 5 | 0.1% | |
1998.0 | 4 | 0.0% | |
Other values (28) | 52 | 0.6% | |
(Missing) | 4415 | 51.6% |
sbmgyr8
Categorical
Distinct count | 29 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 52.1% |
Missing (n) | 4460 |
1989.0 | 5 |
---|---|
1973.0 | 4 |
Other values (25) | 47 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1989.0 | 5 | 0.1% | |
1973.0 | 4 | 0.0% | |
1982.0 | 4 | 0.0% | |
1995.0 | 4 | 0.0% | |
1990.0 | 4 | 0.0% | |
1992.0 | 3 | 0.0% | |
1970.0 | 3 | 0.0% | |
1980.0 | 3 | 0.0% | |
1986.0 | 3 | 0.0% | |
Other values (18) | 23 | 0.3% | |
(Missing) | 4460 | 52.1% |
sbmgyr9
Categorical
Distinct count | 25 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 52.4% |
Missing (n) | 4482 |
1989.0 | 5 |
---|---|
1973.0 | 3 |
Other values (21) | 26 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1989.0 | 5 | 0.1% | |
1973.0 | 3 | 0.0% | |
1968.0 | 2 | 0.0% | |
1980.0 | 2 | 0.0% | |
1988.0 | 2 | 0.0% | |
1986.0 | 2 | 0.0% | |
1994.0 | 2 | 0.0% | |
1991.0 | 1 | 0.0% | |
1976.0 | 1 | 0.0% | |
Other values (14) | 14 | 0.2% | |
(Missing) | 4482 | 52.4% |
sbsex1
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 38.4% |
Missing (n) | 3286 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.1611 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 1 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.36763 |
---|---|
Coef of variation | 0.31663 |
Kurtosis | 1.4029 |
Mean | 1.1611 |
MAD | 0.27025 |
Skewness | 1.8446 |
Sum | 6120 |
Variance | 0.13515 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 4422 | 51.7% | |
2.0 | 849 | 9.9% | |
(Missing) | 3286 | 38.4% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 4422 | 51.7% | |
2.0 | 849 | 9.9% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 4422 | 51.7% | |
2.0 | 849 | 9.9% |
sbsex10
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.4% |
Missing (n) | 4485 |
2.0 | 16 |
---|---|
1.0 | 15 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
2.0 | 16 | 0.2% | |
1.0 | 15 | 0.2% | |
(Missing) | 4485 | 52.4% |
sbsex11
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.5% |
Missing (n) | 4496 |
2.0 | 10 |
---|---|
1.0 | 10 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
2.0 | 10 | 0.1% | |
1.0 | 10 | 0.1% | |
(Missing) | 4496 | 52.5% |
sbsex12
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.7% |
Missing (n) | 4512 |
2.0 | 3 |
---|---|
1.0 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
2.0 | 3 | 0.0% | |
1.0 | 1 | 0.0% | |
(Missing) | 4512 | 52.7% |
sbsex2
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 58.2% |
Missing (n) | 4979 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.2093 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 1 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.40689 |
---|---|
Coef of variation | 0.33646 |
Kurtosis | 0.043531 |
Mean | 1.2093 |
MAD | 0.33103 |
Skewness | 1.4295 |
Sum | 4327 |
Variance | 0.16556 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 2829 | 33.1% | |
2.0 | 749 | 8.8% | |
(Missing) | 4979 | 58.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 2829 | 33.1% | |
2.0 | 749 | 8.8% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 2829 | 33.1% | |
2.0 | 749 | 8.8% |
sbsex7
Categorical
Distinct count | 5 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 51.0% |
Missing (n) | 4361 |
2.0 | 88 |
---|---|
1.0 | 66 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
2.0 | 88 | 1.0% | |
1.0 | 66 | 0.8% | |
2 | 1 | 0.0% | |
(Missing) | 4361 | 51.0% |
sbsex8
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 51.8% |
Missing (n) | 4430 |
2.0 | 47 |
---|---|
1.0 | 39 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
2.0 | 47 | 0.5% | |
1.0 | 39 | 0.5% | |
(Missing) | 4430 | 51.8% |
sbsex9
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.2% |
Missing (n) | 4464 |
1.0 | 27 |
---|---|
2.0 | 25 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 27 | 0.3% | |
2.0 | 25 | 0.3% | |
(Missing) | 4464 | 52.2% |
sbusnw1
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 41.0% |
Missing (n) | 3511 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.3068 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.4612 |
---|---|
Coef of variation | 0.35293 |
Kurtosis | -1.2979 |
Mean | 1.3068 |
MAD | 0.42533 |
Skewness | 0.83824 |
Sum | 6594 |
Variance | 0.21271 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 3498 | 40.9% | |
2.0 | 1548 | 18.1% | |
(Missing) | 3511 | 41.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 3498 | 40.9% | |
2.0 | 1548 | 18.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 3498 | 40.9% | |
2.0 | 1548 | 18.1% |
sbusnw10
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.4% |
Missing (n) | 4487 |
1.0 | 26 |
---|---|
2.0 | 3 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 26 | 0.3% | |
2.0 | 3 | 0.0% | |
(Missing) | 4487 | 52.4% |
sbusnw11
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.6% |
Missing (n) | 4498 |
1.0 | 17 |
---|---|
2.0 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 17 | 0.2% | |
2.0 | 1 | 0.0% | |
(Missing) | 4498 | 52.6% |
sbusnw12
Categorical
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.8% |
Missing (n) | 4514 |
1.0 | 2 |
---|---|
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 2 | 0.0% | |
(Missing) | 4514 | 52.8% |
sbusnw2
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 59.6% |
Missing (n) | 5104 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.3078 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.46167 |
---|---|
Coef of variation | 0.353 |
Kurtosis | -1.307 |
Mean | 1.3078 |
MAD | 0.42616 |
Skewness | 0.8329 |
Sum | 4516 |
Variance | 0.21314 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 2390 | 27.9% | |
2.0 | 1063 | 12.4% | |
(Missing) | 5104 | 59.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 2390 | 27.9% | |
2.0 | 1063 | 12.4% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 2390 | 27.9% | |
2.0 | 1063 | 12.4% |
sbusnw7
Categorical
Distinct count | 5 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 51.0% |
Missing (n) | 4364 |
1.0 | 135 |
---|---|
2.0 | 16 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 135 | 1.6% | |
2.0 | 16 | 0.2% | |
2 | 1 | 0.0% | |
(Missing) | 4364 | 51.0% |
sbusnw8
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 51.8% |
Missing (n) | 4432 |
1.0 | 71 |
---|---|
2.0 | 13 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 71 | 0.8% | |
2.0 | 13 | 0.2% | |
(Missing) | 4432 | 51.8% |
sbusnw9
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.2% |
Missing (n) | 4466 |
1.0 | 42 |
---|---|
2.0 | 8 |
(Missing) |
Value | Count | Frequency (%) | |
4041 | 47.2% | ||
1.0 | 42 | 0.5% | |
2.0 | 8 | 0.1% | |
(Missing) | 4466 | 52.2% |
sbuspl1
Categorical
Distinct count | 111 |
---|---|
Unique (%) | 1.3% |
Missing (%) | 31.7% |
Missing (n) | 2714 |
4480.0 | 375 |
---|---|
1600.0 | 214 |
Other values (107) | |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 375 | 4.4% | |
1600.0 | 214 | 2.5% | |
7777.0 | 107 | 1.3% | |
5600.0 | 103 | 1.2% | |
7320.0 | 80 | 0.9% | |
7400.0 | 77 | 0.9% | |
7360.0 | 57 | 0.7% | |
5945.0 | 54 | 0.6% | |
3360.0 | 47 | 0.5% | |
Other values (100) | 679 | 7.9% | |
(Missing) | 2714 | 31.7% |
sbuspl10
Categorical
Distinct count | 12 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 52.4% |
Missing (n) | 4483 |
4480.0 | 13 |
---|---|
5945.0 | 2 |
Other values (8) | 9 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 13 | 0.2% | |
5945.0 | 2 | 0.0% | |
2840.0 | 2 | 0.0% | |
6780.0 | 1 | 0.0% | |
5120.0 | 1 | 0.0% | |
5000.0 | 1 | 0.0% | |
3360.0 | 1 | 0.0% | |
2320.0 | 1 | 0.0% | |
1920.0 | 1 | 0.0% | |
(Missing) | 4483 | 52.4% |
sbuspl11
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 52.5% |
Missing (n) | 4490 |
4480.0 | 9 |
---|---|
2840.0 | 2 |
Other values (6) | 6 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 9 | 0.1% | |
2840.0 | 2 | 0.0% | |
7460.0 | 1 | 0.0% | |
6920.0 | 1 | 0.0% | |
2320.0 | 1 | 0.0% | |
2080.0 | 1 | 0.0% | |
1920.0 | 1 | 0.0% | |
1600.0 | 1 | 0.0% | |
(Missing) | 4490 | 52.5% |
sbuspl12
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 52.6% |
Missing (n) | 4505 |
6200.0 | 1 |
---|---|
5945.0 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
6200.0 | 1 | 0.0% | |
5945.0 | 1 | 0.0% | |
(Missing) | 4505 | 52.6% |
sbuspl2
Categorical
Distinct count | 91 |
---|---|
Unique (%) | 1.1% |
Missing (%) | 38.9% |
Missing (n) | 3328 |
4480.0 | 245 |
---|---|
1600.0 | 142 |
Other values (87) | 792 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 245 | 2.9% | |
1600.0 | 142 | 1.7% | |
7777.0 | 78 | 0.9% | |
5600.0 | 62 | 0.7% | |
7320.0 | 56 | 0.7% | |
7400.0 | 44 | 0.5% | |
5945.0 | 42 | 0.5% | |
3360.0 | 39 | 0.5% | |
7360.0 | 36 | 0.4% | |
Other values (80) | 435 | 5.1% | |
(Missing) | 3328 | 38.9% |
sbuspl3
Categorical
Distinct count | 83 |
---|---|
Unique (%) | 1.0% |
Missing (%) | 44.2% |
Missing (n) | 3781 |
4480.0 | 174 |
---|---|
1600.0 | 100 |
Other values (79) | 452 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 174 | 2.0% | |
1600.0 | 100 | 1.2% | |
7777.0 | 49 | 0.6% | |
5600.0 | 36 | 0.4% | |
7320.0 | 36 | 0.4% | |
7400.0 | 27 | 0.3% | |
5945.0 | 23 | 0.3% | |
5775.0 | 17 | 0.2% | |
7360.0 | 17 | 0.2% | |
Other values (72) | 247 | 2.9% | |
(Missing) | 3781 | 44.2% |
sbuspl4
Categorical
Distinct count | 65 |
---|---|
Unique (%) | 0.8% |
Missing (%) | 47.6% |
Missing (n) | 4075 |
4480.0 | 107 |
---|---|
1600.0 | 58 |
Other values (61) | 267 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 107 | 1.3% | |
1600.0 | 58 | 0.7% | |
7777.0 | 35 | 0.4% | |
7320.0 | 22 | 0.3% | |
5600.0 | 19 | 0.2% | |
7400.0 | 15 | 0.2% | |
6160.0 | 11 | 0.1% | |
3360.0 | 11 | 0.1% | |
5945.0 | 10 | 0.1% | |
Other values (54) | 144 | 1.7% | |
(Missing) | 4075 | 47.6% |
sbuspl5
Categorical
Distinct count | 52 |
---|---|
Unique (%) | 0.6% |
Missing (%) | 49.4% |
Missing (n) | 4231 |
4480.0 | 67 |
---|---|
1600.0 | 39 |
Other values (48) | 170 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 67 | 0.8% | |
1600.0 | 39 | 0.5% | |
7777.0 | 29 | 0.3% | |
7320.0 | 16 | 0.2% | |
5600.0 | 13 | 0.2% | |
7400.0 | 11 | 0.1% | |
2840.0 | 7 | 0.1% | |
6780.0 | 6 | 0.1% | |
7360.0 | 6 | 0.1% | |
Other values (41) | 82 | 1.0% | |
(Missing) | 4231 | 49.4% |
sbuspl6
Categorical
Distinct count | 43 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 50.9% |
Missing (n) | 4352 |
4480.0 | 38 |
---|---|
1600.0 | 22 |
Other values (39) | 95 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 38 | 0.4% | |
1600.0 | 22 | 0.3% | |
7777.0 | 11 | 0.1% | |
7400.0 | 8 | 0.1% | |
5600.0 | 8 | 0.1% | |
7320.0 | 7 | 0.1% | |
5945.0 | 5 | 0.1% | |
1920.0 | 4 | 0.0% | |
2840.0 | 4 | 0.0% | |
Other values (32) | 48 | 0.6% | |
(Missing) | 4352 | 50.9% |
sbuspl7
Categorical
Distinct count | 35 |
---|---|
Unique (%) | 0.4% |
Missing (%) | 51.3% |
Missing (n) | 4389 |
4480.0 | 34 |
---|---|
1600.0 | 14 |
Other values (31) | 70 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 34 | 0.4% | |
1600.0 | 14 | 0.2% | |
7777.0 | 9 | 0.1% | |
7320.0 | 7 | 0.1% | |
5600.0 | 7 | 0.1% | |
5945.0 | 6 | 0.1% | |
7400.0 | 4 | 0.0% | |
520.0 | 3 | 0.0% | |
1920.0 | 3 | 0.0% | |
Other values (24) | 31 | 0.4% | |
(Missing) | 4389 | 51.3% |
sbuspl8
Categorical
Distinct count | 22 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 52.0% |
Missing (n) | 4448 |
4480.0 | 20 |
---|---|
1600.0 | 8 |
Other values (18) | 31 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 20 | 0.2% | |
1600.0 | 8 | 0.1% | |
7400.0 | 4 | 0.0% | |
3360.0 | 3 | 0.0% | |
1920.0 | 3 | 0.0% | |
5945.0 | 3 | 0.0% | |
5600.0 | 2 | 0.0% | |
7320.0 | 2 | 0.0% | |
5775.0 | 2 | 0.0% | |
Other values (11) | 12 | 0.1% | |
(Missing) | 4448 | 52.0% |
sbuspl9
Categorical
Distinct count | 16 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 52.3% |
Missing (n) | 4474 |
4480.0 | 13 |
---|---|
1600.0 | 5 |
Other values (12) | 15 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
4480.0 | 13 | 0.2% | |
1600.0 | 5 | 0.1% | |
2840.0 | 3 | 0.0% | |
5945.0 | 2 | 0.0% | |
8520.0 | 1 | 0.0% | |
7480.0 | 1 | 0.0% | |
7400.0 | 1 | 0.0% | |
7320.0 | 1 | 0.0% | |
5120.0 | 1 | 0.0% | |
Other values (5) | 5 | 0.1% | |
(Missing) | 4474 | 52.3% |
sbusst1
Categorical
Distinct count | 48 |
---|---|
Unique (%) | 0.6% |
Missing (%) | 24.0% |
Missing (n) | 2050 |
105.0 | |
---|---|
199.0 | 279 |
Other values (44) | |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 1007 | 11.8% | |
199.0 | 279 | 3.3% | |
114.0 | 222 | 2.6% | |
144.0 | 220 | 2.6% | |
133.0 | 125 | 1.5% | |
110.0 | 72 | 0.8% | |
103.0 | 55 | 0.6% | |
139.0 | 48 | 0.6% | |
129.0 | 42 | 0.5% | |
Other values (37) | 387 | 4.5% | |
(Missing) | 2050 | 24.0% |
sbusst10
Categorical
Distinct count | 8 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 52.3% |
Missing (n) | 4479 |
105.0 | 18 |
---|---|
144.0 | 5 |
Other values (4) | 5 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 18 | 0.2% | |
144.0 | 5 | 0.1% | |
199.0 | 2 | 0.0% | |
124.0 | 1 | 0.0% | |
114.0 | 1 | 0.0% | |
110.0 | 1 | 0.0% | |
(Missing) | 4479 | 52.3% |
sbusst11
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 52.5% |
Missing (n) | 4490 |
105.0 | 13 |
---|---|
144.0 | 2 |
Other values (2) | 2 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 13 | 0.2% | |
144.0 | 2 | 0.0% | |
114.0 | 1 | 0.0% | |
106.0 | 1 | 0.0% | |
(Missing) | 4490 | 52.5% |
sbusst12
Categorical
Distinct count | 5 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 52.6% |
Missing (n) | 4504 |
199.0 | 1 |
---|---|
105.0 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
199.0 | 1 | 0.0% | |
105.0 | 1 | 0.0% | |
103.0 | 1 | 0.0% | |
(Missing) | 4504 | 52.6% |
sbusst2
Categorical
Distinct count | 44 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 34.1% |
Missing (n) | 2916 |
105.0 | 660 |
---|---|
199.0 | 181 |
Other values (40) | 750 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 660 | 7.7% | |
199.0 | 181 | 2.1% | |
114.0 | 145 | 1.7% | |
144.0 | 140 | 1.6% | |
133.0 | 81 | 0.9% | |
110.0 | 44 | 0.5% | |
103.0 | 35 | 0.4% | |
139.0 | 33 | 0.4% | |
115.0 | 26 | 0.3% | |
Other values (33) | 246 | 2.9% | |
(Missing) | 2916 | 34.1% |
sbusst3
Categorical
Distinct count | 40 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 41.2% |
Missing (n) | 3523 |
105.0 | 412 |
---|---|
199.0 | 107 |
Other values (36) | 465 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 412 | 4.8% | |
199.0 | 107 | 1.3% | |
114.0 | 101 | 1.2% | |
144.0 | 76 | 0.9% | |
133.0 | 55 | 0.6% | |
110.0 | 25 | 0.3% | |
106.0 | 18 | 0.2% | |
139.0 | 18 | 0.2% | |
103.0 | 15 | 0.2% | |
Other values (29) | 157 | 1.8% | |
(Missing) | 3523 | 41.2% |
sbusst4
Categorical
Distinct count | 39 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 45.7% |
Missing (n) | 3911 |
105.0 | 254 |
---|---|
199.0 | 63 |
Other values (35) | 279 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 254 | 3.0% | |
199.0 | 63 | 0.7% | |
114.0 | 60 | 0.7% | |
144.0 | 39 | 0.5% | |
133.0 | 33 | 0.4% | |
110.0 | 18 | 0.2% | |
139.0 | 17 | 0.2% | |
137.0 | 10 | 0.1% | |
103.0 | 10 | 0.1% | |
Other values (28) | 92 | 1.1% | |
(Missing) | 3911 | 45.7% |
sbusst5
Categorical
Distinct count | 33 |
---|---|
Unique (%) | 0.4% |
Missing (%) | 48.3% |
Missing (n) | 4134 |
105.0 | 162 |
---|---|
114.0 | 42 |
Other values (29) | 169 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 162 | 1.9% | |
114.0 | 42 | 0.5% | |
199.0 | 39 | 0.5% | |
144.0 | 28 | 0.3% | |
133.0 | 21 | 0.2% | |
110.0 | 11 | 0.1% | |
139.0 | 9 | 0.1% | |
137.0 | 6 | 0.1% | |
111.0 | 5 | 0.1% | |
Other values (22) | 50 | 0.6% | |
(Missing) | 4134 | 48.3% |
sbusst6
Categorical
Distinct count | 28 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 50.2% |
Missing (n) | 4297 |
105.0 | 90 |
---|---|
199.0 | 25 |
Other values (24) | 95 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 90 | 1.1% | |
199.0 | 25 | 0.3% | |
114.0 | 23 | 0.3% | |
144.0 | 16 | 0.2% | |
133.0 | 11 | 0.1% | |
110.0 | 6 | 0.1% | |
139.0 | 5 | 0.1% | |
148.0 | 4 | 0.0% | |
111.0 | 3 | 0.0% | |
Other values (17) | 27 | 0.3% | |
(Missing) | 4297 | 50.2% |
sbusst7
Categorical
Distinct count | 23 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 51.0% |
Missing (n) | 4360 |
105.0 | 64 |
---|---|
199.0 | 19 |
Other values (19) | 64 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 64 | 0.7% | |
199.0 | 19 | 0.2% | |
114.0 | 14 | 0.2% | |
144.0 | 12 | 0.1% | |
133.0 | 9 | 0.1% | |
111.0 | 6 | 0.1% | |
110.0 | 5 | 0.1% | |
143.0 | 2 | 0.0% | |
129.0 | 2 | 0.0% | |
Other values (12) | 14 | 0.2% | |
(Missing) | 4360 | 51.0% |
sbusst8
Categorical
Distinct count | 16 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 51.8% |
Missing (n) | 4430 |
105.0 | 35 |
---|---|
199.0 | 9 |
Other values (12) | 33 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 35 | 0.4% | |
199.0 | 9 | 0.1% | |
144.0 | 9 | 0.1% | |
114.0 | 8 | 0.1% | |
148.0 | 2 | 0.0% | |
143.0 | 2 | 0.0% | |
133.0 | 2 | 0.0% | |
124.0 | 2 | 0.0% | |
110.0 | 2 | 0.0% | |
Other values (5) | 6 | 0.1% | |
(Missing) | 4430 | 51.8% |
sbusst9
Categorical
Distinct count | 13 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 52.2% |
Missing (n) | 4463 |
105.0 | 21 |
---|---|
144.0 | 6 |
Other values (9) | 17 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
105.0 | 21 | 0.2% | |
144.0 | 6 | 0.1% | |
199.0 | 5 | 0.1% | |
114.0 | 5 | 0.1% | |
148.0 | 1 | 0.0% | |
138.0 | 1 | 0.0% | |
137.0 | 1 | 0.0% | |
132.0 | 1 | 0.0% | |
124.0 | 1 | 0.0% | |
Other values (2) | 2 | 0.0% | |
(Missing) | 4463 | 52.2% |
sbyrgr1
Categorical
Distinct count | 72 |
---|---|
Unique (%) | 0.8% |
Missing (%) | 28.5% |
Missing (n) | 2443 |
1987.0 | 62 |
---|---|
1988.0 | 53 |
Other values (68) | 282 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1987.0 | 62 | 0.7% | |
1988.0 | 53 | 0.6% | |
1986.0 | 30 | 0.4% | |
1987 | 21 | 0.2% | |
1985.0 | 18 | 0.2% | |
1984.0 | 12 | 0.1% | |
1988 | 9 | 0.1% | |
1989.0 | 8 | 0.1% | |
1990.0 | 8 | 0.1% | |
Other values (61) | 176 | 2.1% | |
(Missing) | 2443 | 28.5% |
sbyrgr10
Categorical
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 33.1% |
Missing (n) | 2830 |
1986.0 | 3 |
---|---|
1987.0 | 2 |
Other values (5) | 5 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1986.0 | 3 | 0.0% | |
1987.0 | 2 | 0.0% | |
1994.0 | 1 | 0.0% | |
1979.0 | 1 | 0.0% | |
1976.0 | 1 | 0.0% | |
1975.0 | 1 | 0.0% | |
1968.0 | 1 | 0.0% | |
(Missing) | 2830 | 33.1% |
sbyrgr11
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 33.1% |
Missing (n) | 2836 |
1999.0 | 1 |
---|---|
1987.0 | 1 |
Other values (2) | 2 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1999.0 | 1 | 0.0% | |
1987.0 | 1 | 0.0% | |
1979.0 | 1 | 0.0% | |
1970.0 | 1 | 0.0% | |
(Missing) | 2836 | 33.1% |
sbyrgr12
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 33.2% |
Missing (n) | 2838 |
1987.0 | 1 |
---|---|
1979.0 | 1 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1987.0 | 1 | 0.0% | |
1979.0 | 1 | 0.0% | |
(Missing) | 2838 | 33.2% |
sbyrgr2
Categorical
Distinct count | 58 |
---|---|
Unique (%) | 0.7% |
Missing (%) | 30.4% |
Missing (n) | 2603 |
1987.0 | 49 |
---|---|
1988.0 | 31 |
Other values (54) | 157 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1987.0 | 49 | 0.6% | |
1988.0 | 31 | 0.4% | |
1986.0 | 17 | 0.2% | |
1987 | 16 | 0.2% | |
1985.0 | 12 | 0.1% | |
1980.0 | 7 | 0.1% | |
1997.0 | 6 | 0.1% | |
1990.0 | 6 | 0.1% | |
1999.0 | 5 | 0.1% | |
Other values (47) | 88 | 1.0% | |
(Missing) | 2603 | 30.4% |
sbyrgr3
Categorical
Distinct count | 45 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 31.4% |
Missing (n) | 2684 |
1987.0 | 32 |
---|---|
1987 | 17 |
Other values (41) | 107 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1987.0 | 32 | 0.4% | |
1987 | 17 | 0.2% | |
1988.0 | 14 | 0.2% | |
1986.0 | 11 | 0.1% | |
1995.0 | 6 | 0.1% | |
1985.0 | 5 | 0.1% | |
2000.0 | 4 | 0.0% | |
1980.0 | 4 | 0.0% | |
1990.0 | 4 | 0.0% | |
Other values (34) | 59 | 0.7% | |
(Missing) | 2684 | 31.4% |
sbyrgr4
Categorical
Distinct count | 40 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 31.9% |
Missing (n) | 2726 |
1987.0 | 19 |
---|---|
1988.0 | 14 |
Other values (36) | 81 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1987.0 | 19 | 0.2% | |
1988.0 | 14 | 0.2% | |
1986.0 | 12 | 0.1% | |
1987 | 10 | 0.1% | |
1995.0 | 6 | 0.1% | |
1996.0 | 4 | 0.0% | |
1980.0 | 3 | 0.0% | |
1984.0 | 3 | 0.0% | |
1999.0 | 3 | 0.0% | |
Other values (29) | 40 | 0.5% | |
(Missing) | 2726 | 31.9% |
sbyrgr5
Categorical
Distinct count | 30 |
---|---|
Unique (%) | 0.4% |
Missing (%) | 32.4% |
Missing (n) | 2773 |
1987.0 | 13 |
---|---|
1986.0 | 7 |
Other values (26) | 47 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1987.0 | 13 | 0.2% | |
1986.0 | 7 | 0.1% | |
1988.0 | 7 | 0.1% | |
1990.0 | 4 | 0.0% | |
1989.0 | 3 | 0.0% | |
1984.0 | 3 | 0.0% | |
1987 | 2 | 0.0% | |
1967.0 | 2 | 0.0% | |
1997.0 | 2 | 0.0% | |
Other values (19) | 24 | 0.3% | |
(Missing) | 2773 | 32.4% |
sbyrgr6
Categorical
Distinct count | 24 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 32.7% |
Missing (n) | 2796 |
1987.0 | 9 |
---|---|
1988.0 | 4 |
Other values (20) | 31 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1987.0 | 9 | 0.1% | |
1988.0 | 4 | 0.0% | |
1986.0 | 3 | 0.0% | |
1997.0 | 3 | 0.0% | |
1984.0 | 2 | 0.0% | |
1968.0 | 2 | 0.0% | |
1989.0 | 2 | 0.0% | |
1996.0 | 2 | 0.0% | |
1987 | 2 | 0.0% | |
Other values (13) | 15 | 0.2% | |
(Missing) | 2796 | 32.7% |
sbyrgr7
Categorical
Distinct count | 18 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 32.9% |
Missing (n) | 2816 |
1987.0 | 4 |
---|---|
1986.0 | 4 |
Other values (14) | 16 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1987.0 | 4 | 0.0% | |
1986.0 | 4 | 0.0% | |
1987 | 2 | 0.0% | |
1970.0 | 2 | 0.0% | |
1975.0 | 1 | 0.0% | |
1968.0 | 1 | 0.0% | |
1969.0 | 1 | 0.0% | |
1971.0 | 1 | 0.0% | |
1973.0 | 1 | 0.0% | |
Other values (7) | 7 | 0.1% | |
(Missing) | 2816 | 32.9% |
sbyrgr8
Categorical
Distinct count | 14 |
---|---|
Unique (%) | 0.2% |
Missing (%) | 33.0% |
Missing (n) | 2825 |
1987.0 | 3 |
---|---|
1970.0 | 2 |
Other values (10) | 10 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1987.0 | 3 | 0.0% | |
1970.0 | 2 | 0.0% | |
1987 | 1 | 0.0% | |
1993.0 | 1 | 0.0% | |
1989.0 | 1 | 0.0% | |
1986.0 | 1 | 0.0% | |
1985.0 | 1 | 0.0% | |
1975.0 | 1 | 0.0% | |
1973.0 | 1 | 0.0% | |
Other values (3) | 3 | 0.0% | |
(Missing) | 2825 | 33.0% |
sbyrgr9
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 33.0% |
Missing (n) | 2828 |
1986.0 | 3 |
---|---|
1987.0 | 2 |
Other values (6) | 7 |
(Missing) |
Value | Count | Frequency (%) | |
5717 | 66.8% | ||
1986.0 | 3 | 0.0% | |
1987.0 | 2 | 0.0% | |
1975.0 | 2 | 0.0% | |
1993.0 | 1 | 0.0% | |
1985.0 | 1 | 0.0% | |
1973.0 | 1 | 0.0% | |
1970.0 | 1 | 0.0% | |
1968.0 | 1 | 0.0% | |
(Missing) | 2828 | 33.0% |
schools
Numeric
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 2.2% |
Missing (n) | 192 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.9149 |
---|---|
Minimum | 1 |
Maximum | 8 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 2 |
Median | 2 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 8 |
Range | 7 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.59503 |
---|---|
Coef of variation | 0.31074 |
Kurtosis | 69.669 |
Mean | 1.9149 |
MAD | 0.22793 |
Skewness | 6.5841 |
Sum | 16018 |
Variance | 0.35406 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 7268 | 84.9% | |
1.0 | 1042 | 12.2% | |
8.0 | 55 | 0.6% | |
(Missing) | 192 | 2.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 1042 | 12.2% | |
2.0 | 7268 | 84.9% | |
8.0 | 55 | 0.6% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 1042 | 12.2% | |
2.0 | 7268 | 84.9% | |
8.0 | 55 | 0.6% |
sex
Boolean
Distinct count | 2 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Mean | 1.0473 |
---|
1 | |
---|---|
2 | 405 |
Value | Count | Frequency (%) | |
1 | 8152 | 95.3% | |
2 | 405 | 4.7% |
smokeage
Categorical
Distinct count | 58 |
---|---|
Unique (%) | 0.7% |
Missing (%) | 14.1% |
Missing (n) | 1203 |
15 | 113 |
---|---|
18 | 77 |
Other values (54) | 449 |
(Missing) | 1203 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
15 | 113 | 1.3% | |
18 | 77 | 0.9% | |
16 | 54 | 0.6% | |
20 | 50 | 0.6% | |
12 | 48 | 0.6% | |
14 | 43 | 0.5% | |
13 | 35 | 0.4% | |
17 | 33 | 0.4% | |
15.0 | 19 | 0.2% | |
Other values (47) | 167 | 2.0% | |
(Missing) | 1203 | 14.1% |
smoked
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 7 |
2 | 879 |
---|---|
1 | 592 |
Other values (2) | 364 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
2 | 879 | 10.3% | |
1 | 592 | 6.9% | |
2.0 | 250 | 2.9% | |
1.0 | 114 | 1.3% | |
(Missing) | 7 | 0.1% |
smokes
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 5 |
2 | 1156 |
---|---|
1 | 317 |
Other values (2) | 364 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
2 | 1156 | 13.5% | |
1 | 317 | 3.7% | |
2.0 | 300 | 3.5% | |
1.0 | 64 | 0.7% | |
(Missing) | 5 | 0.1% |
social
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 5.1% |
Missing (n) | 440 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.9048 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 2 |
Median | 2 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.29355 |
---|---|
Coef of variation | 0.15412 |
Kurtosis | 5.6101 |
Mean | 1.9048 |
MAD | 0.17233 |
Skewness | -2.7584 |
Sum | 15461 |
Variance | 0.086174 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 7344 | 85.8% | |
1.0 | 773 | 9.0% | |
(Missing) | 440 | 5.1% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 773 | 9.0% | |
2.0 | 7344 | 85.8% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 773 | 9.0% | |
2.0 | 7344 | 85.8% |
sport
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 5.0% |
Missing (n) | 427 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.9047 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 2 |
Median | 2 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.29368 |
---|---|
Coef of variation | 0.15419 |
Kurtosis | 5.5999 |
Mean | 1.9047 |
MAD | 0.17248 |
Skewness | -2.7565 |
Sum | 15485 |
Variance | 0.08625 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 7355 | 86.0% | |
1.0 | 775 | 9.1% | |
(Missing) | 427 | 5.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 775 | 9.1% | |
2.0 | 7355 | 86.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 775 | 9.1% | |
2.0 | 7355 | 86.0% |
ssi
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 49.4% |
Missing (n) | 4223 |
2.0 | 265 |
---|---|
1.0 | 19 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
2.0 | 265 | 3.1% | |
1.0 | 19 | 0.2% | |
(Missing) | 4223 | 49.4% |
sstax
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 19.9% |
Missing (n) | 1702 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.2554 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 0.43614 |
---|---|
Coef of variation | 0.3474 |
Kurtosis | -0.7417 |
Mean | 1.2554 |
MAD | 0.38037 |
Skewness | 1.1218 |
Sum | 8606 |
Variance | 0.19022 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 5104 | 59.6% | |
2.0 | 1751 | 20.5% | |
(Missing) | 1702 | 19.9% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 5104 | 59.6% | |
2.0 | 1751 | 20.5% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 5104 | 59.6% | |
2.0 | 1751 | 20.5% |
sstaxs
Categorical
Distinct count | 5 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 47.8% |
Missing (n) | 4091 |
1.0 | 297 |
---|---|
2.0 | 114 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 297 | 3.5% | |
2.0 | 114 | 1.3% | |
1 | 5 | 0.1% | |
(Missing) | 4091 | 47.8% |
statebrn
Numeric
Distinct count | 35 |
---|---|
Unique (%) | 0.4% |
Missing (%) | 0.1% |
Missing (n) | 9 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 17.63 |
---|---|
Minimum | 1 |
Maximum | 280 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 8 |
Q1 | 12 |
Median | 16 |
Q3 | 22 |
95-th percentile | 32 |
Maximum | 280 |
Range | 279 |
Interquartile range | 10 |
Descriptive statistics
Standard deviation | 9.3768 |
---|---|
Coef of variation | 0.53188 |
Kurtosis | 206.96 |
Mean | 17.63 |
MAD | 6.438 |
Skewness | 8.5024 |
Sum | 150700 |
Variance | 87.924 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
14.0 | 1714 | 20.0% | |
11.0 | 1058 | 12.4% | |
16.0 | 971 | 11.3% | |
32.0 | 833 | 9.7% | |
24.0 | 637 | 7.4% | |
21.0 | 419 | 4.9% | |
10.0 | 329 | 3.8% | |
22.0 | 301 | 3.5% | |
15.0 | 260 | 3.0% | |
8.0 | 232 | 2.7% | |
Other values (24) | 1794 | 21.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 145 | 1.7% | |
2.0 | 84 | 1.0% | |
4.0 | 1 | 0.0% | |
5.0 | 19 | 0.2% | |
6.0 | 124 | 1.4% |
Maximum 5 values
Value | Count | Frequency (%) | |
31.0 | 144 | 1.7% | |
32.0 | 833 | 9.7% | |
212.0 | 2 | 0.0% | |
213.0 | 1 | 0.0% | |
280.0 | 2 | 0.0% |
sugar
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 8 |
2 | 1306 |
---|---|
2.0 | 327 |
Other values (2) | 201 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
2 | 1306 | 15.3% | |
2.0 | 327 | 3.8% | |
1 | 165 | 1.9% | |
1.0 | 36 | 0.4% | |
(Missing) | 8 | 0.1% |
surveypl
Boolean
Distinct count | 2 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Mean | 1.1256 |
---|
1 | |
---|---|
2 | 1075 |
Value | Count | Frequency (%) | |
1 | 7482 | 87.4% | |
2 | 1075 | 12.6% |
surveyyr
Highly correlated
This variable is highly correlated with commun
and should be ignored for analysis
Correlation | 0.97277 |
---|
taxes
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 3.8% |
Missing (n) | 325 |
2.0 | |
---|---|
1.0 | |
Other values (2) | 45 |
(Missing) | 325 |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
2.0 | 3251 | 38.0% | |
1.0 | 886 | 10.4% | |
2 | 39 | 0.5% | |
1 | 6 | 0.1% | |
(Missing) | 325 | 3.8% |
uncevus
Numeric
Distinct count | 29 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 6.2% |
Missing (n) | 533 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.5932 |
---|---|
Minimum | 0 |
Maximum | 100 |
Zeros (%) | 58.6% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 2 |
95-th percentile | 8 |
Maximum | 100 |
Range | 100 |
Interquartile range | 2 |
Descriptive statistics
Standard deviation | 3.6295 |
---|---|
Coef of variation | 2.2781 |
Kurtosis | 93.845 |
Mean | 1.5932 |
MAD | 2.1057 |
Skewness | 6.4132 |
Sum | 12784 |
Variance | 13.173 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 5015 | 58.6% | |
1.0 | 772 | 9.0% | |
2.0 | 658 | 7.7% | |
3.0 | 377 | 4.4% | |
4.0 | 304 | 3.6% | |
5.0 | 201 | 2.3% | |
6.0 | 163 | 1.9% | |
10.0 | 137 | 1.6% | |
8.0 | 106 | 1.2% | |
7.0 | 75 | 0.9% | |
Other values (18) | 216 | 2.5% | |
(Missing) | 533 | 6.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 5015 | 58.6% | |
1.0 | 772 | 9.0% | |
2.0 | 658 | 7.7% | |
3.0 | 377 | 4.4% | |
4.0 | 304 | 3.6% |
Maximum 5 values
Value | Count | Frequency (%) | |
30.0 | 10 | 0.1% | |
38.0 | 1 | 0.0% | |
40.0 | 8 | 0.1% | |
50.0 | 1 | 0.0% | |
100.0 | 1 | 0.0% |
uncinus
Numeric
Distinct count | 24 |
---|---|
Unique (%) | 0.3% |
Missing (%) | 1.7% |
Missing (n) | 148 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 0.97431 |
---|---|
Minimum | 0 |
Maximum | 50 |
Zeros (%) | 71.2% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 0 |
Q1 | 0 |
Median | 0 |
Q3 | 1 |
95-th percentile | 5 |
Maximum | 50 |
Range | 50 |
Interquartile range | 1 |
Descriptive statistics
Standard deviation | 2.5646 |
---|---|
Coef of variation | 2.6322 |
Kurtosis | 65.573 |
Mean | 0.97431 |
MAD | 1.411 |
Skewness | 5.9314 |
Sum | 8193 |
Variance | 6.5771 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
0.0 | 6089 | 71.2% | |
1.0 | 761 | 8.9% | |
2.0 | 516 | 6.0% | |
3.0 | 292 | 3.4% | |
4.0 | 205 | 2.4% | |
5.0 | 149 | 1.7% | |
10.0 | 102 | 1.2% | |
6.0 | 98 | 1.1% | |
8.0 | 57 | 0.7% | |
7.0 | 41 | 0.5% | |
Other values (13) | 99 | 1.2% | |
(Missing) | 148 | 1.7% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 6089 | 71.2% | |
1.0 | 761 | 8.9% | |
2.0 | 516 | 6.0% | |
3.0 | 292 | 3.4% | |
4.0 | 205 | 2.4% |
Maximum 5 values
Value | Count | Frequency (%) | |
19.0 | 1 | 0.0% | |
20.0 | 22 | 0.3% | |
25.0 | 1 | 0.0% | |
30.0 | 2 | 0.0% | |
50.0 | 3 | 0.0% |
unemp
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 4.1% |
Missing (n) | 347 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.92 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 2 |
Median | 2 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.27135 |
---|---|
Coef of variation | 0.14133 |
Kurtosis | 7.5885 |
Mean | 1.92 |
MAD | 0.14724 |
Skewness | -3.0962 |
Sum | 15763 |
Variance | 0.073629 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 7553 | 88.3% | |
1.0 | 657 | 7.7% | |
(Missing) | 347 | 4.1% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 657 | 7.7% | |
2.0 | 7553 | 88.3% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 657 | 7.7% | |
2.0 | 7553 | 88.3% |
usby1
Numeric
Distinct count | 7 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 40.7% |
Missing (n) | 3486 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.2112 |
---|---|
Minimum | 1 |
Maximum | 6 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 1 |
95-th percentile | 3 |
Maximum | 6 |
Range | 5 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.64859 |
---|---|
Coef of variation | 0.53549 |
Kurtosis | 10.935 |
Mean | 1.2112 |
MAD | 0.37634 |
Skewness | 3.26 |
Sum | 6142 |
Variance | 0.42067 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 4518 | 52.8% | |
3.0 | 358 | 4.2% | |
2.0 | 129 | 1.5% | |
4.0 | 42 | 0.5% | |
5.0 | 20 | 0.2% | |
6.0 | 4 | 0.0% | |
(Missing) | 3486 | 40.7% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 4518 | 52.8% | |
2.0 | 129 | 1.5% | |
3.0 | 358 | 4.2% | |
4.0 | 42 | 0.5% | |
5.0 | 20 | 0.2% |
Maximum 5 values
Value | Count | Frequency (%) | |
2.0 | 129 | 1.5% | |
3.0 | 358 | 4.2% | |
4.0 | 42 | 0.5% | |
5.0 | 20 | 0.2% | |
6.0 | 4 | 0.0% |
usbyl
Numeric
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 32.6% |
Missing (n) | 2787 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.3506 |
---|---|
Minimum | 1 |
Maximum | 888 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 1 |
Q3 | 1 |
95-th percentile | 3 |
Maximum | 888 |
Range | 887 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 11.693 |
---|---|
Coef of variation | 8.6573 |
Kurtosis | 5734.4 |
Mean | 1.3506 |
MAD | 0.63255 |
Skewness | 75.61 |
Sum | 7793 |
Variance | 136.72 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 5205 | 60.8% | |
3.0 | 375 | 4.4% | |
2.0 | 111 | 1.3% | |
4.0 | 51 | 0.6% | |
5.0 | 18 | 0.2% | |
6.0 | 8 | 0.1% | |
11.0 | 1 | 0.0% | |
888.0 | 1 | 0.0% | |
(Missing) | 2787 | 32.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 5205 | 60.8% | |
2.0 | 111 | 1.3% | |
3.0 | 375 | 4.4% | |
4.0 | 51 | 0.6% | |
5.0 | 18 | 0.2% |
Maximum 5 values
Value | Count | Frequency (%) | |
4.0 | 51 | 0.6% | |
5.0 | 18 | 0.2% | |
6.0 | 8 | 0.1% | |
11.0 | 1 | 0.0% | |
888.0 | 1 | 0.0% |
uscurtrp
Boolean
Distinct count | 2 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Mean | 1.7829 |
---|
2 | |
---|---|
1 |
Value | Count | Frequency (%) | |
2 | 6699 | 78.3% | |
1 | 1858 | 21.7% |
usdoc1
Numeric
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.3% |
Missing (n) | 29 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 6.5875 |
---|---|
Minimum | 1 |
Maximum | 8 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 2 |
Q1 | 5 |
Median | 8 |
Q3 | 8 |
95-th percentile | 8 |
Maximum | 8 |
Range | 7 |
Interquartile range | 3 |
Descriptive statistics
Standard deviation | 2.4622 |
---|---|
Coef of variation | 0.37376 |
Kurtosis | -0.030655 |
Mean | 6.5875 |
MAD | 2.0719 |
Skewness | -1.3186 |
Sum | 56178 |
Variance | 6.0622 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
8.0 | 6254 | 73.1% | |
2.0 | 1069 | 12.5% | |
5.0 | 540 | 6.3% | |
1.0 | 409 | 4.8% | |
3.0 | 157 | 1.8% | |
4.0 | 84 | 1.0% | |
6.0 | 13 | 0.2% | |
7.0 | 2 | 0.0% | |
(Missing) | 29 | 0.3% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 409 | 4.8% | |
2.0 | 1069 | 12.5% | |
3.0 | 157 | 1.8% | |
4.0 | 84 | 1.0% | |
5.0 | 540 | 6.3% |
Maximum 5 values
Value | Count | Frequency (%) | |
4.0 | 84 | 1.0% | |
5.0 | 540 | 6.3% | |
6.0 | 13 | 0.2% | |
7.0 | 2 | 0.0% | |
8.0 | 6254 | 73.1% |
usdocl
Numeric
Distinct count | 9 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.3% |
Missing (n) | 29 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 5.8834 |
---|---|
Minimum | 1 |
Maximum | 8 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 2 |
Median | 8 |
Q3 | 8 |
95-th percentile | 8 |
Maximum | 8 |
Range | 7 |
Interquartile range | 6 |
Descriptive statistics
Standard deviation | 2.9456 |
---|---|
Coef of variation | 0.50066 |
Kurtosis | -1.1758 |
Mean | 5.8834 |
MAD | 2.6817 |
Skewness | -0.81048 |
Sum | 50174 |
Variance | 8.6765 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
8.0 | 5398 | 63.1% | |
1.0 | 1584 | 18.5% | |
2.0 | 653 | 7.6% | |
5.0 | 566 | 6.6% | |
3.0 | 168 | 2.0% | |
4.0 | 95 | 1.1% | |
6.0 | 62 | 0.7% | |
7.0 | 2 | 0.0% | |
(Missing) | 29 | 0.3% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 1584 | 18.5% | |
2.0 | 653 | 7.6% | |
3.0 | 168 | 2.0% | |
4.0 | 95 | 1.1% | |
5.0 | 566 | 6.6% |
Maximum 5 values
Value | Count | Frequency (%) | |
4.0 | 95 | 1.1% | |
5.0 | 566 | 6.6% | |
6.0 | 62 | 0.7% | |
7.0 | 2 | 0.0% | |
8.0 | 5398 | 63.1% |
usdur1
Numeric
Distinct count | 178 |
---|---|
Unique (%) | 2.1% |
Missing (%) | 0.0% |
Missing (n) | 3 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 37.818 |
---|---|
Minimum | 1 |
Maximum | 768 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 2 |
Q1 | 6 |
Median | 12 |
Q3 | 36 |
95-th percentile | 174 |
Maximum | 768 |
Range | 767 |
Interquartile range | 30 |
Descriptive statistics
Standard deviation | 70.925 |
---|---|
Coef of variation | 1.8754 |
Kurtosis | 18.522 |
Mean | 37.818 |
MAD | 40.657 |
Skewness | 3.8828 |
Sum | 323500 |
Variance | 5030.3 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
12.0 | 1245 | 14.5% | |
6.0 | 887 | 10.4% | |
24.0 | 782 | 9.1% | |
3.0 | 611 | 7.1% | |
36.0 | 493 | 5.8% | |
2.0 | 460 | 5.4% | |
8.0 | 372 | 4.3% | |
4.0 | 305 | 3.6% | |
48.0 | 279 | 3.3% | |
1.0 | 254 | 3.0% | |
Other values (167) | 2866 | 33.5% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 254 | 3.0% | |
2.0 | 460 | 5.4% | |
3.0 | 611 | 7.1% | |
4.0 | 305 | 3.6% | |
5.0 | 194 | 2.3% |
Maximum 5 values
Value | Count | Frequency (%) | |
606.0 | 1 | 0.0% | |
612.0 | 1 | 0.0% | |
672.0 | 1 | 0.0% | |
726.0 | 1 | 0.0% | |
768.0 | 1 | 0.0% |
usdurl
Numeric
Distinct count | 194 |
---|---|
Unique (%) | 2.3% |
Missing (%) | 0.0% |
Missing (n) | 1 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 44.322 |
---|---|
Minimum | 1 |
Maximum | 768 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 2 |
Q1 | 6 |
Median | 12 |
Q3 | 36 |
95-th percentile | 222 |
Maximum | 768 |
Range | 767 |
Interquartile range | 30 |
Descriptive statistics
Standard deviation | 80.898 |
---|---|
Coef of variation | 1.8252 |
Kurtosis | 13.236 |
Mean | 44.322 |
MAD | 49.63 |
Skewness | 3.3432 |
Sum | 379220 |
Variance | 6544.4 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
12.0 | 1056 | 12.3% | |
6.0 | 1010 | 11.8% | |
24.0 | 605 | 7.1% | |
3.0 | 506 | 5.9% | |
2.0 | 423 | 4.9% | |
36.0 | 368 | 4.3% | |
8.0 | 331 | 3.9% | |
18.0 | 321 | 3.8% | |
1.0 | 314 | 3.7% | |
4.0 | 314 | 3.7% | |
Other values (183) | 3308 | 38.7% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 314 | 3.7% | |
2.0 | 423 | 4.9% | |
3.0 | 506 | 5.9% | |
4.0 | 314 | 3.7% | |
5.0 | 213 | 2.5% |
Maximum 5 values
Value | Count | Frequency (%) | |
618.0 | 2 | 0.0% | |
648.0 | 1 | 0.0% | |
672.0 | 1 | 0.0% | |
726.0 | 1 | 0.0% | |
768.0 | 1 | 0.0% |
usexp
Numeric
Distinct count | 397 |
---|---|
Unique (%) | 4.6% |
Missing (%) | 3.7% |
Missing (n) | 319 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 78.443 |
---|---|
Minimum | 1 |
Maximum | 922.5 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 3 |
Q1 | 12 |
Median | 36 |
Q3 | 108 |
95-th percentile | 288 |
Maximum | 922.5 |
Range | 921.5 |
Interquartile range | 96 |
Descriptive statistics
Standard deviation | 98.831 |
---|---|
Coef of variation | 1.2599 |
Kurtosis | 6.15 |
Mean | 78.443 |
MAD | 71.406 |
Skewness | 2.2257 |
Sum | 646210 |
Variance | 9767.6 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
12.0 | 593 | 6.9% | |
24.0 | 554 | 6.5% | |
36.0 | 393 | 4.6% | |
6.0 | 362 | 4.2% | |
48.0 | 261 | 3.1% | |
60.0 | 221 | 2.6% | |
3.0 | 190 | 2.2% | |
72.0 | 181 | 2.1% | |
4.0 | 160 | 1.9% | |
18.0 | 153 | 1.8% | |
Other values (386) | 5170 | 60.4% | |
(Missing) | 319 | 3.7% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 109 | 1.3% | |
2.0 | 144 | 1.7% | |
3.0 | 190 | 2.2% | |
4.0 | 160 | 1.9% | |
5.0 | 111 | 1.3% |
Maximum 5 values
Value | Count | Frequency (%) | |
690.0 | 1 | 0.0% | |
732.0 | 1 | 0.0% | |
768.0 | 1 | 0.0% | |
780.0 | 1 | 0.0% | |
922.5 | 1 | 0.0% |
ushealth
Categorical
Distinct count | 10 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 1.3% |
Missing (n) | 114 |
3 | 1016 |
---|---|
4 | 324 |
Other values (6) | 388 |
Value | Count | Frequency (%) | |
6715 | 78.5% | ||
3 | 1016 | 11.9% | |
4 | 324 | 3.8% | |
3.0 | 197 | 2.3% | |
4.0 | 127 | 1.5% | |
2 | 42 | 0.5% | |
2.0 | 18 | 0.2% | |
1 | 3 | 0.0% | |
1.0 | 1 | 0.0% | |
(Missing) | 114 | 1.3% |
usmar1
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 9 |
1.0 | |
---|---|
2.0 | |
Other values (2) |
Value | Count | Frequency (%) | |
4856 | 56.7% | ||
1.0 | 1234 | 14.4% | |
2.0 | 1176 | 13.7% | |
1 | 717 | 8.4% | |
2 | 565 | 6.6% | |
(Missing) | 9 | 0.1% |
usmarl
Categorical
Distinct count | 6 |
---|---|
Unique (%) | 0.1% |
Missing (%) | 0.1% |
Missing (n) | 10 |
1.0 | |
---|---|
1 | 962 |
Other values (2) |
Value | Count | Frequency (%) | |
4856 | 56.7% | ||
1.0 | 1628 | 19.0% | |
1 | 962 | 11.2% | |
2.0 | 778 | 9.1% | |
2 | 323 | 3.8% | |
(Missing) | 10 | 0.1% |
usocc1
Numeric
Distinct count | 96 |
---|---|
Unique (%) | 1.1% |
Missing (%) | 1.8% |
Missing (n) | 150 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 514.66 |
---|---|
Minimum | 10 |
Maximum | 831 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 10 |
---|---|
5-th percentile | 410 |
Q1 | 410 |
Median | 523 |
Q3 | 549 |
95-th percentile | 812 |
Maximum | 831 |
Range | 821 |
Interquartile range | 139 |
Descriptive statistics
Standard deviation | 172.51 |
---|---|
Coef of variation | 0.33519 |
Kurtosis | 0.95278 |
Mean | 514.66 |
MAD | 125.52 |
Skewness | -0.064182 |
Sum | 4326800 |
Variance | 29760 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
410.0 | 3300 | 38.6% | |
549.0 | 971 | 11.3% | |
812.0 | 664 | 7.8% | |
810.0 | 526 | 6.1% | |
526.0 | 364 | 4.3% | |
529.0 | 344 | 4.0% | |
520.0 | 250 | 2.9% | |
546.0 | 214 | 2.5% | |
524.0 | 196 | 2.3% | |
711.0 | 140 | 1.6% | |
Other values (85) | 1438 | 16.8% | |
(Missing) | 150 | 1.8% |
Minimum 5 values
Value | Count | Frequency (%) | |
10.0 | 84 | 1.0% | |
20.0 | 66 | 0.8% | |
30.0 | 12 | 0.1% | |
41.0 | 20 | 0.2% | |
42.0 | 54 | 0.6% |
Maximum 5 values
Value | Count | Frequency (%) | |
815.0 | 4 | 0.0% | |
819.0 | 66 | 0.8% | |
820.0 | 99 | 1.2% | |
830.0 | 3 | 0.0% | |
831.0 | 5 | 0.1% |
usoccl
Numeric
Distinct count | 110 |
---|---|
Unique (%) | 1.3% |
Missing (%) | 1.7% |
Missing (n) | 145 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 521.5 |
---|---|
Minimum | 10 |
Maximum | 831 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 10 |
---|---|
5-th percentile | 215 |
Q1 | 410 |
Median | 526 |
Q3 | 549 |
95-th percentile | 812 |
Maximum | 831 |
Range | 821 |
Interquartile range | 139 |
Descriptive statistics
Standard deviation | 175.8 |
---|---|
Coef of variation | 0.3371 |
Kurtosis | 1.039 |
Mean | 521.5 |
MAD | 123.48 |
Skewness | -0.27033 |
Sum | 4386900 |
Variance | 30905 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
410.0 | 2689 | 31.4% | |
549.0 | 1052 | 12.3% | |
812.0 | 625 | 7.3% | |
810.0 | 547 | 6.4% | |
526.0 | 435 | 5.1% | |
529.0 | 378 | 4.4% | |
520.0 | 294 | 3.4% | |
524.0 | 247 | 2.9% | |
546.0 | 245 | 2.9% | |
711.0 | 153 | 1.8% | |
Other values (99) | 1747 | 20.4% | |
(Missing) | 145 | 1.7% |
Minimum 5 values
Value | Count | Frequency (%) | |
10.0 | 118 | 1.4% | |
20.0 | 75 | 0.9% | |
30.0 | 12 | 0.1% | |
41.0 | 5 | 0.1% | |
42.0 | 18 | 0.2% |
Maximum 5 values
Value | Count | Frequency (%) | |
816.0 | 1 | 0.0% | |
819.0 | 85 | 1.0% | |
820.0 | 98 | 1.1% | |
830.0 | 7 | 0.1% | |
831.0 | 4 | 0.0% |
usplace1
Numeric
Distinct count | 138 |
---|---|
Unique (%) | 1.6% |
Missing (%) | 17.4% |
Missing (n) | 1490 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 5096.9 |
---|---|
Minimum | 40 |
Maximum | 9360 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 40 |
---|---|
5-th percentile | 1600 |
Q1 | 3480 |
Median | 4480 |
Q3 | 7320 |
95-th percentile | 8017.1 |
Maximum | 9360 |
Range | 9320 |
Interquartile range | 3840 |
Descriptive statistics
Standard deviation | 2200.3 |
---|---|
Coef of variation | 0.4317 |
Kurtosis | -0.93964 |
Mean | 5096.9 |
MAD | 1857.5 |
Skewness | -0.24777 |
Sum | 36020000 |
Variance | 4841500 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
4480.0 | 1713 | 20.0% | |
7777.0 | 614 | 7.2% | |
1600.0 | 574 | 6.7% | |
7320.0 | 357 | 4.2% | |
5945.0 | 288 | 3.4% | |
3360.0 | 279 | 3.3% | |
2840.0 | 265 | 3.1% | |
6780.0 | 229 | 2.7% | |
1920.0 | 198 | 2.3% | |
5600.0 | 196 | 2.3% | |
Other values (127) | 2354 | 27.5% | |
(Missing) | 1490 | 17.4% |
Minimum 5 values
Value | Count | Frequency (%) | |
40.0 | 6 | 0.1% | |
200.0 | 7 | 0.1% | |
240.0 | 4 | 0.0% | |
320.0 | 11 | 0.1% | |
334.0 | 4 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
9040.0 | 2 | 0.0% | |
9160.0 | 3 | 0.0% | |
9260.0 | 1 | 0.0% | |
9340.0 | 3 | 0.0% | |
9360.0 | 15 | 0.2% |
usplacel
Numeric
Distinct count | 149 |
---|---|
Unique (%) | 1.7% |
Missing (%) | 16.8% |
Missing (n) | 1434 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 5097.3 |
---|---|
Minimum | 40 |
Maximum | 9360 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 40 |
---|---|
5-th percentile | 1600 |
Q1 | 3360 |
Median | 4480 |
Q3 | 7320 |
95-th percentile | 8120 |
Maximum | 9360 |
Range | 9320 |
Interquartile range | 3960 |
Descriptive statistics
Standard deviation | 2216.8 |
---|---|
Coef of variation | 0.4349 |
Kurtosis | -0.95719 |
Mean | 5097.3 |
MAD | 1874.1 |
Skewness | -0.24967 |
Sum | 36308000 |
Variance | 4914300 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
4480.0 | 1706 | 19.9% | |
7777.0 | 651 | 7.6% | |
1600.0 | 591 | 6.9% | |
7320.0 | 352 | 4.1% | |
5945.0 | 283 | 3.3% | |
3360.0 | 274 | 3.2% | |
2840.0 | 261 | 3.1% | |
1920.0 | 207 | 2.4% | |
5600.0 | 196 | 2.3% | |
6780.0 | 195 | 2.3% | |
Other values (138) | 2407 | 28.1% | |
(Missing) | 1434 | 16.8% |
Minimum 5 values
Value | Count | Frequency (%) | |
40.0 | 7 | 0.1% | |
200.0 | 9 | 0.1% | |
240.0 | 3 | 0.0% | |
320.0 | 4 | 0.0% | |
334.0 | 2 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
9040.0 | 2 | 0.0% | |
9160.0 | 4 | 0.0% | |
9260.0 | 1 | 0.0% | |
9340.0 | 2 | 0.0% | |
9360.0 | 2 | 0.0% |
usstate1
Numeric
Distinct count | 46 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 116.91 |
---|---|
Minimum | 100 |
Maximum | 199 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 100 |
---|---|
5-th percentile | 105 |
Q1 | 105 |
Median | 105 |
Q3 | 133 |
95-th percentile | 144 |
Maximum | 199 |
Range | 99 |
Interquartile range | 28 |
Descriptive statistics
Standard deviation | 18.044 |
---|---|
Coef of variation | 0.15434 |
Kurtosis | 3.0944 |
Mean | 116.91 |
MAD | 14.902 |
Skewness | 1.6245 |
Sum | 1000386 |
Variance | 325.58 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
105 | 4567 | 53.4% | |
144 | 1303 | 15.2% | |
114 | 596 | 7.0% | |
133 | 255 | 3.0% | |
103 | 232 | 2.7% | |
110 | 198 | 2.3% | |
138 | 100 | 1.2% | |
106 | 99 | 1.2% | |
199 | 98 | 1.1% | |
134 | 95 | 1.1% | |
Other values (36) | 1014 | 11.8% |
Minimum 5 values
Value | Count | Frequency (%) | |
100 | 9 | 0.1% | |
102 | 1 | 0.0% | |
103 | 232 | 2.7% | |
104 | 59 | 0.7% | |
105 | 4567 | 53.4% |
Maximum 5 values
Value | Count | Frequency (%) | |
148 | 60 | 0.7% | |
150 | 9 | 0.1% | |
151 | 44 | 0.5% | |
153 | 5 | 0.1% | |
199 | 98 | 1.1% |
usstatel
Numeric
Distinct count | 47 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 116.78 |
---|---|
Minimum | 100 |
Maximum | 199 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 100 |
---|---|
5-th percentile | 105 |
Q1 | 105 |
Median | 105 |
Q3 | 132 |
95-th percentile | 144 |
Maximum | 199 |
Range | 99 |
Interquartile range | 27 |
Descriptive statistics
Standard deviation | 17.709 |
---|---|
Coef of variation | 0.15165 |
Kurtosis | 3.2972 |
Mean | 116.78 |
MAD | 14.516 |
Skewness | 1.6552 |
Sum | 999255 |
Variance | 313.61 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
105 | 4476 | 52.3% | |
144 | 1134 | 13.3% | |
114 | 627 | 7.3% | |
133 | 260 | 3.0% | |
110 | 236 | 2.8% | |
103 | 200 | 2.3% | |
106 | 121 | 1.4% | |
129 | 119 | 1.4% | |
134 | 119 | 1.4% | |
138 | 102 | 1.2% | |
Other values (37) | 1163 | 13.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
100 | 11 | 0.1% | |
102 | 1 | 0.0% | |
103 | 200 | 2.3% | |
104 | 39 | 0.5% | |
105 | 4476 | 52.3% |
Maximum 5 values
Value | Count | Frequency (%) | |
148 | 72 | 0.8% | |
150 | 14 | 0.2% | |
151 | 59 | 0.7% | |
153 | 4 | 0.0% | |
199 | 93 | 1.1% |
ustrips
Numeric
Distinct count | 44 |
---|---|
Unique (%) | 0.5% |
Missing (%) | 0.1% |
Missing (n) | 8 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 3.3669 |
---|---|
Minimum | 1 |
Maximum | 44 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 1 |
Q1 | 1 |
Median | 2 |
Q3 | 3 |
95-th percentile | 12 |
Maximum | 44 |
Range | 43 |
Interquartile range | 2 |
Descriptive statistics
Standard deviation | 4.5687 |
---|---|
Coef of variation | 1.3569 |
Kurtosis | 18.173 |
Mean | 3.3669 |
MAD | 2.7375 |
Skewness | 3.7383 |
Sum | 28784 |
Variance | 20.873 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 3715 | 43.4% | |
2.0 | 1893 | 22.1% | |
3.0 | 874 | 10.2% | |
4.0 | 489 | 5.7% | |
5.0 | 311 | 3.6% | |
6.0 | 211 | 2.5% | |
7.0 | 159 | 1.9% | |
8.0 | 127 | 1.5% | |
10.0 | 126 | 1.5% | |
9.0 | 117 | 1.4% | |
Other values (33) | 527 | 6.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 3715 | 43.4% | |
2.0 | 1893 | 22.1% | |
3.0 | 874 | 10.2% | |
4.0 | 489 | 5.7% | |
5.0 | 311 | 3.6% |
Maximum 5 values
Value | Count | Frequency (%) | |
40.0 | 1 | 0.0% | |
41.0 | 1 | 0.0% | |
42.0 | 4 | 0.0% | |
43.0 | 2 | 0.0% | |
44.0 | 2 | 0.0% |
uswage1
Numeric
Distinct count | 386 |
---|---|
Unique (%) | 4.5% |
Missing (%) | 41.4% |
Missing (n) | 3545 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 35.761 |
---|---|
Minimum | 0.03 |
Maximum | 10000 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 0.03 |
---|---|
5-th percentile | 0.5 |
Q1 | 2 |
Median | 3.5 |
Q3 | 6 |
95-th percentile | 200 |
Maximum | 10000 |
Range | 10000 |
Interquartile range | 4 |
Descriptive statistics
Standard deviation | 248.94 |
---|---|
Coef of variation | 6.9613 |
Kurtosis | 1059.4 |
Mean | 35.761 |
MAD | 57.605 |
Skewness | 29.428 |
Sum | 179230 |
Variance | 61972 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
5.0 | 266 | 3.1% | |
3.0 | 265 | 3.1% | |
6.0 | 202 | 2.4% | |
4.0 | 186 | 2.2% | |
2.5 | 182 | 2.1% | |
1.0 | 156 | 1.8% | |
3.5 | 152 | 1.8% | |
2.0 | 148 | 1.7% | |
0.5 | 125 | 1.5% | |
4.5 | 116 | 1.4% | |
Other values (375) | 3214 | 37.6% | |
(Missing) | 3545 | 41.4% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.03 | 1 | 0.0% | |
0.04 | 1 | 0.0% | |
0.05 | 2 | 0.0% | |
0.09 | 1 | 0.0% | |
0.1 | 7 | 0.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
2000.0 | 1 | 0.0% | |
2400.0 | 1 | 0.0% | |
8000.0 | 1 | 0.0% | |
9000.0 | 1 | 0.0% | |
10000.0 | 1 | 0.0% |
uswagel
Numeric
Distinct count | 482 |
---|---|
Unique (%) | 5.6% |
Missing (%) | 33.0% |
Missing (n) | 2825 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 83.596 |
---|---|
Minimum | 0.03 |
Maximum | 100000 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 0.03 |
---|---|
5-th percentile | 0.87 |
Q1 | 3.2 |
Median | 5 |
Q3 | 8.5 |
95-th percentile | 290 |
Maximum | 100000 |
Range | 100000 |
Interquartile range | 5.3 |
Descriptive statistics
Standard deviation | 1595.9 |
---|---|
Coef of variation | 19.09 |
Kurtosis | 2784.4 |
Mean | 83.596 |
MAD | 142.84 |
Skewness | 48.345 |
Sum | 479170 |
Variance | 2546800 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
5.0 | 378 | 4.4% | |
6.0 | 286 | 3.3% | |
7.0 | 258 | 3.0% | |
3.0 | 219 | 2.6% | |
8.0 | 204 | 2.4% | |
4.0 | 204 | 2.4% | |
4.5 | 171 | 2.0% | |
10.0 | 168 | 2.0% | |
2.5 | 154 | 1.8% | |
4.25 | 128 | 1.5% | |
Other values (471) | 3562 | 41.6% | |
(Missing) | 2825 | 33.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.03 | 1 | 0.0% | |
0.07 | 1 | 0.0% | |
0.1 | 4 | 0.0% | |
0.11 | 1 | 0.0% | |
0.12 | 2 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
25000.0 | 1 | 0.0% | |
25800.0 | 1 | 0.0% | |
27000.0 | 2 | 0.0% | |
37000.0 | 1 | 0.0% | |
100000.0 | 1 | 0.0% |
usyr1
Numeric
Distinct count | 103 |
---|---|
Unique (%) | 1.2% |
Missing (%) | 0.0% |
Missing (n) | 2 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1977.6 |
---|---|
Minimum | 1906 |
Maximum | 2016 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1906 |
---|---|
5-th percentile | 1947 |
Q1 | 1968 |
Median | 1980 |
Q3 | 1990 |
95-th percentile | 2001 |
Maximum | 2016 |
Range | 110 |
Interquartile range | 22 |
Descriptive statistics
Standard deviation | 16.65 |
---|---|
Coef of variation | 0.0084192 |
Kurtosis | -0.18754 |
Mean | 1977.6 |
MAD | 13.408 |
Skewness | -0.52274 |
Sum | 16919000 |
Variance | 277.23 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1979.0 | 266 | 3.1% | |
1985.0 | 253 | 3.0% | |
1986.0 | 248 | 2.9% | |
1988.0 | 242 | 2.8% | |
1980.0 | 241 | 2.8% | |
1990.0 | 239 | 2.8% | |
1978.0 | 218 | 2.5% | |
1989.0 | 217 | 2.5% | |
1984.0 | 214 | 2.5% | |
1973.0 | 204 | 2.4% | |
Other values (92) | 6213 | 72.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
1906.0 | 1 | 0.0% | |
1912.0 | 1 | 0.0% | |
1914.0 | 1 | 0.0% | |
1915.0 | 2 | 0.0% | |
1917.0 | 1 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
2012.0 | 9 | 0.1% | |
2013.0 | 4 | 0.0% | |
2014.0 | 4 | 0.0% | |
2015.0 | 2 | 0.0% | |
2016.0 | 1 | 0.0% |
usyrl
Numeric
Distinct count | 98 |
---|---|
Unique (%) | 1.1% |
Missing (%) | 0.0% |
Missing (n) | 2 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1984.5 |
---|---|
Minimum | 1914 |
Maximum | 2016 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1914 |
---|---|
5-th percentile | 1955 |
Q1 | 1977 |
Median | 1988 |
Q3 | 1995 |
95-th percentile | 2005 |
Maximum | 2016 |
Range | 102 |
Interquartile range | 18 |
Descriptive statistics
Standard deviation | 14.991 |
---|---|
Coef of variation | 0.0075539 |
Kurtosis | 0.50739 |
Mean | 1984.5 |
MAD | 11.797 |
Skewness | -0.81362 |
Sum | 16977000 |
Variance | 224.72 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1988.0 | 377 | 4.4% | |
1990.0 | 372 | 4.3% | |
1991.0 | 343 | 4.0% | |
1989.0 | 326 | 3.8% | |
1995.0 | 265 | 3.1% | |
1994.0 | 256 | 3.0% | |
1986.0 | 243 | 2.8% | |
1987.0 | 234 | 2.7% | |
2000.0 | 222 | 2.6% | |
1998.0 | 222 | 2.6% | |
Other values (87) | 5695 | 66.6% |
Minimum 5 values
Value | Count | Frequency (%) | |
1914.0 | 1 | 0.0% | |
1915.0 | 2 | 0.0% | |
1918.0 | 1 | 0.0% | |
1921.0 | 3 | 0.0% | |
1923.0 | 1 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
2012.0 | 13 | 0.2% | |
2013.0 | 16 | 0.2% | |
2014.0 | 7 | 0.1% | |
2015.0 | 6 | 0.1% | |
2016.0 | 16 | 0.2% |
weight
Numeric
Distinct count | 207 |
---|---|
Unique (%) | 2.4% |
Missing (%) | 0.0% |
Missing (n) | 0 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 8.1477 |
---|---|
Minimum | 0 |
Maximum | 100 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 0 |
---|---|
5-th percentile | 1 |
Q1 | 2.99 |
Median | 4.8853 |
Q3 | 8.8 |
95-th percentile | 26.85 |
Maximum | 100 |
Range | 100 |
Interquartile range | 5.81 |
Descriptive statistics
Standard deviation | 11.034 |
---|---|
Coef of variation | 1.3543 |
Kurtosis | 27.011 |
Mean | 8.1477 |
MAD | 5.853 |
Skewness | 4.5607 |
Sum | 69719 |
Variance | 121.75 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1.0 | 491 | 5.7% | |
4.7 | 210 | 2.5% | |
1.25 | 154 | 1.8% | |
2.55 | 143 | 1.7% | |
9.63 | 123 | 1.4% | |
2.99 | 122 | 1.4% | |
6.98 | 121 | 1.4% | |
8.47 | 113 | 1.3% | |
9.81 | 110 | 1.3% | |
1.95 | 106 | 1.2% | |
Other values (197) | 6864 | 80.2% |
Minimum 5 values
Value | Count | Frequency (%) | |
0.0 | 1 | 0.0% | |
1.0 | 491 | 5.7% | |
1.023 | 41 | 0.5% | |
1.0714 | 48 | 0.6% | |
1.12 | 37 | 0.4% |
Maximum 5 values
Value | Count | Frequency (%) | |
60.17 | 11 | 0.1% | |
68.06 | 20 | 0.2% | |
74.27 | 11 | 0.1% | |
81.45 | 20 | 0.2% | |
100.0 | 32 | 0.4% |
welfare
Numeric
Distinct count | 3 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 5.4% |
Missing (n) | 458 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1.9518 |
---|---|
Minimum | 1 |
Maximum | 2 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1 |
---|---|
5-th percentile | 2 |
Q1 | 2 |
Median | 2 |
Q3 | 2 |
95-th percentile | 2 |
Maximum | 2 |
Range | 1 |
Interquartile range | 0 |
Descriptive statistics
Standard deviation | 0.2141 |
---|---|
Coef of variation | 0.10969 |
Kurtosis | 15.828 |
Mean | 1.9518 |
MAD | 0.091671 |
Skewness | -4.2218 |
Sum | 15808 |
Variance | 0.045841 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
2.0 | 7709 | 90.1% | |
1.0 | 390 | 4.6% | |
(Missing) | 458 | 5.4% |
Minimum 5 values
Value | Count | Frequency (%) | |
1.0 | 390 | 4.6% | |
2.0 | 7709 | 90.1% |
Maximum 5 values
Value | Count | Frequency (%) | |
1.0 | 390 | 4.6% | |
2.0 | 7709 | 90.1% |
wic
Categorical
Distinct count | 4 |
---|---|
Unique (%) | 0.0% |
Missing (%) | 49.3% |
Missing (n) | 4219 |
1.0 | 198 |
---|---|
2.0 | 90 |
(Missing) |
Value | Count | Frequency (%) | |
4050 | 47.3% | ||
1.0 | 198 | 2.3% | |
2.0 | 90 | 1.1% | |
(Missing) | 4219 | 49.3% |
yrborn
Numeric
Distinct count | 102 |
---|---|
Unique (%) | 1.2% |
Missing (%) | 0.0% |
Missing (n) | 3 |
Infinite (%) | 0.0% |
Infinite (n) | 0 |
Mean | 1952.1 |
---|---|
Minimum | 1889 |
Maximum | 1994 |
Zeros (%) | 0.0% |
Quantile statistics
Minimum | 1889 |
---|---|
5-th percentile | 1922 |
Q1 | 1940 |
Median | 1955 |
Q3 | 1965 |
95-th percentile | 1977 |
Maximum | 1994 |
Range | 105 |
Interquartile range | 25 |
Descriptive statistics
Standard deviation | 17.15 |
---|---|
Coef of variation | 0.0087856 |
Kurtosis | -0.32041 |
Mean | 1952.1 |
MAD | 14.054 |
Skewness | -0.42559 |
Sum | 16698000 |
Variance | 294.13 |
Memory size | 66.9 KiB |
Value | Count | Frequency (%) | |
1963.0 | 254 | 3.0% | |
1965.0 | 230 | 2.7% | |
1960.0 | 223 | 2.6% | |
1955.0 | 221 | 2.6% | |
1956.0 | 218 | 2.5% | |
1961.0 | 215 | 2.5% | |
1966.0 | 197 | 2.3% | |
1954.0 | 193 | 2.3% | |
1968.0 | 191 | 2.2% | |
1962.0 | 190 | 2.2% | |
Other values (91) | 6422 | 75.0% |
Minimum 5 values
Value | Count | Frequency (%) | |
1889.0 | 1 | 0.0% | |
1893.0 | 1 | 0.0% | |
1894.0 | 1 | 0.0% | |
1896.0 | 1 | 0.0% | |
1898.0 | 2 | 0.0% |
Maximum 5 values
Value | Count | Frequency (%) | |
1990.0 | 4 | 0.0% | |
1991.0 | 2 | 0.0% | |
1992.0 | 1 | 0.0% | |
1993.0 | 1 | 0.0% | |
1994.0 | 1 | 0.0% |
# Ask the profile report (`profile`, built earlier in the notebook) which
# columns it flagged as rejected, passing a threshold of 0.9.
# NOTE(review): presumably the threshold is a correlation cutoff, i.e. columns
# correlated above 0.9 with another column are rejected — confirm against the
# pandas_profiling documentation for the installed version.
rejected_variables = profile.get_rejected_variables(threshold=0.9)
# Bare expression so the notebook renders the result as the cell output.
rejected_variables
['coevus', 'crsst1', 'crsyr1', 'frevus', 'hhnum', 'neevus', 'surveyyr']
Looking through the profile and the missing-data graphs, we see that many variables have a large share of missing values. We also see that many variables are very highly, or even perfectly, correlated with one another. I'm not sure how the profiler picks which of the correlated variables to keep, but it looks like it's rejecting some potentially interesting variables (e.g., it dropped 'unemp' because of perfect correlation with CRSCST21, the cost of the coyote on the 21st crossing).