# Clear the workspace, hidden (dot-prefixed) objects included, before the run.
# TRUE is spelled out in full: a bare lowercase `t` is base R's transpose
# function rather than a logical value, and `all` only reached the
# `all.names` argument through partial matching.
rm(list = ls(all.names = TRUE))

Set up filenames

# Run settings; the lines flagged with !!! are meant to be updated.
# !!!Update filename
filename <- "IDT_raw_students_NOPII"
# !!!Update helper functions file
functions_vers <- "functions_1.7.R"

Set up data and functions, and create a dictionary for dataset review

# Run the helper script whose path is stored in `functions_vers`.
# NOTE(review): `mydata` and `encode_location()` are used further down without
# being defined in this file, so they presumably come from this script --
# confirm.
source(file = functions_vers)

Visually inspect variables in "dictionary.csv" and flag for risk, using the following flags:

# Direct PII: Respondent Names, Addresses, Identification Numbers, Phone Numbers
# Direct PII-team: Interviewer Names, other field team names 
# Indirect PII-ordinal: Date of birth, Age, income, education, household composition. 
# Indirect PII-categorical: Gender, education, ethnicity, nationality,
# occupation, employer, head of household, marital status
# GPS: Longitude, Latitude
# Small Location: Location (population <100,000)
# Large Location: Location (population >100,000)
# Weight: weightVar
# Household ID: hhId
# Open-ends: Review responses for any sensitive information, redact as necessary 

Direct PII: variables to be removed

# !!!Include any Direct PII variables
# Every column named in `dropvars` is removed from `mydata`. Names listed here
# that do not occur in `mydata` are ignored without any message.
dropvars <- c(
  "student_name",
  "student_fullname",
  "no_guardian_name",
  "consent_signature",
  "consent_signature_paper",
  "guard_name",
  "guard_app",
  "guard_apm",
  "guard_nn",
  "p4a",
  "audio1_student",
  "audio2_student",
  "audio3_student",
  "ss_phone",
  "ss_gps_whereother",
  "ss_photo",
  "random_audio_ss",
  "grado2016_admin_name"
)
# Keep only the columns whose name is not in the drop list.
mydata <- mydata[!(names(mydata) %in% dropvars)]

Direct PII-team: Encode field team names

#  No Direct PII-team

Small locations: Encode locations with population <100,000 using random large numbers

#  !!!Include relevant variables, but check their population size first to confirm they are <100,000

# !!! Removed as it contains identifying information
# These columns are dropped from `mydata` outright rather than encoded. Names
# that do not occur in `mydata` are ignored without any message.
locvars <- c(
  "nombre_colegio",
  "prompt_cole_name",
  "cole2016_correct",
  "cole2016_new",
  "school2015_name1",
  "school2014_name1",
  "school2013_name1",
  "school2012_name1",
  "school2011_name1",
  "school2010_name1",
  "ss_gps_where"
)
# Keep only the columns whose name is not in the list above.
mydata <- mydata[!(names(mydata) %in% locvars)]

# !!!Include relevant variables, but check their population size first to
# confirm they are <100,000
# Each variable is listed exactly once. The vector previously repeated
# "id_grado", which handed the same column to encode_location() twice.
locvars <- c("cod_mod2016_admin", "cole2016_admin", "cole2016", "id_grado")
# encode_location() is not defined in this file (presumably it comes from the
# sourced helper script); its return value replaces `mydata`.
# NOTE(review): `missing = 999999` looks like the code used for missing
# values -- confirm against the helper's definition.
mydata <- encode_location(variables = locvars, missing = 999999)
## [1] "Frequency table before encoding"
## cod_mod2016_admin. 
## 1007160 1008440 1008929 1008960 1009844 1010040 1010149 1010180 1039676 1041516 
##       1       9       2       3       6       2       2       1       1       1 
## 1041557 1041631 1045111 1045277 1045434 1045715 1045798 1046226 1048990 1049493 
##       2      17       4       1       4       1      10       1       3       1 
## 1054154 1054196 1054352 1056902 1063106 1063148 1063221 1063304 1064989 1066026 
##       6       3       3       5       3      14       3       9       3       7 
## 1068238 1069954 1070077 1070390 1070481 1072040 1072727 1073212 1074301 1075779 
##       2       4      12       5       1       2       2       1       5       1 
## 1080068 1080258 1082031 1082874 1083633 1083674 1083716 1084508 1084987 1085851 
##       1       4       2       1       1       2       3      13       1       4 
## 1085976 1088400 1099654 1194265 1194380 1194810 1195189 1195577 1196526 1223023 
##       2       5       1      10      12       2       3       1       4       1 
## 1225549 1238229 1240720 1241454 1242908 1247832 1248392 1248509 1254192 1258334 
##       1       5       9       1       1       3      11       1       1       1 
## 1258649 1261742 1264340 1264670 1266840 1278662 1279124 1309392 1309574 1313444 
##       3       3       1       1       2       1       2       3       8       3 
## 1330315 1332220 1346675 1349448 1354091 1360957 1362318 1375211 1376870 1381342 
##       1       6       1       1       1       1       2       2       1       4 
## 1381599 1381896 1382829 1385251 1392893 1393453 1398148 1401801 1411438 1420694 
##       8       2       3       1       1       2       9       1       2       3 
## 1422666 1423615 1431667 1438027 1438035 1453232 1458850 1464668 1469675 1473511 
##       2      13       1       2       4       1       1       1       1       1 
## 1474600 1475011 1475201 1475284 1476258 1480086 1481514 1481720 1481795 1482975 
##       2      10       1       1       2       1       1       1       1       1 
## 1483627 1487339 1489822 1492255 1493964 1495365 1495407 1496314 1496355 1497007 
##       1       1       1       1       1       8       5       1       2       2 
## 1497551 1499748 1499961 1500354 1501188 1501451 1505494 1507094 1507250 1507276 
##       1       1       1       4       2      12      14      13      12       1 
## 1507532 1509108 1509496 1512789 1513159 1515360 1520279 1520287 1528520 1529981 
##      12       1       2       4       1       1       1       3       1       1 
## 1536994 1541879 1573328 1575323 1641521 1661271 1666882 1697234 1699933 1701002 
##       1       1       1       1      10       7       1       3       1       1 
##  207795  207894  207985  208058  208348  208538  208546  208561  208587  208694 
##       3       1       2       4       2       4       3       7       1       1 
##  208736  209304  209387  209510  209528  209536  209908  209916  209924  209940 
##       6       3       4       2       1       6      16       5       3       6 
##  209965  209973  210260  215632  245647  245662  245670  245688  245696  245704 
##       9       4       2       8       3       7       7      11       1       1 
##  305656  314500  317131  317214  317289  317305  317313  317370  317453  317479 
##       1       2       5       2       3       1       4       1       2       2 
##  317560  317610  317941  318063  318089  318287  318352  318741  318782  318949 
##       6       1       1       4       4       1       3       3       1       1 
##  319004  319020  319061  319145  319160  319285  320655  322479  322685  322974 
##       1       1       1       2       2       4       1       5       3       4 
##  323345  323378  325449  325464  325472  325480  325548  325563  325589  325647 
##       1       2       2       3      14       1       1      12       5       9 
##  325670  325704  327650  328047  328260  328518  328526  329151  329573  333666 
##       6       9       2       3       2       1       2       1       4       4 
##  334094  334649  334656  334664  334672  334680  334706  334714  334722  334748 
##       1       4       1       8       6       1      10       1       1      10 
##  334847  334920  334987  335042  335091  335224  336495  336537  336545  336560 
##       2       2       9       4       1       1       2       4       3       1 
##  336586  336594  336610  336628  336636  337436  337568  337592  337733  337741 
##       5       2       3       2       5       2       5       4       4       1 
##  337766  338228  338301  338343  338517  338640  338665  338848  339051  339317 
##       1       2       4       1       6       4       3       1       6       1 
##  339432  339499  339606  339804  340224  340281  340299  340315  340349  340372 
##       1       1       6       1      10       1       3      10       9       2 
##  340380  340398  340414  340422  340448  343566  432773  432906  433227  433235 
##      10       1       5       2       1       2       3       1       5       2 
##  433276  433490  433540  433680  433821  433961  434019  434076  434191  434282 
##       6       6       4       6       8       4       4       2       3       3 
##  434464  434480  434498  434506  434548  434597  434829  436170  436212  436287 
##       3       3       3       2       3       2       4       1       8       1 
##  436303  436360  436444  436451  436493  436543  436584  436634  436642  436766 
##       2       5       5       6       5       2       1       4       1       6 
##  436782  437210  437228  437236  437244  437251  437269  437277  437285  437319 
##       1       7      21      12      13       2       2      12       6       2 
##  437335  437350  437400  437509  437525  437707  437715  437723  437731  437749 
##       6       6       7       2       1       3       6       2       3       1 
##  437772  449868  466383  466730  468488  468611  469700  481853  481903  488619 
##       1      10       1      19       2       2       8       2       8      21 
##  488635  493544  495259  495812  496166  496844  497024  499699  500124  500348 
##       4      15       3       4       8       1       1       7       1       7 
##  500611  501411  501601  501676  501809  501908  502435  502633  505149  508903 
##       3       1      10       1       4       1       1       5       1       5 
##  510305  510800  513614  516674  519645  520486  521179  522318  522862  523423 
##       1       1       2       3       3       1       4       2       1       2 
##  523464  523621  523662  523761  526301  534321  535823  536029  536151  536326 
##       4       2       1       5       5       1       4       4       1      16 
##  546002  555847  555862  555946  556266  556357  556472  556548  556571  565119 
##      18       1       3       1       2       1       3       1      13       4 
##  565143  565200  565234  565267  566141  566158  566414  566430  566455  566463 
##       2       2       7       2      15       2       4       2       4       2 
##  566471  567743  567750  567768  578260  578278  578286  578336  578351  578401 
##      13       1       9       1       1       1      13       1       1       2 
##  578443  578518  578526  578534  578542  581710  581728  581736  581744  581777 
##       2      12      10      12       8       2       2       4       4       1 
##  581876  581892  581900  581991  582114  582122  582148  582163  582254  582304 
##       5       2       8       4       1       1       1       3       3       5 
##  582312  582387  582403  582411  582833  582866  582890  582932  582981  583013 
##       5      12      11       8      12       4       8       2       2       2 
##  583328  583476  583591  583922  598581  599159  599365  601492  601708  605469 
##       4       5      19       3       3       2       1       2       1       1 
##  607424  628404  628602  628842  629261  632299  632471  642801  642892  643692 
##       1       2       2       3       2       4       1       3       3       1 
##  643783  643817  644690  644880  647172  649129  649202  649947  650002  650036 
##       2       7       1       3       1       2       1       6       1      10 
##  652081  656447  659698  659722  659896  659953  662957  663005  663013  663112 
##       1       1       3       6       4       4       2       2       1       9 
##  663526  663534  663542  663559  663682  663971  664292  664698  664748  664920 
##       1       4       2       6       5      10       2      10       3       1 
##  665414  665489  691931  692434  692442  693499  693622  693655  694547  694562 
##       1       1       3      10       1      12       1       2       2       1 
##  694570  694588  694604  703215  703256  703736  703744  704072  704312  704445 
##      11      13       1       3       1       2       7       1       2       1 
##  705053  705129  705475  705772  725770  725861  728055  728196  728717  732321 
##       9       5       1       1       7       4       2       4      14       1 
##  732347  732495  739367  743773  743807  743815  743831  744540  744557  744573 
##       1       7       1      13       1       5      14       3       6       2 
##  751230  759399  759613  762120  762856  762864  762906  762914  763151  764779 
##       1       3      12       1       4       2       2       1       6       6 
##  764936  765297  765305  765313  765321  765396  765412  765859  772970  773788 
##       4       7      10       3       1       6       4       1       1      12 
##  774026  774679  774703  775312  775833  775874  777656  777680  777995  778233 
##       8       1       2       1       3       3      15       5       8      14 
##  778738  779041  779868  780759  780767  780791  781278  781302  781351  781369 
##       1       2       2       1       1       2       6       9       4       7 
##  781385  781831  781930  820407  821082  824003  824813  825752  828962  832253 
##       1       3       1       4      10       1       6       1       1       1 
##  832279  832287  832303  832311  832337  834853  835058  846048  847087  855791 
##       3       2       5       5       1       2       7       1       1       2 
##  869198  870931  872515  874198  875476  879791  879817  883884  884510  884528 
##       9       4      13       1       1      12       1       1       1       2 
##  884544  884551  884593  884627  885517  900761  900795  900852  900910  901082 
##       1       2       2       1       1       3       1       3       1       2 
##  901413  901587  915256 
##       1       1       2 
## [1] "Frequency table after encoding"
## cod_mod2016_admin. 
##  463  464  465  466  467  468  469  470  471  472  473  474  475  476  477  478  479 
##    1    6    1    1    5   14    7    1   12    2    2   13    8    1    3    5    1 
##  480  481  482  483  484  485  486  487  488  489  490  491  492  493  494  495  496 
##    1    8    3    1   11    4    1   13    2    3    1   12    1    8    1    6    1 
##  497  498  499  500  501  502  503  504  505  506  507  508  509  510  511  512  513 
##    2    1    1    4    6   14    1    3    3    4    8   11    8    2    1    2    3 
##  514  515  516  517  518  519  520  521  522  523  524  525  526  527  528  529  530 
##    1    4    5    4    2    2    1    3    1    1   19    1    2    1    2    2    1 
##  531  532  533  534  535  536  537  538  539  540  541  542  543  544  545  546  547 
##    1    4    2    2    2    3    1    2    2    1    2    3   13    7   21    1    1 
##  548  549  550  551  552  553  554  555  556  557  558  559  560  561  562  563  564 
##    2    5    4    3    1    3    1    2    1    7    7    5    4    3    3    7    3 
##  565  566  567  568  569  570  571  572  573  574  575  576  577  578  579  580  581 
##    1    1    2    1   21   12    1    8    2    1    7    3    1   13    2    1    5 
##  582  583  584  585  586  587  588  589  590  591  592  593  594  595  596  597  598 
##   12    3    1    1    4    5    2    1    6    3   10    1    5    2    2    6    9 
##  599  600  601  602  603  604  605  606  607  608  609  610  611  612  613  614  615 
##    1    1    5    1    1    1    1    1    2    2    1    3    3    4    1   10    5 
##  616  617  618  619  620  621  622  623  624  625  626  627  628  629  630  631  632 
##   10    3    1    1    1    3    8    2    1    6    1   13    2    3    1    3    1 
##  633  634  635  636  637  638  639  640  641  642  643  644  645  646  647  648  649 
##    9    2    1    1    5   10    1    1    6    2    1    4    1    3    1    1    5 
##  650  651  652  653  654  655  656  657  658  659  660  661  662  663  664  665  666 
##    9    6    9    1    1    4   16    3    4    3   10    2    4    2    9    1    1 
##  667  668  669  670  671  672  673  674  675  676  677  678  679  680  681  682  683 
##    1   10    5    4    2    3    1    7    1   15    1    6    1    4    1    1    6 
##  684  685  686  687  688  689  690  691  692  693  694  695  696  697  698  699  700 
##    2    1   10    4    2    4    1    2    1    1    1    3    1    2    9    1    3 
##  701  702  703  704  705  706  707  708  709  710  711  712  713  714  715  716  717 
##    1    1    5    1    2    4    7    1    2    4    4    1    1    4    1    9    1 
##  718  719  720  721  722  723  724  725  726  727  728  729  730  731  732  733  734 
##    6    2    1   10    1    1    5    3    2    1    1    3    1    1    2    3    1 
##  735  736  737  738  739  740  741  742  743  744  745  746  747  748  749  750  751 
##    2    6    2    2    1    2   13    1    5    1   13    4    5    2    4    2    1 
##  752  753  754  755  756  757  758  759  760  761  762  763  764  765  766  767  768 
##    4    8    3    1    1    1    1    6    8   13    2    4    6    3    5    2    2 
##  769  770  771  772  773  774  775  776  777  778  779  780  781  782  783  784  785 
##    2    2    1    2    4    8    4    1    9    1    1    1    4    3   10    1    2 
##  786  787  788  789  790  791  792  793  794  795  796  797  798  799  800  801  802 
##    2    2    2    1    1    1    1    3    4   12    1    5    3    1    6   19    8 
##  803  804  805  806  807  808  809  810  811  812  813  814  815  816  817  818  819 
##    2    1    4   17    2    4    1    6    1   13    1    1    1    2    1    2    3 
##  820  821  822  823  824  825  826  827  828  829  830  831  832  833  834  835  836 
##    5    1    3    4    6    1    2   11    3    1    2    1    1    2    2    7    3 
##  837  838  839  840  841  842  843  844  845  846  847  848  849  850  851  852  853 
##    5    3    1    3    1    2    3    1    1    2    4    1    6    2    1    2    2 
##  854  855  856  857  858  859  860  861  862  863  864  865  866  867  868  869  870 
##    5    6    5   14   16    1    7    3    1   12    1    6    4   12    1    1    1 
##  871  872  873  874  875  876  877  878  879  880  881  882  883  884  885  886  887 
##   10    1    4    3    1    7    2    1    3    2    1    1    2    7   10   15   10 
##  888  889  890  891  892  893  894  895  896  897  898  899  900  901  902  903  904 
##    7    2    5    1    2    1    1    4   12    2    1    8    1   12    1   12    1 
##  905  906  907  908  909  910  911  912  913  914  915  916  917  918  919  920  921 
##    2   15    1    1    3   10    4   14   10    5    9    2    2    9    1    4    2 
##  922  923  924  925  926  927  928  929  930  931  932  933  934  935  936  937  938 
##    3    9    6    2    1    6   14    1    1    4    4    5    7    1    8    5    4 
##  939  940  941  942  943  944  945  946  947  948  949  950  951  952  953  954  955 
##    3    2    1    1    3    5    1    2    6    1    1    5    1    2    4    1    1 
##  956  957  958  959  960  961  962  963  964  965  966  967  968  969  970  971  972 
##    1    4    6    6    1    5    1    4    1    2   13    2    2    1    9    1    2 
##  973  974  975  976  977  978  979  980  981  982  983  984  985  986  987  988  989 
##    1    8    2    2   18    2    8    3   10    2    3    3    6    1    8   12    1 
##  990  991  992  993  994  995  996  997  998  999 1000 1001 1002 1003 1004 1005 1006 
##    2    1    1   12    3    1    2    1    1    3    4    4    9    1    2    3    1 
## 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 
##    2    3    4    4    2    1    1    1    3    2    3    2    1    6    2    2    3 
## 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 
##    3    1    1    2   10    1    4    4    2    2    4    7    3   10    1    2    1 
## 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 
##    2    7   11    1    3    2    1    1    1    7    3    1    4    3    4    2    1 
## 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 
##    1    4    2    2   14    1   12    1    5    3    6   12    4    4    1    4    1 
## 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 
##    6   12   12   10    3    2    4    4    5    2    1    9    1    1    6    3    1 
## 1092 1093 1094 1095 
##    1    1    2    1 
## [1] "Frequency table before encoding"
## cole2016_admin. 
## 1007160 1008440 1008929 1008960 1009844 1010040 1010149 1010180 1039676 1041516 
##       1       9       2       3       6       2       2       1       1       1 
## 1041557 1041631 1045111 1045277 1045434 1045715 1045798 1046226 1048990 1049493 
##       2      17       4       1       4       1      10       1       3       1 
## 1054154 1054196 1054352 1056902 1063106 1063148 1063221 1063304 1064989 1066026 
##       6       3       3       5       3      14       3       9       3       7 
## 1068238 1069954 1070077 1070390 1070481 1072040 1072727 1073212 1074301 1075779 
##       2       4      12       5       1       2       2       1       5       1 
## 1080068 1080258 1082031 1082874 1083633 1083674 1083716 1084508 1084987 1085851 
##       1       4       2       1       1       2       3      13       1       4 
## 1085976 1088400 1099654 1194265 1194380 1194810 1195189 1195577 1196526 1223023 
##       2       5       1      10      12       2       3       1       4       1 
## 1225549 1238229 1240720 1241454 1242908 1247832 1248392 1248509 1254192 1258334 
##       1       5       9       1       1       3      11       1       1       1 
## 1258649 1261742 1264340 1264670 1266840 1278662 1279124 1309392 1309574 1313444 
##       3       3       1       1       2       1       2       3       8       3 
## 1330315 1332220 1346675 1349448 1354091 1360957 1362318 1375211 1376870 1381342 
##       1       6       1       1       1       1       2       2       1       4 
## 1381599 1381896 1382829 1385251 1392893 1393453 1398148 1401801 1411438 1420694 
##       8       2       3       1       1       2       9       1       2       3 
## 1422666 1423615 1431667 1438027 1438035 1453232 1458850 1464668 1469675 1473511 
##       2      13       1       2       4       1       1       1       1       1 
## 1474600 1475011 1475201 1475284 1476258 1480086 1481514 1481720 1481795 1482975 
##       2      10       1       1       2       1       1       1       1       1 
## 1483627 1487339 1489822 1492255 1493964 1495365 1495407 1496314 1496355 1497007 
##       1       1       1       1       1       8       5       1       2       2 
## 1497551 1499748 1499961 1500354 1501188 1501451 1505494 1507094 1507250 1507276 
##       1       1       1       4       2      12      14      13      12       1 
## 1507532 1509108 1509496 1512789 1513159 1515360 1520279 1520287 1528520 1529981 
##      12       1       2       4       1       1       1       3       1       1 
## 1536994 1541879 1573328 1575323 1641521 1661271 1666882 1697234 1699933 1701002 
##       1       1       1       1      10       7       1       3       1       1 
##  207795  207894  207985  208058  208348  208538  208546  208561  208587  208694 
##       3       1       2       4       2       4       3       7       1       1 
##  208736  209304  209387  209510  209528  209536  209908  209916  209924  209940 
##       6       3       4       2       1       6      16       5       3       6 
##  209965  209973  210260  215632  245647  245662  245670  245688  245696  245704 
##       9       4       2       8       3       7       7      11       1       1 
##  305656  314500  317131  317214  317289  317305  317313  317370  317453  317479 
##       1       2       5       2       3       1       4       1       2       2 
##  317560  317610  317941  318063  318089  318287  318352  318741  318782  318949 
##       6       1       1       4       4       1       3       3       1       1 
##  319004  319020  319061  319145  319160  319285  320655  322479  322685  322974 
##       1       1       1       2       2       4       1       5       3       4 
##  323345  323378  325449  325464  325472  325480  325548  325563  325589  325647 
##       1       2       2       3      14       1       1      12       5       9 
##  325670  325704  327650  328047  328260  328518  328526  329151  329573  333666 
##       6       9       2       3       2       1       2       1       4       4 
##  334094  334649  334656  334664  334672  334680  334706  334714  334722  334748 
##       1       4       1       8       6       1      10       1       1      10 
##  334847  334920  334987  335042  335091  335224  336495  336537  336545  336560 
##       2       2       9       4       1       1       2       4       3       1 
##  336586  336594  336610  336628  336636  337436  337568  337592  337733  337741 
##       5       2       3       2       5       2       5       4       4       1 
##  337766  338228  338301  338343  338517  338640  338665  338848  339051  339317 
##       1       2       4       1       6       4       3       1       6       1 
##  339432  339499  339606  339804  340224  340281  340299  340315  340349  340372 
##       1       1       6       1      10       1       3      10       9       2 
##  340380  340398  340414  340422  340448  343566  432773  432906  433227  433235 
##      10       1       5       2       1       2       3       1       5       2 
##  433276  433490  433540  433680  433821  433961  434019  434076  434191  434282 
##       6       6       4       6       8       4       4       2       3       3 
##  434464  434480  434498  434506  434548  434597  434829  436170  436212  436287 
##       3       3       3       2       3       2       4       1       8       1 
##  436303  436360  436444  436451  436493  436543  436584  436634  436642  436766 
##       2       5       5       6       5       2       1       4       1       6 
##  436782  437210  437228  437236  437244  437251  437269  437277  437285  437319 
##       1       7      21      12      13       2       2      12       6       2 
##  437335  437350  437400  437509  437525  437707  437715  437723  437731  437749 
##       6       6       7       2       1       3       6       2       3       1 
##  437772  449868  466383  466730  468488  468611  469700  481853  481903  488619 
##       1      10       1      19       2       2       8       2       8      21 
##  488635  493544  495259  495812  496166  496844  497024  499699  500124  500348 
##       4      15       3       4       8       1       1       7       1       7 
##  500611  501411  501601  501676  501809  501908  502435  502633  505149  508903 
##       3       1      10       1       4       1       1       5       1       5 
##  510305  510800  513614  516674  519645  520486  521179  522318  522862  523423 
##       1       1       2       3       3       1       4       2       1       2 
##  523464  523621  523662  523761  526301  534321  535823  536029  536151  536326 
##       4       2       1       5       5       1       4       4       1      16 
##  546002  555847  555862  555946  556266  556357  556472  556548  556571  565119 
##      18       1       3       1       2       1       3       1      13       4 
##  565143  565200  565234  565267  566141  566158  566414  566430  566455  566463 
##       2       2       7       2      15       2       4       2       4       2 
##  566471  567743  567750  567768  578260  578278  578286  578336  578351  578401 
##      13       1       9       1       1       1      13       1       1       2 
##  578443  578518  578526  578534  578542  581710  581728  581736  581744  581777 
##       2      12      10      12       8       2       2       4       4       1 
##  581876  581892  581900  581991  582114  582122  582148  582163  582254  582304 
##       5       2       8       4       1       1       1       3       3       5 
##  582312  582387  582403  582411  582833  582866  582890  582932  582981  583013 
##       5      12      11       8      12       4       8       2       2       2 
##  583328  583476  583591  583922  598581  599159  599365  601492  601708  605469 
##       4       5      19       3       3       2       1       2       1       1 
##  607424  628404  628602  628842  629261  632299  632471  642801  642892  643692 
##       1       2       2       3       2       4       1       3       3       1 
##  643783  643817  644690  644880  647172  649129  649202  649947  650002  650036 
##       2       7       1       3       1       2       1       6       1      10 
##  652081  656447  659698  659722  659896  659953  662957  663005  663013  663112 
##       1       1       3       6       4       4       2       2       1       9 
##  663526  663534  663542  663559  663682  663971  664292  664698  664748  664920 
##       1       4       2       6       5      10       2      10       3       1 
##  665414  665489  691931  692434  692442  693499  693622  693655  694547  694562 
##       1       1       3      10       1      12       1       2       2       1 
##  694570  694588  694604  703215  703256  703736  703744  704072  704312  704445 
##      11      13       1       3       1       2       7       1       2       1 
##  705053  705129  705475  705772  725770  725861  728055  728196  728717  732321 
##       9       5       1       1       7       4       2       4      14       1 
##  732347  732495  739367  743773  743807  743815  743831  744540  744557  744573 
##       1       7       1      13       1       5      14       3       6       2 
##  751230  759399  759613  762120  762856  762864  762906  762914  763151  764779 
##       1       3      12       1       4       2       2       1       6       6 
##  764936  765297  765305  765313  765321  765396  765412  765859  772970  773788 
##       4       7      10       3       1       6       4       1       1      12 
##  774026  774679  774703  775312  775833  775874  777656  777680  777995  778233 
##       8       1       2       1       3       3      15       5       8      14 
##  778738  779041  779868  780759  780767  780791  781278  781302  781351  781369 
##       1       2       2       1       1       2       6       9       4       7 
##  781385  781831  781930  820407  821082  824003  824813  825752  828962  832253 
##       1       3       1       4      10       1       6       1       1       1 
##  832279  832287  832303  832311  832337  834853  835058  846048  847087  855791 
##       3       2       5       5       1       2       7       1       1       2 
##  869198  870931  872515  874198  875476  879791  879817  883884  884510  884528 
##       9       4      13       1       1      12       1       1       1       2 
##  884544  884551  884593  884627  885517  900761  900795  900852  900910  901082 
##       1       2       2       1       1       3       1       3       1       2 
##  901413  901587  915256 
##       1       1       2 
## [1] "Frequency table after encoding"
## cole2016_admin. 
##  678  679  680  681  682  683  684  685  686  687  688  689  690  691  692  693  694 
##    1    7    9    8   11    2    9    4    6    1   10    1    3    7    1    1    1 
##  695  696  697  698  699  700  701  702  703  704  705  706  707  708  709  710  711 
##    5    4    4    5    8    5    2    1    1    2    1    1    2    1    4    4    2 
##  712  713  714  715  716  717  718  719  720  721  722  723  724  725  726  727  728 
##    1   12   21    1    6    2    8    4    5    2   12    2    4    1    1    1    9 
##  729  730  731  732  733  734  735  736  737  738  739  740  741  742  743  744  745 
##    1    2    1   12    2    4    2    3    4    1   10    1    5   11    3    4    6 
##  746  747  748  749  750  751  752  753  754  755  756  757  758  759  760  761  762 
##    1    5    8    7   10    5    1    2    1    2    6    2    1    3    9    2    8 
##  763  764  765  766  767  768  769  770  771  772  773  774  775  776  777  778  779 
##    1    1    1    7    2    4    1    2    1    2    5    7    2    4   10   13    2 
##  780  781  782  783  784  785  786  787  788  789  790  791  792  793  794  795  796 
##    9    1    3   14    1    1    1   12    4    7    6    2    1    2    1   13    1 
##  797  798  799  800  801  802  803  804  805  806  807  808  809  810  811  812  813 
##    5    2    4    1    1   13    1    2    4    8    1    2    3    1    6    1    1 
##  814  815  816  817  818  819  820  821  822  823  824  825  826  827  828  829  830 
##    2    1    5    3    2   12    7    3    4    1    1    1    2    4    1    1    3 
##  831  832  833  834  835  836  837  838  839  840  841  842  843  844  845  846  847 
##    2    6    1    2    4    2    1    6   12    1   14   10    3   13    1    1    1 
##  848  849  850  851  852  853  854  855  856  857  858  859  860  861  862  863  864 
##    1    4    6    3    1    1    1    3    6    2    5    3    2    3    2    3    9 
##  865  866  867  868  869  870  871  872  873  874  875  876  877  878  879  880  881 
##    1    2    4    6    6    4    1   11   12    1    4   15    4    3    9    3    1 
##  882  883  884  885  886  887  888  889  890  891  892  893  894  895  896  897  898 
##    5    1    1    1   12    2    2    9    8    7    4    1    1    1    1    7    1 
##  899  900  901  902  903  904  905  906  907  908  909  910  911  912  913  914  915 
##    5    3    2    3   13    1    6   10    1    1   10    1    8    2    8   10    1 
##  916  917  918  919  920  921  922  923  924  925  926  927  928  929  930  931  932 
##    1    2    1    2    3    2    8    6   10    2    1    1    4   10    4    1    1 
##  933  934  935  936  937  938  939  940  941  942  943  944  945  946  947  948  949 
##    5    2    4    3    1    3    1    2    6    1    1    7    1    4    3    4    2 
##  950  951  952  953  954  955  956  957  958  959  960  961  962  963  964  965  966 
##    2    3    1    1    1    2    1    4    5    4    4    3    9    4    1    5    2 
##  967  968  969  970  971  972  973  974  975  976  977  978  979  980  981  982  983 
##    1    3   21    1    2    2    1    7    3    1    2    1    2    2    2    1    5 
##  984  985  986  987  988  989  990  991  992  993  994  995  996  997  998  999 1000 
##    2    1    3    4    1    1    4    3    1    4    5   12   10    2   12    2    5 
## 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 
##    1    5    3    2    2    4    2    4    2   12    3   10    3    2    2   13   12 
## 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 
##   16    1    3    6    1    1   15    1   18    2    2   12    6    1    4   10    1 
## 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 
##    1    1    1    1    1    3    2    1   15    2    7    2   12    1    3    9    1 
## 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 
##    3    1    4    3    1    1    5    2    3   14    6    1    5    5    1    2    1 
## 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 
##   13    4    9    2    2    1    1    4    1    1    2    2    1    2   10    2    1 
## 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 
##   14    1    1    2    1    1    3    2    4    1    3    2    1    6    1    2    2 
## 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 
##    3    5    2    1   12    4    8    6    5    2    1    1    7    4    2    1    2 
## 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 
##    3    6    2    1    6    6    3    2    2    1    1    4    5    4    1    3    1 
## 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 
##    1    1    4    1    1    3    1    1   10    1    1    2   19    7    4    4    1 
## 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 
##   10    1   14   11    1    3    3    2    1    6   13    2    3    8    2    6    1 
## 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 
##    3    2    3    1   14    1    1    7    1    1    3    3    1    1    3    1    1 
## 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 
##    1    1    5    2    2    1    1    5   13    1    9    2    1    1    4    3    1 
## 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 
##    2    1    1    1    3   13   12    2    1    1    3    2    9    1    1    1    2 
## 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 
##    1    2    3    1    4    6    2    4   19    3    3    1    1    2    1    1    7 
## 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 
##    2    6    3    1    2    1   10    5    1    8    1    1    9    4    1    4    8 
## 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 
##    2    5    1    2    1    1    1    7    3    2    2   16   10    1    1    4    3 
## 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 
##    2    1    4    3    2    3    1    4    2    1    4    3    6    2    1    6    5 
## 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 
##   17    3    4    1    1    3    8    1    6    5    1    8    1    1    2    1    3 
## 1307 1308 1309 1310 
##    3    1    1    1 
## [1] "Frequency table before encoding"
## cole2016. 
##         1007160 1008440 1008929 1008960 1009844 1010040 1010149 1010180 1039676 
##     170       1       9       2       2       6       1       2       1       1 
## 1041557 1041631 1045111 1045277 1045434 1045715 1045798 1046226 1048990 1049493 
##       2      17       3       1       4       1       7       1       2       1 
## 1054154 1054196 1054352 1055904 1056902 1057637 1063106 1063148 1063221 1063304 
##       4       2       1       1       5       1       1      12       3       9 
## 1064989 1066026 1068238 1069954 1070077 1070390 1070481 1072040 1072727 1074301 
##       2       6       1       4      12       3       1       2       2       5 
## 1080068 1080258 1082031 1082874 1083633 1083674 1083716 1084508 1085851 1085976 
##       1       1       2       1       1       2       3      10       4       2 
## 1088400 1099597 1099654 1194265 1194380 1194810 1195577 1196526 1197904 1207430 
##       5       1       1       8       9       2       1       3       1       1 
## 1223023 1225549 1226422 1228154 1238229 1240720 1241454 1241983 1242270 1242908 
##       1       1       1       1       5       9       1       1       1       1 
## 1244102 1247832 1248392 1254192 1257450 1258334 1258649 1261742 1263813 1264670 
##       1       3      10       1       2       1       3       3       1       1 
## 1265743 1266840 1267038 1278662 1302322 1309392 1309574 1313444 1330315 1332220 
##       1       1       1       1       1       2       4       3       1       6 
## 1335546 1346675 1349448 1354091 1360957 1362318 1375211 1376870 1381342 1381599 
##       1       1       1       1       1       2       2       1       4       6 
## 1381896 1382829 1385251 1392893 1393453 1398148 1401801 1402064 1411438 1412790 
##       2       3       1       1       2       9       1       1       1       1 
## 1420694 1422666 1423615 1431667 1438027 1438035 1453232 1458850 1464668 1469675 
##       3       2      13       1       2       5       1       1       1       1 
## 1475011 1475201 1475532 1480086 1481514 1481720 1481795 1482975 1483239 1483627 
##       9       1       1       1       1       1       1       1       1       1 
## 1487008 1487339 1489822 1492149 1492255 1495365 1495407 1496314 1496355 1497007 
##       1       1       1       1       1       5       3       1       2       1 
## 1497056 1497551 1499300 1499961 1500354 1501188 1501451 1505494 1505601 1507094 
##       1       1       1       1       4       2      10      14       1      13 
## 1507250 1507276 1507532 1507557 1509108 1509181 1509496 1512789 1513159 1515360 
##      12       1      11       1       1       2       2       2       1       1 
## 1519149 1520279 1520287 1522291 1528520 1529981 1541879 1573328 1575323 1641521 
##       1       1       2       1       1       1       1       1       1      10 
## 1661271 1664044 1666882 1697234 1698489 1699933 1701002  207795  207985  208058 
##       7       1       1       3       1       1       1       3       2       4 
##  208348  208538  208546  208561  208587  208736  209304  209387  209510  209528 
##       1       4       2       7       1       5       3       4       2       2 
##  209536  209908  209916  209924  209940  209965  209973  210260  215632  245647 
##       6      14       5       3       3       9       3       2       8       3 
##  245662  245670  245688  245696  245704  305656  314500  317131  317214  317289 
##       6       6      11       1       1       1       2       5       2       3 
##  317305  317313  317370  317453  317479  317560  317610  318063  318089  318287 
##       1       4       1       2       2       6       1       3       4       1 
##  318352  318741  318949  319020  319061  319145  319160  319285  320655  322479 
##       3       2       1       1       1       2       1       4       1       2 
##  322685  322958  322974  323345  323378  323451  325449  325456  325464  325472 
##       2       1       4       1       2       1       2       1       3      12 
##  325480  325548  325563  325589  325605  325647  325670  325704  327650  328047 
##       1       1      10       5       1       9       5      10       2       3 
##  328260  328518  328526  329151  329573  333674  334094  334649  334656  334664 
##       2       1       2       1       3       1       1       4       1       8 
##  334672  334680  334706  334714  334722  334748  334771  334847  334896  334920 
##       4       1      10       1       1       9       1       2       1       2 
##  334987  335042  335091  335224  336495  336537  336545  336560  336586  336594 
##       8       4       1       1       2       3       3       1       5       2 
##  336610  336628  336636  337436  337568  337592  337733  337741  337766  338228 
##       3       3       5       2       5       4       4       1       1       2 
##  338301  338343  338517  338640  338665  338848  339051  339317  339432  339499 
##       4       1       6       3       3       1       5       1       1       1 
##  339606  339804  340224  340281  340299  340315  340349  340372  340380  340398 
##       6       1       9       1       3      10       9       2      10       1 
##  340414  340422  340448  343566  432773  432906  433227  433235  433276  433490 
##       5       2       1       2       3       1       3       2       3       6 
##  433540  433680  433821  433961  434019  434076  434191  434282  434464  434480 
##       4       6       6       4       3       2       3       2       3       3 
##  434498  434506  434548  434597  434829  436170  436212  436287  436303  436360 
##       2       2       3       2       4       1       7       1       2       5 
##  436444  436451  436493  436543  436584  436634  436642  436667  436766  436782 
##       5       6       5       2       1       2       1       1       6       1 
##  437210  437228  437236  437244  437251  437269  437277  437285  437319  437335 
##       6      19      12      13       2       3      12       6       1       4 
##  437350  437400  437475  437509  437525  437707  437715  437723  437731  437749 
##       6       7       1       2       1       3       6       2       3       1 
##  437772  449868  466730  468488  468611  469700  481903  488619  488635  493544 
##       1       9      18       2       2       9       7      19       2      14 
##  493635  494732  495259  495812  496166  496844  498824  499699  500124  500348 
##       1       1       3       4       5       1       1       7       1       6 
##  500611  501601  501676  501809  502435  502633  508903  510305  510800  513614 
##       2      10       1       4       1       2       5       1       1       2 
##  516674  516773  519645  520486  521179  522318  522862  523423  523464  523621 
##       3       1       3       1       4       2       1       2       4       2 
##  523662  523761  526301  534321  535823  536029  536151  536326  546002  555847 
##       1       4       4       1       4       4       1      15      14       1 
##  555862  556266  556357  556472  556548  556571  565119  565143  565200  565234 
##       2       2       1       2       1      12       3       1       2       6 
##  565267  566141  566158  566414  566430  566455  566463  566471  567743  567750 
##       2      14       2       4       2       4       2      12       1       8 
##  567768  578260  578278  578286  578351  578401  578443  578518  578526  578534 
##       1       1       1      11       1       2       2      11      10       7 
##  578542  581710  581728  581736  581744  581777  581876  581892  581900  581991 
##       6       2       2       4       4       1       5       2       6       3 
##  582031  582114  582122  582148  582163  582171  582254  582304  582312  582387 
##       1       1       1       1       3       1       3       5       5      10 
##  582403  582411  582833  582866  582890  582981  583013  583328  583476  583591 
##      11       7      12       4       7       2       2       4       5      15 
##  583922  598581  599159  601492  601708  605469  607143  607424  628404  628602 
##       3       4       2       2       1       1       1       1       2       2 
##  628842  629261  632299  632471  642801  642892  643262  643692  643783  643817 
##       3       2       4       1       3       2       1       1       2       4 
##  644690  644880  647172  649129  649202  649301  649947  650002  650036  652081 
##       1       3       1       2       1       1       6       1       8       1 
##  659698  659722  659896  659953  662957  663005  663013  663112  663526  663534 
##       2       5       3       4       2       2       1       7       1       3 
##  663559  663682  663971  664292  664698  664748  665414  665489  691931  692434 
##       6       5      10       1      10       2       1       1       2      10 
##  692442  693499  693655  694547  694562  694570  694588  694604  703215  703256 
##       1       9       2       1       1      11      12       1       3       1 
##  703736  703744  704072  704312  704445  705053  705129  705475  705772  725770 
##       2       7       2       2       1       9       4       1       1       7 
##  725861  728055  728196  728717  732321  732347  732495  739367  743773  743807 
##       4       1       4      14       1       1       5       1      12       1 
##  743815  743831  744540  744557  744573  751230  759399  759613  762120  762856 
##       5      13       3       6       2       1       2      12       1       1 
##  762864  762906  762914  763151  764779  764936  765297  765305  765313  765321 
##       2       2       1       6       6       4       6      10       3       1 
##  765396  765412  773788  773903  774026  774679  774703  775833  775874  777656 
##       4       4      12       1       8       1       2       3       3      13 
##  777680  777995  778233  778738  779041  779868  780759  780791  781278  781302 
##       4       8      11       1       2       2       1       1       4       6 
##  781351  781369  781385  781831  781930  782078  820407  821082  824003  824813 
##       3       7       1       2       1       1       4       7       1       6 
##  825752  828962  831644  832253  832279  832287  832303  832311  832337  834853 
##       1       1       1       1       3       2       4       2       1       2 
##  835058  855791  869198  870931  871012  872515  874438  875476  879791  879817 
##       6       2       6       2       1      13       1       1       9       1 
##  883884  884510  884528  884551  884593  884627  885392  885517  900761  900852 
##       1       1       2       2       2       1       1       1       3       2 
##  900910  901082  901413  915256      99 
##       1       2       1       2      45 
## [1] "Frequency table after encoding"
## cole2016. 
##  490  491  492  493  494  495  496  497  498  499  500  501  502  503  504  505  506 
##    5    6    1    1    2   12    2    1    2   10    1    2   11    1    4   10    9 
##  507  508  509  510  511  512  513  514  515  516  517  518  519  520  521  522  523 
##    3    1    7   12    3    1    4    1    1    1    4    1    9    4    4    4    9 
##  524  525  526  527  528  529  530  531  532  533  534  535  536  537  538  539  540 
##    1    1    1    1    1    1    1    3    2    1    6   13    1    4    2   14    2 
##  541  542  543  544  545  546  547  548  549  550  551  552  553  554  555  556  557 
##    2    3    2   12    1    2    1   10    2    3    1    7    8    2    1    6    2 
##  558  559  560  561  562  563  564  565  566  567  568  569  570  571  572  573  574 
##   13    1    1    1    6   15    1    2    5    1    6    1    1    4    1    2    1 
##  575  576  577  578  579  580  581  582  583  584  585  586  587  588  589  590  591 
##    1    2    1    1    2   12    2    1    3    6    4    3    1    1    5    1    9 
##  592  593  594  595  596  597  598  599  600  601  602  603  604  605  606  607  608 
##    1    1    1    3    1    1    4    1    1    6    4    1    3    5    3    2    1 
##  609  610  611  612  613  614  615  616  617  618  619  620  621  622  623  624  625 
##    2    4    1    2    1    1    6    1    4    4    1    2    1    2    5    2    5 
##  626  627  628  629  630  631  632  633  634  635  636  637  638  639  640  641  642 
##    2    1    2    1    2    1    1    2    1    1    1    1    1    1   12   10   10 
##  643  644  645  646  647  648  649  650  651  652  653  654  655  656  657  658  659 
##    2    1    1    1    6    1    5    1    1    6    1    1    3    5   11    1    4 
##  660  661  662  663  664  665  666  667  668  669  670  671  672  673  674  675  676 
##    2    3    6    3    2    6   19    1    2    8    4    1    2    2    2    4    2 
##  677  678  679  680  681  682  683  684  685  686  687  688  689  690  691  692  693 
##    6    1    6    2   10    1    6   19    2    3    2    2    1    1    1    4    4 
##  694  695  696  697  698  699  700  701  702  703  704  705  706  707  708  709  710 
##    6    1    5   13    4    1    6    6    2    1    1    1    2    1    2    6    2 
##  711  712  713  714  715  716  717  718  719  720  721  722  723  724  725  726  727 
##    9    1    1    1    2    2    2    5    7    2    2    1    1    5    6   14    5 
##  728  729  730  731  732  733  734  735  736  737  738  739  740  741  742  743  744 
##    4    1    6    1    1    2    3    2    1    1    2    3    2    1    2   11    3 
##  745  746  747  748  749  750  751  752  753  754  755  756  757  758  759  760  761 
##    1    2    5    1    1    3    1    7    7    8    2    1    7    1   12    3    2 
##  762  763  764  765  766  767  768  769  770  771  772  773  774  775  776  777  778 
##   14    1    8    3    1    3    2    2    1    1    1    6    1    1    1    7    1 
##  779  780  781  782  783  784  785  786  787  788  789  790  791  792  793  794  795 
##    1   10    1   13    1    3    1    5    2    1    2    1    9    3    9    1    1 
##  796  797  798  799  800  801  802  803  804  805  806  807  808  809  810  811  812 
##    1    2   13    6    4    1    3    2    1    5    9    1    1    2    2   10    1 
##  813  814  815  816  817  818  819  820  821  822  823  824  825  826  827  828  829 
##    1    2    1   12    1    5    2   12    3    1    4   11    1    3    2    1    1 
##  830  831  832  833  834  835  836  837  838  839  840  841  842  843  844  845  846 
##   12    3    2    1    4    1    2    2    1    5    1    3    1    3    1   11    1 
##  847  848  849  850  851  852  853  854  855  856  857  858  859  860  861  862  863 
##    2    3    9    2    7    2   14    5    2    4    2    1    1    4    3    6    3 
##  864  865  866  867  868  869  870  871  872  873  874  875  876  877  878  879  880 
##    1    2    2    1    1    2    2    4    4    5    7    2    1    2    1    1    1 
##  881  882  883  884  885  886  887  888  889  890  891  892  893  894  895  896  897 
##    1    6    1    4    2   14    1    5    3    1    1    2   12    1    6    1    1 
##  898  899  900  901  902  903  904  905  906  907  908  909  910  911  912  913  914 
##    1    4  170    5    5    4    1    4    1    3    1    1    1    6    6    4    3 
##  915  916  917  918  919  920  921  922  923  924  925  926  927  928  929  930  931 
##    1    1    4    7    1    1   45    2    4    9    1    1    1    1    6    3    1 
##  932  933  934  935  936  937  938  939  940  941  942  943  944  945  946  947  948 
##    3    5    6    1    1    2    5    4    9    1    4    1    4    1    2    6    2 
##  949  950  951  952  953  954  955  956  957  958  959  960  961  962  963  964  965 
##    1    2    2    1    3    2    2    1    4   10    1    3    1    7    4    2    4 
##  966  967  968  969  970  971  972  973  974  975  976  977  978  979  980  981  982 
##    1    2    3    8    2    3    3   17    1    9    2    1    1    3   10    3   12 
##  983  984  985  986  987  988  989  990  991  992  993  994  995  996  997  998  999 
##    1    3    9    1    2    2    3    4    2    3    1    3    1    1    1    4    1 
## 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 
##    1    2    1    1   10    1    4    8    1    7    2    1    1    2   10    1    1 
## 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 
##   12    2    5    3    3    1    1    3    2    1    2    2    4    2    2    1    8 
## 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 
##    4    3   18    3    2    1    2    1   12    2   14    3    2    1    3    1    4 
## 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 
##    3    2    1    8    1    1    2    5    2    1    7   13    1    9    2    3    4 
## 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 
##    1   10    1    5    1    4    7    2    1   10    1    3    2    1   11    1    4 
## 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 
##    2    5    1    2    1    1    3    1    1    4    4    2    1   10    1    1    2 
## 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 
##    3    2    1    7    3    1   10    9    1    1    5    9    3    2    1    6    3 
## 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 
##    1    1    1   11    6    1    1    1    2    3    2    1    1   15    1    1 
## [1] "Frequency table before encoding"
## id_grado. 
##           100716010 100844010  10084407  10084408  10084409  10089297 100896010 
##       170         1         3         4         1         1         2         1 
##  10089608  10098447  10100408 101014911  10101498  10101807  10396767  10415577 
##         1         6         1         1         1         1         1         1 
##  10415579 104163110 104163111  10416317  10416318  10416319  10451116  10452776 
##         1         3         4         2         4         4         3         1 
## 104543410  10454347  10457157 104579811  10457987  10457988  10462267  10489907 
##         2         2         1         2         2         3         1         1 
##  10489908  10494937  10541549  10541967  10543529  10559047 105690211  10569027 
##         1         1         4         2         1         1         3         2 
##  10576377  10631069 106314810 106314811  10631487  10631488 106322111 106330410 
##         1         1         3         2         4         3         3         2 
## 106330411  10633047  10633048  10633049  10649897  10649898 106602611  10660267 
##         2         2         1         2         1         1         1         3 
##  10660269  10682389  10699547 107007710 107007711  10700777  10700778  10700779 
##         2         1         4         2         3         2         2         3 
##  10703906  10704817 107204011  10720409  10727277  10743017  10743018  10743019 
##         3         1         1         1         2         3         1         1 
##  10800686  10802588  10820317  10820319  10828747  10836337  10836748  10837167 
##         1         1         1         1         1         1         2         3 
## 108450810 108450811  10845087  10845089  10858517  10859767  10884006  10995977 
##         1         2         3         4         4         2         5         1 
## 109965411 119426510  11942657  11942658  11942659 119438010 119438011  11943807 
##         1         2         2         2         2         2         2         2 
##  11943808  11943809  11948107  11948109  11955779  11965266 119790411  12074309 
##         2         1         1         1         1         3         1         1 
##  12230239  12255497  12264227  12281547  12382295  12382296 124072010 124072011 
##         1         1         1         1         1         4         3         1 
##  12407207  12407208  12407209  12414547  12419838  12422707  12429088  12441027 
##         1         1         3         1         1         1         1         1 
##  12478327  12478328 124839210 124839211  12483927  12483928  12483929  12541927 
##         2         1         3         2         2         1         2         1 
##  12574509  12583347  12586496  12617426  12638137  12646708  12657437  12668407 
##         2         1         3         3         1         1         1         1 
##  12670387  12786627  13023228  13093927 130957411  13095747  13134446  13303157 
##         1         1         1         2         3         1         3         1 
##  13322207  13322208  13322209 133554610  13466757  13494487  13540917  13609577 
##         4         1         1         1         1         1         1         1 
##  13623187  13752117  13752118  13768707  13813426 138159911  13815997  13815998 
##         2         1         1         1         4         2         2         2 
##  13818967 138282911  13828298  13852517 139289310  13934538  13934539 139814810 
##         2         1         2         1         1         1         1         2 
## 139814811  13981487  13981488  13981489  14018017 140206410 141143810  14127909 
##         2         2         2         1         1         1         1         1 
##  14206947  14226667  14236159  14316677  14380276  14380277 143803510 143803511 
##         3         2        13         1         1         1         2         1 
##  14380357  14532327  14588507  14646687  14696757 147501110 147501111  14750117 
##         2         1         1         1         1         3         1         1 
##  14750118  14750119 147520111 147553210  14800867  14815147  14817207  14817957 
##         2         2         1         1         1         1         1         1 
##  14829757  14832397  14836277  14870086  14873397  14898227  14921498  14922557 
##         1         1         1         1         1         1         1         1 
## 149536511  14953657  14953659 149540711  14954077  14963147 149635510  14963559 
##         1         1         3         2         1         1         1         1 
## 149700710  14970567  14975517  14993007  14999617 150035410  15003547  15003548 
##         1         1         1         1         1         1         2         1 
##  15011887 150145111  15014517  15014519 150549410 150549411  15054947  15054948 
##         2         4         5         1         2         2         2         5 
##  15054949 150560111 150709410 150709411  15070947  15070948  15070949 150725010 
##         3         1         3         3         2         3         2         2 
## 150725011  15072508  15072509  15072766 150753210 150753211  15075327  15075328 
##         4         2         4         1         1         3         2         5 
##  15075579  15091087  15091819  15094966  15127897  15127899  15131597  15153607 
##         1         1         2         2         1         1         1         1 
##  15191499  15202796 152028711  15202879  15222917  15285207  15299817 154187911 
##         1         1         1         1         1         1         1         1 
##  15733287  15753237  16415217  16415218  16415219 166127110  16612717  16612718 
##         1         1         2         5         3         1         3         3 
##  16640447  16668827  16972347  16972348  16984898  16999337  17010027   2077956 
##         1         1         2         1         1         1         1         3 
##   2079856   2080586   2083486   2085386   2085466   2085616   2085876   2087365 
##         2         4         1         4         2         7         1         2 
##   2087366  20930411   2093047  20938710   2093877   2093879   2095107   2095287 
##         3         1         2         1         2         1         2         2 
##   2095367  20990810  20990811   2099087   2099088   2099089  20991610   2099167 
##         6         3         1         3         3         4         2         2 
##   2099168   2099247   2099407   2099408   2099409  20996510   2099657  20997310 
##         1         3         1         1         1         1         8         1 
##   2099739   2102607   2102608   2156326   2456477  24566210   2456627   2456628 
##         2         1         1         8         3         2         2         2 
##   2456707   2456887   2456967   2457047   3056567   3145007   3171316   3172146 
##         6        11         1         1         1         2         5         2 
##   3172896   3173056   3173136   3173706   3174536   3174796   3175606   3176106 
##         3         1         4         1         2         2         6         1 
##   3180636   3180896   3180897   3182876   3183526   3187416   3189496   3190206 
##         3         3         1         1         3         2         1         1 
##   3190616   3191456   3191606   3192856   3206556  32247910  32247911   3226856 
##         1         2         1         4         1         1         1         2 
##   3229586   3229746  32334510   3233786   3233787  32345111   3254497   3254567 
##         1         4         1         1         1         1         2         1 
##   3254647  32547210  32547211   3254726   3254727   3254728   3254807   3255487 
##         3         3         3         1         2         3         1         1 
##  32556310  32556311   3255637   3255638   3255639  32558910  32558911   3255897 
##         2         2         2         3         1         1         1         2 
##   3255898  32560511   3256477  32567010   3256707   3256709  32570410  32570411 
##         1         1         9         1         3         1         2         1 
##   3257047   3257048   3257049   3276507   3280476   3282606   3285186   3285266 
##         3         2         2         2         3         2         1         2 
##   3291517  32957311   3295737   3295739   3336746   3340946  33464910   3346497 
##         1         1         1         1         1         1         1         1 
##   3346498   3346567   3346647  33467211   3346727   3346807   3347067   3347147 
##         2         1         8         1         3         1        10         1 
##   3347227  33474811   3347487   3347717   3348476   3348966   3349206   3349876 
##         1         2         7         1         2         1         2         8 
##   3350426   3350916   3352246   3364957   3365377   3365457   3365608   3365867 
##         4         1         1         2         3         3         1         5 
##   3365947   3366107  33662811   3366286   3366287  33663610  33663611   3366367 
##         2         3         1         1         1         2         2         1 
##   3374367   3375687   3375927   3377337   3377338   3377417   3377667   3382286 
##         2         5         4         3         1         1         1         2 
##   3383016   3383436   3385176   3386406   3386656   3388486   3390516   3393176 
##         4         1         6         3         3         1         5         1 
##   3394326   3394996   3396066   3398046  34022411   3402247   3402818   3402997 
##         1         1         6         1         2         7         1         3 
##  34031510   3403157   3403158   3403159   3403497   3403498   3403727  34038011 
##         1         5         2         2         7         2         2         3 
##   3403807   3403808   3403809   3403987  34041411   3404147   3404227   3404487 
##         2         3         2         1         1         4         2         1 
##   3435667  43277310   4327737   4329066   4332276   4332356   4332766   4334906 
##         2         1         2         1         3         2         3         6 
##   4335406   4336806   4338216   4338217   4339616   4340196   4340766   4341916 
##         4         6         5         1         4         3         2         3 
##   4342825   4342826   4344646   4344805   4344806   4344986   4344987   4345066 
##         1         1         3         1         2         1         1         2 
##   4345486   4345976   4348296   4361706   4362126   4362876   4363036   4363606 
##         3         2         4         1         7         1         2         5 
##   4364446   4364516   4364936   4365436   4365846   4366346   4366427   4366675 
##         5         6         5         2         1         2         1         1 
##   4367666   4367827  43721011   4372109  43722810   4372287   4372289  43723610 
##         6         1         4         2         1        17         1         2 
##   4372367  43724411   4372447   4372448   4372517   4372697   4372699  43727710 
##        10         2         8         3         2         2         1         4 
##  43727711   4372777   4372778   4372779  43728511   4372857   4373199  43733510 
##         2         4         1         1         1         5         1         3 
##  43733511   4373507  43740011   4374007   4374009   4374757   4375097   4375258 
##         1         6         2         3         2         1         2         1 
##   4377077   4377157   4377237   4377317   4377497   4377727  44986810   4498687 
##         3         6         2         3         1         1         2         4 
##   4498688   4498689  46673010  46673011   4667307   4667308   4667309   4684886 
##         2         1         3         2         2         7         4         2 
##   4686116  46970010  46970011   4697007   4697008   4697009  48190310  48190311 
##         2         3         1         1         2         2         2         2 
##   4819037   4819039  48861910  48861911   4886197   4886357  49354410  49354411 
##         2         1         1         1        17         2         2         4 
##   4935447   4935448   4935449   4936358   4947329   4952597   4958127  49616610 
##         2         4         2         1         1         3         4         1 
##  49616611   4961668   4961669   4968446   4988247  49969911   4996997   4996998 
##         1         1         2         1         1         1         2         2 
##   4996999   5001247  50034811   5003487   5003489   5006117  50160110  50160111 
##         2         1         3         1         2         2         2         1 
##   5016018   5016019   5016767  50180910  50180911   5018097   5024357  50263311 
##         5         2         1         1         1         2         1         2 
##   5089036   5103056   5108006   5136146   5166746   5167737   5196457   5204867 
##         5         1         1         2         3         1         3         1 
##   5211796   5211797   5223187   5228627   5234237   5234646   5236217   5236626 
##         1         3         2         1         2         4         2         1 
##   5237616   5263016   5343217   5358237   5360297   5361517  53632610  53632611 
##         4         4         1         4         4         1         4         2 
##   5363267   5363268   5363269  54600211   5460028   5558477  55586211   5558627 
##         4         3         2         9         5         1         1         1 
##   5562667   5563576   5564729   5565486  55657110  55657111   5565717   5565718 
##         2         1         2         1         2         2         4         2 
##   5565719  56511911   5651197   5651437   5652007  56523410  56523411   5652349 
##         2         2         1         1         2         2         1         3 
##   5652677  56614111   5661417   5661418   5661419   5661587  56641411   5664147 
##         2         2         3         2         7         2         1         1 
##   5664148   5664149   5664307   5664557  56646311   5664638  56647110  56647111 
##         1         1         2         4         1         1         3         2 
##   5664717   5664719   5677437  56775011   5677507   5677509   5677687   5782607 
##         5         2         1         3         2         3         1         1 
##   5782787  57828610  57828611   5782867   5782868   5782869  57835110  57840110 
##         1         2         4         3         1         1         1         2 
##   5784437  57851810  57851811   5785187   5785188   5785189  57852610  57852611 
##         2         2         2         2         3         2         2         1 
##   5785267   5785268   5785269  57853411   5785347   5785349  57854210   5785427 
##         3         1         3         2         2         3         1         4 
##   5785428   5817107  58172810   5817288  58173610  58173611   5817367   5817368 
##         1         2         1         1         1         1         1         1 
##   5817447   5817778   5818767   5818927  58190011   5819007   5819009  58199110 
##         4         1         5         2         3         2         1         2 
##  58199111   5820317   5821147   5821227   5821487   5821637   5821718   5822547 
##         1         1         1         1         1         3         1         3 
##   5823047   5823127   5823128   5823129  58238711   5823877   5823878   5823879 
##         5         3         1         1         3         1         1         5 
##  58240310  58240311   5824037   5824038   5824039  58241111   5824117   5824118 
##         2         1         2         3         3         1         3         3 
##  58283310  58283311   5828337   5828338   5828339  58286610   5828667  58289010 
##         3         3         2         2         2         2         2         2 
##   5828907   5828908   5828909   5829817  58301311   5830137   5833287  58347611 
##         3         1         1         2         1         1         4         2 
##   5834767   5834768  58359110  58359111   5835917   5835919   5839226   5985816 
##         2         1         3         3         7         2         3         1 
##   5985817   5985818   5991597  60149210   6017087   6054698   6071439   6074246 
##         2         1         2         2         1         1         1         1 
##   6284046   6286026   6288427   6292616   6322996   6324717   6428017   6428927 
##         2         2         3         2         4         1         3         1 
##   6428929  64326210  64369210   6437837  64381711   6438177   6446907   6448807 
##         1         1         1         2         3         1         1         3 
##   6471729  64912910   6491297   6492027   6493019   6499476   6500027  65003610 
##         1         1         1         1         1         6         1         1 
##  65003611   6500367   6500369   6520816   6596986  65972210  65972211   6597227 
##         2         2         3         1         2         1         2         1 
##   6597228  65989611   6598968   6598969  65995310  65995311   6599537   6599538 
##         1         1         1         1         1         1         1         1 
##   6629577   6630057   6630137  66311211   6631127   6631128   6631129   6635267 
##         2         2         1         1         3         1         2         1 
##  66353410  66353411   6635347  66355910   6635597   6635598   6635599   6636826 
##         1         1         1         1         1         2         2         5 
##  66397110   6639718   6639719   6642927   6646987  66474811   6647487   6654146 
##         2         6         2         1        10         1         1         1 
##   6654897   6919317  69243410   6924347   6924348   6924349   6924428  69349910 
##         1         2         3         1         2         4         1         3 
##  69349911   6934997   6936557   6936558   6945479   6945629  69457010  69457011 
##         3         3         1         1         1         1         3         2 
##   6945707   6945708   6945709  69458810  69458811   6945887   6945888   6945889 
##         2         2         2         2         4         2         2         2 
##   6946047  70321510  70321511   7032158   7032567   7037366   7037447  70407210 
##         1         1         1         1         1         2         7         1 
##   7040729   7043126   7044456  70505310   7050537   7050538   7050539   7051296 
##         1         2         1         2         2         3         2         4 
##   7054757   7057727   7257707   7258617   7258619   7280557  72819611   7281968 
##         1         1         7         3         1         1         3         1 
##  72871710  72871711   7287177   7287178   7287179   7323217   7323477  73249511 
##         6         1         2         3         2         1         1         2 
##   7324957   7393677  74377310  74377311   7437737   7437738   7437739   7438077 
##         3         1         3         2         2         3         2         1 
##  74381511   7438157  74383110  74383111   7438317   7438318   7445406   7445576 
##         1         4         4         3         2         4         3         6 
##   7445737   7445738   7512307   7593996  75961310  75961311   7596137   7596138 
##         1         1         1         2         1         2         2         3 
##   7596139   7621207   7628569   7628647  76290611   7629147   7631516   7647796 
##         4         1         1         2         2         1         6         6 
##  76493610  76493611   7649367  76529711   7652977   7652978   7652979  76530511 
##         1         1         2         2         2         1         1         2 
##   7653057   7653059   7653137  76532111   7653967   7654127  77378810  77378811 
##         2         6         3         1         4         4         3         2 
##   7737887   7737888   7737889   7739036  77402610  77402611   7740267   7740268 
##         3         3         1         1         3         2         1         2 
##   7746797   7747037   7758337   7758747  77765610  77765611   7776567   7776568 
##         1         2         3         3         2         3         2         3 
##   7776569   7776807   7776809  77799510  77799511   7779957   7779958   7779959 
##         3         2         2         2         1         1         2         2 
##  77823311   7782337   7782338   7782339   7787387  77904110   7790417   7798687 
##         4         4         1         2         1         1         1         2 
##   7807599   7807916  78127810   7812788  78130210  78130211   7813027   7813516 
##         1         1         2         2         2         2         2         3 
##  78136911   7813697   7813698   7813699   7813856   7818316   7818317   7819308 
##         3         1         2         1         1         1         1         1 
##   7820787   8204076   8210826   8240036   8248136   8257526   8289626   8316447 
##         1         4         7         1         6         1         1         1 
##  [ reached getOption("max.print") -- omitted 50 entries ]
## [1] "Frequency table after encoding"
## id_grado. 
##  344  345  346  347  348  349  350  351  352  353  354  355  356  357  358  359  360 
##    2    1    3    3    3    3    1    2    8    2    4    7    1    1    5    1    1 
##  361  362  363  364  365  366  367  368  369  370  371  372  373  374  375  376  377 
##    1    2    2    3    1    2    3    3    1    2    4    2    1    2    1    7    1 
##  378  379  380  381  382  383  384  385  386  387  388  389  390  391  392  393  394 
##    1    1    4    6    4    2    2    1    2    4    1    3    1    2    3    2    1 
##  395  396  397  398  399  400  401  402  403  404  405  406  407  408  409  410  411 
##    1    1    2    1    1    2    4    1    1    1    1    1    1    2    1    1    2 
##  412  413  414  415  416  417  418  419  420  421  422  423  424  425  426  427  428 
##    1    4    2    2    7    1    5    1    1    1    1    3    3    1    3    1    2 
##  429  430  431  432  433  434  435  436  437  438  439  440  441  442  443  444  445 
##    1    4    2    1   10    2    1    1    3    2    2    1    1    2    1    1    3 
##  446  447  448  449  450  451  452  453  454  455  456  457  458  459  460  461  462 
##    1    1    1    3    2    2    1    1    1    8    9    3    1    4    2    4    2 
##  463  464  465  466  467  468  469  470  471  472  473  474  475  476  477  478  479 
##    2    1    7    1    1    1    2    1    3    1    1    6    1   10    3    4    1 
##  480  481  482  483  484  485  486  487  488  489  490  491  492  493  494  495  496 
##    1    1    2    1    3    1    3    1    5    1    1    3    2    1    1    1    3 
##  497  498  499  500  501  502  503  504  505  506  507  508  509  510  511  512  513 
##    3    2    1    2    1    2    2    4    2    2    1    2    1    2    5    2    1 
##  514  515  516  517  518  519  520  521  522  523  524  525  526  527  528  529  530 
##    1    1    1    6    1    3    2    1    1    2    2    2    2    2    2    1    1 
##  531  532  533  534  535  536  537  538  539  540  541  542  543  544  545  546  547 
##    2    1    1    1    8    1    1    1    6    1    3    1    3    2    1    5    2 
##  548  549  550  551  552  553  554  555  556  557  558  559  560  561  562  563  564 
##    3    2    2    2    1    1    2    2    2    5    2    2    1    4    5    1    1 
##  565  566  567  568  569  570  571  572  573  574  575  576  577  578  579  580  581 
##    2    3    3    1    2    1    1    2    4    2    2    3    4    1    3    2    1 
##  582  583  584  585  586  587  588  589  590  591  592  593  594  595  596  597  598 
##    2    2    1    3    3    1    1    2    2    1    1    3    1    1    3    1    1 
##  599  600  601  602  603  604  605  606  607  608  609  610  611  612  613  614  615 
##    1    1    2    4    1    3    4    2    2    1    1    1    1    2    2    2    3 
##  616  617  618  619  620  621  622  623  624  625  626  627  628  629  630  631  632 
##    1    4    1    2    2    2    2    4    4    1    2    1    4    2    1    2    1 
##  633  634  635  636  637  638  639  640  641  642  643  644  645  646  647  648  649 
##    1    1    1    2    3    2    2    3    2    1    3    1    4    2    6    1    1 
##  650  651  652  653  654  655  656  657  658  659  660  661  662  663  664  665  666 
##    2    2    1    2    1    1    1    4    1    3    1    1    1    1    1    2    2 
##  667  668  669  670  671  672  673  674  675  676  677  678  679  680  681  682  683 
##    3    1    1    3    2    1    1    3    3    4    2    1    4    1    2    1    5 
##  684  685  686  687  688  689  690  691  692  693  694  695  696  697  698  699  700 
##    2    1    4    1    2    1    1    1    1    1    1    2    2  170    3    1    3 
##  701  702  703  704  705  706  707  708  709  710  711  712  713  714  715  716  717 
##    1    1    8    1    1    6    2    3    1    3    1    4    1    2    1    1    1 
##  718  719  720  721  722  723  724  725  726  727  728  729  730  731  732  733  734 
##    1    1    1    3    3    2    1    2    4    2    3    1    2    6    1    1    1 
##  735  736  737  738  739  740  741  742  743  744  745  746  747  748  749  750  751 
##    2    7    2    1    1    2    4    1    2    2    3    2    2    2    2    2    1 
##  752  753  754  755  756  757  758  759  760  761  762  763  764  765  766  767  768 
##    3    1    2    1    1    1    1    2    2    1    2    1    1    2    3    2    3 
##  769  770  771  772  773  774  775  776  777  778  779  780  781  782  783  784  785 
##    1    1    1    1    1    1    2    2    2    5    2    1    1    3    1    2    1 
##  786  787  788  789  790  791  792  793  794  795  796  797  798  799  800  801  802 
##    3    2    1    2    1    2    4    3    1    2    2    1   11    1    2    1    2 
##  803  804  805  806  807  808  809  810  811  812  813  814  815  816  817  818  819 
##    5    3    5    1    4    4    2    2    8    2    3    2    1    2    1    3    3 
##  820  821  822  823  824  825  826  827  828  829  830  831  832  833  834  835  836 
##    1    1    2    1    1    1    3    1    6    3    3    1    1    3    1    7    1 
##  837  838  839  840  841  842  843  844  845  846  847  848  849  850  851  852  853 
##    1    1    2    3    1    3    3    1    1    3    2    1    1    6    1    2    1 
##  854  855  856  857  858  859  860  861  862  863  864  865  866  867  868  869  870 
##    2    1    1    1    2    2    1    3   10    1    1    4    3    6    2    3    1 
##  871  872  873  874  875  876  877  878  879  880  881  882  883  884  885  886  887 
##    3    1    1    1    1    1    1    7    5    4    2    1    7    1    3    1    4 
##  888  889  890  891  892  893  894  895  896  897  898  899  900  901  902  903  904 
##    1    1    1    1    1    4    3    1    2    2    2    1    2    2    2    1    2 
##  905  906  907  908  909  910  911  912  913  914  915  916  917  918  919  920  921 
##    3    2    4    1    3    2    1    1    1    2    1    1    1    1    2    1    3 
##  922  923  924  925  926  927  928  929  930  931  932  933  934  935  936  937  938 
##    2    2    1    3    1    1    1    1    1    2    3    3    1    2    2    3    5 
##  939  940  941  942  943  944  945  946  947  948  949  950  951  952  953  954  955 
##    3    1    1    1    3    3    1    3    3    1    1    4    1    1    4    2    1 
##  956  957  958  959  960  961  962  963  964  965  966  967  968  969  970  971  972 
##    4    1    1    2    3    1    2    1    1    7    2    6    4    2    4    2    1 
##  973  974  975  976  977  978  979  980  981  982  983  984  985  986  987  988  989 
##    4    1    2    1    1    3    2    1    3    1    1    1    2    2    3    1    1 
##  990  991  992  993  994  995  996  997  998  999 1000 1001 1002 1003 1004 1005 1006 
##    2    2    2    1    2    3    6    3    1    2    2    1    2    2    1    4    1 
## 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 
##    1    2    3    1    1    1    1    1    2    1    2    1    1    1    4    4    6 
## 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 
##    1    3    1    2    1    3    1    3    3    5    3    2    2    1    5    2    2 
## 1041 1042 1043 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 
##    2    1    1    1    3    4    2    1    2    5    2    1    2    2    1    1    3 
## 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 
##    2    1    3    1    1    1    1    3    1    3    2    2    6    1    1    2    1 
## 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 
##    2    3    3   13    3    1    1    2    1    5    1    1    2    1    3    1    6 
## 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 
##    6    2   17    4    1    4    8    5    1    1    1    1    1    1    2    1    1 
## 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 
##    6    1    1    2    1    1    1    7    2    1    2    1    2    1    5    2    1 
## 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 
##    4    2    1    1    1    1    1    1    2    1    1    1    1    1    2    1   21 
## 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 
##    2    1    3    2    2    3    3    2    2    1    3    2    1    1    1    1    2 
## 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 
##    3    1    2    1    1    3    1    3    3    3    4    3    1    4    1    1    1 
## 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 
##    3    1    1    3    1    1    6    1    1    1    1    1    1    1    4    3    1 
## 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 
##    2    2    1    2    2    1    1    1    3    2    1    2    1    5    1    1    1 
## 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 
##    1    1    1    1    1    2    4    5    1    1    2    2    2    4    2    2    3 
## 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 
##    3    2    1    1    6    1    1    4    2    2    1    2    3    1    1    4    1 
## 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 
##    3    1    2    1    5    2    1    2    2    1    1    1    3    2    1    1    2 
## 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 
##    1    2    1    1    6    2    1    2    1    2    4    1    7    2    2    2    1 
## 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 
##    1    1    4    9    2    2    3    1    1    2    3    3    2    1    2    2    2 
## 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 
##    1    2    1    7    2    1    2    1    1    1    2    1    3    1    1    3    1 
## 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 
##    3    4    5    2    1    2    1    1    3    3    2    2    2    1    1    1    1 
## 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 
##    1    2    2    2    2    1    1    1    1    1    6    2    3    1 
##  [ reached getOption("max.print") -- omitted 50 entries ]
## [1] "Frequency table before encoding"
## id_grado. 
##           100716010 100844010  10084407  10084408  10084409  10089297 100896010 
##       170         1         3         4         1         1         2         1 
##  10089608  10098447  10100408 101014911  10101498  10101807  10396767  10415577 
##         1         6         1         1         1         1         1         1 
##  10415579 104163110 104163111  10416317  10416318  10416319  10451116  10452776 
##         1         3         4         2         4         4         3         1 
## 104543410  10454347  10457157 104579811  10457987  10457988  10462267  10489907 
##         2         2         1         2         2         3         1         1 
##  10489908  10494937  10541549  10541967  10543529  10559047 105690211  10569027 
##         1         1         4         2         1         1         3         2 
##  10576377  10631069 106314810 106314811  10631487  10631488 106322111 106330410 
##         1         1         3         2         4         3         3         2 
## 106330411  10633047  10633048  10633049  10649897  10649898 106602611  10660267 
##         2         2         1         2         1         1         1         3 
##  10660269  10682389  10699547 107007710 107007711  10700777  10700778  10700779 
##         2         1         4         2         3         2         2         3 
##  10703906  10704817 107204011  10720409  10727277  10743017  10743018  10743019 
##         3         1         1         1         2         3         1         1 
##  10800686  10802588  10820317  10820319  10828747  10836337  10836748  10837167 
##         1         1         1         1         1         1         2         3 
## 108450810 108450811  10845087  10845089  10858517  10859767  10884006  10995977 
##         1         2         3         4         4         2         5         1 
## 109965411 119426510  11942657  11942658  11942659 119438010 119438011  11943807 
##         1         2         2         2         2         2         2         2 
##  11943808  11943809  11948107  11948109  11955779  11965266 119790411  12074309 
##         2         1         1         1         1         3         1         1 
##  12230239  12255497  12264227  12281547  12382295  12382296 124072010 124072011 
##         1         1         1         1         1         4         3         1 
##  12407207  12407208  12407209  12414547  12419838  12422707  12429088  12441027 
##         1         1         3         1         1         1         1         1 
##  12478327  12478328 124839210 124839211  12483927  12483928  12483929  12541927 
##         2         1         3         2         2         1         2         1 
##  12574509  12583347  12586496  12617426  12638137  12646708  12657437  12668407 
##         2         1         3         3         1         1         1         1 
##  12670387  12786627  13023228  13093927 130957411  13095747  13134446  13303157 
##         1         1         1         2         3         1         3         1 
##  13322207  13322208  13322209 133554610  13466757  13494487  13540917  13609577 
##         4         1         1         1         1         1         1         1 
##  13623187  13752117  13752118  13768707  13813426 138159911  13815997  13815998 
##         2         1         1         1         4         2         2         2 
##  13818967 138282911  13828298  13852517 139289310  13934538  13934539 139814810 
##         2         1         2         1         1         1         1         2 
## 139814811  13981487  13981488  13981489  14018017 140206410 141143810  14127909 
##         2         2         2         1         1         1         1         1 
##  14206947  14226667  14236159  14316677  14380276  14380277 143803510 143803511 
##         3         2        13         1         1         1         2         1 
##  14380357  14532327  14588507  14646687  14696757 147501110 147501111  14750117 
##         2         1         1         1         1         3         1         1 
##  14750118  14750119 147520111 147553210  14800867  14815147  14817207  14817957 
##         2         2         1         1         1         1         1         1 
##  14829757  14832397  14836277  14870086  14873397  14898227  14921498  14922557 
##         1         1         1         1         1         1         1         1 
## 149536511  14953657  14953659 149540711  14954077  14963147 149635510  14963559 
##         1         1         3         2         1         1         1         1 
## 149700710  14970567  14975517  14993007  14999617 150035410  15003547  15003548 
##         1         1         1         1         1         1         2         1 
##  15011887 150145111  15014517  15014519 150549410 150549411  15054947  15054948 
##         2         4         5         1         2         2         2         5 
##  15054949 150560111 150709410 150709411  15070947  15070948  15070949 150725010 
##         3         1         3         3         2         3         2         2 
## 150725011  15072508  15072509  15072766 150753210 150753211  15075327  15075328 
##         4         2         4         1         1         3         2         5 
##  15075579  15091087  15091819  15094966  15127897  15127899  15131597  15153607 
##         1         1         2         2         1         1         1         1 
##  15191499  15202796 152028711  15202879  15222917  15285207  15299817 154187911 
##         1         1         1         1         1         1         1         1 
##  15733287  15753237  16415217  16415218  16415219 166127110  16612717  16612718 
##         1         1         2         5         3         1         3         3 
##  16640447  16668827  16972347  16972348  16984898  16999337  17010027   2077956 
##         1         1         2         1         1         1         1         3 
##   2079856   2080586   2083486   2085386   2085466   2085616   2085876   2087365 
##         2         4         1         4         2         7         1         2 
##   2087366  20930411   2093047  20938710   2093877   2093879   2095107   2095287 
##         3         1         2         1         2         1         2         2 
##   2095367  20990810  20990811   2099087   2099088   2099089  20991610   2099167 
##         6         3         1         3         3         4         2         2 
##   2099168   2099247   2099407   2099408   2099409  20996510   2099657  20997310 
##         1         3         1         1         1         1         8         1 
##   2099739   2102607   2102608   2156326   2456477  24566210   2456627   2456628 
##         2         1         1         8         3         2         2         2 
##   2456707   2456887   2456967   2457047   3056567   3145007   3171316   3172146 
##         6        11         1         1         1         2         5         2 
##   3172896   3173056   3173136   3173706   3174536   3174796   3175606   3176106 
##         3         1         4         1         2         2         6         1 
##   3180636   3180896   3180897   3182876   3183526   3187416   3189496   3190206 
##         3         3         1         1         3         2         1         1 
##   3190616   3191456   3191606   3192856   3206556  32247910  32247911   3226856 
##         1         2         1         4         1         1         1         2 
##   3229586   3229746  32334510   3233786   3233787  32345111   3254497   3254567 
##         1         4         1         1         1         1         2         1 
##   3254647  32547210  32547211   3254726   3254727   3254728   3254807   3255487 
##         3         3         3         1         2         3         1         1 
##  32556310  32556311   3255637   3255638   3255639  32558910  32558911   3255897 
##         2         2         2         3         1         1         1         2 
##   3255898  32560511   3256477  32567010   3256707   3256709  32570410  32570411 
##         1         1         9         1         3         1         2         1 
##   3257047   3257048   3257049   3276507   3280476   3282606   3285186   3285266 
##         3         2         2         2         3         2         1         2 
##   3291517  32957311   3295737   3295739   3336746   3340946  33464910   3346497 
##         1         1         1         1         1         1         1         1 
##   3346498   3346567   3346647  33467211   3346727   3346807   3347067   3347147 
##         2         1         8         1         3         1        10         1 
##   3347227  33474811   3347487   3347717   3348476   3348966   3349206   3349876 
##         1         2         7         1         2         1         2         8 
##   3350426   3350916   3352246   3364957   3365377   3365457   3365608   3365867 
##         4         1         1         2         3         3         1         5 
##   3365947   3366107  33662811   3366286   3366287  33663610  33663611   3366367 
##         2         3         1         1         1         2         2         1 
##   3374367   3375687   3375927   3377337   3377338   3377417   3377667   3382286 
##         2         5         4         3         1         1         1         2 
##   3383016   3383436   3385176   3386406   3386656   3388486   3390516   3393176 
##         4         1         6         3         3         1         5         1 
##   3394326   3394996   3396066   3398046  34022411   3402247   3402818   3402997 
##         1         1         6         1         2         7         1         3 
##  34031510   3403157   3403158   3403159   3403497   3403498   3403727  34038011 
##         1         5         2         2         7         2         2         3 
##   3403807   3403808   3403809   3403987  34041411   3404147   3404227   3404487 
##         2         3         2         1         1         4         2         1 
##   3435667  43277310   4327737   4329066   4332276   4332356   4332766   4334906 
##         2         1         2         1         3         2         3         6 
##   4335406   4336806   4338216   4338217   4339616   4340196   4340766   4341916 
##         4         6         5         1         4         3         2         3 
##   4342825   4342826   4344646   4344805   4344806   4344986   4344987   4345066 
##         1         1         3         1         2         1         1         2 
##   4345486   4345976   4348296   4361706   4362126   4362876   4363036   4363606 
##         3         2         4         1         7         1         2         5 
##   4364446   4364516   4364936   4365436   4365846   4366346   4366427   4366675 
##         5         6         5         2         1         2         1         1 
##   4367666   4367827  43721011   4372109  43722810   4372287   4372289  43723610 
##         6         1         4         2         1        17         1         2 
##   4372367  43724411   4372447   4372448   4372517   4372697   4372699  43727710 
##        10         2         8         3         2         2         1         4 
##  43727711   4372777   4372778   4372779  43728511   4372857   4373199  43733510 
##         2         4         1         1         1         5         1         3 
##  43733511   4373507  43740011   4374007   4374009   4374757   4375097   4375258 
##         1         6         2         3         2         1         2         1 
##   4377077   4377157   4377237   4377317   4377497   4377727  44986810   4498687 
##         3         6         2         3         1         1         2         4 
##   4498688   4498689  46673010  46673011   4667307   4667308   4667309   4684886 
##         2         1         3         2         2         7         4         2 
##   4686116  46970010  46970011   4697007   4697008   4697009  48190310  48190311 
##         2         3         1         1         2         2         2         2 
##   4819037   4819039  48861910  48861911   4886197   4886357  49354410  49354411 
##         2         1         1         1        17         2         2         4 
##   4935447   4935448   4935449   4936358   4947329   4952597   4958127  49616610 
##         2         4         2         1         1         3         4         1 
##  49616611   4961668   4961669   4968446   4988247  49969911   4996997   4996998 
##         1         1         2         1         1         1         2         2 
##   4996999   5001247  50034811   5003487   5003489   5006117  50160110  50160111 
##         2         1         3         1         2         2         2         1 
##   5016018   5016019   5016767  50180910  50180911   5018097   5024357  50263311 
##         5         2         1         1         1         2         1         2 
##   5089036   5103056   5108006   5136146   5166746   5167737   5196457   5204867 
##         5         1         1         2         3         1         3         1 
##   5211796   5211797   5223187   5228627   5234237   5234646   5236217   5236626 
##         1         3         2         1         2         4         2         1 
##   5237616   5263016   5343217   5358237   5360297   5361517  53632610  53632611 
##         4         4         1         4         4         1         4         2 
##   5363267   5363268   5363269  54600211   5460028   5558477  55586211   5558627 
##         4         3         2         9         5         1         1         1 
##   5562667   5563576   5564729   5565486  55657110  55657111   5565717   5565718 
##         2         1         2         1         2         2         4         2 
##   5565719  56511911   5651197   5651437   5652007  56523410  56523411   5652349 
##         2         2         1         1         2         2         1         3 
##   5652677  56614111   5661417   5661418   5661419   5661587  56641411   5664147 
##         2         2         3         2         7         2         1         1 
##   5664148   5664149   5664307   5664557  56646311   5664638  56647110  56647111 
##         1         1         2         4         1         1         3         2 
##   5664717   5664719   5677437  56775011   5677507   5677509   5677687   5782607 
##         5         2         1         3         2         3         1         1 
##   5782787  57828610  57828611   5782867   5782868   5782869  57835110  57840110 
##         1         2         4         3         1         1         1         2 
##   5784437  57851810  57851811   5785187   5785188   5785189  57852610  57852611 
##         2         2         2         2         3         2         2         1 
##   5785267   5785268   5785269  57853411   5785347   5785349  57854210   5785427 
##         3         1         3         2         2         3         1         4 
##   5785428   5817107  58172810   5817288  58173610  58173611   5817367   5817368 
##         1         2         1         1         1         1         1         1 
##   5817447   5817778   5818767   5818927  58190011   5819007   5819009  58199110 
##         4         1         5         2         3         2         1         2 
##  58199111   5820317   5821147   5821227   5821487   5821637   5821718   5822547 
##         1         1         1         1         1         3         1         3 
##   5823047   5823127   5823128   5823129  58238711   5823877   5823878   5823879 
##         5         3         1         1         3         1         1         5 
##  58240310  58240311   5824037   5824038   5824039  58241111   5824117   5824118 
##         2         1         2         3         3         1         3         3 
##  58283310  58283311   5828337   5828338   5828339  58286610   5828667  58289010 
##         3         3         2         2         2         2         2         2 
##   5828907   5828908   5828909   5829817  58301311   5830137   5833287  58347611 
##         3         1         1         2         1         1         4         2 
##   5834767   5834768  58359110  58359111   5835917   5835919   5839226   5985816 
##         2         1         3         3         7         2         3         1 
##   5985817   5985818   5991597  60149210   6017087   6054698   6071439   6074246 
##         2         1         2         2         1         1         1         1 
##   6284046   6286026   6288427   6292616   6322996   6324717   6428017   6428927 
##         2         2         3         2         4         1         3         1 
##   6428929  64326210  64369210   6437837  64381711   6438177   6446907   6448807 
##         1         1         1         2         3         1         1         3 
##   6471729  64912910   6491297   6492027   6493019   6499476   6500027  65003610 
##         1         1         1         1         1         6         1         1 
##  65003611   6500367   6500369   6520816   6596986  65972210  65972211   6597227 
##         2         2         3         1         2         1         2         1 
##   6597228  65989611   6598968   6598969  65995310  65995311   6599537   6599538 
##         1         1         1         1         1         1         1         1 
##   6629577   6630057   6630137  66311211   6631127   6631128   6631129   6635267 
##         2         2         1         1         3         1         2         1 
##  66353410  66353411   6635347  66355910   6635597   6635598   6635599   6636826 
##         1         1         1         1         1         2         2         5 
##  66397110   6639718   6639719   6642927   6646987  66474811   6647487   6654146 
##         2         6         2         1        10         1         1         1 
##   6654897   6919317  69243410   6924347   6924348   6924349   6924428  69349910 
##         1         2         3         1         2         4         1         3 
##  69349911   6934997   6936557   6936558   6945479   6945629  69457010  69457011 
##         3         3         1         1         1         1         3         2 
##   6945707   6945708   6945709  69458810  69458811   6945887   6945888   6945889 
##         2         2         2         2         4         2         2         2 
##   6946047  70321510  70321511   7032158   7032567   7037366   7037447  70407210 
##         1         1         1         1         1         2         7         1 
##   7040729   7043126   7044456  70505310   7050537   7050538   7050539   7051296 
##         1         2         1         2         2         3         2         4 
##   7054757   7057727   7257707   7258617   7258619   7280557  72819611   7281968 
##         1         1         7         3         1         1         3         1 
##  72871710  72871711   7287177   7287178   7287179   7323217   7323477  73249511 
##         6         1         2         3         2         1         1         2 
##   7324957   7393677  74377310  74377311   7437737   7437738   7437739   7438077 
##         3         1         3         2         2         3         2         1 
##  74381511   7438157  74383110  74383111   7438317   7438318   7445406   7445576 
##         1         4         4         3         2         4         3         6 
##   7445737   7445738   7512307   7593996  75961310  75961311   7596137   7596138 
##         1         1         1         2         1         2         2         3 
##   7596139   7621207   7628569   7628647  76290611   7629147   7631516   7647796 
##         4         1         1         2         2         1         6         6 
##  76493610  76493611   7649367  76529711   7652977   7652978   7652979  76530511 
##         1         1         2         2         2         1         1         2 
##   7653057   7653059   7653137  76532111   7653967   7654127  77378810  77378811 
##         2         6         3         1         4         4         3         2 
##   7737887   7737888   7737889   7739036  77402610  77402611   7740267   7740268 
##         3         3         1         1         3         2         1         2 
##   7746797   7747037   7758337   7758747  77765610  77765611   7776567   7776568 
##         1         2         3         3         2         3         2         3 
##   7776569   7776807   7776809  77799510  77799511   7779957   7779958   7779959 
##         3         2         2         2         1         1         2         2 
##  77823311   7782337   7782338   7782339   7787387  77904110   7790417   7798687 
##         4         4         1         2         1         1         1         2 
##   7807599   7807916  78127810   7812788  78130210  78130211   7813027   7813516 
##         1         1         2         2         2         2         2         3 
##  78136911   7813697   7813698   7813699   7813856   7818316   7818317   7819308 
##         3         1         2         1         1         1         1         1 
##   7820787   8204076   8210826   8240036   8248136   8257526   8289626   8316447 
##         1         4         7         1         6         1         1         1 
##  [ reached getOption("max.print") -- omitted 50 entries ]
## [1] "Frequency table after encoding"
## id_grado. 
##  658  659  660  661  662  663  664  665  666  667  668  669  670  671  672  673  674 
##    3    2    2    2    1    1    1    1    4    1    1    1    1    2    3    3    1 
##  675  676  677  678  679  680  681  682  683  684  685  686  687  688  689  690  691 
##    2    2    3    1    6    4    1    8    1    2    3    2    3    2    7    1    1 
##  692  693  694  695  696  697  698  699  700  701  702  703  704  705  706  707  708 
##    4    2    1    1    1    7    2    3    2    2    5    2    1    3    1    2    3 
##  709  710  711  712  713  714  715  716  717  718  719  720  721  722  723  724  725 
##    1    1    1    1    3    3    2    2    3    3    3    4    1    8    5    2    1 
##  726  727  728  729  730  731  732  733  734  735  736  737  738  739  740  741  742 
##    1    4    2    2    1    5    1    1    4    3    2    1    1    2    1    2    3 
##  743  744  745  746  747  748  749  750  751  752  753  754  755  756  757  758  759 
##    1    1    2    1    1    1    1    4    1    1    3    1    3    2    1    3    2 
##  760  761  762  763  764  765  766  767  768  769  770  771  772  773  774  775  776 
##    1    2    3    1    5    2    2    2    3    1    2    2    2    3    1    2    4 
##  777  778  779  780  781  782  783  784  785  786  787  788  789  790  791  792  793 
##    4    2    1    2    3    4    3    4    2    1    5    6    2    2    6    1   10 
##  794  795  796  797  798  799  800  801  802  803  804  805  806  807  808  809  810 
##    3    1    2    3    1    2    1    3    3    2    1    2    1    1    1    1    1 
##  811  812  813  814  815  816  817  818  819  820  821  822  823  824  825  826  827 
##    7    1    2    1    2    2    1    1    1    2    4    1    1    6    3    4    1 
##  828  829  830  831  832  833  834  835  836  837  838  839  840  841  842  843  844 
##    1    1    1    5    1    1    1    2    2    1    1    1    6    1    3    1    2 
##  845  846  847  848  849  850  851  852  853  854  855  856  857  858  859  860  861 
##    2    1    1    1    1    1    2    3   17    2    1    2    2    1    3    2    4 
##  862  863  864  865  866  867  868  869  870  871  872  873  874  875  876  877  878 
##    1    4    1    2    1    2    2    1    1    1    2    2    3    2    1    3    2 
##  879  880  881  882  883  884  885  886  887  888  889  890  891  892  893  894  895 
##    1    1    1    3    3    1    6    1    6    1    2    1    1    2    1    1    2 
##  896  897  898  899  900  901  902  903  904  905  906  907  908  909  910  911  912 
##    2    1    1    1    2    1    1    2    1    2    1    2    3    1    1    1    6 
##  913  914  915  916  917  918  919  920  921  922  923  924  925  926  927  928  929 
##    1    5    2    2    1    1    4    1    1    4    3    6    2    2    2    1    3 
##  930  931  932  933  934  935  936  937  938  939  940  941  942  943  944  945  946 
##    1    4    3    2    1    1    1    1    2    2    3    3    1    1    2    1    1 
##  947  948  949  950  951  952  953  954  955  956  957  958  959  960  961  962  963 
##    1    2    1    1    1    1    1    1    1    1    2    1    5    1    1    1    2 
##  964  965  966  967  968  969  970  971  972  973  974  975  976  977  978  979  980 
##    1    3    5  170   10    1    1    1    2    2    1    1    2    1    1    2    2 
##  981  982  983  984  985  986  987  988  989  990  991  992  993  994  995  996  997 
##    3    2    2    1    1    4    1    2    3    3    1    1    5    4    3    1    1 
##  998  999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 
##    4    1    2    8    3    1    1    8    2    2    1    2    3    1    1    1    1 
## 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 
##    1    4    1    6    3    6    1    1    1    1    1    2    2    1    1   21    4 
## 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 
##    2    1    5    2    1    1    1    1    1    3    1    1    3    2    4    1    2 
## 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 
##    3    2    2    2    1    1    2    2    1    1    4    7    3    1    1    2    2 
## 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 
##    1    2    1    2    1    2    4    1    4    4    1    1    1    2    2    1    2 
## 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 
##    1    2    1    1    2    3    3    1    2    1    2    2    1    5    3    1    1 
## 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 
##    1    1    9    1    1    1    3    1    1    2    3    1    2    1    1    1    2 
## 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 
##    1    1    1    1    2    3    1    1    4    3    1    1    1    2    1    1    1 
## 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 
##    3    1    3    1    1    2    2    1    1    1    3    2    4    1    1    2    3 
## 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 
##    1    1    2    7    1    3    1    2    1    1    4    1    7    2    4    2    1 
## 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 
##    2    7    1    1    1    4    2    1    2    3    1    1    1    2    2    1    6 
## 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 
##    1    3    2    2    1    2   10    1    1    2    2    1    1    2    1    6    2 
## 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 
##    1    1    1    2    1    1    2    1    1    3    1    2    3    1    1    5    1 
## 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 
##    6    1    1    2    1    1    2    2    3    3    1    1    1    1    1    2    1 
## 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 
##    1    3    1    1    1    1    2    2    1    2    2    1    2    3    1    4    1 
## 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 
##    3    2    1    3    2    1    1    3    1   17    1    2    4    4    3    5    3 
## 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 
##    5    3    4    2    1    1    5    1    1    2    2    1    1    1    1    4    2 
## 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302 1303 
##    2    2    3    6    6    1    2    1    1    2    2    6    1    2    1    1    2 
## 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 
##    6    1    1    4    1    1    3    2    1    1    4    2    1    1    1    1    2 
## 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 
##    1    1    3    3    1    7    2    1    3    3    3    1    1    3    4    1    2 
## 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 
##    1    1    2    2    1    1    1    1    1    5    1    2    3    1    1    1    1 
## 1355 1356 1357 1358 1359 1360 1361 1362 1363 1364 1365 1366 1367 1368 1369 1370 1371 
##    2    1    2    4    3   11    1    2    1    2    3    8    1    1    3    2    1 
## 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 
##    4    2    7    1    2    4    5    4    6    2    2    1    3    3    2    2    2 
## 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 
##    3    3    3    2    3    1    7    1    3    1    3    1    3    1    1    4    2 
## 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 
##    7    1    6    2    3    1    1    2    1    2    1    4    1    3    2    1    2 
## 1423 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 
##    1    1    1    1    2    1    1    1    2    2    1    1    4    2    1    2    4 
## 1440 1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 
##    1    3    1    2    2    2    3    3    1    1    3    9    1    5    7    1    4 
## 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 
##    4    1    3    5    1    1    3    2    1    1    2    3    2   13    2    2    1 
## 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 
##    1    2    1    3    1    1    3    3    2    2    1    3    1    2    5    3    2 
## 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 
##    2    2    2    2    3    1    2    3    2    3    1    1    1    1    4    3    1 
## 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 
##    1    1    1    1    3    1    1    2    3    2    1    1    3    5    1    1    1 
## 1525 1526 1527 1528 1529 1530 1531 1532 1533 1534 1535 1536 1537 1538 1539 1540 1541 
##    3    1    3    2    2    3    2    3    2    2    3    1    1    2    1    3    1 
## 1542 1543 1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 1557 1558 
##    2    3    1    1    1    1    3    2    4    2    2    1    2    1    1    1    1 
## 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 
##    2    2    2    1    2    1    1    1    4    1    1    3    1    2    2    2    1 
## 1576 1577 1578 1579 1580 1581 1582 1583 1584 1585 1586 1587 1588 1589 1590 1591 1592 
##    2    2    1    2    1    2    1    1    2    2    8    3    2    1    4    1    6 
## 1593 1594 1595 1596 1597 1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609 
##    4    2    2    3    1    1    2    2    2    2    3    1    1    3    2    3    2 
## 1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622 1623 1624 1625 1626 
##    1    2    1    1    1    1    4    1    5    1    2    1    2    3    2    4    1 
## 1627 1628 1629 1630 1631 1632 1633 1634 1635 1636 1637 1638 1639 1640 1641 1642 1643 
##    4    2    1    1    1    2    3    6    1    2    1    3    3    2    3    2    1 
## 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655 1656 1657 
##    4    2    4    1    1    3    1    2    2    2    1    5    2    2 
##  [ reached getOption("max.print") -- omitted 50 entries ]

Indirect PII - Ordinal: Global recode or Top/bottom coding for extreme values

# Focus on variables with a "Lowest Freq" in dictionary of 30 or less.

# Remove birth_date_correct and i15 from the dataset.
mydata <- mydata[!names(mydata) %in% c("birth_date_correct", "i15")]

# Top-code p7a1 at the floored 99.5th percentile of its answered values;
# NA and the -97 code are left out when locating the cut-off.
percentile_99.5 <- local({
  answered <- na.exclude(mydata$p7a1)
  floor(quantile(answered[answered != -97], probs = 0.995))
})
mydata <- top_recode(variable = "p7a1", break_point = percentile_99.5, missing = -97)
## [1] "Frequency table before encoding"
## p7a1. ¿Cuántos hermanos mayores tienes que estudiaron en tu escuela el 2016?
##    1    2    3    4    5    6 <NA> 
##  376   67   20    2    1    1 1960

## [1] "Frequency table after encoding"
## p7a1. ¿Cuántos hermanos mayores tienes que estudiaron en tu escuela el 2016?
##         1         2         3 4 or more      <NA> 
##       376        67        20         4      1960

# Top-code p7b1 at the floored 99.5th percentile of its answered values;
# NA and the -97 code are left out when locating the cut-off.
percentile_99.5 <- local({
  answered <- na.exclude(mydata$p7b1)
  floor(quantile(answered[answered != -97], probs = 0.995))
})
mydata <- top_recode(variable = "p7b1", break_point = percentile_99.5, missing = -97)
## [1] "Frequency table before encoding"
## p7b1. ¿Cuántos hermanos menores tienes que estudiaron en tu escuela el 2016?
##    1    2    3    4    5 <NA> 
##  528  155   28    5    1 1710

## [1] "Frequency table after encoding"
## p7b1. ¿Cuántos hermanos menores tienes que estudiaron en tu escuela el 2016?
##         1         2         3 4 or more      <NA> 
##       528       155        28         6      1710

Indirect PII - Categorical: Recode, encode, or Top/bottom coding for extreme values

# !!!Include relevant variables in list below (Indirect PII - Categorical, and Ordinal if not processed yet)

# Variables flagged as Indirect PII (categorical). The names are generated from
# their naming patterns; the resulting vector has the same 205 names, in the
# same order, as the hand-written list it replaces.
indirect_PII <- local({
  # Expand one question stem into its family of related columns.
  item_family <- function(stem, suffixes = c("", "c", "d", "e", "_sel")) {
    paste0(stem, suffixes)
  }
  # Expand several stems in order and flatten to a plain character vector.
  expand_items <- function(stems) {
    unlist(lapply(stems, item_family), use.names = FALSE)
  }

  c(
    "attending_confirm",
    "dropout_why",
    paste0("dropout_why_", 1:14),
    "dropout_confirm",
    "highered_applied",
    "highered_confirm",
    "grado2016_confirm",
    "grado2016_correct",
    "grado2016",
    "nivel2016",
    "p14",
    "pc_15",
    "pc_16",
    "dpout_month",
    "dout_reasons",
    paste0("dout_reasons_", c(1:13, 99)),
    "p16d",
    expand_items(paste0("a", 2:10)),
    # a11 is the only item whose "_o" column is listed here.
    item_family("a11", c("", "_o", "c", "d", "e", "_sel")),
    expand_items(paste0("m", 2:11)),
    "p22a",
    "p22b",
    "p25_note",
    paste0("p25a", 1:3),
    paste0("p25", c("b", "c", "d", "e")),
    "p25_1_note1",
    paste0("p25_1", letters[1:6]),
    "p25_2g", "p25_3h", "p25_4i", "p25_5j", "p25_6k", "p25_7l", "p25_8m",
    "p25_9n", "p25_10o", "p25_11p", "p25_12q", "p25_13r", "p25_14s", "p25_14t",
    "p25_2_note",
    paste0("p25_2", letters[1:6]),
    "p25_2g1",
    "p25_2h",
    "p25_2i",
    "p27_note",
    paste0("p27", letters[1:5]),
    "p34",
    paste0("same_school", 2015:2010),
    paste0("cole_dif_", 5:11)
  )
})

capture_tables(indirect_PII)


# Recode those with very specific values. 
# !!! No Indirect PII- Categorical variables with very specific values.

Matching and crosstabulations: Run automated PII check

# Categorical key variables (quasi-identifiers) used for the k-anonymity check.
# NOTE(review): judging by the values printed for the flagged records, i17 looks
# like a birth year and grado2016_admin like a school grade -- confirm against
# the dictionary.
selectedKeyVars <- c("i17", "grado2016_admin") ##!!! Replace with candidate categorical demo vars


# Build the sdcMicro object on those key variables and print its summary.
sdcInitial <- createSdcObj(dat = mydata, keyVars = selectedKeyVars)
sdcInitial
## The input dataset consists of 2427 rows and 980 variables.
##   --> Categorical key variables: i17, grado2016_admin
## ----------------------------------------------------------------------
## Information on categorical key variables:
## 
## Reported is the number, mean size and size of the smallest category >0 for recoded variables.
## In parenthesis, the same statistics are shown for the unmodified data.
## Note: NA (missings) are counted as seperate categories!
##     Key Variable Number of categories      Mean size           Size of smallest (>0)
##              i17                   14 (14)   173.357 (173.357)                     1
##  grado2016_admin                    7  (7)   346.714 (346.714)                    12
##      
##   (1)
##  (12)
## ----------------------------------------------------------------------
## Infos on 2/3-Anonymity:
## 
## Number of observations violating
##   - 2-anonymity: 5 (0.206%)
##   - 3-anonymity: 9 (0.371%)
##   - 5-anonymity: 32 (1.319%)
## 
## ----------------------------------------------------------------------

Show the key-variable values of records that violate k-anonymity

# Flag records whose value in column 2 of the individual-risk table is below 2.
# NOTE(review): column 2 is presumably the sample frequency count (fk) of the
# record's key-variable combination -- confirm against the sdcMicro docs.
notAnon <- slot(sdcInitial, "risk")$individual[, 2] < 2 # for 2-anonymity

# Attach labels to the dataset, then list the key variables of flagged records.
mydata <- labelDataset(mydata)
mydata[notAnon, selectedKeyVars]
## # A tibble: 5 x 2
##   i17   grado2016_admin
##   <chr> <chr>          
## 1 1999  8              
## 2 1994  11             
## 3 2012  7              
## 4 1999  6              
## 5 2003  5
# Run sdcMicro's local suppression on the key variables (default settings).
sdcFinal <- localSuppression(sdcInitial)

# Recombining anonymized variables:
# print the key variables of the previously flagged records as they stand
# after suppression.
extractManipData(sdcFinal)[notAnon, selectedKeyVars] # manipulated variables HH
##       i17 grado2016_admin
## 1381 <NA>               8
## 1668 <NA>              11
## 1730 <NA>               7
## 2139 <NA>               6
## 2268 <NA>               5
mydata [notAnon,"grado2016_admin"] <- NA

Open-ends: review responses for any sensitive information, redact as necessary

# !!! Identify open-end variables here:
# Names are grouped by question family; the order is the one passed to
# report_open().
# NOTE(review): "a11_o" is dropped further down in this script but is not
# listed here - confirm whether it exists and should be reviewed as well.
open_ends <- c(
  "i16", "p4b", "p13c1", "v134",
  # a-series
  "a2_o", "a2g",
  "a3_o", "a3g",
  "a4_o", "a4g",
  "a5_o", "a5g",
  "a6_o", "a6g",
  "a7_o", "a7g",
  "a8_o", "a8g",
  "a9_o", "a9g",
  "a10_o", "a10g",
  "a11g",
  # m-series
  "m2_o", "m2g",
  "m3_o", "m3g",
  "m4_o", "m4g",
  "m5_o", "m5g",
  "m6_o", "m6g",
  "m7_o", "m7g",
  "m8_o", "m8g",
  "m9_o", "m9g",
  "m10_o", "m10g",
  "m11_o", "m11g",
  # other questions
  "q48", "p35b1",
  "pref18a", "pref18b",
  "pref19a", "pref19b",
  "pref15f", "pref16f",
  # school names, 2015 back to 2010
  "school2015_name", "school2015_name1_extra",
  "school2014_name", "school2014_name1_extra",
  "school2013_name", "school2013_name1_extra",
  "school2012_name", "school2012_name1_extra",
  "school2011_name", "school2011_name1_extra",
  "school2010_name", "school2010_name1_extra",
  "cole_dif"
)

# Hand the list to the report_open() helper
report_open(list_open_ends = open_ends)

# Review "verbatims.csv". Identify variables to be deleted or redacted and their row number
# All open-ended variables are dropped, because they contain verbatim
# responses in Spanish.
# "a11_o" is not part of open_ends but was dropped here as well, so it is added
# explicitly. %in% ignores names that are not present in mydata.
open_end_drops <- union(open_ends, "a11_o")
mydata <- mydata[!names(mydata) %in% open_end_drops]

GPS data: Displace

#  No GPS data

Save processed data in Stata and SPSS format

# Write the processed data next to the input name with a "_PU" suffix:
# Stata (.dta) first, then SPSS (.sav)
haven::write_dta(data = mydata, path = paste0(filename, "_PU.dta"))
haven::write_sav(data = mydata, path = paste0(filename, "_PU.sav"))

# Report title is derived from the dataset file name
title_var <- paste0("DOL-ILAB SDC - ", filename)