# Start from an empty workspace so objects left over from an earlier session
# cannot leak into this run. `all.names = TRUE` makes ls() also list hidden
# objects (names beginning with "."), so they are removed as well.
# The logical is spelled out as TRUE and the argument name is written in full:
# lowercase `t` is base R's transpose function, not a logical value.
# NOTE(review): this wipes the caller's global environment; running the script
# in a fresh R session is the safer alternative if that is an option.
rm(list = ls(all.names = TRUE))

Set up filenames

# Per-dataset settings: both values must be revised for every new review.
# !!!Update helper functions file
functions_vers <- "functions_1.7.R"
# !!!Update filename
filename <- "SAP20152016_Urbano_NOPII"

Set up data and functions, and create the dictionary for dataset review

# Run the helper script whose file name is stored in `functions_vers`.
# NOTE(review): `mydata` is used further down without being created in this
# script, so the helper file presumably also loads the dataset -- confirm.
source(file = functions_vers)

Visually inspect variables in "dictionary.csv" and flag for risk, using the following flags:

# Direct PII: Respondent Names, Addresses, Identification Numbers, Phone Numbers
# Direct PII-team: Interviewer Names, other field team names 
# Indirect PII-ordinal: Date of birth, Age, income, education, household composition. 
# Indirect PII-categorical: Gender, education, ethnicity, nationality,
# occupation, employer, head of household, marital status
# GPS: Longitude, Latitude
# Small Location: Location (population <100,000)
# Large Location: Location (population >100,000)
# Weight: weightVar
# Household ID: hhId
# Open-ends: Review responses for any sensitive information, redact as necessary 

Direct PII: variables to be removed

# !!!Include any Direct PII variables
# Columns flagged as Direct PII; every column named here is removed from
# `mydata`. The names are kept as an explicit list so it can be audited
# against the dictionary line by line.
dropvars <- c(
  "jefe_nom_2015",
  "jefe_priape_2015",
  "jefe_segape_2015",
  "bf1_fname_2015",
  "bf1_sname_2015",
  "bf1_flastname_2015",
  "bf1_slastname_2015",
  "bf2_fname_2015",
  "bf2_sname_2015",
  "bf2_flastname_2015",
  "bf2_slastname_2015",
  "bf3_fname_2015",
  "bf3_sname_2015",
  "bf3_flastname_2015",
  "bf3_slastname_2015",
  "A_NOM",
  "C_NOM",
  "A_APEPAT",
  "C_APEPAT",
  "A_APEMAT",
  "C_APEMAT",
  "DNI",
  "J_DNI",
  "L_DNI",
  "bf1_fname_2016",
  "bf1_sname_2016",
  "bf1_flastname_2016",
  "bf1_slastname_2016",
  "bf2_fname_2016",
  "bf2_sname_2016",
  "bf2_flastname_2016",
  "bf2_slastname_2016",
  "bf3_fname_2016",
  "bf3_sname_2016",
  "bf3_flastname_2016",
  "bf3_slastname_2016"
)

# `%in%` silently ignores names that match no column, so a misspelled or
# renamed entry would leave its PII column in the data without any signal.
# Report such entries; the removal below still proceeds for the rest.
dropvars_absent <- setdiff(dropvars, names(mydata))
if (length(dropvars_absent) > 0) {
  warning(
    "Direct PII variables not found in mydata: ",
    paste(dropvars_absent, collapse = ", "),
    call. = FALSE
  )
}

# Keep only the columns whose name is not in `dropvars`.
mydata <- mydata[!(names(mydata) %in% dropvars)]

Direct PII-team: Encode or remove field team names

# !!!Replace "DIGITA" below with the relevant field-team variable name(s)

# The column is removed from `mydata` outright rather than recoded:
# keep every column whose name has no match against "DIGITA".
mydata <- mydata[is.na(match(names(mydata), "DIGITA"))]

Small locations: Encode locations with pop <100,000 using random large numbers

# !!!Include relevant variables, but first confirm that the population of the
# locations they identify is <100,000

# "NOMESC" is removed from `mydata` outright rather than recoded:
# keep every column whose name has no match against "NOMESC".
mydata <- mydata[is.na(match(names(mydata), "NOMESC"))]

# Show the CODLOC column coerced to numeric.
# NOTE(review): the value is not assigned, so `mydata` itself is unchanged;
# presumably this is only a visual check before encoding -- confirm.
as.numeric(mydata[["CODLOC"]])
##    [1] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##   [14] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##   [27] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##   [40] -99998 146432 146432 146432 146132 146432 146432 146432 146432 146432 146432 146432 146432
##   [53] 146432 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##   [66] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##   [79] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##   [92] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [105] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [118] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [131] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [144] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [157] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [170] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [183] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [196] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [209] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [222] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [235] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [248] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [261] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [274] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [287] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [300] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [313] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [326] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [339] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [352] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [365] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [378] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [391] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [404] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [417] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [430] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [443] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [456] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [469] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [482] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [495] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [508] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [521] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [534] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [547] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [560] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [573] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [586] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [599] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [612] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [625] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [638] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [651] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [664] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [677] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [690] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [703] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [716] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [729] -99998 -99998 -99998 -99998 148129 -99998 -99998 -99998 -99998 146187 146187 146187 146187
##  [742] 146187 146187 146187 146187 146187 146187 146187 146187 146187 146187 146187 146187 146187
##  [755] -99998 -99998 -99998 146192 146192 146192 146192 146192 146192 -99998 -99998 -99998 -99998
##  [768] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [781] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [794] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [807] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 148983 148983
##  [820] 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983
##  [833] 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983
##  [846] 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983
##  [859] 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983
##  [872] 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983
##  [885] 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983
##  [898] 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983
##  [911] 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983
##  [924] 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983
##  [937] 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983 148983
##  [950] 148983 148983 148983 148983 148983 148983 148983 -99998 -99998 -99998 -99998 -99998 -99998
##  [963] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [976] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [989] -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998 -99998
##  [ reached getOption("max.print") -- omitted 27757 entries ]
# Location identifier columns handed to encode_location().
locvars <- c(
  "CODLOC",
  "COD_MOD_2015",
  "COD_MOD_2016",
  "cod_local"
)

# encode_location() is not defined in this script (presumably it comes from the
# sourced helper file); its return value replaces `mydata`.
# NOTE(review): in the CODLOC frequency tables printed by this call, the value
# -99998 (25369 rows) is recoded to 334 like any other location, while
# `missing` is set to 999999 -- confirm which sentinel marks missing values.
mydata <- encode_location(variables = locvars, missing = 999999)
## [1] "Frequency table before encoding"
## CODLOC. Codigo de Local
## -99998 144560 144621 144782 144796 144800 146132 146187 146192 146253 146432 148129 148346 
##  25369     82      1     88      3     97      1     17      6     90     12    120     13 
## 148964 148983 148997 149020 149044 149063 149077 149261 165170 288134 288469 288520 288860 
##      2    139    114    120      3     97      1    165      1      1      3      7    124 
## 292452 292490 292517 292678 295064 295097 295115 295120 295158 298736 298779 298835 298939 
##      1     15      7     11     14     10     66     13      8     39     26     46      7 
## 299023 299024 299043 301809 304860 304898 304916 304935 304940 304983 305020 305082 305124 
##      1     32      4      1      7     92     41     41      5     72      3    107     21 
## 305142 308900 311120 316641 316679 318348 319239 320105 324429 324434 324486 324491 324542 
##      1     23      2    118     30      2     48    152      5      2      7      1      2 
## 324721 324759 324896 324976 325221 325264 325424 326838 332165 338695 338817 340274 341117 
##      4      1      3      2      1      4      2      1     93     11      3      1      1 
## 342843 346836 361641 365066 365170 365311 365325 365330 365532 365759 365900 365995 366075 
##    131      8      1     73     78     44     62      3      1     56    134      8     68 
## 366706 366872 366886 367051 528426 594459 687887 725870 
##      3      5     33     25     19     11      1    107 
## [1] "Frequency table after encoding"
## CODLOC. Codigo de Local
##   296   297   298   299   300   301   302   303   304   305   306   307   308   309   310   311 
##     1    88     1     3    44    73   165    97    15    66    11   120     6     3     1    13 
##   312   313   314   315   316   317   318   319   320   321   322   323   324   325   326   327 
##     3     2    72     2    78     1   124     1    41     5    12     1    90     1     2    21 
##   328   329   330   331   332   333   334   335   336   337   338   339   340   341   342   343 
##    32     7   107     1    41     1 25369    68    17    14    56    48    25     7     8    82 
##   344   345   346   347   348   349   350   351   352   353   354   355   356   357   358   359 
##     2     4   107   134     1     3    97     7     4     1    10    23     2    13     3    26 
##   360   361   362   363   364   365   366   367   368   369   370   371   372   373   374   375 
##   152     1    33     7    11    19     1     1     2     3    93    30   114   139     4     1 
##   376   377   378   379   380   381   382   383   384   385   386   387   388   389   390   391 
##     1   131    92    46     1     2     8     3     8     1   120     5    11     5    62    39 
##   392   393   394 
##     3   118     7 
## [1] "Frequency table before encoding"
## COD_MOD_2015. 
##  202614  203414  203448  203455  203471  203505  203745  205567  205880  205997  206011  206037 
##      29      44      13      12       4      11       2      10       1      12      30      16 
##  206136  207795  207803  207845  207852  207894  207951  207985  207993  208058  208330  208348 
##      18      24      23      33      17      46      21      66       7      47       3      21 
##  208389  208413  208538  208546  208553  208561  208579  208587  208652  208694  208710  209916 
##      18      10      30      56      22      56      40      35      38       2       6      11 
##  209924  209940  209973  215632  215707  215723  215848  215863  215921  217554  219683  235010 
##       1       4      13      92       2      37      13       4       8       8       1      38 
##  235333  236117  236174  236349  236778  245662  245704  271155  271205  271668  271775  304444 
##       2      14     100       1       1      56       1       1       1       1       1      55 
##  315275  317040  317073  317131  317214  317230  317263  317289  317305  317313  317347  317479 
##       5      15       7      84      47      17      23     101       2      19       3      33 
##  317495  317511  317529  317560  317578  318063  318089  318204  318212  318287  318303  318352 
##      33      22      29      39       2       7       4       6       8      13       9      15 
##  318436  318576  318584  318741  318782  318824  318907  318931  318949  319004  319020  319061 
##       6       3       4      22      12       9       7      37      21      11      88      72 
##  319145  319160  319202  319285  322453  322503  322560  322644  322677  322685  322743  322768 
##      34      20       1      17       9      23       3       1       7      90      13      30 
##  322826  322875  322891  322909  322925  322933  322958  322974  323295  323337  323378  323394 
##      13      54       3       1       3      30      24      27      45       4      37       1 
##  323444  323451  323865  325464  325472  325480  325498  325563  325670  325696  325845  327551 
##      42      44      60      77      72       5       1     104      29       1       4       7 
##  327627  327965  328039  328047  328062  328070  328153  328229  328252  328260  328328  328336 
##       4       3      80      15      48       7      31       5      38      15       5      36 
##  328344  328351  328369  328385  328401  328419  328443  328450  328518  328526  328567  328872 
##      40      41      25      12      18       1      47      44      46      75       3      13 
##  328963  328997  329029  329045  329128  329326  329573  330464  331702  332213  333666  333674 
##      16      18       8      37       1      80      49      60      18      27      38       4 
##  333682  334094  334649  334672  334748  334821  334847  334904  334912  334920  334961  334987 
##      10      12       3      17       1      46       7      16      37      13       5      31 
##  335000  335026  335034  335042  335083  335091  335109  335166  335182  335224  336511  336560 
##      33       2       1      51      45      61      32      42      38       1      41      47 
##  336594  336628  336636  337436  337717  337980  338129  338186  338228  338301  338343  338517 
##      67      52       1      69       2       4       2       5      15      18      25      26 
##  338525  338541  338566  338640  338665  338970  339036  339051  339077  339192  339275  339291 
##      20       3      30      15      14      21      30      10      11      20      35       8 
##  339317  339333  339432  339507  339523  339549  339606  339655  339804  340372  340380  397992 
##       6      28     124      17       2       4      25       3      61       1      92       7 
##  398016  398040  398065  398081  398115  398446  398479  398495  398578  398586  398628  398669 
##       1      23       6       7      15      10      25       1       7      19      18       5 
##  398842  398859  400036  400523  400572  400622  400663  400689  400705  400739  400754  404913 
##      14      12      40       5      14      13      14      24       8       7      10       5 
##  404947  405100  405183  405233  405308  405324  406793  432880  432906  433011  433078  433086 
##       9      28      29       3       7      11      19       4       3       1      60      68 
##  433227  433235  433243  433276  433300  433326  433367  433490  433516  433540  433680  433706 
##     104      21      13      31      11       5       2      25      53      36      39       9 
##  433722  433821  433862  433961  434019  434035  434076  434092  434134  434159  434191  434258 
##       9      42      22      53      65      15      25      15      10      44      54       6 
##  434282  434365  434381  434399  434464  434480  434498  434506  434548  434563  434597  434605 
##      43       1       8      12      51      86      37      22      60       6      64       2 
##  434621  434662  434720  434829  436154  436162  436170  436188  436196  436204  436212  436246 
##       6       1      24      44      23       4      15       3      18       1      61       8 
##  436287  436295  436303  436311  436345  436360  436410  436428  436444  436451  436485  436493 
##      31      12      27      33      20      18      51      21      18      40      21      40 
##  436501  436519  436543  436576  436584  436626  436634  436691  436709  436725  436733  436741 
##      12       3      49      69       1       7      85       1      49       1       1       1 
##  436758  436766  436774  436782  436790  436808  436816  436824  437160  437210  437228  437236 
##       7      52      21       1      47       5      14      42       6      19      34      31 
##  437244  437251  437277  437293  437319  437335  437343  437715  437731  437772  449868  466342 
##      49       2      37      74      56      26     112      55       3       1      45      27 
##  466383  466508  466730  468488  468611  469700  472654  478404  478420  481853  481903  482091 
##       1      21     100      78       4      42       8      39      19       3       1      50 
##  482109  486621  488619  488635  488676  488817  488841  489104  493338  493544  493734  493841 
##      47       1      30      32      16       3       1      58      27      94      46      65 
##  495093  495473  496133  496166  496521  496653  496844  496877  497024  497651  498824  499236 
##       2      21      29      40      46       1      55      61      45      66       1       6 
##  499699  500348  501411  501601  501676  501908  501957  502435  502484  502534  502633  505149 
##      38      18       2      56      59      37      21       4      72      37      38       1 
##  508903  510305  510602  510800  512020  512327  513614  513713  516674  516872  518340  518548 
##      11      42      18      67      64       3      13      22      42      27       2      37 
##  518647  523464  523563  523662  523761  523860  524264  524462  525055  525253  525857  526053 
##       2      72       2      94     103      22      39       1       1      15      38       2 
##  526301  526376  526400  527473  527572  528281  528380  531368  535666  536326  541011  541995 
##      53      21      29      38      46      57      16      66       3      33      43       1 
##  542357  542720  543645  546002  551804  555599  555862  555946  555987  556290  556340  556357 
##       2      23      46      56       7      14      23       3       3      40      64      43 
##  556472  556548  556555  556571  556597  557322  565119  565176  565234  566141  566166  566430 
##      17       3      18      49      35       8       5       1      60      34       5      48 
##  566448  566455  566463  566471  566489  567453  567750  573352  578286  578294  578336  578351 
##       2       2      40      54       3       1      19      23      53      59      51      48 
##  578401  578435  578443  578492  578518  578526  578534  578542  578559  579151  579706  581728 
##      33      43       2      63       2      65      51      56       2      84       1       2 
##  581736  581777  581876  581884  581892  581900  582114  582254  582262  582387  582411  582833 
##      79       2      26       3      19      25       2       1      66       1       4      60 
##  582890  582932  582981  583013  583021  583104  583500  583567  583591  583922  584946  587279 
##      42      99      32      82      97      77       1      25      42      89     107      45 
##  589085  590133  591198  598581  599365  601492  602276  602482  603738  603878  605469  607424 
##       1      44      93      40     126      12       4      24       1      46     104       1 
##  607432  607457  607556  607697  616185  628370  628404  628826  629261  629295  629329  632299 
##      46      48       2      76      97      25      37      44      26     118      34      24 
##  632356  633354  639112  639732  642801  642926  643262  644880  646646  647065  647172  647784 
##      48       7      12      23      42      62      57      46       1      90      48      46 
##  647792  649830  649897  649913  650036  652081  656843  656975  659599  659623  659664  659698 
##      45       1       1      57      15      15      12       1       1       1      45      27 
##  659706  659714  659896  659938  659953  662346  662726  662742  662841  662858  663096  663138 
##      58       5      62       7      59       8      50      42       1       2      66      24 
##  663534  663559  663682  663971  664284  664482  664508  664722  664748  664920  665265  665281 
##       1      69      26      70      67       2      24      18      64       2      77     105 
##  665372  665398  665422  665448  681783  681817  681825  682229  682245  689836  690008  691782 
##      53      44      18       2       8       1      48      91       2      22      59      21 
##  691808  691931  692434  692442  692467  693382  693465  693499  693622  693630  693655  694216 
##      72      46      92       3       1       1      22      62      78       1       1       1 
##  694224  694307  694315  694398  694422  694463  694547  694570  694588  695288  697557  703124 
##      15       1      44       9      27      28      41      68      49       1      37       1 
##  703215  703223  703231  703249  703256  703736  703751  704072  704312  704445  705053  705129 
##      66      82      63      72       2      51      78       3       1      19      61       7 
##  705137  705160  705376  720128  720235  725523  728055  728485  728634  728717  732347  732461 
##       1       3       1       1      23       1       9       4       1     121      61      48 
##  738542  743708  743773  743807  743831  744540  744557  759399  759571  759613  762120  762468 
##       3      14      52       1      46      22      46      41       1      47       1       2 
##  762500  762757  762773  762849  762856  762864  762880  762906  763151  763177  763789  764035 
##      75      24      65      51      51      80     102       1      24      14       1       4 
##  764068  764076  764084  764555  764779  764795  764910  765164  765297  765305  765321  765859 
##       1      24      14       6      31       2       1      34      38      11      39      91 
##  772913  772970  773788  773846  774026  774679  774703  774737  774794  775312  776138  776161 
##      33      15      61       1      43      74      64       3       1      23      16       2 
##  776229  776328  777144  777656  777680  777995  778076  778233  778738  778761  779041  780700 
##      20      15      26      38      45      34      67      27      33       3      65      43 
##  780759  780767  780825  781096  781278  781336  781351  781369  781385  781427  781773  781831 
##       1       2      61      42       1       1      37      90      78       1      14       5 
##  781898  781930  782078  782102  782664  785097  817916  821058  821082  824003  824813  825661 
##       2     107       2      64      79      79      52      47      43      18      57       1 
##  825752  826081  826263  826479  828160  828210  829291  829325  831313  832253  832303  832311 
##       5       1      31      47      13       2       1       1       4       1       1      16 
##  832345  834465  834853  834960  834994  835025  835058  846048  847087  855114  855247  855270 
##       1      19      61      50       1       1      34      29       7       3       3      45 
##  869032  869040  869198  869230  869248  870345  870360  871251  872127  872515  874198  874214 
##      52       1      26      58       1       4      24       2      32     105       3      45 
##  879791  882977  882993  884528  884544  884551  884585  884593  884635  900704  900761  900795 
##       1       4      10      44      35      36      66       4       2       1      46       1 
##  900852  900910  901033  901066  915256  922872  923482  923748  927814  928820  933598 1007160 
##       2      69      68      62      56       1       1       2      89      44      88      11 
## 1007491 1008127 1008440 1008960 1009802 1010040 1010107 1010149 1010214 1033729 1041391 1041516 
##       3       5      44      28      33       2      42      19       2      41       1       1 
## 1041631 1045079 1045111 1045277 1045392 1048990 1053628 1053669 1053693 1054196 1054279 1054352 
##     112      21      39      23       9       1      36      43     105     104       2      55 
## 1054436 1056902 1056944 1062942 1063106 1063148 1063221 1063304 1064989 1066026 1069954 1070036 
##      93       1      34      57      26      21      29      63       3       1       4      29 
## 1070077 1070390 1071257 1071919 1072685 1072727 1073212 1073998 1075779 1080068 1080258 1082031 
##      94      20       1      61      27      21      38       1       1      61       6       2 
## 1083815 1084508 1084987 1085919 1088400 1098102 1147610 1147768 1148014 1151661 1151901 1151943 
##      36      23      26      37      24      41       2       7      23      15       2       1 
## 1152941 1152982 1153105 1153147 1153386 1154160 1185644 1194265 1194380 1195189 1195221 1195478 
##      79      49       1      65       3      26      10      75      25      31       1      15 
## 1195841 1195874 1196047 1196526 1208891 1210137 1227461 1229558 1237106 1238229 1238542 1238708 
##      36      61      39      27       3      61       1       1       1       1      33      22 
## 1240357 1240720 1241082 1241678 1242072 1242908 1248350 1248392 1248467 1248509 1258649 1261742 
##      42      52      10       1      24       1      73     122      22      69      68      13 
## 1262211 1262542 1262930 1263011 1263052 1265214 1266840 1268150 1273150 1273234 1273275 1273929 
##       8       4      48      41       1       1       1      56      29      33     110       6 
## 1279124 1305952 1309392 1313444 1321256 1329788 1335637 1346576 1351410 1365816 1369503 1376854 
##      37       3      82       2      12       1     125      30      23      57      49       7 
## 1380690 1380740 1381078 1381110 1381144 1381219 1381334 1381342 1381375 1381581 1381599 1381862 
##      53     100       2       2       1     112      72      15      66      44      72      51 
## 1383157 1383181 1383199 1386168 1386234 1386283 1390442 1390798 1391481 1393453 1398148 1406743 
##       2       5       3     128      84      17      35      44       3     118      31       2 
## 1411438 1438027 1473644 1474600 1474899 1474964 1475011 1475045 1475201 1475219 1475250 1475284 
##      66       1      41       9      53      82      68      30      50       2      70      42 
## 1475755 1476258 1477264 1484443 1486018 1493964 1495365 1495407 1497056 1497601 1501451 1505494 
##      22      12       4      40       3       3      20      41      72      47      53     113 
## 1507094 1507250 1507276 1507318 1507532 1509496 1510544 1511351 1512789 1513951 1520287 1527225 
##       2       1      21      15      43       1      15      87      48       6       4      67 
## 1531359 1558725 1563188 1563238 1574557 1607944 1640556 1641521 1661271 
##       3      99       1      50       8       1      59      11      32 
## [1] "Frequency table after encoding"
## COD_MOD_2015. 
##  725  726  727  728  729  730  731  732  733  734  735  736  737  738  739  740  741  742  743 
##   33   29   84   47   12   36    2    1   69   21   10    1   29   77    2   14   46    4   38 
##  744  745  746  747  748  749  750  751  752  753  754  755  756  757  758  759  760  761  762 
##  110  118   26   43    2   26   18   61    1   66    3   40   22   40    2   17    3   28  105 
##  763  764  765  766  767  768  769  770  771  772  773  774  775  776  777  778  779  780  781 
##    4    3   46   72   16   24   13   10   62   14   14    6    1    3   57    3    5    1   53 
##  782  783  784  785  786  787  788  789  790  791  792  793  794  795  796  797  798  799  800 
##   72   38  101   80    9   92   46    3  104   10   41   37    5   23   36   13   12   25   46 
##  801  802  803  804  805  806  807  808  809  810  811  812  813  814  815  816  817  818  819 
##   12   97   11    6    2   54    2   33    4   64  112   51   40   19    3   65   18   78    1 
##  820  821  822  823  824  825  826  827  828  829  830  831  832  833  834  835  836  837  838 
##   89    1   30   90   21   66   70   12   16    7   29   47   18    1    2   40   34   18    1 
##  839  840  841  842  843  844  845  846  847  848  849  850  851  852  853  854  855  856  857 
##   39   25    5    1   94    1    7   48   39   44    1   39    8   66   33   41   49    1   48 
##  858  859  860  861  862  863  864  865  866  867  868  869  870  871  872  873  874  875  876 
##   42   36    7    3   94   20   16   37   37   19    1   21   18   72   57   12    7   38    1 
##  877  878  879  880  881  882  883  884  885  886  887  888  889  890  891  892  893  894  895 
##    1    1   29   56    3   38  113    1    2   38   22   44    1   46    4   99   56   25   10 
##  896  897  898  899  900  901  902  903  904  905  906  907  908  909  910  911  912  913  914 
##    4   37   61    2    3   48   12   18    4   22   30   15   23   33   24    1   18   72   29 
##  915  916  917  918  919  920  921  922  923  924  925  926  927  928  929  930  931  932  933 
##    7   35   41   46   21   66   63    2    1   23    1    2    1    2   11   41    1   14   45 
##  934  935  936  937  938  939  940  941  942  943  944  945  946  947  948  949  950  951  952 
##    2   31    1   14    4    1    6    1    5   18   52   44   44    1    2   85   43   77   15 
##  953  954  955  956  957  958  959  960  961  962  963  964  965  966  967  968  969  970  971 
##    3   46   55    2    1   34   67    5   84  112   23   59   10    1   52    1    8    2   42 
##  972  973  974  975  976  977  978  979  980  981  982  983  984  985  986  987  988  989  990 
##    1   49   33   34    3   60    1   39   18   13   60  124   78    1    1   62    4   27    3 
##  991  992  993  994  995  996  997  998  999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 
##   73   20    2   66    1   40   43   49    2   11   29    3   31   16   53    3    1    1   47 
## 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 
##    7    1   57   21   15   33    7   84    7   36   24   24   44   82    2   59   66   16   55 
## 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 
##   61   44   51    8   27   61    1    8   53  104   13   35   61    4   37    1  128    1   12 
## 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 
##   69    1    4   41   32   14    1    5   15   24   31    4  118   13   61   99   13    5    2 
## 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 
##   14   67   53   23   78    1   32   33   60    6   61    1   12   31    6    1   22   25    2 
## 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 
##   51   24   19    2   57   15   75    3    2   44  104    1    2   50    2   16    1   46    5 
## 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 
##   13   25    3   31   36  107    2   24   24    1   52   43    1   61   15   72   42   79   52 
## 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 
##   18   43   18    1    7  112    6    1    1   56    1   30    2   17   34   15   49   15    3 
## 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 
##   49    1    1   76  100   20   29   79   54   15   44    2   15   50    3   59    9   37   48 
## 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 
##   27   72   93   42   30    1    2    2   72    4   66    2    1   40    1    1    2    6   42 
## 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 
##   97   93   21   13   48   39    2   46   35  105   44    9   19    1   21    5   60    2   56 
## 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 
##   65    2    1   14   79    4   45   42  107   34   44   22    1   25    1   69   17    9    7 
## 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 
##   41    1   30   12   46    3   49   38   61    5   15   37    2    1    3   65   29   68    3 
## 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 
##   34   27   41    3    8   42   15    3   15    1   21   37    1   10   17    6   61   21   74 
## 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 
##   19   47   48    2    7   38   68   33    2   22    1    1   51   24   46   65   60   91   26 
## 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 
##    1   64    8   78   42   40   22   13   18    1   19    1   17    1    4   23    7   65   22 
## 1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 
##    1    1   48  125   87    4   21    1    8    3    3   53   88   30   13   27   58   53    3 
## 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 
##   26   80    1    6   15    2   91   61    3    8    7    2   18   45   14    6   41   23   23 
## 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351 
##   72    8   67   11   15   47    1    1   45    2   22   24  105   42    1   46    1   53   47 
## 1352 1353 1354 1355 1356 1357 1358 1359 1360 1361 1362 1363 1364 1365 1366 1367 1368 1369 1370 
##   21   48   79    8    8   62   52    5   38    2   37   43    1   51   92   20    1    1   66 
## 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 
##   25   24    1    4   64   42    1   25   15   27    1   56    2   62   18   94    1    1   47 
## 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 
##   45   89   80   37   23   37   27   60    2   11   56    3   21   70    3   45   26   23   47 
## 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426 1427 
##    3    1   43   74  100   40    1   68    1   48   45   20   30   12   32    2   57  122    5 
## 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 
##   24   56   15  104   82   63   57    3    2   26   36    1   30   67   25   49   11    1   55 
## 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 
##   38    7    7   39   11   19   45    4    3    4   37    9   39   50   42  126    1    7    7 
## 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 
##   21    1   90   45   22   28   38   51    1  102   42   40    4   65   21    1   44   46   24 
## 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 
##   11   69    1   14   47   58   45   92    1   64    1  121   19   26   12   12   66   59    5 
## 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 
##   82   21    1   64    1   32    7   31   11   27    9   88    3    7    1   23    4    1   33 
## 1523 1524 1525 1526 1527 1528 1529 1530 1531 1532 1533 1534 1535 1536 1537 1538 1539 1540 1541 
##    4    8    1   28   21   31   37    1   26    1   41    8   26   22   35    6    3   46   23 
## 1542 1543 1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 1557 1558 1559 1560 
##    1   82   18   53   15   75   26    7  100    2    1   10    7   63    6   50    1   86    2 
## 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 
##   31   43   27   12    1    1    3   68   15   40    2   33   37    5   69    3   32   38   34 
## 1580 1581 1582 1583 1584 1585 1586 1587 1588 1589 1590 1591 1592 1593 1594 1595 1596 1597 1598 
##    1    4    1    6    1   47    1    1    2   29    6   75    1   10    2   54   14   17   43 
## 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 1614 1615 1616 1617 
##   10    4   10    7   56   67    9   23   59   50   52    1   20   51   33   20   90    2    2 
## 1618 1619 1620 1621 1622 1623 1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634 1635 1636 
##    1    1   30   61    2   13   38   37   27    5   77   13    1    9   49    3    1   58    2 
## 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655 
##   44   22   15   46    2   64   51   27   24   44    4   35   18    1   23    5    1   28    3 
## 1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674 
##    1   33    2    9   42    3   15    1    8    3   44   19   34   19   48    1    1    5   12 
## 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 
##    2   72   16    4   17   13    4    9   61   56    4   51   42   55   25    1    5  103    3 
## 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 
##   22    3   21   29   42    3   31   11    1   23    2   68 
## [1] "Frequency table before encoding"
## COD_MOD_2016. 
##  202614  203414  207449  207795  207845  207852  207894  207951  207985  208058  208348  208371 
##      14      26      13      14      18      13      24      10      33      27      13       1 
##  208389  208538  208546  208553  208561  208579  208587  208652  209387  209510  209536  209908 
##      12      18      37      12      31      25      26      21       5      40      75      45 
##  209916  209965  209973  215632  215723  215897  233056  233130  235010  236109  236117  236174 
##      18      80      22      46      17       1      17       1       2       6      54     139 
##  236224  236364  245654  245662  245688  245696  260612  302893  302943  302950  302968  304444 
##      12      12       1      88      91      21       1      14       5      32      37     134 
##  305656  315275  317040  317107  317131  317214  317230  317263  317289  317313  317370  317438 
##      10       1       1       2      41      25      18       5      30      18       1       1 
##  317479  317495  317511  317529  317560  318352  318931  318949  319020  319061  319145  319160 
##      30      19      13      17      27       4      15      12      45      35      29      20 
##  319228  319269  319285  322453  322461  322503  322685  322768  322875  322891  322933  322958 
##       2       1      14       8       1      10      43      19      31       1      14       9 
##  322974  323295  323311  323378  323444  323451  323865  324772  325449  325456  325464  325472 
##      22      26       2      34      22      25      29      13      34      14     131     119 
##  325506  325548  325563  325589  325605  325647  325654  325662  325670  325704  325712  327551 
##       8      26     123      40      26      87       1       1      65      57       4       1 
##  328120  328146  328153  328187  328252  328336  328344  328351  328369  328401  328435  328443 
##       2       1      11       2      14      18      21      14      13       2       1      34 
##  328450  328518  328526  328997  329045  329326  329573  330464  331702  332213  332239  334672 
##      21      41      55      18      26     115      73      66      12      13       1      22 
##  334680  334714  334722  334730  334771  334821  334912  334987  335000  335042  335083  335091 
##       7       5      26       7       7      23      14      31      19      33      28      30 
##  335109  335117  335166  335182  336495  336511  336545  336560  336586  336594  336628  337436 
##      15       2      27      18      68      47      11      58     107     106     100      89 
##  337592  337741  337766  338517  338525  338566  338822  338970  339036  339192  339275  339432 
##      10       3      21      16       7      16       4      13      18      13      26      68 
##  339499  339606  339697  339804  340281  340299  340315  340323  340331  340349  340356  340364 
##       2      19       1      37       6       4      56      11       8      68      12       6 
##  340380  340398  340414  340463  398040  398446  398479  398586  398669  398859  400036  405100 
##     124       9      57      10      10       5      13      10       2       8      23      11 
##  405167  405183  432773  433078  433086  433227  433235  433276  433490  433516  433540  433623 
##       1      10      12      32      36      45      13      24      17      41      18       1 
##  433680  433805  433821  433862  433961  434019  434035  434076  434159  434191  434282  434399 
##      26       2      28      17      39      38      15      11      24      31      39      10 
##  434464  434480  434498  434506  434548  434597  434720  434761  434829  436170  436196  436212 
##      44      37      25      10      31      22       8       1      27      10       2      49 
##  436287  436303  436311  436345  436360  436410  436428  436451  436493  436501  436543  436550 
##      16      14      19      11      13      26      15      19      25      13      32       1 
##  436576  436634  436675  436709  436766  436774  436790  436816  436824  437210  437228  437236 
##      21      32       3      25      38       1      26       1      25      32     137     140 
##  437244  437277  437285  437293  437319  437327  437335  437343  437368  437509  437707  437715 
##     107     108      37      87      66       8      26     126       2      10      33     111 
##  437723  449827  449868  466342  466722  466730  468488  469700  478404  478420  481820  482059 
##      42       3      94      18       6     123      48      68      20      12       1       1 
##  482091  482109  488619  488635  489070  489104  493544  493734  493742  493841  495150  495259 
##      41      29      59      38       1      31     118      26      26      63       2      26 
##  495812  496133  496166  496521  496844  496877  497024  497081  497651  499699  500124  500348 
##      14      14      58      23      31      35      25       2      36      93      14      18 
##  500611  501502  501601  501676  501809  501908  501957  502104  502484  502534  502633  504993 
##       7       3      57      81       4      46      13       3      91      19      63      39 
##  510305  510602  510701  510800  512020  513614  513713  514224  516674  516872  518548  522318 
##      22       2       1      31      32       7       8       1      29      19      10      14 
##  523423  523464  523621  523662  523761  523860  524264  525857  526301  526400  527473  527572 
##      47      22      37      49      57      11      30      20      28      13      20      27 
##  528281  528380  528794  531368  535823  536128  536326  536714  541011  542597  542720  543645 
##      29       1       1      36      50      27      40      25      24       2      14      27 
##  546002  555599  555862  556241  556290  556340  556357  556449  556472  556571  556597  565200 
##      56       9      45       2      21      81      25       5      28      76      31      22 
##  565234  565267  566141  566158  566414  566430  566463  566471  567750  573352  578260  578278 
##      74      15      87       3       4      63      57      73      42      30       5       3 
##  578286  578294  578336  578351  578393  578401  578435  578468  578492  578526  578534  578542 
##      77      74      64      55       3      51      47       3      75      85      90      72 
##  579151  581710  581736  581876  581892  581900  582122  582148  582163  582189  582262  582304 
##     101      11     111      49      18      53       5      45      68       1      78      47 
##  582312  582833  582866  582890  582932  582981  583013  583021  583104  583203  583476  583567 
##      12      79       4      57     125      49     110     124      96       3       7      40 
##  583591  583922  584946  587279  587303  590133  591131  591164  591198  596007  596932  598482 
##      56      42      60      31       1      26       2      13     120       1       1       1 
##  598581  599365  601492  603878  605469  605501  607143  607416  607432  607457  607697  616185 
##      57     152      17      53     140       5       1       1      29      24     100     114 
##  628404  628826  629295  629329  632299  632323  632356  633321  639674  639732  639922  642801 
##      20      25      61      20      18       1      27       1       1       1       5      70 
##  642892  642926  643262  643692  643783  643841  644690  644880  647065  647172  647784  647792 
##       4      74      56       7       4       3       6      51     109      68      24      30 
##  649913  650002  650036  652081  656843  659664  659698  659706  659896  659953  662726  662734 
##      23       9      32      15       2      23      14      45      85      83      28       1 
##  662742  662940  662957  663005  663096  663120  663138  663559  663682  663690  663971  664284 
##      17       5      12      15      88       5      35      92      21       1      92      35 
##  664292  664508  664706  664722  664748  665265  665281  665372  665398  665463  681825  682229 
##       1       7       2       2      91     107     127      21      25       2      23     115 
##  682260  689836  690008  690024  691808  691931  692434  692707  693465  693499  693622  694224 
##      30      10      73       1      35      94     111       4       1      85      95      10 
##  694315  694422  694455  694463  694547  694562  694570  694588  694596  694604  697557  703215 
##      25      11       1      10      58       4      94      59       9       8      21      90 
##  703223  703231  703249  703736  703744  703751  704445  704460  705053  705129  705772  720235 
##     100      87      96      35      61      95      11      30      77       4      10      25 
##  725770  725861  728337  728642  728717  730515  732321  732347  732461  735035  743773  743831 
##      46      22       4       2     157       6      16      85      31       3      50      66 
##  744540  744557  744573  751230  759399  759613  762500  762757  762773  762849  762856  762864 
##      14      20       2      19      32      63      39       9      76      80      69     107 
##  762880  762914  763151  763169  764076  764779  764928  764936  765164  765297  765305  765313 
##     138      61      15       1      21      22       1      45      15      52      17      11 
##  765321  765370  765859  772913  773788  774026  774455  774679  774703  775312  775346  776229 
##      51       2      52      20      68      58       7     101      88      16       1      14 
##  777144  777656  777680  777995  778027  778076  778233  778738  779041  780700  780825  781096 
##      23      55      80      46       1      32      47      53      81      28      26      22 
##  781351  781369  781385  781930  782045  782102  782664  785097  817916  820803  821058  821082 
##      31     134      53     150       1      82     101      90      27       2      21      22 
##  824003  826263  826479  832279  832311  832337  834465  834853  834960  835058  846048  847087 
##       1      19      29      21      11      49      14      50      21      21      27       6 
##  855213  855270  869032  869198  869222  869230  870360  870931  870956  872127  872515  873679 
##       3      24      34      42       2      57      16      11       3      19     122       3 
##  874206  874214  876219  884510  884528  884536  884544  884551  884585  884627  885517  900647 
##       8      61       1      11      48       5      30      91      90      10       1       1 
##  900670  900738  900761  900910  900944  901033  901066  901124  915256  927814  928200  928820 
##       1       4      65      98       3      82      84       2      75     103       1      16 
##  933598 1007160 1008440 1008929 1008960 1009802 1009844 1010107 1010149 1010180 1033729 1034016 
##     114      12      54       5      29      26      27      32      30       1      19       6 
## 1034339 1041474 1041623 1041631 1045111 1045277 1045434 1045632 1053628 1053669 1053693 1054196 
##       1       1       1     146      27      15      11       6      53      58     137     117 
## 1054352 1054394 1054436 1056944 1062942 1063106 1063148 1063221 1063304 1070036 1070077 1070390 
##      72      15     110      45      27      40      41      41      72      50     126      10 
## 1071919 1072685 1072727 1073212 1074301 1074509 1080068 1083187 1083633 1083674 1083716 1083815 
##      80      11      60      50      18      15      30       1       1      14      28      59 
## 1084508 1084987 1085919 1085976 1087295 1088400 1098102 1147537 1147610 1147651 1147933 1148014 
##      33      14      13       4       4      17      19       8       1       3       4      31 
## 1152941 1152982 1153022 1153147 1153261 1153345 1154160 1194265 1194380 1194810 1195189 1195577 
##     109      61       2      79       3       1      14      89      37       4      29       1 
## 1195841 1195874 1196047 1196526 1210137 1222595 1224104 1238542 1238948 1240357 1240720 1241082 
##      22      68      18      18      72       1       1      15       3      19      66       5 
## 1242072 1246792 1247832 1248350 1248392 1248467 1248509 1250695 1254192 1258334 1258649 1261742 
##       7       1       7      38     159      13      77       1       1       5      35       2 
## 1262211 1262930 1263011 1264159 1264639 1268150 1273150 1273234 1273275 1279124 1279637 1309152 
##      11      68      63       1       1      32      11      22     122      50       1       1 
## 1309392 1313444 1322593 1322973 1328947 1335637 1336072 1346576 1350008 1364975 1365816 1369503 
##     103       1       3       1       1     157       8      40       1       1      31      60 
## 1370378 1380690 1380740 1381219 1381334 1381342 1381375 1381581 1381599 1381862 1381896 1381987 
##       1      29     116     133      91      10      88      26      97      20      11       7 
## 1386168 1386234 1390137 1390442 1390798 1393453 1398148 1411438 1423615 1432772 1470368 1473644 
##     165      97       1      44      54     138      35      76      23       3       3      57 
## 1474899 1474964 1475011 1475045 1475201 1475250 1475284 1475755 1476258 1476290 1477264 1481662 
##      31      97      89      21      64      78      46       9      14       1       8       1 
## 1482546 1484443 1495365 1495407 1496355 1497056 1497601 1500354 1501451 1505494 1506724 1507045 
##       1      48      28      56       2      93      48       5      85     138       1       1 
## 1507276 1507532 1511351 1512789 1527225 1527316 1558725 1563238 1607944 1635689 1640556 1641521 
##      16      62     107      54      73       3     125      56       1       1      82      17 
## 1661271 1665298 1693506 1697234 1701127    <NA> 
##      43       1       1       7       1      13 
## [1] "Frequency table after encoding"
## COD_MOD_2016. 
##  892  893  894  895  896  897  898  899  900  901  902  903  904  905  906  907  908  909  910 
##    4    1   68   22    1   49   14   80   11   27   17    2   63   27   57   10   17    3   87 
##  911  912  913  914  915  916  917  918  919  920  921  922  923  924  925  926  927  928  929 
##   15   23  120    1   14    2   56   10   12   59  101   28   54    3   46    8   26   23   43 
##  930  931  932  933  934  935  936  937  938  939  940  941  942  943  944  945  946  947  948 
##   15   45  125    1    3   89    2   66   19   13    8    2   14   28   73   42   10    1   46 
##  949  950  951  952  953  954  955  956  957  958  959  960  961  962  963  964  965  966  967 
##   34    3    5   41   13   14    1   64   92  114   15   25   17  127   28   40   24    3    1 
##  968  969  970  971  972  973  974  975  976  977  978  979  980  981  982  983  984  985  986 
##   32   17   24   13  107   15  107   11   97   22   55   18    1  140    6   10   51    1   74 
##  987  988  989  990  991  992  993  994  995  996  997  998  999 1000 1001 1002 1003 1004 1005 
##    1   64   76   14   35   66   22   60   30   26   29    2   19   13   41   58   14   34   21 
## 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 
##   31   10    1   23   11   77    1   50   12   52   30   18    1    1   30   18   82    1   18 
## 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 
##   88   15  101    7    4   88    1  134   12   25   11  110    2   81    1   95   14   35  109 
## 1044 1045 1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 
##   26   76   31   10   22   22   48    5    7    5   21   22   11   45   41   22   26   48    1 
## 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 
##    1   43   91    1  107  134   25   22   11  100   52   37   22   32   27   31   40   68   20 
## 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 
##   80   57    3  152   47   13    1   65  111    5   22   92    1    1   30   13   46   42    8 
## 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 
##   18   14   97    1   10   31   46    1   68    8   28  107   56  122   24    2   68   32   16 
## 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 
##   39   21    4    1   68   47   30  123   26  117   18   25    1    8   13    1   94   30   44 
## 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 
##    2   20   18    3   20   81    4   57    4   79    1    1   63    1    2   41   17    2   40 
## 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 
##   93    4  159   38   23   41   21    7   62   76    7   77  139   91   63   60   26   37   85 
## 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 
##    3   58   57   15    8    1    7    1    5   31    8    9   26   55  111   88   26    8    5 
## 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 
##   72    1    2    4   49   26   14   61   33    1  115   32    1   21   34   18   16   87    2 
## 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 
##    1    1   19   13   75   29   10    1    7   44    1   88   14    1   18   68   72    3   21 
## 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 
##   24   26  122   30   12    7   35    1   21   98   14   63    2   29   78    2   37    1  124 
## 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 
##   12   53   32   35   20  108   47  111    3    4   17   25   59   11    1   11   35  138   30 
## 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 
##   94   83   80   84   37   45    9  137   90   55   16   29   19   50   85   82   30   20   10 
## 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 
##    9   27   22    7   10   15   11   25   10   21   12   29   45   48    2   16    4  150   27 
## 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 
##   11   90   58   75   15   70   27    1   91   21  103   41   32   47   14    3   21    3    1 
## 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 
##    1    2   26    4   61   18   87    5    1   32   31   27   10   73    3   19   29   15    7 
## 1348 1349 1350 1351 1352 1353 1354 1355 1356 1357 1358 1359 1360 1361 1362 1363 1364 1365 1366 
##   56   13    2  114   24   35   20    5   19    8    9   26    1   45   31  118   75    7   13 
## 1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 
##   95   17   28   28   18   27   45    9   15    6   14   72    8   32   21   25   49   20   16 
## 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 
##   13    1   15    3   31   22   56    2    5    1   40    2   13   28   60   37    2  140   29 
## 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422 1423 
##  138   21    2   17   11    6    1    6   12   36   17    2   16   14    5    2  131   17   85 
## 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 
##   10   16   25   13    1    4   11   16   32   10    3   51   57   29    1   12    1   57   19 
## 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 
##    2   10   14   91    2   21   31    5    5   10   12    1    3   26   53   63   27  100   50 
## 1462 1463 1464 1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 
##   93    9   18  106   53   25   57   26  119    9    7    1   19   74    1  116   10    1  107 
## 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 
##   42    7   21   40   50   81    1   18   18   33   14   19    6   90   85   42   73   19    1 
## 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 
##   85   87   82   94   65   47  100    2   39   28  125   31   26   11    4    1    1    6    1 
## 1519 1520 1521 1522 1523 1524 1525 1526 1527 1528 1529 1530 1531 1532 1533 1534 1535 1536 1537 
##   13   22   58   38    1   69   66    5   11   53    4    3   33   50   12   13   61  115   89 
## 1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 
##   24   31   30   21   45    1   78   23   38   31   45   12    1    8  165    5  124  157  101 
## 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 
##   18   31   22   26   11   35   19  146   27   89    6   29    7    4   11    1   53   25    1 
## 1576 1577 1578 1579 1580 1581 1582 1583 1584 1585 1586 1587 1588 1589 1590 1591 1592 1593 1594 
##    5    2   61   37    1   19   14   40  126    1   10    4  109    2    6   26   29    2   10 
## 1595 1596 1597 1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 
##   14    1    1    2   61   66   23    1    2   32   58    5   14   54    3   23    1   10   79 
## 1614 1615 1616 1617 1618 1619 1620 1621 1622 1623 1624 1625 1626 1627 1628 1629 1630 1631 1632 
##    3   80    1   27   74   19  103   27    2    4   26   57    1   11   48  137    1   18   18 
## 1633 1634 1635 1636 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648 1649 1650 1651 
##    1  110  123   21   14    1  133   38   13   34    1    1   73   20    1   54    3   25   96 
## 1652 1653 1654 1655 1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 
##   68    1   13   13   56   24    3   15   49   51   49   35   25   39   26   31   31   30    1 
## 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 
##   56    1    5    1   97   96   23    1  126   12    4   68   15    1   32   68    7    3   20 
## 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 1706 1707 1708 
##   19   72   27   54   57   90   36   14    1    1   59   50   14   36   33   46   77    1    6 
## 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 <NA> 
##    3    1    1   37  157   11   11   25    1   91   39   14    4    8  138   25   13 
## [1] "Frequency table before encoding"
## cod_local. Codigo de Local
##  59514  62489  65586  65591  75203 119476 139827 139832 139870 139889 139894 139912 139931 
##      1      2      1      1      1      3     17     10     75     95      7      6     18 
## 139988 140034 140048 140053 140072 140091 140114 140128 140133 140147 140185 140190 140208 
##     47     35    119      5      8      1     91      2      4     12     17      5      7 
## 140213 140232 142518 142523 142537 142542 142561 143424 143438 143725 143730 144517 144522 
##      3     14     81      4     76     18     18     13     23     54     25      6      4 
## 144536 144541 144555 144560 144579 144598 144602 144635 144640 144659 144758 144782 144800 
##    115      2      6    104    168      3    107      1      2      1     15     99     72 
## 144819 145140 145244 146130 146154 146248 146253 146347 146352 146366 146385 146578 148049 
##      5      1      1    131      2      3     90     12     44     16    102     17      7 
## 148054 148068 148129 148313 148370 148412 148474 148544 148558 148681 148983 148997 149020 
##     12      1    126    108      8      9      5     10      7      3    166    132    151 
## 149063 149261 287912 287974 288054 288110 288134 288148 288191 288214 288266 288271 288308 
##    112    166      5     11      1     65     59     60     14     76     89      1     64 
## 288327 288346 288370 288431 288501 288539 288676 288860 291278 291443 291570 291607 291631 
##     77     68     86      2      2    108     48    146    118    173     23     21      1 
## 291645 291768 291834 291947 291990 292046 292126 292193 292329 292348 292353 292428 292490 
##     14     92     11     62     69      1     96     33      4      1      2      1     79 
## 292503 292579 292640 292678 292683 294979 295059 295083 295101 295115 295139 295667 295672 
##      7    116     64    103      9    169      5      7     13     90      2      4      4 
## 296681 296723 296761 296780 296860 296997 298086 298741 298784 298798 298835 298864 298883 
##     15     19      3     17      1      1     33    123      1    101     57      6      2 
## 298897 298901 298920 299081 300739 301263 301282 301319 301324 301343 301376 301418 301423 
##     90     13      1      2     47     16     94     25     21      3     47      5     46 
## 301475 301480 301507 301512 301531 301550 301593 301625 301649 301668 301692 301705 301734 
##     16     15      6     21     25     14     14     83     11    125     52      2      3 
## 301753 301767 301772 301786 301970 303064 304761 304775 304780 304879 304884 304898 304921 
##      4     11     40      1      1      1      1      2      1     21     65     70    107 
## 304983 304997 305077 305119 305789 305794 305874 305888 305925 305930 305949 305954 305987 
##     83      9     61      1     56     12      2      8     66     15      2      1      6 
## 305992 306656 307383 307401 307415 307458 307477 307590 308603 308622 308679 308684 308735 
##     10      6      1      3      5    178    130      2      7      5     12     26      3 
## 308801 308820 308839 308863 308877 308943 310880 310917 310922 310955 310960 310979 310998 
##     12      9     32      9      2     15      3      2      3      4      9     41      1 
## 311002 311035 311064 311115 311144 311158 311163 311177 311182 313478 313708 313727 313789 
##      5     93      7    116    108    154    106      2      3    195      4     89      1 
## 313845 313850 313925 313930 314005 314034 314152 314171 314227 314289 314519 314604 314958 
##      1     15      1      1      1     20      2      1      1      3    179    156      1 
## 314963 315062 315279 315321 315905 315948 315972 316655 316660 318230 318292 318334 318348 
##      3    113      8     13     16     69     51      7      5     32      1      1    110 
## 318517 318640 319102 319116 319121 319164 319178 319183 319239 319263 319296 319319 319343 
##     58      4    104     79      2      1      3      3     47    138      2     93    114 
## 319395 320105 320582 320619 320624 320638 320662 320681 320704 320723 320756 321416 321874 
##      4    186     11     70    116      6      3     13      1      2     27      4     27 
## 322543 324014 324410 324429 324434 324472 324486 324491 324504 324523 324537 324542 324556 
##     15    161     71    106     95      2    104    103      3      3    114    108    108 
## 324561 324603 324617 324641 324655 324660 324679 324684 324702 324716 324735 324778 324797 
##     72    150    126      1     92      2    128      1     72      5    108     87    122 
## 324815 324844 324863 324877 324957 324981 325004 325117 325141 325179 325184 325202 325235 
##    105     33      5     29     26    109      1     99      7     17      4      5    123 
## 325259 325320 325396 325400 325419 325438 325508 326843 329304 329610 329629 329653 329667 
##     98      4      1    120      7    104    121    177     16     61     56      5     22 
## 329686 329691 329733 329851 329865 329926 329931 329945 329950 331745 332151 332165 332245 
##     81     57     61      1      2      4    108     94      1    140     70     95      2 
## 332924 332943 332957 332962 333004 333056 333061 333099 333103 333117 333122 333160 333202 
##      1     78     18     73      8     27     88     44     48     43    103      3     10 
## 333221 333259 333264 333297 333301 333320 333339 333377 333396 333419 333424 333438 333462 
##     66     12      9     16     22     35      3     66     34     15     30     15     80 
## 333513 333532 336111 337403 337511 338681 338695 338723 338761 338822 338841 338855 338884 
##     43     10      1      6      5     92    161    102      4      3     84      3      4 
## 339685 340207 340226 340231 340269 340274 340288 340293 342843 342904 342923 343710 343767 
##      3      3      4     87    148    116      1      1    115      3      2      4     18 
## 343772 343786 343791 343828 343852 343871 343885 343913 343951 343989 343994 344007 344012 
##     18      4      4     73      1     85      1     73     70      9      4     24     14 
## 344031 344111 344125 344154 346469 346493 346515 346520 346544 346558 346577 346600 346619 
##      2     86    121     65     10      8     16     22     86     65      4      7      5 
## 346624 346638 346643 346662 346681 346723 346737 346742 346756 346761 346775 346822 348388 
##     83    109     71      3    136    148      1     40     43      1    149     93    158 
## 348411 365066 365071 365085 365108 365146 365151 365165 365170 365212 365231 365306 365311 
##      2     79      2      5      7     14     13     14     88      6     30    123     54 
## 365325 365349 365354 365368 365434 365716 365759 365778 365797 365801 365900 366018 366023 
##     70     13     12     64      3      4     60     14     55     24    121      8      7 
## 366037 366042 366075 366117 366122 366136 366513 366650 366730 366810 367466 368036 373373 
##      4     10     59      2      5     24     70      7     57      4     76      3     30 
## 373387 373410 373448 373537 373721 373877 373882 373962 374117 493771 493785 493813 494073 
##      1     18     13     25      8      2      1      7    139      1      1      1      1 
## 494940 495746 499848 506194 526328 528426 559564 580283 593539 593638 593657 593940 593983 
##      2      8      2     91      7    156      2      1      2    165    129      3    143 
## 594124 594435 595213 595411 595425 647759 687118 687528 687585 687887 708922 720839 722112 
##    116    176      1      2      8      8      4    171     72     59      1     15      2 
## 725870 725889 740352   <NA> 
##    134      6      6   7280 
## [1] "Frequency table after encoding"
## cod_local. Codigo de Local
##  172  173  174  175  176  177  178  179  180  181  182  183  184  185  186  187  188  189  190 
##    3  169    3  171    1  108    7    2   98    3   72  122   56   95    4    1    1   14   94 
##  191  192  193  194  195  196  197  198  199  200  201  202  203  204  205  206  207  208  209 
##   59    4   41    2   14   11    3   65    2    1    9    2    6   21    1   47   12  179   75 
##  210  211  212  213  214  215  216  217  218  219  220  221  222  223  224  225  226  227  228 
##    4    1  158  126   70    1    2    1    1    6   15    2   13   15  105  112    4   13    6 
##  229  230  231  232  233  234  235  236  237  238  239  240  241  242  243  244  245  246  247 
##   69    1    2   12  128  166   83    1    4   25    6    4  150    3  108   22   14   32   61 
##  248  249  250  251  252  253  254  255  256  257  258  259  260  261  262  263  264  265  266 
##   61   15    7  106   59    4    5   86   10   27   33  123   18  156  108   71    3   70  156 
##  267  268  269  270  271  272  273  274  275  276  277  278  279  280  281  282  283  284  285 
##  104    3    3  123    1    1   89   89  108    3    4  173   33   95    3    4  121   44   15 
##  286  287  288  289  290  291  292  293  294  295  296  297  298  299  300  301  302  303  304 
##    1    1    1   13  148  149   54    2  103    3  121  114    5    1   66  148  115   69    1 
##  305  306  307  308  309  310  311  312  313  314  315  316  317  318  319  320  321  322  323 
##   73   17   43   21   79    6   61  125  130   10    5  108   25    4    1    5   25   78    7 
##  324  325  326  327  328  329  330  331  332  333  334  335  336  337  338  339  340  341  342 
##   70    1   34    9   14    5  165    3   85    2    3   72   35    1    2   40   27  108    4 
##  343  344  345  346  347  348  349  350  351  352  353  354  355  356  357  358  359  360  361 
##   11    4    7    2   73   91   60   22   35  116    1    2  116    5  101   24    1  109   81 
##  362  363  364  365  366  367  368  369  370  371  372  373  374  375  376  377  378  379  380 
##    1   18   47    5  113    1    5    7    3   87    1    4    2   57    3    6   47    1    3 
##  381  382  383  384  385  386  387  388  389  390  391  392  393  394  395  396  397  398  399 
##   15  116    3    7    1    4    1  102    1   64    2  116    4   79    1   70   11    6   91 
##  400  401  402  403  404  405  406  407  408  409  410  411  412  413  414  415  416  417  418 
##  151   18    5  103   16   10   70   13   19   72   14    2   92   80    5   84    1   43   77 
##  419  420  421  422  423  424  425  426  427  428  429  430  431  432  433  434  435  436  437 
##    9   16   21  161  129   48   15    8   18   14    3   58    7   79    5   24   17  123    4 
##  438  439  440  441  442  443  444  445  446  447  448  449  450  451  452  453  454  455  456 
##    1    3   65  177    3    7    7   14   11    1    4    7    2    2    1    4   14  166   76 
##  457  458  459  460  461  462  463  464  465  466  467  468  469  470  471  472  473  474  475 
##   44    2   20   90    8   24   12    1    2  138    4    1  103   56   17    1   29  176    9 
##  476  477  478  479  480  481  482  483  484  485  486  487  488  489  490  491  492  493  494 
##    5  106    4    2  136    7   13    1   48   90   52    6   94    1  186    5   12    3    2 
##  495  496  497  498  499  500  501  502  503  504  505  506  507  508  509  510  511  512  513 
##   26   33   30   55    2   99    5   12    1    9  116   16    2    2    1    6  121   10    3 
##  514  515  516  517  518  519  520  521  522  523  524  525  526  527  528  529  530  531  532 
##    5    7   96    2   86    1   15    5    1    5   30    1   76   64    2   15  140    3    3 
##  533  534  535  536  537  538  539  540  541  542  543  544  545  546  547  548  549  550  551 
##   65  108    2    1   95   93   12  178   30  114   93    9   72   12    8   15    8  132   83 
##  552  553  554  555  556  557  558  559  560  561  562  563  564  565  566  567  568  569  570 
##    9  143   73  110    4   17    8   54    2    3   21   13   59    8  154    4   60   90   10 
##  571  572  573  574  575  576  577  578  579  580  581  582  583  584  585  586  587  588  589 
##    4   10  195   16  104   70   22    3   15   62    1    1  131   81    2   18    8   46    2 
##  590  591  592  593  594  595  596  597  598  599  600  601  602  603  604  605  606  607  608 
##    8    5   26    8   40  146    7    4   93    2   32    3    2    1    7   66    1   57    1 
##  609  610  611  612  613  614  615  616  617  618  619  620  621  622  623  624  625  626  627 
##   23    3  115  168    1  107   99   18    3   65    6    5    1   92    2   12   10   83   68 
##  628  629  630  631  632  633  634  635  636  637  638  639  640  641  642  643  644  645  646 
##   86    1   64   92    4   51    8   47  118    7  109    2    1   88   18    1    1    8   11 
##  647  648  649  650  651  652  653  654  655  656  657  658  659  660  661  662  663  664  665 
##    2   13    6   88   27    4  102   71    1   25    3   14    6   43  104   23   87    7    2 
##  666  667  668  669  670  671  672  673  674  675  676  677  678  679  680  681  682  683  684 
##    9    1   57    1    1    7    1   66   76    1   16   17  119    2  139  126   16  120   16 
##  685  686  687  688  689  690  691  692  693  694 <NA> 
##    3    2  107  104    1    4    2   13  134  161 7280

Indirect PII - Ordinal: Global recode or Top/bottom coding for extreme values

# Ordinal indirect identifiers: concentrate on variables whose "Lowest Freq"
# in the dictionary is 30 or less. The columns listed here are removed from
# the dataset outright rather than recoded.
dropvars <- c("D_DD", "D_MM", "F_DD", "F_MM")
mydata <- mydata[!(names(mydata) %in% dropvars)]

Indirect PII - Categorical: Recode, encode, or Top/bottom coding for extreme values

# !!!No Indirect PII - Categorical

Matching and crosstabulations: Run automated PII check

# Key variables for the sdcMicro object, chosen from the dictionary review.
# Reference: https://sdcpractice.readthedocs.io/en/latest/anon_methods.html
# Every name listed must match a column name in the data file exactly.
# Categorical key variables used for this dataset: sex and age (2015).
selectedKeyVars <- c("sexo", "edad_2015")

# Keep a single decimal place of age before it is used as a key variable.
mydata$edad_2015 <- round(mydata$edad_2015, digits = 1)

# Sampling weight (enable when the dataset has one)
# selectedWeightVar <- c("projwt") ##!!! Replace with weight var

# Household identifier / cluster (enable when the dataset has one)
# selectedHouseholdID <- c("wpid") ##!!! Replace with household id

# Build the sdcMicro object from the chosen key variables, then print its
# summary (category counts and k-anonymity violations).
sdcInitial <- createSdcObj(dat = mydata, keyVars = selectedKeyVars)
sdcInitial
## The input dataset consists of 28757 rows and 470 variables.
##   --> Categorical key variables: sexo, edad_2015
## ----------------------------------------------------------------------
## Information on categorical key variables:
## 
## Reported is the number, mean size and size of the smallest category >0 for recoded variables.
## In parenthesis, the same statistics are shown for the unmodified data.
## Note: NA (missings) are counted as seperate categories!
##  Key Variable Number of categories       Mean size             Size of smallest (>0)        
##          sexo                    2   (2) 14378.500 (14378.500)                 14256 (14256)
##     edad_2015                  116 (116)   247.905   (247.905)                     1     (1)
## ----------------------------------------------------------------------
## Infos on 2/3-Anonymity:
## 
## Number of observations violating
##   - 2-anonymity: 17 (0.059%)
##   - 3-anonymity: 37 (0.129%)
##   - 5-anonymity: 81 (0.282%)
## 
## ----------------------------------------------------------------------

Show values of key variable of records that violate k-anonymity

# Pass the dataset through the `labelDataset` helper (not defined in this
# section; presumably it attaches variable/value labels -- confirm in the
# helper functions file).
mydata <- labelDataset(mydata)
# Logical row mask: TRUE where column 2 of the individual-risk table of
# `sdcInitial` is below 2.
# NOTE(review): column 2 is presumably the sample frequency count of the
# record's key-variable combination -- confirm against the sdcMicro docs.
notAnon <- sdcInitial@risk$individual[,2] < 2 # for 2-anonymity
# Print the key-variable values of the flagged records.
mydata[notAnon,selectedKeyVars]
## # A tibble: 17 x 2
##          sexo edad_2015
##     <dbl+lbl>     <dbl>
##  1 0 [Mujer]        9  
##  2 0 [Mujer]        9.3
##  3 1 [Hombre]       9.5
##  4 1 [Hombre]      21  
##  5 0 [Mujer]       19.6
##  6 0 [Mujer]       20.1
##  7 0 [Mujer]        9.1
##  8 0 [Mujer]       46.9
##  9 0 [Mujer]       19.3
## 10 0 [Mujer]       24.7
## 11 1 [Hombre]      18.9
## 12 1 [Hombre]      20.9
## 13 0 [Mujer]       18.9
## 14 0 [Mujer]        8.9
## 15 0 [Mujer]       18.4
## 16 0 [Mujer]       38  
## 17 1 [Hombre]      57.3
# Run sdcMicro's local suppression on the initial SDC object, using the
# function's default arguments, and keep the result in `sdcFinal`.
sdcFinal <- localSuppression(sdcInitial)

# Recombining anonymized variables

# Print the key variables of the previously flagged records as they appear in
# the manipulated data held by `sdcFinal`. This only displays them; `mydata`
# is not modified here.
extractManipData(sdcFinal)[notAnon,selectedKeyVars] # manipulated variables HH
## Warning in if (cc != class(v_p)) {: the condition has length > 1 and only the first element will
## be used
##       sexo edad_2015
## 336      0        NA
## 3438     0        NA
## 4431     1        NA
## 6915     1        NA
## 9657     0        NA
## 11944    0        NA
## 13428    0        NA
## 15264    0        NA
## 17189    0        NA
## 17237    0        NA
## 19196    1        NA
## 20197    1        NA
## 20915    0        NA
## 25014    0        NA
## 26630    0        NA
## 27219    0        NA
## 27863    1        NA
# Manual recode of the flagged records: set `sexo` to NA and round
# `edad_2015` to zero decimals for the rows selected by `notAnon`.
# NOTE(review): this does not use `sdcFinal`. The local-suppression preview
# printed just before this step blanked `edad_2015` and kept `sexo`, i.e. the
# opposite choice -- confirm that the manual recode is what is intended.
mydata [notAnon,"sexo"] <- NA
mydata [notAnon,"edad_2015"] <- round(mydata[notAnon,"edad_2015"], 0)
# Rebuild the SDC object on the recoded data (overwriting the earlier
# `sdcInitial`) and print the updated risk summary.
# NOTE(review): the summary printed after this step still reports records
# violating 2-anonymity -- confirm whether further treatment is required
# before the data are released.
sdcInitial <- createSdcObj(dat = mydata, keyVars = selectedKeyVars)
sdcInitial
## The input dataset consists of 28757 rows and 470 variables.
##   --> Categorical key variables: sexo, edad_2015
## ----------------------------------------------------------------------
## Information on categorical key variables:
## 
## Reported is the number, mean size and size of the smallest category >0 for recoded variables.
## In parenthesis, the same statistics are shown for the unmodified data.
## Note: NA (missings) are counted as seperate categories!
##  Key Variable Number of categories       Mean size             Size of smallest (>0)        
##          sexo                    3   (3) 14370.000 (14370.000)                 14251 (14251)
##     edad_2015                  108 (108)   266.269   (266.269)                     1     (1)
## ----------------------------------------------------------------------
## Infos on 2/3-Anonymity:
## 
## Number of observations violating
##   - 2-anonymity: 4 (0.014%)
##   - 3-anonymity: 22 (0.077%)
##   - 5-anonymity: 71 (0.247%)
## 
## ----------------------------------------------------------------------

Open-ends: review responses for any sensitive information, redact as necessary

# !!! List the open-ended (free-text) variables to review here:
open_ends <- c(
  "name_schship_2015",
  "name_schship_2016",
  "name_cred_2016",
  "unitec_b_2016",
  "nopay_wlta_sup_b_2016"
)

report_open(list_open_ends = open_ends)

# Inspect "verbatims.csv" and decide which variables (and which rows) must be
# deleted or redacted.

# !!!All of the variables below are dropped: they contain a lot of sensitive
# information and the responses are in Spanish.
mydata <- mydata[
  !(names(mydata) %in% c(
    "name_schship_2015",
    "name_schship_2016",
    "name_cred_2016",
    "unitec_b_2016",
    "nopay_wlta_sup_b_2016"
  ))
]

GPS data: Displace

# !!!No GPS data

Save processed data in Stata and SPSS format

# Write the public-use file in Stata format.
haven::write_dta(mydata, paste0(filename, "_PU.dta"))

# Change names of columns containing illegal starting characters (i.e. "_") for SPSS

mydata <- haven::read_dta(paste0(filename, "_PU.dta"))
# Each replacement name is derived from the column's own current name: leading
# underscores are stripped and, if the remainder does not start with a letter,
# an "x" is put in front (e.g. "_rank" -> "rank", "_000000_2016" ->
# "x000000_2016"). The previous version assigned a fixed list of eight names by
# position, which raised a length-mismatch warning and could attach a name to
# the wrong column whenever the set of "_"-prefixed columns changed.
# NOTE(review): the earlier hard-coded names appear to follow this same
# pattern -- confirm that the derived names are the ones expected downstream.
colnames(mydata) <- local({
  spss_names <- colnames(mydata)
  starts_bad <- grepl("^_", spss_names)
  spss_names[starts_bad] <- sub("^_+", "", spss_names[starts_bad])
  needs_prefix <- starts_bad & !grepl("^[A-Za-z]", spss_names)
  spss_names[needs_prefix] <- paste0("x", spss_names[needs_prefix])
  # Fail loudly instead of writing a file with ambiguous column names.
  if (anyDuplicated(spss_names) > 0) {
    stop(
      "Renaming columns for SPSS produced duplicate names: ",
      paste(unique(spss_names[duplicated(spss_names)]), collapse = ", "),
      call. = FALSE
    )
  }
  spss_names
})
# Re-assign NA to every missing cell.
# NOTE(review): presumably this normalises the missing values read back from
# the Stata file to plain NA before the SPSS export -- confirm.
mydata[is.na(mydata)] <- NA
# Write the public-use file in SPSS format.
haven::write_sav(mydata, paste0(filename, "_PU.sav"))

# Report title, built at run time from the dataset file name
title_var <- sprintf("DOL-ILAB SDC - %s", filename)