Last compiled on May, 2025
We want to attach some new variables to the data that I&O
Research initially collected. But as the original data had no identifier and
we want to ascertain which respondent is which, we make our own
identifier.
Making person
identifiers
Start out by reading the original data and drawing a unique random
identifier for each respondent.
# packages and read data
# haven is called through `::`, so no library() call is needed for this chunk.
df <- haven::read_dta("data/DQUESTUU_eindbestand.dta")

# first match tryout (kept for reference, not run)
# set.seed(12981298)
# samp <- df[sample(nrow(df), 10, replace = F), ]
# samp <- samp[, c('geslacht', 'postcode', 'leeftijd', 'postcode', 'V5a',
#                  'V5a_anders', 'V5b', 'V5b_anders')]
# write.csv(samp, 'testsample_io.csv', row.names = F)

# match to io: keep only the columns that are written to the matching file
iomatch <- df[, c(
  "geslacht", "opleiding", "leeftijd", "postcode",
  "V5a", "V5a_anders", "V5b", "V5b_anders"
)]

# Identifiers are drawn without replacement from 10000:20000, so there must be
# at least as many candidate ids as rows; fail early with a clear message
# instead of relying on the generic error raised by sample().
if (nrow(df) > length(10000:20000)) {
  stop(
    "Cannot draw unique person ids: ", nrow(df), " rows but only ",
    length(10000:20000), " ids available in 10000:20000.",
    call. = FALSE
  )
}

# Fixed seed so that the same identifiers are generated on every run.
set.seed(12981298)
personid <- sample(10000:20000, nrow(df), replace = FALSE)

# Put the identifier in the first column and write the matching file.
iomatch <- cbind(personid, iomatch)
write.csv(iomatch, "data/iomatch.csv", row.names = FALSE)
LS0tCnRpdGxlOiAiSSZPIHJlc2VhcmNoIElEIgojYmlibGlvZ3JhcGh5OiByZWZlcmVuY2VzLmJpYgphdXRob3I6ICJCYXMgSG9mc3RyYSIKLS0tCgpgYGB7ciwgZ2xvYmFsc2V0dGluZ3MsIGVjaG89RkFMU0UsIHdhcm5pbmc9RkFMU0UsIHJlc3VsdHM9J2hpZGUnfQpsaWJyYXJ5KGtuaXRyKQoKa25pdHI6Om9wdHNfY2h1bmskc2V0KGVjaG8gPSBUUlVFKQpvcHRzX2NodW5rJHNldCh0aWR5Lm9wdHM9bGlzdCh3aWR0aC5jdXRvZmY9MTAwKSx0aWR5PVRSVUUsIHdhcm5pbmcgPSBGQUxTRSwgbWVzc2FnZSA9IEZBTFNFLGNvbW1lbnQgPSAiIz4iLCBjYWNoZT1UUlVFLCBjbGFzcy5zb3VyY2U9YygidGVzdCIpLCBjbGFzcy5vdXRwdXQ9YygidGVzdDIiKSkKb3B0aW9ucyh3aWR0aCA9IDEwMCkKcmdsOjpzZXR1cEtuaXRyKCkKCgoKY29sb3JpemUgPC0gZnVuY3Rpb24oeCwgY29sb3IpIHtzcHJpbnRmKCI8c3BhbiBzdHlsZT0nY29sb3I6ICVzOyc+JXM8L3NwYW4+IiwgY29sb3IsIHgpIH0KCmBgYAoKYGBge3Iga2xpcHB5LCBlY2hvPUZBTFNFLCBpbmNsdWRlPVRSVUV9CmtsaXBweTo6a2xpcHB5KHBvc2l0aW9uID0gYygndG9wJywgJ3JpZ2h0JykpCiNrbGlwcHk6OmtsaXBweShjb2xvciA9ICdkYXJrcmVkJykKI2tsaXBweTo6a2xpcHB5KHRvb2x0aXBfbWVzc2FnZSA9ICdDbGljayB0byBjb3B5JywgdG9vbHRpcF9zdWNjZXNzID0gJ0RvbmUnKQpgYGAKCkxhc3QgY29tcGlsZWQgb24gYHIgZm9ybWF0KFN5cy50aW1lKCksICclQiwgJVknKWAKCjxicj4KCi0tLS0KCldlIHdhbnQgdG8gYXR0YWNoIHNvbWUgbmV3IHZhcmlhYmxlcyB0byB0aGUgZGF0YSB0aGF0IEkmTyByZXNlYXJjaCBpbml0aWFsbHkgY29sbGVjdGVkLiBCdXQgYXMgdGhlIG9yaWdpbmFsIGhhZCBubyBpZGVudGlmaWVyIGFuZCB3ZSB3YW50IHRvIGFzY2VydGFpbiB3aGljaCByZXBzb25kZW50IGlzIHdoaWNoLCB3ZSBtYWtlIG91ciBvd24gaWRlbnRpZmllci4KCjxicj4KCi0tLS0KCiMgTWFraW5nIHBlcnNvbiBpZGVudGlmaWVycwoKU3RhcnQgb3V0IHdpdGggYSBjdXN0b20gZnVuY3Rpb24gdG8gbG9hZCBhIHNldCBvZiByZXF1aXJlZCBwYWNrYWdlcy4KICAKYGBge3IgaWQsIGV2YWw9RkFMU0V9CiMgcGFja2FnZXMgYW5kIHJlYWQgZGF0YQoKZGYgPC0gaGF2ZW46OnJlYWRfZHRhKCJkYXRhL0RRVUVTVFVVX2VpbmRiZXN0YW5kLmR0YSIpCgojIGZpcnN0IG1hdGNoIHRyeW91dAojc2V0LnNlZWQoMTI5ODEyOTgpCiNzYW1wIDwtIGRmW3NhbXBsZShucm93KGRmKSwgMTAsIHJlcGxhY2UgPSBGKSwgXQojc2FtcCA8LSBzYW1wWywgYygiZ2VzbGFjaHQiLCAicG9zdGNvZGUiLCAibGVlZnRpamQiLCAicG9zdGNvZGUiLCAiVjVhIiwgIlY1YV9hbmRlcnMiLCAiVjViIiwgIlY1Yl9hbmRlcnMiKV0KI3dyaXRlLmNzdihzYW1wLCAidGVzdHNhbXBsZV9pby5jc3YiLCByb3cubmFtZXMgPSBGKQoKIyBtYXRjaCB0byBpbwppb21hdGNoIDwtIGRmWywgYygiZ2VzbGFjaHQiLCAib3Bs
ZWlkaW5nIiwgImxlZWZ0aWpkIiwgInBvc3Rjb2RlIiwgIlY1YSIsICJWNWFfYW5kZXJzIiwgIlY1YiIsICJWNWJfYW5kZXJzIildCgpzZXQuc2VlZCgxMjk4MTI5OCkKcGVyc29uaWQgPC0gc2FtcGxlKDEwMDAwOjIwMDAwLCBucm93KGRmKSwgcmVwbGFjZSA9IEYpCmlvbWF0Y2ggPC0gY2JpbmQocGVyc29uaWQsIGlvbWF0Y2gpCndyaXRlLmNzdihpb21hdGNoLCAiZGF0YS9pb21hdGNoLmNzdiIsIHJvdy5uYW1lcyA9IEYpCgpgYGAKCg==