@article{fe9d8e6e3f7d405fa9d5049ffea59b41,
title = "Regrouped design in privacy analysis for multinomial microdata",
abstract = "In this paper, we are dealing with the dual goals for protecting privacy and making statistical inferences from the disseminated data using the regrouped design. It is not difficult to protect the privacy of patients by perturbing data. The problem is to perturb the data in such a way that privacy is protected, and also, the released data are useful for research. By applying the regrouped design, the dataset is released with the dummy groups associated with the actual groups via a pre-specified transition probability matrix. Small stagnation probabilities of regrouped design are recommended to reach a small disclosure risk and a higher power of hypothesis testing. The power of test statistic in the released data increases as the stagnation probabilities depart from 0.5. The disclosure risk can be reduced further if more quasi-identifiers are relocated. An example of National Health Insurance Research Database is given to illustrate the use of the regrouped design to protect the privacy and make the statistical inference.",
keywords = "disclosure risk, regrouped design, transition probability matrix",
author = "Wan, {Shu Mei} and Chung, {Wen Yaw} and {Mayeni Manurung}, Monica and Chang, {Kwang Hwa} and Wu, {Chien Hua}",
note = "Funding Information: Part of this study is based on data from the National Health Insurance Research Database provided by the Bureau of National Health Insurance, Department of Health, and managed by National Health Research Institutes. The interpretation and conclusions contained herein do not represent those of the National Health Insurance Administration, Department of Health, or National Health Research Institutes. The authors thank Shih‐Hsiang Tseng at Chung‐Yuan Christian University for help in creating Tables 4 and 5 of simulation study. This research was supported by a research grant from the Ministry of Science and Technology in Taiwan (Grant No. MOST 107‐2118‐M‐033‐003). Publisher Copyright: {\textcopyright} 2021 Wiley Periodicals LLC.",
year = "2022",
month = apr,
doi = "10.1002/sam.11553",
language = "English",
journal = "Statistical Analysis and Data Mining",
issn = "1932-1864",
publisher = "John Wiley and Sons Inc.",
}