# Bibliography

## Journal Articles and Proceedings

### 2019

• J. M. Abowd, I. M. Schmutte, W. N. Sexton, and L. Vilhuber, “Why the Economics Profession Must Actively Participate in the Privacy Protection Debate,” AEA Papers and Proceedings, vol. 109, pp. 397-402, 2019.
[DOI] [URL] [Bibtex]
@Article{AEAPP2019,
author = {John M. Abowd and Ian M. Schmutte and William N. Sexton and Lars Vilhuber},
title = {Why the Economics Profession Must Actively Participate in the Privacy Protection Debate},
journal = {AEA Papers and Proceedings},
year = {2019},
volume = {109},
month = {may},
pages = {397-402},
doi = {10.1257/pandp.20191106},
owner = {vilhuber},
url = {https://www.aeaweb.org/articles?id=10.1257/pandp.20191106},
timestamp = {2019.03.10},
abstract = {When Google or the U.S. Census Bureau publish detailed statistics on browsing habits or neighborhood characteristics, some privacy is lost for everybody while supplying public information. To date, economists have not focused on the privacy loss inherent in data publication. In their stead, these issues have been advanced almost exclusively by computer scientists who are primarily interested in technical problems associated with protecting privacy. Economists should join the discussion, first, to determine where to balance privacy protection against data quality; a social choice problem. Furthermore, economists must ensure new privacy models preserve the validity of public data for economic research.},
}
• L. Vilhuber, “Report by the AEA Data Editor,” AEA Papers and Proceedings, vol. 109, pp. 718-29, 2019.
[DOI] [URL] [Bibtex]
@Article{ReportDE2019,
author = {Lars Vilhuber},
title = {Report by the AEA Data Editor},
journal = {AEA Papers and Proceedings},
year = {2019},
volume = {109},
month = {may},
pages = {718-29},
doi = {10.1257/pandp.109.718},
owner = {vilhuber},
url = {https://www.aeaweb.org/articles?id=10.1257/pandp.109.718},
timestamp = {2019.03.10},
}
• L. Vilhuber, “Making Confidential Data Part of Reproducible Research,” in Methods to Foster Transparency and Reproducibility of Federal Statistics: Proceedings of a Workshop, Washington, DC, 2019, pp. 63-66.
[DOI] [URL] [Bibtex]
@InProceedings{NAP25305,
author = "Lars Vilhuber",
title = "Making Confidential Data Part of Reproducible Research",
editor = "{National Academies of Sciences, Engineering, and Medicine} ",
booktitle = "Methods to Foster Transparency and Reproducibility of Federal Statistics: Proceedings of a Workshop",
isbn = "978-0-309-48629-3",
doi = "10.17226/25305",
pages = "63-66",
abstract = "In 2014 the National Science Foundation (NSF) provided support to the National Academies of Sciences, Engineering, and Medicine for a series of Forums on Open Science in response to a government-wide directive to support increased public access to the results of research funded by the federal government. However, the breadth of the work resulting from the series precluded a focus on any specific topic or discussion about how to improve public access. Thus, the main goal of the Workshop on Transparency and Reproducibility in Federal Statistics was to develop some understanding of what principles and practices are, or would be, supportive of making federal statistics more understandable and reviewable, both by agency staff and the public. This publication summarizes the presentations and discussions from the workshop.",
url = "https://www.nap.edu/catalog/25305/methods-to-foster-transparency-and-reproducibility-of-federal-statistics-proceedings",
year = 2019,
publisher = "The National Academies Press",
note = "National Academies of Sciences, Engineering, and Medicine; Michael Cohen (Rapporteur)",
}

### 2018

• A. Foote, M. J. Kutzbach, and L. Vilhuber, “Recalculating – How Uncertainty in Local Labor Market Definitions Affects Empirical Findings,” submitted, 2018.
[Bibtex]
@article{FooteKutzbachVilhuber-submitted,
author={Andrew Foote and Mark J. Kutzbach and Lars Vilhuber},
title={{Recalculating - How Uncertainty in Local Labor Market Definitions Affects Empirical Findings}},
year=2018,
journal={submitted},
abstract={This paper evaluates the use of commuting zones as a local labor market definition. We revisit Tolbert and Sizer (1996) and demonstrate the sensitivity of definitions to two features of the methodology. We show how these features impact empirical estimates using a well-known application of commuting zones. We conclude with advice to researchers using commuting zones on how to demonstrate the robustness of empirical findings to uncertainty in definitions.},
keywords={Local labor markets; commuting; measurement error},
doi={},
}
• M. Pistner, A. Slavković, and L. Vilhuber, “Synthetic Data via Quantile Regression for Heavy-Tailed and Heteroskedastic Data,” in Privacy in Statistical Databases, J. Domingo-Ferrer and F. Montes, Eds., , 2018.
[DOI] [URL] [Bibtex]
@InCollection{PistnerSlavkovicVilhuber:PSD:2018,
Title = {Synthetic Data via Quantile Regression for Heavy-Tailed and Heteroskedastic Data},
Author = {Michelle Pistner and Aleksandra Slavkovi\'c and Lars Vilhuber},
Booktitle = {Privacy in Statistical Databases},
Year = {2018},
editor = {Domingo-Ferrer, Josep and Montes, Francisco},
DOI = {10.1007/978-3-319-99771-1_7},
Keywords = {Synthetic Data; Quantile Regression; Statistical Disclosure Limitation; Privacy-preserving Datamining},
Owner = {vilhuber},
Timestamp = {2018.06.26},
URL = {http://dx.doi.org/10.1007/978-3-642-TBD}
}
• A. Slavković and L. Vilhuber, “Remembering Stephen Fienberg,” Journal of Privacy and Confidentiality, vol. 8, iss. 1, 2018.
[DOI] [Bibtex]
@Article{Slavkovic2018,
author = {Aleksandra Slavkovi{\'{c}} and Lars Vilhuber},
title = {Remembering Stephen Fienberg},
journal = {Journal of Privacy and Confidentiality},
year = {2018},
volume = {8},
number = {1},
month = {dec},
doi = {10.29012/jpc.685},
owner = {vilhuber},
publisher = {Journal of Privacy and Confidentiality},
timestamp = {2019.03.10},
}
• L. Vilhuber, “Relaunching the Journal of Privacy and Confidentiality,” Journal of Privacy and Confidentiality, vol. 8, iss. 1, 2018.
[DOI] [Bibtex]
@Article{Vilhuber2018,
author = {Lars Vilhuber},
title = {Relaunching the Journal of Privacy and Confidentiality},
journal = {Journal of Privacy and Confidentiality},
year = {2018},
volume = {8},
number = {1},
month = {dec},
doi = {10.29012/jpc.706},
owner = {vilhuber},
publisher = {Journal of Privacy and Confidentiality},
timestamp = {2019.03.10},
}
• D. H. Weinberg, J. M. Abowd, R. F. Belli, N. Cressie, D. C. Folch, S. H. Holan, M. C. Levenstein, K. M. Olson, J. P. Reiter, M. D. Shapiro, J. Smyth, L. Soh, B. D. Spencer, S. E. Spielman, L. Vilhuber, and C. K. Wikle, “Effects of a Government-Academic Partnership: Has the NSF-Census Bureau Research Network Helped Improve the U.S. Statistical System?,” Journal of Survey Statistics and Methodology, 2018.
[DOI] [Bibtex]
@article{ncrn-summary,
author={Daniel H. Weinberg and John M. Abowd and Robert F. Belli and Noel Cressie and David C. Folch and Scott H. Holan and Margaret C. Levenstein and Kristen M. Olson and Jerome P. Reiter and Matthew D. Shapiro and Jolene Smyth and Leen-Kiat Soh and Bruce D. Spencer and Seth E. Spielman and Lars Vilhuber and Christopher K. Wikle},
title={{Effects of a Government-Academic Partnership: Has the NSF-Census Bureau Research Network Helped Improve the U.S. Statistical System?}},
year={2018},
journal={Journal of Survey Statistics and Methodology},
abstract={The National Science Foundation-Census Bureau Research Network (NCRN) was established in 2011 to create interdisciplinary research nodes on methodological questions of interest and significance to the broader research community and to the Federal Statistical System (FSS), particularly the Census Bureau. The activities to date have covered both fundamental and applied statistical research and have focused at least in part on the training of current and future generations of researchers in skills of relevance to surveys and alternative measurement of economic units, households, and persons. This paper discusses some of the key research findings of the eight nodes, organized into six topics: (1) Improving census and survey data collection methods; (2) Using alternative sources of data; (3) Protecting privacy and confidentiality by improving disclosure avoidance; (4) Using spatial and spatio-temporal statistical modeling to improve estimates; (5) Assessing data cost and quality tradeoffs; and (6) Combining information from multiple sources. It also reports on collaborations across nodes and with federal agencies, new software developed, and educational activities and outcomes. The paper concludes with an evaluation of the ability of the FSS to apply the NCRN’s research outcomes and suggests some next steps, as well as the implications of this research-network model for future federal government renewal initiatives.},
keywords={},
doi={10.1093/jssam/smy023},
}

### 2017

• J. Cloutier, L. Vilhuber, D. Harrisson, and V. Béland-Ouellette, “Understanding the effect of procedural justice on psychological distress,” International Journal of Stress Management, vol. Advance online, 2017.
[DOI] [Bibtex]
@Article{CloutierVilhuber2017,
author = {Julie Cloutier and Lars Vilhuber and Denis Harrisson and Vanessa B{\'e}land-Ouellette},
title = {Understanding the effect of procedural justice on psychological distress},
journal = {International Journal of Stress Management},
year = {2017},
doi = {10.1037/str0000065},
abstract = {Studies on the effect of procedural justice on psychological distress present conflicting results. Drawing on instrumental and relational perspectives of justice, we test the hypothesis that the perception of procedural justice influences the level of workers' psychological distress. Using a number of validated instruments to collected data from 659 workers in three call centers, we use OLS regressions and Hayes' PROCESS tool to show that the perception of procedural justice has a direct, unique, and independent effect on psychological distress. The perception of procedural justice has no instrumental role, the key mechanism being the relational role, suggesting that perceived injustice influences psychological distress because it threatens self-esteem. Distributive justice perceptions (recognition, promotions, job security) are not associated with psychological distress, calling into question Siegrist's model. Our findings suggest that perceived procedural justice provides workers better evidence of the extent to which they are valued and appreciated members of their organizations than do perceptions of distributive justice. The results highlight the greater need for workers to be valued and appreciated for who they are (consideration and esteem), rather than for what they do for their organization (distributive justice of rewards).},
owner = {vilhuber},
timestamp = {2016.11.22},
}
• S. Haney, A. Machanavajjhala, J. M. Abowd, M. Graham, M. Kutzbach, and L. Vilhuber, “Utility Cost of Formal Privacy for Releasing National Employer-Employee Statistics,” in Proceedings of the 2017 International Conference on Management of Data, 2017, pp. 1339-1354.
[DOI] [URL] [Bibtex]
@InProceedings{HaneySIGMOD2017,
author = {Samuel Haney and Ashwin Machanavajjhala and John M. Abowd and Matthew Graham and Mark Kutzbach and Lars Vilhuber},
title = {Utility Cost of Formal Privacy for Releasing National Employer-Employee Statistics},
booktitle = {Proceedings of the 2017 International Conference on Management of Data},
year = {2017},
series = {SIGMOD '17},
publisher = {ACM},
pages = {1339-1354},
doi = {10.1145/3035918.3035940},
acmid = {3035940},
url = {http://doi.acm.org/10.1145/3035918.3035940},
abstract = {National statistical agencies around the world publish tabular summaries based on combined employer-employee (ER-EE) data. The privacy of both individuals and business establishments that feature in these data are protected by law in most countries. These data are currently released using a variety of statistical disclosure limitation (SDL) techniques that do not reveal the exact characteristics of particular employers and employees, but lack provable privacy guarantees limiting inferential disclosures.
In this work, we present novel algorithms for releasing tabular summaries of linked ER-EE data with formal, provable guarantees of privacy. We show that state-of-the-art differentially private algorithms add too much noise for the output to be useful. Instead, we identify the privacy requirements mandated by current interpretations of the relevant laws, and formalize them using the Pufferfish framework. We then develop new privacy definitions that are customized to ER-EE data and satisfy the statutory privacy requirements. We implement the experiments in this paper on production data gathered by the U.S. Census Bureau. An empirical evaluation of utility for these data shows that for reasonable values of the privacy-loss parameter $\epsilon\geq$ 1, the additive error introduced by our provably private algorithms is comparable, and in some cases better, than the error introduced by existing SDL techniques that have no provable privacy guarantees. For some complex queries currently published, however, our algorithms do not have utility comparable to the existing traditional SDL algorithms. Those queries are fodder for future research.},
acmid = {3035940},
journal = {SIGMOD},
owner = {vilhuber},
timestamp = {2017.03.01},
}
• K. L. McKinney, A. S. Green, J. M. Abowd, and L. Vilhuber, “Total Error and Variability Measures with Integrated Disclosure Limitation for Quarterly Workforce Indicators and LEHD Origin Destination Employment Statistics in OnTheMap,” submitted, 2017.
[Bibtex]
@Article{McKinneyEtAl:submitted:2017,
author = {Kevin L. McKinney and Andrew S. Green and John M. Abowd and Lars Vilhuber},
title = {Total Error and Variability Measures with Integrated Disclosure Limitation for {Q}uarterly {W}orkforce {I}ndicators and {LEHD} {O}rigin {D}estination {E}mployment {S}tatistics in {OnTheMap}},
journal = {submitted},
year = {2017},
abstract = {We report results from the first comprehensive total quality evaluation of five major indicators in the U.S. Census Bureau's Longitudinal Employer-Household Dynamics (LEHD) Program Quarterly Workforce Indicators (QWI): total employment, beginning-of-quarter employment, full-quarter employment, total payroll, and average monthly earnings of full-quarter employees. Beginning-of-quarter employment is also the main tabulation variable in the LEHD Origin-Destination Employment Statistics (LODES) workplace reports as displayed in OnTheMap (OTM). The evaluation is conducted by generating multiple threads of the edit and imputation models used in the LEHD Infrastructure File System. These threads conform to the Rubin (1987) multiple imputation model, with each thread or implicate being the output of formal probability models that address coverage, edit, and imputation errors. Design-based sampling variability and finite population corrections are also included in the evaluation. We derive special formulas for the Rubin total variability and its components that are consistent with the disclosure avoidance system used for QWI and LODES/OTM workplace reports. These formulas allow us to publish the complete set of detailed total quality measures for QWI and LODES. The analysis reveals that the five publication variables under study are estimated very accurately for tabulations involving at least 10 jobs. Tabulations involving three to nine jobs have quality in the range generally deemed acceptable. Tabulations involving zero, one or two jobs, which are generally suppressed in the QWI and synthesized in LODES, have substantial total variability but their publication in LODES allows the formation of larger custom aggregations, which will in general have the accuracy estimated for tabulations in the QWI based on a similar number of workers.},
owner = {vilhuber},
timestamp = {2017.12.19},
}
• L. Vilhuber and C. Lagoze, “Making Confidential Data Part of Reproducible Research,” Chance, 2017.
[URL] [Bibtex]
@Article{chance:2017,
author = {Vilhuber, Lars and Lagoze, Carl},
title = {Making Confidential Data Part of Reproducible Research},
journal = {Chance},
year = {2017},
month = {09/2017},
url = {http://chance.amstat.org/2017/09/reproducible-research/},
owner = {vilhuber},
timestamp = {2017.10.02},
}

### 2016

• J. Miranda and L. Vilhuber, “Using partially synthetic microdata to protect sensitive cells in business statistics,” Statistical Journal of the International Association for Official Statistics, vol. 32, iss. 1, pp. 69-80, 2016.
[DOI] [Bibtex]
@article {MirandaVilhuber:Using:SJIAOS:2016,
title = {Using partially synthetic microdata to protect
author = {Javier Miranda and Lars Vilhuber},
journal = {Statistical Journal of the International Association for Official Statistics},
year=2016,
volume={32},
number={1},
pages={69-80},
doi={10.3233/SJI-160963},
abstract={We describe and analyze a method that blends records from both observed and synthetic microdata into public-use tabulations on establishment statistics. The resulting tables use synthetic data only in potentially sensitive cells. We describe different algorithms, and present preliminary results when applied to the Census Bureau's Business Dynamics Statistics and Synthetic Longitudinal Business Database, highlighting accuracy and protection afforded by the method when compared to existing public-use tabulations (with suppressions).},
}
• L. Vilhuber, J. M. Abowd, and J. P. Reiter, “Synthetic establishment microdata around the world,” Statistical Journal of the International Association for Official Statistics, vol. 32, iss. 1, pp. 65-68, 2016.
[DOI] [Bibtex]
@article{VilhuberAbowdReiter:Synthetic:SJIAOS:2016,
title = {Synthetic establishment microdata around the world},
journal = {Statistical Journal of the International Association for Official Statistics},
author = {Lars Vilhuber and John M. Abowd and Jerome P. Reiter},
year=2016,
volume={32},
number={1},
pages={65-68},
doi={10.3233/SJI-160964},
abstract={In contrast to the many public-use microdata samples available for individual and household data from many statistical agencies around the world, there are virtually no establishment or firm microdata available. In large part, this difficulty in providing access to business micro data is due to the skewed and sparse distributions that characterize business data. Synthetic data are simulated data generated from statistical models. We organized sessions at the 2015 World Statistical Congress and the 2015 Joint Statistical Meetings, highlighting work on synthetic establishment microdata. This overview situates those papers, published in this issue, within the broader literature.},
}

### 2014

• J. Drechsler and L. Vilhuber, “Synthetic Longitudinal Business Databases for International Comparisons,” in Privacy in Statistical Databases, J. Domingo-Ferrer, Ed., Springer International Publishing, 2014, vol. 8744, pp. 243-252.
[DOI] [URL] [Bibtex]
@InCollection{psd2014b,
Title = {Synthetic Longitudinal Business Databases for International Comparisons},
Author = {Drechsler, J\"org and Vilhuber, Lars},
Booktitle = {Privacy in Statistical Databases},
Publisher = {Springer International Publishing},
Year = {2014},
Editor = {Domingo-Ferrer, Josep},
Pages = {243-252},
Series = {Lecture Notes in Computer Science},
Volume = {8744},
Abstract = {International comparison studies on economic activity are often hampered by the fact that access to business microdata is very limited on an international level. A recently launched project tries to overcome these limitations by improving access to Business Censuses from multiple countries based on synthetic data. Starting from the synthetic version of the longitudinally edited version of the U.S. Business Register (the Longitudinal Business Database, LBD), the idea is to create similar data products in other countries by applying the synthesis methodology developed for the LBD to generate synthetic replicates that could be distributed without confidentiality concerns. In this paper we present some first results of this project based on German business data collected at the Institute for Employment Research.},
DOI = {10.1007/978-3-319-11257-2_19},
ISBN = {978-3-319-11256-5},
Keywords = {business data; confidentiality; international comparison; multiple imputation; synthetic},
URL = {http://dx.doi.org/10.1007/978-3-319-11257-2_19}
}
• J. Drechsler and L. Vilhuber, “A First Step Towards A German SynLBD: Constructing A German Longitudinal Business Database,” Statistical Journal of the IAOS: Journal of the International Association for Official Statistics, vol. 30, 2014.
[DOI] [URL] [Bibtex]
@Article{SJIAOS-2014b,
Title = {{A First Step Towards A {German} {SynLBD}: {C}onstructing A {G}erman {L}ongitudinal {B}usiness {D}atabase}},
Author = {J{\"o}rg Drechsler and Lars Vilhuber},
Journal = {Statistical Journal of the IAOS: Journal of the International Association for Official Statistics},
Year = {2014},
Volume = {30},
Abstract = {One major criticism against the use of synthetic data has been that the efforts necessary to generate useful synthetic data are so in- tense that many statistical agencies cannot afford them. We argue many lessons in this evolving field have been learned in the early years of synthetic data generation, and can be used in the development of new synthetic data products, considerably reducing the required in- vestments. The final goal of the project described in this paper will be to evaluate whether synthetic data algorithms developed in the U.S. to generate a synthetic version of the Longitudinal Business Database (LBD) can easily be transferred to generate a similar data product for other countries. We construct a German data product with infor- mation comparable to the LBD - the German Longitudinal Business Database (GLBD) - that is generated from different administrative sources at the Institute for Employment Research, Germany. In a fu- ture step, the algorithms developed for the synthesis of the LBD will be applied to the GLBD. Extensive evaluations will illustrate whether the algorithms provide useful synthetic data without further adjustment. The ultimate goal of the project is to provide access to multiple synthetic datasets similar to the SynLBD at Cornell to enable comparative studies between countries. The Synthetic GLBD is a first step towards that goal.},
DOI = {10.3233/SJI-140812},
Keywords = {confidentiality; comparative studies; US Longitudinal Business Database; synthetic data},
Owner = {vilhuber},
Timestamp = {2014.03.24},
URL = {http://iospress.metapress.com/content/X415V18331Q33150}
}
• C. Lagoze, L. Vilhuber, J. Williams, B. Perry, and W. C. Block, “CED2AR: The Comprehensive Extensible Data Documentation and Access Repository,” in ACM/IEEE Joint Conference on Digital Libraries (JCDL 2014), London, United Kingdom, 2014.
[Bibtex]
@InProceedings{LagozeJCDL2014,
Title = {CED2AR: The Comprehensive Extensible Data Documentation and Access Repository},
Author = {Carl Lagoze and Lars Vilhuber and Jeremy Williams and Benjamin Perry and William C. Block},
Booktitle = {ACM/IEEE Joint Conference on Digital Libraries (JCDL 2014)},
Year = {2014},
Month = {8th-12th September 2014},
Note = {Presented at the ACM/IEEE Joint Conference on Digital Libraries (JCDL 2014)},
Organization = {ACM/IEEE},
Abstract = {Social science researchers increasingly make use of data that is confidential because it contains linkages to the identities of people, corporations, etc. The value of this data lies in the ability to join the identifiable entities with external data such as genome data, geospatial information, and the like. However, the confidentiality of this data is a barrier to its utility and curation, making it difficult to fulfill US federal data management mandates and interfering with basic scholarly practices such as validation and reuse of existing results. We describe the complexity of the relationships among data that span a public and private divide. We then describe our work on the CED2AR prototype, a first step in providing researchers with a tool that spans this divide and makes it possible for them to search, access, and cite that data.},
Owner = {vilhuber},
Timestamp = {2014.07.09}
}
• J. Miranda and L. Vilhuber, “Using Partially Synthetic Data to Replace Suppression in the Business Dynamics Statistics: Early Results,” in Privacy in Statistical Databases, J. Domingo-Ferrer, Ed., Springer International Publishing, 2014, vol. 8744, pp. 232-242.
[DOI] [URL] [Bibtex]
@InCollection{psd2014a,
Title = {Using Partially Synthetic Data to Replace Suppression in the Business Dynamics Statistics: Early Results},
Author = {Miranda, Javier and Vilhuber, Lars},
Booktitle = {Privacy in Statistical Databases},
Publisher = {Springer International Publishing},
Year = {2014},
Editor = {Domingo-Ferrer, Josep},
Pages = {232-242},
Series = {Lecture Notes in Computer Science},
Volume = {8744},
Abstract = {The Business Dynamics Statistics is a product of the U.S. Census Bureau that provides measures of business openings and closings, and job creation and destruction, by a variety of cross-classifications (firm and establishment age and size, industrial sector, and geography). Sensitive data are currently protected through suppression. However, as additional tabulations are being developed, at ever more detailed geographic levels, the number of suppressions increases dramatically. This paper explores the option of providing public-use data that are analytically valid and without suppressions, by leveraging synthetic data to replace observations in sensitive cells.},
DOI = {10.1007/978-3-319-11257-2_18},
ISBN = {978-3-319-11256-5},
Keywords = {synthetic data; statistical disclosure limitation; time-series; local labor markets; gross job flows; confidentiality protection},
URL = {http://dx.doi.org/10.1007/978-3-319-11257-2_18}
}
• J. Miranda and L. Vilhuber, “Looking Back On Three Years Of Using The Synthetic LBD Beta,” Statistical Journal of the IAOS: Journal of the International Association for Official Statistics, vol. 30, 2014.
[DOI] [URL] [Bibtex]
@Article{SJIAOS-2014a,
Title = {{Looking Back On Three Years Of Using The {S}ynthetic {LBD} Beta}},
Author = {Miranda, Javier and Lars Vilhuber},
Journal = {Statistical Journal of the IAOS: Journal of the International Association for Official Statistics},
Year = {2014},
Volume = {30},
Abstract = {Distributions of business data are typically much more skewed than those for household or individual data and public knowledge of the underlying units is greater. As a results, national statistical offices (NSOs) rarely release establishment or firm-level business microdata due to the risk to respondent confidentiality. One potential approach for overcoming these risks is to release synthetic data where the establishment data are simulated from statistical models designed to mimic the distributions of the real underlying microdata. The US Census Bureau?s Center for Economic Studies in collaboration with Duke University, the National Institute of Statistical Sciences, and Cornell University made available a synthetic public use file for the Longitudinal Business Database (LBD) comprising more than 20 million records for all business establishment with paid employees dating back to 1976. The resulting product, dubbed the SynLBD, was released in 2010 and is the first-ever comprehensive business microdata set publicly released in the United States including data on establishments employment and payroll, birth and death years, and industrial classification. This pa- per documents the scope of projects that have requested and used the SynLBD.},
DOI = {10.3233/SJI-140811},
Keywords = {confidentiality; comparative studies; US Longitudinal Business Database; synthetic data},
Owner = {vilhuber},
Timestamp = {2014.03.24},
URL = {http://iospress.metapress.com/content/X415V18331Q33150}
}

### 2013

• J. M. Abowd, M. J. Schneider, and L. Vilhuber, “Differential Privacy Applications to Bayesian and Linear Mixed Model Estimation,” Journal of Privacy and Confidentiality, vol. 5, iss. 1, 2013.
[PDF] [URL] [Bibtex]
@Article{AbowdSchneiderVilhuber2013,
Title = {Differential Privacy Applications to Bayesian and Linear Mixed Model Estimation},
Author = {Abowd, John M. and Schneider, Matthew J. and Vilhuber, Lars},
Journal = {Journal of Privacy and Confidentiality},
Year = {2013},
Note = {Article 4},
Number = {1},
Volume = {5},
Abstract = {We consider a particular maximum likelihood estimator (MLE) and a computationally intensive Bayesian method for differentially private estimation of the linear mixed-effects model (LMM) with normal random errors. The LMM is important because it is used in small-area estimation and detailed industry tabulations that present significant challenges for confidentiality protection of the underlying data. The differentially private MLE performs well compared to the regular MLE, and deteriorates as the protection increases for a problem in which the small-area variation is at the county level. More dimensions of random effects are needed to adequately represent the time dimension of the data, and for these cases the differentially private MLE cannot be computed. The direct Bayesian approach for the same model uses an informative, reasonably diffuse prior to compute the posterior predictive distribution for the random effects. The empirical differential privacy of this approach is estimated by direct computation of the relevant odds ratios after deleting influential observations according to various criteria.},
File = {AbowdSchneiderVilhuber2013.pdf:A/AbowdSchneiderVilhuber2013.pdf:PDF},
Owner = {vilhuber},
Timestamp = {2013.07.24},
URL = {https://doi.org/10.29012/jpc.v5i1.627}
}
• J. Drechsler and L. Vilhuber, “Replicating the Synthetic LBD with German Establishment Data,” Proceedings 59th ISI World Statistics Congress, 25-30 August 2013, Hong Kong (Session STS062), pp. 2291-2296, 2013.
[URL] [Bibtex]
@Article{ISI2013-3,
Title = {Replicating the {S}ynthetic {LBD} with {G}erman Establishment Data},
Author = {J{\"o}rg Drechsler and Lars Vilhuber},
Journal = {Proceedings 59th ISI World Statistics Congress, 25-30 August 2013, Hong Kong (Session STS062) },
Year = {2013},
Pages = {2291-2296},
ISBN = {978-90-73592-34-6},
URL = {http://2013.isiproceedings.org},
Urldate = {2014-03-24}
}
• C. Lagoze, W. C. Block, J. Williams, J. M. Abowd, and L. Vilhuber, “Data Management of Confidential Data,” International Journal of Digital Curation, vol. 8, iss. 1, pp. 265-278, 2013.
[DOI] [Bibtex]
@Article{DBLP:journals/ijdc/LagozeBWAV13,
Title = {Data Management of Confidential Data},
Author = {Carl Lagoze and William C. Block and Jeremy Williams and John M. Abowd and Lars Vilhuber},
Journal = {International Journal of Digital Curation},
Year = {2013},
Number = {1},
Pages = {265-278},
Volume = {8},
Abstract = {Social science researchers increasingly make use of data that is confidential because it contains linkages to the identities of people, corporations, etc. The value of this data lies in the ability to join the identifiable entities with external data such as genome data, geospatial information, and the like. However, the confidentiality of this data is a barrier to its utility and curation, making it difficult to fulfill US federal data management mandates and interfering with basic scholarly practices such as validation and reuse of existing results. We describe the complexity of the relationships among data that span a public and private divide. We then describe our work on the CED2AR prototype, a first step in providing researchers with a tool that spans this divide and makes it possible for them to search, access, and cite that data.},
Bibsource = {DBLP, http://dblp.uni-trier.de},
Comment = {Presented at 8th International Digital Curation Conference 2013, Amsterdam. See also http://hdl.handle.net/1813/30924},
DOI = {10.2218/ijdc.v8i1.259},
Owner = {vilhuber},
Timestamp = {2013.10.09}
}
• C. Lagoze, W. C. Block, J. Williams, and L. Vilhuber, “Encoding Provenance of Social Science Data: Integrating PROV with DDI,” in 5th Annual European DDI User Conference, 2013.
[Bibtex]
@InProceedings{LagozeEtAl2013,
Title = {Encoding Provenance of Social Science Data: Integrating PROV with DDI},
Author = {Carl Lagoze and William C. Block and Jeremy Williams and Lars Vilhuber},
Booktitle = {5th Annual European DDI User Conference},
Year = {2013},
Abstract = {Provenance is a key component of evaluating the integrity and reusability of data for scholarship. While recording and providing access provenance has always been important, it is even more critical in the web environment in which data from distributed sources and of varying integrity can be combined and derived. The PROV model, developed under the auspices of the W3C, is a foundation for semantically-rich, interoperable, and web-compatible provenance metadata. We report on the results of our experimentation with integrating the PROV model into the DDI metadata for a complex, but characteristic, example social science data. We also present some preliminary thinking on how to visualize those graphs in the user interface.},
Keywords = {Metadata, Provenance, DDI, eSocial Science},
Owner = {vilhuber},
Timestamp = {2013.10.09}
}
• C. Lagoze, J. Willliams, and L. Vilhuber, “Encoding Provenance Metadata for Social Science Datasets,” in Metadata and Semantics Research, 2013, pp. 123-134.
[DOI] [URL] [Bibtex]
@InProceedings{LagozeEtAl2013b,
Title = {Encoding Provenance Metadata for Social Science Datasets},
Author = {Lagoze, Carl and Willliams, Jeremy and Vilhuber, Lars},
Booktitle = {Metadata and Semantics Research},
Year = {2013},
Editor = {Garoufallou, Emmanouel and Greenberg, Jane},
Pages = {123-134},
Publisher = {Springer International Publishing},
Series = {Communications in Computer and Information Science},
Volume = {390},
Abstract = {Recording provenance is a key requirement for data-centric scholarship, allowing researchers to evaluate the integrity of source data sets and reproduce, and thereby, validate results. Provenance has become even more critical in the web environment in which data from distributed sources and of varying integrity can be combined and derived. Recent work by the W3C on the PROV model provides the foundation for semantically-rich, interoperable, and web-compatible provenance metadata. We apply that model to complex, but characteristic, provenance examples of social science data, describe scenarios that make scholarly use of those provenance descriptions, and propose a manner for encoding this provenance metadata within the widely-used DDI metadata standard.},
DOI = {10.1007/978-3-319-03437-9_13},
ISBN = {978-3-319-03436-2},
Keywords = {Metadata; Provenance; DDI; eSocial Science},
Owner = {vilhuber},
Timestamp = {2013.11.05},
URL = {http://dx.doi.org/10.1007/978-3-319-03437-9_13}
}

### 2012

• J. M. Abowd, L. Vilhuber, and W. Block, “A Proposed Solution to the Archiving and Curation of Confidential Scientific Inputs,” in Privacy in Statistical Databases, , 2012, pp. 216-225.
[PDF] [DOI] [URL] [Bibtex]
@InCollection{AbowdVilhuberBlock2012,
Title = {A Proposed Solution to the Archiving and Curation of Confidential Scientific Inputs},
Author = {John M. Abowd and Lars Vilhuber and William Block},
Booktitle = {Privacy in Statistical Databases},
Year = {2012},
Pages = {216-225},
Bibsource = {DBLP, http://dblp.uni-trier.de},
Crossref = {DBLP:conf/psd/2012},
DOI = {10.1007/978-3-642-33627-0_17},
ISBN = {978-3-642-33626-3},
Keywords = {Data Archive; Data Curation; Statistical Disclosure Limitation; Privacy-preserving Datamining},
Owner = {vilhuber},
Timestamp = {2012.09.26},
URL = {http://dx.doi.org/10.1007/978-3-642-33627-0_17}
}
• J. M. Abowd and L. Vilhuber, “Did the Housing Price Bubble Clobber Local Labor Market Job and Worker Flows When It Burst?,” American Economic Review, vol. 102, iss. 3, pp. 589-93, 2012.
[PDF] [DOI] [URL] [Bibtex]
@Article{AbowdVilhuber2012,
Title = {Did the Housing Price Bubble Clobber Local Labor Market Job and Worker Flows When It Burst?},
Author = {John M. Abowd and Lars Vilhuber},
Journal = {American Economic Review},
Year = {2012},
Month = {May},
Number = {3},
Pages = {589-93},
Volume = {102},
Abstract = { We use the Census Bureau's Quarterly Workforce Indicators and the Federal Housing Finance Agency's House Price Indices to study the effects of the housing price bubble on local labor markets. We show that the 35 MSAs in the top decile of the house price boom were most severely impacted. Their stable job employment fell much more than the national average. Their real wage rates did not fall as fast as the national average. Accessions fell much faster than average while separations were constant. Job creations fell substantially while destructions rose slightly.},
DOI = {10.1257/aer.102.3.589},
Owner = {vilhuber},
Timestamp = {2013.01.11},
URL = {http://ideas.repec.org/a/aea/aecrev/v102y2012i3p589-93.html}
}
• J. M. Abowd and L. Vilhuber, “Did the Housing Price Bubble Clobber Local Labor Market Job and Worker Flows When It Burst? – Online Appendix,” American Economic Review, vol. 102, iss. 3, pp. 589-93, 2012.
[PDF] [DOI] [URL] [Bibtex]
@Article{aea-pp-abowd-vilhuber-online-appendix,
Title = {Did the Housing Price Bubble Clobber Local Labor Market Job and Worker Flows When It Burst? - Online Appendix},
Author = {John M. Abowd and Lars Vilhuber},
Journal = {American Economic Review},
Year = {2012},
Month = {May},
Number = {3},
Pages = {589-93},
Volume = {102},
Abstract = {This is the appendix to Abowd and Vilhuber (2012).},
DOI = {10.1257/aer.102.3.589},
Owner = {vilhuber},
Timestamp = {2013.01.11},
URL = {https://www.aeaweb.org/aer/data/may2012/2012_2790_app.pdf}
}

### 2011

• J. M. Abowd and L. Vilhuber, “National Estimates of Gross Employment and Job Flows from the Quarterly Workforce Indicators with Demographic and Industry Detail,” Journal of Econometrics, vol. 161, pp. 82-99, 2011.
[PDF] [DOI] [Bibtex]
@Article{AbowdVilhuber2010,
Title = {National Estimates of Gross Employment and Job Flows from the Quarterly Workforce Indicators with Demographic and Industry Detail},
Author = {John M. Abowd and Lars Vilhuber},
Journal = {Journal of Econometrics},
Year = {2011},
Pages = {82-99},
Volume = {161},
Abstract = {The Quarterly Workforce Indicators (QWI) are local labor market data produced and released every quarter by the United States Census Bureau. Unlike any other local labor market series produced in the US or the rest of the world, QWI measure employment flows for workers (accession and separations), jobs (creations and destructions) and earnings for demographic subgroups (age and gender), economic industry (NAICS industry groups), detailed geography (block (experimental), county, Core-Based Statistical Area, and Workforce Investment Area), and ownership (private, all) with fully interacted publication tables. The current QWI data cover 47 states, about 98\% of the private workforce in those states, and about 92\% of all private employment in the entire economy. State participation is sufficiently extensive to permit us to present the first national estimates constructed from these data. We focus on worker, job, and excess (churning) reallocation rates, rather than on levels of the basic variables. This permits a comparison to existing series from the Job Openings and Labor Turnover Survey and the Business Employment Dynamics Series from the Bureau of Labor Statistics (BLS). The national estimates from the QWI are an important enhancement to existing series because they include demographic and industry detail for both worker and job flow data compiled from underlying micro-data that have been integrated at the job and establishment levels by the Longitudinal Employer-Household Dynamics Program at the Census Bureau. The estimates presented herein were compiled exclusively from public-use data series and are available for download.},
Comment = {Final version published online: 4-MAR-2011},
DOI = {10.1016/j.jeconom.2010.09.008},
File = {AbowdVilhuber2010.pdf:A/AbowdVilhuber2010.pdf:PDF},
Owner = {vilhuber},
Timestamp = {2010.04.04}
}
• J. M. Abowd and L. Vilhuber, “Science, Confidentiality, and the Public Interest,” Chance, vol. 24, iss. 3, pp. 58-62, 2011.
[DOI] [URL] [Bibtex]
@Article{Chance2011,
Title = {Science, Confidentiality, and the Public Interest},
Author = {John M. Abowd and Lars Vilhuber},
Journal = {Chance},
Year = {2011},
Number = {3},
Volume = {24},
Pages = {58-62},
DOI = {10.1080/09332480.2011.10739876},
URL = {http://dx.doi.org/10.1080/09332480.2011.10739876},
}

### 2009

• J. M. Abowd, K. L. McKinney, and L. Vilhuber, “The link between human capital, mass layoffs, and firm deaths,” in Producer Dynamics: New Evidence from Micro Data, T. Dunne, B. J. Jensen, and M. J. Roberts, Eds., University of Chicago Press, 2009.
[PDF] [URL] [Bibtex]
@InBook{AbowdEtAl2009c,
Title = {The link between human capital, mass layoffs, and firm deaths},
Author = {Abowd, John M. and McKinney, Kevin L. and Vilhuber, Lars},
Booktitle = {Producer Dynamics: New Evidence from Micro Data},
Publisher = {University of Chicago Press},
Year = {2009},
Editor = {Timothy Dunne and Jensen, J. Bradford and Mark J. Roberts},
Crossref = {DunneJensenRoberts2009},
File = {AbowdMcKinneyVilhuber2005.pdf:L/LEHD/AbowdMcKinneyVilhuber2005.pdf:PDF},
Owner = {vilhuber},
Timestamp = {2007.01.11},
URL = {http://www.nber.org/chapters/c0497/}
}
• J. M. Abowd, B. E. Stephens, L. Vilhuber, F. Andersson, K. L. McKinney, M. Roemer, and S. D. Woodcock, “The LEHD Infrastructure Files and the Creation of the Quarterly Workforce Indicators,” in Producer Dynamics: New Evidence from Micro Data, T. Dunne, B. J. Jensen, and M. J. Roberts, Eds., University of Chicago Press, 2009.
[PDF] [URL] [Bibtex]
@InBook{AbowdEtAl2009,
Title = {The {LEHD} Infrastructure Files and the Creation of the {Q}uarterly {W}orkforce {I}ndicators},
Author = {John M. Abowd and Bryce E. Stephens and Lars Vilhuber and Fredrik Andersson and Kevin L. McKinney and Marc Roemer and Simon D. Woodcock},
Booktitle = {Producer Dynamics: New Evidence from Micro Data},
Publisher = {University of Chicago Press},
Year = {2009},
Editor = {Timothy Dunne and Jensen, J. Bradford and Mark J. Roberts},
Crossref = {DunneJensenRoberts2009},
File = {AbowdStephensVilhuber2005-LEHD-final.pdf:L/LEHD/AbowdStephensVilhuber2005-LEHD-final.pdf:PDF},
Timestamp = {2007.03.13},
URL = {http://www.nber.org/chapters/c0485}
}
• B. Dostie, K. L. McKinney, and L. Vilhuber, “Using linked employer-employee data to investigate the speed of adjustment in downsizing firms in Canada and the US,” in International Census Research Data Center Conference, Ithaca, NY, 2009.
[Bibtex]
@Conference{DostieMcKinneyVilhuber2009,
Title = {Using linked employer-employee data to investigate the speed of adjustment in downsizing firms in Canada and the US},
Author = {Dostie, Benoit and McKinney, Kevin L. and Vilhuber, Lars},
Booktitle = { International Census Research Data Center Conference},
Year = {2009},
Month = {October},
Abstract = {When firms are faced with a demand shock, adjustment can take many forms. Firms can adjust physical capital, human capital, or
both. The speed of adjustment may differ as well: costs of adjustment, the type of shock, the legal and economic enviroment all matter.
In this paper, we focus on firms that downsized between 1992 and 1997, but ultimately survive, and investigate how the human capital distribution within
a firm influences the speed of adjustment, {\it ceteris paribus}. In other words, when do firms use mass layoffs instead of attrition to adjust the level
of employment.
We combine worker-level wage records and measures of human capital with firm-level characteristics of the production function, and use levels and
changes in these variables to characterize the choice of adjustment method and speed. Firms are described/compared up to 9 years prior to death. We also
consider how workers fare after leaving downsizing firms, and analyze if observed differences in post-separation outcomes of workers provide clues to
File = {McKinneyVilhuber2006-ESEM2006.pdf:/home/vilhuber/Textes/Papers/Census/CAFE-displacement-death/releases/2006-05-24/McKinneyVilhuber2006-ESEM2006.pdf:PDF},
Institution = {U.S. Census Bureau, LEHD and Cornell University},
Journal = {Conference on Research in Income and Wealth},
Owner = {vilhuber},
Type = {mimeo}
}
• L. Vilhuber, “Adjusting Imperfect Data: Overview and Case Studies,” in The Structure of Wages: An International Comparison, E. P. Lazear and K. L. Shaw, Eds., University of Chicago Press, 2009, pp. 59-80.
[URL] [Bibtex]
@InBook{NBERc2366,
Title = {Adjusting Imperfect Data: Overview and Case Studies},
Author = {Lars Vilhuber},
Editor = {Edward P. Lazear and Kathryn L. Shaw},
Pages = {59-80},
Publisher = {University of Chicago Press},
Year = {2009},
Month = {January},
Type = {Book},
Booktitle = {The Structure of Wages: An International Comparison},
Institution = {National Bureau of Economic Research},
URL = {http://www.nber.org/chapters/c2366}
}

### 2008

• J. Abowd and L. Vilhuber, “How Protective Are Synthetic Data,” in Privacy in Statistical Database, J. Domingo-Ferrer and Y. Sayg{i}n, Eds., Springer Berlin Heidelberg, 2008, vol. 5262, pp. 239-246.
[PDF] [DOI] [URL] [Bibtex]
@InCollection{AbowdVilhuber2008,
Title = {How Protective Are Synthetic Data},
Author = {John Abowd and Lars Vilhuber},
Booktitle = {Privacy in Statistical Database},
Publisher = {Springer Berlin Heidelberg},
Year = {2008},
Editor = {Domingo-Ferrer, Josep and Sayg{\i}n, Y\"ucel},
Month = {September},
Pages = {239-246},
Series = {Lecture Notes in Computer Science},
Volume = {5262},
DOI = {10.1007/978-3-540-87471-3_20},
Owner = {vilhuber},
Timestamp = {2009.01.10},
URL = {http://dx.doi.org/10.1007/978-3-540-87471-3_20}
}
• J. Cloutier and L. Vilhuber, “Procedural justice criteria in salary determination,” Journal of Managerial Psychology, vol. 23, iss. 6, pp. 713-740, 2008.
[DOI] [URL] [Bibtex]
@Article{CloutierVilhuber2008,
Title = {Procedural justice criteria in salary determination},
Author = {Julie Cloutier and Lars Vilhuber},
Journal = {Journal of Managerial Psychology},
volume = {23},
number = {6},
pages = {713-740},
year = {2008},
doi = {10.1108/02683940810894765},
URL = {https://doi.org/10.1108/02683940810894765},
eprint = {https://doi.org/10.1108/02683940810894765},
abstract = { Purpose – The purpose of this research is to identify the dimensionality of the procedural justice construct and the criteria used by employees to assess procedural justice, in the context of salary determination.Design/methodology/approach – Based on a survey of 297 Canadian workers, the paper uses confirmatory factor analysis (CFA) to test the dimensionality and the discriminant and convergent validity of our procedural justice construct. Convergent and predictive validity are also tested using hierarchical linear regressions.Findings – The paper shows the multidimensionality of the procedural justice construct: justice of the salary determination process is assessed through the perceived characteristics of allocation procedures, the perceived characteristics of decision‐makers, and system transparency.Research limitations/implications – Results could be biased towards acceptance; this is discussed. The results also suggest possible extensions to the study.Practical implications – Knowledge of the justice standards improves the ability of organizations to effectively manage the salary determination process and promote its acceptance among employees. Emphasizes the need to adequately manage the selection, training, and perception of decision makers.Originality/value – The paper identifies the standards of procedural justice for salary determination processes. It contributes to the theoretical literature by providing a new multidimensional conceptualization, which helps to better understand the psychological process underlying the perception of procedural justice. The presence of a dimension associated with decision makers is novel and critical for compensation studies. }
}
• L. Dragoset and L. Vilhuber, “How Did Universal Primary Education Affect Returns to Education and Labor Market Participation in Uganda?,” in YOUTH IN AFRICA’S LABOR MARKET, M. Garcia and J. Fares, Eds., 1818 H ST NW, WASHINGTON, DC 20433 USA: WORLD BANK INST, 2008, pp. 263-280.
[DOI] [Bibtex]
@incollection{DragosetVilhuber2008,
Author = {Dragoset, Lisa and Vilhuber, Lars},
Editor = {Garcia, M and Fares, J},
Title = {How Did Universal Primary Education Affect Returns to Education and
Labor Market Participation in Uganda?},
Booktitle = {YOUTH IN AFRICA'S LABOR MARKET},
Year = {2008},
Pages = {263-280},
Publisher = {WORLD BANK INST},
Address = {1818 H ST NW, WASHINGTON, DC 20433 USA},
Type = {Article; Book Chapter},
DOI = {10.1596/978-0-8213-6884-8_ch11},
ISBN = {978-0-8213-6885-5},
Keywords-Plus = {CHILD LABOR; SCHOOL EXPANSION; RURAL PAKISTAN; QUALITY; INVESTMENT;
QUANTITY; PRODUCTIVITY; ALLOCATION; ATTAINMENT; COUNTRIES},
ORCID-Numbers = {Vilhuber, Lars/0000-0001-5733-8932},
}
• A. Machanavajjhala, D. Kifer, J. M. Abowd, J. Gehrke, and L. Vilhuber, “Privacy: Theory meets practice on the map,” International Conference on Data Engineering (ICDE), p. 277–286, 2008.
[DOI] [URL] [Bibtex]
@Article{Ashwin2008,
Title = {Privacy: {T}heory meets practice on the map},
Author = {Ashwin Machanavajjhala and Daniel Kifer and John M. Abowd and Johannes Gehrke and Lars Vilhuber},
Journal = {International Conference on Data Engineering (ICDE)},
Year = {2008},
Pages = {277--286},
Acmid = {1547184},
DOI = {10.1109/ICDE.2008.4497436},
Numpages = {10},
Publisher = {IEEE Computer Society},
URL = {http://dx.doi.org/10.1109/ICDE.2008.4497436}
}

### 2006

• K. L. McKinney and L. Vilhuber, “Using linked employer-employee data to investigate the speed of adjustment in downsizing firms,” in Conference on the Analysis of Firms and Employees (CAFE), Nuremberg, Germany, 2006.
[Bibtex]
@Conference{McKinneyVilhuber2006,
Title = {Using linked employer-employee data to investigate the speed of adjustment in downsizing firms},
Author = {McKinney, Kevin L. and Vilhuber, Lars},
Booktitle = {Conference on the Analysis of Firms and Employees (CAFE)},
Year = {2006},
Month = {September},
Abstract = {When firms are faced with a demand shock, adjustment can take many forms. Firms can adjust physical capital, human capital, or
both. The speed of adjustment may differ as well: costs of adjustment, the type of shock, the legal and economic enviroment all matter.
In this paper, we focus on firms that downsized between 1992 and 1997, but ultimately survive, and investigate how the human capital distribution within
a firm influences the speed of adjustment, {\it ceteris paribus}. In other words, when do firms use mass layoffs instead of attrition to adjust the level
of employment.
We combine worker-level wage records and measures of human capital with firm-level characteristics of the production function, and use levels and
changes in these variables to characterize the choice of adjustment method and speed. Firms are described/compared up to 9 years prior to death. We also
consider how workers fare after leaving downsizing firms, and analyze if observed differences in post-separation outcomes of workers provide clues to
File = {McKinneyVilhuber2006-ESEM2006.pdf:/home/vilhuber/Textes/Papers/Census/CAFE-displacement-death/releases/2006-05-24/McKinneyVilhuber2006-ESEM2006.pdf:PDF},
Institution = {U.S. Census Bureau, LEHD and Cornell University},
Journal = {Conference on Research in Income and Wealth},
Owner = {vilhuber},
Type = {mimeo}
}

### 2005

• J. M. Abowd and L. Vilhuber, “The Sensitivity of Economic Statistics to Coding Errors in Personal Identifiers,” , vol. 23, iss. 2, pp. 133-152, 2005.
[URL] [Bibtex]
@Article{AbowdVilhuber2005,
Title = {The Sensitivity of Economic Statistics to Coding Errors in Personal Identifiers},
Author = {John M. Abowd and Lars Vilhuber},
Journal = jbes,
Year = {2005},
Month = {April},
Number = {2},
Pages = {133-152},
Volume = {23},
File = {AbowdVilhuber2005.pdf:A/AbowdVilhuber2005.pdf:PDF;tp-2002-17.pdf:L/LEHD/tp-2002-17.pdf:PDF},
URL = {http://www.jstor.org/stable/27638803}
}

### 2004

• H. Holzer, J. Lane, and L. Vilhuber, “Escaping poverty for low-wage workers: The role of employer characteristics and changes,” Industrial and Labor Relations Review, vol. 57, iss. 4, 2004.
[DOI] [URL] [Bibtex]
@Article{HolzerLaneVilhuber2004,
Title = {Escaping poverty for low-wage workers: {T}he role of employer characteristics and changes},
Author = {Harry Holzer and Julia Lane and Lars Vilhuber},
Journal = {Industrial and Labor Relations Review},
Year = {2004},
Month = {July},
Number = {4},
Volume = {57},
Owner = {vilhuber},
url = {http://journals.sagepub.com/doi/pdf/10.1177/001979390405700405},
alturl = {http://www.jstor.org/stable/4126683},
doi = {10.1177/001979390405700405},
abstract = {Using a unique dataset based on individual Unemployment Insurance wage records for Illinois in the 1990s that are matched to other Census data, the authors analyze the extent to which escape from or entry into low earnings among adult workers was associated with changes in their employers and firm characteristics. The results show considerable mobility into and out of low earnings status, even for adults. They indicate that job changes were an important part of the process by which workers escaped or entered low-wage status, and that changes in employer characteristics help to account for these job changes. Matches between personal and firm characteristics also contributed to observed earnings outcomes.}
}
• D. N. Margolis, E. Plug, V. Simonnet, and LarsVilhuber, “Early Career Experiences and Later Career Outcomes: An InternationalComparison.” , 2004, pp. 90-117.
[Bibtex]
@InBook{MargolisEtAl2004,
Title = {Early Career Experiences and Later Career Outcomes: {A}n InternationalComparison},
Author = {David N. Margolis and Erik Plug and V{\'e}ronique Simonnet and LarsVilhuber},
Chapter = {5},
Pages = {90-117},
Year = {2004},
Crossref = {Sofer2004}
}

### 2001

• D. N. Margolis, V. Simonnet, and L. Vilhuber, “Early Career Experiences and Later Career Outcomes: Comparing the United States, France and Germany,” Vierteljahrshefte zur Wirtschaftsforschung, vol. 70, iss. 1, pp. 31-38, 2001.
[DOI] [URL] [Bibtex]
@Article{MargolisEtAl2001,
Title = {Early Career Experiences and Later Career Outcomes: {C}omparing the {U}nited {S}tates, {F}rance and {G}ermany},
Author = {David N. Margolis and V{\'e}ronique Simonnet and Lars Vilhuber},
journal = {Vierteljahrshefte zur Wirtschaftsforschung},
altJournal = {Quarterly Journal for Economic Research},
Year = {2001},
Pages = {31-38},
issn = {1861-1559},
number = {1},
volume = {70},
url = {http://hdl.handle.net/10419/99179},
doi = {10.3790/vjh.70.1.31},
abstract = {This paper explores the links between individuals' early career experiences and their labor market outcomes 5 to 20 years later using data from France, (western) Germany, and the United States. Relative to most of the literature, we consider a large set of measures of men's early career experiences and later career outcomes. Our results differ significantly across countries. Labor market outcomes in Germany are consistent with a dual labor market model. In the case of American workers, either the market learns about unobservable worker characteristics over time or the implicit contracts established at the start of the career are increasingly renegotiated over time. Unobserved heterogeneity in individuals' networks of labor market contacts is consistent with our results for France. These results reflect optimal firm responses to the different institutional environments in each country in the presence of ex ante imperfect information concerning young workers.}
}
• L. Vilhuber, “La spécificité de la formation en milieu de travail : un survol des contributions théoriques et empiriques récentes,,” L’Actualité économique, Revue d’analyse économique, vol. 77, iss. 1, 2001.
[Bibtex]
@Article{Vilhuber2001,
Title = {La sp{\'e}cificit{\'e} de la formation en milieu de travail : un survol des contributions th{\'e}oriques et empiriques r{\'e}centes,},
Author = {Lars Vilhuber},
Journal = {L'Actualit{\'e} {\'e}conomique, Revue d'analyse {\'e}conomique},
Year = {2001},
Month = {March},
Number = {1},
Volume = {77}
}

### 1999

• L. Vilhuber, “Continuous Training and sectoral mobility in Germany: Evidence from the 90s,” Vierteljahresheft für Wirtschaftsforschung, vol. 68, iss. 2, pp. 209-214, 1999.
[URL] [Bibtex]
@Article{Vilhuber99a,
Title = {Continuous Training and sectoral mobility in {G}ermany: {E}vidence from the 90s},
Author = {Lars Vilhuber},
journal = {Vierteljahresheft f{\"u}r Wirtschaftsforschung},
altJournal = {Quarterly Journal of Economic Research},
issn = {0340-1707},
Year = {1999},
volume = {68},
number = {2},
pages = {209-214},
Abstract = {see Vilhuber99b},
Mylibrary = {my own...},
url = {http://hdl.handle.net/10419/141240},
}

## Working papers

### 2019

• J. Abowd, I. Schmutte, W. Sexton, and L. Vilhuber, “Introductory Readings in Formal Privacy for Economists,” 2019.
[DOI] [URL] [Bibtex]
@techreport{formalprivacy:zenodo:2019,
author = {John Abowd and
Ian Schmutte and
William Sexton and
Lars Vilhuber},
title = {{Introductory Readings in Formal Privacy for
Economists}},
note = {{Supported by Alfred P. Sloan Foundation Grant
G-2015-13903 and NSF Grant SES-1131848}},
month = apr,
year = 2019,
doi = {10.5281/zenodo.2621345},
url = {https://doi.org/10.5281/zenodo.2621345}
}
• C. Lagoze and L. Vilhuber, “metajelo: A metadata package for journals to support external linked objects,” Labor Dynamics Institute, Document 52, 2019.
[URL] [Bibtex]
@TechReport{VilhuberLagoze2019,
Title = {{m}etajelo: {A} metadata package for journals to support external linked objects},
Author = {Carl Lagoze and Lars Vilhuber},
Institution = {Labor Dynamics Institute},
Year = {2019},
Month = {April},
Number = {52},
Type = {Document},
Abstract = {We propose a metadata package that is intended to provide academic journals with a lightweight means of registering, at the time of publication, the existence and disposition of supplementary materials. Information about the supplementary materials is, in most cases, critical for the reproducibility and replicability of scholarly results. In many instances, these materials are curated by a third party, which may or may not follow developing standards for the identification and description of those materials. As such, the vocabulary described here complements existing initiatives that specify vocabularies to describe the supplementary materials or the repositories and archives in which they have been deposited. Where possible, it reuses elements of relevant other vocabularies, facilitating coexistence with them. Furthermore, it provides an “at publication” record of reproducibility characteristics of a particular article that has been selected for publication. The proposed metadata package documents the key characteristics that journals care about in the case of supplementary materials that are held by third parties: existence, accessibility, and permanence. It does so in a robust, time-invariant fashion at the time of publication, when the editorial decisions are made. It also allows for better documentation of less accessible (non-public data), by treating it symmetrically from the point of view of the journal, therefore increasing the transparency of what up until now has been very opaque.},
Owner = {vilhuber},
Timestamp = {2019.04.10},
URL = {http://digitalcommons.ilr.cornell.edu/ldi/52/}
}
• L. Vilhuber and W. Block, “Outcomes Report of the Cornell Node of the NSF-Census Research Network,” , Report , 2019.
[URL] [Bibtex]
@techreport{VilhuberBlock2019,
timestamp = {2019-04-10T00:58:56Z},
type = {Report},
title = {Outcomes Report of the {{Cornell Node}} of the {{NSF}}-{{Census Research Network}}},
abstract = {Description and List of Outcomes of the Cornell node of the NSF-Census Research Network.},
urldate = {2019-04-10},
url = {https://hdl.handle.net/1813/65011},
author = {Vilhuber, Lars and Block, William},
month = jan,
year = {2019},
file = {Full Text PDF:/home/vilhuber/Zotero/storage/AGTYI8RG/Vilhuber and Block - 2019 - Outcomes report Cornell Node of the NSF-Census R.pdf:application/pdf;Snapshot:/home/vilhuber/Zotero/storage/JPN6HF5W/65011.html:text/html}
}

### 2018

• J. M. Abowd, I. M. Schmutte, and L. Vilhuber, “Disclosure Limitation and Confidentiality Protection in Linked Data,” Center for Economic Studies, U.S. Census Bureau, Working Papers 18-07, 2018.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:18-07,
author={John M. Abowd and Ian M. Schmutte and Lars Vilhuber},
title={{Disclosure Limitation and Confidentiality Protection in Linked Data}},
year=2018,
month=Jan,
institution={Center for Economic Studies, U.S. Census Bureau},
type={Working Papers},
url={https://ideas.repec.org/p/cen/wpaper/18-07.html},
number={18-07},
keywords={},
doi={},
}
• M. King and Working Group Participants, “Data Sharing Governance and Management,” Administrative Data Research Facilities Network, Working Group Report , 2018.
[URL] [Bibtex]
@techreport{adrf-working,
title = {Data Sharing Governance and Management},
author = {Monica King and {Working Group Participants}},
institution = {Administrative Data Research Facilities Network},
type = {Working Group Report},
year = {2018},
url = {https://docs.wixstatic.com/ugd/e35e20_33eaf93b681846248aac487e6f23e85c.pdf},
}
• L. Vilhuber, “LEHD Infrastructure S2014 files in the FSRDC,” Center for Economic Studies, U.S. Census Bureau, Working Papers 18-27, 2018.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:18-27,
author={Lars Vilhuber},
title={{LEHD Infrastructure S2014 files in the FSRDC}},
year=2018,
month=May,
institution={Center for Economic Studies, U.S. Census Bureau},
type={Working Papers},
url={https://ideas.repec.org/p/cen/wpaper/18-27.html},
number={18-27},
abstract={The Longitudinal Employer-Household Dynamics (LEHD) Program at the U.S. Census Bureau, with the support of several national research agencies, maintains a set of infrastructure files using administrative data provided by state agencies, enhanced with information from other administrative data sources, demographic and economic (business) surveys and censuses. The LEHD Infrastructure Files provide a detailed and comprehensive picture of workers, employers, and their interaction in the U.S. economy. This document describes the structure and content of the 2014 Snapshot of the LEHD Infrastructure files as they are made available in the Census Bureau’s secure and restricted-access Research Data Center network. The document attempts to provide a comprehensive description of all researcher-accessible files, of their creation, and of any modifications made to the files to facilitate researcher access.},
keywords={},
doi={},
}

### 2017

• J. Cloutier, L. Vilhuber, D. Harrisson, and V. Béland-Ouellette, “Understanding the effect of procedural justice on psychological distress,” Labor Dynamics Institute, Cornell University, Document 35, 2017.
[URL] [Bibtex]
@TechReport{CloutierVilhuberLDI2017,
author = {Julie Cloutier and Lars Vilhuber and Denis Harrisson and Vanessa B{\'e}land-Ouellette},
title = {Understanding the effect of procedural justice on psychological distress},
abstract = {Studies on the effect of procedural justice on psychological distress present conflicting results. Drawing on instrumental and relational perspectives of justice, we test the hypothesis that the perception of procedural justice influences the level of workers' psychological distress. Using a number of validated instruments to collected data from 659 workers in three call centers, we use OLS regressions and Hayes' PROCESS tool to show that the perception of procedural justice has a direct, unique, and independent effect on psychological distress. The perception of procedural justice has no instrumental role, the key mechanism being the relational role, suggesting that perceived injustice influences psychological distress because it threatens self-esteem. Distributive justice perceptions (recognition, promotions, job security) are not associated with psychological distress, calling into question Siegrist's model. Our findings suggest that perceived procedural justice provides workers better evidence of the extent to which they are valued and appreciated members of their organizations than do perceptions of distributive justice. The results highlight the greater need for workers to be valued and appreciated for who they are (consideration and esteem), rather than for what they do for their organization (distributive justice of rewards).},
institution = {Labor Dynamics Institute, Cornell University},
year = {2017},
type = {Document},
number = {35},
url = {http://digitalcommons.ilr.cornell.edu/ldi/35/},
owner = {vilhuber},
timestamp = {2017.09.28},
}
• A. Foote, M. J. Kutzbach, and L. Vilhuber, “Recalculating – How Uncertainty in Local Labor Market Definitions Affects Empirical Findings,” Center for Economic Studies, U.S. Census Bureau, Working Papers 17-49, 2017.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:17-49,
author={Andrew Foote and Mark J. Kutzbach and Lars Vilhuber},
title={{Recalculating - How Uncertainty in Local Labor Market Definitions Affects Empirical Findings}},
year=2017,
month=Jan,
institution={Center for Economic Studies, U.S. Census Bureau},
type={Working Papers},
url={https://ideas.repec.org/p/cen/wpaper/17-49.html},
number={17-49},
abstract={This paper evaluates the use of commuting zones as a local labor market definition. We revisit Tolbert and Sizer (1996) and demonstrate the sensitivity of definitions to two features of the methodology. We show how these features impact empirical estimates using a well-known application of commuting zones. We conclude with advice to researchers using commuting zones on how to demonstrate the robustness of empirical findings to uncertainty in definitions.},
keywords={Local labor markets; commuting; measurement error},
doi={},
}
• A. Foote, M. J. Kutzbach, and L. Vilhuber, “Recalculating – How Uncertainty in Local Labor Market Definitions Affects Empirical Findings,” NSF Census Research Network – NCRN-Cornell, Preprint 1813:52649, 2017.
[URL] [Bibtex]
@techreport{handle:1813:52649,
Title = {Recalculating - How Uncertainty in Local Labor Market Definitions Affects Empirical Findings},
Author = {Foote, Andrew and Kutzbach, Mark J. and Vilhuber, Lars},
institution = { NSF Census Research Network - NCRN-Cornell },
type = {Preprint} ,
Year = {2017},
number={1813:52649},
URL = {http://hdl.handle.net/1813/52649},
abstract ={This paper evaluates the use of commuting zones as a local labor market definition. We revisit Tolbert and Sizer (1996) and demonstrate the sensitivity of definitions to two features of the methodology. We show how these features impact empirical estimates using a well-known application of commuting zones. We conclude with advice to researchers using commuting zones on how to demonstrate the robustness of empirical findings to uncertainty in definitions.
The analysis, conclusions, and opinions expressed herein are those of the author(s) alone and do not necessarily
represent the views of the U.S. Census Bureau or the Federal Deposit Insurance Corporation. All results have been
reviewed to ensure that no confidential information is disclosed, and no confidential data was used in this paper. This
document is released to inform interested parties of ongoing research and to encourage discussion of work in progress.
Much of the work developing this paper occurred while Mark Kutzbach was an employee of the U.S. Census Bureau.}
}
• A. Foote, M. J. Kutzbach, and L. Vilhuber, “Recalculating – How Uncertainty in Local Labor Market Definitions Affects Empirical Findings,” Labor Dynamics Institute, Cornell University, Document 45, 2017.
[URL] [Bibtex]
@techreport{ldi:2017:45,
Title = {Recalculating - How Uncertainty in Local Labor Market Definitions Affects Empirical Findings},
Author = {Foote, Andrew and Kutzbach, Mark J. and Vilhuber, Lars},
abstract ={This paper evaluates the use of commuting zones as a local labor market definition. We revisit Tolbert and Sizer (1996) and demonstrate the sensitivity of definitions to two features of the methodology. We show how these features impact empirical estimates using a well-known application of commuting zones. We conclude with advice to researchers using commuting zones on how to demonstrate the robustness of empirical findings to uncertainty in definitions.
The analysis, conclusions, and opinions expressed herein are those of the author(s) alone and do not necessarily
represent the views of the U.S. Census Bureau or the Federal Deposit Insurance Corporation. All results have been
reviewed to ensure that no confidential information is disclosed, and no confidential data was used in this paper. This
document is released to inform interested parties of ongoing research and to encourage discussion of work in progress.
Much of the work developing this paper occurred while Mark Kutzbach was an employee of the U.S. Census Bureau.},
institution = {Labor Dynamics Institute, Cornell University},
year = {2017},
type = {Document},
number = {45},
url = {http://digitalcommons.ilr.cornell.edu/ldi/45/},
owner = {vilhuber},
timestamp = {2017.09.28},
}
• A. S. Green, M. J. Kutzbach, and L. Vilhuber, “Two Perspectives on Commuting: A Comparison of Home to Work Flows Across Job-Linked Survey and Administrative Files,” Center for Economic Studies, U.S. Census Bureau, Working Papers 17-34, 2017.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:17-34,
author={Andrew S. Green and Mark J. Kutzbach and Lars Vilhuber},
title={{Two Perspectives on Commuting: A Comparison of Home to Work Flows Across Job-Linked Survey and Administrative Files}},
year=2017,
month=Jan,
institution={Center for Economic Studies, U.S. Census Bureau},
type={Working Papers},
url={https://ideas.repec.org/p/cen/wpaper/17-34.html},
number={17-34},
abstract={Commuting flows and workplace employment data have a wide constituency of users including urban and regional planners, social science and transportation researchers, and businesses. The U.S. Census Bureau releases two, national data products that give the magnitude and characteristics of home to work flows. The American Community Survey (ACS) tabulates households' responses on employment, workplace, and commuting behavior. The Longitudinal Employer-Household Dynamics (LEHD) program tabulates administrative records on jobs in the LEHD Origin-Destination Employment Statistics (LODES). Design differences across the datasets lead to divergence in a comparable statistic: county-to-county aggregate commute flows. To understand differences in the public use data, this study compares ACS and LEHD source files, using identifying information and probabilistic matching to join person and job records. In our assessment, we compare commuting statistics for job frames linked on person, employment status, employer, and workplace and we identify person and job characteristics as well as design features of the data frames that explain aggregate differences. We find a lower rate of within-county commuting and farther commutes in LODES. We attribute these greater distances to differences in workplace reporting and to uncertainty of establishment assignments in LEHD for workers at multi-unit employers. Minor contributing factors include differences in residence location and ACS workplace edits. The results of this analysis and the data infrastructure developed will support further work to understand and enhance commuting statistics in both datasets.},
keywords={U.S. Census Bureau; LEHD; LODES; ACS; Employer-employee matched data; Commuting; Record linkage},
}
• A. Green, M. J. Kutzbach, and L. Vilhuber, “Two Perspectives on Commuting: A Comparison of Home to Work Flows Across Job-Linked Survey and Administrative Files,” NSF Census Research Network – NCRN-Cornell, Preprint 1813:52611, 2017.
[URL] [Bibtex]
@techreport{handle:1813:52611,
Title = {Two Perspectives on Commuting: A Comparison of Home to Work Flows Across Job-Linked Survey and Administrative Files},
Author = {Green, Andrew and Kutzbach, Mark J. and Vilhuber, Lars},
institution = { NSF Census Research Network - NCRN-Cornell },
type = {Preprint} ,
Year = {2017},
number={1813:52611},
URL = {http://hdl.handle.net/1813/52611},
abstract ={Commuting flows and workplace employment data have a wide constituency of users including urban and
regional planners, social science and transportation researchers, and businesses. The U.S. Census Bureau
releases two, national data products that give the magnitude and characteristics of home to work flows. The
American Community Survey (ACS) tabulates households’ responses on employment, workplace, and
commuting behavior. The Longitudinal Employer-Household Dynamics (LEHD) program tabulates
administrative records on jobs in the LEHD Origin-Destination Employment Statistics (LODES). Design
differences across the datasets lead to divergence in a comparable statistic: county-to-county aggregate
commute flows. To understand differences in the public use data, this study compares ACS and LEHD source
files, using identifying information and probabilistic matching to join person and job records. In our
assessment, we compare commuting statistics for job frames linked on person, employment status, employer,
and workplace and we identify person and job characteristics as well as design features of the data frames that
explain aggregate differences. We find a lower rate of within-county commuting and farther commutes in
LODES. We attribute these greater distances to differences in workplace reporting and to uncertainty of
establishment assignments in LEHD for workers at multi-unit employers. Minor contributing factors include
differences in residence location and ACS workplace edits. The results of this analysis and the data
infrastructure developed will support further work to understand and enhance commuting statistics in both
datasets.}
}
• A. S. Green, M. J. Kutzbach, and L. Vilhuber, “Two Perspectives on Commuting: A Comparison of Home to Work Flows Across Job-Linked Survey and Administrative Files,” Labor Dynamics Institute, Cornell University, Document 38, 2017.
[URL] [Bibtex]
@techreport{ldi:2017:38,
author={Andrew S. Green and Mark J. Kutzbach and Lars Vilhuber},
title={{Two Perspectives on Commuting: A Comparison of Home to Work Flows Across Job-Linked Survey and Administrative Files}},
abstract={Commuting flows and workplace employment data have a wide constituency of users including urban and regional planners, social science and transportation researchers, and businesses. The U.S. Census Bureau releases two, national data products that give the magnitude and characteristics of home to work flows. The American Community Survey (ACS) tabulates households' responses on employment, workplace, and commuting behavior. The Longitudinal Employer-Household Dynamics (LEHD) program tabulates administrative records on jobs in the LEHD Origin-Destination Employment Statistics (LODES). Design differences across the datasets lead to divergence in a comparable statistic: county-to-county aggregate commute flows. To understand differences in the public use data, this study compares ACS and LEHD source files, using identifying information and probabilistic matching to join person and job records. In our assessment, we compare commuting statistics for job frames linked on person, employment status, employer, and workplace and we identify person and job characteristics as well as design features of the data frames that explain aggregate differences. We find a lower rate of within-county commuting and farther commutes in LODES. We attribute these greater distances to differences in workplace reporting and to uncertainty of establishment assignments in LEHD for workers at multi-unit employers. Minor contributing factors include differences in residence location and ACS workplace edits. The results of this analysis and the data infrastructure developed will support further work to understand and enhance commuting statistics in both datasets.},
keywords={U.S. Census Bureau; LEHD; LODES; ACS; Employer-employee matched data; Commuting; Record linkage},
institution = {Labor Dynamics Institute, Cornell University},
year = {2017},
type = {Document},
number = {38},
url = {http://digitalcommons.ilr.cornell.edu/ldi/38/},
owner = {vilhuber},
timestamp = {2017.09.28},
}
• S. Haney, A. Machanavajjhala, J. M. Abowd, M. Graham, and M. Kutzbach, “Utility Cost of Formal Privacy for Releasing National Employer-Employee Statistics,” Cornell University, Preprint 1813:49652, 2017.
[URL] [Bibtex]
@TechReport{handle:1813:49652,
author = {Haney, Samuel and Machanavajjhala, Ashwin and Abowd, John M and Graham, Matthew and Kutzbach, Mark},
title = {Utility Cost of Formal Privacy for Releasing National Employer-Employee Statistics},
institution = {Cornell University},
year = {2017},
type = {Preprint},
number = {1813:49652},
url = {http://hdl.handle.net/1813/49652},
owner = {vilhuber},
timestamp = {2017.09.28},
}
• K. L. McKinney, A. S. Green, L. Vilhuber, and J. M. Abowd, “Total Error and Variability Measures with Integrated Disclosure Limitation for Quarterly Workforce Indicators and LEHD Origin Destination Employment Statistics in On The Map,” Center for Economic Studies, U.S. Census Bureau, Working Papers 17-71, 2017.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:17-71,
author={Kevin L. McKinney and Andrew S. Green and Lars Vilhuber and John M. Abowd},
title={{Total Error and Variability Measures with Integrated Disclosure Limitation for Quarterly Workforce Indicators and LEHD Origin Destination Employment Statistics in On The Map}},
year=2017,
month=Jan,
institution={Center for Economic Studies, U.S. Census Bureau},
type={Working Papers},
url={https://ideas.repec.org/p/cen/wpaper/17-71.html},
number={17-71},
abstract={We report results from the rst comprehensive total quality evaluation of five major indicators in the U.S. Census Bureau's Longitudinal Employer-Household Dynamics (LEHD) Program Quarterly Workforce Indicators (QWI): total employment, beginning-of-quarter employment, full-quarter employment, total payroll, and average monthly earnings of full-quarter employees. Beginning-of-quarter employment is also the main tabulation variable in the LEHD Origin-Destination Employment Statistics (LODES) workplace reports as displayed in OnTheMap (OTM). The evaluation is conducted by generating multiple threads of the edit and imputation models used in the LEHD Infrastructure File System. These threads conform to the Rubin (1987) multiple imputation model, with each thread or implicate being the output of formal probability models that address coverage, edit, and imputation errors. Design-based sampling variability and nite population corrections are also included in the evaluation. We derive special formulas for the Rubin total variability and its components that are consistent with the disclosure avoidance system used for QWI and LODES/OTM workplace reports. These formulas allow us to publish the complete set of detailed total quality measures for QWI and LODES. The analysis reveals that the five publication variables under study are estimated very accurately for tabulations involving at least 10 jobs. Tabulations involving three to nine jobs have quality in the range generally deemed acceptable. Tabulations involving zero, one or two jobs, which are generally suppressed in the QWI and synthesized in LODES, have substantial total variability but their publication in LODES allows the formation of larger custom aggregations, which will in general have the accuracy estimated for tabulations in the QWI based on a similar number of workers.},
keywords={Multiple imputation; Total quality measures; Employment statistics; Earnings statistics; Total surve},
doi={},
}
• L. Vilhuber, S. Kinney, and I. Schmutte, “Proceedings from the Synthetic LBD International Seminar,” Labor Dynamics Institute, Cornell University, Document 44, 2017.
[URL] [Bibtex]
@TechReport{ProceedingsSynLBD2017,
author = {Lars Vilhuber and Saki Kinney and Ian Schmutte},
title = {Proceedings from the Synthetic LBD International Seminar},
institution = {Labor Dynamics Institute, Cornell University},
year = {2017},
type = {Document},
number = {44},
url = {http://digitalcommons.ilr.cornell.edu/ldi/44/},
abstract = {On May 9, 2017, we hosted a seminar to discuss the conditions necessary to implement the SynLBD approach with interested parties, with the goal of providing a straightforward toolkit to implement the same procedure on other data. The proceedings summarize the discussions during the workshop.
Funding for the workshop was provided by the National Science Foundation (Grants 1012593; 1131848) and the Alfred P. Sloan Foundation (G-2015-13903). Organizational support was provided by the Labor Dynamics Institute at Cornell University.},
owner = {vilhuber},
timestamp = {2017.09.28},
}
• L. Vilhuber and C. Lagoze, “Making Confidential Data Part of Reproducible Research,” Labor Dynamics Institute, Cornell University, Document 41, 2017.
[URL] [Bibtex]
@TechReport{VilhuberLagozeLDI2017,
author = {Lars Vilhuber and Carl Lagoze},
title = {Making Confidential Data Part of Reproducible Research},
institution = {Labor Dynamics Institute, Cornell University},
year = {2017},
type = {Document},
number = {41},
url = {http://digitalcommons.ilr.cornell.edu/ldi/41/},
owner = {vilhuber},
timestamp = {2017.09.28},
}
• L. Vilhuber and I. Schmutte, “Proceedings from the 2016 NSF-Sloan Workshop on Practical Privacy,” Cornell University, Preprint 1813:46197, 2017.
[URL] [Bibtex]
@TechReport{handle:1813:46197,
author = {Vilhuber, Lars and Schmutte, Ian},
title = {Proceedings from the 2016 NSF-Sloan Workshop on Practical Privacy},
institution = {Cornell University},
year = {2017},
type = {Preprint},
number = {1813:46197},
url = {http://hdl.handle.net/1813/46197},
abstract = {Proceedings from the 2016 NSF{\textendash}Sloan Workshop on Practical Privacy Vilhuber, Lars; Schmutte, Ian; Abowd, John M. On October 14, 2016, we hosted a workshop that brought together economists, survey statisticians, and computer scientists with expertise in the field of privacy preserving methods: Census Bureau staff working on implementing cutting-edge methods in the Bureau{\textquoteright}s flagship public-use products mingled with academic researchers from a variety of universities. The four products discussed as part of the workshop were 1. the American Community Survey (ACS); 2. Longitudinal Employer-Household Data (LEHD), in particular the LEHD Origin-Destination Employment Statistics (LODES); the 3. 2020 Decennial Census; and the 4. 2017 Economic Census. The goal of the workshop was to 1. Discuss the specific challenges that have arisen in ongoing efforts to apply formal privacy models to Census data products by drawing together expertise of academic and governmental researchers 2. Produce short written memos that summarize concrete suggestions for practical applications to specific Census Bureau priority areas.},
owner = {vilhuber},
timestamp = {2017.09.28},
}
• L. Vilhuber and I. Schmutte, “Proceedings from the 2017 Cornell-Census-NSF-Sloan Workshop on Practical Privacy,” Labor Dynamics Institute, Cornell University, Document 43, 2017.
[URL] [Bibtex]
@TechReport{ProceedingsNSFSloan2017,
author = {Lars Vilhuber and Ian Schmutte},
title = {Proceedings from the 2017 Cornell-Census-NSF-Sloan Workshop on Practical Privacy},
institution = {Labor Dynamics Institute, Cornell University},
year = {2017},
type = {Document},
number = {43},
url = {http://digitalcommons.ilr.cornell.edu/ldi/43/},
abstract = {These proceedings report on a workshop hosted at the U.S. Census Bureau on May 8, 2017. Our purpose was to gather experts from various backgrounds together to continue discussing the development of formal privacy systems for Census Bureau data products. This workshop was a successor to a previous workshop held in October 2016 (Vilhuber and Schmutte 2017). At our prior workshop, we hosted computer scientists, survey statisticians, and economists, all of whom were experts in data privacy. At that time we discussed the practical implementation of cutting-edge methods for publishing data with formal, provable privacy guarantees, with a focus on applications to Census Bureau data products. The teams developing those applications were just starting out when our first workshop took place, and we spent our time brainstorming solutions to the various problems researchers were encountering, or anticipated encountering. For these cutting-edge formal privacy models, there had been very little effort in the academic literature to apply those methods in real-world settings with large, messy data. We therefore brought together an expanded group of specialists from academia and government who could shed light on technical challenges, subject matter challenges and address how data users might react to changes in data availability and publishing standards.
In May 2017, we organized a follow-up workshop, which these proceedings report on. We reviewed progress made in four different areas. The four topics discussed as part of the workshop were 1. the 2020 Decennial Census; 2. the American Community Survey (ACS); 3. the 2017 Economic Census; 4. measuring the demand for privacy and for data quality.
As in our earlier workshop, our goals were to 1. Discuss the specific challenges that have arisen in ongoing efforts to apply formal privacy models to Census data products by drawing together expertise of academic and governmental researchers; 2. Produce short written memos that summarize concrete suggestions for practical applications to specific Census Bureau priority areas.},
owner = {vilhuber},
timestamp = {2017.09.28},
}
• L. Vilhuber and I. M. Schmutte, “Proceedings from the 2016 NSF-Sloan Workshop on Practical Privacy,” Labor Dynamics Institute, Cornell University, Document 33, 2017.
[URL] [Bibtex]
@TechReport{Vilhuber:LDI:2017:33,
author = {Vilhuber, Lars and Schmutte, Ian M.},
title = {Proceedings from the 2016 NSF-Sloan Workshop on Practical Privacy},
institution = {Labor Dynamics Institute, Cornell University},
year = {2017},
type = {Document},
number = {33},
url = {http://digitalcommons.ilr.cornell.edu/ldi/33/},
abstract = {On October 14, 2016, we hosted a workshop that brought together economists, survey statisticians, and computer scientists with expertise in the field of privacy preserving methods: Census Bureau staff working on implementing cutting-edge methods in the Bureau's flagship public-use products mingled with academic researchers from a variety of universities. The four products discussed as part of the workshop were 1. the American Community Survey (ACS); 2. Longitudinal Employer-Household Data (LEHD), in particular the LEHD Origin-Destination Employment Statistics (LODES); the 3. 2020 Decennial Census; and the 4. 2017 Economic Census. The goal of the workshop was to 1. Discuss the specific challenges that have arisen in ongoing efforts to apply formal privacy models to Census data products by drawing together expertise of academic and governmental researchers 2. Produce short written memos that summarize concrete suggestions for practical applications to specific Census Bureau priority areas.
Funding for the workshop was provided by the National Science Foundation (CNS-1012593) and the Alfred P. Sloan Foundation. Organizational support was provided by the Research and Methodology Directorate at the U.S. Census Bureau and the Labor Dynamics Institute at Cornell University.},
comment = {Funding by National Science Foundation (CNS-1012593) and the Alfred P. Sloan Foundation},
owner = {vilhuber},
timestamp = {2017.05.03},
xurl = {http://digitalcommons.ilr.cornell.edu/ldi/33/},
}
• D. H. Weinberg, J. M. Abowd, R. F. Belli, N. Cressie, D. C. Folch, S. H. Holan, M. C. Levenstein, K. M. Olson, J. P. Reiter, M. D. Shapiro, J. Smyth, L. Soh, B. D. Spencer, S. E. Spielman, L. Vilhuber, and C. K. Wikle, “Effects of a Government-Academic Partnership: Has the NSF-Census Bureau Research Network Helped Improve the U.S. Statistical System?,” Center for Economic Studies, U.S. Census Bureau, Working Papers 17-59r, 2017.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:17-59r,
author={Daniel H. Weinberg and John M. Abowd and Robert F. Belli and Noel Cressie and David C. Folch and Scott H. Holan and Margaret C. Levenstein and Kristen M. Olson and Jerome P. Reiter and Matthew D. Shapiro and Jolene Smyth and Leen-Kiat Soh and Bruce D. Spencer and Seth E. Spielman and Lars Vilhuber and Christopher K. Wikle},
title={{Effects of a Government-Academic Partnership: Has the NSF-Census Bureau Research Network Helped Improve the U.S. Statistical System?}},
year=2017,
month=Jan,
institution={Center for Economic Studies, U.S. Census Bureau},
type={Working Papers},
url={https://ideas.repec.org/p/cen/wpaper/17-59r.html},
number={17-59r},
abstract={The National Science Foundation-Census Bureau Research Network (NCRN) was established in 2011 to create interdisciplinary research nodes on methodological questions of interest and significance to the broader research community and to the Federal Statistical System (FSS), particularly the Census Bureau. The activities to date have covered both fundamental and applied statistical research and have focused at least in part on the training of current and future generations of researchers in skills of relevance to surveys and alternative measurement of economic units, households, and persons. This paper discusses some of the key research findings of the eight nodes, organized into six topics: (1) Improving census and survey data collection methods; (2) Using alternative sources of data; (3) Protecting privacy and confidentiality by improving disclosure avoidance; (4) Using spatial and spatio-temporal statistical modeling to improve estimates; (5) Assessing data cost and quality tradeoffs; and (6) Combining information from multiple sources. It also reports on collaborations across nodes and with federal agencies, new software developed, and educational activities and outcomes. The paper concludes with an evaluation of the ability of the FSS to apply the NCRN’s research outcomes and suggests some next steps, as well as the implications of this research-network model for future federal government renewal initiatives.},
keywords={},
doi={},
}

### 2016

• J. Miranda and L. Vilhuber, “Using Partially Synthetic Microdata to Protect Sensitive Cells in Business Statistics,” NSF Census Research Network – NCRN-Cornell, 1813:42339, 2016.
[URL] [Bibtex]
@techreport{miranda-vilhuber-2016-ecommons,
Title = {{Using Partially Synthetic Microdata to Protect Sensitive Cells in Business Statistics}},
Author = {Miranda, Javier and Lars Vilhuber},
institution = {NSF Census Research Network - NCRN-Cornell },
Year = {2016},
number = {1813:42339},
Abstract = {We describe and analyze a method that blends records from both observed and synthetic microdata into public-use tabulations on establishment statistics. The resulting tables use synthetic data only in potentially sensitive cells. We describe different algorithms, and present preliminary results when applied to the Census Bureau's Business Dynamics Statistics and Synthetic Longitudinal Business Database, highlighting accuracy and protection afforded by the method when compared to existing public-use tabulations (with suppressions).},
Keywords = {confidentiality; comparative studies; US Longitudinal Business Database; synthetic data},
Owner = {vilhuber},
Timestamp = {2014.03.24},
URL = {http://hdl.handle.net/1813/42339}
}
• J. Miranda and L. Vilhuber, “Using Partially Synthetic Microdata to Protect Sensitive Cells in Business Statistics,” Center for Economic Studies, U.S. Census Bureau, Working Papers 16-10, 2016.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:16-10,
author={Javier Miranda and Lars Vilhuber},
title={{Using Partially Synthetic Microdata to Protect Sensitive Cells in Business Statistics}},
year=2016,
month=Feb,
institution={Center for Economic Studies, U.S. Census Bureau},
type={Working Papers},
url={https://ideas.repec.org/p/cen/wpaper/16-10.html},
number={16-10},
abstract={We describe and analyze a method that blends records from both observed and synthetic microdata into public-use tabulations on establishment statistics. The resulting tables use synthetic data only in potentially sensitive cells. We describe different algorithms, and present preliminary results when applied to the Census Bureau's Business Dynamics Statistics and Synthetic Longitudinal Business Database, highlighting accuracy and protection afforded by the method when compared to existing public-use tabulations (with suppressions).},
keywords={synthetic data; statistical disclosure limitation; time-series; local labor markets; gross job flows},
}
• L. Vilhuber, J. A. Abowd, and J. P. Reiter, “Synthetic Establishment Microdata Around the World,” NSF Census Research Network – NCRN-Cornell, 1813:42340, 2016.
[URL] [Bibtex]
@techreport{vilhuber-abowd-reiter-2016-ecommons,
Title = {{Synthetic Establishment Microdata Around the World}},
Author = {Lars Vilhuber and John A. Abowd and Jerome P. Reiter},
institution = {NSF Census Research Network - NCRN-Cornell },
Year = {2016},
number = {1813:42340},
Abstract = {In contrast to the many public-use microdata samples available for individual and household data from many statistical agencies around the world, there are virtually no establishment or firm microdata available. In large part, this difficulty in providing access to business micro data is due to the skewed and sparse distributions that characterize business data. Synthetic data are simulated data generated from statistical models. We organized sessions at the 2015 World Statistical Congress and the 2015 Joint Statistical Meetings, highlighting work on synthetic establishment microdata. This overview situates those papers, published in this issue, within the broader literature.},
Keywords = {confidentiality; comparative studies; US Longitudinal Business Database; synthetic data},
Owner = {vilhuber},
Timestamp = {2014.03.24},
URL = {http://hdl.handle.net/1813/42340}
}

### 2014

• J. Drechsler and L. Vilhuber, “A First Step Towards A German SynLBD: Constructing A German Longitudinal Business Database,” Center for Economic Studies, U.S. Census Bureau, Working Papers 14-13, 2014.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:14-13,
Title = {{A First Step Towards A {German} {SynLBD}: {C}onstructing A {G}erman {L}ongitudinal {B}usiness {D}atabase}},
Author = {J{\"o}rg Drechsler and Lars Vilhuber},
Institution = {Center for Economic Studies, U.S. Census Bureau},
Year = {2014},
Month = Feb,
Number = {14-13},
Type = {Working Papers},
Abstract = {One major criticism against the use of synthetic data has been that the efforts necessary to generate useful synthetic data are so in- tense that many statistical agencies cannot afford them. We argue many lessons in this evolving field have been learned in the early years of synthetic data generation, and can be used in the development of new synthetic data products, considerably reducing the required in- vestments. The final goal of the project described in this paper will be to evaluate whether synthetic data algorithms developed in the U.S. to generate a synthetic version of the Longitudinal Business Database (LBD) can easily be transferred to generate a similar data product for other countries. We construct a German data product with infor- mation comparable to the LBD - the German Longitudinal Business Database (GLBD) - that is generated from different administrative sources at the Institute for Employment Research, Germany. In a fu- ture step, the algorithms developed for the synthesis of the LBD will be applied to the GLBD. Extensive evaluations will illustrate whether the algorithms provide useful synthetic data without further adjustment. The ultimate goal of the project is to provide access to multiple synthetic datasets similar to the SynLBD at Cornell to enable comparative studies between countries. The Synthetic GLBD is a first step towards that goal.},
Keywords = {confidentiality; comparative studies; German Longitudinal Business Database; synthetic data},
Owner = {vilhuber},
Timestamp = {2014.03.24},
URL = {http://ideas.repec.org/p/cen/wpaper/14-13.html}
}
• J. Miranda and L. Vilhuber, “Looking Back On Three Years Of Using The Synthetic LBD Beta,” Center for Economic Studies, U.S. Census Bureau, Working Papers 14-11, 2014.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:14-11,
Title = {{Looking Back On Three Years Of Using The {S}ynthetic {LBD} Beta}},
Author = {Miranda, Javier and Lars Vilhuber},
Institution = {Center for Economic Studies, U.S. Census Bureau},
Year = {2014},
Month = Feb,
Number = {14-11},
Type = {Working Papers},
Abstract = {Distributions of business data are typically much more skewed than those for household or individual data and public knowledge of the underlying units is greater. As a results, national statistical offices (NSOs) rarely release establishment or firm-level business microdata due to the risk to respondent confidentiality. One potential approach for overcoming these risks is to release synthetic data where the establishment data are simulated from statistical models designed to mimic the distributions of the real underlying microdata. The US Census Bureau?s Center for Economic Studies in collaboration with Duke University, the National Institute of Statistical Sciences, and Cornell University made available a synthetic public use file for the Longitudinal Business Database (LBD) comprising more than 20 million records for all business establishment with paid employees dating back to 1976. The resulting product, dubbed the SynLBD, was released in 2010 and is the first-ever comprehensive business microdata set publicly released in the United States including data on establishments employment and payroll, birth and death years, and industrial classification. This pa- per documents the scope of projects that have requested and used the SynLBD.},
Keywords = {confidentiality; comparative studies; US Longitudinal Business Database; synthetic data},
Owner = {vilhuber},
Timestamp = {2014.03.24},
URL = {http://ideas.repec.org/p/cen/wpaper/14-11.html}
}
• L. Vilhuber and K. McKinney, “LEHD Infrastructure files in the Census RDC – Overview,” Center for Economic Studies, U.S. Census Bureau, Working Papers 14-26, 2014.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:14-26,
Title = {{LEHD Infrastructure files in the Census RDC - Overview}},
Author = {Lars Vilhuber and Kevin McKinney},
Institution = {Center for Economic Studies, U.S. Census Bureau},
Year = {2014},
Month = Jun,
Number = {14-26},
Type = {Working Papers},
Abstract = {The Longitudinal Employer-Household Dynamics (LEHD) Program at the U.S. Census Bureau, with the support of several national research agencies, maintains a set of infrastructure files using administrative data provided by state agencies, enhanced with information from other administrative data sources, demographic and economic (business) surveys and censuses. The LEHD Infrastructure Files provide a detailed and comprehensive picture of workers, employers, and their interaction in the U.S. economy. This document describes the structure and content of the 2011 Snapshot of the LEHD Infrastructure files as they are made available in the Census Bureaus secure and restricted-access Research Data Center network. The document attempts to provide a comprehensive description of all researcher-accessible files, of their creation, and of any modifcations made to the files to facilitate researcher access.},
URL = {http://ideas.repec.org/p/cen/wpaper/14-26.html}
}

### 2013

• C. Bérubé, B. Dostie, and L. Vilhuber, “Estimation de la contribution de la réallocation de la main-d’oeuvre à la croissance de la productivité au Canada,” Centre sur la productivité et la prospérité, HEC Montréal 2013.
[URL] [Bibtex]
@TechReport{BerubeDostieVilhuber2013,
Title = {Estimation de la contribution de la r\'{e}allocation de la main-d'oeuvre \{a} la croissance de la productivit\'{e} au {C}anada},
Author = {B\'{e}rub\'{e}, Charles and Benoit Dostie and Lars Vilhuber},
Institution = {Centre sur la productivit\'{e} et la prosp\'{e}rit\'{e}, HEC Montr\'{e}al},
Year = {2013},
Abstract = {In this report, we estimate the contribution of labour reallocation to productivity growth in the Canadian manufacturing sector. We find that most of productivity growth comes from within firm improvements, leaving a limited role for labour reallocation. Still, we also find that the importance of labour reallocation increase over time. This is both due to increasing net-entry and inter-firm effects. These effects are much more important post 2000 than in the 1990s. We also find that lost production from exiting firms is now most likely replaced by production from existing firms, while previously, it was more likely to be replaced by production from new firms. (French only)},
Owner = {vilhuber},
Timestamp = {2013.09.20},
URL = {http://cpp.hec.ca/cms/assets/documents/recherches_publiees/CH_2012_01.pdf}
}
• L. Vilhuber, “Methods for Protecting the Confidentiality of Firm-Level Data: Issues and Solutions,” Labor Dynamics Institute, Document 19, 2013.
[URL] [Bibtex]
@TechReport{Vilhuber2013,
Title = {Methods for Protecting the Confidentiality of Firm-Level Data: {I}ssues and Solutions},
Author = {Lars Vilhuber},
Institution = {Labor Dynamics Institute},
Year = {2013},
Month = {March},
Number = {19},
Type = {Document},
Abstract = {This report will provide an overview of methods used by statistical agencies to encourage, support, and
enhance research access to data for the purpose of generating new knowledge. Quite a few reports and
scientific articles have addressed the issue before, and we will be highly indebted to that literature. To a
summary of that literature, we hope to provide some recent developments and experiences derived
from a decade of working with systems that increase access as both researchers as well as data
providers. The report will focus on the data provided by statistical agencies, but it should be understood
that government agencies other than a National Statistical Office (NSO) may acquire that function.
While excluding the legal background limiting or permitting such data collection and provision, we
will highlight some alternate sources and methods, prior to concluding.},
Owner = {vilhuber},
Timestamp = {2013.09.20},
URL = {http://digitalcommons.ilr.cornell.edu/ldi/19/}
}

### 2012

• J. M. Abowd, K. Gittings, K. L. McKinney, B. E. Stephens, L. Vilhuber, and S. Woodcock, “Dynamically Consistent Noise Infusion and Partially Synthetic Data as Confidentiality Protection Measures for Related Time Series,” Federal Committee on Statistical Methodology, Research Conference Papers , 2012.
[PDF] [URL] [Bibtex]
@TechReport{AbowdEtAl2012,
Title = {Dynamically Consistent Noise Infusion and Partially Synthetic Data as Confidentiality Protection Measures for Related Time Series},
Author = {John M. Abowd and Kaj Gittings and Kevin L. McKinney and Bryce E. Stephens and Lars Vilhuber and Simon Woodcock},
Institution = {Federal Committee on Statistical Methodology},
Year = {2012},
Type = {Research Conference Papers},
Owner = {vilhuber},
Timestamp = {2013.01.11},
URL = {http://ideas.repec.org/p/cen/wpaper/12-13.html}
}
• J. M. Abowd and L. Vilhuber, “National Quarterly Workforce Indicators, r2254,” Cornell University, Labor Dynamics Institute [distributor], Ithaca, NY, USA, [Computer file] , 2012.
[URL] [Bibtex]
@TechReport{NQWI,
Title = {National {Quarterly} {Workforce} {Indicators}, r2254},
Author = {John M. Abowd and Lars Vilhuber},
Institution = {Cornell University, Labor Dynamics Institute [distributor]},
Year = {2012},
Type = {[Computer file]},
HowPublished = {Computer file},
Organization = {Cornell University, Labor Dynamics Institute [distributor]},
Owner = {vilhuber},
Timestamp = {2013.06.10},
URL = {http://www2.vrdc.cornell.edu/news/data/qwi-national-data/}
}

### 2011

• K. McKinney and L. Vilhuber, “LEHD Infrastructure Files in the Census RDC: Overview of S2004 Snapshot,” Center for Economic Studies, U.S. Census Bureau, Working Papers 11-13, 2011.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:11-13,
Title = {{LEHD Infrastructure Files in the Census RDC: Overview of S2004 Snapshot}},
Author = {Kevin McKinney and Lars Vilhuber},
Institution = {Center for Economic Studies, U.S. Census Bureau},
Year = {2011},
Month = Apr,
Number = {11-13},
Type = {Working Papers},
Abstract = {The Longitudinal Employer-Household Dynamics (LEHD) Program at the U.S. Census Bureau, with the support of several national research agencies, has built a set of infrastructure files using administrative data provided by state agencies, enhanced with information from other administrative data sources, demographic and economic (business) surveys and censuses. The LEHD Infrastructure Files provide a detailed and comprehensive picture of workers, employers, and their interaction in the U.S. economy. This document describes the structure and content of the 2004 Snapshot of the LEHD Infrastructure files as they are made available in the Census Bureau’s Research Data Center network.},
Keywords = {LEHD; linked employer-employee data; workers; employers; jobs; hires; separations; recalls; mobility},
URL = {http://ideas.repec.org/p/cen/wpaper/11-13.html}
}
• K. McKinney and L. Vilhuber, “LEHD Data Documentation LEHD-OVERVIEW-S2008-rev1,” Center for Economic Studies, U.S. Census Bureau, Working Papers 11-43, 2011.
[URL] [Bibtex]
@TechReport{RePEc:cen:wpaper:11-43,
Title = {{LEHD Data Documentation LEHD-OVERVIEW-S2008-rev1}},
Author = {Kevin McKinney and Lars Vilhuber},
Institution = {Center for Economic Studies, U.S. Census Bureau},
Year = {2011},
Month = Dec,
Number = {11-43},
Type = {Working Papers},
Abstract = {No abstract is available for this item.},
URL = {http://ideas.repec.org/p/cen/wpaper/11-43.html}
}
• S. Von Schrader, W. Erickson, T. Golden, and L. Vilhuber, “New York State Disability and Employment Status Report, 2011,” , Report on behalf of New York Makes Work Pay Comprehensive Employment System Medicaid Infrastructure Grant , 2011.
[URL] [Bibtex]
@TechReport{Employment2011,
Title = {New York State Disability and Employment Status Report, 2011},
Author = {Von Schrader, Sarah and Erickson, William and Golden, Thomas and Lars Vilhuber },
Year = {2011},
Type = {Report on behalf of New York Makes Work Pay Comprehensive Employment System Medicaid Infrastructure Grant},
Organization = {Cornell University, Employment and Disability Institute},
URL = {http://ilr-edi-r1.ilr.cornell.edu/nymakesworkpay/docs/Report_Card_2011/NYS%20Report%20Card%202011.pdf},
Urldate = {2014-04-10}
}

### 2010

• J. M. Abowd and L. Vilhuber, “National Estimates of Gross Employment and Job Flows from the Quarterly Workforce Indicators with Demographic and Industry Detail (with color graphs),” Center for Economic Studies, U.S. Census Bureau, Working Papers 10-11, 2010.
[PDF] [URL] [Bibtex]
@TechReport{ces-wp-10-11,
Title = {National Estimates of Gross Employment and Job Flows from the {Quarterly} {Workforce} {Indicators} with Demographic and Industry Detail (with color graphs)},
Author = {John M. Abowd and Lars Vilhuber},
Institution = {Center for Economic Studies, U.S. Census Bureau},
Year = {2010},
Month = Jun,
Number = {10-11},
Type = {Working Papers},
Abstract = {The Quarterly Workforce Indicators (QWI) are local labor market data produced and released every quarter by the United States Census Bureau. Unlike any other local labor market series produced in the U.S. or the rest of the world, the QWI measure employment flows for workers (accession and separations), jobs (creations and destructions) and earnings for demographic subgroups (age and gender), economic industry (NAICS industry groups), detailed geography (block (experimental), county, Core- Based Statistical Area, and Workforce Investment Area), and ownership (private, all) with fully interacted publication tables. The current QWI data cover 47 states, about 98\% of the private workforce in those states, and about 92\% of all private employment in the entire economy. State participation is sufficiently extensive to permit us to present the first national estimates constructed from these data. We focus on worker, job, and excess (churning) reallocation rates, rather than on levels of the basic variables. This permits comparison to existing series from the Job Openings and Labor Turnover Survey and the Business Employment Dynamics Series from the Bureau of Labor Statistics. The national estimates from the QWI are an important enhancement to existing series because they include demographic and industry detail for both worker and job flow data compiled from underlying micro-data that have been integrated at the job and establishment levels by the Longitudinal Employer-Household Dynamics Program at the Census Bureau. The estimates presented herein were compiled exclusively from public-use data series and are available for download.},
URL = {http://ideas.repec.org/p/cen/wpaper/10-11.html}
}
• L. Vilhuber, “Measuring firm-level displacement events with administrative data,” Workshop on Measurement Error in Administrative Data, Mannheim, Germany 2010.
[Bibtex]
@TechReport{Vilhuber2010,
Title = {Measuring firm-level displacement events with administrative data},
Author = {Lars Vilhuber},
Institution = {Workshop on Measurement Error in Administrative Data},
Year = {2010},
Owner = {vilhuber},
Timestamp = {2010.06.10}
}
• S. Von Schrader, W. Erickson, L. Vilhuber, and T. Golden, “New York State Disability and Employment Status Report, 2009,” Cornell University, Employment and Disability Institute, Report on behalf of New York Makes Work Pay Comprehensive Employment System Medicaid Infrastructure Grant , 2010.
[URL] [Bibtex]
@TechReport{Employment2009,
Title = {New York State Disability and Employment Status Report, 2009},
Author = {Von Schrader, Sarah and Erickson, William and Lars Vilhuber and Golden, Thomas. },
Institution = {Cornell University, Employment and Disability Institute},
Year = {2010},
Type = {Report on behalf of New York Makes Work Pay Comprehensive Employment System Medicaid Infrastructure Grant},
URL = {http://digitalcommons.ilr.cornell.edu/edicollect/1282/},
Urldate = {2014-04-10}
}

### 2007

• L. Vilhuber, “Adjusting imperfect data: Overview and case studies,” NBER, Working paper 12977, 2007.
[DOI] [URL] [Bibtex]
@TechReport{Vilhuber2007,
Title = {Adjusting imperfect data: Overview and case studies},
Author = {Lars Vilhuber},
Institution = {NBER},
Year = {2007},
Number = {12977},
Type = {Working paper},
DOI = {10.3386/w12977},
File = {tp-2004-05.pdf:L/LEHD/tp-2004-05.pdf:PDF},
Owner = {vilhuber},
Timestamp = {2007.07.16},
URL = {http://www.nber.org/papers/w12977}
}

### 2005

• J. M. Abowd, B. E. Stephens, and L. Vilhuber, “Confidentiality Protection in the Census Bureau’s Quarterly Workforce Indicators,” U.S. Census Bureau, LEHD and Cornell University, presented at the {J}oint {S}tatistical {M}eetings 2005, {M}inneapolis, {MN}. , 2005.
[Bibtex]
@TechReport{AbowdEtAl2005b,
Title = {Confidentiality Protection in the {C}ensus {B}ureau's {Q}uarterly {W}orkforce {I}ndicators},
Author = {Abowd, John M. and Stephens, Bryce E. and Vilhuber, Lars},
Institution = {U.S. Census Bureau, LEHD and Cornell University},
Year = {2005},
Type = {presented at the {J}oint {S}tatistical {M}eetings 2005, {M}inneapolis, {MN}.},
File = {Abowd-Stephens-Vilhuber-2005.pdf:L/LEHD/Abowd-Stephens-Vilhuber-2005.pdf:PDF},
Owner = {vilhuber}
}

### 2004

• L. Vilhuber, “Adjusting imperfect data: Overview and case studies,” LEHD, Technical paper TP-2004-05, 2004.
[Bibtex]
@TechReport{tp-2004-05,
Title = {Adjusting imperfect data: Overview and case studies},
Author = {Lars Vilhuber},
Institution = {LEHD},
Year = {2004},
Number = {TP-2004-05},
Type = {Technical paper},
File = {tp-2004-05.pdf:L/LEHD/tp-2004-05.pdf:PDF}
}

### 2002

• J. M. Abowd, P. A. Lengermann, and L. Vilhuber, “The Creation of the Employment Dynamics Estimates,” LEHD, U.S. Census Bureau, Technical paper TP-2002-13, 2002.
[PDF] [URL] [Bibtex]
@TechReport{tp-2002-13,
Title = {The Creation of the Employment Dynamics Estimates},
Author = {John M. Abowd and Paul A. Lengermann and Lars Vilhuber},
Institution = {LEHD, U.S. Census Bureau},
Year = {2002},
Number = {TP-2002-13},
Type = {Technical paper},
File = {tp-2002-13.pdf:L/LEHD/tp-2002-13.pdf:PDF},
URL = {https://ideas.repec.org/p/cen/tpaper/2002-13.html}
}
• J. M. Abowd and L. Vilhuber, “The Sensitivity of Economic Statistics to Coding Errors in Personal Identifiers,” LEHD, U.S. Census Bureau, Technical paper TP-2002-17, 2002.
[Bibtex]
@TechReport{tp-2002-17,
Title = {The Sensitivity of Economic Statistics to Coding Errors in Personal Identifiers},
Author = {John M. Abowd and Lars Vilhuber},
Institution = {LEHD, U.S. Census Bureau},
Year = {2002},
Number = {TP-2002-17},
Type = {Technical paper},
Comment = {Published JBES 2005},
File = {tp-2002-17.pdf:L/LEHD/tp-2002-17.pdf:PDF}
}
• A. Bowlus and L. Vilhuber, “Displaced workers, early leavers, and re-employment wages,” LEHD, U.S. Census Bureau, Technical paper TP-2002-18, 2002.
[Bibtex]
@TechReport{tp-2002-18,
Title = {Displaced workers, early leavers, and re-employment wages},
Author = {Audra Bowlus and Lars Vilhuber},
Institution = {LEHD, U.S. Census Bureau},
Year = {2002},
Number = {TP-2002-18},
Type = {Technical paper},
File = {tp-2002-18.pdf:L/LEHD/tp-2002-18.pdf:PDF}
}
• P. A. Lengermann and L. Vilhuber, “Abandoning the Sinking Ship: The Composition of Worker Flows Prior to Displacement,” LEHD, U.S. Census Bureau, Technical paper TP-2002-11, 2002.
[Bibtex]
@TechReport{tp-2002-11,
Title = {Abandoning the Sinking Ship: {T}he Composition of Worker Flows Prior to Displacement},
Author = {Paul A. Lengermann and Lars Vilhuber},
Institution = {LEHD, U.S. Census Bureau},
Year = {2002},
Number = {TP-2002-11},
Type = {Technical paper},
File = {tp-2002-11.pdf:L/LEHD/tp-2002-11.pdf:PDF}
}

### 2001

• H. J. Holzer, J. I. Lane, L. Vilhuber, H. Jackson, and G. Putnam, “Escaping poverty for low-wage workers: The role of employer characteristics and changes,” LEHD, U.S. Census Bureau, Technical paper TP-2001-02, 2001.
[Bibtex]
@TechReport{tp-2001-02,
Title = {Escaping poverty for low-wage workers: {T}he role of employer characteristics and changes},
Author = {Harry J. Holzer and Julia I. Lane and Lars Vilhuber and Henry Jackson and George Putnam},
Institution = {LEHD, U.S. Census Bureau},
Year = {2001},
Number = {TP-2001-02},
Type = {Technical paper},
File = {tp-2001-02.pdf:L/LEHD/tp-2001-02.pdf:PDF}
}

### 2000

• L. Vilhuber and R. Pedace, “Longitudinal analysis of SSN response on SIPP 1990-1993 panels,” LEHD, U.S. Census Bureau, Technical paper TP-2000-01, 2000.
[Bibtex]
@TechReport{tp-2000-01,
Title = {Longitudinal analysis of {SSN} response on {SIPP} 1990-1993 panels},
Author = {Lars Vilhuber and Robert Pedace},
Institution = {LEHD, U.S. Census Bureau},
Year = {2000},
Number = {TP-2000-01},
Type = {Technical paper},
File = {tp-2000-01.pdf:L/LEHD/tp-2000-01.pdf:PDF}
}

### 1999

• L. Vilhuber, “Continuous Training and sectoral mobility in Germany,” CIRANO, Scientific Series 99s-03, 1999.
[Bibtex]
@TechReport{Vilhuber99b,
Title = {Continuous Training and sectoral mobility in {G}ermany},
Author = {Lars Vilhuber},
Institution = {CIRANO},
Year = {1999},
Number = {99s-03},
Type = {Scientific Series },
Abstract = {This article studies mobility patterns of German workers in light of a model of sector-specific human capital. Furthermore, I employ and describe little-used data on continuous on-the-job training occuring after apprenticeships. Results are presented describing the incidence and duration of continuous training. Continuous training is quite common, depite the high incidence of apprenticeships which precedes this part of a worker's career. Most previous studies have only distinguished between firm-specific and general human capital, generally concluding that training was general. Inconsistent with those conclusions, I show that German men are more likely to find a job within the same sector if they have received continuous training in that sector. These results are similar to results obtained for young U.S. workers, and suggest that sector-specific capital is an important feature of very different labor markets. Furthermore, the results suggest that the observed effect of training on mobility is sensitive to the state of the business cycle, indicating a more complex interaction between supply and demand that most theoretical models allow for.},
Keywords = {training mobility Germany}
}

### 1997

• L. Vilhuber, “Sector-Specific On-The-Job Training: Evidence from U.S. Data,” CIRANO, Scientific Series 97s-42, 1997.
[Bibtex]
@TechReport{Vilhuber97a,
Title = {Sector-Specific On-The-Job Training: Evidence from {U.S.} Data},
Author = {Lars Vilhuber},
Institution = {CIRANO},
Year = {1997},
Number = {97s-42},
Type = {Scientific Series },
Abstract = {Using data from the National Longitudinal Survey of Youth (NLSY), we re-examine the effect of formal on-the-job training on mobility patterns of young American workers. By employing parametric duration models, we evaluate the economic impact of training on productive time with an employer. Confirming previous studies, we find a positive and statistically significant impact of formal on-the-job training on tenure with the employer providing the training. However, expected duration net of the time spent in the training program is generally not significantly increased. We proceed to document and analyze intra-sectoral and cross-sectoral mobility patterns in order to infer whether training provides firm-specific, industry-specific, or general human capital. The econometric analysis rejects a sequential model of job separation in favor of a competing risks specification. We find significant evidence for the industry-specificity of training. The probability of sectoral mobility upon job separation decreases with training received in the current industry, whether with the last employer or previous employers, and employment attachment increases with on-the-job training. These results are robust to a number of variations on the base model.},
Jelclass = {J4 J6}
}

### 1996

• L. Vilhuber, “Wage Flexibility and Contract Structure in Germany,” CIRANO, Scientific Series 96s-28, 1996.
[Bibtex]
@TechReport{Vilhuber96,
Title = {Wage Flexibility and Contract Structure in {G}ermany },
Author = {Lars Vilhuber},
Institution = {CIRANO},
Year = {1996},
Number = {96s-28},
Type = {Scientific Series},
Abstract = {In this paper, we look at how labor market conditions at different points during the tenure of individuals with firms are correlated with current earnings. Using data from the German Socioeconomic Panel on individuals for the period 1984 to 1994, we find that both the contemporaneous unemployment rate and prior values of the unemployment rate are significantly correlated with current earnings, contrary to results for the American labor market. We interpret this result as evidence that German unions do in fact bargain over both wages and employment, but that the models of individualistic contracts, such as the implicit contract model, may explain some of the observed wage drift and longer-term wage movements reasonably well. Furthermore, we explore the heterogeneity of contracts over a variety of worker and job characteristics. In particular, we find evidence that contracts differ across industries and across firm size. Workers of large firms are remarkably more insulated from the job market than workers for any other type of firm, indicating the importance of internal job markets. },
Jelclass = {J23, J31, J41},
Mylibrary = {yes}
}

## Online resources

### 2013

• B. Perry, J. Williams, L. Vilhuber, and W. Block, “CED$^2$AR: Comprehensive Extensible Data Documentation and Access Repository,” , 2013.
[URL] [Bibtex]
@online{ced2ar,
Title = {CED$^2$AR: {C}omprehensive {E}xtensible {D}ata {D}ocumentation and {A}ccess Repository},
Author = {Benjamin Perry and Jeremy Williams and Lars Vilhuber and William Block},
HowPublished = {online resource},
Organization = {Cornell University, for NSF Grant SES-1131848},
Institution = {Cornell University, for NSF Grant SES-1131848},
type = {online resource},
URL = {http://www2.ncrn.cornell.edu/ced2ar-web/},
Urldate = {2014-04-10},
Year = {2013}
}

### 2012

• A. Karr, L. Vilhuber, J. Nunnelly, and K. Kantner, “NSF-Census Research Network,” , 2012.
[URL] [Bibtex]
@online{ncrn.info,
Title = {{NSF-Census} {R}esearch {N}etwork},
Author = {Alan Karr and Lars Vilhuber and Jamie Nunnelly and Katherine Kantner },
Organization = {National Institute for the Statistical Sciencies (NISS), Cornell University, and Duke University, for NSF Grant SES-1237602},
Institution = {National Institute for the Statistical Sciencies (NISS), Cornell University, and Duke University, for NSF Grant SES-1237602},
URL = {http://www.ncrn.info},
Urldate = {2014-04-10},
Year = {2012}
}
• L. Vilhuber, B. Perry, W. Block, and J. Williams, “NSF-Census Research Network – Cornell node website,” , 2012.
[URL] [Bibtex]
@online{ncrn.cornell,
Title = {{NSF-Census} {R}esearch {N}etwork - {C}ornell node website},
Author = {Lars Vilhuber and Benjamin Perry and William Block and Jeremy Williams},
Organization = {Cornell University, for NSF Grant SES-1131848},
URL = {http://www.ncrn.cornell.edu},
Urldate = {2014-04-10},
Year = {2012}
}

### 2010

• J. M. Abowd and L. Vilhuber, “VirtualRDC – Synthetic Data Server,” , 2010.
[URL] [Bibtex]
@online{AbowdVilhuber,
Title = {{VirtualRDC} - {Synthetic} {Data} {Server}},
Author = {John M. Abowd and Lars Vilhuber},
Type = {online resource},
HowPublished = {online resource},
Organization = {Cornell University, Labor Dynamics Institute},
Institution = {Cornell University, Labor Dynamics Institute},
Owner = {vilhuber},
Timestamp = {2013.10.15},
URL = {http://www.vrdc.cornell.edu/sds/},
Year = {2010}
}
• S. Von Schrader, W. Erickson, T. Golden, and L. Vilhuber, “New York State Disability and Employment Status Report, 2010,” , 2010.
[URL] [Bibtex]
@online{Employment2010,
Title = {New York State Disability and Employment Status Report, 2010},
Author = {Von Schrader, Sarah and Erickson, William and Golden, Thomas and Lars Vilhuber },
Organization = {Cornell University, Employment and Disability Institute on behalf of New York Makes Work Pay Comprehensive Employment System Medicaid Infrastructure Grant},
URL = {http://www.nymakesworkpay.org/status-reports/index.cfm},
Urldate = {2014-04-10},
Year = {2010}
}

### 2009

• S. Von Schrader, W. Erickson, L. Vilhuber, and T. Golden, “County-level Disability and Employment Status Reports, 2007,” , 2009.
[URL] [Bibtex]
@online{Employment2007,
Title = {County-level Disability and Employment Status Reports, 2007},
Author = {Von Schrader, Sarah and Erickson, William and Lars Vilhuber and Golden, Thomas },
Organization = {Cornell University, Employment and Disability Institute on behalf of New York Makes Work Pay Comprehensive Employment System Medicaid Infrastructure Grant},
URL = {http://www.ilr.cornell.edu/edi/nymakesworkpay/policy/stats_2009.cfm},
Urldate = {2009-07-01},
Year = {2009}
}
• S. Von Schrader, W. Erickson, L. Vilhuber, and T. Golden, “County-level Disability and Employment Status Reports, 2009,” , 2009.
[URL] [Bibtex]
@online{Employment2009online,
Title = {County-level Disability and Employment Status Reports, 2009},
Author = {Von Schrader, Sarah and Erickson, William and Lars Vilhuber and Golden, Thomas. },
Organization = {Cornell University, Employment and Disability Institute on behalf of New York Makes Work Pay Comprehensive Employment System Medicaid Infrastructure Grant},
URL = {http://www.ilr.cornell.edu/edi/nymakesworkpay/policy/index.cfm},
Urldate = {2010-01-01},
Year = {2009}
}

### 2004

• J. M. Abowd and L. Vilhuber, “VirtualRDC,” , 2004.
[URL] [Bibtex]
@online{vrdc,
Title = {{VirtualRDC}},
Author = {John M. Abowd and Lars Vilhuber},
Type = {online resource},
HowPublished = {online resource},
Institution = {Cornell University, Labor Dynamics Institute},
Organization = {Cornell University, Labor Dynamics Institute},
Owner = {vilhuber},
Timestamp = {2013.10.15},
URL = {http://www.vrdc.cornell.edu/},
Year = {2004}
}

## Data

### 2014

• J. M. Abowd and L. Vilhuber, “Replication data for: National estimates of gross employment and job flows from the Quarterly Workforce Indicators with demographic and industry detail,” , 2014.
[DOI] [URL] [Bibtex]
@report{AbowdVilhuber_NQWIDATA,
title={Replication data for: National estimates of gross employment and job flows from the Quarterly Workforce Indicators with demographic and industry detail},
url={http://dx.doi.org/10.7910/DVN/27923},
DOI={10.7910/DVN/27923},
publisher={Labor Dynamics Institute},
type={data},
author={Abowd, John M. and Vilhuber, Lars},
year={2014}}`