% TD:101622 -- TreeScope demonstration paper on structural anomalies in semi-structured data.
% The att_* fields are non-standard and are ignored by standard bibliography styles;
% they are kept byte-identical here (presumably consumed by export tooling -- confirm).
% NOTE(review): att_copyright_notice says this appeared in Volume 8, Issue 12 of a VLDB
% publication, yet the entry is typed as a tech report with the venue name stored in
% institution. Consider an article entry with journal/volume/number -- confirm first.
% NOTE(review): the published PDF is named p1904-Ying.pdf, which suggests Ying may be the
% first author; author order below is left as exported -- verify against the paper.
@techreport{TD:101622,
	att_abstract={{Semi-structured data are prevalent on the web, with formats such as XML and JSON soaring in popularity due to their generality, flexibility and easy customization. However, these same features make semi-structured data prone to a range of data quality errors, from errors in content to errors in structure. While the former has been well studied, not much attention has been paid to structural errors, which can impact applications quite severely.

In this demonstration, we present TREESCOPE, which analyzes semi-structured data sets with the goal of automatically identifying structural anomalies from the data. Our techniques learn robust structural models that have high support, to identify potential errors in the structure. Identified structural anomalies are then concisely summarized to provide plausible explanations of the potential errors. The goal of this demonstration is to enable an interactive exploration of the process of identifying and summarizing structural anomalies in semi-structured data sets.}},
	att_authors={ds8961},
	att_categories={C_IIS.6},
	att_copyright={{VLDB Foundation}},
	att_copyright_notice={{The definitive version was published in Very Large Databases, 2015. {{, Volume 8}}{{, Issue 12}}{{, 2015-08-31}}{{, http://www.vldb.org/pvldb/vol8/p1904-Ying.pdf}}
}},
	att_donotupload={},
	att_private={false},
	att_projects={},
	att_tags={},
	att_techdoc={true},
	att_techdoc_key={TD:101622},
	att_url={http://web1.research.att.com:81/techdocs_downloads/TD:101622_DS1_2015-04-25T11:14:06.624Z.pdf},
	author={Srivastava, Divesh and Ying, Shanshan and Korn, Flip and Saha, Barna},
	institution={{Proceedings of the VLDB Endowment}},
	month=aug,
	title={{TreeScope}: Finding Structural Anomalies In Semi-Structured Data},
	year=2015,
}