% Conference paper in the ADMA 2006 proceedings (see booktitle/series below).
% The citation key is kept exactly as exported so existing \cite commands keep
% resolving. Acronyms in title/booktitle are brace-protected so sentence-casing
% styles do not lowercase them; names use the unambiguous "Last, First" form.
% NOTE(review): the series volume number is not present in this record; add a
% `volume` field once confirmed against the publisher's page.
@inproceedings{0fffa0c3c99b4f1bb8e4f6802cab8873,
  author    = {Han, Jiawei and Gonzalez, Hector and Li, Xiaolei and Klabjan, Diego},
  title     = {Warehousing and mining massive {RFID} data sets},
  booktitle = {Advanced Data Mining and Applications - Second International Conference, {ADMA} 2006, Proceedings},
  editor    = {Li, Xue and Za{\"i}ane, Osmar R. and Li, Zhanhuai},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Verlag},
  year      = {2006},
  pages     = {1--18},
  doi       = {10.1007/11811305_1},
  isbn      = {3540370250},
  language  = {English (US)},
  note      = {2nd International Conference on Advanced Data Mining and Applications, ADMA 2006 ; Conference date: 14-08-2006 Through 16-08-2006},
  abstract  = {Radio Frequency Identification (RFID) applications are set to play an essential role in object tracking and supply chain management systems. In the near future, it is expected that every major retailer will use RFID systems to track the movement of products from suppliers to warehouses, store backrooms and eventually to points of sale. The volume of information generated by such systems can be enormous as each individual item (a pallet, a case, or an SKU) will leave a trail of data as it moves through different locations. We propose two data models for the management of this data. The first is a path cube that preserves object transition information while allowing muti-dimensional analysis of path dependent aggregates. The second is a workflow cube that summarizes the major patterns and significant exceptions in the flow of items through the system. The design of our models is based on the following observations: (1) items usually move together in large groups through early stages in the system (e.g., distribution centers) and only in later stages (e.g., stores) do they move in smaller groups, (2) although RFID data is registered at the primitive level, data analysis usually takes place at a higher abstraction level, (3) many items have similar flow patterns and only a relatively small number of them truly deviate from the general trend, and (4) only non-redundant flow deviations with respect to previously recorded deviations are interesting. These observations facilitate the construction of highly compressed RFID data warehouses and the exploration of such data warehouses by scalable data mining. In this study we give a general overview of the principles driving the design of our framework. We believe warehousing and mining RFID data presents an interesting application for advanced data mining.},
}