@inproceedings{e30fb7d96cc54fd18cf00a80513554ad,

title = "Algorithms to calculate the Manhattan (L1) distance for vertical data represented in pTrees",

abstract = "In data mining applications different types of distance metrics are used to measure the closeness of two data points. Among these metrics Manhattan (L1), Euclidean (L2) and Max (L.) distances are used very frequently in various algorithms. In pTree vertical data representation Max distance can be efficiently implemented using only bitwise operations across the pTrees without any horizontal access of the data points. But many clustering and classification algorithms require computing L1 and L2 distances in order to increase 1 their accuracy. In this paper we have shown how Manhattan or L1 distance can be calculated for vertical data represented in pTrees. Similar to the Max distance this algorithm also uses only bitwise operations across various pTrees without performing any horizontal scan of the data points. As a result the algorithm works very fast on huge volume of data represented by pTrees comparing with traditional horizontal data representation. Also these algorithms enable various data mining algorithms that use pTrees to improve their accuracy without sacrificing any significant speed.",

author = "Mohammad Hossain and Roy, {Arjun G.} and Arijit Chatterjee and William Perrizo",

year = "2012",

month = dec,

day = "1",

language = "English (US)",

isbn = "9781880843840",

series = "Proceedings of the ISCA 27th International Conference on Computers and Their Applications, CATA 2012",

pages = "65--70",

booktitle = "Proceedings of the ISCA 27th International Conference on Computers and Their Applications, CATA 2012",

note = "27th International Conference on Computers and Their Applications, CATA 2012 ; Conference date: 12-03-2012 Through 14-03-2012",

}