@InProceedings{Hoffman_PDPTA99_19990628, author = {Forrest M. Hoffman and William W. Hargrove}, title = {Multivariate Geographic Clustering Using a {B}eowulf-style Parallel Computer}, editor = {Hamid R. Arabnia}, booktitle = {Proceedings of the International Conference on Parallel and Distributed Processing Techniques and Applications ({PDPTA} '99)}, volume = {III}, dates = {28 June--1 July 1999}, location = {Las Vegas, Nevada}, publisher = {CSREA Press}, pages = {1292--1298}, ISBN = {1-892512-11-4}, day = 28, month = jun, year = 1999, abstract = {The authors present an application of multivariate non-hierarchical statistical clustering to geographic environmental data from the 48 conterminous United States in order to produce maps of regions of ecological similarity called ecoregions. Nine input variables thought to affect the growth of vegetation are clustered at a resolution of one square kilometer. These data represent over 7.8 million map cells in a 9-dimensional data space. For the analysis, the authors built a 126-node heterogeneous cluster---aptly named the Stone SouperComputer---out of surplus PCs. The authors developed a parallel iterative statistical clustering algorithm which uses the MPI message passing routines, employs a classical master/slave single program multiple data (SPMD) organization, performs dynamic load balancing, and provides fault tolerance. In addition to being run on the Stone SouperComputer, the parallel algorithm was tested on other parallel platforms without code modification. Finally, the results of the geographic clustering are presented.} }