@TechReport{arendt:genome,
  author = {James W. Arendt},
  title = {Parallel Genome Sequence Comparison Using a Concurrent File System},
  year = {1991},
  number = {UIUCDCS-R-91-1674},
  institution = {University of Illinois at Urbana-Champaign},
  keywords = {parallel file system, parallel I/O, Intel iPSC/2, pario-bib},
  comment = {Studies the performance of Intel CFS. Uses an application that
  reads in a huge file of records, each a genome sequence, and compares each
  sequence against a given sequence. Looks at cache performance, message
  latency, cost of prefetches and directory reads, and throughput. He tries
  one-disk, one-proc transfer rates. Because of contention with the directory
  server on one of the two I/O nodes, it was faster to put all of the file on
  the other I/O node. Striping is good for multiple readers. Best access
  pattern was interleaved, not segmented or separate files, because it avoided
  disk seeks. Perhaps the files are stored contiguously? Can get good speedup
  by reading the sequences in big integral record sizes, from CFS, using a
  load-balancing scheduled by the host. Contention for directory blocks --
  through single-node directory server.}
}