<?xml version="1.0" encoding="ISO-8859-1"?>

<rdf:RDF
 xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
 xmlns="http://purl.org/rss/1.0/"
 xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/"
 xmlns:dc="http://purl.org/dc/elements/1.1/"
 xmlns:syn="http://purl.org/rss/1.0/modules/syndication/"
 xmlns:prism="http://purl.org/rss/1.0/modules/prism/"
 xmlns:admin="http://webns.net/mvcb/"
>

<channel rdf:about="http://hpc.sagepub.com">
<title>International Journal of High Performance Computing Applications recent issues</title>
<link>http://hpc.sagepub.com</link>
<description>International Journal of High Performance Computing Applications RSS feed -- recent issues</description>
<prism:publicationName>International Journal of High Performance Computing Applications</prism:publicationName>
<prism:issn>1094-3420</prism:issn>
<items>
 <rdf:Seq>
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/309?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/323?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/328?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/332?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/335?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/337?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/340?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/344?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/347?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/reprint/23/4/350?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/355?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/357?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/361?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/366?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/369?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/374?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/389?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/392?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/395?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/398?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/401?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/403?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/reprint/23/4/409?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/411?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/413?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/reprint/23/4/421?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/423?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/427?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/4/437?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/reprint/23/3/195?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/3/196?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/3/212?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/3/227?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/3/242?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/3/252?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/3/265?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/3/277?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/3/284?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/2/123?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/2/140?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/2/152?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/2/171?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/reprint/23/1/3?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/1/5?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/1/14?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/1/29?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/1/42?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/1/62?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/1/84?rss=1" />
  <rdf:li rdf:resource="http://hpc.sagepub.com/cgi/content/abstract/23/1/99?rss=1" />
 </rdf:Seq>
</items>
<image rdf:resource="http://hpc.sagepub.com:80/icons/banner/title.gif" />
</channel>

<image rdf:about="http://hpc.sagepub.com:80/icons/banner/title.gif">
<title>International Journal of High Performance Computing Applications</title>
<url>http://hpc.sagepub.com:80/icons/banner/title.gif</url>
<link>http://hpc.sagepub.com</link>
</image>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/309?rss=1">
<title><![CDATA[The International Exascale Software Project: a Call To Cooperative Action By the Global High-Performance Community]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/309?rss=1</link>
<description><![CDATA[<p>Over the last 20 years, the open-source community has provided more and more software on which the world&rsquo;s high-performance computing systems depend for performance and productivity. The community has invested millions of dollars and years of effort to build key components. Although the investments in these separate software elements have been tremendously valuable, a great deal of productivity has also been lost because of the lack of planning, coordination, and key integration of technologies necessary to make them work together smoothly and efficiently, both within individual petascale systems and between different systems. A repository gatekeeper and an email discussion list can coordinate open-source development within a single project, but there is no global mechanism working across the community to identify critical holes in the overall software environment, spot opportunities for beneficial integration, or specify requirements for more careful coordination. It seems clear that this completely uncoordinated development model will not provide the software needed to support the unprecedented parallelism required for peta/exascale computation on millions of cores, or the flexibility required to exploit new hardware models and features, such as transactional memory, speculative execution, and GPUs. We believe the community must work together to prepare for the challenges of exascale computing, ultimately combing their efforts in a coordinated International Exascale Software Project.</p>]]></description>
<dc:creator><![CDATA[Dongarra, J., Beckman, P., Aerts, P., Cappello, F., Lippert, T., Matsuoka, S., Messina, P., Moore, T., Stevens, R., Trefethen, A., Valero, M.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347714</dc:identifier>
<dc:title><![CDATA[The International Exascale Software Project: a Call To Cooperative Action By the Global High-Performance Community]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>322</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>309</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/323?rss=1">
<title><![CDATA[Summary of the IESP White Papers]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/323?rss=1</link>
<description><![CDATA[<p>As part of the planning and development process for the IESP workshops, we asked participants to prepare white papers on various topics. We have grouped and summarized the content of the white papers that were contributed here. The list of the white papers relevant to a given group is given at the end of the summary for that group.</p>]]></description>
<dc:creator><![CDATA[Mohr, B.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347484</dc:identifier>
<dc:title><![CDATA[Summary of the IESP White Papers]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>327</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>323</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/328?rss=1">
<title><![CDATA[Programmability Issues]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/328?rss=1</link>
<description><![CDATA[<p>Programming models are at the very center of our effort to address the exascale challenge. They are the key interface that will allow the separation of the programmers&rsquo; concerns from those of system designers, potentially at different levels of granularity. Any such model must meet the extensive needs of application developers and be supported by the entire software stack. Considerable research is needed to define and implement the programming and execution models for such systems. Whereas evolutionary approaches may best support the migration of existing application software, revolutionary models may be best suited to providing extreme-scale performance for new applications on emerging architectures. Both approaches should be explored.</p>]]></description>
<dc:creator><![CDATA[Chapman, B., Labarta, J., Sarkar, V., Sato, M.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347488</dc:identifier>
<dc:title><![CDATA[Programmability Issues]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>331</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>328</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/332?rss=1">
<title><![CDATA[Models of Computation -- Enabling Exascale]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/332?rss=1</link>
<description><![CDATA[<p>A model of computation provides a set of governing principles and a discipline determining the objects, their interrelationships, parallel flow control, and distribution. In so doing it provides a conceptual framework for the co-design and operation for all layers of the software and hardware architecture system stack from programming model through system software to processor core instruction set and structures. As enabling technologies advance changing capabilities, balance, and design challenges, the response has been a phase change in how HPC systems are realized reflected by the development and adoption of new models of computation to best fit the emerging underlying technology conditions. This has occurred at least through five technology epochs in the past and the field is entering a sixth such with the heterogeneous multicore Petaflops decade. A brief presentation of the nature and characteristics of models of computation is offered here to contribute to the current community discussions on how to proceed towards the realization of the promise of practical Exascale computing by the end of the next decade.</p>]]></description>
<dc:creator><![CDATA[Sterling, T.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347490</dc:identifier>
<dc:title><![CDATA[Models of Computation -- Enabling Exascale]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>334</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>332</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/335?rss=1">
<title><![CDATA[The Biggest Need: a New Model of Computation]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/335?rss=1</link>
<description><![CDATA[<p>The development of HPC systems capable of exascale performance will demand innovations in hardware architecture and system software as well as programming models and methods. The combination of a vast increase in scale of such systems combined with the emergence of heterogeneous multicore structures is forcing future systems to be organized and operate on principles very different from the conventional practices of the last two decades. The biggest need for achieving exascale computing is the development of a new model of computation that will provide the new paradigm exploiting the opportunities and addressing the challenges of the emerging technologies and advanced architectures that together will comprise future exascale systems. This brief paper discusses the need for a new model of computation and the properties such a model should embody.</p>]]></description>
<dc:creator><![CDATA[Sterling, T.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347492</dc:identifier>
<dc:title><![CDATA[The Biggest Need: a New Model of Computation]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>336</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>335</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/337?rss=1">
<title><![CDATA[Slouching Towards Exascale]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/337?rss=1</link>
<description><![CDATA[<p>One question before the high-performance computing community is "How will application developers write code for exascale machines?" At this point it looks like they might be riding a rough beast indeed. This paper is a brief assessment of where we stand now with respect to writing programs for our largest supercomputers and what we should do next. MPI is likely to remain a critical part of the programming infrastructure as we move towards exascale, but more is needed, in particular a robust, portable, and effective standard for parallel programming within a single address space, perhaps for heterogeneous processors. Formal methods provide the only truly scalable approach to developing correct code in this complex programming environment.</p>]]></description>
<dc:creator><![CDATA[Lusk, E.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347493</dc:identifier>
<dc:title><![CDATA[Slouching Towards Exascale]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>339</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>337</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/340?rss=1">
<title><![CDATA[BSC Vision Towards Exascale]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/340?rss=1</link>
<description><![CDATA[<p>This paper provides the vision of the Barcelona Supercomputing Center towards exascale computing. We believe that it is key to have unified views of future computer systems, looking at the good ideas, developments, and practices from the past and applying them at the scalability levels we want to consider. The programming model is of Alexander&rsquo;s sword used to break the Gordian knot of exascale systems based on massive multicore architectures. The implementation of the programming model should decouple the way programs are written by the user (parallelism, address spaces, etc.) and executed by the runtime (execution vehicles, memory containers, malleability and load balancing, fault tolerance, etc.) on a specific target architecture. At the application level, it will be crucial to ensure that application porting is going to guarantee their survival for some decades or their clean upgrade to the foreseeable explosion of hardware platforms. Performance tools and analysis practices are in their infancy with regard to providing the required exascale support. BSC would like to contribute with this vision and ongoing efforts to the holistic exascale initiative.</p>]]></description>
<dc:creator><![CDATA[Labarta, J., Ayguade, E., Valero, M.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347439</dc:identifier>
<dc:title><![CDATA[BSC Vision Towards Exascale]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>343</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>340</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/344?rss=1">
<title><![CDATA[Programming Models at Exascale: Adaptive Runtime Systems, Incomplete Simple Languages, and Interoperability]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/344?rss=1</link>
<description><![CDATA[<p>Applications running on exascale machines will be complex in many ways. They will involve dynamic and adaptive refinements, and will be composed of multiple, independently developed modules, often involving a multiphysics simulation. The programming models of this era must have several characteristics. First, they need to do away with the notion of processors, and automate resource management via adaptive runtime systems. Data structure-specific frameworks and domain-specific environments will be needed to further simplify programming. More importantly, parallel mini-languages need to be developed, such that each language captures only a restricted subset of possible parallel interactions, but allows for a simple expression of them. Coupled with interoperability and parallel composition, which must be supported in many ways, including message-driven runtime systems, this will create a productive ecosystem of parallel programming models for the exascale era.</p>]]></description>
<dc:creator><![CDATA[Kale, L.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347497</dc:identifier>
<dc:title><![CDATA[Programming Models at Exascale: Adaptive Runtime Systems, Incomplete Simple Languages, and Interoperability]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>346</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>344</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/347?rss=1">
<title><![CDATA[Resource Management]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/347?rss=1</link>
<description><![CDATA[<p>Application scalability is directly related to the ability of the application developer to effectively use the resources provided by a computing system. As we start to address the development of exascale platforms, we must engage in a dialog to define the terms related to resource management. Approaches to resource management can be categorized in two dimensions: static/dynamic and explicit/ implicit. The static/dynamic dimension refers to when resource management decisions are made: prior to program execution or during program execution. The implicit/ explicit dimension refers to the object that implements the decision making: the tools that implement the programming environment or the application developer. The development of applications that can scale to the resources provided by an exascale system will require tools that allow programmers to move easily and seamlessly between these dimensions as they express resource management decisions.</p>]]></description>
<dc:creator><![CDATA[Maccabe, A., Falter, H., Kramer, W.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347498</dc:identifier>
<dc:title><![CDATA[Resource Management]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>349</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>347</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/reprint/23/4/350?rss=1">
<title><![CDATA[The Case for a Hierarchical System Model for Linux Clusters]]></title>
<link>http://hpc.sagepub.com/cgi/reprint/23/4/350?rss=1</link>
<description><![CDATA[]]></description>
<dc:creator><![CDATA[Seager, M., Gorda, B.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347499</dc:identifier>
<dc:title><![CDATA[The Case for a Hierarchical System Model for Linux Clusters]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>354</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>350</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/355?rss=1">
<title><![CDATA[Performance at Exascale]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/355?rss=1</link>
<description><![CDATA[<p>Exascale systems will consist of complex configurations with a huge number of potentially heterogeneous components. Deep software hierarchies of large, complex software components will be required to make use of such systems. While the software layers are designed to be transparent, they are typically not transparent with respect to performance. This performance non-transparency will result in escalation of unforeseen problems to higher layers, including the application. Altogether this will require an integrated and collaborative approach to handling performance issues and correctly detecting and analyzing performance problems. Contributions to this integrated approach are required from areas such as system design, operating software, and programming models, as well as performance modeling, monitoring, and analysis.</p>]]></description>
<dc:creator><![CDATA[Mohr, B., Muller, M. S., Nagel, W. E.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347501</dc:identifier>
<dc:title><![CDATA[Performance at Exascale]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>356</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>355</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/357?rss=1">
<title><![CDATA[On the Importance of End-to-End Application Performance Monitoring and Workload Analysis at the Exascale]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/357?rss=1</link>
<description><![CDATA[<p>This paper sets out to examine the future of performance monitoring on exascale HPC systems. In particular we put forth the idea that such machines will be sufficiently complex that performance monitoring of individual applications and the workload as a whole will change from being a beneficial option to being a necessity. This complexity arises from the number of components and concurrencies expected for such systems. We see the need for a shift from performance monitoring being a useful add-on toward it being a core requirement for basic operation and suggest some first steps toward meeting that need.</p>]]></description>
<dc:creator><![CDATA[Skinner, D., Choudary, A.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347502</dc:identifier>
<dc:title><![CDATA[On the Importance of End-to-End Application Performance Monitoring and Workload Analysis at the Exascale]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>360</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>357</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/361?rss=1">
<title><![CDATA[XXL Simulation for XXIst Century Power Systems Operation]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/361?rss=1</link>
<description><![CDATA[<p>As an industrial user with very high stakes in the operation and maintenance of complex systems such as nuclear power plants, EDF has been engaged in simulation for many years. We feel that exaflops software should not only be thought of as a way of tackling daunting research problems but should also take into account the sometimes equally daunting requirements that stem from an industrial usage perspective. We do feel that, whatever the hard changes that will probably have to be made to various software aspects, we should not lose sight of the fact that continuity paths also have to be found in order to make those big changes acceptable and profitable to many. We identify in this paper what we think are priority research themes that could benefit from an international collaboration.</p>]]></description>
<dc:creator><![CDATA[Berthou, J.-Y., Hamelin, J.-F., de Rocquigny, E.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347503</dc:identifier>
<dc:title><![CDATA[XXL Simulation for XXIst Century Power Systems Operation]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>365</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>361</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/366?rss=1">
<title><![CDATA[Partial Differential Equation-Based Applications and Solvers At Extreme Scale]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/366?rss=1</link>
<description><![CDATA[<p>Partial differential equation-based applications of multi-scale, multiphysics phenomena have driven the quest for extreme architectural scales since the foundation of modern digital computing and will continue to be principal among a broader set of science drivers for the foreseeable future. However, scientific and engineering drivers ceased long ago to dominate the computing industry and any commercially viable path to the petascale would seem to be through architectures that are assembled from components designed without the balance of resources required by scientific and engineering simulations foremost in mind. Concurrency will be massive and will involve many cores sharing common memory at the finest scales and severely dividing available memory bandwidth. As a result, algorithm designers will have to look beyond the message-passing-based SPMD paradigm that dominates today&rsquo;s most successful large-scale applications and solver frameworks, with stronger than ever emphasis on locality or operands and synchronization avoidance.</p>]]></description>
<dc:creator><![CDATA[Keyes, D.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347504</dc:identifier>
<dc:title><![CDATA[Partial Differential Equation-Based Applications and Solvers At Extreme Scale]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>368</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>366</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/369?rss=1">
<title><![CDATA[Application Analysis and Porting in the PRACE Project]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/369?rss=1</link>
<description><![CDATA[<p>This paper reports on the construction of a benchmark suite, to be used both within the current PRACE project and beyond, when actual Tier-0 systems will be purchased. PRACE targets toward a European research infrastructure, ideally consisting of various hardware architectures. This implicitly means that some applications are more suited to certain architectures than others. This needs to be reflected in the final benchmark suite, with the idea that potentially subsets of the overall benchmark suite may be used for benchmarking different architectures. The paper gives insight into the ideas behind the construction of the benchmark suite, including the current status of it.</p>]]></description>
<dc:creator><![CDATA[Michielse, P.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347505</dc:identifier>
<dc:title><![CDATA[Application Analysis and Porting in the PRACE Project]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>373</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>369</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/374?rss=1">
<title><![CDATA[Toward Exascale Resilience]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/374?rss=1</link>
<description><![CDATA[<p>Over the past few years resilience has became a major issue for high-performance computing (HPC) systems, in particular in the perspective of large petascale systems and future exascale systems. These systems will typically gather from half a million to several millions of central processing unit (CPU) cores running up to a billion threads. From the current knowledge and observations of existing large systems, it is anticipated that exascale systems will experience various kind of faults many times per day. It is also anticipated that the current approach for resilience, which relies on automatic or application level checkpoint/ restart, will not work because the time for checkpointing and restarting will exceed the mean time to failure of a full system. This set of projections leaves the community of fault tolerance for HPC systems with a difficult challenge: finding new approaches, which are possibly radically disruptive, to run applications until their normal termination, despite the essentially unstable nature of exascale systems. Yet, the community has only five to six years to solve the problem. This white paper synthesizes the motivations, observations and research issues considered as determinant of several complimentary experts of HPC in applications, programming models, distributed systems and system management.</p>]]></description>
<dc:creator><![CDATA[Cappello, F., Geist, A., Gropp, B., Kale, L., Kramer, B., Snir, M.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347767</dc:identifier>
<dc:title><![CDATA[Toward Exascale Resilience]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>388</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>374</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/389?rss=1">
<title><![CDATA[An Exascale Approach to Software and Hardware Design]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/389?rss=1</link>
<description><![CDATA[<p>For the past 10&mdash;15 years, horizontal layers of software and hardware design and development have been the <I>de facto</I> standard of creating high-performance computing (HPC) software. The horizontal design approach leads to the development of discrete components in the software stack and independent hardware components &mdash; all developed with different methods, requirements and quality dominated by plug-and-play componentization that is focused on horizontal functionality and portability. The horizontal software paradigm will break down at the exascale due to the system scale and complexity. The vertical approach needed for the exascale should include resilience (reliability and fault tolerance); performance; programmability; computational models; I/O; consistency and verification; resource management; and power management/total cost of ownership. To make the exascale an effective reality, instead of thinking of integration as the final step in defining and developing an exascale system, it will have to be the first step.</p>]]></description>
<dc:creator><![CDATA[Kramer, W., Skinner, D.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347768</dc:identifier>
<dc:title><![CDATA[An Exascale Approach to Software and Hardware Design]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>391</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>389</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/392?rss=1">
<title><![CDATA[Consistent Application Performance at the Exascale]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/392?rss=1</link>
<description><![CDATA[<p>We examine the future of application performance consistency on exascale parallel computing systems. By performance consistency we mean the regularity of wall clock times to complete a fixed amount of application progress. Exascale systems will have dramatically increased complexity along with their capability. Contributors to inconsistency include architectural choices, software functions and subtle interactions, and inconsistency will lead to lost potential. The challenge is how to maintain consistency at the exascale. In order for exascale systems to exhibit the consistency that is required to make the applications and systems productive, a new understanding of the causes and solutions to inconsistency is required, along with new ways of measuring the impact that design, implementation and operational choices have on consistency.</p>]]></description>
<dc:creator><![CDATA[Kramer, W., Skinner, D.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347700</dc:identifier>
<dc:title><![CDATA[Consistent Application Performance at the Exascale]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>394</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>392</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/395?rss=1">
<title><![CDATA[A Collaboration and Commercialization Model for Exascale Software Research]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/395?rss=1</link>
<description><![CDATA[<p>We propose a coordinated strategy for exascale software development that includes the incorporation of successful research and development (R&amp;D) into development and engineering (D&amp;E) projects and harvesting the successful D&amp;E projects into products with vendor support (P&amp;S). This allows the most flexible R&amp;D agenda while at the same time providing a commercialization path. This process is described as a natural extension of current focus areas and funding agents for R&amp;D, D&amp;E and P&amp;S, but adds stake holders from the next stage in the process in the upstream processes. This model allows the flexibility to encourage development and competition of ideas in the research, development and productization phases. We anticipate that multiple iterations through this process from R&amp;D through P&amp;S are required to achieve appropriate software for Exascale systems.</p>]]></description>
<dc:creator><![CDATA[Seager, M., Gorda, B.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347701</dc:identifier>
<dc:title><![CDATA[A Collaboration and Commercialization Model for Exascale Software Research]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>397</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>395</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/398?rss=1">
<title><![CDATA[Towards Exascale Distributed Data Management]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/398?rss=1</link>
<description><![CDATA[<p>"Exascale eScience infrastructures" will face important and critical challenges, both from computational and data perspectives. Increasingly complex and parallel scientific codes will lead to the production of a huge amount of data. The large volume of data and the time needed to locate, access, analyze and visualize data will greatly impact on the scientific productivity of scientists and researchers in several domains. Significant improvements in the data management field will increase research productivity in solving complex scientific problems. Next-generation eScience infrastructures will start from the assumption that exascale high-performance computing (HPC) applications (running on million of cores) will generate data at a very high rate (terabytes/s). Hundreds of exabytes of data (distributed across several centers) are expected, by 2020, to be available through heterogeneous storage resources for access, analysis, post-processing and other scientific activities.</p>]]></description>
<dc:creator><![CDATA[Aloisio, G., Fiore, S.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347702</dc:identifier>
<dc:title><![CDATA[Towards Exascale Distributed Data Management]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>400</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>398</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/401?rss=1">
<title><![CDATA[IESP Exascale Challenge: Co-Design of Architectures and Algorithms]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/401?rss=1</link>
<description><![CDATA[<p>There is a large gap between the peak performance of supercomputers and the actual performance realized by today&rsquo;s algorithms. This architecture&mdash;algorithm performance gap will get even wider with the increase in computing power being driven by a rapid escalation in the number of cores incorporated into a single chip rather than increases in the clock rate. In order to improve the effectiveness of peta and exascale systems we need to have a paradigm shift where architectures and algorithms are co-designed.</p>]]></description>
<dc:creator><![CDATA[Geist, A., Dosanjh, S.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347766</dc:identifier>
<dc:title><![CDATA[IESP Exascale Challenge: Co-Design of Architectures and Algorithms]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>402</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>401</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/403?rss=1">
<title><![CDATA[The Application Perspective: Seeking Productivity and Performance]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/403?rss=1</link>
<description><![CDATA[<p>In this note we propose two projects: (1) creating a hierarchical programming model from current models; and (2) extracting application primitives from the "13 dwarfs". The first topic addresses the need for a unified and manageable framework for very large-scale concurrent execution. This is the productivity part: less complexity will drive better mapping of algorithms to architecture, which will also contribute to better performance. The second topic focuses mostly on the processor and the node with the aim of laying the groundwork for software and silicon optimized kernels. While it is understood that applications primitives are outside the scope of IESP, the motivation for introducing it here is that it is a companion issue and that increasing the efficiency of each processor provides high return for science, at all levels of system size.</p>]]></description>
<dc:creator><![CDATA[Barkai, D.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347440</dc:identifier>
<dc:title><![CDATA[The Application Perspective: Seeking Productivity and Performance]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>408</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>403</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/reprint/23/4/409?rss=1">
<title><![CDATA[Musings on the Path Forward to Exascale]]></title>
<link>http://hpc.sagepub.com/cgi/reprint/23/4/409?rss=1</link>
<description><![CDATA[]]></description>
<dc:creator><![CDATA[Lucas, R. F]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347705</dc:identifier>
<dc:title><![CDATA[Musings on the Path Forward to Exascale]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>410</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>409</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/411?rss=1">
<title><![CDATA[Early Application Development/Tuning and Application Characterization/ Segmentation]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/411?rss=1</link>
<description><![CDATA[<p>This position paper makes two separate, only tangentially related points:</p><p>1. A research program is necessary to produce tools and techniques that allow application developers to develop and tune applications for future exascale machines, well before the machines are deployed.</p><p>2. In order to cope with, or facilitate, segmentation of exascale architectures, it is necessary to carry out an extensive study characterizing the needs and behaviors of applications that are expected to run on exascale machines.</p>]]></description>
<dc:creator><![CDATA[Kale, L.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347703</dc:identifier>
<dc:title><![CDATA[Early Application Development/Tuning and Application Characterization/ Segmentation]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>412</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>411</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/413?rss=1">
<title><![CDATA[On the Need for a Consortium of Capability Centers]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/413?rss=1</link>
<description><![CDATA[<p>Users of high-performance computing systems face many challenges, particularly as they design and develop their software to run at multiple facilities. This can lead to a "greatest common denominator" strategy that slows innovation and the adoption of newer techniques. In addition, these systems typically push the limits &mdash; leading to problems with reliability and functionality of the system and software. We propose a consortium of HPC centers to collaborate on raising both the capability and the quality of the software for HPC systems.</p>]]></description>
<dc:creator><![CDATA[Gropp, W., Snir, M.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347706</dc:identifier>
<dc:title><![CDATA[On the Need for a Consortium of Capability Centers]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>420</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>413</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/reprint/23/4/421?rss=1">
<title><![CDATA[Exascale Software: Some Questions to Drive the Development]]></title>
<link>http://hpc.sagepub.com/cgi/reprint/23/4/421?rss=1</link>
<description><![CDATA[]]></description>
<dc:creator><![CDATA[Patra, A., Pennington, R., Seidel, E.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347708</dc:identifier>
<dc:title><![CDATA[Exascale Software: Some Questions to Drive the Development]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>422</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>421</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/423?rss=1">
<title><![CDATA[Developing a High-Performance Computing/Numerical Analysis Roadmap]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/423?rss=1</link>
<description><![CDATA[<p>A roadmap activity in the UK has leveraged US and European efforts for identifying the challenges and barriers in the development of high-performance computing (HPC) algorithms and software. The activity has identified the Grand Challenge to provide:</p><p>1. Algorithms and software that application developers can reuse in the form of high-quality, high performance, sustained software components, libraries and modules</p><p>2. A community environment that allows the sharing of software, communication of interdisciplinary knowledge and the development of appropriate skills.</p><p>Through a series of workshops and discussions with UK HPC application groups and numerical analysts, five areas of challenge have emerged.</p>]]></description>
<dc:creator><![CDATA[Trefethen, A., Higham, N., Duff, I., Coveney, P.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347710</dc:identifier>
<dc:title><![CDATA[Developing a High-Performance Computing/Numerical Analysis Roadmap]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>426</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>423</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/427?rss=1">
<title><![CDATA[Major Computer Science Challenges At Exascale]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/427?rss=1</link>
<description><![CDATA[<p>Exascale systems will provide an unprecedented opportunity for science, one that will make it possible to use computation not only as a critical tool along with theory and experiment in understanding the behavior of the fundamental components of nature, but also for critical advances for the nation&rsquo;s energy needs and security. To create exascale systems and software that will enable the US Department of Energy (DOE) to meet the science goals critical to the nation&rsquo;s energy, ecological sustainability, and global security, we must focus on major architecture, software, algorithm, and data challenges, and build on newly emerging programming environments. Only with this new infrastructure will applications be able to scale up to the required levels of parallelism and integrate technologies into complex coupled systems for real-world multidisciplinary modeling and simulation. Achieving this goal will likely involve a shift from current static approaches for application development and execution to a combination of new software tools, algorithms, and dynamically adaptive methods.</p>]]></description>
<dc:creator><![CDATA[Geist, A., Lucas, R.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347445</dc:identifier>
<dc:title><![CDATA[Major Computer Science Challenges At Exascale]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>436</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>427</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/4/437?rss=1">
<title><![CDATA[Software Challenges for Extreme Scale Computing: Going From Petascale to Exascale Systems]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/4/437?rss=1</link>
<description><![CDATA[<p>Preparing applications for a transition from petascale to exascale systems will require a very large investment in several areas of software research and development. The introduction of manycore nodes, the abundance of parallelism, an increase in system faults (including soft errors) and a complicated, multi-component software environment are some of the most challenging issues we face. In this paper we address four topics we believe to be the most the challenging issues and therefore the greatest opportunities for making effective next-generation scalable applications. First and foremost is the need to transform existing applications to run on manycore platforms and properly design new applications. This is particularly challenging in the absence of a standard, portable manycore programming environment, but we can make progress in this direction while manycore programming models are developed. Second is promoting advanced modeling and simulation capabilities such as embedded optimization and uncertainty quantification that lead to higher quality results and orders of magnitude more parallelism. Third is progress toward fault resilience in applications, a critical need as system reliability degrades. Fourth and finally is a qualitative improvement in software design, including the social aspects, as exascale software systems will be increasingly multi-team and multi-faceted efforts.</p>]]></description>
<dc:creator><![CDATA[Heroux, M. A.]]></dc:creator>
<dc:date>Thu, 22 Oct 2009 02:11:07 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009347711</dc:identifier>
<dc:title><![CDATA[Software Challenges for Extreme Scale Computing: Going From Petascale to Exascale Systems]]></dc:title>
<prism:number>4</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>439</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>437</prism:startingPage>
<prism:section>Articles</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/reprint/23/3/195?rss=1">
<title><![CDATA[Editorial]]></title>
<link>http://hpc.sagepub.com/cgi/reprint/23/3/195?rss=1</link>
<description><![CDATA[]]></description>
<dc:creator><![CDATA[Dongarra, J., Tourancheau, B.]]></dc:creator>
<dc:date>Mon, 20 Jul 2009 04:07:45 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009343130</dc:identifier>
<dc:title><![CDATA[Editorial]]></dc:title>
<prism:number>3</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>195</prism:endingPage>
<prism:publicationDate>2009-08-01</prism:publicationDate>
<prism:startingPage>195</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/3/196?rss=1">
<title><![CDATA[Hybrid Message-Passing and Shared-Memory Programming in a Molecular Dynamics Application On Multicore Clusters]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/3/196?rss=1</link>
<description><![CDATA[<p>Hybrid programming, whereby shared-memory and message-passing programming techniques are combined within a single parallel application, has often been discussed as a method for increasing code performance on clusters of symmetric multiprocessors (SMPs). This paper examines whether the hybrid model brings any performance benefits for clusters based on multicore processors. A molecular dynamics application has been parallelized using both MPI and hybrid MPI/OpenMP programming models. The performance of this application has been examined on two high-end multicore clusters using both Infiniband and Gigabit Ethernet interconnects. The hybrid model has been found to perform well on the higher-latency Gigabit Ethernet connection, but offers no performance benefit on low-latency Infiniband interconnects. The changes in performance are attributed to the differing communication profiles of the hybrid and MPI codes.</p>]]></description>
<dc:creator><![CDATA[Chorley, M. J., Walker, D. W., Guest, M. F.]]></dc:creator>
<dc:date>Mon, 20 Jul 2009 04:07:45 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009106188</dc:identifier>
<dc:title><![CDATA[Hybrid Message-Passing and Shared-Memory Programming in a Molecular Dynamics Application On Multicore Clusters]]></dc:title>
<prism:number>3</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>211</prism:endingPage>
<prism:publicationDate>2009-08-01</prism:publicationDate>
<prism:startingPage>196</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/3/212?rss=1">
<title><![CDATA[Fault Tolerance in Petascale/ Exascale Systems: Current Knowledge, Challenges and Research Opportunities]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/3/212?rss=1</link>
<description><![CDATA[<p>The emergence of petascale systems and the promise of future exascale systems have reinvigorated the community interest in how to manage failures in such systems and ensure that large applications, lasting several hours or tens of hours, are completed successfully. Most of the existing results for several key mechanisms associated with fault tolerance in high-performance computing (HPC) platforms follow the rollback&mdash;recovery approach. Over the last decade, these mechanisms have received a lot of attention from the community with different levels of success. Unfortunately, despite their high degree of optimization, existing approaches do not fit well with the challenging evolutions of large-scale systems. There is room and even a need for new approaches. Opportunities may come from different origins: diskless checkpointing, algorithmic-based fault tolerance, proactive operation, speculative execution, software transactional memory, forward recovery, etc. The contributions of this paper are as follows: (1) we summarize and analyze the existing results concerning the failures in large-scale computers and point out the urgent need for drastic improvements or disruptive approaches for fault tolerance in these systems; (2) we sketch most of the known opportunities and analyze their associated limitations; (3) we extract and express the challenges that the HPC community will have to face for addressing the stringent issue of failures in HPC systems.</p>]]></description>
<dc:creator><![CDATA[Cappello, F.]]></dc:creator>
<dc:date>Mon, 20 Jul 2009 04:07:45 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009106189</dc:identifier>
<dc:title><![CDATA[Fault Tolerance in Petascale/ Exascale Systems: Current Knowledge, Challenges and Research Opportunities]]></dc:title>
<prism:number>3</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>226</prism:endingPage>
<prism:publicationDate>2009-08-01</prism:publicationDate>
<prism:startingPage>212</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/3/227?rss=1">
<title><![CDATA[Adaptive Fault Tolerance for Scalable Cluster Computing in Space]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/3/227?rss=1</link>
<description><![CDATA[<p>Future missions of deep-space exploration face the challenge of building more capable autonomous spacecraft and planetary rovers. Given the communication latencies and bandwidth limitations for such missions, the need for increased autonomy becomes mandatory, along with the requirement for enhanced on-board computational capabilities while in deep-space or time-critical situations. This will result in dramatic changes in the way missions are conducted and supported by on-board computing systems. Specifically, the traditional approach of relying exclusively on radiation-hardened hardware and modular redundancy will not be able to deliver the required computational power. As a consequence, such systems are expected to include high-capability low-power components based on emerging commercial-off-the-shelf (COTS) multi-core technology. In this paper we describe the design of a generic framework for introspection that supports runtime monitoring and analysis of program execution as well as a feedback-oriented recovery from faults. Our focus is on providing flexible software fault tolerance matched to the requirements and properties of applications by exploiting knowledge that is either contained in an application knowledge base, provided by users, or automatically derived from specifications. A prototype implementation is currently in progress at the Jet Propulsion Laboratory, California Institute of Technology, targeting a cluster of cell broadband engines.</p>]]></description>
<dc:creator><![CDATA[James, M. L., Shapiro, A. A., Springer, P. L., Zima, H. P.]]></dc:creator>
<dc:date>Mon, 20 Jul 2009 04:07:45 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009106190</dc:identifier>
<dc:title><![CDATA[Adaptive Fault Tolerance for Scalable Cluster Computing in Space]]></dc:title>
<prism:number>3</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>241</prism:endingPage>
<prism:publicationDate>2009-08-01</prism:publicationDate>
<prism:startingPage>227</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/3/242?rss=1">
<title><![CDATA[The Raid-6 Liber8Tion Code]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/3/242?rss=1</link>
<description><![CDATA[<p>Large centralized and networked storage systems have grown to the point where the single fault tolerance provided by RAID-5 is no longer enough. RAID-6 storage systems protect <I> k</I> disks of data with two parity disks so that the system of <I>k</I> + 2 disks may tolerate the failure of any two disks. Coding techniques for RAID-6 systems are varied, but an important class of techniques are those with <I>minimum density</I>, featuring an optimal combination of encoding, decoding and modification complexity. The <I>word size</I> of a code has an impact on both how the code is laid out on each disk's sectors and how large <I>k</I> can be. Word sizes which are powers of two are especially important, since they fit precisely into file system blocks. Minimum density codes exist for many word sizes with the notable exception of eight. This paper fills that gap by describing a new code called <b>The RAID-6 Liber8tion Code</b> for this important word size. The description includes performance properties as well as details of the discovery process.</p>]]></description>
<dc:creator><![CDATA[Plank, J. S.]]></dc:creator>
<dc:date>Mon, 20 Jul 2009 04:07:45 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009106191</dc:identifier>
<dc:title><![CDATA[The Raid-6 Liber8Tion Code]]></dc:title>
<prism:number>3</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>251</prism:endingPage>
<prism:publicationDate>2009-08-01</prism:publicationDate>
<prism:startingPage>242</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/3/252?rss=1">
<title><![CDATA[HPC and Grid Computing for Integrative Biomedical Research]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/3/252?rss=1</link>
<description><![CDATA[<p>Integrative biomedical research projects query, analyze, and integrate many different data types and make use of datasets obtained from measurements or simulations of structure and function at multiple biological scales. With the increasing availability of high-throughput and high-resolution instruments, the integrative biomedical research imposes many challenging requirements on software middleware systems. In this paper, we look at some of these requirements using example research pattern templates. We then discuss how middleware systems, which incorporate Grid and high-performance computing, could be employed to address the requirements.</p>]]></description>
<dc:creator><![CDATA[Kurc, T., Hastings, S., Kumar, V., Langella, S., Sharma, A., Pan, T., Oster, S., Ervin, D., Permar, J., Narayanan, S., Gil, Y., Deelman, E., Hall, M., Saltz, J.]]></dc:creator>
<dc:date>Mon, 20 Jul 2009 04:07:45 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009106192</dc:identifier>
<dc:title><![CDATA[HPC and Grid Computing for Integrative Biomedical Research]]></dc:title>
<prism:number>3</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>264</prism:endingPage>
<prism:publicationDate>2009-08-01</prism:publicationDate>
<prism:startingPage>252</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/3/265?rss=1">
<title><![CDATA[Energy Profiling and Analysis of the HPC Challenge Benchmarks]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/3/265?rss=1</link>
<description><![CDATA[<p>Future high performance systems must use energy efficiently to achieve petaFLOPS computational speeds and beyond. To address this challenge, we must first understand the power and energy characteristics of high performance computing applications. In this paper, we use a power-performance profiling framework called Power-Pack to study the power and energy profiles of the HPC Challenge benchmarks. We present detailed experimental results along with in-depth analysis of how each benchmark's workload characteristics affect power consumption and energy efficiency. This paper summarizes various findings using the HPC Challenge benchmarks, including but not limited to: 1) identifying application power profiles by function and component in a high performance cluster; 2) correlating applications' memory access patterns to power consumption for these benchmarks; and 3) exploring how energy consumption scales with system size and workload.</p>]]></description>
<dc:creator><![CDATA[Shuaiwen Song,  , Rong Ge,  , Xizhou Feng,  , Cameron, K. W.]]></dc:creator>
<dc:date>Mon, 20 Jul 2009 04:07:45 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009106193</dc:identifier>
<dc:title><![CDATA[Energy Profiling and Analysis of the HPC Challenge Benchmarks]]></dc:title>
<prism:number>3</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>276</prism:endingPage>
<prism:publicationDate>2009-08-01</prism:publicationDate>
<prism:startingPage>265</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/3/277?rss=1">
<title><![CDATA[Parallel Programming in MATLAB]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/3/277?rss=1</link>
<description><![CDATA[<p>A visit to the neighborhood PC retail store provides ample proof that we are in the multi-core era. The key differentiator among manufacturers today is the number of cores that they pack onto a single chip. The clock frequency of commodity processors has reached its limit, however, and is likely to stay below 4 GHz for years to come. As a result, adding cores is not synonymous with increasing computational power. To take full advantage of the performance enhancements offered by the new multi-core hardware, a corresponding shift must take place in the software infrastructure &mdash; a shift to parallel computing.</p>]]></description>
<dc:creator><![CDATA[Luszczek, P.]]></dc:creator>
<dc:date>Mon, 20 Jul 2009 04:07:45 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009106194</dc:identifier>
<dc:title><![CDATA[Parallel Programming in MATLAB]]></dc:title>
<prism:number>3</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>283</prism:endingPage>
<prism:publicationDate>2009-08-01</prism:publicationDate>
<prism:startingPage>277</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/3/284?rss=1">
<title><![CDATA[Hierarchical Task-Based Programming With StarSs]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/3/284?rss=1</link>
<description><![CDATA[<p>Programming models for multicore and many-core systems are listed as one of the main challenges in the near future for computing research. These programming models should be able to exploit the underlying platform, but also should have good programmability to enable programmer productivity. With respect to the heterogeneity and hierarchy of the underlying platforms, the programming models should take them into account but they should also enable the programmer to be unaware of the complexity of the hardware. In this paper we present an extension of the StarSs syntax to support task hierarchy. A motivation for such a hierarchical approach is presented through experimentation with CellSs. A prototype implementation of such a hierarchical task-based programming model that combines a first task level with SMPSs and a second task level with CellSs is presented. The preliminary results obtained when executing a matrix multiplication and a Cholesky factorization show the viability and potential of the approach and the current issues raised.</p>]]></description>
<dc:creator><![CDATA[Planas, J., Badia, R. M., Ayguade, E., Labarta, J.]]></dc:creator>
<dc:date>Mon, 20 Jul 2009 04:07:45 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009106195</dc:identifier>
<dc:title><![CDATA[Hierarchical Task-Based Programming With StarSs]]></dc:title>
<prism:number>3</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>299</prism:endingPage>
<prism:publicationDate>2009-08-01</prism:publicationDate>
<prism:startingPage>284</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/2/123?rss=1">
<title><![CDATA[Accurate and Efficient Estimation of Parameters of Heterogeneous Communication Performance Models]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/2/123?rss=1</link>
<description><![CDATA[<p>Analytical predictive communication models play an important role in the optimization of communication operations in scientific applications running on computational clusters. The effectiveness of this model-based optimization strongly depends on the accuracy of the estimation of the parameters of these models. The task of accurate estimation of the model is particularly challenging for heterogeneous communication models that use a much larger number of point-to-point parameters than their homogeneous counterparts. One particular challenge occurs when the number of point-to-point parameters describing communication between a pair of processors becomes larger than the number of independent point-to-point communication experiments traditionally used for estimation of the parameters. In this paper, we address this and other related issues and propose an approach that allows us to design a set of communication experiments sufficient for the accurate and efficient estimation of the parameters of a heterogeneous communication performance model. The experiments on heterogeneous clusters demonstrate the accuracy and efficiency of the proposed solution.</p>]]></description>
<dc:creator><![CDATA[Lastovetsky, A., Rychkov, V.]]></dc:creator>
<dc:date>Wed, 20 May 2009 04:33:32 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009103947</dc:identifier>
<dc:title><![CDATA[Accurate and Efficient Estimation of Parameters of Heterogeneous Communication Performance Models]]></dc:title>
<prism:number>2</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>139</prism:endingPage>
<prism:publicationDate>2009-05-01</prism:publicationDate>
<prism:startingPage>123</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/2/140?rss=1">
<title><![CDATA[A Parallel Algorithm To Solve Large Stiff ODE Systems On Grid Systems]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/2/140?rss=1</link>
<description><![CDATA[<p>This paper introduces a parallel algorithm to solve large stiff ODE systems on distributed clusters, with computing nodes geographically distant from each other. This algorithm is based on the waveform relaxation method coupled with a sequential solver for differential equations systems. With respect to the standard PVODE algorithm (Parallel Variable-coefficient Ordinary Differential Equations solver; Byrne, George, and Hindmars 1999), it drastically reduces the number of messages exchanged between nodes which makes it less sensitive to slow communications. Thus, it is a coarse-grained algorithm well suited for grid environments connected via high latency networks. In this paper, we present various experiments which compare the PVODE solver and our algorithm and which show the benefits brought by this work.</p>]]></description>
<dc:creator><![CDATA[Bahi, J. M., Charr, J.-C., Couturier, R., Laiymani, D.]]></dc:creator>
<dc:date>Wed, 20 May 2009 04:33:32 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009104010</dc:identifier>
<dc:title><![CDATA[A Parallel Algorithm To Solve Large Stiff ODE Systems On Grid Systems]]></dc:title>
<prism:number>2</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>151</prism:endingPage>
<prism:publicationDate>2009-05-01</prism:publicationDate>
<prism:startingPage>140</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/2/152?rss=1">
<title><![CDATA[Parallel Algorithms for the Execution of Relational Database Operations Revisited On Grids]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/2/152?rss=1</link>
<description><![CDATA[<p>This paper presents an analytical discussion of algorithms for relational database operations in a grid environment, compares the findings with the classical generalized multiprocessor framework, and describes an optimization algorithm to maximize performance for a heterogeneous environment.</p><p>We develop a concise but comprehensive analytical model of parallel algorithms for sorting, joining, and aggregation. In our approach we focus on a limited number of characteristic parameters to keep the analytical model clear. It is shown that an expressive model can be built upon just three characteristic parameter sets, namely the node processing performance and the network and the disk bandwidths. These parameters are the input for the optimization process for the orchestration of the execution workflow on the grid. Based on these results the paper proves that using smart enhancement to exploit the heterogeneity of the grid, the performance of the algorithms for database operations can be increased remarkably.</p>]]></description>
<dc:creator><![CDATA[Mach, W., Schikuta, E.]]></dc:creator>
<dc:date>Wed, 20 May 2009 04:33:32 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009104006</dc:identifier>
<dc:title><![CDATA[Parallel Algorithms for the Execution of Relational Database Operations Revisited On Grids]]></dc:title>
<prism:number>2</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>170</prism:endingPage>
<prism:publicationDate>2009-05-01</prism:publicationDate>
<prism:startingPage>152</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/2/171?rss=1">
<title><![CDATA[Multi-Criteria Scheduling of Pipeline Workflows (and Application To the JPEG Encoder)]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/2/171?rss=1</link>
<description><![CDATA[<p>Mapping workflow applications onto parallel platforms is a challenging problem, even for simple application patterns such as pipeline graphs. Several antagonist criteria should be optimized, such as throughput and latency (or a combination). A typical application class is digital image coding, where images are processed in steady-state mode. In this paper, we study the general bi-criteria mapping problem (minimizing period and latency) for pipeline graphs on communication homogeneous platforms. We present an integer linear programming formulation for this NP-hard problem. Furthermore, we provide several efficient polynomial bi-criteria heuristics, whose relative performance is evaluated through extensive simulations. As a case study, we provide simulations and MPI experimental results for the JPEG encoder application pipeline on a cluster of workstations.</p>]]></description>
<dc:creator><![CDATA[Benoit, A., Kosch, H., Rehn-Sonigo, V., Robert, Y.]]></dc:creator>
<dc:date>Wed, 20 May 2009 04:33:32 PDT</dc:date>
<dc:identifier>info:doi/10.1177/1094342009104009</dc:identifier>
<dc:title><![CDATA[Multi-Criteria Scheduling of Pipeline Workflows (and Application To the JPEG Encoder)]]></dc:title>
<prism:number>2</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>187</prism:endingPage>
<prism:publicationDate>2009-05-01</prism:publicationDate>
<prism:startingPage>171</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/reprint/23/1/3?rss=1">
<title><![CDATA[Thank You To Reviewers]]></title>
<link>http://hpc.sagepub.com/cgi/reprint/23/1/3?rss=1</link>
<description><![CDATA[]]></description>
<dc:creator><![CDATA[]]></dc:creator>
<dc:date>Wed, 18 Feb 2009 07:55:26 PST</dc:date>
<dc:identifier>info:doi/10.1177/1094342008099585</dc:identifier>
<dc:title><![CDATA[Thank You To Reviewers]]></dc:title>
<prism:number>1</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>3</prism:endingPage>
<prism:publicationDate>2009-02-01</prism:publicationDate>
<prism:startingPage>3</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/1/5?rss=1">
<title><![CDATA[The Problem With the Linpack Benchmark 1.0 Matrix Generator]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/1/5?rss=1</link>
<description><![CDATA[<p>We characterize the matrix sizes for which the Linpack Benchmark 1.0 matrix generator constructs a matrix with identical columns.</p>]]></description>
<dc:creator><![CDATA[Dongarra, J. J., Langou, J.]]></dc:creator>
<dc:date>Wed, 18 Feb 2009 07:55:27 PST</dc:date>
<dc:identifier>info:doi/10.1177/1094342008098683</dc:identifier>
<dc:title><![CDATA[The Problem With the Linpack Benchmark 1.0 Matrix Generator]]></dc:title>
<prism:number>1</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>13</prism:endingPage>
<prism:publicationDate>2009-02-01</prism:publicationDate>
<prism:startingPage>5</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/1/14?rss=1">
<title><![CDATA[Performance Modeling and Analysis of a Massively Parallel Direct--Part 1]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/1/14?rss=1</link>
<description><![CDATA[<p>Modeling and analysis techniques are used to investigate the performance of a massively parallel version of DIRECT, a global search algorithm widely used in multidisciplinary design optimization applications. Several high-dimensional benchmark functions and real world problems are used to test the design effectiveness under various problem structures. Theoretical and experimental results are compared for two parallel clusters with different system scales and network connectivities. The present work aims at studying the performance sensitivity to important parameters for problem configurations, parallel schemes, and system settings. The performance metrics include the memory usage, load balancing, parallel efficiency, and scalability. An analytical bounding model is constructed to measure the load balancing performance under different schemes. Additionally, linear regression models are used to characterize two major overhead sources, interprocessor communication and processor idleness, and also applied to the isoefficiency functions in scalability analysis. For a variety of high-dimensional problems and large-scale systems, the massively parallel design has achieved reasonable performance. The results of the performance study provide guidance for efficient problem and scheme configuration. More importantly, the generalized design considerations and analysis techniques are beneficial for transforming many global search algorithms into effective large-scale parallel optimization tools.</p>]]></description>
<dc:creator><![CDATA[Jian He,  , Verstak, A., Watson, L.T., Sosonkina, M.]]></dc:creator>
<dc:date>Wed, 18 Feb 2009 07:55:27 PST</dc:date>
<dc:identifier>info:doi/10.1177/1094342008098462</dc:identifier>
<dc:title><![CDATA[Performance Modeling and Analysis of a Massively Parallel Direct--Part 1]]></dc:title>
<prism:number>1</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>28</prism:endingPage>
<prism:publicationDate>2009-02-01</prism:publicationDate>
<prism:startingPage>14</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/1/29?rss=1">
<title><![CDATA[Performance Modeling and Analysis of a Massively Parallel Direct--Part 2]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/1/29?rss=1</link>
<description><![CDATA[<p>Modeling and analysis techniques are used to investigate the performance of a massively parallel version of DIRECT, a global search algorithm widely used in multidisciplinary design optimization applications. Several high-dimensional benchmark functions and real world problems are used to test the design effectiveness under various problem structures. In this second part of a two-part work, theoretical and experimental results are compared for two parallel clusters with different system scales and network connectivities. The first part studied performance sensitivity to important parameters for problem configurations and parallel schemes, using performance metrics such as memory usage, load balancing, and parallel efficiency. Here linear regression models are used to characterize two major overhead sources, interprocessor communication and processor idleness, and also applied to the isoefficiency functions in scalability analysis. For a variety of high-dimensional problems and large-scale systems, the massively parallel design has achieved reasonable performance. The results of the performance study provide guidance for efficient problem and scheme configuration. More importantly, the design considerations and analysis techniques generalize to the transformation of other global search algorithms into effective large-scale parallel optimization tools.</p>]]></description>
<dc:creator><![CDATA[Jian He,  , Verstak, A., Sosonkina, M., Watson, L.T.]]></dc:creator>
<dc:date>Wed, 18 Feb 2009 07:55:27 PST</dc:date>
<dc:identifier>info:doi/10.1177/1094342008098463</dc:identifier>
<dc:title><![CDATA[Performance Modeling and Analysis of a Massively Parallel Direct--Part 2]]></dc:title>
<prism:number>1</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>41</prism:endingPage>
<prism:publicationDate>2009-02-01</prism:publicationDate>
<prism:startingPage>29</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/1/42?rss=1">
<title><![CDATA[Opendda: a Novel High-Performance Computational Framework for the Discrete Dipole Approximation]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/1/42?rss=1</link>
<description><![CDATA[<p>This work presents a highly optimized computational framework for the Discrete Dipole Approximation, a numerical method for calculating the optical properties associated with a target of arbitrary geometry that is widely used in atmospheric, astrophysical and industrial simulations. Core optimizations include the bit-fielding of integer data and iterative methods that complement a new Discrete Fourier Transform (DFT) kernel, which efficiently calculates the matrix&mdash; vector products required by these iterative solution schemes. The new kernel performs the requisite 3-D DFTs as ensembles of 1-D transforms, and by doing so, is able to reduce the number of constituent 1-D transforms by 60% and the memory by over 80%. The optimizations also facilitate the use of parallel techniques to further enhance the performance. Complete OpenMP-based shared-memory and MPI-based distributed-memory implementations have been created to take full advantage of the various architectures. Several benchmarks of the new framework indicate extremely favorable performance and scalability.</p>]]></description>
<dc:creator><![CDATA[Donald, J. M., Golden, A., Jennings, S. G.]]></dc:creator>
<dc:date>Wed, 18 Feb 2009 07:55:27 PST</dc:date>
<dc:identifier>info:doi/10.1177/1094342008097914</dc:identifier>
<dc:title><![CDATA[Opendda: a Novel High-Performance Computational Framework for the Discrete Dipole Approximation]]></dc:title>
<prism:number>1</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>61</prism:endingPage>
<prism:publicationDate>2009-02-01</prism:publicationDate>
<prism:startingPage>42</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/1/62?rss=1">
<title><![CDATA[Optimization With High-Cost Objective Function Evaluations in a Computing Grid and an Application To Simulation-Based Design]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/1/62?rss=1</link>
<description><![CDATA[<p>The emerging grid computing technologies are aimed at the creation of virtual supercomputers to conduct huge scale scientific computations by harvesting computing resources on the Internet. This paper introduces a grid-enabled implementation of an optimization program for large-scale optimization problems requiring high-cost, black-box objective function evaluations. Adopting grid computing can be particularly beneficial for building surrogates such as response surfaces and carrying out large-scale optimizations using stochastic optimization algorithms. However, several problems have to be resolved for effective utilization of grid resources because of heterogeneity in computer capacity among grid resources and limited network conditions inherent in grid systems. This paper identifies some of the problems and introduces algorithms to effectively carry out large-scale optimizations on a grid. Specifically, asynchronous genetic and particle swarm optimization algorithms are developed for grid computing environments. The performance and characteristics of the grid-enabled implementations are assessed via extensive numerical tests. Finally, structural design based on high-fidelity simulations is carried out using the proposed algorithm in a computing grid system.</p>]]></description>
<dc:creator><![CDATA[Jin Woo Park,  , Si Hyong Park,  , Seung Jo Kim,  ]]></dc:creator>
<dc:date>Wed, 18 Feb 2009 07:55:27 PST</dc:date>
<dc:identifier>info:doi/10.1177/1094342008101234</dc:identifier>
<dc:title><![CDATA[Optimization With High-Cost Objective Function Evaluations in a Computing Grid and an Application To Simulation-Based Design]]></dc:title>
<prism:number>1</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>83</prism:endingPage>
<prism:publicationDate>2009-02-01</prism:publicationDate>
<prism:startingPage>62</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/1/84?rss=1">
<title><![CDATA[Dynamic Component Extension: a Strategy for Performance Improvement in Multicomponent Applications]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/1/84?rss=1</link>
<description><![CDATA[<p>Multicomponent application paradigms have gained prominence in many significant multidisciplinary scientific applications. In this work, we propose a software strategy called dynamic component extension for multicomponent applications to improve application performance by minimizing processor idling. In this strategy, the processor space of a component is dynamically extended to include the processors of other components during certain computationally intensive phases of the component. We demonstrate its use in improving the performance of one of the most prominent multicomponent applications, the community climate system model (CCSM). In this application, we dynamically extend the atmosphere component to minimize the idling in other components caused by large periodic temporal load imbalances in the atmosphere component. By means of experiments on different parallel platforms with different numbers of processors, we show that using our strategy can lead to about 15% reduction and savings of several days in execution times of CCSM for 1000-year simulation runs.</p>]]></description>
<dc:creator><![CDATA[Sivagama, S. M., Vadhiyar, S. S., Nanjundiah, R. S.]]></dc:creator>
<dc:date>Wed, 18 Feb 2009 07:55:27 PST</dc:date>
<dc:identifier>info:doi/10.1177/1094342008101364</dc:identifier>
<dc:title><![CDATA[Dynamic Component Extension: a Strategy for Performance Improvement in Multicomponent Applications]]></dc:title>
<prism:number>1</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>98</prism:endingPage>
<prism:publicationDate>2009-02-01</prism:publicationDate>
<prism:startingPage>84</prism:startingPage>
<prism:section>Article</prism:section>
</item>

<item rdf:about="http://hpc.sagepub.com/cgi/content/abstract/23/1/99?rss=1">
<title><![CDATA[How to Balance the Load on Heterogeneous Clusters]]></title>
<link>http://hpc.sagepub.com/cgi/content/abstract/23/1/99?rss=1</link>
<description><![CDATA[<p>The problem of computing a large set of different tasks on a set of heterogeneous resources connected by a network is very common nowadays in very different environments and load balancing is indispensable for achieving high performance and high throughput in systems such as clusters. Cluster heterogeneity increases the difficulty of balancing the load across the system nodes and, although the relationship between heterogeneity and load balancing is difficult to describe analytically, in this paper different models and performance metrics are proposed to describe heterogeneous cluster behavior and to perform an exhaustive analysis of the effects of heterogeneity on load balancing algorithm performance. This analysis allows us to propose efficient solutions capable of dealing with heterogeneity for all the load balancing algorithm stages. Furthermore, a load balancing algorithm has been implemented following these solutions to demonstrate, with experimental results, its efficiency on real heterogeneous clusters.</p>]]></description>
<dc:creator><![CDATA[Beltran, M., Guzman, A.]]></dc:creator>
<dc:date>Wed, 18 Feb 2009 07:55:27 PST</dc:date>
<dc:identifier>info:doi/10.1177/1094342008101834</dc:identifier>
<dc:title><![CDATA[How to Balance the Load on Heterogeneous Clusters]]></dc:title>
<prism:number>1</prism:number>
<prism:volume>23</prism:volume>
<prism:endingPage>118</prism:endingPage>
<prism:publicationDate>2009-02-01</prism:publicationDate>
<prism:startingPage>99</prism:startingPage>
<prism:section>Article</prism:section>
</item>

</rdf:RDF>