Nessuna descrizione

literature_review.bib 6.0KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144
  1. @article{goto_2008,
  2. author = {Goto, Kazushige and Geijn, Robert A. van de},
  3. title = {Anatomy of High-performance Matrix Multiplication},
  4. journal = {ACM Trans. Math. Softw.},
  5. issue_date = {May 2008},
  6. volume = {34},
  7. number = {3},
  8. month = may,
  9. year = {2008},
  10. issn = {0098-3500},
  11. pages = {12:1--12:25},
  12. articleno = {12},
  13. numpages = {25},
  14. url = {http://doi.acm.org/10.1145/1356052.1356053},
  15. doi = {10.1145/1356052.1356053},
  16. acmid = {1356053},
  17. publisher = {ACM},
  18. address = {New York, NY, USA},
  19. keywords = {Linear algebra, basic linear algebra subprogrms, matrix multiplication},
  20. }
  21. @Inbook{sweetman_2007,
  22. edition={2},
  23. title={See MIPS Run: Linux; Second Edition},
  24. publisher={Morgan Kaufmann Publishers},
  25. author={Sweetman, Dominic},
  26. year={2007},
  27. pages={81}
  28. }
  29. @article{paikaray_2013,
  30. author = {Bijay Paikaray},
  31. title = {Relative Performance of a Multi-level Cache with Last-Level Cache
  32. Replacement: An Analytic Review},
  33. journal = {CoRR},
  34. volume = {abs/1307.6406},
  35. year = {2013},
  36. url = {http://arxiv.org/abs/1307.6406},
  37. archivePrefix = {arXiv},
  38. eprint = {1307.6406},
  39. timestamp = {Wed, 07 Jun 2017 14:40:21 +0200},
  40. biburl = {http://dblp.org/rec/bib/journals/corr/Paikaray13},
  41. bibsource = {dblp computer science bibliography, http://dblp.org}
  42. }
  43. @Inbook{weidendorfer_2004,
  44. author="Weidendorfer, Josef
  45. and Kowarschik, Markus
  46. and Trinitis, Carsten",
  47. editor="Bubak, Marian
  48. and van Albada, Geert Dick
  49. and Sloot, Peter M. A.
  50. and Dongarra, Jack",
  51. title="A Tool Suite for Simulation Based Analysis of Memory Access Behavior",
  52. bookTitle="Computational Science - ICCS 2004: 4th International Conference, Krak{\'o}w, Poland, June 6-9, 2004, Proceedings, Part III",
  53. year="2004",
  54. publisher="Springer Berlin Heidelberg",
  55. address="Berlin, Heidelberg",
  56. pages="440--447",
  57. abstract="In this paper, two tools are presented: an execution driven cache simulator which relates event metrics to a dynamically built-up call-graph, and a graphical front end able to visualize the generated data in various ways. To get a general purpose, easy-to-use tool suite, the simulation approach allows us to take advantage of runtime instrumentation, i.e. no preparation of application code is needed, and enables for sophisticated preprocessing of the data already in the simulation phase. In an ongoing project, research on advanced cache analysis is based on these tools. Taking a multigrid solver as an example, we present the results obtained from the cache simulation together with real data measured by hardware performance counters.",
  58. isbn="978-3-540-24688-6",
  59. doi="10.1007/978-3-540-24688-6_58",
  60. url="https://doi.org/10.1007/978-3-540-24688-6_58"
  61. }
  62. @article{nethercote_2004,
  63. author = {Nethercote, Nicholas},
  64. year = {2004},
  65. month = {01},
  66. title = {Dynamic Binary Analysis and Instrumentation}
  67. }
  68. @article{kaparelos_2014,
  69. month = {June},
  70. author = {Stavros Kaparelos},
  71. series = {Department of Computer Science Technical Report Series},
  72. note = {Undergraduate dissertation supervised by Professor James Davenport},
  73. title = {Extending Cachegrind: L2 cache inclusion and TLB measuring},
  74. publisher = {Department of Computer Science, University of Bath},
  75. year = {2014},
  76. keywords = {computer performance,cache utilization,tlb},
  77. url = {http://opus.bath.ac.uk/39762/},
  78. abstract = {Programmers need to develop hardware conscious software in order to optimise efficiency and increase execution speed. To do that, they need tools that can provide such kind of information. Cachegrind is such a tool. It is a cache profiling tool that provides statistics for level 1 and the last level caches. This project extended Cachegrind, firstly, to include information for L2 cache when 3 levels of cache are present and, secondly, to measure the Translation Lookaside Buer (TLB). L2 cache inclusion presents the same information as presented in the other cache levels, while measuring the TLB provides a) the number of hits and misses, b) the pages used and the times used and c) per file, per function and, per source code line statistics. Any extension is developed to work in an Intel x86 architecture. Finally, extensions have been tested and results have been checked to be logical, as well as to be along the lines of the expected ones.}
  79. }
  80. @misc{forum_2017,
  81. title={AMD Discloses New Technologies At Microprocessor Forum},
  82. howpublished={\url{https://web.archive.org/web/20120308030806/http://www.amd.com/us/press-releases/Pages/Press_Release_751.aspx}},
  83. year={2017},
  84. note={[Online; accessed 20-November-2017]}
  85. }
  86. @misc{isambard_2017,
  87. title={GW4 joins industry partners to develop ‘first of its kind’ supercomputer},
  88. howpublished={\url{http://gw4.ac.uk/news/gw4-joins-industry-partners-develop-first-kind-supercomputer/}},
  89. year={2017},
  90. note={[Online; accessed 20-November-2017]}
  91. }
  92. @book{hennessy_2011,
  93. title={Computer Organization and Design, Revised Fourth Edition},
  94. publisher={Morgan Kaufmann},
  95. author={Hennessy, John L},
  96. year={2011},
  97. pages={456}
  98. }
  99. @inproceedings{gaur_2011,
  100. author = {Gaur, Jayesh and Chaudhuri, Mainak and Subramoney, Sreenivas},
  101. title = {Bypass and Insertion Algorithms for Exclusive Last-level Caches},
  102. booktitle = {Proceedings of the 38th Annual International Symposium on Computer Architecture},
  103. series = {ISCA '11},
  104. year = {2011},
  105. isbn = {978-1-4503-0472-6},
  106. location = {San Jose, California, USA},
  107. pages = {81--92},
  108. numpages = {12},
  109. url = {http://doi.acm.org/10.1145/2000064.2000075},
  110. doi = {10.1145/2000064.2000075},
  111. acmid = {2000075},
  112. publisher = {ACM},
  113. address = {New York, NY, USA},
  114. keywords = {bypass policy, exclusive last-level cache, insertion policy},
  115. }
  116. @article{smith_1982,
  117. author = {Smith, Alan Jay},
  118. title = {Cache Memories},
  119. journal = {ACM Comput. Surv.},
  120. issue_date = {Sept. 1982},
  121. volume = {14},
  122. number = {3},
  123. month = sep,
  124. year = {1982},
  125. issn = {0360-0300},
  126. pages = {473--530},
  127. numpages = {58},
  128. url = {http://doi.acm.org/10.1145/356887.356892},
  129. doi = {10.1145/356887.356892},
  130. acmid = {356892},
  131. publisher = {ACM},
  132. address = {New York, NY, USA},
  133. }