|
| 1 | +--- |
| 2 | +layout: page |
| 3 | +title: ELANA |
| 4 | +full_title: "ELANA: A Simple Energy and Latency Analyzer for LLMs" |
| 5 | +authors: Hung-Yueh Chiang, Bokun Wang, Diana Marculescu |
| 6 | +description: "Energy and Latency Analyzer for LLMs" |
| 7 | +img: assets/img/publication_preview/elana.png |
| 8 | +importance: 2 |
| 9 | +category: research |
| 10 | +--- |
| 11 | + |
| 12 | +<style> |
| 13 | +li { |
| 14 | + font-size: 1.1rem; /* Adjust as needed */ |
| 15 | +} |
| 16 | +</style> |
| 17 | + |
| 18 | +<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css"> |
| 19 | + |
| 20 | +<div style="text-align: center; padding-bottom: 1rem;"> |
| 21 | +<!-- <abbr class="badge" style="background-color:#00369f; margin-left:0.1rem; margin-right:0.1rem; font-size:1.1rem;">Arxiv</abbr> --> |
| 22 | +<abbr class="badge" style="background-color:#BF5700; margin-left:0.1rem; margin-right:0.1rem; font-size:1.1rem; width:80px; display:inline-block; text-align:center;">Arxiv</abbr> |
| 23 | +</div> |
| 24 | + |
| 25 | +<div class="authors"> |
| 26 | + <a href="https://hychiang.info">Hung-Yueh Chiang</a>, |
| 27 | + <a href="https://bokun-wang.github.io">Bokun Wang</a>, |
| 28 | + <a href="https://users.ece.utexas.edu/~dianam/">Diana Marculescu</a> |
| 29 | +</div> |
| 30 | +<div class="authors"> |
| 31 | + The University of Texas at Austin |
| 32 | +</div> |
| 33 | +<div style="text-align: center; margin-top:12px;"> |
| 34 | + <a href="https://arxiv.org/pdf/2512.09946"><i class="fa fa-file-pdf-o" style="font-size:24px;"></i><b> Report </b></a> |
| 35 | + <a href="https://github.com/enyac-group/Elana/"><i class="fa fa-github" style="font-size:24px;"></i><b> Code </b></a> |
| 36 | +</div> |
| 37 | + |
| 38 | + |
| 39 | +<br> |
| 40 | +<div style="text-align: center;"> |
| 41 | +<p style="font-family: Comic Neue; font-size: 1.4rem;"> |
| 42 | + 🤗 Supports models on Hugging Face, including Transformers, SSMs, and hybrid models <br> |
| 43 | + 🔧 Supports energy, latency, model size, and KV cache size profiling <br> |
| 44 | + 🔍 Supports detailed kernel latency profiling <br> |
| 45 | +</p> |
| 46 | +</div> |
| 47 | +<div class="row mt-3"> |
| 48 | + <div class="col-sm-10 mt-3 mt-md-0 offset-1"> |
| 49 | + {% include figure.html path="assets/img/projects/elana/elana.png" title="elana logo" class="img-fluid rounded z-depth-1" %} |
| 50 | + </div> |
| 51 | +</div> |
| 52 | +<br> |
| 53 | + |
| 54 | +# Comparison with the Zeus profiling framework |
| 55 | +<div class="row"> |
| 56 | + <div class="col-sm-10 mt-3 mt-md-0 offset-1"> |
| 57 | + {% include gif.html path="assets/img/projects/elana/compare.png" title="compare" class="img-fluid rounded z-depth-1" %} |
| 58 | + </div> |
| 59 | +</div> |
| 60 | +<br> |
| 61 | + |
| 62 | +# Hugging Face interface |
| 63 | +<div class="row mt-3"> |
| 64 | + <div class="col-sm-10 mt-3 mt-md-0 offset-1"> |
| 65 | + {% include figure.html path="assets/img/projects/elana/hf_interface.png" title="hf interface" class="img-fluid rounded z-depth-1" %} |
| 66 | + </div> |
| 67 | +</div> |
| 68 | +<br> |
| 69 | + |
| 70 | +# Profile model size |
| 71 | +<div class="row mt-3"> |
| 72 | + <div class="col-sm-10 mt-3 mt-md-0 offset-1"> |
| 73 | + {% include figure.html path="assets/img/projects/elana/model_size.png" title="model size" class="img-fluid rounded z-depth-1" %} |
| 74 | + </div> |
| 75 | +</div> |
| 76 | +<br> |
| 77 | + |
| 78 | + |
| 79 | + |
| 80 | +# Profiling results |
| 81 | +### Profile models on A6000 |
| 82 | +<div class="row mt-4"> |
| 83 | + <div class="col-sm-10 mt-4 mt-md-0 offset-1"> |
| 84 | + {% include figure.html path="assets/img/projects/elana/A6000.png" title="A6000 results" class="img-fluid rounded z-depth-1" %} |
| 85 | + </div> |
| 86 | +</div> |
| 87 | +<br> |
| 88 | + |
| 89 | +### Profile models on Jetson series |
| 90 | +<div class="row mt-4"> |
| 91 | + <div class="col-sm-10 mt-4 mt-md-0 offset-1"> |
| 92 | + {% include figure.html path="assets/img/projects/elana/jetson.png" title="jetson results" class="img-fluid rounded z-depth-1" %} |
| 93 | + </div> |
| 94 | +</div> |
| 95 | +<br> |
| 96 | + |
| 97 | + |
| 98 | +# Profiling kernels |
| 99 | +We use the PyTorch profiler to generate a JSON trace file and visualize it with [Perfetto](https://ui.perfetto.dev/). |
| 100 | +<div class="row mt-4"> |
| 101 | + <div class="col-sm-10 mt-4 mt-md-0 offset-1"> |
| 102 | + {% include figure.html path="assets/img/projects/elana/perfetto_kernel.png" title="kernel results" class="img-fluid rounded z-depth-1" %} |
| 103 | + </div> |
| 104 | +</div> |
| 105 | +<br> |
| 106 | + |
| 107 | + |
| 108 | +# Citation |
| 109 | +{% raw %} |
| 110 | +```latex |
| 111 | +@article{chiang2025elana, |
| 112 | + title = {ELANA: A Simple Energy and Latency Analyzer for LLMs}, |
| 113 | + author = {Chiang, Hung-Yueh and Wang, Bokun and Marculescu, Diana}, |
| 114 | + journal = {arXiv preprint arXiv:2512.09946}, |
| 115 | + year = {2025}, |
| 116 | +} |
| 117 | +``` |
| 118 | +{% endraw %} |
| 119 | + |
| 120 | +<br> |
| 121 | +# Acknowledgements |
| 122 | +This work was supported in part by the ONR Minerva program, NSF CCF Grant No. 2107085, iMAGiNE - the Intelligent Machine Engineering Consortium at UT Austin, and UT Cockrell School of Engineering Doctoral Fellowships. |
0 commit comments