Skip to content

Commit

Permalink
deploy: e8b198d
Browse files Browse the repository at this point in the history
  • Loading branch information
RaymondWang0 committed Oct 23, 2023
1 parent 0e74008 commit c7457d1
Show file tree
Hide file tree
Showing 10 changed files with 21 additions and 21 deletions.
Binary file added coding_demo_gpu.gif
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file added coding_demo_m1.gif
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
10 changes: 5 additions & 5 deletions index.html
Original file line number Diff line number Diff line change
Expand Up @@ -79,11 +79,11 @@ <h1><a class="anchor" id="autotoc_md0"></a>
<p>This is enabled by LLM model compression technique: <a href="https://github.com/mit-han-lab/smoothquant">SmoothQuant</a> and <a href="https://github.com/mit-han-lab/llm-awq">AWQ (Activation-aware Weight Quantization)</a>, co-designed with TinyChatEngine that implements the compressed low-precision model.</p>
<h3><a class="anchor" id="autotoc_md1"></a>
Demo on an NVIDIA GeForce RTX 4070 laptop:</h3>
<p><img src="chat_demo_gpu.gif" alt="" class="inline" title="chat_demo_gpu"/> </p>
<h3><a class="anchor" id="autotoc_md2"></a>
Demo on an Apple MacBook Air (M1, 2020):</h3>
<p><img src="chat_demo_m1.gif" alt="" class="inline" title="chat_demo_m1"/> </p>
<p>Feel free to check out our <a href="assets/slides.pdf">slides</a> for more details!</p>
<p><img src="assets/figures/chat_demo_gpu.gif" alt="chat_demo_gpu" width="49%" class="inline"/> <img src="assets/figures/coding_demo_gpu.gif" alt="coding_demo_gpu" width="49%" class="inline"/> </p><div class="fragment"><div class="line">LLaMA Chat Code LLaMA</div>
</div><!-- fragment --><h3><a class="anchor" id="autotoc_md2"></a>
Demo on an Apple MacBook Pro (M1, 2021):</h3>
<p><img src="assets/figures/chat_demo_m1.gif" alt="chat_demo_m1" width="49%" class="inline"/> <img src="assets/figures/coding_demo_m1.gif" alt="coding_demo_m1" width="49%" class="inline"/> </p><div class="fragment"><div class="line">LLaMA Chat Code LLaMA</div>
</div><!-- fragment --><p>Feel free to check out our <a href="assets/slides.pdf">slides</a> for more details!</p>
<h2><a class="anchor" id="autotoc_md3"></a>
Overview</h2>
<h3><a class="anchor" id="autotoc_md4"></a>
Expand Down
2 changes: 1 addition & 1 deletion search/all_0.js
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
var searchData=
[
['2020_20_3a_0',['Demo on an Apple MacBook Air (M1, 2020):',['../index.html#autotoc_md2',1,'']]]
['2021_20_3a_0',['Demo on an Apple MacBook Pro (M1, 2021):',['../index.html#autotoc_md2',1,'']]]
];
2 changes: 1 addition & 1 deletion search/all_10.js
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
var searchData=
[
['on_20an_20apple_20macbook_20air_20m1_202020_20_3a_0',['Demo on an Apple MacBook Air (M1, 2020):',['../index.html#autotoc_md2',1,'']]],
['on_20an_20apple_20macbook_20pro_20m1_202021_20_3a_0',['Demo on an Apple MacBook Pro (M1, 2021):',['../index.html#autotoc_md2',1,'']]],
['on_20an_20nvidia_20geforce_20rtx_204070_20laptop_3a_1',['Demo on an NVIDIA GeForce RTX 4070 laptop:',['../index.html#autotoc_md1',1,'']]],
['on_20device_20llm_20inference_20library_2',['TinyChatEngine: On-Device LLM Inference Library',['../index.html#autotoc_md0',1,'']]],
['opt_5fparams_3',['opt_params',['../structopt__params.html',1,'']]],
Expand Down
5 changes: 3 additions & 2 deletions search/all_11.js
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@ var searchData=
['pack_5fq8_5ftensor_1',['pack_q8_tensor',['../structpack__q8__tensor.html',1,'']]],
['pair_5fhash_2',['pair_hash',['../structpair__hash.html',1,'']]],
['prerequisites_3',['Prerequisites',['../index.html#autotoc_md7',1,'']]],
['profiler_4',['Profiler',['../classProfiler.html',1,'']]],
['projects_5',['Related Projects',['../index.html#autotoc_md18',1,'']]]
['pro_20m1_202021_20_3a_4',['Demo on an Apple MacBook Pro (M1, 2021):',['../index.html#autotoc_md2',1,'']]],
['profiler_5',['Profiler',['../classProfiler.html',1,'']]],
['projects_6',['Related Projects',['../index.html#autotoc_md18',1,'']]]
];
2 changes: 1 addition & 1 deletion search/all_3.js
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
var searchData=
[
['_3a_0',['Demo on an Apple MacBook Air (M1, 2020):',['../index.html#autotoc_md2',1,'']]]
['_3a_0',['Demo on an Apple MacBook Pro (M1, 2021):',['../index.html#autotoc_md2',1,'']]]
];
15 changes: 7 additions & 8 deletions search/all_4.js
Original file line number Diff line number Diff line change
Expand Up @@ -3,12 +3,11 @@ var searchData=
['a_20href_20https_3a_20youtu_20be_20bw5dm3awmna_20si_20ccvzdmq3hwoweqcc_20demo_20a_0',['Voice Chatbot &lt;a href=&quot;https://youtu.be/Bw5Dm3aWMnA?si=CCvZDmq3HwowEQcC&quot; &gt;[Demo]&lt;/a&gt;',['../index.html#autotoc_md17',1,'']]],
['a8w4_5fthread_5fargs_1',['a8w4_thread_args',['../structa8w4__thread__args.html',1,'']]],
['acknowledgement_2',['Acknowledgement',['../index.html#autotoc_md19',1,'']]],
['air_20m1_202020_20_3a_3',['Demo on an Apple MacBook Air (M1, 2020):',['../index.html#autotoc_md2',1,'']]],
['an_20apple_20macbook_20air_20m1_202020_20_3a_4',['Demo on an Apple MacBook Air (M1, 2020):',['../index.html#autotoc_md2',1,'']]],
['an_20nvidia_20geforce_20rtx_204070_20laptop_3a_5',['Demo on an NVIDIA GeForce RTX 4070 laptop:',['../index.html#autotoc_md1',1,'']]],
['and_20awq_6',['LLM Compression: SmoothQuant and AWQ',['../index.html#autotoc_md4',1,'']]],
['and_20deploy_20models_20from_20our_20model_20zoo_7',['Download and Deploy Models from our Model Zoo',['../index.html#autotoc_md15',1,'']]],
['and_20model_20support_8',['Quantization and Model Support',['../index.html#autotoc_md13',1,'']]],
['apple_20macbook_20air_20m1_202020_20_3a_9',['Demo on an Apple MacBook Air (M1, 2020):',['../index.html#autotoc_md2',1,'']]],
['awq_10',['LLM Compression: SmoothQuant and AWQ',['../index.html#autotoc_md4',1,'']]]
['an_20apple_20macbook_20pro_20m1_202021_20_3a_3',['Demo on an Apple MacBook Pro (M1, 2021):',['../index.html#autotoc_md2',1,'']]],
['an_20nvidia_20geforce_20rtx_204070_20laptop_3a_4',['Demo on an NVIDIA GeForce RTX 4070 laptop:',['../index.html#autotoc_md1',1,'']]],
['and_20awq_5',['LLM Compression: SmoothQuant and AWQ',['../index.html#autotoc_md4',1,'']]],
['and_20deploy_20models_20from_20our_20model_20zoo_6',['Download and Deploy Models from our Model Zoo',['../index.html#autotoc_md15',1,'']]],
['and_20model_20support_7',['Quantization and Model Support',['../index.html#autotoc_md13',1,'']]],
['apple_20macbook_20pro_20m1_202021_20_3a_8',['Demo on an Apple MacBook Pro (M1, 2021):',['../index.html#autotoc_md2',1,'']]],
['awq_9',['LLM Compression: SmoothQuant and AWQ',['../index.html#autotoc_md4',1,'']]]
];
2 changes: 1 addition & 1 deletion search/all_7.js
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
var searchData=
[
['demo_20a_0',['Voice Chatbot &lt;a href=&quot;https://youtu.be/Bw5Dm3aWMnA?si=CCvZDmq3HwowEQcC&quot; &gt;[Demo]&lt;/a&gt;',['../index.html#autotoc_md17',1,'']]],
['demo_20on_20an_20apple_20macbook_20air_20m1_202020_20_3a_1',['Demo on an Apple MacBook Air (M1, 2020):',['../index.html#autotoc_md2',1,'']]],
['demo_20on_20an_20apple_20macbook_20pro_20m1_202021_20_3a_1',['Demo on an Apple MacBook Pro (M1, 2021):',['../index.html#autotoc_md2',1,'']]],
['demo_20on_20an_20nvidia_20geforce_20rtx_204070_20laptop_3a_2',['Demo on an NVIDIA GeForce RTX 4070 laptop:',['../index.html#autotoc_md1',1,'']]],
['deploy_20llama2_207b_20chat_20with_20tinychatengine_3',['Step-by-step to Deploy LLaMA2-7B-chat with TinyChatEngine',['../index.html#autotoc_md11',1,'']]],
['deploy_20models_20from_20our_20model_20zoo_4',['Download and Deploy Models from our Model Zoo',['../index.html#autotoc_md15',1,'']]],
Expand Down
4 changes: 2 additions & 2 deletions search/all_e.js
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
var searchData=
[
['m1_202020_20_3a_0',['Demo on an Apple MacBook Air (M1, 2020):',['../index.html#autotoc_md2',1,'']]],
['macbook_20air_20m1_202020_20_3a_1',['Demo on an Apple MacBook Air (M1, 2020):',['../index.html#autotoc_md2',1,'']]],
['m1_202021_20_3a_0',['Demo on an Apple MacBook Pro (M1, 2021):',['../index.html#autotoc_md2',1,'']]],
['macbook_20pro_20m1_202021_20_3a_1',['Demo on an Apple MacBook Pro (M1, 2021):',['../index.html#autotoc_md2',1,'']]],
['macos_2',['MacOS',['../index.html#autotoc_md8',1,'']]],
['matmul_5fparams_3',['matmul_params',['../structmatmul__params.html',1,'']]],
['matmuloperator_4',['MatmulOperator',['../classmatmul_1_1MatmulOperator.html',1,'matmul']]],
Expand Down

0 comments on commit c7457d1

Please sign in to comment.