shuaijiang committed on
Commit
6667ab2
·
1 Parent(s): 37ca002
index.html CHANGED
@@ -33,7 +33,7 @@
33
  <div class="container is-max-desktop">
34
  <div class="columns is-centered">
35
  <div class="column has-text-centered">
36
- <h1 class="title is-1 publication-title">KE-Omni: A Seamless Speech Language Model with 60,000+ Hours Synthesized Chinese and English Speech Dialogues</h1>
37
  <div class="is-size-5 publication-authors">
38
  <span class="author-block">
39
  Shuaijiang Zhao,
@@ -106,7 +106,7 @@
106
  </span>
107
  <!-- Dataset Link. -->
108
  <span class="link-block">
109
- <a href="https://huggingface.co/datasets/AM-Team/KESpeechChat" target="_blank"
110
  class="external-link button is-normal is-rounded is-dark">
111
  <span class="icon">
112
  <i class="far fa-images"></i>
@@ -152,7 +152,7 @@
152
  <div class="columns is-centered">
153
  <div class="column">
154
  <div class="content dialogue-block" style="display: flex; flex-direction: column; justify-content: space-between; height: 100%;">
155
- <img src="./static/images/model.jpg" alt="am-omni architecture">
156
  </div>
157
  </div>
158
  </div>
@@ -169,7 +169,7 @@
169
  </div>
170
  </div>
171
 
172
- <h2 class="title is-2 has-text-centered">KE-SpeechChat Dataset Details</h2>
173
  <div class="columns is-centered">
174
  <!-- Left image -->
175
  <div class="column is-half">
@@ -192,7 +192,7 @@
192
 
193
  <section class="section">
194
  <div class="container is-max-desktop">
195
- <h2 class="title is-2 has-text-centered" >KESpeechChat Dialogue Demos</h2>
196
  <h2 class="title is-3 has-text-centered" >Chinese Dialogues</h2>
197
  <div class="columns is-centered">
198
  <div class="column">
@@ -412,7 +412,7 @@
412
  <h2 class="title">BibTeX</h2>
413
  <pre><code>@article{zhao2024keomni,
414
  author = {Zhao, Shuaijiang and Guo, Tingwei and Xiang, Bajian and Wan, Tongtang and Niu, Qiang and Zou, Wei and Li, Xiangang},
415
- title = {KE-Omni: A Seamless Speech Language Model with 60,000+ Hours Synthesized Chinese and English Speech Dialogues},
416
  year = {2024},
417
  }</code></pre>
418
  </div>
@@ -423,7 +423,7 @@
423
  <div class="container">
424
  <div class="content has-text-centered">
425
  <a class="icon-link" target="_blank"
426
- href="./static/am_omni.pdf">
427
  <i class="fas fa-file-pdf"></i>
428
  </a>
429
  <a class="icon-link" href="https://github.com/LianjiaTech/BELLE" target="_blank" class="external-link" disabled>
 
33
  <div class="container is-max-desktop">
34
  <div class="columns is-centered">
35
  <div class="column has-text-centered">
36
+ <h1 class="title is-1 publication-title">Advancing Speech Language Models by Scaling Supervised Fine-Tuning with Over 60,000 Hours of Synthetic Speech Dialogue Data</h1>
37
  <div class="is-size-5 publication-authors">
38
  <span class="author-block">
39
  Shuaijiang Zhao,
 
106
  </span>
107
  <!-- Dataset Link. -->
108
  <span class="link-block">
109
+ <a href="https://huggingface.co/datasets/KE-Team/Ke-SpeechChat" target="_blank"
110
  class="external-link button is-normal is-rounded is-dark">
111
  <span class="icon">
112
  <i class="far fa-images"></i>
 
152
  <div class="columns is-centered">
153
  <div class="column">
154
  <div class="content dialogue-block" style="display: flex; flex-direction: column; justify-content: space-between; height: 100%;">
155
+ <img src="./static/images/model.png" alt="am-omni architecture">
156
  </div>
157
  </div>
158
  </div>
 
169
  </div>
170
  </div>
171
 
172
+ <h2 class="title is-2 has-text-centered">Ke-SpeechChat Dataset Details</h2>
173
  <div class="columns is-centered">
174
  <!-- Left image -->
175
  <div class="column is-half">
 
192
 
193
  <section class="section">
194
  <div class="container is-max-desktop">
195
+ <h2 class="title is-2 has-text-centered" >Ke-SpeechChat Dialogue Demos</h2>
196
  <h2 class="title is-3 has-text-centered" >Chinese Dialogues</h2>
197
  <div class="columns is-centered">
198
  <div class="column">
 
412
  <h2 class="title">BibTeX</h2>
413
  <pre><code>@article{zhao2024keomni,
414
  author = {Zhao, Shuaijiang and Guo, Tingwei and Xiang, Bajian and Wan, Tongtang and Niu, Qiang and Zou, Wei and Li, Xiangang},
415
+ title = {Advancing Speech Language Models by Scaling Supervised Fine-Tuning with Over 60,000 Hours of Synthetic Speech Dialogue Data},
416
  year = {2024},
417
  }</code></pre>
418
  </div>
 
423
  <div class="container">
424
  <div class="content has-text-centered">
425
  <a class="icon-link" target="_blank"
426
+ href="./static/KE_Omni.pdf">
427
  <i class="fas fa-file-pdf"></i>
428
  </a>
429
  <a class="icon-link" href="https://github.com/LianjiaTech/BELLE" target="_blank" class="external-link" disabled>
static/KE_Omni.pdf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e54bf3b22998263825af29eefb0d16ebe9db3d818abb7723c5fc47a9bbcbdb8b
3
- size 1824220
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:417655c3417fc8050727236a26f0ba78914d785b72ab6b2c43e8fa243c089f8f
3
+ size 1942368
static/images/am_speech.png CHANGED

Git LFS Details

  • SHA256: ad7d6f09cc77afe84403672eaaed0ad7f9a68fff083bda2344c26415243f4af4
  • Pointer size: 130 Bytes
  • Size of remote file: 67.8 kB

Git LFS Details

  • SHA256: b677736cbc66bf0ed5e371f07ef1bc63582e81f774ab94d2d2fd56cb49b8a9e9
  • Pointer size: 131 Bytes
  • Size of remote file: 108 kB
static/images/interpolate_end.jpg DELETED
Binary file (113 kB)
 
static/images/interpolate_start.jpg DELETED
Binary file (117 kB)
 
static/images/model.png ADDED

Git LFS Details

  • SHA256: c64928a7802e281ce601aeabb21f2d0ab695d9bf172226137cf840e75ade58f7
  • Pointer size: 131 Bytes
  • Size of remote file: 407 kB
static/images/{model.jpg → model_old.jpg} RENAMED
File without changes
static/images/subset.png CHANGED

Git LFS Details

  • SHA256: 4e958e802a6ddde79923993cfce9af288c7174c7546481e9483e09d1a42e80d4
  • Pointer size: 130 Bytes
  • Size of remote file: 57.2 kB

Git LFS Details

  • SHA256: 4bc773c9df32e88de01288f3e7e4cedf85554f97a2408158b387b6a0d20e3a03
  • Pointer size: 130 Bytes
  • Size of remote file: 88.2 kB