Update README.md
Browse files
README.md
CHANGED
@@ -15,8 +15,12 @@ tags:
|
|
15 |
- custom_code
|
16 |
- audio
|
17 |
- speech
|
|
|
|
|
|
|
18 |
- asr
|
19 |
- tts
|
|
|
20 |
---
|
21 |
|
22 |
<h1>A GPT-4o Level MLLM for Vision, Speech and Multimodal Live Streaming on Your Phone</h1>
|
@@ -1390,4 +1394,4 @@ If you find our work helpful, please consider citing our papers 📝 and liking
|
|
1390 |
journal={arXiv preprint arXiv:2408.01800},
|
1391 |
year={2024}
|
1392 |
}
|
1393 |
-
```
|
|
|
15 |
- custom_code
|
16 |
- audio
|
17 |
- speech
|
18 |
+
- voice cloning
|
19 |
+
- live streaming
|
20 |
+
- realtime speech conversation
|
21 |
- asr
|
22 |
- tts
|
23 |
+
license: apache-2.0
|
24 |
---
|
25 |
|
26 |
<h1>A GPT-4o Level MLLM for Vision, Speech and Multimodal Live Streaming on Your Phone</h1>
|
|
|
1394 |
journal={arXiv preprint arXiv:2408.01800},
|
1395 |
year={2024}
|
1396 |
}
|
1397 |
+
```
|