generated from alshedivat/al-folio
-
Notifications
You must be signed in to change notification settings - Fork 0
/
papers.bib
57 lines (48 loc) · 2.27 KB
/
papers.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
% EnCLAP++ paper from the DCASE2024 Workshop; flagged as a selected publication.
% Custom fields (selected, preview, html) are not standard BibTeX fields;
% presumably consumed by the site template - verify against the theme.
@inproceedings{enclap++,
  title     = {EnCLAP++: Analyzing the EnCLAP Framework for Optimizing Automated Audio Captioning Performance},
  author    = {Kim, Jaeyeon and Jeon, Minjeong and Jung, Jaeyoon and Woo, Sang Hoon and Lee, Jinjoo},
  booktitle = {DCASE2024 Workshop},
  year      = {2024},
  selected  = {true},
  preview   = {enclap++.png},
  html      = {https://dcase.community/documents/workshop2024/proceedings/DCASE2024Workshop_Kim_70.pdf}
}
% DCASE2024 Challenge technical report on extending EnCLAP with a retrieval model.
% NOTE(review): a technical report would normally use the techreport entry type
% with an institution field; the article type and journal field are kept here
% because the rendering template may depend on them - confirm before changing.
@article{dcase_technical,
  title   = {Expanding on EnCLAP with Auxiliary Retrieval Model for Automated Audio Captioning},
  author  = {Kim, Jaeyeon and Jung, Jaeyoon and Jeon, Minjeong and Woo, Sang Hoon and Lee, Jinjoo},
  journal = {DCASE2024 Challenge Technical Report},
  year    = {2024},
  html    = {https://dcase.community/documents/challenge2024/technical_reports/DCASE2024_Kim_108_t6.pdf}
}
% ICASSP 2024 paper on learning semantic information from raw audio;
% flagged as a selected publication. The doi field holds the bare DOI and
% the html field holds the IEEE Xplore landing page.
@inproceedings{learning_semantic,
  author    = {Kim, Jaeyeon and Hwang, Injune and Lee, Kyogu},
  booktitle = {ICASSP},
  title     = {Learning Semantic Information from Raw Audio Signal Using Both Contextual and Phonetic Representations},
  year      = {2024},
  doi       = {10.1109/ICASSP48485.2024.10445745},
  selected  = {true},
  preview   = {learning_semantic.png},
  html      = {https://ieeexplore.ieee.org/document/10445745}
}
% ICASSP 2024 paper introducing EnCLAP; flagged as a selected publication.
% The code field points at the accompanying GitHub repository.
@inproceedings{enclap,
  author    = {Kim, Jaeyeon and Jung, Jaeyoon and Lee, Jinjoo and Woo, Sang Hoon},
  booktitle = {ICASSP},
  title     = {EnCLAP: Combining Neural Audio Codec and Audio-Text Joint Embedding for Automated Audio Captioning},
  year      = {2024},
  doi       = {10.1109/ICASSP48485.2024.10446672},
  selected  = {true},
  preview   = {enclap.png},
  html      = {https://ieeexplore.ieee.org/document/10446672},
  code      = {https://github.com/jaeyeonkim99/EnCLAP}
}
% PITS paper from a 2023 ICML workshop; flagged as a selected publication.
% The booktitle is kept on a single line; the ampersand stays escaped for LaTeX.
@inproceedings{pits,
  title     = {PITS: Variational pitch inference without fundamental frequency for end-to-end pitch-controllable TTS},
  author    = {Lee, Junhyeok and Jung, Wonbin and Cho, Hyunjae and Kim, Jaeyeon and Kim, Jaehwan},
  booktitle = {ICML Workshop on Structured Probabilistic Inference \& Generative Modeling},
  year      = {2023},
  selected  = {true},
  preview   = {pits.png},
  html      = {https://openreview.net/forum?id=EwzNo0znwf#discussion},
  code      = {https://github.com/anonymous-pits/pits}
}