This repo contains a collection of scripts to help with IMDB construction for common machine learning/computer vision datasets. Any additions/PRs welcome.
Pascal VOC: paper
@article{everingham2010pascal,
title={The pascal visual object classes (voc) challenge},
author={Everingham, Mark and Van Gool, Luc and Williams, Christopher KI and Winn, John and Zisserman, Andrew},
journal={International journal of computer vision},
volume={88},
number={2},
pages={303--338},
year={2010},
publisher={Springer}
}
MS Coco: paper
Lin, Tsung-Yi, Michael Maire, Serge Belongie, James Hays, Pietro Perona,
Deva Ramanan, Piotr Dollár, and C. Lawrence Zitnick. "Microsoft coco:
Common objects in context." In European conference on computer vision, pp.
740-755. Springer, Cham, 2014.
Note that to use the coco imdb constructor, it is necessary to have the coco Matlab API somewhere on your MATLAB path.
AFEW 3.0: paper
Dhall, A., Goecke, R., Joshi, J., Hoey, J., & Gedeon, T. (2016, October).
Emotiw 2016: Video and group-level emotion recognition challenges.
In Proceedings of the 18th ACM International Conference on Multimodal
Interaction (pp. 427-432). ACM.
enterface: paper
@inproceedings{martin2006enterface,
titludio-visual emotion database},
author={Martin, Olivier and Kotsia, Irene and Macq, Benoit and Pitas, Ioannis},
booktitle={Data Engineering Workshops, 2006. Proceedings. 22nd International Conference on},
pages={8--8},
year={2006},
organization={IEEE}
}
RML: paper
@inproceedings{wang2004investigation,
title={An investigation of speech-based human emotion recognition},
author={Wang, Yongjin and Guan, Ling},
booktitle={Multimedia Signal Processing, 2004 IEEE 6th Workshop on},
pages={15--18},
year={2004},
organization={IEEE}
}
FER2013: paper
@inproceedings{goodfellow2013challenges,
title={Challenges in representation learning: A report on three machine learning contests},
author={Goodfellow, Ian J and Erhan, Dumitru and Carrier, Pierre Luc and Courville, Aaron and Mirza, Mehdi and Hamner, Ben and Cukierski, Will and Tang, Yichuan and Thaler, David and Lee, Dong-Hyun and others},
booktitle={International Conference on Neural Information Processing},
pages={117--124},
year={2013},
organization={Springer}
}
@inproceedings{BarsoumICMI2016,
title={Training Deep Networks for Facial Expression Recognition with Crowd-Sourced Label Distribution},
author={Barsoum, Emad and Zhang, Cha and Canton Ferrer, Cristian and Zhang, Zhengyou},
booktitle={ACM International Conference on Multimodal Interaction (ICMI)},
year={2016}
}
SFEW 2.0*: paper
@article{dhall2012collecting,
title={Collecting large, richly annotated facial-expression databases from movies},
author={Dhall, Abhinav and Goecke, Roland and Lucey, Simon and Gedeon, Tom and others},
journal={IEEE multimedia},
volume={19},
number={3},
pages={34--41},
year={2012}
}