This dataset contains 11 converted Endoscopy datasets, part of the OmniMedSeg superset. All datasets are converted to a standardized structure with binary masks for each segmentation target.
================================================================================
DATASET LICENSE AND CITATION SUMMARY
QUICK REFERENCE: DATASETS AND LICENSES
BAGLS: CC BY-NC-SA 4.0
EAD: CC-BY-NC 3.0
ENDOVIS_15: CC-BY-NC 3.0
FETOSCOPY_PLACENTA: CC BY-NC-SA 4.0
FETREG: CC-BY-NC-SA 4.0
HYPER_KVASIR: CC-BY 4.0
KVASIR_CAPSULE_SEG: 'The use of the KvasirCapsule-SEG dataset is restricted for research and educational purposes. The use of the KvasirCapsule-SEG dataset for commercial purposes is forbidden without prior written permission.'
KVASIR_SEG: 'The use of the Kvasir-SEG dataset is restricted for research and educational purposes. The use of the Kvasir-SEG dataset for commercial purposes is forbidden without prior written permission.'
LARYNGEAL_ENDOSCOPIC: CC-BY 4.0
POLYP_DB: 'Publicly Accessible: The dataset is open for research and educational purposes.'
CVC_CLINICDB: 'The use of this database is completely restricted for research and educational purposes. The use of this database is forbidden for commercial purposes.'
DETAILED INFORMATION BY DATASET
[1] BAGLS
License: CC BY-NC-SA 4.0
Dataset link: https://zenodo.org/records/3762320
Metadata file: Endoscopy/BAGLS/metadata.json
Citation (bibtex):
@article{gomez2020bagls,
  author    = {G{\'o}mez, Pablo and Kist, Andreas M and Schlegel, Patrick and Berry, David A and Chhetri, Dinesh K and D{\"u}rr, Stephan and Echternach, Matthias and Johnson, Aaron M and Kniesburges, Stefan and Kunduk, Melda and others},
  title     = {{BAGLS}, a multihospital benchmark for automatic glottis segmentation},
  journal   = {Scientific Data},
  volume    = {7},
  number    = {1},
  pages     = {186},
  year      = {2020},
  publisher = {Nature Publishing Group UK London}
}
[2] CVC_CLINICDB
License: 'The use of this database is completely restricted for research and educational purposes. The use of this database is forbidden for commercial purposes.'
Dataset link: https://polyp.grand-challenge.org/CVCClinicDB/
Metadata file: Endoscopy/CVC_CLINICDB/metadata.json
Citation (bibtex):
@article{bernal2015wm,
  author    = {Bernal, Jorge and S{\'a}nchez, F Javier and Fern{\'a}ndez-Esparrach, Gloria and Gil, Debora and Rodr{\'\i}guez, Cristina and Vilari{\~n}o, Fernando},
  title     = {{WM-DOVA} maps for accurate polyp highlighting in colonoscopy: Validation vs. saliency maps from physicians},
  journal   = {Computerized Medical Imaging and Graphics},
  volume    = {43},
  pages     = {99--111},
  year      = {2015},
  publisher = {Elsevier}
}
[3] EAD
License: CC-BY-NC 3.0
Dataset link: https://data.mendeley.com/datasets/c7fjbxcgj9/3
Metadata file: Endoscopy/EAD/metadata.json
Citation (bibtex):
@misc{ali2019endoscopy,
  author        = {Ali, Sharib and Zhou, Felix and Daul, Christian and Braden, Barbara and Bailey, Adam and Realdon, Stefano and East, James and Wagnieres, Georges and Loschenov, Victor and Grisan, Enrico and others},
  title         = {Endoscopy artifact detection ({EAD} 2019) challenge dataset},
  year          = {2019},
  eprint        = {1905.03209},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/1905.03209}
}
[4] ENDOVIS_15
License: CC-BY-NC 3.0
Dataset link: https://archive.iar.kit.edu/opencas/index.html%3Fq=node%252F30.html
Metadata file: Endoscopy/ENDOVIS_15/metadata.json
Citation (bibtex):
@article{bernal2017comparative,
  author    = {Bernal, Jorge and Tajkbaksh, Nima and Sanchez, Francisco Javier and Matuszewski, Bogdan J and Chen, Hao and Yu, Lequan and Angermann, Quentin and Romain, Olivier and Rustad, Bj{\o}rn and Balasingham, Ilangko and others},
  title     = {Comparative validation of polyp detection methods in video colonoscopy: results from the {MICCAI} 2015 endoscopic vision challenge},
  journal   = {IEEE Transactions on Medical Imaging},
  volume    = {36},
  number    = {6},
  pages     = {1231--1249},
  year      = {2017},
  publisher = {IEEE}
}
[5] FETOSCOPY_PLACENTA
License: CC BY-NC-SA 4.0
Dataset link: https://rdr.ucl.ac.uk/articles/dataset/Fetoscopy_Placenta_Dataset/30536171
Metadata file: Endoscopy/FETOSCOPY_PLACENTA/metadata.json
Citation (bibtex):
@article{Bano2020,
  author    = {Bano, Sophia and Vasconcelos, Francisco and Vander Poorten, Emmanuel and Vercauteren, Tom and Ourselin, Sebastien and Deprest, Jan and Stoyanov, Danail},
  title     = {{FetNet}: a recurrent convolutional network for occlusion identification in fetoscopic videos},
  journal   = {International Journal of Computer Assisted Radiology and Surgery},
  volume    = {15},
  number    = {5},
  pages     = {791--801},
  year      = {2020},
  month     = apr,
  publisher = {Springer Science and Business Media LLC},
  issn      = {1861-6429},
  doi       = {10.1007/s11548-020-02169-0},
  url       = {https://doi.org/10.1007/s11548-020-02169-0}
}
[6] FETREG
License: CC-BY-NC-SA 4.0
Dataset link: https://rdr.ucl.ac.uk/articles/dataset/b_FetReg_Largescale_Multi-centre_Fetoscopy_Placenta_Dataset_b/30417166
Metadata file: Endoscopy/FETREG/metadata.json
Citation (bibtex):
@misc{Bano2025,
  author       = {Bano, Sophia and Casella, Alessandro and Vasconcelos, Francisco and Moccia, Sara and Attilakos, George and Wimalasundera, Ruwan C. and David, Anna L and Paladini, Dario and Deprest, Jan and De Momi, Elena and Mattos, Leonardo S. and Stoyanov, Danail},
  title        = {{FetReg}: Largescale Multi-centre Fetoscopy Placenta Dataset},
  howpublished = {UCL Research Data Repository},
  year         = {2025},
  month        = nov,
  doi          = {10.5522/04/30417166.v1},
  url          = {https://rdr.ucl.ac.uk/articles/dataset/b_FetReg_Largescale_Multi-centre_Fetoscopy_Placenta_Dataset_b/30417166}
}
[7] HYPER_KVASIR
License: CC-BY 4.0
Dataset link: https://datasets.simula.no/hyper-kvasir/
Metadata file: Endoscopy/HYPER_KVASIR/metadata.json
Citation (bibtex):
@article{Borgli2020,
  author  = {Borgli, Hanna and Thambawita, Vajira and Smedsrud, Pia H and Hicks, Steven and Jha, Debesh and Eskeland, Sigrun L and Randel, Kristin Ranheim and Pogorelov, Konstantin and Lux, Mathias and Nguyen, Duc Tien Dang and Johansen, Dag and Griwodz, Carsten and Stensland, H{\aa}kon K and Garcia-Ceja, Enrique and Schmidt, Peter T and Hammer, Hugo L and Riegler, Michael A and Halvorsen, P{\aa}l and de Lange, Thomas},
  title   = {{HyperKvasir}, a comprehensive multi-class image and video dataset for gastrointestinal endoscopy},
  journal = {Scientific Data},
  volume  = {7},
  number  = {1},
  pages   = {283},
  year    = {2020},
  issn    = {2052-4463},
  doi     = {10.1038/s41597-020-00622-y},
  url     = {https://doi.org/10.1038/s41597-020-00622-y}
}
[8] KVASIR_CAPSULE_SEG
License: 'The use of the KvasirCapsule-SEG dataset is restricted for research and educational purposes. The use of the KvasirCapsule-SEG dataset for commercial purposes is forbidden without prior written permission.'
Dataset link: https://datasets.simula.no/kvasir-capsule-seg/
Metadata file: Endoscopy/KVASIR_CAPSULE_SEG/metadata.json
Citation (bibtex):
@inproceedings{jha2021nanonet,
  author    = {Jha, Debesh and Tomar, Nikhil Kumar and Ali, Sharib and Riegler, Michael A and Johansen, H{\aa}vard D and Johansen, Dag and de Lange, Thomas and Halvorsen, P{\aa}l},
  title     = {Nanonet: Real-time polyp segmentation in video capsule endoscopy and colonoscopy},
  booktitle = {Proceedings of the 2021 IEEE 34th International Symposium on Computer-Based Medical Systems (CBMS)},
  year      = {2021},
  pages     = {37--43}
}
[9] KVASIR_SEG
License: 'The use of the Kvasir-SEG dataset is restricted for research and educational purposes. The use of the Kvasir-SEG dataset for commercial purposes is forbidden without prior written permission.'
Dataset link: https://datasets.simula.no/kvasir-seg/
Metadata file: Endoscopy/KVASIR_SEG/metadata.json
Citation (bibtex):
@inproceedings{jha2020kvasir,
  author    = {Jha, Debesh and Smedsrud, Pia H and Riegler, Michael A and Halvorsen, P{\aa}l and de Lange, Thomas and Johansen, Dag and Johansen, H{\aa}vard D},
  title     = {{Kvasir-SEG}: A segmented polyp dataset},
  booktitle = {International Conference on Multimedia Modeling},
  pages     = {451--462},
  year      = {2020},
  publisher = {Springer}
}
[10] LARYNGEAL_ENDOSCOPIC
License: CC-BY 4.0
Dataset link: https://github.com/imesluh/vocalfolds
Metadata file: Endoscopy/LARYNGEAL_ENDOSCOPIC/metadata.json
Citation (bibtex):
@article{Laves2019,
  author    = {Laves, Max-Heinrich and Bicker, Jens and Kahrs, L{\"u}der A. and Ortmaier, Tobias},
  title     = {A dataset of laryngeal endoscopic images with comparative study on convolution neural network-based semantic segmentation},
  journal   = {International Journal of Computer Assisted Radiology and Surgery},
  volume    = {14},
  number    = {3},
  pages     = {483--492},
  year      = {2019},
  month     = jan,
  publisher = {Springer Science and Business Media LLC},
  issn      = {1861-6429},
  doi       = {10.1007/s11548-018-01910-0},
  url       = {https://doi.org/10.1007/s11548-018-01910-0}
}
[11] POLYP_DB
License: 'Publicly Accessible: The dataset is open for research and educational purposes.'
Dataset link: https://github.com/DebeshJha/PolypDB
Metadata file: Endoscopy/POLYP_DB/metadata.json
Citation (bibtex):
@misc{Jha2024PolypDB,
  author       = {Jha, Debesh and others},
  title        = {{PolypDB}: A Curated Multi-Center Dataset for Development of {AI} Algorithms in Colonoscopy},
  howpublished = {arXiv preprint},
  year         = {2024},
  url          = {https://github.com/DebeshJha/PolypDB},
  annote       = {Reviewer note: the former doi value 10.1109/TMI.2024.1234567 looked like a placeholder (an IEEE TMI prefix on an arXiv preprint, sequential digits) and was moved here instead of being rendered as a link. Add the verified arXiv identifier as eprint/archiveprefix once confirmed.}
}
================================================================================
IMPORTANT NOTES
- All datasets listed are publicly available
- Full metadata is stored in each dataset's metadata.json file
- For CC0-licensed datasets (none of the datasets listed in this file), attribution is appreciated but not required
- For other licenses, please review the specific terms before use