diff --git a/tutorials/Datasets/UFSC OCPap.ipynb b/tutorials/Datasets/UFSC OCPap.ipynb new file mode 100644 index 0000000..cdcb2e0 --- /dev/null +++ b/tutorials/Datasets/UFSC OCPap.ipynb @@ -0,0 +1,60 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# UFSC OCPap: Papanicolaou Stained Oral Cytology Dataset" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "This dataset is available at the Mendelay Data repository: [https://doi.org/10.17632/dr7ydy9xbk.2](https://doi.org/10.17632/dr7ydy9xbk.2)\n", + "\n", + "\n", + "The UFSC OCPap dataset comprises 9,797 labeled images of 1200x1600 pixels acquired from 5 slides of cancer diagnosed and 3 healthy of oral brush samples, from distinct patients.\n", + "\n", + "The slides were provided by the Hospital Dental Center of the University Hospital Professor Polydoro Ernani de São Thiago of Federal University of Santa Catarina (HU-UFSC) and this research was approved by the UFSC Research Ethics Committee (CEPSH), protocol number 23193719.5.0000.0121. All patients were previously approached and informed about the study objectives. Those who agreed to participate signed an Informed Consent Form." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Using Hugging Faces Datasets" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Installing HF datasets lib\n", + "%pip install datasets" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "from datasets import load_dataset\n", + "\n", + "dataset = load_dataset(\"lapix/UFSC_OCPap\")" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3.9.0 64-bit", + "language": "python", + "name": "python3" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +}