{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "name": "Crowd-Kit-Categorical.ipynb", "provenance": [], "collapsed_sections": [] }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" } }, "cells": [ { "cell_type": "code", "metadata": { "id": "KtiDQZCyr3xx" }, "source": [ "%%capture\n", "# %pip (rather than !pip) installs into the environment of the running kernel.\n", "%pip install crowd-kit" ], "execution_count": 1, "outputs": [] }, { "cell_type": "code", "metadata": { "id": "26Ov-2mHsxek" }, "source": [ "from crowdkit.datasets import load_dataset" ], "execution_count": 2, "outputs": [] }, { "cell_type": "code", "metadata": { "id": "UteIznTotSeH", "colab": { "base_uri": "https://localhost:8080/" }, "outputId": "3685dfa8-2fb0-46be-ba31-5bf712890645" }, "source": [ "df, df_gt = load_dataset('relevance-2')" ], "execution_count": 3, "outputs": [ { "output_type": "stream", "text": [ "Downloading relevance-2 from remote\n" ], "name": "stdout" } ] }, { "cell_type": "code", "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 419 }, "id": "TwGUO-30dw9S", "outputId": "5f8de55b-e161-450f-f530-de4db30c8527" }, "source": [ "df" ], "execution_count": 4, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", " | performer | \n", "task | \n", "label | \n", "
---|---|---|---|
0 | \n", "w851 | \n", "t30685 | \n", "1 | \n", "
1 | \n", "w6991 | \n", "t30008 | \n", "0 | \n", "
2 | \n", "w2596 | \n", "t36316 | \n", "0 | \n", "
3 | \n", "w5507 | \n", "t15145 | \n", "1 | \n", "
4 | \n", "w2982 | \n", "t44785 | \n", "1 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "
475531 | \n", "w4660 | \n", "t62250 | \n", "1 | \n", "
475532 | \n", "w6630 | \n", "t46626 | \n", "0 | \n", "
475533 | \n", "w4605 | \n", "t93513 | \n", "1 | \n", "
475534 | \n", "w1928 | \n", "t29002 | \n", "0 | \n", "
475535 | \n", "w5375 | \n", "t49052 | \n", "1 | \n", "
475536 rows × 3 columns
\n", "