diff --git a/config.yaml b/config-eval.yaml similarity index 100% rename from config.yaml rename to config-eval.yaml diff --git a/dataset_create.ipynb b/dataset_create.ipynb new file mode 100644 index 0000000..4fbcd73 --- /dev/null +++ b/dataset_create.ipynb @@ -0,0 +1,822 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "from huggingface_hub import login\n", + "from datasets import load_dataset\n", + "import os\n", + "import json\n", + "import shutil" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "f0476002f8d14822a24f1376cfe29a07", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "VBox(children=(HTML(value='