{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "## SCRIPT TO EXTRACT EXISTING TEXT EMBEDDINGS INTO A NEW WORKFLOW WITH NEW LOOKUP TABLES" ] }, { "cell_type": "code", "execution_count": 74, "metadata": {}, "outputs": [], "source": [ "import sys\n", "\n", "sys.path.insert(1, \"../../\")" ] }, { "cell_type": "code", "execution_count": 75, "metadata": {}, "outputs": [], "source": [ "import re\n", "from pathlib import Path\n", "\n", "import pandas as pd\n" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### SET VALUES FOR THE INDEX FOLDER TO BE EXTRACTED" ] }, { "cell_type": "code", "execution_count": 76, "metadata": {}, "outputs": [], "source": [ "# set local folder where the index data is located\n", "LOCAL_ROOT = \"