|
|
|
@ -1,6 +1,7 @@
|
|
|
|
|
{
|
|
|
|
|
"cells": [
|
|
|
|
|
{
|
|
|
|
|
"attachments": {},
|
|
|
|
|
"cell_type": "markdown",
|
|
|
|
|
"metadata": {},
|
|
|
|
|
"source": [
|
|
|
|
@ -20,6 +21,7 @@
|
|
|
|
|
]
|
|
|
|
|
},
|
|
|
|
|
{
|
|
|
|
|
"attachments": {},
|
|
|
|
|
"cell_type": "markdown",
|
|
|
|
|
"metadata": {},
|
|
|
|
|
"source": [
|
|
|
|
@ -29,20 +31,19 @@
|
|
|
|
|
{
|
|
|
|
|
"cell_type": "code",
|
|
|
|
|
"execution_count": 1,
|
|
|
|
|
"metadata": {
|
|
|
|
|
"collapsed": false
|
|
|
|
|
},
|
|
|
|
|
"outputs": [
|
|
|
|
|
{
|
|
|
|
|
"name": "stdout",
|
|
|
|
|
"output_type": "stream",
|
|
|
|
|
"text": [
|
|
|
|
|
]
|
|
|
|
|
"text": []
|
|
|
|
|
}
|
|
|
|
|
],
|
|
|
|
|
"source": [
|
|
|
|
|
"!pip install nomic"
|
|
|
|
|
],
|
|
|
|
|
"metadata": {
|
|
|
|
|
"collapsed": false
|
|
|
|
|
}
|
|
|
|
|
]
|
|
|
|
|
},
|
|
|
|
|
{
|
|
|
|
|
"cell_type": "code",
|
|
|
|
@ -52,13 +53,14 @@
|
|
|
|
|
"source": [
|
|
|
|
|
"import pandas as pd\n",
|
|
|
|
|
"import numpy as np\n",
|
|
|
|
|
"from ast import literal_eval\n",
|
|
|
|
|
"\n",
|
|
|
|
|
"# Load the embeddings\n",
|
|
|
|
|
"datafile_path = \"data/fine_food_reviews_with_embeddings_1k.csv\"\n",
|
|
|
|
|
"df = pd.read_csv(datafile_path)\n",
|
|
|
|
|
"\n",
|
|
|
|
|
"# Convert to a list of lists of floats\n",
|
|
|
|
|
"embeddings = np.array(df.embedding.apply(eval).to_list())\n",
|
|
|
|
|
"embeddings = np.array(df.embedding.apply(literal_eval).to_list())\n",
|
|
|
|
|
"df = df.drop('embedding', axis=1)\n",
|
|
|
|
|
"df = df.rename(columns={'Unnamed: 0': 'id'})\n"
|
|
|
|
|
]
|
|
|
|
@ -71,8 +73,7 @@
|
|
|
|
|
{
|
|
|
|
|
"name": "stderr",
|
|
|
|
|
"output_type": "stream",
|
|
|
|
|
"text": [
|
|
|
|
|
]
|
|
|
|
|
"text": []
|
|
|
|
|
}
|
|
|
|
|
],
|
|
|
|
|
"source": [
|
|
|
|
@ -88,6 +89,7 @@
|
|
|
|
|
]
|
|
|
|
|
},
|
|
|
|
|
{
|
|
|
|
|
"attachments": {},
|
|
|
|
|
"cell_type": "markdown",
|
|
|
|
|
"metadata": {},
|
|
|
|
|
"source": [
|
|
|
|
@ -97,11 +99,65 @@
|
|
|
|
|
{
|
|
|
|
|
"cell_type": "code",
|
|
|
|
|
"execution_count": 10,
|
|
|
|
|
"metadata": {
|
|
|
|
|
"collapsed": false
|
|
|
|
|
},
|
|
|
|
|
"outputs": [
|
|
|
|
|
{
|
|
|
|
|
"data": {
|
|
|
|
|
"text/plain": "meek-laborer: https://atlas.nomic.ai/map/fddc0e07-97c5-477c-827c-96bca44519aa/463f4614-7689-47e4-b55b-1da0cc679559",
|
|
|
|
|
"text/html": "\n <h3>Project: meek-laborer</h3>\n <script>\n destroy = function() {\n document.getElementById(\"iframe463f4614-7689-47e4-b55b-1da0cc679559\").remove()\n }\n </script>\n\n <h4>Projection ID: 463f4614-7689-47e4-b55b-1da0cc679559</h4>\n <div class=\"actions\">\n <div id=\"hide\" class=\"action\" onclick=\"destroy()\">Hide embedded project</div>\n <div class=\"action\" id=\"out\">\n <a href=\"https://atlas.nomic.ai/map/fddc0e07-97c5-477c-827c-96bca44519aa/463f4614-7689-47e4-b55b-1da0cc679559\" target=\"_blank\">Explore on atlas.nomic.ai</a>\n </div>\n </div>\n \n <iframe class=\"iframe\" id=\"iframe463f4614-7689-47e4-b55b-1da0cc679559\" allow=\"clipboard-read; clipboard-write\" src=\"https://atlas.nomic.ai/map/fddc0e07-97c5-477c-827c-96bca44519aa/463f4614-7689-47e4-b55b-1da0cc679559\">\n </iframe>\n\n <style>\n .iframe {\n /* vh can be **very** large in vscode ipynb. */\n height: min(75vh, 66vw);\n width: 100%;\n }\n </style>\n \n <style>\n .actions {\n display: block;\n }\n .action {\n min-height: 18px;\n margin: 5px;\n transition: all 500ms ease-in-out;\n }\n .action:hover {\n cursor: pointer;\n }\n #hide:hover::after {\n content: \" X\";\n }\n #out:hover::after {\n content: \"\";\n }\n </style>\n \n "
|
|
|
|
|
"text/html": [
|
|
|
|
|
"\n",
|
|
|
|
|
" <h3>Project: meek-laborer</h3>\n",
|
|
|
|
|
" <script>\n",
|
|
|
|
|
" destroy = function() {\n",
|
|
|
|
|
" document.getElementById(\"iframe463f4614-7689-47e4-b55b-1da0cc679559\").remove()\n",
|
|
|
|
|
" }\n",
|
|
|
|
|
" </script>\n",
|
|
|
|
|
"\n",
|
|
|
|
|
" <h4>Projection ID: 463f4614-7689-47e4-b55b-1da0cc679559</h4>\n",
|
|
|
|
|
" <div class=\"actions\">\n",
|
|
|
|
|
" <div id=\"hide\" class=\"action\" onclick=\"destroy()\">Hide embedded project</div>\n",
|
|
|
|
|
" <div class=\"action\" id=\"out\">\n",
|
|
|
|
|
" <a href=\"https://atlas.nomic.ai/map/fddc0e07-97c5-477c-827c-96bca44519aa/463f4614-7689-47e4-b55b-1da0cc679559\" target=\"_blank\">Explore on atlas.nomic.ai</a>\n",
|
|
|
|
|
" </div>\n",
|
|
|
|
|
" </div>\n",
|
|
|
|
|
" \n",
|
|
|
|
|
" <iframe class=\"iframe\" id=\"iframe463f4614-7689-47e4-b55b-1da0cc679559\" allow=\"clipboard-read; clipboard-write\" src=\"https://atlas.nomic.ai/map/fddc0e07-97c5-477c-827c-96bca44519aa/463f4614-7689-47e4-b55b-1da0cc679559\">\n",
|
|
|
|
|
" </iframe>\n",
|
|
|
|
|
"\n",
|
|
|
|
|
" <style>\n",
|
|
|
|
|
" .iframe {\n",
|
|
|
|
|
" /* vh can be **very** large in vscode ipynb. */\n",
|
|
|
|
|
" height: min(75vh, 66vw);\n",
|
|
|
|
|
" width: 100%;\n",
|
|
|
|
|
" }\n",
|
|
|
|
|
" </style>\n",
|
|
|
|
|
" \n",
|
|
|
|
|
" <style>\n",
|
|
|
|
|
" .actions {\n",
|
|
|
|
|
" display: block;\n",
|
|
|
|
|
" }\n",
|
|
|
|
|
" .action {\n",
|
|
|
|
|
" min-height: 18px;\n",
|
|
|
|
|
" margin: 5px;\n",
|
|
|
|
|
" transition: all 500ms ease-in-out;\n",
|
|
|
|
|
" }\n",
|
|
|
|
|
" .action:hover {\n",
|
|
|
|
|
" cursor: pointer;\n",
|
|
|
|
|
" }\n",
|
|
|
|
|
" #hide:hover::after {\n",
|
|
|
|
|
" content: \" X\";\n",
|
|
|
|
|
" }\n",
|
|
|
|
|
" #out:hover::after {\n",
|
|
|
|
|
" content: \"\";\n",
|
|
|
|
|
" }\n",
|
|
|
|
|
" </style>\n",
|
|
|
|
|
" \n",
|
|
|
|
|
" "
|
|
|
|
|
],
|
|
|
|
|
"text/plain": [
|
|
|
|
|
"meek-laborer: https://atlas.nomic.ai/map/fddc0e07-97c5-477c-827c-96bca44519aa/463f4614-7689-47e4-b55b-1da0cc679559"
|
|
|
|
|
]
|
|
|
|
|
},
|
|
|
|
|
"execution_count": 10,
|
|
|
|
|
"metadata": {},
|
|
|
|
@ -110,19 +166,16 @@
|
|
|
|
|
],
|
|
|
|
|
"source": [
|
|
|
|
|
"map"
|
|
|
|
|
],
|
|
|
|
|
"metadata": {
|
|
|
|
|
"collapsed": false
|
|
|
|
|
}
|
|
|
|
|
]
|
|
|
|
|
},
|
|
|
|
|
{
|
|
|
|
|
"cell_type": "code",
|
|
|
|
|
"execution_count": null,
|
|
|
|
|
"outputs": [],
|
|
|
|
|
"source": [],
|
|
|
|
|
"metadata": {
|
|
|
|
|
"collapsed": false
|
|
|
|
|
}
|
|
|
|
|
},
|
|
|
|
|
"outputs": [],
|
|
|
|
|
"source": []
|
|
|
|
|
}
|
|
|
|
|
],
|
|
|
|
|
"metadata": {
|
|
|
|
|