SuffolkLITLab
diff --git a/dev-testing/functions.ipynb b/dev-testing/functions.ipynb
Lines changed: 23 additions & 69 deletions
@@ -2,68 +2,19 @@
  "cells": [
   {
    "cell_type": "code",
-   "execution_count": 11,
+   "execution_count": 1,
    "id": "cc93a668",
    "metadata": {},
    "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "None of PyTorch, TensorFlow >= 2.0, or Flax have been found. Models won't be available and only tokenizers, configuration and file/data utilities can be used.\n"
-     ]
-    },
     {
      "data": {
       "application/vnd.jupyter.widget-view+json": {
-       "model_id": "daa35a202b9944a981d2163df1c63c60",
+       "model_id": "5bd625018f6247fab661ce6d838cb40c",
        "version_major": 2,
        "version_minor": 0
       },
       "text/plain": [
-       "Downloading:   0%|          | 0.00/1.04M [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "bebdf1cab3a0459d8287208bd0923907",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "Downloading:   0%|          | 0.00/456k [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "292dc7fa30e14ed29d3fd1c547a1c121",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "Downloading:   0%|          | 0.00/1.36M [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "c8b65b559f5e42dc9c3015181358047b",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "Downloading:   0%|          | 0.00/665 [00:00<?, ?B/s]"
+       "Downloading:   0%|          | 0.00/26.0 [00:00<?, ?B/s]"
       ]
      },
      "metadata": {},
@@ -139,31 +90,32 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 12,
+   "execution_count": 2,
    "id": "e158174f",
    "metadata": {},
    "outputs": [],
    "source": [
     "stop_words = set(stopwords.words(\"english\"))\n",
     "\n",
-    "try:\n",
-    "    # this takes a while to load\n",
-    "    import en_core_web_lg\n",
+    "if 1==2:\n",
+    "    try:\n",
+    "        # this takes a while to load\n",
+    "        import en_core_web_lg\n",
     "\n",
-    "    nlp = en_core_web_lg.load()\n",
-    "except:\n",
-    "    print(\"Downloading word2vec model en_core_web_lg\")\n",
-    "    import subprocess\n",
+    "        nlp = en_core_web_lg.load()\n",
+    "    except:\n",
+    "        print(\"Downloading word2vec model en_core_web_lg\")\n",
+    "        import subprocess\n",
     "\n",
-    "    bashCommand = \"python -m spacy download en_core_web_lg\"\n",
-    "    process = subprocess.Popen(bashCommand.split(), stdout=subprocess.PIPE)\n",
-    "    output, error = process.communicate()\n",
-    "    print(f\"output of word2vec model download: {str(output)}\")\n",
-    "    import en_core_web_lg\n",
+    "        bashCommand = \"python -m spacy download en_core_web_lg\"\n",
+    "        process = subprocess.Popen(bashCommand.split(), stdout=subprocess.PIPE)\n",
+    "        output, error = process.communicate()\n",
+    "        print(f\"output of word2vec model download: {str(output)}\")\n",
+    "        import en_core_web_lg\n",
     "\n",
-    "    nlp = en_core_web_lg.load()\n",
+    "        nlp = en_core_web_lg.load()\n",
     "\n",
-    "passivepy = PassivePy.PassivePyAnalyzer(nlp=nlp)"
+    "    passivepy = PassivePy.PassivePyAnalyzer(nlp=nlp)"
    ]
   },
   {
@@ -198,6 +150,8 @@
     "jurisdictions = load(\"../formfyxer/data/jurisdictions.joblib\")\n",
     "groups = load(\"../formfyxer/data/groups.joblib\")\n",
     "clf_field_names = load(\"../formfyxer/data/clf_field_names.joblib\")\n",
+    "with open(\"../../keys/tools_token.txt\", \"r\") as file:\n",
+    "    tools_token = file.read().rstrip()\n",
     "with open(\"../../keys/spot_token.txt\", \"r\") as file:\n",
     "    spot_token = file.read().rstrip()\n",
     "with open(\"../../keys/openai_org.txt\", \"r\") as file:\n",
@@ -3045,7 +2999,7 @@
  ],
  "metadata": {
   "kernelspec": {
-   "display_name": "Python 3.8.10 64-bit",
+   "display_name": "Python 3 (ipykernel)",
    "language": "python",
    "name": "python3"
   },
@@ -3059,7 +3013,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.8.10"
+   "version": "3.8.12"
   },
   "vscode": {
    "interpreter": {