USC-Applied-NLP-Group
/

SQL-Generation

TensorBoard

Safetensors

Model card | Files and versions | Training metrics | Community

licesma committed 25 days ago

Commit

5af7feb

1 Parent(s): aa43cb9

Modify path to relative path

Browse files

Files changed (1) hide show

test_pretrained.ipynb +15 -15

test_pretrained.ipynb CHANGED Viewed

@@ -48,7 +48,7 @@
     "    hugging_face_path = snapshot_download(\n",
     "        repo_id=\"USC-Applied-NLP-Group/SQL-Generation\",\n",
     "        repo_type=\"model\",  \n",
-    "        allow_patterns=[\"src/*\", \"train-data/*\", \"deepseek-coder-1.3b-instruct/*\"], \n",
     "    )\n",
     "    sys.path.append(hugging_face_path)\n",
     "    current_path = hugging_face_path"
@@ -166,7 +166,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 29,
    "metadata": {},
    "outputs": [
     {
@@ -179,7 +179,7 @@
    ],
    "source": [
     "# Create connection to sqlite3 database\n",
-    "connection = sql.connect('./nba-data/nba.sqlite')\n",
     "cursor = connection.cursor()\n",
     "\n",
     "# Execute query from model output and print result\n",
@@ -304,7 +304,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
    "metadata": {},
    "outputs": [
     {
@@ -325,7 +325,7 @@
     }
    ],
    "source": [
-    "less_than_90_df = pd.read_csv(\"./train-data/less_than_90.tsv\", sep='\\t')\n",
     "run_evaluation(less_than_90_df, \"Less than 90\")\n",
     "print(\"Dataset length: \" + str(len(less_than_90_df)))"
    ]
@@ -339,7 +339,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 10,
    "metadata": {},
    "outputs": [
     {
@@ -372,7 +372,7 @@
     }
    ],
    "source": [
-    "game_queries = pd.read_csv(\"./train-data/queries_from_game.tsv\", sep='\\t')\n",
     "run_evaluation(game_queries, \"Queries from game\")\n",
     "print(\"Dataset length: \" + str(len(game_queries)))"
    ]
@@ -386,7 +386,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 11,
    "metadata": {},
    "outputs": [
     {
@@ -406,7 +406,7 @@
     }
    ],
    "source": [
-    "other_stats_queries = pd.read_csv(\"./train-data/queries_from_other_stats.tsv\", sep='\\t')\n",
     "run_evaluation(other_stats_queries, \"Queries from other stats\")\n",
     "print(\"Dataset length: \" + str(len(other_stats_queries)))"
    ]
@@ -420,7 +420,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 12,
    "metadata": {},
    "outputs": [
     {
@@ -438,7 +438,7 @@
     }
    ],
    "source": [
-    "team_queries = pd.read_csv(\"./train-data/queries_from_team.tsv\", sep='\\t')\n",
     "run_evaluation(team_queries, \"Queries from team\")\n",
     "print(\"Dataset length: \" + str(len(team_queries)))"
    ]
@@ -452,7 +452,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 13,
    "metadata": {},
    "outputs": [
     {
@@ -472,7 +472,7 @@
     }
    ],
    "source": [
-    "join_queries = pd.read_csv(\"./train-data/with_join.tsv\", sep='\\t')\n",
     "run_evaluation(join_queries, \"Queries with join\")\n",
     "print(\"Dataset length: \" + str(len(join_queries)))"
    ]
@@ -486,7 +486,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 14,
    "metadata": {},
    "outputs": [
     {
@@ -520,7 +520,7 @@
     }
    ],
    "source": [
-    "no_join_queries = pd.read_csv(\"./train-data/without_join.tsv\", sep='\\t')\n",
     "run_evaluation(no_join_queries, \"Queries without join\")\n",
     "print(\"Dataset length: \" + str(len(no_join_queries)))"
    ]

     "    hugging_face_path = snapshot_download(\n",
     "        repo_id=\"USC-Applied-NLP-Group/SQL-Generation\",\n",
     "        repo_type=\"model\",  \n",
+    "        allow_patterns=[\"src/*\", \"train-data/*\", \"deepseek-coder-1.3b-instruct/*\", \"nba-data/*\"], \n",
     "    )\n",
     "    sys.path.append(hugging_face_path)\n",
     "    current_path = hugging_face_path"
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "metadata": {},
    "outputs": [
     {
    ],
    "source": [
     "# Create connection to sqlite3 database\n",
+    "connection = sql.connect(get_path('nba-data/nba.sqlite'))\n",
     "cursor = connection.cursor()\n",
     "\n",
     "# Execute query from model output and print result\n",
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "metadata": {},
    "outputs": [
     {
     }
    ],
    "source": [
+    "less_than_90_df = pd.read_csv(get_path(\"train-data/less_than_90.tsv\"), sep='\\t')\n",
     "run_evaluation(less_than_90_df, \"Less than 90\")\n",
     "print(\"Dataset length: \" + str(len(less_than_90_df)))"
    ]
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "metadata": {},
    "outputs": [
     {
     }
    ],
    "source": [
+    "game_queries = pd.read_csv(get_path(\"train-data/queries_from_game.tsv\"), sep='\\t')\n",
     "run_evaluation(game_queries, \"Queries from game\")\n",
     "print(\"Dataset length: \" + str(len(game_queries)))"
    ]
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "metadata": {},
    "outputs": [
     {
     }
    ],
    "source": [
+    "other_stats_queries = pd.read_csv(get_path(\"train-data/queries_from_other_stats.tsv\"), sep='\\t')\n",
     "run_evaluation(other_stats_queries, \"Queries from other stats\")\n",
     "print(\"Dataset length: \" + str(len(other_stats_queries)))"
    ]
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "metadata": {},
    "outputs": [
     {
     }
    ],
    "source": [
+    "team_queries = pd.read_csv(get_path(\"train-data/queries_from_team.tsv\"), sep='\\t')\n",
     "run_evaluation(team_queries, \"Queries from team\")\n",
     "print(\"Dataset length: \" + str(len(team_queries)))"
    ]
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "metadata": {},
    "outputs": [
     {
     }
    ],
    "source": [
+    "join_queries = pd.read_csv(get_path(\"train-data/with_join.tsv\"), sep='\\t')\n",
     "run_evaluation(join_queries, \"Queries with join\")\n",
     "print(\"Dataset length: \" + str(len(join_queries)))"
    ]
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "metadata": {},
    "outputs": [
     {
     }
    ],
    "source": [
+    "no_join_queries = pd.read_csv(get_path(\"train-data/without_join.tsv\"), sep='\\t')\n",
     "run_evaluation(no_join_queries, \"Queries without join\")\n",
     "print(\"Dataset length: \" + str(len(no_join_queries)))"
    ]