add more to config

2026-06-05 22:50:18 +00:00 · 2023-12-24 21:46:36 -05:00
parent 8d76069397
commit e53f605a2d
1 changed files with 30 additions and 33 deletions
@@ -374,7 +374,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 18,
+   "execution_count": 23,
   "metadata": {
    "scrolled": true
   },
@@ -414,9 +414,12 @@
    "aclient = instructor.patch(AsyncOpenAI())\n",
    "\n",
    "\n",
-    "async def expand_query(q) -> Query:\n",
+    "async def expand_query(\n",
+    "    q, *, model: str = \"gpt-4-1106-preview\", temp: float = 0\n",
+    ") -> Query:\n",
    "    return await aclient.chat.completions.create(\n",
-    "        model=\"gpt-4-1106-preview\",\n",
+    "        model=model,\n",
+    "        temperature=temp,\n",
    "        response_model=Query,\n",
    "        messages=[\n",
    "            {\n",
@@ -430,7 +433,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 19,
+   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
@@ -461,7 +464,7 @@
    {
     "data": {
      "text/html": [
-       "Run data is saved locally in <code>/Users/jasonliu/dev/instructor/tutorials/wandb/run-20231222_152028-opuq58lr</code>"
+       "Run data is saved locally in <code>/Users/jasonliu/dev/instructor/tutorials/wandb/run-20231224_212738-tq55vci1</code>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -473,7 +476,7 @@
    {
     "data": {
      "text/html": [
-       "Syncing run <strong><a href='https://wandb.ai/instructor/query-understanding/runs/opuq58lr' target=\"_blank\">major-firebrand-21</a></strong> to <a href='https://wandb.ai/instructor/query-understanding' target=\"_blank\">Weights & Biases</a> (<a href='https://wandb.me/run' target=\"_blank\">docs</a>)<br/>"
+       "Syncing run <strong><a href='https://wandb.ai/instructor/query-understanding/runs/tq55vci1' target=\"_blank\">cool-sponge-25</a></strong> to <a href='https://wandb.ai/instructor/query-understanding' target=\"_blank\">Weights & Biases</a> (<a href='https://wandb.me/run' target=\"_blank\">docs</a>)<br/>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -497,7 +500,7 @@
    {
     "data": {
      "text/html": [
-       " View run at <a href='https://wandb.ai/instructor/query-understanding/runs/opuq58lr' target=\"_blank\">https://wandb.ai/instructor/query-understanding/runs/opuq58lr</a>"
+       " View run at <a href='https://wandb.ai/instructor/query-understanding/runs/tq55vci1' target=\"_blank\">https://wandb.ai/instructor/query-understanding/runs/tq55vci1</a>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -510,34 +513,13 @@
     "name": "stderr",
     "output_type": "stream",
     "text": [
-      "Retrying, exception: 1 validation error for Query\n",
-      "rewritten_query\n",
-      "  Field required [type=missing, input_value={'rewitten_query': 'recen...', 'end': '2023-12-22'}}, input_type=dict]\n",
-      "    For further information visit https://errors.pydantic.dev/2.5/v/missing\n",
-      "Traceback (most recent call last):\n",
-      "  File \"/Users/jasonliu/dev/instructor/instructor/patch.py\", line 231, in retry_async\n",
-      "    return await process_response_async(\n",
-      "           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n",
-      "  File \"/Users/jasonliu/dev/instructor/instructor/patch.py\", line 201, in process_response_async\n",
-      "    model = await response_model.from_response_async(\n",
-      "            ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n",
-      "  File \"/Users/jasonliu/dev/instructor/instructor/function_calls.py\", line 198, in from_response_async\n",
-      "    return cls.model_validate_json(\n",
-      "           ^^^^^^^^^^^^^^^^^^^^^^^^\n",
-      "  File \"/Users/jasonliu/dev/instructor/.venv/lib/python3.11/site-packages/pydantic/main.py\", line 532, in model_validate_json\n",
-      "    return cls.__pydantic_validator__.validate_json(json_data, strict=strict, context=context)\n",
-      "           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n",
-      "pydantic_core._pydantic_core.ValidationError: 1 validation error for Query\n",
-      "rewritten_query\n",
-      "  Field required [type=missing, input_value={'rewitten_query': 'recen...', 'end': '2023-12-22'}}, input_type=dict]\n",
-      "    For further information visit https://errors.pydantic.dev/2.5/v/missing\n",
      "wandb: WARNING Source type is set to 'repo' but some required information is missing from the environment. A job will not be created from this run. See https://docs.wandb.ai/guides/launch/create-job\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "96b112129c944465a35156a6ffbdfe54",
+       "model_id": "5497ec4b72e24f9baa3fd23e49fe2403",
       "version_major": 2,
       "version_minor": 0
      },
@@ -551,7 +533,7 @@
    {
     "data": {
      "text/html": [
-       "W&B sync reduced upload amount by 7.9%             "
+       "W&B sync reduced upload amount by 8.6%             "
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -563,7 +545,7 @@
    {
     "data": {
      "text/html": [
-       " View run <strong style=\"color:#cdcd00\">major-firebrand-21</strong> at: <a href='https://wandb.ai/instructor/query-understanding/runs/opuq58lr' target=\"_blank\">https://wandb.ai/instructor/query-understanding/runs/opuq58lr</a><br/>Synced 5 W&B file(s), 1 media file(s), 4 artifact file(s) and 0 other file(s)"
+       " View run <strong style=\"color:#cdcd00\">cool-sponge-25</strong> at: <a href='https://wandb.ai/instructor/query-understanding/runs/tq55vci1' target=\"_blank\">https://wandb.ai/instructor/query-understanding/runs/tq55vci1</a><br/>Synced 4 W&B file(s), 1 media file(s), 4 artifact file(s) and 0 other file(s)"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -575,7 +557,7 @@
    {
     "data": {
      "text/html": [
-       "Find logs at: <code>./wandb/run-20231222_152028-opuq58lr/logs</code>"
+       "Find logs at: <code>./wandb/run-20231224_212738-tq55vci1/logs</code>"
      ],
      "text/plain": [
       "<IPython.core.display.HTML object>"
@@ -587,7 +569,10 @@
   ],
   "source": [
    "import asyncio\n",
+    "import time\n",
    "\n",
+    "model = \"gpt-4-1106-preview\"\n",
+    "temp = 0\n",
    "\n",
    "run = wandb.init(\n",
    "    project=\"query-understanding\",\n",
@@ -599,8 +584,15 @@
    "    \"quantum computing advancements last 2 months\",\n",
    "    \"biotechnology updates last 10 days\",\n",
    "]\n",
+    "start = time.perf_counter()\n",
+    "queries = await asyncio.gather(\n",
+    "    *[expand_query(q, model=model, temp=temp) for q in test_queries]\n",
+    ")\n",
    "\n",
-    "queries = await asyncio.gather(*[expand_query(q) for q in test_queries])\n",
+    "run.config.update({\"duration (s)\": time.perf_counter() - start})\n",
+    "run.config.update({\"n_queries\": len(queries)})\n",
+    "run.config.update({\"model\": model})\n",
+    "run.config.update({\"temp\": temp})\n",
    "\n",
    "with open(\"schema.json\", \"w+\") as f:\n",
    "    schema = Query.model_json_schema()\n",
@@ -614,6 +606,10 @@
    "df[\"input\"] = test_queries\n",
    "df.to_csv(\"results.csv\")\n",
    "\n",
+    "run.config.update({\"usage_total_tokens\": df[\"usage_total_tokens\"].sum()})\n",
+    "run.config.update({\"usage_completion_tokens\": df[\"usage_completion_tokens\"].sum()})\n",
+    "run.config.update({\"usage_prompt_tokens\": df[\"usage_prompt_tokens\"].sum()})\n",
+    "\n",
    "run.log({\"results\": wandb.Table(dataframe=df)})\n",
    "\n",
    "files = wandb.Artifact(\"data\", type=\"dataset\")\n",
@@ -622,6 +618,7 @@
    "files.add_file(\"results.jsonlines\")\n",
    "files.add_file(\"results.csv\")\n",
    "\n",
+    "\n",
    "run.log_artifact(files)\n",
    "run.finish()"
   ]