Replace build with python-build, fix package order (Point72#358)

arhamchopra · Nijat K · commit ffd6bcacdfe8 · 2024-11-03T17:20:15.000-05:00
- The conda-forge `build` feedstock is deprecated (https://github.com/conda-forge/build-feedstock), so `build` is replaced with `python-build`.

Signed-off-by: Arham Chopra <arham.chopra@cubistsystematic.com>
diff --git a/cpp/csp/adapters/websocket/rand_csp.ipynb b/cpp/csp/adapters/websocket/rand_csp.ipynb
@@ -0,0 +1,258 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 18,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import csp\n",
+    "from datetime import datetime, timedelta\n",
+    "\n",
+    "from csp.adapters.parquet import ParquetOutputConfig, ParquetReader, ParquetWriter\n",
+    "from typing import Dict, List\n",
+    "\n",
+    "class MySmolStruct(csp.Struct):\n",
+    "    v: str\n",
+    "    z: int = 12\n",
+    "\n",
+    "class MySillyStruct(csp.Struct):\n",
+    "    header: str = \"abad\"\n",
+    "    x: int\n",
+    "    ms: MySmolStruct\n",
+    "\n",
+    "\n",
+    "class MyStruct(csp.Struct):\n",
+    "    x: int\n",
+    "    v: float = 1.0\n",
+    "    bb: MySillyStruct = MySillyStruct()\n",
+    "\n",
+    "\n",
+    "@csp.node\n",
+    "def dedup(real: csp.ts[\"T\"], hist: csp.ts[\"T\"], flag: csp.ts[bool]) -> csp.ts[\"T\"]:\n",
+    "    if csp.ticked(flag):\n",
+    "        csp.make_passive(hist)\n",
+    "    \n",
+    "    if csp.ticked(hist):\n",
+    "        return real\n",
+    "    \n",
+    "    if csp.ticked(real):\n",
+    "        return real\n",
+    "\n",
+    "\n",
+    "# big_vals = [MyStruct(x=3) * 100]\n",
+    "tup_size = 1_000_000\n",
+    "# tups = [(timedelta(microseconds= i), MyStruct(x=3) ) for i in range(tup_size)]\n",
+    "# tup2 = [(timedelta(microseconds = i), MyStruct(x=3) ) for i in range(tup_size)]\n",
+    "\n",
+    "path = \"/Users/neej/dev/csp/test_tup.pq\"\n",
+    "path2 = \"/Users/neej/dev/csp/test_tup2.pq\"\n",
+    "\n",
+    "@csp.graph\n",
+    "def write_vals():\n",
+    "\n",
+    "    writer = ParquetWriter(\n",
+    "        file_name=path, timestamp_column_name=\"csp_time\", config=ParquetOutputConfig(allow_overwrite=True)\n",
+    "    )\n",
+    "    tups = [(timedelta(microseconds= i), MyStruct(x=3) ) for i in range(tup_size)]\n",
+    "    tups_csp = csp.curve(typ=MyStruct, data=tups)\n",
+    "    writer.publish_struct(tups_csp)\n",
+    "\n",
+    "csp.run(write_vals, starttime=datetime(2020, 1, 1), endtime=datetime(2099, 1, 1))\n",
+    "\n",
+    "@csp.graph\n",
+    "def g_fast():\n",
+    "    # vals1 = csp.curve(typ=MyStruct, data=tups)\n",
+    "    # vals2 = csp.curve( typ=MyStruct, data=tup2 )\n",
+    "    struct_reader = ParquetReader(path, time_column=\"csp_time\")\n",
+    "    vals1 = struct_reader.subscribe_all(MyStruct)\n",
+    "\n",
+    "    struct_reader2 = ParquetReader(path2, time_column=\"csp_time\")\n",
+    "    vals2 = struct_reader2.subscribe_all(MyStruct)\n",
+    "\n",
+    "\n",
+    "    flag = csp.const(True)\n",
+    "    filt1 = csp.filter(flag, vals1)\n",
+    "    res = csp.merge(filt1, vals2)\n",
+    "    csp.add_graph_output(\"res\", res)\n",
+    "\n",
+    "\n",
+    "\n",
+    "@csp.graph\n",
+    "def g_slow():\n",
+    "    struct_reader = ParquetReader(path, time_column=\"csp_time\")\n",
+    "    vals1 = struct_reader.subscribe_all(MyStruct)\n",
+    "\n",
+    "    struct_reader2 = ParquetReader(path2, time_column=\"csp_time\")\n",
+    "    vals2 = struct_reader2.subscribe_all(MyStruct)\n",
+    "\n",
+    "    flag = csp.const(True)\n",
+    "    res = dedup(vals1, vals2, flag)\n",
+    "    csp.add_graph_output(\"res\", res)\n",
+    "\n",
+    "\n",
+    "with csp.profiler.Profiler(cycle_file=\"cycle_data_slow.csv\", node_file=\"node_data_slow.csv\") as p:\n",
+    "    csp.run(g_slow, starttime=datetime(1970, 1, 1), endtime=datetime(2099, 1, 1))\n",
+    "\n",
+    "with csp.profiler.Profiler(cycle_file=\"cycle_data_fast.csv\", node_file=\"node_data_fast.csv\") as p:\n",
+    "    csp.run(g_fast, starttime=datetime(1970, 1, 1), endtime=datetime(2099, 1, 1))\n",
+    "\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 19,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CYCLE FAST\n",
+      "\n",
+      "Overall Execution Time Statistics:\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div><style>\n",
+       ".dataframe > thead > tr,\n",
+       ".dataframe > tbody > tr {\n",
+       "  text-align: right;\n",
+       "  white-space: pre-wrap;\n",
+       "}\n",
+       "</style>\n",
+       "<small>shape: (1, 4)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>overall_mean_time_us</th><th>overall_variance_us</th><th>overall_std_dev_us</th><th>total_samples</th></tr><tr><td>f64</td><td>f64</td><td>f64</td><td>u32</td></tr></thead><tbody><tr><td>2.859916</td><td>7.21443</td><td>2.685969</td><td>1000001</td></tr></tbody></table></div>"
+      ],
+      "text/plain": [
+       "shape: (1, 4)\n",
+       "┌──────────────────────┬─────────────────────┬────────────────────┬───────────────┐\n",
+       "│ overall_mean_time_us ┆ overall_variance_us ┆ overall_std_dev_us ┆ total_samples │\n",
+       "│ ---                  ┆ ---                 ┆ ---                ┆ ---           │\n",
+       "│ f64                  ┆ f64                 ┆ f64                ┆ u32           │\n",
+       "╞══════════════════════╪═════════════════════╪════════════════════╪═══════════════╡\n",
+       "│ 2.859916             ┆ 7.21443             ┆ 2.685969           ┆ 1000001       │\n",
+       "└──────────────────────┴─────────────────────┴────────────────────┴───────────────┘"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "import polars as pl\n",
+    "\n",
+    "from IPython.display import display\n",
+    "\n",
+    "# df = pl.read_csv(\"node_data_fast.csv\").group_by(\"Node Type\").agg(pl.col(\"Execution Time\").sum())\n",
+    "# display(df)\n",
+    "# df[\"Execution Time\"].sum()\n",
+    "\n",
+    "df = pl.read_csv(\"cycle_data_fast.csv\")\n",
+    "# display(df)\n",
+    "print(\"CYCLE FAST\")\n",
+    "import numpy as np\n",
+    "\n",
+    "# Overall statistics across every row of cycle_data_fast.csv\n",
+    "overall_stats = df.select([\n",
+    "    (pl.col('Execution Time').mean() * 1_000_000).alias('overall_mean_time_us'),\n",
+    "    (pl.col('Execution Time').var() * 1_000_000 * 1_000_000).alias('overall_variance_us'),  # variance has squared units, so the 1e6 scale factor is applied twice (result is in us^2)\n",
+    "    (pl.col('Execution Time').std() * 1_000_000).alias('overall_std_dev_us'),\n",
+    "    pl.col('Execution Time').count().alias('total_samples')\n",
+    "]).with_columns([\n",
+    "    pl.col(['overall_mean_time_us', 'overall_variance_us', 'overall_std_dev_us'])\n",
+    "])\n",
+    "\n",
+    "print(\"\\nOverall Execution Time Statistics:\")\n",
+    "display(overall_stats)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 20,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CYCLE SLOW\n",
+      "\n",
+      "Overall Execution Time Statistics:\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div><style>\n",
+       ".dataframe > thead > tr,\n",
+       ".dataframe > tbody > tr {\n",
+       "  text-align: right;\n",
+       "  white-space: pre-wrap;\n",
+       "}\n",
+       "</style>\n",
+       "<small>shape: (1, 4)</small><table border=\"1\" class=\"dataframe\"><thead><tr><th>overall_mean_time_us</th><th>overall_variance_us</th><th>overall_std_dev_us</th><th>total_samples</th></tr><tr><td>f64</td><td>f64</td><td>f64</td><td>u32</td></tr></thead><tbody><tr><td>1.583237</td><td>5.8768</td><td>2.424211</td><td>1000001</td></tr></tbody></table></div>"
+      ],
+      "text/plain": [
+       "shape: (1, 4)\n",
+       "┌──────────────────────┬─────────────────────┬────────────────────┬───────────────┐\n",
+       "│ overall_mean_time_us ┆ overall_variance_us ┆ overall_std_dev_us ┆ total_samples │\n",
+       "│ ---                  ┆ ---                 ┆ ---                ┆ ---           │\n",
+       "│ f64                  ┆ f64                 ┆ f64                ┆ u32           │\n",
+       "╞══════════════════════╪═════════════════════╪════════════════════╪═══════════════╡\n",
+       "│ 1.583237             ┆ 5.8768              ┆ 2.424211           ┆ 1000001       │\n",
+       "└──────────────────────┴─────────────────────┴────────────────────┴───────────────┘"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "import polars as pl\n",
+    "\n",
+    "from IPython.display import display\n",
+    "\n",
+    "df = pl.read_csv(\"cycle_data_slow.csv\")\n",
+    "# display(df)\n",
+    "print(\"CYCLE SLOW\")\n",
+    "import numpy as np\n",
+    "\n",
+    "# Overall statistics across every row of cycle_data_slow.csv\n",
+    "overall_stats = df.select([\n",
+    "    (pl.col('Execution Time').mean() * 1_000_000).alias('overall_mean_time_us'),\n",
+    "    (pl.col('Execution Time').var() * 1_000_000 * 1_000_000).alias('overall_variance_us'),  # variance has squared units, so the 1e6 scale factor is applied twice (result is in us^2)\n",
+    "    (pl.col('Execution Time').std() * 1_000_000).alias('overall_std_dev_us'),\n",
+    "    pl.col('Execution Time').count().alias('total_samples')\n",
+    "]).with_columns([\n",
+    "    pl.col(['overall_mean_time_us', 'overall_variance_us', 'overall_std_dev_us'])\n",
+    "])\n",
+    "\n",
+    "print(\"\\nOverall Execution Time Statistics:\")\n",
+    "display(overall_stats)"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
diff --git a/csp/adapters/testing_csp.ipynb b/csp/adapters/testing_csp.ipynb
@@ -0,0 +1,106 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "{'a': '9'}"
+      ]
+     },
+     "execution_count": 6,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "import csp\n",
+    "from typing import Dict\n",
+    "\n",
+    "class A(csp.Struct):\n",
+    "    d: Dict[str, str] = {}\n",
+    "\n",
+    "x = A()\n",
+    "x.d['a'] = '9'\n",
+    "\n",
+    "A().d\n",
+    "x.d"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'{\"john\": 11, \"stevie\": 12, \"my_list\": [1, 2]}'"
+      ]
+     },
+     "execution_count": 4,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "import json\n",
+    "\n",
+    "d = {'john': 11, 'stevie': 12, 'my_list': [1, 2]}\n",
+    "\n",
+    "x = json.dumps(d)\n",
+    "\n",
+    "with open('test.json', 'w') as f:\n",
+    "    f.write(x)\n",
+    "x"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "11"
+      ]
+     },
+     "execution_count": 10,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "with open(\"test.json\", 'r') as g:\n",
+    "    raw_str = g.read()\n",
+    "\n",
+    "json.loads(raw_str)['john']"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}