From 938a896ac73eee6cb2aa2d071e9a7a8056aa9c79 Mon Sep 17 00:00:00 2001 From: Candace Moore Date: Sat, 22 Jun 2024 14:08:29 +0000 Subject: [PATCH] labs update1 --- notebooks/experi/labs.ipynb | 87 ++++++++++++++++++++++- notebooks/experi/labs2.ipynb | 133 ++++++++++++++++++++++++++++++++++- 2 files changed, 217 insertions(+), 3 deletions(-) diff --git a/notebooks/experi/labs.ipynb b/notebooks/experi/labs.ipynb index 1edeab2..18217db 100644 --- a/notebooks/experi/labs.ipynb +++ b/notebooks/experi/labs.ipynb @@ -66,6 +66,73 @@ "lab_data2['studieID'].unique()" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "ad76d432-1819-4181-b7f9-eb4797bf1d62", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "set_2023 = set(['BRICK-001', 'BRICK-002', 'BRICK-003', 'BRICK-004', 'BRICK-005',\n", + " 'BRICK-006', 'BRICK-007', 'BRICK-008', 'BRICK-009', 'BRICK-010',\n", + " 'BRICK-011', 'BRICK-012', 'BRICK-013', 'BRICK-014', 'BRICK-015',\n", + " 'BRICK-016', 'BRICK-017', 'BRICK-018', 'BRICK-019', 'BRICK-021',\n", + " 'BRICK-024', 'BRICK-025', 'BRICK-026', 'BRICK-027', 'BRICK-028',\n", + " 'BRICK-029', 'BRICK-030', 'BRICK-031', 'BRICK-032', 'BRICK-033',\n", + " 'BRICK-035', 'BRICK-037', 'BRICK-038', 'BRICK-039', 'BRICK-040',\n", + " 'BRICK-041', 'BRICK-042', 'BRICK-044', 'BRICK-047', 'BRICK-048',\n", + " 'BRICK-049', 'BRICK-050', 'BRICK-051', 'BRICK-052', 'BRICK-053',\n", + " 'BRICK-054', 'BRICK-056', 'BRICK-058'])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ca376f25-fc91-47b8-a84f-9c7d4214b257", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "set_2024 = set(['BRICK-052', 'BRICK-053', 'BRICK-058', 'BRICK-056', 'BRICK-055',\n", + " 'BRICK-054', 'BRICK-027', 'BRICK-031', 'BRICK-028', 'BRICK-024',\n", + " 'BRICK-037', 'BRICK-025', 'BRICK-029', 'BRICK-019', 'BRICK-011',\n", + " 'BRICK-050', 'BRICK-026', 'BRICK-003', 'BRICK-030', 'BRICK-040',\n", + " 'BRICK-002', 'BRICK-014', 'BRICK-004', 'BRICK-042', 'BRICK-047',\n", + " 'BRICK-012', 'BRICK-051', 'BRICK-041', 'BRICK-010', 'BRICK-044',\n", + " 'BRICK-017', 'BRICK-001', 'BRICK-006', 'BRICK-018', 'BRICK-035',\n", + " 'BRICK-049', 'BRICK-016', 'BRICK-015', 'BRICK-048', 'BRICK-023',\n", + " 'BRICK-043', 'BRICK-005', 'BRICK-033', 'BRICK-008', 'BRICK-013',\n", + " 'BRICK-038', 'BRICK-039'])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0c271158-c559-4865-9407-d3944412d839", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "len(set_2023)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2d296ff1-0d7d-46a4-ac88-b8e1f2e4b6ee", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "intersection = set_2023.intersection(set_2024)\n", + "print(intersection)" + ] + }, { "cell_type": "markdown", "id": "5", @@ -596,7 +663,9 @@ "cell_type": "code", "execution_count": null, "id": "49", - "metadata": {}, + "metadata": { + "tags": [] + }, "outputs": [], "source": [ "#final_df" @@ -614,6 +683,18 @@ "final_df.head(3)" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "b8e04bf1-d8e6-4f1b-84dc-618222858c6a", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "final_df" + ] + }, { "cell_type": "code", "execution_count": null, @@ -660,7 +741,9 @@ "cell_type": "code", "execution_count": null, "id": "55", - "metadata": {}, + "metadata": { + "tags": [] + }, "outputs": [], "source": [ "updates.columns" diff --git a/notebooks/experi/labs2.ipynb b/notebooks/experi/labs2.ipynb index 097b547..ff79e6f 100644 --- a/notebooks/experi/labs2.ipynb +++ b/notebooks/experi/labs2.ipynb @@ -92,6 +92,18 @@ "len(lab_data['studieID'].unique())" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "598f35f7-8df1-435b-b159-cd4730f80930", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "#set(lab_data['studieID'].unique())" + ] + }, { "cell_type": "markdown", "id": "7", @@ -625,6 +637,26 @@ "final_df.shape" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "e7b3070e-247a-4cb3-ad5d-dfa262c0e1f7", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "final_df" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "35b5d282-c355-4d24-a037-fea21c323a8d", + "metadata": {}, + "outputs": [], + "source": [] + }, { "cell_type": "code", "execution_count": null, @@ -637,6 +669,18 @@ "final_df.head(30)" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "36b55f97-e328-4226-87c5-1956838007b8", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "30*1582" + ] + }, { "cell_type": "code", "execution_count": null, @@ -646,7 +690,94 @@ }, "outputs": [], "source": [ - "final_df.to_csv('full_labs_UPDATES.csv')" + "final_df.to_csv('../../secret_data/full_labs_UPDATES_assembled_22_6_2024.csv')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "316dd391-35aa-4882-ab5b-3c724e198612", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "final_df.head(3)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bd74bd62-3f8c-4c95-a59b-9b88e39c1498", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "df = pd.read_csv('../../secret_data/full_labs_UPDATES_assembled_22_6_2024.csv', index_col=1)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5a41d76e-2af2-41a6-9e88-81f307a7d2d6", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "df = df.drop('Unnamed: 0', axis=1)\n", + "df" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cf2c3b14-9f8e-4293-a7bd-826b98b89315", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "df.columns" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4d94d7e6-9fe0-4bcb-a5c1-1d3fe7d2e80f", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "df.to_csv('../../secret_data/castor_ready_labs_from_2023_made_22_6_2024.csv')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f3cf5d0d-6ada-4ad5-bd29-9100e17cac84", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "df_top = df[:15]\n", + "df_top" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e4d686ba-1a40-438f-9d0e-6f6425853262", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "df_top.to_csv('../../secret_data/castor_ready_labs_first_third_from_2023_made_22_6_2024.csv')" ] }, {