Files
HowBadIsMyBatch/HowBadIsMyBatch.ipynb
frankknoll aaa5fc36e0 updating
2022-01-24 00:26:03 +01:00

2866 lines
105 KiB
Plaintext
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
{
"cells": [
{
"cell_type": "code",
"execution_count": 3,
"id": "9de5907f-18f5-4cb1-903e-26028ff1fa03",
"metadata": {},
"outputs": [],
"source": [
"import numpy as np\n",
"import pandas as pd\n",
"pd.set_option('display.max_rows', 10)\n",
"pd.set_option('display.max_columns', None)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "ad0e6044",
"metadata": {},
"outputs": [],
"source": [
"# Load the 2021 VAERS data file, using VAERS_ID as the index.\n",
"# NOTE(review): the variable is suffixed _22 but the path points at the 2021 export - confirm which year is intended.\n",
"df_patients_22 = pd.read_csv(\n",
"    \"VAERS/2021VAERSData/2021VAERSDATA.csv\",\n",
"    index_col='VAERS_ID',\n",
"    encoding='latin1',\n",
"    low_memory=False,\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "4472e902",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>RECVDATE</th>\n",
" <th>STATE</th>\n",
" <th>AGE_YRS</th>\n",
" <th>CAGE_YR</th>\n",
" <th>CAGE_MO</th>\n",
" <th>SEX</th>\n",
" <th>RPT_DATE</th>\n",
" <th>SYMPTOM_TEXT</th>\n",
" <th>DIED</th>\n",
" <th>DATEDIED</th>\n",
" <th>L_THREAT</th>\n",
" <th>ER_VISIT</th>\n",
" <th>HOSPITAL</th>\n",
" <th>HOSPDAYS</th>\n",
" <th>X_STAY</th>\n",
" <th>DISABLE</th>\n",
" <th>RECOVD</th>\n",
" <th>VAX_DATE</th>\n",
" <th>ONSET_DATE</th>\n",
" <th>NUMDAYS</th>\n",
" <th>LAB_DATA</th>\n",
" <th>V_ADMINBY</th>\n",
" <th>V_FUNDBY</th>\n",
" <th>OTHER_MEDS</th>\n",
" <th>CUR_ILL</th>\n",
" <th>HISTORY</th>\n",
" <th>PRIOR_VAX</th>\n",
" <th>SPLTTYPE</th>\n",
" <th>FORM_VERS</th>\n",
" <th>TODAYS_DATE</th>\n",
" <th>BIRTH_DEFECT</th>\n",
" <th>OFC_VISIT</th>\n",
" <th>ER_ED_VISIT</th>\n",
" <th>ALLERGIES</th>\n",
" </tr>\n",
" <tr>\n",
" <th>VAERS_ID</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>916600</th>\n",
" <td>01/01/2021</td>\n",
" <td>TX</td>\n",
" <td>33.0</td>\n",
" <td>33.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>Right side of epiglottis swelled up and hinder...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>12/28/2020</td>\n",
" <td>12/30/2020</td>\n",
" <td>2.0</td>\n",
" <td>None</td>\n",
" <td>PVT</td>\n",
" <td>NaN</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>01/01/2021</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>Pcn and bee venom</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916601</th>\n",
" <td>01/01/2021</td>\n",
" <td>CA</td>\n",
" <td>73.0</td>\n",
" <td>73.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>Approximately 30 min post vaccination administ...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>12/31/2020</td>\n",
" <td>12/31/2020</td>\n",
" <td>0.0</td>\n",
" <td>NaN</td>\n",
" <td>SEN</td>\n",
" <td>NaN</td>\n",
" <td>Patient residing at nursing facility. See pati...</td>\n",
" <td>Patient residing at nursing facility. See pati...</td>\n",
" <td>Patient residing at nursing facility. See pati...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>01/01/2021</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>\"Dairy\"</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916602</th>\n",
" <td>01/01/2021</td>\n",
" <td>WA</td>\n",
" <td>23.0</td>\n",
" <td>23.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>About 15 minutes after receiving the vaccine, ...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>U</td>\n",
" <td>12/31/2020</td>\n",
" <td>12/31/2020</td>\n",
" <td>0.0</td>\n",
" <td>NaN</td>\n",
" <td>SEN</td>\n",
" <td>NaN</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>01/01/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>Shellfish</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916603</th>\n",
" <td>01/01/2021</td>\n",
" <td>WA</td>\n",
" <td>58.0</td>\n",
" <td>58.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>extreme fatigue, dizziness,. could not lift my...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>12/23/2020</td>\n",
" <td>12/23/2020</td>\n",
" <td>0.0</td>\n",
" <td>none</td>\n",
" <td>WRK</td>\n",
" <td>NaN</td>\n",
" <td>none</td>\n",
" <td>kidney infection</td>\n",
" <td>diverticulitis, mitral valve prolapse, osteoar...</td>\n",
" <td>got measles from measel shot, mums from mumps ...</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>01/01/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Diclofenac, novacaine, lidocaine, pickles, tom...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916604</th>\n",
" <td>01/01/2021</td>\n",
" <td>TX</td>\n",
" <td>47.0</td>\n",
" <td>47.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>Injection site swelling, redness, warm to the ...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>N</td>\n",
" <td>12/22/2020</td>\n",
" <td>12/29/2020</td>\n",
" <td>7.0</td>\n",
" <td>NaN</td>\n",
" <td>PUB</td>\n",
" <td>NaN</td>\n",
" <td>Na</td>\n",
" <td>Na</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>01/01/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Na</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1997120</th>\n",
" <td>12/31/2021</td>\n",
" <td>ID</td>\n",
" <td>56.0</td>\n",
" <td>56.0</td>\n",
" <td>NaN</td>\n",
" <td>M</td>\n",
" <td>NaN</td>\n",
" <td>I had symptoms of low level un-diagnosed kidn...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>11/28/2021</td>\n",
" <td>11/30/2021</td>\n",
" <td>2.0</td>\n",
" <td>lab test for UTI</td>\n",
" <td>UNK</td>\n",
" <td>NaN</td>\n",
" <td>none</td>\n",
" <td>un-diagnosed kidney infection</td>\n",
" <td>none</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>12/31/2021</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>none</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1997121</th>\n",
" <td>12/31/2021</td>\n",
" <td>OH</td>\n",
" <td>69.0</td>\n",
" <td>69.0</td>\n",
" <td>NaN</td>\n",
" <td>M</td>\n",
" <td>NaN</td>\n",
" <td>I got very bad eczema after first shot. Then i...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>N</td>\n",
" <td>02/26/2021</td>\n",
" <td>03/04/2021</td>\n",
" <td>6.0</td>\n",
" <td>went to my doctor he said I have eczema. Gave...</td>\n",
" <td>PHM</td>\n",
" <td>NaN</td>\n",
" <td>b12 and d3 vitamins</td>\n",
" <td>NaN</td>\n",
" <td>hypothyroid</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>12/31/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>penicillin, statin drugs, codeine</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1997122</th>\n",
" <td>12/31/2021</td>\n",
" <td>NV</td>\n",
" <td>50.0</td>\n",
" <td>50.0</td>\n",
" <td>NaN</td>\n",
" <td>M</td>\n",
" <td>NaN</td>\n",
" <td>Hives all over the body and swelling of the li...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>U</td>\n",
" <td>09/04/2021</td>\n",
" <td>10/01/2021</td>\n",
" <td>27.0</td>\n",
" <td>NaN</td>\n",
" <td>PHM</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>12/31/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>None</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1998668</th>\n",
" <td>12/31/2021</td>\n",
" <td>SC</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>Arm tenderness</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>PVT</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>12/31/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1998669</th>\n",
" <td>12/31/2021</td>\n",
" <td>CA</td>\n",
" <td>59.0</td>\n",
" <td>59.0</td>\n",
" <td>NaN</td>\n",
" <td>M</td>\n",
" <td>NaN</td>\n",
" <td>Can't get up, all joints hurt States he is in ...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>N</td>\n",
" <td>04/29/2021</td>\n",
" <td>05/05/2021</td>\n",
" <td>6.0</td>\n",
" <td>Blood test.</td>\n",
" <td>PVT</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>07/07/2021</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>NKA</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>749067 rows × 34 columns</p>\n",
"</div>"
],
"text/plain": [
" RECVDATE STATE AGE_YRS CAGE_YR CAGE_MO SEX RPT_DATE \\\n",
"VAERS_ID \n",
"916600 01/01/2021 TX 33.0 33.0 NaN F NaN \n",
"916601 01/01/2021 CA 73.0 73.0 NaN F NaN \n",
"916602 01/01/2021 WA 23.0 23.0 NaN F NaN \n",
"916603 01/01/2021 WA 58.0 58.0 NaN F NaN \n",
"916604 01/01/2021 TX 47.0 47.0 NaN F NaN \n",
"... ... ... ... ... ... .. ... \n",
"1997120 12/31/2021 ID 56.0 56.0 NaN M NaN \n",
"1997121 12/31/2021 OH 69.0 69.0 NaN M NaN \n",
"1997122 12/31/2021 NV 50.0 50.0 NaN M NaN \n",
"1998668 12/31/2021 SC NaN NaN NaN F NaN \n",
"1998669 12/31/2021 CA 59.0 59.0 NaN M NaN \n",
"\n",
" SYMPTOM_TEXT DIED DATEDIED \\\n",
"VAERS_ID \n",
"916600 Right side of epiglottis swelled up and hinder... NaN NaN \n",
"916601 Approximately 30 min post vaccination administ... NaN NaN \n",
"916602 About 15 minutes after receiving the vaccine, ... NaN NaN \n",
"916603 extreme fatigue, dizziness,. could not lift my... NaN NaN \n",
"916604 Injection site swelling, redness, warm to the ... NaN NaN \n",
"... ... ... ... \n",
"1997120 I had symptoms of low level un-diagnosed kidn... NaN NaN \n",
"1997121 I got very bad eczema after first shot. Then i... NaN NaN \n",
"1997122 Hives all over the body and swelling of the li... NaN NaN \n",
"1998668 Arm tenderness NaN NaN \n",
"1998669 Can't get up, all joints hurt States he is in ... NaN NaN \n",
"\n",
" L_THREAT ER_VISIT HOSPITAL HOSPDAYS X_STAY DISABLE RECOVD \\\n",
"VAERS_ID \n",
"916600 NaN NaN NaN NaN NaN NaN Y \n",
"916601 NaN NaN NaN NaN NaN NaN Y \n",
"916602 NaN NaN NaN NaN NaN NaN U \n",
"916603 NaN NaN NaN NaN NaN NaN Y \n",
"916604 NaN NaN NaN NaN NaN NaN N \n",
"... ... ... ... ... ... ... ... \n",
"1997120 NaN NaN NaN NaN NaN NaN Y \n",
"1997121 NaN NaN NaN NaN NaN NaN N \n",
"1997122 NaN NaN NaN NaN NaN NaN U \n",
"1998668 NaN NaN NaN NaN NaN NaN Y \n",
"1998669 NaN NaN NaN NaN NaN NaN N \n",
"\n",
" VAX_DATE ONSET_DATE NUMDAYS \\\n",
"VAERS_ID \n",
"916600 12/28/2020 12/30/2020 2.0 \n",
"916601 12/31/2020 12/31/2020 0.0 \n",
"916602 12/31/2020 12/31/2020 0.0 \n",
"916603 12/23/2020 12/23/2020 0.0 \n",
"916604 12/22/2020 12/29/2020 7.0 \n",
"... ... ... ... \n",
"1997120 11/28/2021 11/30/2021 2.0 \n",
"1997121 02/26/2021 03/04/2021 6.0 \n",
"1997122 09/04/2021 10/01/2021 27.0 \n",
"1998668 NaN NaN NaN \n",
"1998669 04/29/2021 05/05/2021 6.0 \n",
"\n",
" LAB_DATA V_ADMINBY \\\n",
"VAERS_ID \n",
"916600 None PVT \n",
"916601 NaN SEN \n",
"916602 NaN SEN \n",
"916603 none WRK \n",
"916604 NaN PUB \n",
"... ... ... \n",
"1997120 lab test for UTI UNK \n",
"1997121 went to my doctor he said I have eczema. Gave... PHM \n",
"1997122 NaN PHM \n",
"1998668 NaN PVT \n",
"1998669 Blood test. PVT \n",
"\n",
" V_FUNDBY OTHER_MEDS \\\n",
"VAERS_ID \n",
"916600 NaN None \n",
"916601 NaN Patient residing at nursing facility. See pati... \n",
"916602 NaN None \n",
"916603 NaN none \n",
"916604 NaN Na \n",
"... ... ... \n",
"1997120 NaN none \n",
"1997121 NaN b12 and d3 vitamins \n",
"1997122 NaN NaN \n",
"1998668 NaN NaN \n",
"1998669 NaN NaN \n",
"\n",
" CUR_ILL \\\n",
"VAERS_ID \n",
"916600 None \n",
"916601 Patient residing at nursing facility. See pati... \n",
"916602 None \n",
"916603 kidney infection \n",
"916604 Na \n",
"... ... \n",
"1997120 un-diagnosed kidney infection \n",
"1997121 NaN \n",
"1997122 None \n",
"1998668 NaN \n",
"1998669 NaN \n",
"\n",
" HISTORY \\\n",
"VAERS_ID \n",
"916600 None \n",
"916601 Patient residing at nursing facility. See pati... \n",
"916602 None \n",
"916603 diverticulitis, mitral valve prolapse, osteoar... \n",
"916604 NaN \n",
"... ... \n",
"1997120 none \n",
"1997121 hypothyroid \n",
"1997122 None \n",
"1998668 NaN \n",
"1998669 NaN \n",
"\n",
" PRIOR_VAX SPLTTYPE \\\n",
"VAERS_ID \n",
"916600 NaN NaN \n",
"916601 NaN NaN \n",
"916602 NaN NaN \n",
"916603 got measles from measel shot, mums from mumps ... NaN \n",
"916604 NaN NaN \n",
"... ... ... \n",
"1997120 NaN NaN \n",
"1997121 NaN NaN \n",
"1997122 NaN NaN \n",
"1998668 NaN NaN \n",
"1998669 NaN NaN \n",
"\n",
" FORM_VERS TODAYS_DATE BIRTH_DEFECT OFC_VISIT ER_ED_VISIT \\\n",
"VAERS_ID \n",
"916600 2 01/01/2021 NaN Y NaN \n",
"916601 2 01/01/2021 NaN Y NaN \n",
"916602 2 01/01/2021 NaN NaN Y \n",
"916603 2 01/01/2021 NaN NaN NaN \n",
"916604 2 01/01/2021 NaN NaN NaN \n",
"... ... ... ... ... ... \n",
"1997120 2 12/31/2021 NaN Y NaN \n",
"1997121 2 12/31/2021 NaN NaN NaN \n",
"1997122 2 12/31/2021 NaN NaN NaN \n",
"1998668 2 12/31/2021 NaN NaN NaN \n",
"1998669 2 07/07/2021 NaN Y NaN \n",
"\n",
" ALLERGIES \n",
"VAERS_ID \n",
"916600 Pcn and bee venom \n",
"916601 \"Dairy\" \n",
"916602 Shellfish \n",
"916603 Diclofenac, novacaine, lidocaine, pickles, tom... \n",
"916604 Na \n",
"... ... \n",
"1997120 none \n",
"1997121 penicillin, statin drugs, codeine \n",
"1997122 None \n",
"1998668 NaN \n",
"1998669 NKA \n",
"\n",
"[749067 rows x 34 columns]"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Preview the patient table; the printed rows are capped by the display.max_rows option.\n",
"# (A bare `df_patients_22.index` statement used to precede this line; its value was never\n",
"# rendered because only the last expression of a cell is displayed, so it was removed.)\n",
"df_patients_22"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "fb54ec47",
"metadata": {},
"outputs": [],
"source": [
"# Load the 2021 VAERS vaccine file, using VAERS_ID as the index.\n",
"# VAERS_ID can repeat in this file (the stored preview shows 2013746 three times),\n",
"# so the resulting index is not unique.\n",
"df_vax_22 = pd.read_csv(\n",
"    \"VAERS/2021VAERSData/2021VAERSVAX.csv\",\n",
"    index_col='VAERS_ID',\n",
"    encoding='latin1',\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "d8942466",
"metadata": {
"scrolled": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>VAX_TYPE</th>\n",
" <th>VAX_MANU</th>\n",
" <th>VAX_LOT</th>\n",
" <th>VAX_DOSE_SERIES</th>\n",
" <th>VAX_ROUTE</th>\n",
" <th>VAX_SITE</th>\n",
" <th>VAX_NAME</th>\n",
" </tr>\n",
" <tr>\n",
" <th>VAERS_ID</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>916600</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>037K20A</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916601</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>025L20A</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>RA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916602</th>\n",
" <td>COVID19</td>\n",
" <td>PFIZER\\BIONTECH</td>\n",
" <td>EL1284</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (PFIZER-BIONTECH))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916603</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>unknown</td>\n",
" <td>UNK</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916604</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>NaN</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2013746</th>\n",
" <td>HIBV</td>\n",
" <td>MERCK &amp; CO. INC.</td>\n",
" <td>T026960</td>\n",
" <td>UNK</td>\n",
" <td>IM</td>\n",
" <td>LL</td>\n",
" <td>HIB (PEDVAXHIB)</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2013746</th>\n",
" <td>PNC13</td>\n",
" <td>PFIZER\\WYETH</td>\n",
" <td>DR1779</td>\n",
" <td>UNK</td>\n",
" <td>IM</td>\n",
" <td>LL</td>\n",
" <td>PNEUMO (PREVNAR13)</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2013746</th>\n",
" <td>RV5</td>\n",
" <td>MERCK &amp; CO. INC.</td>\n",
" <td>1742458</td>\n",
" <td>UNK</td>\n",
" <td>PO</td>\n",
" <td>MO</td>\n",
" <td>ROTAVIRUS (ROTATEQ)</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2013757</th>\n",
" <td>DTAPIPV</td>\n",
" <td>GLAXOSMITHKLINE BIOLOGICALS</td>\n",
" <td>7P5J5</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>DTAP + IPV (KINRIX)</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2013757</th>\n",
" <td>MMRV</td>\n",
" <td>MERCK &amp; CO. INC.</td>\n",
" <td>T027111</td>\n",
" <td>1</td>\n",
" <td>SC</td>\n",
" <td>LA</td>\n",
" <td>MEASLES + MUMPS + RUBELLA + VARICELLA (PROQUAD)</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>793346 rows × 7 columns</p>\n",
"</div>"
],
"text/plain": [
" VAX_TYPE VAX_MANU VAX_LOT VAX_DOSE_SERIES \\\n",
"VAERS_ID \n",
"916600 COVID19 MODERNA 037K20A 1 \n",
"916601 COVID19 MODERNA 025L20A 1 \n",
"916602 COVID19 PFIZER\\BIONTECH EL1284 1 \n",
"916603 COVID19 MODERNA unknown UNK \n",
"916604 COVID19 MODERNA NaN 1 \n",
"... ... ... ... ... \n",
"2013746 HIBV MERCK & CO. INC. T026960 UNK \n",
"2013746 PNC13 PFIZER\\WYETH DR1779 UNK \n",
"2013746 RV5 MERCK & CO. INC. 1742458 UNK \n",
"2013757 DTAPIPV GLAXOSMITHKLINE BIOLOGICALS 7P5J5 1 \n",
"2013757 MMRV MERCK & CO. INC. T027111 1 \n",
"\n",
" VAX_ROUTE VAX_SITE VAX_NAME \n",
"VAERS_ID \n",
"916600 IM LA COVID19 (COVID19 (MODERNA)) \n",
"916601 IM RA COVID19 (COVID19 (MODERNA)) \n",
"916602 IM LA COVID19 (COVID19 (PFIZER-BIONTECH)) \n",
"916603 NaN NaN COVID19 (COVID19 (MODERNA)) \n",
"916604 IM LA COVID19 (COVID19 (MODERNA)) \n",
"... ... ... ... \n",
"2013746 IM LL HIB (PEDVAXHIB) \n",
"2013746 IM LL PNEUMO (PREVNAR13) \n",
"2013746 PO MO ROTAVIRUS (ROTATEQ) \n",
"2013757 IM LA DTAP + IPV (KINRIX) \n",
"2013757 SC LA MEASLES + MUMPS + RUBELLA + VARICELLA (PROQUAD) \n",
"\n",
"[793346 rows x 7 columns]"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Preview the vaccine table; the printed rows are capped by the display.max_rows option.\n",
"df_vax_22"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "d31c5225",
"metadata": {},
"outputs": [],
"source": [
"# Keep only the vaccine rows whose VAX_TYPE is exactly \"COVID19\".\n",
"df_COVID19_22 = df_vax_22.loc[df_vax_22[\"VAX_TYPE\"].eq(\"COVID19\")]"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "be2b57c9",
"metadata": {
"scrolled": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>VAX_TYPE</th>\n",
" <th>VAX_MANU</th>\n",
" <th>VAX_LOT</th>\n",
" <th>VAX_DOSE_SERIES</th>\n",
" <th>VAX_ROUTE</th>\n",
" <th>VAX_SITE</th>\n",
" <th>VAX_NAME</th>\n",
" </tr>\n",
" <tr>\n",
" <th>VAERS_ID</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>916600</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>037K20A</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916601</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>025L20A</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>RA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916602</th>\n",
" <td>COVID19</td>\n",
" <td>PFIZER\\BIONTECH</td>\n",
" <td>EL1284</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (PFIZER-BIONTECH))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916603</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>unknown</td>\n",
" <td>UNK</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916604</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>NaN</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2005264</th>\n",
" <td>COVID19</td>\n",
" <td>PFIZER\\BIONTECH</td>\n",
" <td>EN6208</td>\n",
" <td>UNK</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>COVID19 (COVID19 (PFIZER-BIONTECH))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2005274</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>028L20A</td>\n",
" <td>UNK</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2005274</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>014M20A</td>\n",
" <td>UNK</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2005290</th>\n",
" <td>COVID19</td>\n",
" <td>JANSSEN</td>\n",
" <td>1805020</td>\n",
" <td>UNK</td>\n",
" <td>IM</td>\n",
" <td>NaN</td>\n",
" <td>COVID19 (COVID19 (JANSSEN))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2009884</th>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>737971 rows × 7 columns</p>\n",
"</div>"
],
"text/plain": [
" VAX_TYPE VAX_MANU VAX_LOT VAX_DOSE_SERIES VAX_ROUTE \\\n",
"VAERS_ID \n",
"916600 COVID19 MODERNA 037K20A 1 IM \n",
"916601 COVID19 MODERNA 025L20A 1 IM \n",
"916602 COVID19 PFIZER\\BIONTECH EL1284 1 IM \n",
"916603 COVID19 MODERNA unknown UNK NaN \n",
"916604 COVID19 MODERNA NaN 1 IM \n",
"... ... ... ... ... ... \n",
"2005264 COVID19 PFIZER\\BIONTECH EN6208 UNK NaN \n",
"2005274 COVID19 MODERNA 028L20A UNK IM \n",
"2005274 COVID19 MODERNA 014M20A UNK IM \n",
"2005290 COVID19 JANSSEN 1805020 UNK IM \n",
"2009884 COVID19 MODERNA NaN 2 IM \n",
"\n",
" VAX_SITE VAX_NAME \n",
"VAERS_ID \n",
"916600 LA COVID19 (COVID19 (MODERNA)) \n",
"916601 RA COVID19 (COVID19 (MODERNA)) \n",
"916602 LA COVID19 (COVID19 (PFIZER-BIONTECH)) \n",
"916603 NaN COVID19 (COVID19 (MODERNA)) \n",
"916604 LA COVID19 (COVID19 (MODERNA)) \n",
"... ... ... \n",
"2005264 NaN COVID19 (COVID19 (PFIZER-BIONTECH)) \n",
"2005274 LA COVID19 (COVID19 (MODERNA)) \n",
"2005274 LA COVID19 (COVID19 (MODERNA)) \n",
"2005290 NaN COVID19 (COVID19 (JANSSEN)) \n",
"2009884 LA COVID19 (COVID19 (MODERNA)) \n",
"\n",
"[737971 rows x 7 columns]"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Preview the COVID19-only subset of the vaccine table.\n",
"df_COVID19_22"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "8c432ab2",
"metadata": {},
"outputs": [],
"source": [
"# Inner-join (the pandas default) the patient rows to the COVID19 vaccine rows\n",
"# on the VAERS_ID index that both frames were loaded with.\n",
"df_patients_COVID19 = df_patients_22.merge(\n",
"    df_COVID19_22,\n",
"    left_index=True,\n",
"    right_index=True,\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "fef882ff",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"((749067, 34), (737971, 7), (737971, 41))"
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Compare (rows, columns) of both merge inputs and of the merged result.\n",
"tuple(frame.shape for frame in (df_patients_22, df_COVID19_22, df_patients_COVID19))"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "6ce15322",
"metadata": {
"scrolled": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>RECVDATE</th>\n",
" <th>STATE</th>\n",
" <th>AGE_YRS</th>\n",
" <th>CAGE_YR</th>\n",
" <th>CAGE_MO</th>\n",
" <th>SEX</th>\n",
" <th>RPT_DATE</th>\n",
" <th>SYMPTOM_TEXT</th>\n",
" <th>DIED</th>\n",
" <th>DATEDIED</th>\n",
" <th>L_THREAT</th>\n",
" <th>ER_VISIT</th>\n",
" <th>HOSPITAL</th>\n",
" <th>HOSPDAYS</th>\n",
" <th>X_STAY</th>\n",
" <th>DISABLE</th>\n",
" <th>RECOVD</th>\n",
" <th>VAX_DATE</th>\n",
" <th>ONSET_DATE</th>\n",
" <th>NUMDAYS</th>\n",
" <th>LAB_DATA</th>\n",
" <th>V_ADMINBY</th>\n",
" <th>V_FUNDBY</th>\n",
" <th>OTHER_MEDS</th>\n",
" <th>CUR_ILL</th>\n",
" <th>HISTORY</th>\n",
" <th>PRIOR_VAX</th>\n",
" <th>SPLTTYPE</th>\n",
" <th>FORM_VERS</th>\n",
" <th>TODAYS_DATE</th>\n",
" <th>BIRTH_DEFECT</th>\n",
" <th>OFC_VISIT</th>\n",
" <th>ER_ED_VISIT</th>\n",
" <th>ALLERGIES</th>\n",
" <th>VAX_TYPE</th>\n",
" <th>VAX_MANU</th>\n",
" <th>VAX_LOT</th>\n",
" <th>VAX_DOSE_SERIES</th>\n",
" <th>VAX_ROUTE</th>\n",
" <th>VAX_SITE</th>\n",
" <th>VAX_NAME</th>\n",
" </tr>\n",
" <tr>\n",
" <th>VAERS_ID</th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>916600</th>\n",
" <td>01/01/2021</td>\n",
" <td>TX</td>\n",
" <td>33.0</td>\n",
" <td>33.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>Right side of epiglottis swelled up and hinder...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>12/28/2020</td>\n",
" <td>12/30/2020</td>\n",
" <td>2.0</td>\n",
" <td>None</td>\n",
" <td>PVT</td>\n",
" <td>NaN</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>01/01/2021</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>Pcn and bee venom</td>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>037K20A</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916601</th>\n",
" <td>01/01/2021</td>\n",
" <td>CA</td>\n",
" <td>73.0</td>\n",
" <td>73.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>Approximately 30 min post vaccination administ...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>12/31/2020</td>\n",
" <td>12/31/2020</td>\n",
" <td>0.0</td>\n",
" <td>NaN</td>\n",
" <td>SEN</td>\n",
" <td>NaN</td>\n",
" <td>Patient residing at nursing facility. See pati...</td>\n",
" <td>Patient residing at nursing facility. See pati...</td>\n",
" <td>Patient residing at nursing facility. See pati...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>01/01/2021</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>\"Dairy\"</td>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>025L20A</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>RA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916602</th>\n",
" <td>01/01/2021</td>\n",
" <td>WA</td>\n",
" <td>23.0</td>\n",
" <td>23.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>About 15 minutes after receiving the vaccine, ...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>U</td>\n",
" <td>12/31/2020</td>\n",
" <td>12/31/2020</td>\n",
" <td>0.0</td>\n",
" <td>NaN</td>\n",
" <td>SEN</td>\n",
" <td>NaN</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" <td>None</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>01/01/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>Shellfish</td>\n",
" <td>COVID19</td>\n",
" <td>PFIZER\\BIONTECH</td>\n",
" <td>EL1284</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (PFIZER-BIONTECH))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916603</th>\n",
" <td>01/01/2021</td>\n",
" <td>WA</td>\n",
" <td>58.0</td>\n",
" <td>58.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>extreme fatigue, dizziness,. could not lift my...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>12/23/2020</td>\n",
" <td>12/23/2020</td>\n",
" <td>0.0</td>\n",
" <td>none</td>\n",
" <td>WRK</td>\n",
" <td>NaN</td>\n",
" <td>none</td>\n",
" <td>kidney infection</td>\n",
" <td>diverticulitis, mitral valve prolapse, osteoar...</td>\n",
" <td>got measles from measel shot, mums from mumps ...</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>01/01/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Diclofenac, novacaine, lidocaine, pickles, tom...</td>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>unknown</td>\n",
" <td>UNK</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>916604</th>\n",
" <td>01/01/2021</td>\n",
" <td>TX</td>\n",
" <td>47.0</td>\n",
" <td>47.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>Injection site swelling, redness, warm to the ...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>N</td>\n",
" <td>12/22/2020</td>\n",
" <td>12/29/2020</td>\n",
" <td>7.0</td>\n",
" <td>NaN</td>\n",
" <td>PUB</td>\n",
" <td>NaN</td>\n",
" <td>Na</td>\n",
" <td>Na</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>01/01/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Na</td>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>NaN</td>\n",
" <td>1</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2005264</th>\n",
" <td>04/24/2021</td>\n",
" <td>HI</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>M</td>\n",
" <td>NaN</td>\n",
" <td>None</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>PVT</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>04/24/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>COVID19</td>\n",
" <td>PFIZER\\BIONTECH</td>\n",
" <td>EN6208</td>\n",
" <td>UNK</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>COVID19 (COVID19 (PFIZER-BIONTECH))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2005274</th>\n",
" <td>04/26/2021</td>\n",
" <td>NC</td>\n",
" <td>65.0</td>\n",
" <td>65.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>New onset nasal herpes simplex coming up about...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>03/01/2021</td>\n",
" <td>03/10/2021</td>\n",
" <td>9.0</td>\n",
" <td>NaN</td>\n",
" <td>PVT</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>04/24/2021</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>028L20A</td>\n",
" <td>UNK</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2005274</th>\n",
" <td>04/26/2021</td>\n",
" <td>NC</td>\n",
" <td>65.0</td>\n",
" <td>65.0</td>\n",
" <td>NaN</td>\n",
" <td>F</td>\n",
" <td>NaN</td>\n",
" <td>New onset nasal herpes simplex coming up about...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>03/01/2021</td>\n",
" <td>03/10/2021</td>\n",
" <td>9.0</td>\n",
" <td>NaN</td>\n",
" <td>PVT</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>04/24/2021</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>014M20A</td>\n",
" <td>UNK</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2005290</th>\n",
" <td>04/21/2021</td>\n",
" <td>MI</td>\n",
" <td>44.0</td>\n",
" <td>44.0</td>\n",
" <td>NaN</td>\n",
" <td>M</td>\n",
" <td>NaN</td>\n",
" <td>5 weeks daily; Sweats, Nausea, Light headed, L...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>N</td>\n",
" <td>03/17/2021</td>\n",
" <td>03/18/2021</td>\n",
" <td>1.0</td>\n",
" <td>unremarkable; CBC, Comp Panel, Sed rate, D-dim...</td>\n",
" <td>PHM</td>\n",
" <td>NaN</td>\n",
" <td>see list</td>\n",
" <td>NaN</td>\n",
" <td>insulin dependant diabetes, hypertension, obes...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>04/26/2021</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>NaN</td>\n",
" <td>Bactrim, cephalexin, penicillin</td>\n",
" <td>COVID19</td>\n",
" <td>JANSSEN</td>\n",
" <td>1805020</td>\n",
" <td>UNK</td>\n",
" <td>IM</td>\n",
" <td>NaN</td>\n",
" <td>COVID19 (COVID19 (JANSSEN))</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2009884</th>\n",
" <td>04/26/2021</td>\n",
" <td>NaN</td>\n",
" <td>62.0</td>\n",
" <td>61.0</td>\n",
" <td>NaN</td>\n",
" <td>M</td>\n",
" <td>NaN</td>\n",
" <td>CoughWheeze Chills, night sweats, arm sore, ey...</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>Y</td>\n",
" <td>04/21/2021</td>\n",
" <td>04/22/2021</td>\n",
" <td>1.0</td>\n",
" <td>NaN</td>\n",
" <td>OTH</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>04/26/2021</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>NaN</td>\n",
" <td>COVID19</td>\n",
" <td>MODERNA</td>\n",
" <td>NaN</td>\n",
" <td>2</td>\n",
" <td>IM</td>\n",
" <td>LA</td>\n",
" <td>COVID19 (COVID19 (MODERNA))</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>737971 rows × 41 columns</p>\n",
"</div>"
],
"text/plain": [
" RECVDATE STATE AGE_YRS CAGE_YR CAGE_MO SEX RPT_DATE \\\n",
"VAERS_ID \n",
"916600 01/01/2021 TX 33.0 33.0 NaN F NaN \n",
"916601 01/01/2021 CA 73.0 73.0 NaN F NaN \n",
"916602 01/01/2021 WA 23.0 23.0 NaN F NaN \n",
"916603 01/01/2021 WA 58.0 58.0 NaN F NaN \n",
"916604 01/01/2021 TX 47.0 47.0 NaN F NaN \n",
"... ... ... ... ... ... .. ... \n",
"2005264 04/24/2021 HI NaN NaN NaN M NaN \n",
"2005274 04/26/2021 NC 65.0 65.0 NaN F NaN \n",
"2005274 04/26/2021 NC 65.0 65.0 NaN F NaN \n",
"2005290 04/21/2021 MI 44.0 44.0 NaN M NaN \n",
"2009884 04/26/2021 NaN 62.0 61.0 NaN M NaN \n",
"\n",
" SYMPTOM_TEXT DIED DATEDIED \\\n",
"VAERS_ID \n",
"916600 Right side of epiglottis swelled up and hinder... NaN NaN \n",
"916601 Approximately 30 min post vaccination administ... NaN NaN \n",
"916602 About 15 minutes after receiving the vaccine, ... NaN NaN \n",
"916603 extreme fatigue, dizziness,. could not lift my... NaN NaN \n",
"916604 Injection site swelling, redness, warm to the ... NaN NaN \n",
"... ... ... ... \n",
"2005264 None NaN NaN \n",
"2005274 New onset nasal herpes simplex coming up about... NaN NaN \n",
"2005274 New onset nasal herpes simplex coming up about... NaN NaN \n",
"2005290 5 weeks daily; Sweats, Nausea, Light headed, L... NaN NaN \n",
"2009884 CoughWheeze Chills, night sweats, arm sore, ey... NaN NaN \n",
"\n",
" L_THREAT ER_VISIT HOSPITAL HOSPDAYS X_STAY DISABLE RECOVD \\\n",
"VAERS_ID \n",
"916600 NaN NaN NaN NaN NaN NaN Y \n",
"916601 NaN NaN NaN NaN NaN NaN Y \n",
"916602 NaN NaN NaN NaN NaN NaN U \n",
"916603 NaN NaN NaN NaN NaN NaN Y \n",
"916604 NaN NaN NaN NaN NaN NaN N \n",
"... ... ... ... ... ... ... ... \n",
"2005264 NaN NaN NaN NaN NaN NaN Y \n",
"2005274 NaN NaN NaN NaN NaN NaN NaN \n",
"2005274 NaN NaN NaN NaN NaN NaN NaN \n",
"2005290 NaN NaN NaN NaN NaN NaN N \n",
"2009884 NaN NaN NaN NaN NaN NaN Y \n",
"\n",
" VAX_DATE ONSET_DATE NUMDAYS \\\n",
"VAERS_ID \n",
"916600 12/28/2020 12/30/2020 2.0 \n",
"916601 12/31/2020 12/31/2020 0.0 \n",
"916602 12/31/2020 12/31/2020 0.0 \n",
"916603 12/23/2020 12/23/2020 0.0 \n",
"916604 12/22/2020 12/29/2020 7.0 \n",
"... ... ... ... \n",
"2005264 NaN NaN NaN \n",
"2005274 03/01/2021 03/10/2021 9.0 \n",
"2005274 03/01/2021 03/10/2021 9.0 \n",
"2005290 03/17/2021 03/18/2021 1.0 \n",
"2009884 04/21/2021 04/22/2021 1.0 \n",
"\n",
" LAB_DATA V_ADMINBY \\\n",
"VAERS_ID \n",
"916600 None PVT \n",
"916601 NaN SEN \n",
"916602 NaN SEN \n",
"916603 none WRK \n",
"916604 NaN PUB \n",
"... ... ... \n",
"2005264 NaN PVT \n",
"2005274 NaN PVT \n",
"2005274 NaN PVT \n",
"2005290 unremarkable; CBC, Comp Panel, Sed rate, D-dim... PHM \n",
"2009884 NaN OTH \n",
"\n",
" V_FUNDBY OTHER_MEDS \\\n",
"VAERS_ID \n",
"916600 NaN None \n",
"916601 NaN Patient residing at nursing facility. See pati... \n",
"916602 NaN None \n",
"916603 NaN none \n",
"916604 NaN Na \n",
"... ... ... \n",
"2005264 NaN NaN \n",
"2005274 NaN NaN \n",
"2005274 NaN NaN \n",
"2005290 NaN see list \n",
"2009884 NaN NaN \n",
"\n",
" CUR_ILL \\\n",
"VAERS_ID \n",
"916600 None \n",
"916601 Patient residing at nursing facility. See pati... \n",
"916602 None \n",
"916603 kidney infection \n",
"916604 Na \n",
"... ... \n",
"2005264 NaN \n",
"2005274 NaN \n",
"2005274 NaN \n",
"2005290 NaN \n",
"2009884 NaN \n",
"\n",
" HISTORY \\\n",
"VAERS_ID \n",
"916600 None \n",
"916601 Patient residing at nursing facility. See pati... \n",
"916602 None \n",
"916603 diverticulitis, mitral valve prolapse, osteoar... \n",
"916604 NaN \n",
"... ... \n",
"2005264 NaN \n",
"2005274 NaN \n",
"2005274 NaN \n",
"2005290 insulin dependant diabetes, hypertension, obes... \n",
"2009884 NaN \n",
"\n",
" PRIOR_VAX SPLTTYPE \\\n",
"VAERS_ID \n",
"916600 NaN NaN \n",
"916601 NaN NaN \n",
"916602 NaN NaN \n",
"916603 got measles from measel shot, mums from mumps ... NaN \n",
"916604 NaN NaN \n",
"... ... ... \n",
"2005264 NaN NaN \n",
"2005274 NaN NaN \n",
"2005274 NaN NaN \n",
"2005290 NaN NaN \n",
"2009884 NaN NaN \n",
"\n",
" FORM_VERS TODAYS_DATE BIRTH_DEFECT OFC_VISIT ER_ED_VISIT \\\n",
"VAERS_ID \n",
"916600 2 01/01/2021 NaN Y NaN \n",
"916601 2 01/01/2021 NaN Y NaN \n",
"916602 2 01/01/2021 NaN NaN Y \n",
"916603 2 01/01/2021 NaN NaN NaN \n",
"916604 2 01/01/2021 NaN NaN NaN \n",
"... ... ... ... ... ... \n",
"2005264 2 04/24/2021 NaN NaN NaN \n",
"2005274 2 04/24/2021 NaN Y NaN \n",
"2005274 2 04/24/2021 NaN Y NaN \n",
"2005290 2 04/26/2021 NaN Y NaN \n",
"2009884 2 04/26/2021 NaN NaN NaN \n",
"\n",
" ALLERGIES VAX_TYPE \\\n",
"VAERS_ID \n",
"916600 Pcn and bee venom COVID19 \n",
"916601 \"Dairy\" COVID19 \n",
"916602 Shellfish COVID19 \n",
"916603 Diclofenac, novacaine, lidocaine, pickles, tom... COVID19 \n",
"916604 Na COVID19 \n",
"... ... ... \n",
"2005264 NaN COVID19 \n",
"2005274 NaN COVID19 \n",
"2005274 NaN COVID19 \n",
"2005290 Bactrim, cephalexin, penicillin COVID19 \n",
"2009884 NaN COVID19 \n",
"\n",
" VAX_MANU VAX_LOT VAX_DOSE_SERIES VAX_ROUTE VAX_SITE \\\n",
"VAERS_ID \n",
"916600 MODERNA 037K20A 1 IM LA \n",
"916601 MODERNA 025L20A 1 IM RA \n",
"916602 PFIZER\\BIONTECH EL1284 1 IM LA \n",
"916603 MODERNA unknown UNK NaN NaN \n",
"916604 MODERNA NaN 1 IM LA \n",
"... ... ... ... ... ... \n",
"2005264 PFIZER\\BIONTECH EN6208 UNK NaN NaN \n",
"2005274 MODERNA 028L20A UNK IM LA \n",
"2005274 MODERNA 014M20A UNK IM LA \n",
"2005290 JANSSEN 1805020 UNK IM NaN \n",
"2009884 MODERNA NaN 2 IM LA \n",
"\n",
" VAX_NAME \n",
"VAERS_ID \n",
"916600 COVID19 (COVID19 (MODERNA)) \n",
"916601 COVID19 (COVID19 (MODERNA)) \n",
"916602 COVID19 (COVID19 (PFIZER-BIONTECH)) \n",
"916603 COVID19 (COVID19 (MODERNA)) \n",
"916604 COVID19 (COVID19 (MODERNA)) \n",
"... ... \n",
"2005264 COVID19 (COVID19 (PFIZER-BIONTECH)) \n",
"2005274 COVID19 (COVID19 (MODERNA)) \n",
"2005274 COVID19 (COVID19 (MODERNA)) \n",
"2005290 COVID19 (COVID19 (JANSSEN)) \n",
"2009884 COVID19 (COVID19 (MODERNA)) \n",
"\n",
"[737971 rows x 41 columns]"
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# pd.set_option('display.max_rows', 100)\n",
"df_patients_COVID19"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "233bc590",
"metadata": {},
"outputs": [],
"source": [
"df_PFIZER_BIONTECH = df_patients_COVID19[df_patients_COVID19[\"VAX_MANU\"] == \"MODERNA\"]"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "86e0e4f2",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"<class 'pandas.core.frame.DataFrame'>\n",
"Int64Index: 339877 entries, 916600 to 2009884\n",
"Data columns (total 41 columns):\n",
" # Column Non-Null Count Dtype \n",
"--- ------ -------------- ----- \n",
" 0 RECVDATE 339877 non-null object \n",
" 1 STATE 302148 non-null object \n",
" 2 AGE_YRS 309475 non-null float64\n",
" 3 CAGE_YR 302392 non-null float64\n",
" 4 CAGE_MO 561 non-null float64\n",
" 5 SEX 339877 non-null object \n",
" 6 RPT_DATE 271 non-null object \n",
" 7 SYMPTOM_TEXT 339774 non-null object \n",
" 8 DIED 4694 non-null object \n",
" 9 DATEDIED 4392 non-null object \n",
" 10 L_THREAT 4753 non-null object \n",
" 11 ER_VISIT 26 non-null object \n",
" 12 HOSPITAL 20841 non-null object \n",
" 13 HOSPDAYS 13803 non-null float64\n",
" 14 X_STAY 152 non-null object \n",
" 15 DISABLE 4875 non-null object \n",
" 16 RECOVD 308614 non-null object \n",
" 17 VAX_DATE 323994 non-null object \n",
" 18 ONSET_DATE 311854 non-null object \n",
" 19 NUMDAYS 306537 non-null float64\n",
" 20 LAB_DATA 127507 non-null object \n",
" 21 V_ADMINBY 339877 non-null object \n",
" 22 V_FUNDBY 284 non-null object \n",
" 23 OTHER_MEDS 200657 non-null object \n",
" 24 CUR_ILL 163361 non-null object \n",
" 25 HISTORY 203490 non-null object \n",
" 26 PRIOR_VAX 18047 non-null object \n",
" 27 SPLTTYPE 97511 non-null object \n",
" 28 FORM_VERS 339877 non-null int64 \n",
" 29 TODAYS_DATE 337268 non-null object \n",
" 30 BIRTH_DEFECT 191 non-null object \n",
" 31 OFC_VISIT 61181 non-null object \n",
" 32 ER_ED_VISIT 34734 non-null object \n",
" 33 ALLERGIES 178840 non-null object \n",
" 34 VAX_TYPE 339877 non-null object \n",
" 35 VAX_MANU 339877 non-null object \n",
" 36 VAX_LOT 236149 non-null object \n",
" 37 VAX_DOSE_SERIES 339478 non-null object \n",
" 38 VAX_ROUTE 301519 non-null object \n",
" 39 VAX_SITE 246947 non-null object \n",
" 40 VAX_NAME 339877 non-null object \n",
"dtypes: float64(5), int64(1), object(35)\n",
"memory usage: 108.9+ MB\n"
]
}
],
"source": [
"df_PFIZER_BIONTECH.info()"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "4b3cb943",
"metadata": {},
"outputs": [],
"source": [
"# table = pd.pivot_table(df_PFIZER_BIONTECH, values='DIED', columns=['DIED'], aggfunc=np.sum)"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "349da946",
"metadata": {
"scrolled": false
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>VAX_LOT</th>\n",
" </tr>\n",
" <tr>\n",
" <th>VAERS_ID</th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>917117</th>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>917790</th>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>917793</th>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>918065</th>\n",
" <td>025J20-2A</td>\n",
" </tr>\n",
" <tr>\n",
" <th>918487</th>\n",
" <td>011L2Oa</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1995984</th>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1996537</th>\n",
" <td>037F21A</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1996542</th>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1996546</th>\n",
" <td>NaN</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1996867</th>\n",
" <td>003A21A</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>4694 rows × 1 columns</p>\n",
"</div>"
],
"text/plain": [
" VAX_LOT\n",
"VAERS_ID \n",
"917117 NaN\n",
"917790 NaN\n",
"917793 NaN\n",
"918065 025J20-2A\n",
"918487 011L2Oa\n",
"... ...\n",
"1995984 NaN\n",
"1996537 037F21A\n",
"1996542 NaN\n",
"1996546 NaN\n",
"1996867 003A21A\n",
"\n",
"[4694 rows x 1 columns]"
]
},
"execution_count": 16,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df = df_PFIZER_BIONTECH[df_PFIZER_BIONTECH['DIED']=='Y'][['VAX_LOT']]\n",
"df"
]
},
{
"cell_type": "code",
"execution_count": 17,
"id": "9c5ff2fd",
"metadata": {
"scrolled": false
},
"outputs": [
{
"data": {
"text/plain": [
"VAX_LOT \n",
"039K20A 93\n",
"012L20A 72\n",
"010M20A 69\n",
"013L20A 68\n",
"030L20A 54\n",
"037K20A 53\n",
"016M20A 53\n",
"012M20A 53\n",
"029L20A 51\n",
"024M20A 51\n",
"025L20A 50\n",
"022M20A 50\n",
"027L20A 48\n",
"010A21A 48\n",
"013M20A 45\n",
"026A21A 45\n",
"031L20A 45\n",
"015M20A 45\n",
"007M20A 44\n",
"026L20A 42\n",
"031M20A 40\n",
"013A21A 39\n",
"011A21A 39\n",
"032L20A 38\n",
"004M20A 38\n",
"030A21A 38\n",
"011J20A 37\n",
"011M20A 37\n",
"028L20A 35\n",
"011L20A 35\n",
"041L20A 35\n",
"025J20-2A 32\n",
"Unknown 32\n",
"030M20A 31\n",
"012A21A 31\n",
"032H20A 31\n",
"040A21A 30\n",
"032M20A 30\n",
"043L20A 30\n",
"042L20A 29\n",
"006M20A 29\n",
"023M20A 29\n",
"002A21A 27\n",
"017B21A 26\n",
"036A21A 26\n",
"027A21A 26\n",
"048A21A 23\n",
"047A21A 22\n",
"006B21A 22\n",
"003A21A 22\n",
"unknown 22\n",
"025B21A 21\n",
"020B21A 21\n",
"044A21A 20\n",
"025A21A 20\n",
"038K20A 20\n",
"014M20A 19\n",
"031A21A 18\n",
"021B21A 18\n",
"003B21A 18\n",
"007B21A 17\n",
"029A21A 17\n",
"031B21A 17\n",
"038A21A 16\n",
"001A21A 15\n",
"001B21A 15\n",
"019B21A 14\n",
"045A21A 14\n",
"018B21A 14\n",
"025J20A 14\n",
"046A21A 14\n",
"036B21A 14\n",
"026B21A 13\n",
"016B21A 13\n",
"027B21A 13\n",
"008B21A 13\n",
"028A21A 12\n",
"002C21A 12\n",
"029K20A 11\n",
"009C21A 11\n",
"040B21A 11\n",
"038B21A 11\n",
"002B21A 11\n",
"039B21A 11\n",
"047B21A 10\n",
"006C21A 10\n",
"045B21A 10\n",
"048B21A 10\n",
"046B21A 10\n",
"030H21B 10\n",
"008C21A 9\n",
"030B21A 9\n",
"UNKNOWN 9\n",
"001C21A 9\n",
"039A21A 8\n",
"017C21A 8\n",
"044B21A 8\n",
"032B21A 8\n",
"939906 8\n",
"004C21A 8\n",
"038C21A 8\n",
"042B21A 7\n",
"035C21A 7\n",
"047C21A 7\n",
"025C21A 7\n",
"037A21B 7\n",
"043B21A 7\n",
"041C21A 7\n",
"030m20a 6\n",
"016C21A 6\n",
"048C21A 6\n",
"006D21A 6\n",
"NO LOT # AVAILA 6\n",
"003C21A 6\n",
"027C21A 6\n",
"037B21A 6\n",
"058H21A 6\n",
"052E21A 6\n",
"007C21A 6\n",
"013F21A 5\n",
"008B21-2A 5\n",
"033C21A 5\n",
"005C21A 5\n",
"030a21a 5\n",
"026a21a 5\n",
"025J202A 5\n",
"033B21A 4\n",
"037k20a 4\n",
"003b21a 4\n",
"024C21A 4\n",
"008B212A 4\n",
"026D21A 4\n",
"040a21a 4\n",
"065F21A 4\n",
"022C21A 4\n",
"021C21A 4\n",
"031l20a 4\n",
"041B21A 4\n",
"032F21A 4\n",
"024m20a 4\n",
"051F21A 4\n",
"015m20a 3\n",
"002a21a 3\n",
"038k20a 3\n",
"002c21a 3\n",
"007m20a 3\n",
"026C21A 3\n",
"091D21A 3\n",
"025b21a 3\n",
"062E21A 3\n",
"016m20a 3\n",
"027b21a 3\n",
"039K208 3\n",
"017E21A 3\n",
"017F21A 3\n",
"039k20a 3\n",
"020f21a 3\n",
"076C21A 3\n",
"03M20A 3\n",
"071F21A 3\n",
"039K20-2A 3\n",
"051C21A 3\n",
"? 3\n",
"037k20A 3\n",
"045C21A 3\n",
"033c21a 3\n",
"009D21A 3\n",
"036C21A 3\n",
"010a21a 3\n",
"046C21A 3\n",
"CVO224 3\n",
"011F21A 3\n",
"Moderna 3\n",
"030l20a 3\n",
"048F21A 3\n",
"012H21B 3\n",
"004m20a 3\n",
"069F21A 3\n",
"014C21A 3\n",
"050C21A 3\n",
"013a21a 3\n",
"003F21A 3\n",
"042B212A 2\n",
"066F21A 2\n",
"039k20-2a 2\n",
"039k20A 2\n",
"035c21A 2\n",
"046AZ1A 2\n",
"054C21A 2\n",
"040b21a 2\n",
"032l20a 2\n",
"038a21a 2\n",
"034F21A 2\n",
"024M2OA 2\n",
"034C21A 2\n",
"045a21a 2\n",
"027H21B 2\n",
"045J21A 2\n",
"023m20a 2\n",
"036a21a 2\n",
"041620A 2\n",
"025J20 2\n",
"049C21A 2\n",
"048b21a 2\n",
"048a21a 2\n",
"043821A 2\n",
"058F21A 2\n",
"057G20A 2\n",
"037a21b 2\n",
"031A21 2\n",
"037K2OA 2\n",
"062G20A 2\n",
"050e21a 2\n",
"053E21A 2\n",
"037C21A 2\n",
"047a21a 2\n",
"043220A 2\n",
"062e21a 2\n",
"037B31A 2\n",
"027C20A 2\n",
"052c21a 2\n",
"01A21A 2\n",
"023C21A 2\n",
"007M20 2\n",
"13L20A 2\n",
"16B21A 2\n",
"004c21a 2\n",
"005c21a 2\n",
"014m20a 2\n",
"014c21a 2\n",
"014F21A 2\n",
"013m20a 2\n",
"013l20a 2\n",
"MOD039K20A 2\n",
"006m20a 2\n",
"013L20a 2\n",
"013120A 2\n",
"UNKNOWN/NA 2\n",
"012m20a 2\n",
"42L20A 2\n",
"007m20A 2\n",
"012F21A 2\n",
"011m20a 2\n",
"EN6199 2\n",
"939902 2\n",
"939905 2\n",
"948548 2\n",
"022m20a 2\n",
"011D21A 2\n",
"01021A 2\n",
"003a21a 2\n",
"006821A 2\n",
"017c21a 2\n",
"unk 2\n",
"unavailable 2\n",
"001a21a 2\n",
"001121A 2\n",
"022B21A 2\n",
"019F21A 2\n",
"045Ax119 1\n",
"not documented 1\n",
"ER8727 1\n",
"042B1-2A 1\n",
"041220A 1\n",
"ER8729 1\n",
"045A21H 1\n",
"EW0158 1\n",
"EW0186 1\n",
"n/A 1\n",
"mRNA1273 1\n",
"G38A21A 1\n",
"EN6200 1\n",
"EN604 1\n",
"unavailable (pl 1\n",
"EL9266 1\n",
"EL1283 1\n",
"EL3247 1\n",
"unknown, check 1\n",
"EL3248 1\n",
"EL3302 1\n",
"EL9261 1\n",
"046821A 1\n",
"Given on 7/20/2 1\n",
"040D21A 1\n",
"ELO140 1\n",
"040M20A 1\n",
"04613212 1\n",
"ELP264 1\n",
"EM9810 1\n",
"c039b21a 1\n",
"LOT: 011L20A Ex 1\n",
"Given on 8/17/2 1\n",
"U11620A or 6111 1\n",
"Not provided 1\n",
"Unknow 1\n",
"O-012L20A 1\n",
"O-031M20A 1\n",
"O11L20A 1\n",
"O13L20A 1\n",
"O14MZOA 1\n",
"0421321A 1\n",
"O31B21A 1\n",
"O4SC21A 1\n",
"O54C21A 1\n",
"042b21-2a 1\n",
"Unk 1\n",
"RA 5190 1\n",
"RA5190 1\n",
"041l20A 1\n",
"041MZ0A 1\n",
"041MZ017 1\n",
"Y13A21A 1\n",
"044b21a 1\n",
"044a21a 1\n",
"ZTC540693 1\n",
"Lot#007M20A, # 1\n",
"MOD 040C21A 1\n",
"MOD/013L20A 1\n",
"W1010A21A 1\n",
"VO1B21F 1\n",
"Moderna 021C21A 1\n",
"044921A 1\n",
"Moderna/039K20A 1\n",
"041LAUA 1\n",
"E261283 1\n",
"043L20A 02/10/2 1\n",
"EL0140 1\n",
"CO3A21A 1\n",
"046B23A 1\n",
"088D214 1\n",
"061e21A 1\n",
"061F21A 1\n",
"061B21A 1\n",
"05E214 1\n",
"08B21A 1\n",
"059E21A 1\n",
"059A21A 1\n",
"0c1a21a 1\n",
"102627 1\n",
"1273 1\n",
"058f21a 1\n",
"12M20A 1\n",
"13508314 1\n",
"1442 1\n",
"14M20A 1\n",
"1538554 1\n",
"15M20A 1\n",
"088D21A 1\n",
"0880021A 1\n",
"054c21a 1\n",
"085A21A 1\n",
"070M20A 1\n",
"067F21A 1\n",
"073K20A 1\n",
"0746C21A 1\n",
"077L20A 1\n",
"077c21b 1\n",
"066F212 1\n",
"066D 1\n",
"040C21A 1\n",
"078C21A 1\n",
"078c21a 1\n",
"07B21A 1\n",
"07L20A 1\n",
"065F214 1\n",
"07M20A 1\n",
"064H21a 1\n",
"0819E21A 1\n",
"168342635 1\n",
"17B21A 1\n",
"Don?t know 1\n",
"37K20A 1\n",
"048c21a 1\n",
"5/4/2021 1\n",
"623MZ0A 1\n",
"693894 1\n",
"80777-0273-99 1\n",
"91301 1\n",
"939901 1\n",
"048B211A 1\n",
"939909 1\n",
"A-HRSA-043B2 1\n",
"047AZIA 1\n",
"Congestive Hear 1\n",
"Covid Moderna 0 1\n",
"D06B7 or 21A 1\n",
"046b21a 1\n",
"046azia 1\n",
"D12L20A 1\n",
"38077727399 1\n",
"310M20A 1\n",
"210414-015 1\n",
"04A21A 1\n",
"053C21A 1\n",
"052e21a 1\n",
"23M20A 1\n",
"052EZ1A 1\n",
"24M20A 1\n",
"2599133 1\n",
"26L20A 1\n",
"051E21A 1\n",
"27C21A 1\n",
"050ez1a 1\n",
"28L20A0 1\n",
"29k21A 1\n",
"050E2114 1\n",
"309K20A 1\n",
"04TAZ1A 1\n",
"04DC21A 1\n",
"04C21A 1\n",
"#027L20A 1\n",
"031L20 A 1\n",
"03ZM20A 1\n",
"017821A 1\n",
"012M20a 1\n",
"012L20R 1\n",
"0124214 1\n",
"012120a 1\n",
"011j20A 1\n",
"011f21a 1\n",
"011a21a 1\n",
"011M208 1\n",
"011M202A 1\n",
"011L2Oa 1\n",
"011L20a 1\n",
"011J220A 1\n",
"011J20A17691231 1\n",
"011J204 1\n",
"011I20A 1\n",
"011AZ1A 1\n",
"01120A 1\n",
"0111Z0A 1\n",
"011021A 1\n",
"011 1\n",
"010m2qa 1\n",
"010a21A 1\n",
"010M2OA 1\n",
"010A21 1\n",
"0108218 1\n",
"012M2CA 1\n",
"012M2OA 1\n",
"012l20a 1\n",
"0161321A 1\n",
"016b21a 1\n",
"016MZOA 1\n",
"016M210A 1\n",
"016M20a 1\n",
"016M20-A 1\n",
"016M02A 1\n",
"016C219 1\n",
"016B12A 1\n",
"016420A 1\n",
"0163L20A 1\n",
"01620A 1\n",
"015b21a 1\n",
"0131L20A 1\n",
"015M2OA 1\n",
"015M21A 1\n",
"015M02A 1\n",
"015B21A 1\n",
"014F1A 1\n",
"0146214 1\n",
"013M2OA 1\n",
"013M20 1\n",
"013M02A 1\n",
"013A20A 1\n",
"013620A 1\n",
"00C21A 1\n",
"009c21a 1\n",
"009C21B 1\n",
"002A221A 1\n",
"004D21A 1\n",
"004021A 1\n",
"003c21a 1\n",
"00321A 1\n",
"002b21a 1\n",
"002b 1\n",
"002V21A 1\n",
"002M20A 1\n",
"002F21A 1\n",
"002CIA 1\n",
"002B21B 1\n",
"0029L20A 1\n",
"004M208 1\n",
"001c21a 1\n",
"001b21a 1\n",
"001L20A 1\n",
"001CZ1A 1\n",
"001821A 1\n",
"0016M20A 1\n",
"0012A 1\n",
"0011M20A 1\n",
"#069H21A 1\n",
"#065F21A 1\n",
"#039K20A 1\n",
"004F21A 1\n",
"004M20A. 012A 1\n",
"009C2117 1\n",
"007B214 1\n",
"009021a 1\n",
"008b21a 1\n",
"008b212a 1\n",
"008B211A 1\n",
"008B21-2a 1\n",
"008 B 2I-2H 1\n",
"007c21a 1\n",
"007b21a 1\n",
"007NCOa 1\n",
"007MA20A 1\n",
"007M2OA 1\n",
"007621A 1\n",
"004M20a 1\n",
"0071321A 1\n",
"006c219 1\n",
"006b21A 1\n",
"006b12a 1\n",
"006M208 1\n",
"006B81A 1\n",
"006B218 1\n",
"006B21 1\n",
"005c21A 1\n",
"004MZ0A 1\n",
"004MA20A 1\n",
"016c21a 1\n",
"017B214 1\n",
"03K20A 1\n",
"017b21a 1\n",
"034f21a 1\n",
"033b21a 1\n",
"033H21A 1\n",
"033F21A 1\n",
"033F214 1\n",
"033F 1\n",
"033C1A 1\n",
"0330L20A 1\n",
"032m20a 1\n",
"032b21a 1\n",
"032V20A 1\n",
"0329K20A 1\n",
"0321H20A 1\n",
"031b21a 1\n",
"031a21a 1\n",
"031M20A and 001 1\n",
"#029A21A 1\n",
"031K20A 1\n",
"031I20a 1\n",
"031H21A 1\n",
"031C20A 1\n",
"031821A 1\n",
"030b221a 1\n",
"030b21a 1\n",
"030M20a 1\n",
"03621A 1\n",
"036c21a 1\n",
"037A2113 1\n",
"039B12A 1\n",
"03H20A 1\n",
"03EB21A 1\n",
"03B21A 1\n",
"039f21a 1\n",
"039d21a 1\n",
"039c21a 1\n",
"039b21A 1\n",
"039K2020A 1\n",
"039K20 1\n",
"039K0A 1\n",
"039F21A 1\n",
"039A212A 1\n",
"037B221a 1\n",
"0399K20-2A 1\n",
"039*K20A 1\n",
"038k20A 1\n",
"038KWA 1\n",
"038K208 1\n",
"038A21A/039B21A 1\n",
"037f21a 1\n",
"037b21a 1\n",
"037KZOA 1\n",
"037K209 1\n",
"037F21A 1\n",
"030M2011 1\n",
"030L2OA 1\n",
"030L29A 1\n",
"023m20A 1\n",
"025j20-2a 1\n",
"025az1a 1\n",
"025a21a 1\n",
"025J20a 1\n",
"025J20A 030L20 1\n",
"025J20-JA 1\n",
"025420-2A 1\n",
"02521A 1\n",
"024mzoa 1\n",
"024MZ0A 1\n",
"023m2oa 1\n",
"022c21a 1\n",
"0261721A 1\n",
"022b21a 1\n",
"022N20A 1\n",
"022M2OA 1\n",
"021C12A 1\n",
"021B21A-1 1\n",
"020F21A 1\n",
"019B12A 1\n",
"018b21a 1\n",
"018B2a 1\n",
"018B218 1\n",
"017f21a 1\n",
"025j20a 1\n",
"026A21 1\n",
"030E21A 1\n",
"028L28A 1\n",
"030B21a 1\n",
"030A1A 1\n",
"02SL20A 1\n",
"02A21A 1\n",
"029k20a 1\n",
"029L20A / 024M2 1\n",
"029I20a 1\n",
"029H21B 1\n",
"029AZ1A 1\n",
"029A21P 1\n",
"028l20a 1\n",
"027h21b 1\n",
"026AZ1A 1\n",
"027c21a 1\n",
"027a21a 1\n",
"027LZOA 1\n",
"027L20AModerna 1\n",
"027D21A 1\n",
"027C264 1\n",
"027A 1\n",
"027821A 1\n",
"026l20A 1\n",
"026L204 1\n",
"026B1A 1\n",
"unsure 1\n",
"dtype: int64"
]
},
"execution_count": 17,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# df = df.groupby(['VAX_LOT']).count()\n",
"#df2 = df.sort_values(by=['DIED'], ascending=False)\n",
"#pd.set_option('display.max_rows', None)\n",
"#print(df2)\n",
"pd.set_option('display.max_rows', None)\n",
"df.value_counts()"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "eff80ae1",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.7"
}
},
"nbformat": 4,
"nbformat_minor": 5
}