refactoring

This commit is contained in:
frankknoll
2022-02-01 11:41:10 +01:00
parent c24632894d
commit e2bbe4086f

View File

@@ -125,72 +125,61 @@
"source": [
"import pandas as pd\n",
"\n",
"class BatchCodeTableFactory:\n",
"class BatchCodeTableHelper:\n",
" \n",
" def __init__(self, dataFrame : pd.DataFrame):\n",
" self.dataFrame = dataFrame \n",
"\n",
" def createBatchCodeTable(self, manufacturer, dose):\n",
" df = DataFrameFilter(self.dataFrame).filterBy(manufacturer = manufacturer, dose = dose)\n",
" return BatchCodeTableFactory._asDataFrame(\n",
" def createBatchCodeTable(self):\n",
" return self._asDataFrame(\n",
" {\n",
" 'ADRs': BatchCodeTableFactory._getADRs(df),\n",
" 'DEATHS': BatchCodeTableFactory._getDEATHS(df),\n",
" 'DISABILITIES': BatchCodeTableFactory._getDISABILITIES(df),\n",
" 'LIFE THREATENING ILLNESSES': BatchCodeTableFactory._getLIFE_THREATENING_ILLNESSES(df)\n",
" 'ADRs': self._getADRs(),\n",
" 'DEATHS': self._getDEATHS(),\n",
" 'DISABILITIES': self._getDISABILITIES(),\n",
" 'LIFE THREATENING ILLNESSES': self._getLIFE_THREATENING_ILLNESSES()\n",
" })\n",
"\n",
" # create table from https://www.howbadismybatch.com/combined.html\n",
" def createSevereEffectsBatchCodeTable(self, dose):\n",
" df = DataFrameFilter(self.dataFrame).filterForSevereEffects(dose)\n",
" return BatchCodeTableFactory._addCompanyColumn(\n",
" BatchCodeTableFactory._asDataFrame(\n",
" def createSevereEffectsBatchCodeTable(self):\n",
" return self._addCompanyColumn(\n",
" self._asDataFrame(\n",
" {\n",
" 'ADRs': BatchCodeTableFactory._getADRs(df),\n",
" 'DEATHS': BatchCodeTableFactory._getDEATHS(df),\n",
" 'DISABILITIES': BatchCodeTableFactory._getDISABILITIES(df),\n",
" 'LIFE THREATENING ILLNESSES': BatchCodeTableFactory._getLIFE_THREATENING_ILLNESSES(df),\n",
" 'HOSPITALISATIONS': BatchCodeTableFactory._getHOSPITALISATIONS(df),\n",
" 'EMERGENCY ROOM OR DOCTOR VISITS': BatchCodeTableFactory._getER_VISITs(df)\n",
" 'ADRs': self._getADRs(),\n",
" 'DEATHS': self._getDEATHS(),\n",
" 'DISABILITIES': self._getDISABILITIES(),\n",
" 'LIFE THREATENING ILLNESSES': self._getLIFE_THREATENING_ILLNESSES(),\n",
" 'HOSPITALISATIONS': self._getHOSPITALISATIONS(),\n",
" 'EMERGENCY ROOM OR DOCTOR VISITS': self._getER_VISITs()\n",
" }),\n",
" BatchCodeTableFactory._createCompanyByBatchCodeTable(df))\n",
" self._createCompanyByBatchCodeTable())\n",
"\n",
" @staticmethod\n",
" def _getADRs(df):\n",
" return df['VAX_LOT'].value_counts()\n",
" def _getADRs(self):\n",
" return self.dataFrame['VAX_LOT'].value_counts()\n",
"\n",
" @staticmethod\n",
" def _getDEATHS(df):\n",
" return BatchCodeTableFactory._countValues(df, 'DIED')\n",
" def _getDEATHS(self):\n",
" return self._countValues('DIED')\n",
"\n",
" @staticmethod\n",
" def _getDISABILITIES(df):\n",
" return BatchCodeTableFactory._countValues(df, 'DISABLE')\n",
" def _getDISABILITIES(self):\n",
" return self._countValues('DISABLE')\n",
"\n",
" @staticmethod\n",
" def _getLIFE_THREATENING_ILLNESSES(df):\n",
" return BatchCodeTableFactory._countValues(df, 'L_THREAT')\n",
" def _getLIFE_THREATENING_ILLNESSES(self):\n",
" return self._countValues('L_THREAT')\n",
"\n",
" @staticmethod\n",
" def _getHOSPITALISATIONS(df):\n",
" return BatchCodeTableFactory._countValues(df, 'HOSPITAL')\n",
" def _getHOSPITALISATIONS(self):\n",
" return self._countValues('HOSPITAL')\n",
"\n",
" @staticmethod\n",
" def _getER_VISITs(df):\n",
" return BatchCodeTableFactory._countValues(df, 'ER_VISIT')\n",
" def _getER_VISITs(self):\n",
" return self._countValues('ER_VISIT')\n",
"\n",
" @staticmethod\n",
" def _countValues(df, column):\n",
" return df[df[column] == 'Y']['VAX_LOT'].value_counts()\n",
" def _countValues(self, column):\n",
" return self.dataFrame[self.dataFrame[column] == 'Y']['VAX_LOT'].value_counts()\n",
"\n",
" @staticmethod\n",
" def _asDataFrame(dict):\n",
" def _asDataFrame(self, dict):\n",
" dataFrame = pd.concat(dict, axis = 'columns')\n",
" dataFrame.index.name = 'VAX_LOT'\n",
" return dataFrame.replace(to_replace = np.nan, value = 0)\n",
"\n",
" @staticmethod\n",
" def _addCompanyColumn(batchCodeTable, companyByBatchCodeTable):\n",
" def _addCompanyColumn(self, batchCodeTable, companyByBatchCodeTable):\n",
" return pd.merge(\n",
" batchCodeTable,\n",
" companyByBatchCodeTable,\n",
@@ -199,15 +188,26 @@
" right_index = True,\n",
" validate = 'one_to_one')\n",
"\n",
" @staticmethod\n",
" def _createManufacturerByBatchCodeTable(df):\n",
" manufacturerByBatchCodeTable = df[['VAX_LOT', 'VAX_MANU']]\n",
" def _createCompanyByBatchCodeTable(self):\n",
" return self._createManufacturerByBatchCodeTable().rename(columns = {\"VAX_MANU\": \"COMPANY\"})\n",
"\n",
" def _createManufacturerByBatchCodeTable(self):\n",
" manufacturerByBatchCodeTable = self.dataFrame[['VAX_LOT', 'VAX_MANU']]\n",
" manufacturerByBatchCodeTable = manufacturerByBatchCodeTable.drop_duplicates(subset = ['VAX_LOT'])\n",
" return manufacturerByBatchCodeTable.set_index('VAX_LOT')\n",
"\n",
"class BatchCodeTableFactory:\n",
"\n",
" @staticmethod\n",
" def _createCompanyByBatchCodeTable(df):\n",
" return BatchCodeTableFactory._createManufacturerByBatchCodeTable(df).rename(columns = {\"VAX_MANU\": \"COMPANY\"})\n"
" def createBatchCodeTable(dataFrame : pd.DataFrame, manufacturer, dose):\n",
" filteredDataFrame = DataFrameFilter(dataFrame).filterBy(manufacturer = manufacturer, dose = dose)\n",
" return BatchCodeTableHelper(filteredDataFrame).createBatchCodeTable()\n",
"\n",
" # create table from https://www.howbadismybatch.com/combined.html\n",
" @staticmethod\n",
" def createSevereEffectsBatchCodeTable(dataFrame : pd.DataFrame, dose):\n",
" severeEffectsDataFrame = DataFrameFilter(dataFrame).filterForSevereEffects(dose)\n",
" return BatchCodeTableHelper(severeEffectsDataFrame).createSevereEffectsBatchCodeTable()\n"
]
},
{
@@ -411,8 +411,7 @@
"\n",
" def test_createSevereEffectsBatchCodeTable(self):\n",
" # Given\n",
" batchCodeTableFactory = BatchCodeTableFactory(\n",
" VaersDescr2DataFrameConverter.createDataFrameFromDescrs(\n",
" dataFrame = VaersDescr2DataFrameConverter.createDataFrameFromDescrs(\n",
" [\n",
" {\n",
" 'VAERSDATA': self.createDataFrame(\n",
@@ -431,10 +430,10 @@
" \"0916601\"],\n",
" dtypes = {'VAX_DOSE_SERIES': \"string\"})\n",
" }\n",
" ]))\n",
" ])\n",
"\n",
" # When\n",
" batchCodeTable = batchCodeTableFactory.createSevereEffectsBatchCodeTable('1')\n",
" batchCodeTable = BatchCodeTableFactory.createSevereEffectsBatchCodeTable(dataFrame, '1')\n",
"\n",
" # Then\n",
" batchCodeTableExpected = pd.DataFrame(\n",
@@ -496,11 +495,8 @@
" self._test_createBatchCodeTable(dataFrame, \"MODERNA\", '1')\n",
"\n",
" def _test_createBatchCodeTable(self, dataFrame, manufacturer, dose):\n",
" # Given\n",
" batchCodeTableFactory = BatchCodeTableFactory(dataFrame)\n",
"\n",
" # When\n",
" batchCodeTable = batchCodeTableFactory.createBatchCodeTable(manufacturer, dose)\n",
" batchCodeTable = BatchCodeTableFactory.createBatchCodeTable(dataFrame, manufacturer, dose)\n",
"\n",
" # Then\n",
" batchCodeTableExpected = pd.DataFrame(\n",
@@ -537,8 +533,7 @@
"def saveBatchCodeTable(manufacturer, excelFile):\n",
" vaersDescrs = VaersDescrReader(\"VAERS\").readAllVaersDescrs()\n",
" dataFrame = VaersDescr2DataFrameConverter.createDataFrameFromDescrs(vaersDescrs)\n",
" batchCodeTableFactory = BatchCodeTableFactory(dataFrame)\n",
" batchCodeTable = batchCodeTableFactory.createBatchCodeTable(manufacturer = manufacturer, dose = '1')\n",
" batchCodeTable = BatchCodeTableFactory.createBatchCodeTable(dataFrame, manufacturer = manufacturer, dose = '1')\n",
" display(manufacturer, batchCodeTable)\n",
" batchCodeTable.to_excel(excelFile)"
]
@@ -565,8 +560,7 @@
"def saveSevereEffectsBatchCodeTable(excelFile):\n",
" vaersDescrs = VaersDescrReader(\"VAERS\").readAllVaersDescrs()\n",
" dataFrame = VaersDescr2DataFrameConverter.createDataFrameFromDescrs(vaersDescrs)\n",
" batchCodeTableFactory = BatchCodeTableFactory(dataFrame)\n",
" severeEffectsBatchCodeTable = batchCodeTableFactory.createSevereEffectsBatchCodeTable(dose = '1')\n",
" severeEffectsBatchCodeTable = BatchCodeTableFactory.createSevereEffectsBatchCodeTable(dataFrame, dose = '1')\n",
" display('severeEffectsBatchCodeTable', severeEffectsBatchCodeTable)\n",
" severeEffectsBatchCodeTable.to_excel(excelFile)"
]