diff --git a/src/VaersDescrReader.py b/src/VaersDescrReader.py index dcc4c5c3e98..dccec6cb496 100644 --- a/src/VaersDescrReader.py +++ b/src/VaersDescrReader.py @@ -31,7 +31,11 @@ class VaersDescrReader: return self._read_csv( file = file, usecols = ['VAERS_ID', 'VAX_DOSE_SERIES', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT'], - dtype = {"VAX_DOSE_SERIES": "string"}) + dtype = + { + "VAX_DOSE_SERIES": "string", + "VAX_LOT": "string" + }) def _read_csv(self, file, **kwargs): return pd.read_csv( diff --git a/src/VaersDescrReaderTest.py b/src/VaersDescrReaderTest.py index 53fe966157a..a157a777325 100644 --- a/src/VaersDescrReaderTest.py +++ b/src/VaersDescrReaderTest.py @@ -15,11 +15,21 @@ class VaersDescrReaderTest(unittest.TestCase): vaersDescr = vaersDescrReader.readVaersDescrForYear(2023) # Then - RECVDATE = pd.to_datetime('01/01/2023', format = "%m/%d/%Y") - dataFrameExpected = TestHelper.createDataFrame( - columns = ['RECVDATE', 'DIED', 'L_THREAT', 'ER_VISIT', 'HOSPITAL', 'DISABLE', 'SPLTTYPE'], - data = [ [RECVDATE, np.nan, np.nan, np.nan, np.nan, np.nan, np.nan]], - index = pd.Index( - name = 'VAERS_ID', - data=[2547730])) - assert_frame_equal(vaersDescr['VAERSDATA'], dataFrameExpected, check_dtype=False) + assert_frame_equal( + vaersDescr['VAERSDATA'], + TestHelper.createDataFrame( + columns = ['RECVDATE', 'DIED', 'L_THREAT', 'ER_VISIT', 'HOSPITAL', 'DISABLE', 'SPLTTYPE'], + data = [ [pd.to_datetime('01/01/2023', format = "%m/%d/%Y"), np.nan, np.nan, np.nan, np.nan, np.nan, np.nan]], + index = pd.Index( + name = 'VAERS_ID', + data=[2547730])), + check_dtype = False) + assert_frame_equal( + vaersDescr['VAERSVAX'], + TestHelper.createDataFrame( + columns = ['VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_DOSE_SERIES'], + data = [ ['COVID19', 'JANSSEN', '1808982', 'UNK']], + index = pd.Index( + name = 'VAERS_ID', + data=[2547730])), + check_dtype = False)