refactoring

This commit is contained in:
frankknoll
2022-01-26 09:46:00 +01:00
parent fd3c49ce8b
commit 455181b946
4 changed files with 33 additions and 35 deletions

3
.gitignore vendored
View File

@@ -1,5 +1,4 @@
VAERS/ VAERS/
.ipynb_checkpoints/ .ipynb_checkpoints/
VAERSDataUseGuide_en_September2021.pdf config/
Vaccine Lot Numbers Expiration (1).xlsx
results/ results/

View File

@@ -106,21 +106,21 @@
" # Given\n", " # Given\n",
" dataFrame = createDataFrame(\"test/VAERS\", \"MODERNA\")\n", " dataFrame = createDataFrame(\"test/VAERS\", \"MODERNA\")\n",
" display(\"dataFrame:\", dataFrame)\n", " display(\"dataFrame:\", dataFrame)\n",
" batchCodeTable = createBatchCodeTable(dataFrame)\n",
"\n", "\n",
" # When\n", " # When\n",
" batchCodeTable = createBatchCodeTable(dataFrame)\n",
" display(\"batchCodeTable:\", batchCodeTable)\n",
"\n",
" # Then\n",
" batchCodeTableExpected = pd.DataFrame(\n", " batchCodeTableExpected = pd.DataFrame(\n",
" {\n", " {\n",
" 'ADRs': [2, 1],\n", " 'ADRs': [2, 1],\n",
" 'DEATHS': [0, 1],\n", " 'DEATHS': [0, 1],\n",
" 'DISABILITIES': [2, 0],\n", " 'DISABILITIES': [2, 0],\n",
" 'LIFE THREATENING ILLNESSES': [0.0, 0.0]\n", " 'LIFE THREATENING ILLNESSES': [0, 0]\n",
" },\n", " },\n",
" index = pd.MultiIndex.from_arrays([['025L20A', '037K20A']], names = ('VAX_LOT',)))\n", " index = pd.MultiIndex.from_arrays([['025L20A', '037K20A']], names = ('VAX_LOT',)))\n",
" display(\"batchCodeTable:\", batchCodeTable)\n",
" display(\"batchCodeTableExpected:\", batchCodeTableExpected)\n", " display(\"batchCodeTableExpected:\", batchCodeTableExpected)\n",
"\n",
" # Then\n",
" assert_frame_equal(batchCodeTable, batchCodeTableExpected, check_dtype = False)\n" " assert_frame_equal(batchCodeTable, batchCodeTableExpected, check_dtype = False)\n"
] ]
}, },

View File

@@ -1,30 +1,2 @@
# HowBadIsMyBatch # HowBadIsMyBatch
jupyter notebook
FK-TODO:
- VAX_LOT-Spalte normalisieren, d. h. in Großbuchstaben umwandeln (toUpperCase()), das Format des jeweiligen Herstellers berücksichtigen und "verschmutzte" Einträge säubern, denn z. B. die folgenden Einträge stellen alle dieselbe Charge (039K20A) dar:
039k20a
MOD039K20A
#039K20A
039K20A-MODERNA
039K20A-2A
039K20A or 039L
Moderna/039K20A
MODERNA 039K20A
MODERNA039K20A
Modena 039k20A
L039K20A
M039K20A
MOD; 039K20A
m0039k20A
u039k20a
6/21 039K20A
2039K20A
013L20A 039K20A#039K20A
#039K
039K20A 12-31-
039K20A & 031M2
039K20A and 032
039K20A, 011L20

27
help.txt Normal file
View File

@@ -0,0 +1,27 @@
jupyter notebook
FK-TODO:
- VAX_LOT-Spalte normalisieren, d. h. in Großbuchstaben umwandeln (toUpperCase()), das Format des jeweiligen Herstellers berücksichtigen und "verschmutzte" Einträge säubern, denn z. B. die folgenden Einträge stellen alle dieselbe Charge (039K20A) dar:
039k20a
MOD039K20A
#039K20A
039K20A-MODERNA
039K20A-2A
039K20A or 039L
Moderna/039K20A
MODERNA 039K20A
MODERNA039K20A
Modena 039k20A
L039K20A
M039K20A
MOD; 039K20A
m0039k20A
u039k20a
6/21 039K20A
2039K20A
013L20A 039K20A#039K20A
#039K
039K20A 12-31-
039K20A & 031M2
039K20A and 032
039K20A, 011L20