From 818a2c78873933aace3e4ecd3799f70957be2936 Mon Sep 17 00:00:00 2001 From: frankknoll Date: Sun, 26 Mar 2023 00:35:32 +0100 Subject: [PATCH] readExploration() from Google Analytics --- src/HowBadIsMyBatch.ipynb | 28 ++++++++++++++++++++-------- 1 file changed, 20 insertions(+), 8 deletions(-) diff --git a/src/HowBadIsMyBatch.ipynb b/src/HowBadIsMyBatch.ipynb index 5ab6ef85ca0..20b8c900774 100644 --- a/src/HowBadIsMyBatch.ipynb +++ b/src/HowBadIsMyBatch.ipynb @@ -23,6 +23,20 @@ "from HistogramFactoryAndPersister import createAndSaveGlobalHistograms, createAndSaveHistogramsForCountries" ] }, + { + "cell_type": "code", + "execution_count": null, + "id": "0474f6d7", + "metadata": {}, + "outputs": [], + "source": [ + "def readExploration(csvFile, indexName):\n", + " exploration = pd.read_csv(csvFile, header=[0, 1], index_col=0, skiprows=6)\n", + " exploration.drop(index=indexName, inplace=True)\n", + " exploration.index.rename(indexName, inplace=True)\n", + " return exploration" + ] + }, { "cell_type": "code", "execution_count": null, @@ -30,9 +44,7 @@ "metadata": {}, "outputs": [], "source": [ - "country_By_Clicked_Batchcode = pd.read_csv('data/Country By Clicked Batchcode.csv', header=[0, 1], index_col=0, skiprows=6)\n", - "country_By_Clicked_Batchcode.drop(index='Clicked Batchcode', inplace=True)\n", - "country_By_Clicked_Batchcode.index.rename('Clicked Batchcode', inplace=True)\n", + "country_By_Clicked_Batchcode = readExploration('data/Country By Clicked Batchcode.csv', indexName = 'Clicked Batchcode')\n", "country_By_Clicked_Batchcode" ] }, @@ -43,9 +55,7 @@ "metadata": {}, "outputs": [], "source": [ - "country_By_Batchcode_Search_Term = pd.read_csv('data/Country By Batchcode Search Term.csv', header=[0, 1], index_col=0, skiprows=6)\n", - "country_By_Batchcode_Search_Term.drop(index='Batchcode Search Term', inplace=True)\n", - "country_By_Batchcode_Search_Term.index.rename('Batchcode Search Term', inplace=True)\n", + "country_By_Batchcode_Search_Term = 
readExploration('data/Country By Batchcode Search Term.csv', indexName = 'Batchcode Search Term')\n", "country_By_Batchcode_Search_Term" ] }, @@ -191,7 +201,7 @@ "from CompletedBatchcodeColumnAdder import CompletedBatchcodeColumnAdder\n", "from BatchcodeCompletion import BatchcodeCompletion\n", "\n", - "batchcodeCompletion = BatchcodeCompletion(batchCodeTable)\n", + "batchcodeCompletion = BatchcodeCompletion(ADR_by_Batchcode = batchCodeTable)\n", "completedBatchcodeColumnAdder = CompletedBatchcodeColumnAdder(batchcodeCompletion.completeBatchcode)\n", "country_By_Batchcode_Search_Term = completedBatchcodeColumnAdder.addCompletedBatchcodeColumn(country_By_Batchcode_Search_Term)\n", "country_By_Batchcode_Search_Term" @@ -204,7 +214,9 @@ "metadata": {}, "outputs": [], "source": [ - "country_By_Batchcode_Search_Term.to_excel('tmp/Country_By_Batchcode_Search_Term.xlsx')" + "country_By_Batchcode_Search_Term.to_excel('tmp/Country_By_Batchcode_Search_Term.xlsx')\n", + "# FK-TODO: use country_By_Batchcode_Search_Term['Completed Batchcode'] + the country columns\n", + "# to fill in, in the BatchCodeTable of the web page, the missing countries currently marked 'Unknown Country'." ] }, {