Skip to content

Commit 3bf2045

Browse files
committed
Small Improvements
Update Notebook_Time_Series_Silviu.ipynb Update Notebook_Time_Series_Silviu.ipynb
1 parent 3d89601 commit 3bf2045

File tree

1 file changed

+22
-15
lines changed

1 file changed

+22
-15
lines changed

Notebook_Time_Series_Silviu.ipynb

Lines changed: 22 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -290,7 +290,7 @@
290290
"metadata": {},
291291
"outputs": [],
292292
"source": [
293-
"def generate_table(): \n",
293+
"def init_highest_table(): \n",
294294
" df_highest = pd.DataFrame(columns={\"Indicator\"})\n",
295295
" df_highest[\"Indicator\"] = indicators\n",
296296
" df_highest[\"Year range\"] = 0\n",
@@ -317,22 +317,28 @@
317317
"metadata": {},
318318
"outputs": [],
319319
"source": [
320-
"iterable = list(range(min(set(df_gold['Year'])), max(set(df_gold['Year'])) + 1))\n",
321-
"iterable = list(itertools.combinations(iterable, 2))\n",
322-
"iterable_aux = iterable.copy()\n",
323-
"\n",
324-
"#The year length must be higher than 5. All entries with a lower range are deleted.\n",
325-
"for years in iterable_aux:\n",
326-
" if (years[1] - years[0]) < 4:\n",
327-
" iterable.remove(years)\n",
328-
"\n",
329320
"indicators = list(df_gold.columns[3:])\n",
330321
"indicators.remove('GDP')"
331322
]
332323
},
333324
{
334325
"cell_type": "code",
335326
"execution_count": 7,
327+
"metadata": {},
328+
"outputs": [],
329+
"source": [
330+
"def generate_years_combinations(min_diff: int):\n",
331+
" iterable = list(range(min(set(df_gold['Year'])), max(set(df_gold['Year'])) + 1))\n",
332+
" iterable = list(itertools.combinations(iterable, 2))\n",
333+
" \n",
334+
" #The year span (end - start) must be at least min_diff. All pairs with a smaller span are deleted.\n",
335+
" for years in iterable.copy():\n",
336+
" if (years[1] - years[0]) < min_diff:\n",
337+
" iterable.remove(years)\n",
338+
" \n",
339+
" return iterable"
340+
]
341+
},
336342
"metadata": {},
337343
"outputs": [
338344
{
@@ -377,17 +383,18 @@
377383
" #Search for the entries of the region and normalize.\n",
378384
" df_zone = countries_by_region[Zone]\n",
379385
"\n",
380-
" df_highest = generate_table()\n",
386+
" df_highest = init_highest_table()\n",
381387
" \n",
382388
" i = 0\n",
383389
" computing_text = \"Loading \"\n",
384390
" print (computing_text, end=\"\\r\")\n",
385391
"\n",
386392
"\n",
387393
" #For all the combination of years...\n",
388-
" for years in iterable:\n",
394+
" for years in generate_years_combinations(5):\n",
389395
" i = (i + 1) % 50\n",
390396
" print (computing_text + \"\".join([\".\" for _ in range(i)]), end=\"\\r\")\n",
397+
" \n",
391398
" df_aux = searchTimeSeries(0, years[0], years[1], True, df_zone)\n",
392399
" #Delete indicators which are not available that year\n",
393400
" indicators_inter = list(set(indicators) & set(list(df_aux.index)))\n",
@@ -476,13 +483,14 @@
476483
"def plotYearRange(Zone, Indicator, Years):\n",
477484
" df_aux = df_gold_index.loc[df_gold_index.index.get_level_values('Country') == Zone]\n",
478485
" df_aux = df_aux.loc[(df_aux.index.get_level_values(\"Year\") >= Years[0]) & (df_aux.index.get_level_values(\"Year\") <= Years[1])]\n",
486+
" # TODO: Country or Region??\n",
479487
" spear = stats.spearmanr(df_aux[Indicator], df_aux['GDP'])\n",
480488
" df_aux = normalize_by_country(df_aux).reset_index(drop=False)\n",
481489
" \n",
482490
" print(spear)\n",
483491
" plt.figure(figsize=(6,6))\n",
484-
" plt.plot(df_aux[\"GDP\"], color=\"red\", label = 'GDP')\n",
485-
" plt.plot(df_aux[Indicator], color=\"green\", label = Indicator)\n",
492+
" plt.plot(df_aux[\"Year\"], df_aux[\"GDP\"], color=\"red\", label = 'GDP')\n",
493+
" plt.plot(df_aux[\"Year\"], df_aux[Indicator], color=\"green\", label = Indicator)\n",
486494
" plt.legend(loc=\"lower right\")\n",
487495
" \n",
488496
"\n",
@@ -509,7 +517,6 @@
509517
")\n",
510518
"\n",
511519
"\n",
512-
"\n",
513520
"# TODO By Region: Say Y axis is Qualitative (Not real values but Normalized to observe evolution vs GDP - Tendency)\n",
514521
"widgets.interact(plotYearRange, Zone = country_drop, Indicator = indicator_drop, Years = intslider)"
515522
]

0 commit comments

Comments
 (0)