renku update --with-siblings

71ee1b3f · Chandrasekhar Ramakrishnan · renku 0.9.1 · 052d4070 · 71ee1b3f · 71ee1b3f
Commit 71ee1b3f authored 5 years ago by Chandrasekhar Ramakrishnan Committed by renku 0.9.1 5 years ago
--- a/.renku/workflow/c1e3191700aa4231a584f4eb0fac4631.cwl
+++ b/.renku/workflow/c1e3191700aa4231a584f4eb0fac4631.cwl
+class: Workflow
+cwlVersion: v1.0
+hints: []
+inputs:
+  input_1:
+    default: ts_folder
+    streamable: false
+    type: string
+  input_10:
+    default:
+      class: Directory
+      listing: []
+      path: ../../data/covid-19_jhu-csse
+    streamable: false
+    type: Directory
+  input_11:
+    default: rates_folder
+    streamable: false
+    type: string
+  input_12:
+    default:
+      class: Directory
+      listing: []
+      path: ../../data/covid-19_rates
+    streamable: false
+    type: Directory
+  input_13:
+    default: geodata_path
+    streamable: false
+    type: string
+  input_14:
+    default:
+      class: File
+      path: ../../data/geodata/geo_data.csv
+    streamable: false
+    type: File
+  input_15:
+    default:
+      class: File
+      path: ../../notebooks/Dashboard.ipynb
+    streamable: false
+    type: File
+  input_16:
+    default: runs/Dashboard.run.ipynb
+    streamable: false
+    type: string
+  input_2:
+    default:
+      class: Directory
+      listing: []
+      path: ../../data/covid-19_jhu-csse
+    streamable: false
+    type: Directory
+  input_3:
+    default: worldmap_path
+    streamable: false
+    type: string
+  input_4:
+    default:
+      class: File
+      path: ../../data/worldmap/country_centroids.csv
+    streamable: false
+    type: File
+  input_5:
+    default: out_folder
+    streamable: false
+    type: string
+  input_6:
+    default: data/geodata
+    streamable: false
+    type: string
+  input_7:
+    default:
+      class: File
+      path: ../../notebooks/CompileGeoData.ipynb
+    streamable: false
+    type: File
+  input_8:
+    default: runs/CompileGeoData.run.ipynb
+    streamable: false
+    type: string
+  input_9:
+    default: ts_folder
+    streamable: false
+    type: string
+outputs:
+  output_0:
+    outputSource: step_2/output_0
+    streamable: false
+    type: File
+  output_1:
+    outputSource: step_1/output_1
+    streamable: false
+    type: Directory
+  output_2:
+    outputSource: step_1/output_0
+    streamable: false
+    type: File
+requirements: []
+steps:
+  step_1:
+    in:
+      input_1: input_1
+      input_2: input_2
+      input_3: input_3
+      input_4: input_4
+      input_5: input_5
+      input_6: input_6
+      input_7: input_7
+      input_8: input_8
+    out:
+    - output_0
+    - output_1
+    run: 73781f74e51d4e54bc522007a2030ec2_papermill.cwl
+  step_2:
+    in:
+      input_1: input_9
+      input_2: input_10
+      input_3: input_11
+      input_4: input_12
+      input_5: input_13
+      input_6: input_14
+      input_7: input_15
+      input_8: input_16
+    out:
+    - output_0
+    run: 4cc7ffe9d5a045efb048ef2222a40ffa_papermill.cwl
--- a/data/geodata/geo_data.csv
+++ b/data/geodata/geo_data.csv
--- a/runs/CompileGeoData.run.ipynb
+++ b/runs/CompileGeoData.run.ipynb
@@ -4,10 +4,10 @@
   "cell_type": "markdown",
   "metadata": {
    "papermill": {
-     "duration": 0.025663,
+     "duration": 0.021165,
-     "end_time": "2020-03-15T16:43:49.005977",
+     "end_time": "2020-03-16T19:41:41.269273",
     "exception": false,
-     "start_time": "2020-03-15T16:43:48.980314",
+     "start_time": "2020-03-16T19:41:41.248108",
     "status": "completed"
    },
    "tags": []
@@ -23,10 +23,10 @@
   "execution_count": 1,
   "metadata": {
    "papermill": {
-     "duration": 0.285624,
+     "duration": 0.283727,
-     "end_time": "2020-03-15T16:43:49.302040",
+     "end_time": "2020-03-16T19:41:41.563021",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.016416",
+     "start_time": "2020-03-16T19:41:41.279294",
     "status": "completed"
    },
    "tags": []
@@ -42,10 +42,10 @@
   "execution_count": 2,
   "metadata": {
    "papermill": {
-     "duration": 0.057379,
+     "duration": 0.024974,
-     "end_time": "2020-03-15T16:43:49.376597",
+     "end_time": "2020-03-16T19:41:41.606737",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.319218",
+     "start_time": "2020-03-16T19:41:41.581763",
     "status": "completed"
    },
    "tags": []
@@ -62,10 +62,10 @@
   "cell_type": "markdown",
   "metadata": {
    "papermill": {
-     "duration": 0.015419,
+     "duration": 0.008508,
-     "end_time": "2020-03-15T16:43:49.400508",
+     "end_time": "2020-03-16T19:41:41.625473",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.385089",
+     "start_time": "2020-03-16T19:41:41.616965",
     "status": "completed"
    },
    "tags": [
@@ -81,10 +81,10 @@
   "execution_count": 3,
   "metadata": {
    "papermill": {
-     "duration": 0.019117,
+     "duration": 0.02138,
-     "end_time": "2020-03-15T16:43:49.427165",
+     "end_time": "2020-03-16T19:41:41.653962",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.408048",
+     "start_time": "2020-03-16T19:41:41.632582",
     "status": "completed"
    },
    "tags": [
@@ -94,10 +94,10 @@
   "outputs": [],
   "source": [
    "# Parameters\n",
-    "PAPERMILL_INPUT_PATH = \"/tmp/262jiqqx/notebooks/CompileGeoData.ipynb\"\n",
+    "PAPERMILL_INPUT_PATH = \"/tmp/q9ufv19r/notebooks/CompileGeoData.ipynb\"\n",
    "PAPERMILL_OUTPUT_PATH = \"runs/CompileGeoData.run.ipynb\"\n",
-    "ts_folder = \"/tmp/262jiqqx/data/covid-19_jhu-csse\"\n",
+    "ts_folder = \"/tmp/q9ufv19r/data/covid-19_jhu-csse\"\n",
-    "worldmap_path = \"/tmp/262jiqqx/data/worldmap/country_centroids.csv\"\n",
+    "worldmap_path = \"/tmp/q9ufv19r/data/worldmap/country_centroids.csv\"\n",
    "out_folder = \"data/geodata\"\n"
   ]
  },
@@ -106,10 +106,10 @@
   "execution_count": 4,
   "metadata": {
    "papermill": {
-     "duration": 0.019727,
+     "duration": 0.025944,
-     "end_time": "2020-03-15T16:43:49.457802",
+     "end_time": "2020-03-16T19:41:41.689098",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.438075",
+     "start_time": "2020-03-16T19:41:41.663154",
     "status": "completed"
    },
    "tags": []
@@ -130,10 +130,10 @@
   "execution_count": 5,
   "metadata": {
    "papermill": {
-     "duration": 0.057337,
+     "duration": 0.058376,
-     "end_time": "2020-03-15T16:43:49.523781",
+     "end_time": "2020-03-16T19:41:41.758318",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.466444",
+     "start_time": "2020-03-16T19:41:41.699942",
     "status": "completed"
    },
    "tags": []
@@ -147,10 +147,10 @@
   "cell_type": "markdown",
   "metadata": {
    "papermill": {
-     "duration": 0.008192,
+     "duration": 0.010532,
-     "end_time": "2020-03-15T16:43:49.544325",
+     "end_time": "2020-03-16T19:41:41.785637",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.536133",
+     "start_time": "2020-03-16T19:41:41.775105",
     "status": "completed"
    },
    "tags": []
@@ -164,10 +164,10 @@
   "execution_count": 6,
   "metadata": {
    "papermill": {
-     "duration": 0.04304,
+     "duration": 0.071813,
-     "end_time": "2020-03-15T16:43:49.594611",
+     "end_time": "2020-03-16T19:41:41.868125",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.551571",
+     "start_time": "2020-03-16T19:41:41.796312",
     "status": "completed"
    },
    "tags": []
@@ -184,10 +184,10 @@
   "execution_count": 7,
   "metadata": {
    "papermill": {
-     "duration": 0.033254,
+     "duration": 0.043949,
-     "end_time": "2020-03-15T16:43:49.644104",
+     "end_time": "2020-03-16T19:41:41.931586",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.610850",
+     "start_time": "2020-03-16T19:41:41.887637",
     "status": "completed"
    },
    "tags": []
@@ -214,10 +214,10 @@
   "cell_type": "markdown",
   "metadata": {
    "papermill": {
-     "duration": 0.007079,
+     "duration": 0.008107,
-     "end_time": "2020-03-15T16:43:49.660788",
+     "end_time": "2020-03-16T19:41:41.952766",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.653709",
+     "start_time": "2020-03-16T19:41:41.944659",
     "status": "completed"
    },
    "tags": []
@@ -231,10 +231,10 @@
   "execution_count": 8,
   "metadata": {
    "papermill": {
-     "duration": 0.027734,
+     "duration": 0.028654,
-     "end_time": "2020-03-15T16:43:49.695692",
+     "end_time": "2020-03-16T19:41:41.989067",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.667958",
+     "start_time": "2020-03-16T19:41:41.960413",
     "status": "completed"
    },
    "tags": []
@@ -260,10 +260,10 @@
   "execution_count": 9,
   "metadata": {
    "papermill": {
-     "duration": 0.019985,
+     "duration": 0.021395,
-     "end_time": "2020-03-15T16:43:49.727444",
+     "end_time": "2020-03-16T19:41:42.022612",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.707459",
+     "start_time": "2020-03-16T19:41:42.001217",
     "status": "completed"
    },
    "tags": []
@@ -278,10 +278,10 @@
   "cell_type": "markdown",
   "metadata": {
    "papermill": {
-     "duration": 0.008364,
+     "duration": 0.008796,
-     "end_time": "2020-03-15T16:43:49.744328",
+     "end_time": "2020-03-16T19:41:42.040797",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.735964",
+     "start_time": "2020-03-16T19:41:42.032001",
     "status": "completed"
    },
    "tags": []
@@ -295,10 +295,10 @@
   "execution_count": 10,
   "metadata": {
    "papermill": {
-     "duration": 0.038721,
+     "duration": 0.044041,
-     "end_time": "2020-03-15T16:43:49.790199",
+     "end_time": "2020-03-16T19:41:42.092451",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.751478",
+     "start_time": "2020-03-16T19:41:42.048410",
     "status": "completed"
    },
    "tags": []
@@ -325,8 +325,8 @@
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
-       "      <th>2020-03-13</th>\n",
       "      <th>2020-03-14</th>\n",
+       "      <th>2020-03-15</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Country/Region</th>\n",
@@ -336,6 +336,11 @@
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
+       "      <th>Congo (Brazzaville)</th>\n",
+       "      <td>0</td>\n",
+       "      <td>1</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
       "      <th>Congo (Kinshasa)</th>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
@@ -347,23 +352,18 @@
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Curacao</th>\n",
-       "      <td>0</td>\n",
+       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Eswatini</th>\n",
-       "      <td>0</td>\n",
       "      <td>1</td>\n",
-       "    </tr>\n",
+       "      <td>1</td>\n",
-       "    <tr>\n",
-       "      <th>French Guiana</th>\n",
-       "      <td>5</td>\n",
-       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Guadeloupe</th>\n",
       "      <td>1</td>\n",
-       "      <td>1</td>\n",
+       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Holy See</th>\n",
@@ -372,7 +372,7 @@
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Martinique</th>\n",
-       "      <td>3</td>\n",
+       "      <td>9</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
@@ -382,8 +382,8 @@
       "    </tr>\n",
       "    <tr>\n",
       "      <th>Reunion</th>\n",
-       "      <td>5</td>\n",
       "      <td>6</td>\n",
+       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>occupied Palestinian territory</th>\n",
@@ -395,18 +395,18 @@
       "</div>"
      ],
      "text/plain": [
-       "                                2020-03-13  2020-03-14\n",
+       "                                2020-03-14  2020-03-15\n",
       "Country/Region                                        \n",
+       "Congo (Brazzaville)                      0           1\n",
       "Congo (Kinshasa)                         2           2\n",
       "Cruise Ship                            696         696\n",
-       "Curacao                                  0           1\n",
+       "Curacao                                  1           1\n",
-       "Eswatini                                 0           1\n",
+       "Eswatini                                 1           1\n",
-       "French Guiana                            5           5\n",
+       "Guadeloupe                               1           3\n",
-       "Guadeloupe                               1           1\n",
       "Holy See                                 1           1\n",
-       "Martinique                               3           9\n",
+       "Martinique                               9           9\n",
       "North Macedonia                         14          14\n",
-       "Reunion                                  5           6\n",
+       "Reunion                                  6           7\n",
       "occupied Palestinian territory           0           0"
      ]
     },
@@ -425,10 +425,10 @@
   "cell_type": "markdown",
   "metadata": {
    "papermill": {
-     "duration": 0.00976,
+     "duration": 0.009916,
-     "end_time": "2020-03-15T16:43:49.816102",
+     "end_time": "2020-03-16T19:41:42.118533",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.806342",
+     "start_time": "2020-03-16T19:41:42.108617",
     "status": "completed"
    },
    "tags": []
@@ -442,10 +442,10 @@
   "execution_count": 11,
   "metadata": {
    "papermill": {
-     "duration": 0.029533,
+     "duration": 0.033068,
-     "end_time": "2020-03-15T16:43:49.853512",
+     "end_time": "2020-03-16T19:41:42.159802",
     "exception": false,
-     "start_time": "2020-03-15T16:43:49.823979",
+     "start_time": "2020-03-16T19:41:42.126734",
     "status": "completed"
    },
    "tags": []
@@ -477,20 +477,20 @@
   "version": "3.7.6"
  },
  "papermill": {
-   "duration": 2.036815,
+   "duration": 1.96386,
-   "end_time": "2020-03-15T16:43:50.175740",
+   "end_time": "2020-03-16T19:41:42.484999",
   "environment_variables": {},
   "exception": null,
-   "input_path": "/tmp/262jiqqx/notebooks/CompileGeoData.ipynb",
+   "input_path": "/tmp/q9ufv19r/notebooks/CompileGeoData.ipynb",
   "output_path": "runs/CompileGeoData.run.ipynb",
   "parameters": {
-    "PAPERMILL_INPUT_PATH": "/tmp/262jiqqx/notebooks/CompileGeoData.ipynb",
+    "PAPERMILL_INPUT_PATH": "/tmp/q9ufv19r/notebooks/CompileGeoData.ipynb",
    "PAPERMILL_OUTPUT_PATH": "runs/CompileGeoData.run.ipynb",
    "out_folder": "data/geodata",
-    "ts_folder": "/tmp/262jiqqx/data/covid-19_jhu-csse",
+    "ts_folder": "/tmp/q9ufv19r/data/covid-19_jhu-csse",
-    "worldmap_path": "/tmp/262jiqqx/data/worldmap/country_centroids.csv"
+    "worldmap_path": "/tmp/q9ufv19r/data/worldmap/country_centroids.csv"
   },
-   "start_time": "2020-03-15T16:43:48.138925",
+   "start_time": "2020-03-16T19:41:40.521139",
   "version": "1.1.0"
  }
 },

 %% Cell type:markdown id: tags:
 # Extract the Geographic Info
 Use the Harvard [country_centroids.csv](https://worldmap.harvard.edu/data/geonode:country_centroids_az8) data to extract the geographic info we need for the visualizations.
 %% Cell type:code id: tags:
 ``` python
 import pandas as pd
 import os
 ```
 %% Cell type:code id: tags:
 ``` python
 # Default parameter values for this notebook. In a papermill run they are
 # reassigned by the "injected-parameters" cell later in the notebook.
 ts_folder = "../data/covid-19_jhu-csse/"
 worldmap_path = "../data/worldmap/country_centroids.csv"
 # Both default to None; the final save cell only writes its CSV when
 # PAPERMILL_OUTPUT_PATH is truthy.
 out_folder = None
 PAPERMILL_OUTPUT_PATH = None
 ```
 %% Cell type:markdown id: tags:parameters
 ## Read in JHU CSSE data
 %% Cell type:code id: tags:injected-parameters
 ``` python
 # Parameters
-PAPERMILL_INPUT_PATH = "/tmp/262jiqqx/notebooks/CompileGeoData.ipynb"
+PAPERMILL_INPUT_PATH = "/tmp/q9ufv19r/notebooks/CompileGeoData.ipynb"
 PAPERMILL_OUTPUT_PATH = "runs/CompileGeoData.run.ipynb"
-ts_folder = "/tmp/262jiqqx/data/covid-19_jhu-csse"
+ts_folder = "/tmp/q9ufv19r/data/covid-19_jhu-csse"
-worldmap_path = "/tmp/262jiqqx/data/worldmap/country_centroids.csv"
+worldmap_path = "/tmp/q9ufv19r/data/worldmap/country_centroids.csv"
 out_folder = "data/geodata"
 ```
 %% Cell type:code id: tags:
 ``` python
 def read_jhu_covid_region_df(name):
    """Load one JHU CSSE time-series CSV and total it per country/region.

    Reads ``time_series_19-covid-{name}.csv`` from the notebook-level
    ``ts_folder``, indexes it by the four identifying columns, converts the
    remaining column labels to datetimes, and returns the per
    'Country/Region' sums.
    """
    csv_path = os.path.join(ts_folder, f"time_series_19-covid-{name}.csv")
    id_columns = ['Country/Region', 'Province/State', 'Lat', 'Long']
    series_df = pd.read_csv(csv_path).set_index(id_columns)
    # The column labels left after indexing are parsed as datetimes.
    series_df.columns = pd.to_datetime(series_df.columns)
    return series_df.groupby(level='Country/Region').sum()
 ```
 %% Cell type:code id: tags:
 ``` python
 # Per-country/region totals from the "Confirmed" time-series file.
 confirmed_df = read_jhu_covid_region_df("Confirmed")
 ```
 %% Cell type:markdown id: tags:
 # Read in Harvard country centroids
 %% Cell type:code id: tags:
 ``` python
 # Read the centroid table and keep a fixed subset of its columns.
 country_centroids_df = pd.read_csv(worldmap_path)[[
    'name', 'name_long', 'region_un', 'subregion', 'region_wb',
    'pop_est', 'gdp_md_est', 'income_grp', 'Longitude', 'Latitude',
 ]]
 # 'name_jhu' starts out as a copy of 'name_long'.
 country_centroids_df['name_jhu'] = country_centroids_df['name_long']
 ```
 %% Cell type:code id: tags:
 ``` python
 # Display the column labels of the centroid frame.
 country_centroids_df.columns
 ```
 %% Output
    Index(['name', 'name_long', 'region_un', 'subregion', 'region_wb', 'pop_est',
           'gdp_md_est', 'income_grp', 'Longitude', 'Latitude', 'name_jhu'],
          dtype='object')
 %% Cell type:markdown id: tags:
 Fix names that differ between JHU CSSE and Harvard data
 %% Cell type:code id: tags:
 ``` python
 # Maps a name as it appears in 'name_jhu' (initially copied from the
 # centroid data's 'name_long') to the replacement value applied below.
 # NOTE(review): the key "CÃ´te d'Ivoire" looks like UTF-8 text for
 # "Côte d'Ivoire" that was decoded as Latin-1. Confirm against the actual
 # 'name_long' values in the CSV before changing it; if the data holds the
 # correctly encoded name, this entry never matches.
 region_hd_jhu_map = {
     'Brunei Darussalam': 'Brunei',
     "CÃ´te d'Ivoire": "Cote d'Ivoire",
     'Czech Republic': 'Czechia',
     'Hong Kong': 'Hong Kong SAR',
     'Republic of Korea': 'Korea, South',
     'Macao': 'Macao SAR',
     'Russian Federation': 'Russia',
     'Taiwan': 'Taiwan*',
     'United States': 'US'
 }
 # Rewrite only the values that appear as keys above; others are left as-is.
 country_centroids_df['name_jhu'] = country_centroids_df['name_jhu'].replace(region_hd_jhu_map)
 ```
 %% Cell type:code id: tags:
 ``` python
 # Use this to find the name in the series
 # country_centroids_df[country_centroids_df['name'].str.contains('Macao')]
 ```
 %% Cell type:markdown id: tags:
 There are some regions that we cannot resolve, but we will just ignore these.
 %% Cell type:code id: tags:
 ``` python
 # Rows of confirmed_df whose index value does not occur in 'name_jhu',
 # restricted to the last two columns. The boolean mask is inverted with
 # `~` instead of being compared to False.
 confirmed_df.loc[
    ~confirmed_df.index.isin(country_centroids_df['name_jhu'])
 ].iloc[:, -2:]
 ```
 %% Output
-                                    2020-03-13  2020-03-14
+                                    2020-03-14  2020-03-15
    Country/Region
+    Congo (Brazzaville)                      0           1
    Congo (Kinshasa)                         2           2
    Cruise Ship                            696         696
-    Curacao                                  0           1
+    Curacao                                  1           1
-    Eswatini                                 0           1
+    Eswatini                                 1           1
-    French Guiana                            5           5
+    Guadeloupe                               1           3
-    Guadeloupe                               1           1
    Holy See                                 1           1
-    Martinique                               3           9
+    Martinique                               9           9
    North Macedonia                         14          14
-    Reunion                                  5           6
+    Reunion                                  6           7
    occupied Palestinian territory           0           0
 %% Cell type:markdown id: tags:
 # Save the result
 %% Cell type:code id: tags:
 ``` python
 # Write the centroid table to <out_folder>/geo_data.csv, but only when
 # PAPERMILL_OUTPUT_PATH is truthy.
 # NOTE(review): out_folder is not checked here; presumably it is always
 # set whenever PAPERMILL_OUTPUT_PATH is — confirm.
 if PAPERMILL_OUTPUT_PATH:
    out_path = os.path.join(out_folder, "geo_data.csv")
    country_centroids_df.to_csv(out_path)
 ```

--- a/runs/Dashboard.run.ipynb
+++ b/runs/Dashboard.run.ipynb