From 01ec83027a1a60d7fdc43bbcbe1ed1589f145872 Mon Sep 17 00:00:00 2001
From: "CR (covid cron)" <cramakri+covid-cron@ethz.ch>
Date: Thu, 23 Apr 2020 07:25:44 +0000
Subject: [PATCH] renku rerun data/covidtracking/states-metadata.json
 data/covidtracking/states-daily.json

---
 .../056013780b0849118b7789497cc14c9c.cwl      | 148 ++++++++++++++++++
 data/covidtracking/states-daily.json          |   4 +-
 data/covidtracking/states-metadata.json       |   4 +-
 runs/download-covidtracking-data.runs.ipynb   | 144 ++++++++---------
 4 files changed, 224 insertions(+), 76 deletions(-)
 create mode 100644 .renku/workflow/056013780b0849118b7789497cc14c9c.cwl

diff --git a/.renku/workflow/056013780b0849118b7789497cc14c9c.cwl b/.renku/workflow/056013780b0849118b7789497cc14c9c.cwl
new file mode 100644
index 000000000..247d32bc6
--- /dev/null
+++ b/.renku/workflow/056013780b0849118b7789497cc14c9c.cwl
@@ -0,0 +1,148 @@
+class: Workflow
+cwlVersion: v1.0
+hints: []
+inputs:
+  input_1:
+    default: states-daily.json
+    streamable: false
+    type: string
+  input_10:
+    default: states-metadata.json
+    streamable: false
+    type: string
+  input_2:
+    default: out_folder
+    streamable: false
+    type: string
+  input_3:
+    default: data/covidtracking
+    streamable: false
+    type: string
+  input_4:
+    default:
+      class: File
+      path: ../../notebooks/process/download-covidtracking-data.ipynb
+    streamable: false
+    type: File
+  input_5:
+    default: runs/download-covidtracking-data.runs.ipynb
+    streamable: false
+    type: string
+  input_6:
+    default: out_folder
+    streamable: false
+    type: string
+  input_7:
+    default: data/covidtracking
+    streamable: false
+    type: string
+  input_8:
+    default:
+      class: File
+      path: ../../notebooks/process/download-covidtracking-data.ipynb
+    streamable: false
+    type: File
+  input_9:
+    default: runs/download-covidtracking-data.runs.ipynb
+    streamable: false
+    type: string
+outputs:
+  output_2:
+    outputSource: step_2/output_1
+    streamable: false
+    type: Directory
+  output_3:
+    outputSource: step_2/output_0
+    streamable: false
+    type: File
+requirements: []
+steps:
+  step_1:
+    in:
+      filename: input_1
+      input_directory: step_2/output_1
+    out:
+    - output_file
+    run:
+      arguments: []
+      baseCommand:
+      - 'true'
+      class: CommandLineTool
+      cwlVersion: v1.0
+      hints: []
+      inputs:
+        filename:
+          default: states-daily.json
+          streamable: false
+          type: string
+        input_directory:
+          streamable: false
+          type: Directory
+      outputs:
+        output_file:
+          outputBinding:
+            glob: $(inputs.filename)
+          streamable: false
+          type: File
+      permanentFailCodes: []
+      requirements:
+      - &id001
+        class: InlineJavascriptRequirement
+      - &id002
+        class: InitialWorkDirRequirement
+        listing: $(inputs.input_directory.listing)
+      successCodes: []
+      temporaryFailCodes: []
+  step_2:
+    in:
+      input_1: input_2
+      input_2: input_3
+      input_3: input_4
+      input_4: input_5
+    out:
+    - output_0
+    - output_1
+    run: a17d560c41a54f5aa307ce5f3c5effe5_papermill.cwl
+  step_3:
+    in:
+      input_1: input_6
+      input_2: input_7
+      input_3: input_8
+      input_4: input_9
+    out:
+    - output_0
+    - output_1
+    run: a17d560c41a54f5aa307ce5f3c5effe5_papermill.cwl
+  step_4:
+    in:
+      filename: input_10
+      input_directory: step_3/output_1
+    out:
+    - output_file
+    run:
+      arguments: []
+      baseCommand:
+      - 'true'
+      class: CommandLineTool
+      cwlVersion: v1.0
+      hints: []
+      inputs:
+        filename:
+          default: states-metadata.json
+          streamable: false
+          type: string
+        input_directory:
+          streamable: false
+          type: Directory
+      outputs:
+        output_file:
+          outputBinding:
+            glob: $(inputs.filename)
+          streamable: false
+          type: File
+      permanentFailCodes: []
+      requirements:
+      - *id001
+      - *id002
+      successCodes: []
+      temporaryFailCodes: []
diff --git a/data/covidtracking/states-daily.json b/data/covidtracking/states-daily.json
index 2268880a1..fa3abf56e 100644
--- a/data/covidtracking/states-daily.json
+++ b/data/covidtracking/states-daily.json
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2741616ce804f09a57e91994eefddf08b69f19d61650fd654ebd5f791bb69fe1
-size 1296997
+oid sha256:fe0159a2a71ff0d1fb1826d3b7c64a5521a43bae971d6f7a53251aef16a98aa7
+size 1332057
diff --git a/data/covidtracking/states-metadata.json b/data/covidtracking/states-metadata.json
index 91869fdd0..92cfc8271 100644
--- a/data/covidtracking/states-metadata.json
+++ b/data/covidtracking/states-metadata.json
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e09dc92ab8fd8ee1b8f62d98ab273afb13132e32eac757e6ee4128e6c5d975f3
-size 28635
+oid sha256:a602301962982474d3e6c3e609022b94dff92782a0af644cd98008bc17521de5
+size 28757
diff --git a/runs/download-covidtracking-data.runs.ipynb b/runs/download-covidtracking-data.runs.ipynb
index d69566477..43c4d395e 100644
--- a/runs/download-covidtracking-data.runs.ipynb
+++ b/runs/download-covidtracking-data.runs.ipynb
@@ -5,10 +5,10 @@
    "execution_count": 1,
    "metadata": {
     "papermill": {
-     "duration": 0.537757,
-     "end_time": "2020-04-22T07:26:03.736336",
+     "duration": 1.60642,
+     "end_time": "2020-04-23T07:25:39.761433",
      "exception": false,
-     "start_time": "2020-04-22T07:26:03.198579",
+     "start_time": "2020-04-23T07:25:38.155013",
      "status": "completed"
     },
     "tags": []
@@ -25,10 +25,10 @@
    "execution_count": 2,
    "metadata": {
     "papermill": {
-     "duration": 0.025946,
-     "end_time": "2020-04-22T07:26:03.774138",
+     "duration": 0.027358,
+     "end_time": "2020-04-23T07:25:39.808543",
      "exception": false,
-     "start_time": "2020-04-22T07:26:03.748192",
+     "start_time": "2020-04-23T07:25:39.781185",
      "status": "completed"
     },
     "tags": [
@@ -46,10 +46,10 @@
    "execution_count": 3,
    "metadata": {
     "papermill": {
-     "duration": 0.02433,
-     "end_time": "2020-04-22T07:26:03.813292",
+     "duration": 0.023119,
+     "end_time": "2020-04-23T07:25:39.841604",
      "exception": false,
-     "start_time": "2020-04-22T07:26:03.788962",
+     "start_time": "2020-04-23T07:25:39.818485",
      "status": "completed"
     },
     "tags": [
@@ -59,7 +59,7 @@
    "outputs": [],
    "source": [
     "# Parameters\n",
-    "PAPERMILL_INPUT_PATH = \"/tmp/vwmf0jau/notebooks/process/download-covidtracking-data.ipynb\"\n",
+    "PAPERMILL_INPUT_PATH = \"/tmp/5uveaykp/notebooks/process/download-covidtracking-data.ipynb\"\n",
     "PAPERMILL_OUTPUT_PATH = \"runs/download-covidtracking-data.runs.ipynb\"\n",
     "out_folder = \"data/covidtracking\"\n"
    ]
@@ -68,10 +68,10 @@
    "cell_type": "markdown",
    "metadata": {
     "papermill": {
-     "duration": 0.007982,
-     "end_time": "2020-04-22T07:26:03.830058",
+     "duration": 0.006677,
+     "end_time": "2020-04-23T07:25:39.855331",
      "exception": false,
-     "start_time": "2020-04-22T07:26:03.822076",
+     "start_time": "2020-04-23T07:25:39.848654",
      "status": "completed"
     },
     "tags": []
@@ -87,10 +87,10 @@
    "execution_count": 4,
    "metadata": {
     "papermill": {
-     "duration": 0.255316,
-     "end_time": "2020-04-22T07:26:04.091234",
+     "duration": 0.157191,
+     "end_time": "2020-04-23T07:25:40.018550",
      "exception": false,
-     "start_time": "2020-04-22T07:26:03.835918",
+     "start_time": "2020-04-23T07:25:39.861359",
      "status": "completed"
     },
     "tags": []
@@ -107,10 +107,10 @@
    "execution_count": 5,
    "metadata": {
     "papermill": {
-     "duration": 0.026576,
-     "end_time": "2020-04-22T07:26:04.132325",
+     "duration": 0.028598,
+     "end_time": "2020-04-23T07:25:40.061751",
      "exception": false,
-     "start_time": "2020-04-22T07:26:04.105749",
+     "start_time": "2020-04-23T07:25:40.033153",
      "status": "completed"
     },
     "tags": []
@@ -129,10 +129,10 @@
    "execution_count": 6,
    "metadata": {
     "papermill": {
-     "duration": 0.07693,
-     "end_time": "2020-04-22T07:26:04.218750",
+     "duration": 0.073297,
+     "end_time": "2020-04-23T07:25:40.148737",
      "exception": false,
-     "start_time": "2020-04-22T07:26:04.141820",
+     "start_time": "2020-04-23T07:25:40.075440",
      "status": "completed"
     },
     "tags": []
@@ -246,10 +246,10 @@
    "cell_type": "markdown",
    "metadata": {
     "papermill": {
-     "duration": 0.008348,
-     "end_time": "2020-04-22T07:26:04.240058",
+     "duration": 0.007835,
+     "end_time": "2020-04-23T07:25:40.168710",
      "exception": false,
-     "start_time": "2020-04-22T07:26:04.231710",
+     "start_time": "2020-04-23T07:25:40.160875",
      "status": "completed"
     },
     "tags": []
@@ -263,10 +263,10 @@
    "execution_count": 7,
    "metadata": {
     "papermill": {
-     "duration": 0.313441,
-     "end_time": "2020-04-22T07:26:04.560698",
+     "duration": 0.249515,
+     "end_time": "2020-04-23T07:25:40.424452",
      "exception": false,
-     "start_time": "2020-04-22T07:26:04.247257",
+     "start_time": "2020-04-23T07:25:40.174937",
      "status": "completed"
     },
     "tags": []
@@ -283,10 +283,10 @@
    "execution_count": 8,
    "metadata": {
     "papermill": {
-     "duration": 0.034309,
-     "end_time": "2020-04-22T07:26:04.610677",
+     "duration": 0.031698,
+     "end_time": "2020-04-23T07:25:40.471178",
      "exception": false,
-     "start_time": "2020-04-22T07:26:04.576368",
+     "start_time": "2020-04-23T07:25:40.439480",
      "status": "completed"
     },
     "tags": []
@@ -305,10 +305,10 @@
    "execution_count": 9,
    "metadata": {
     "papermill": {
-     "duration": 0.123985,
-     "end_time": "2020-04-22T07:26:04.751067",
+     "duration": 0.118394,
+     "end_time": "2020-04-23T07:25:40.602114",
      "exception": false,
-     "start_time": "2020-04-22T07:26:04.627082",
+     "start_time": "2020-04-23T07:25:40.483720",
      "status": "completed"
     },
     "tags": []
@@ -318,7 +318,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "2620 data points\n"
+      "2676 data points\n"
      ]
     },
     {
@@ -368,51 +368,51 @@
        "  <tbody>\n",
        "    <tr>\n",
        "      <th>0</th>\n",
-       "      <td>20200421</td>\n",
+       "      <td>20200422</td>\n",
        "      <td>AK</td>\n",
-       "      <td>329.0</td>\n",
-       "      <td>10790.0</td>\n",
+       "      <td>335.0</td>\n",
+       "      <td>11824.0</td>\n",
        "      <td>NaN</td>\n",
-       "      <td>42.0</td>\n",
+       "      <td>39.0</td>\n",
        "      <td>36.0</td>\n",
        "      <td>NaN</td>\n",
        "      <td>NaN</td>\n",
        "      <td>NaN</td>\n",
        "      <td>...</td>\n",
        "      <td>36.0</td>\n",
-       "      <td>11119.0</td>\n",
-       "      <td>11119.0</td>\n",
-       "      <td>11119.0</td>\n",
+       "      <td>12159.0</td>\n",
+       "      <td>12159.0</td>\n",
+       "      <td>12159.0</td>\n",
        "      <td>2</td>\n",
        "      <td>0.0</td>\n",
        "      <td>0.0</td>\n",
-       "      <td>987.0</td>\n",
-       "      <td>8.0</td>\n",
-       "      <td>995.0</td>\n",
+       "      <td>1034.0</td>\n",
+       "      <td>6.0</td>\n",
+       "      <td>1040.0</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>1</th>\n",
-       "      <td>20200421</td>\n",
+       "      <td>20200422</td>\n",
        "      <td>AL</td>\n",
-       "      <td>5231.0</td>\n",
+       "      <td>5465.0</td>\n",
        "      <td>43295.0</td>\n",
        "      <td>NaN</td>\n",
        "      <td>NaN</td>\n",
-       "      <td>699.0</td>\n",
+       "      <td>730.0</td>\n",
        "      <td>NaN</td>\n",
-       "      <td>260.0</td>\n",
+       "      <td>288.0</td>\n",
        "      <td>NaN</td>\n",
        "      <td>...</td>\n",
-       "      <td>699.0</td>\n",
-       "      <td>48526.0</td>\n",
-       "      <td>48526.0</td>\n",
-       "      <td>48526.0</td>\n",
+       "      <td>730.0</td>\n",
+       "      <td>48760.0</td>\n",
+       "      <td>48760.0</td>\n",
+       "      <td>48760.0</td>\n",
        "      <td>1</td>\n",
-       "      <td>10.0</td>\n",
-       "      <td>58.0</td>\n",
-       "      <td>2420.0</td>\n",
-       "      <td>206.0</td>\n",
-       "      <td>2626.0</td>\n",
+       "      <td>17.0</td>\n",
+       "      <td>31.0</td>\n",
+       "      <td>0.0</td>\n",
+       "      <td>234.0</td>\n",
+       "      <td>234.0</td>\n",
        "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
@@ -421,24 +421,24 @@
       ],
       "text/plain": [
        "       date state  positive  negative  pending  hospitalizedCurrently  \\\n",
-       "0  20200421    AK     329.0   10790.0      NaN                   42.0   \n",
-       "1  20200421    AL    5231.0   43295.0      NaN                    NaN   \n",
+       "0  20200422    AK     335.0   11824.0      NaN                   39.0   \n",
+       "1  20200422    AL    5465.0   43295.0      NaN                    NaN   \n",
        "\n",
        "   hospitalizedCumulative  inIcuCurrently  inIcuCumulative  \\\n",
        "0                    36.0             NaN              NaN   \n",
-       "1                   699.0             NaN            260.0   \n",
+       "1                   730.0             NaN            288.0   \n",
        "\n",
        "   onVentilatorCurrently  ...  hospitalized    total totalTestResults  \\\n",
-       "0                    NaN  ...          36.0  11119.0          11119.0   \n",
-       "1                    NaN  ...         699.0  48526.0          48526.0   \n",
+       "0                    NaN  ...          36.0  12159.0          12159.0   \n",
+       "1                    NaN  ...         730.0  48760.0          48760.0   \n",
        "\n",
        "    posNeg  fips  deathIncrease  hospitalizedIncrease  negativeIncrease  \\\n",
-       "0  11119.0     2            0.0                   0.0             987.0   \n",
-       "1  48526.0     1           10.0                  58.0            2420.0   \n",
+       "0  12159.0     2            0.0                   0.0            1034.0   \n",
+       "1  48760.0     1           17.0                  31.0               0.0   \n",
        "\n",
        "   positiveIncrease  totalTestResultsIncrease  \n",
-       "0               8.0                     995.0  \n",
-       "1             206.0                    2626.0  \n",
+       "0               6.0                    1040.0  \n",
+       "1             234.0                     234.0  \n",
        "\n",
        "[2 rows x 25 columns]"
       ]
@@ -474,18 +474,18 @@
    "version": "3.7.3"
   },
   "papermill": {
-   "duration": 3.020416,
-   "end_time": "2020-04-22T07:26:05.182696",
+   "duration": 3.812008,
+   "end_time": "2020-04-23T07:25:40.931308",
    "environment_variables": {},
    "exception": null,
-   "input_path": "/tmp/vwmf0jau/notebooks/process/download-covidtracking-data.ipynb",
+   "input_path": "/tmp/5uveaykp/notebooks/process/download-covidtracking-data.ipynb",
    "output_path": "runs/download-covidtracking-data.runs.ipynb",
    "parameters": {
-    "PAPERMILL_INPUT_PATH": "/tmp/vwmf0jau/notebooks/process/download-covidtracking-data.ipynb",
+    "PAPERMILL_INPUT_PATH": "/tmp/5uveaykp/notebooks/process/download-covidtracking-data.ipynb",
     "PAPERMILL_OUTPUT_PATH": "runs/download-covidtracking-data.runs.ipynb",
     "out_folder": "data/covidtracking"
    },
-   "start_time": "2020-04-22T07:26:02.162280",
+   "start_time": "2020-04-23T07:25:37.119300",
    "version": "1.1.0"
   }
  },
-- 
GitLab