From 9a18ef0a0158f136d9c7ad21816da42625797714 Mon Sep 17 00:00:00 2001 From: "CR (covid cron)" <cramakri+covid-cron@ethz.ch> Date: Wed, 8 Apr 2020 07:24:37 +0000 Subject: [PATCH] renku rerun data/covidtracking/states-metadata.json data/covidtracking/states-daily.json --- .../ac820fd3b5414df1a89556c3f4262994.cwl | 120 +++++++++++++++ data/covidtracking/states-daily.json | 4 +- data/covidtracking/states-metadata.json | 4 +- runs/download-covidtracking-data.runs.ipynb | 142 +++++++++--------- 4 files changed, 195 insertions(+), 75 deletions(-) create mode 100644 .renku/workflow/ac820fd3b5414df1a89556c3f4262994.cwl diff --git a/.renku/workflow/ac820fd3b5414df1a89556c3f4262994.cwl b/.renku/workflow/ac820fd3b5414df1a89556c3f4262994.cwl new file mode 100644 index 000000000..0e74f62c2 --- /dev/null +++ b/.renku/workflow/ac820fd3b5414df1a89556c3f4262994.cwl @@ -0,0 +1,120 @@ +class: Workflow +cwlVersion: v1.0 +hints: [] +inputs: + input_1: + default: states-metadata.json + streamable: false + type: string + input_2: + default: out_folder + streamable: false + type: string + input_3: + default: data/covidtracking + streamable: false + type: string + input_4: + default: + class: File + path: ../../notebooks/process/download-covidtracking-data.ipynb + streamable: false + type: File + input_5: + default: runs/download-covidtracking-data.runs.ipynb + streamable: false + type: string + input_6: + default: states-daily.json + streamable: false + type: string +outputs: + output_0: + outputSource: step_2/output_1 + streamable: false + type: Directory + output_2: + outputSource: step_2/output_0 + streamable: false + type: File +requirements: [] +steps: + step_1: + in: + filename: input_1 + input_directory: step_2/output_1 + out: + - output_file + run: + arguments: [] + baseCommand: + - 'true' + class: CommandLineTool + cwlVersion: v1.0 + hints: [] + inputs: + filename: + default: states-metadata.json + streamable: false + type: string + input_directory: + streamable: false + type: Directory + outputs: + output_file: + outputBinding: + glob: $(inputs.filename) + streamable: false + type: File + permanentFailCodes: [] + requirements: + - &id001 + class: InlineJavascriptRequirement + - &id002 + class: InitialWorkDirRequirement + listing: $(inputs.input_directory.listing) + successCodes: [] + temporaryFailCodes: [] + step_2: + in: + input_1: input_2 + input_2: input_3 + input_3: input_4 + input_4: input_5 + out: + - output_0 + - output_1 + run: a17d560c41a54f5aa307ce5f3c5effe5_papermill.cwl + step_3: + in: + filename: input_6 + input_directory: step_2/output_1 + out: + - output_file + run: + arguments: [] + baseCommand: + - 'true' + class: CommandLineTool + cwlVersion: v1.0 + hints: [] + inputs: + filename: + default: states-daily.json + streamable: false + type: string + input_directory: + streamable: false + type: Directory + outputs: + output_file: + outputBinding: + glob: $(inputs.filename) + streamable: false + type: File + permanentFailCodes: [] + requirements: + - *id001 + - *id002 + successCodes: [] + temporaryFailCodes: [] diff --git a/data/covidtracking/states-daily.json b/data/covidtracking/states-daily.json index 9e82cab72..2b98b1f89 100644 --- a/data/covidtracking/states-daily.json +++ b/data/covidtracking/states-daily.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a2533d0e3eaadc749bd05d9a72eef0962b6fcbb18235394fa0ae79cf334ca073 -size 825479 +oid sha256:624c4e90483859c5b4f066d76e10a91f79f14c02fb2d5a11ea660e6a3c2e5e4f +size 856825 diff --git a/data/covidtracking/states-metadata.json b/data/covidtracking/states-metadata.json index 8986b3f83..8388329e0 100644 --- a/data/covidtracking/states-metadata.json +++ b/data/covidtracking/states-metadata.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a3c7782acbff7ad8b6ec15335382e45e9fdcb4895d4bc3d2d206d31f3e4053cd -size 25405 +oid sha256:deca95d58f3cb059c7023d28cba9da0d67c1a59bf2e5aa9403bbe32d5e8cfaac +size 25520 diff --git a/runs/download-covidtracking-data.runs.ipynb b/runs/download-covidtracking-data.runs.ipynb index ae19636d3..aa9bc6674 100644 --- a/runs/download-covidtracking-data.runs.ipynb +++ b/runs/download-covidtracking-data.runs.ipynb @@ -5,10 +5,10 @@ "execution_count": 1, "metadata": { "papermill": { - "duration": 3.786663, - "end_time": "2020-04-07T07:23:43.653334", + "duration": 4.461396, + "end_time": "2020-04-08T07:24:35.331262", "exception": false, - "start_time": "2020-04-07T07:23:39.866671", + "start_time": "2020-04-08T07:24:30.869866", "status": "completed" }, "tags": [] @@ -25,10 +25,10 @@ "execution_count": 2, "metadata": { "papermill": { - "duration": 0.017429, - "end_time": "2020-04-07T07:23:43.680093", + "duration": 0.026627, + "end_time": "2020-04-08T07:24:35.373890", "exception": false, - "start_time": "2020-04-07T07:23:43.662664", + "start_time": "2020-04-08T07:24:35.347263", "status": "completed" }, "tags": [ @@ -46,10 +46,10 @@ "execution_count": 3, "metadata": { "papermill": { - "duration": 0.018377, - "end_time": "2020-04-07T07:23:43.707020", + "duration": 0.027542, + "end_time": "2020-04-08T07:24:35.414725", "exception": false, - "start_time": "2020-04-07T07:23:43.688643", + "start_time": "2020-04-08T07:24:35.387183", "status": "completed" }, "tags": [ @@ -59,7 +59,7 @@ "outputs": [], "source": [ "# Parameters\n", - "PAPERMILL_INPUT_PATH = \"/tmp/lhx0ak2n/notebooks/process/download-covidtracking-data.ipynb\"\n", + "PAPERMILL_INPUT_PATH = \"/tmp/e17s3uzn/notebooks/process/download-covidtracking-data.ipynb\"\n", "PAPERMILL_OUTPUT_PATH = \"runs/download-covidtracking-data.runs.ipynb\"\n", "out_folder = \"data/covidtracking\"\n" ] @@ -68,10 +68,10 @@ "cell_type": "markdown", "metadata": { "papermill": { - "duration": 0.00828, - "end_time": "2020-04-07T07:23:43.725251", + "duration": 0.009615, + "end_time": "2020-04-08T07:24:35.443594", "exception": false, - "start_time": "2020-04-07T07:23:43.716971", + "start_time": "2020-04-08T07:24:35.433979", "status": "completed" }, "tags": [] @@ -87,10 +87,10 @@ "execution_count": 4, "metadata": { "papermill": { - "duration": 1.688127, - "end_time": "2020-04-07T07:23:45.420727", + "duration": 0.496555, + "end_time": "2020-04-08T07:24:35.946501", "exception": false, - "start_time": "2020-04-07T07:23:43.732600", + "start_time": "2020-04-08T07:24:35.449946", "status": "completed" }, "tags": [] @@ -107,10 +107,10 @@ "execution_count": 5, "metadata": { "papermill": { - "duration": 0.021236, - "end_time": "2020-04-07T07:23:45.454724", + "duration": 0.026674, + "end_time": "2020-04-08T07:24:35.986611", "exception": false, - "start_time": "2020-04-07T07:23:45.433488", + "start_time": "2020-04-08T07:24:35.959937", "status": "completed" }, "tags": [] @@ -129,10 +129,10 @@ "execution_count": 6, "metadata": { "papermill": { - "duration": 0.067313, - "end_time": "2020-04-07T07:23:45.531445", + "duration": 0.076069, + "end_time": "2020-04-08T07:24:36.071390", "exception": false, - "start_time": "2020-04-07T07:23:45.464132", + "start_time": "2020-04-08T07:24:35.995321", "status": "completed" }, "tags": [] @@ -246,10 +246,10 @@ "cell_type": "markdown", "metadata": { "papermill": { - "duration": 0.007752, - "end_time": "2020-04-07T07:23:45.550856", + "duration": 0.008016, + "end_time": "2020-04-08T07:24:36.093347", "exception": false, - "start_time": "2020-04-07T07:23:45.543104", + "start_time": "2020-04-08T07:24:36.085331", "status": "completed" }, "tags": [] @@ -263,10 +263,10 @@ "execution_count": 7, "metadata": { "papermill": { - "duration": 0.178878, - "end_time": "2020-04-07T07:23:45.737754", + "duration": 0.289201, + "end_time": "2020-04-08T07:24:36.389295", "exception": false, - "start_time": "2020-04-07T07:23:45.558876", + "start_time": "2020-04-08T07:24:36.100094", "status": "completed" }, "tags": [] @@ -283,10 +283,10 @@ "execution_count": 8, "metadata": { "papermill": { - "duration": 0.025186, - "end_time": "2020-04-07T07:23:45.774141", + "duration": 0.027866, + "end_time": "2020-04-08T07:24:36.431887", "exception": false, - "start_time": "2020-04-07T07:23:45.748955", + "start_time": "2020-04-08T07:24:36.404021", "status": "completed" }, "tags": [] @@ -305,10 +305,10 @@ "execution_count": 9, "metadata": { "papermill": { - "duration": 0.095883, - "end_time": "2020-04-07T07:23:45.880749", + "duration": 0.099568, + "end_time": "2020-04-08T07:24:36.541506", "exception": false, - "start_time": "2020-04-07T07:23:45.784866", + "start_time": "2020-04-08T07:24:36.441938", "status": "completed" }, "tags": [] @@ -318,7 +318,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "1765 data points\n" + "1821 data points\n" ] }, { @@ -368,10 +368,10 @@ " <tbody>\n", " <tr>\n", " <th>0</th>\n", - " <td>20200406</td>\n", + " <td>20200407</td>\n", " <td>AK</td>\n", - " <td>191.0</td>\n", - " <td>6692.0</td>\n", + " <td>213.0</td>\n", + " <td>6700.0</td>\n", " <td>NaN</td>\n", " <td>NaN</td>\n", " <td>23.0</td>\n", @@ -380,39 +380,39 @@ " <td>NaN</td>\n", " <td>...</td>\n", " <td>23.0</td>\n", - " <td>6883</td>\n", - " <td>6883</td>\n", - " <td>6883</td>\n", + " <td>6913</td>\n", + " <td>6913</td>\n", + " <td>6913</td>\n", " <td>2</td>\n", " <td>0.0</td>\n", - " <td>3.0</td>\n", - " <td>593.0</td>\n", - " <td>6.0</td>\n", - " <td>599.0</td>\n", + " <td>0.0</td>\n", + " <td>8.0</td>\n", + " <td>22.0</td>\n", + " <td>30.0</td>\n", " </tr>\n", " <tr>\n", " <th>1</th>\n", - " <td>20200406</td>\n", + " <td>20200407</td>\n", " <td>AL</td>\n", - " <td>1968.0</td>\n", + " <td>2119.0</td>\n", " <td>12797.0</td>\n", " <td>NaN</td>\n", " <td>NaN</td>\n", - " <td>240.0</td>\n", + " <td>271.0</td>\n", " <td>NaN</td>\n", " <td>NaN</td>\n", " <td>NaN</td>\n", " <td>...</td>\n", - " <td>240.0</td>\n", - " <td>14765</td>\n", - " <td>14765</td>\n", - " <td>14765</td>\n", + " <td>271.0</td>\n", + " <td>14916</td>\n", + " <td>14916</td>\n", + " <td>14916</td>\n", " <td>1</td>\n", - " <td>5.0</td>\n", - " <td>9.0</td>\n", - " <td>1515.0</td>\n", - " <td>172.0</td>\n", - " <td>1687.0</td>\n", + " <td>6.0</td>\n", + " <td>31.0</td>\n", + " <td>0.0</td>\n", + " <td>151.0</td>\n", + " <td>151.0</td>\n", " </tr>\n", " </tbody>\n", "</table>\n", @@ -421,24 +421,24 @@ ], "text/plain": [ " date state positive negative pending hospitalizedCurrently \\\n", - "0 20200406 AK 191.0 6692.0 NaN NaN \n", - "1 20200406 AL 1968.0 12797.0 NaN NaN \n", + "0 20200407 AK 213.0 6700.0 NaN NaN \n", + "1 20200407 AL 2119.0 12797.0 NaN NaN \n", "\n", " hospitalizedCumulative inIcuCurrently inIcuCumulative \\\n", "0 23.0 NaN NaN \n", - "1 240.0 NaN NaN \n", + "1 271.0 NaN NaN \n", "\n", " onVentilatorCurrently ... hospitalized total totalTestResults posNeg \\\n", - "0 NaN ... 23.0 6883 6883 6883 \n", - "1 NaN ... 240.0 14765 14765 14765 \n", + "0 NaN ... 23.0 6913 6913 6913 \n", + "1 NaN ... 271.0 14916 14916 14916 \n", "\n", " fips deathIncrease hospitalizedIncrease negativeIncrease \\\n", - "0 2 0.0 3.0 593.0 \n", - "1 1 5.0 9.0 1515.0 \n", + "0 2 0.0 0.0 8.0 \n", + "1 1 6.0 31.0 0.0 \n", "\n", " positiveIncrease totalTestResultsIncrease \n", - "0 6.0 599.0 \n", - "1 172.0 1687.0 \n", + "0 22.0 30.0 \n", + "1 151.0 151.0 \n", "\n", "[2 rows x 25 columns]" ] @@ -474,18 +474,18 @@ "version": "3.7.3" }, "papermill": { - "duration": 7.815282, - "end_time": "2020-04-07T07:23:46.200468", + "duration": 8.231266, + "end_time": "2020-04-08T07:24:36.871358", "environment_variables": {}, "exception": null, - "input_path": "/tmp/lhx0ak2n/notebooks/process/download-covidtracking-data.ipynb", + "input_path": "/tmp/e17s3uzn/notebooks/process/download-covidtracking-data.ipynb", "output_path": "runs/download-covidtracking-data.runs.ipynb", "parameters": { - "PAPERMILL_INPUT_PATH": "/tmp/lhx0ak2n/notebooks/process/download-covidtracking-data.ipynb", + "PAPERMILL_INPUT_PATH": "/tmp/e17s3uzn/notebooks/process/download-covidtracking-data.ipynb", "PAPERMILL_OUTPUT_PATH": "runs/download-covidtracking-data.runs.ipynb", "out_folder": "data/covidtracking" }, - "start_time": "2020-04-07T07:23:38.385186", + "start_time": "2020-04-08T07:24:28.640092", "version": "1.1.0" } }, -- GitLab