From 2d6af889d0794b05b83c71c38178f4541a696b4c Mon Sep 17 00:00:00 2001 From: "CR (covid cron)" <cramakri+covid-cron@ethz.ch> Date: Wed, 25 Mar 2020 08:22:58 +0000 Subject: [PATCH] renku rerun data/covidtracking/states-metadata.json data/covidtracking/states-daily.json --- .../349ff7f9cbbd41febc2ee66f691da823.cwl | 120 ++++++++++++++++++ data/covidtracking/states-daily.json | 4 +- data/covidtracking/states-metadata.json | 4 +- runs/download-covidtracking-data.runs.ipynb | 112 ++++++++-------- 4 files changed, 180 insertions(+), 60 deletions(-) create mode 100644 .renku/workflow/349ff7f9cbbd41febc2ee66f691da823.cwl diff --git a/.renku/workflow/349ff7f9cbbd41febc2ee66f691da823.cwl b/.renku/workflow/349ff7f9cbbd41febc2ee66f691da823.cwl new file mode 100644 index 00000000..453e6e03 --- /dev/null +++ b/.renku/workflow/349ff7f9cbbd41febc2ee66f691da823.cwl @@ -0,0 +1,120 @@ +class: Workflow +cwlVersion: v1.0 +hints: [] +inputs: + input_1: + default: states-daily.json + streamable: false + type: string + input_2: + default: states-metadata.json + streamable: false + type: string + input_3: + default: out_folder + streamable: false + type: string + input_4: + default: data/covidtracking + streamable: false + type: string + input_5: + default: + class: File + path: ../../notebooks/process/download-covidtracking-data.ipynb + streamable: false + type: File + input_6: + default: runs/download-covidtracking-data.runs.ipynb + streamable: false + type: string +outputs: + output_0: + outputSource: step_3/output_1 + streamable: false + type: Directory + output_3: + outputSource: step_3/output_0 + streamable: false + type: File +requirements: [] +steps: + step_1: + in: + filename: input_1 + input_directory: step_3/output_1 + out: + - output_file + run: + arguments: [] + baseCommand: + - 'true' + class: CommandLineTool + cwlVersion: v1.0 + hints: [] + inputs: + filename: + default: states-daily.json + streamable: false + type: string + input_directory: + streamable: false + type: Directory + outputs: + output_file: + outputBinding: + glob: $(inputs.filename) + streamable: false + type: File + permanentFailCodes: [] + requirements: + - &id001 + class: InlineJavascriptRequirement + - &id002 + class: InitialWorkDirRequirement + listing: $(inputs.input_directory.listing) + successCodes: [] + temporaryFailCodes: [] + step_2: + in: + filename: input_2 + input_directory: step_3/output_1 + out: + - output_file + run: + arguments: [] + baseCommand: + - 'true' + class: CommandLineTool + cwlVersion: v1.0 + hints: [] + inputs: + filename: + default: states-metadata.json + streamable: false + type: string + input_directory: + streamable: false + type: Directory + outputs: + output_file: + outputBinding: + glob: $(inputs.filename) + streamable: false + type: File + permanentFailCodes: [] + requirements: + - *id001 + - *id002 + successCodes: [] + temporaryFailCodes: [] + step_3: + in: + input_1: input_3 + input_2: input_4 + input_3: input_5 + input_4: input_6 + out: + - output_1 + - output_0 + run: ff5f474d38144c5d882c0036bd1059c2_papermill.cwl diff --git a/data/covidtracking/states-daily.json b/data/covidtracking/states-daily.json index a6234d1e..ee2b6bc8 100644 --- a/data/covidtracking/states-daily.json +++ b/data/covidtracking/states-daily.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:04a4bbec05fc52248512469d41ee013fdce83b6fef928e9562dfe801ad82aff9 -size 151715 +oid sha256:4b0927c74f3dbb27dacfddb47b00d2c543f8ec932625dc1502b3d048fcc2668e +size 160445 diff --git a/data/covidtracking/states-metadata.json b/data/covidtracking/states-metadata.json index 55645103..08dcd867 100644 --- a/data/covidtracking/states-metadata.json +++ b/data/covidtracking/states-metadata.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7eaff61b1c975bf893a6e7e35a694980140435ce8cb5afc02164ce685cfa5baa -size 25218 +oid sha256:02330f655200284fbdaef1b3d4272cc84385c648ce7c3b73d910a0cacc3fa529 +size 25509 diff --git a/runs/download-covidtracking-data.runs.ipynb b/runs/download-covidtracking-data.runs.ipynb index 24fe640f..5c6e420d 100644 --- a/runs/download-covidtracking-data.runs.ipynb +++ b/runs/download-covidtracking-data.runs.ipynb @@ -5,10 +5,10 @@ "execution_count": 1, "metadata": { "papermill": { - "duration": 1.484962, - "end_time": "2020-03-24T11:08:51.882283", + "duration": 0.564716, + "end_time": "2020-03-25T08:22:56.714459", "exception": false, - "start_time": "2020-03-24T11:08:50.397321", + "start_time": "2020-03-25T08:22:56.149743", "status": "completed" }, "tags": [] @@ -25,10 +25,10 @@ "execution_count": 2, "metadata": { "papermill": { - "duration": 0.034224, - "end_time": "2020-03-24T11:08:51.927200", + "duration": 0.019507, + "end_time": "2020-03-25T08:22:56.745116", "exception": false, - "start_time": "2020-03-24T11:08:51.892976", + "start_time": "2020-03-25T08:22:56.725609", "status": "completed" }, "tags": [ @@ -46,10 +46,10 @@ "execution_count": 3, "metadata": { "papermill": { - "duration": 0.024298, - "end_time": "2020-03-24T11:08:51.965529", + "duration": 0.018572, + "end_time": "2020-03-25T08:22:56.773076", "exception": false, - "start_time": "2020-03-24T11:08:51.941231", + "start_time": "2020-03-25T08:22:56.754504", "status": "completed" }, "tags": [ @@ -59,7 +59,7 @@ "outputs": [], "source": [ "# Parameters\n", - "PAPERMILL_INPUT_PATH = \"/tmp/kq4860jy/notebooks/process/download-covidtracking-data.ipynb\"\n", + "PAPERMILL_INPUT_PATH = \"/tmp/e18fw9c9/notebooks/process/download-covidtracking-data.ipynb\"\n", "PAPERMILL_OUTPUT_PATH = \"runs/download-covidtracking-data.runs.ipynb\"\n", "out_folder = \"data/covidtracking\"\n" ] @@ -68,10 +68,10 @@ "cell_type": "markdown", "metadata": { "papermill": { - "duration": 0.007354, - "end_time": "2020-03-24T11:08:51.981277", + "duration": 0.007795, + "end_time": "2020-03-25T08:22:56.790849", "exception": false, - "start_time": "2020-03-24T11:08:51.973923", + "start_time": "2020-03-25T08:22:56.783054", "status": "completed" }, "tags": [] @@ -87,10 +87,10 @@ "execution_count": 4, "metadata": { "papermill": { - "duration": 1.994092, - "end_time": "2020-03-24T11:08:53.981279", + "duration": 1.020789, + "end_time": "2020-03-25T08:22:57.818863", "exception": false, - "start_time": "2020-03-24T11:08:51.987187", + "start_time": "2020-03-25T08:22:56.798074", "status": "completed" }, "tags": [] @@ -107,10 +107,10 @@ "execution_count": 5, "metadata": { "papermill": { - "duration": 0.028446, - "end_time": "2020-03-24T11:08:54.020108", + "duration": 0.022913, + "end_time": "2020-03-25T08:22:57.852810", "exception": false, - "start_time": "2020-03-24T11:08:53.991662", + "start_time": "2020-03-25T08:22:57.829897", "status": "completed" }, "tags": [] @@ -129,10 +129,10 @@ "execution_count": 6, "metadata": { "papermill": { - "duration": 0.080991, - "end_time": "2020-03-24T11:08:54.110615", + "duration": 0.066514, + "end_time": "2020-03-25T08:22:57.927763", "exception": false, - "start_time": "2020-03-24T11:08:54.029624", + "start_time": "2020-03-25T08:22:57.861249", "status": "completed" }, "tags": [] @@ -199,7 +199,7 @@ " <td>@alpublichealth</td>\n", " <td>No data</td>\n", " <td>False</td>\n", - " <td>Last negative count from 3/16. Last update tim...</td>\n", + " <td>Last update time taken from [main page](http:/...</td>\n", " <td>Alabama</td>\n", " </tr>\n", " </tbody>\n", @@ -221,7 +221,7 @@ "\n", " pui pum notes name \n", "0 All data False We count the reported number as \"persons teste... Alaska \n", - "1 No data False Last negative count from 3/16. Last update tim... Alabama " + "1 No data False Last update time taken from [main page](http:/... Alabama " ] }, "execution_count": 6, @@ -239,10 +239,10 @@ "cell_type": "markdown", "metadata": { "papermill": { - "duration": 0.010469, - "end_time": "2020-03-24T11:08:54.132051", + "duration": 0.008089, + "end_time": "2020-03-25T08:22:57.947587", "exception": false, - "start_time": "2020-03-24T11:08:54.121582", + "start_time": "2020-03-25T08:22:57.939498", "status": "completed" }, "tags": [] @@ -256,10 +256,10 @@ "execution_count": 7, "metadata": { "papermill": { - "duration": 0.162493, - "end_time": "2020-03-24T11:08:54.304650", + "duration": 0.184993, + "end_time": "2020-03-25T08:22:58.140940", "exception": false, - "start_time": "2020-03-24T11:08:54.142157", + "start_time": "2020-03-25T08:22:57.955947", "status": "completed" }, "tags": [] @@ -276,10 +276,10 @@ "execution_count": 8, "metadata": { "papermill": { - "duration": 0.02792, - "end_time": "2020-03-24T11:08:54.344357", + "duration": 0.022977, + "end_time": "2020-03-25T08:22:58.177014", "exception": false, - "start_time": "2020-03-24T11:08:54.316437", + "start_time": "2020-03-25T08:22:58.154037", "status": "completed" }, "tags": [] @@ -298,10 +298,10 @@ "execution_count": 9, "metadata": { "papermill": { - "duration": 0.06445, - "end_time": "2020-03-24T11:08:54.419822", + "duration": 0.060602, + "end_time": "2020-03-25T08:22:58.251228", "exception": false, - "start_time": "2020-03-24T11:08:54.355372", + "start_time": "2020-03-25T08:22:58.190626", "status": "completed" }, "tags": [] @@ -311,7 +311,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "981 data points\n" + "1037 data points\n" ] }, { @@ -349,27 +349,27 @@ " <tbody>\n", " <tr>\n", " <th>0</th>\n", - " <td>20200323</td>\n", + " <td>20200324</td>\n", " <td>AK</td>\n", - " <td>22.0</td>\n", - " <td>946.0</td>\n", + " <td>36.0</td>\n", + " <td>986.0</td>\n", " <td>NaN</td>\n", " <td>0.0</td>\n", " <td>NaN</td>\n", - " <td>968</td>\n", - " <td>2020-03-23T20:00:00Z</td>\n", + " <td>1022</td>\n", + " <td>2020-03-24T20:00:00Z</td>\n", " </tr>\n", " <tr>\n", " <th>1</th>\n", - " <td>20200323</td>\n", + " <td>20200324</td>\n", " <td>AL</td>\n", - " <td>167.0</td>\n", - " <td>1665.0</td>\n", + " <td>215.0</td>\n", + " <td>2106.0</td>\n", " <td>NaN</td>\n", " <td>NaN</td>\n", " <td>0.0</td>\n", - " <td>1832</td>\n", - " <td>2020-03-23T20:00:00Z</td>\n", + " <td>2321</td>\n", + " <td>2020-03-24T20:00:00Z</td>\n", " </tr>\n", " </tbody>\n", "</table>\n", @@ -377,12 +377,12 @@ ], "text/plain": [ " date state positive negative pending hospitalized death total \\\n", - "0 20200323 AK 22.0 946.0 NaN 0.0 NaN 968 \n", - "1 20200323 AL 167.0 1665.0 NaN NaN 0.0 1832 \n", + "0 20200324 AK 36.0 986.0 NaN 0.0 NaN 1022 \n", + "1 20200324 AL 215.0 2106.0 NaN NaN 0.0 2321 \n", "\n", " dateChecked \n", - "0 2020-03-23T20:00:00Z \n", - "1 2020-03-23T20:00:00Z " + "0 2020-03-24T20:00:00Z \n", + "1 2020-03-24T20:00:00Z " ] }, "execution_count": 9, @@ -416,18 +416,18 @@ "version": "3.7.3" }, "papermill": { - "duration": 5.713541, - "end_time": "2020-03-24T11:08:54.762805", + "duration": 3.460914, + "end_time": "2020-03-25T08:22:58.575452", "environment_variables": {}, "exception": null, - "input_path": "/tmp/kq4860jy/notebooks/process/download-covidtracking-data.ipynb", + "input_path": "/tmp/e18fw9c9/notebooks/process/download-covidtracking-data.ipynb", "output_path": "runs/download-covidtracking-data.runs.ipynb", "parameters": { - "PAPERMILL_INPUT_PATH": "/tmp/kq4860jy/notebooks/process/download-covidtracking-data.ipynb", + "PAPERMILL_INPUT_PATH": "/tmp/e18fw9c9/notebooks/process/download-covidtracking-data.ipynb", "PAPERMILL_OUTPUT_PATH": "runs/download-covidtracking-data.runs.ipynb", "out_folder": "data/covidtracking" }, - "start_time": "2020-03-24T11:08:49.049264", + "start_time": "2020-03-25T08:22:55.114538", "version": "1.1.0" } }, -- GitLab