diff --git a/.renku/workflow/4999a116583346fc8f64f137bece2787.cwl b/.renku/workflow/4999a116583346fc8f64f137bece2787.cwl new file mode 100644 index 0000000000000000000000000000000000000000..fe39d4a6290c000b671965d78ed939fcea8670f4 --- /dev/null +++ b/.renku/workflow/4999a116583346fc8f64f137bece2787.cwl @@ -0,0 +1,120 @@ +class: Workflow +cwlVersion: v1.0 +hints: [] +inputs: + input_1: + default: out_folder + streamable: false + type: string + input_2: + default: data/covidtracking + streamable: false + type: string + input_3: + default: + class: File + path: ../../notebooks/process/download-covidtracking-data.ipynb + streamable: false + type: File + input_4: + default: runs/download-covidtracking-data.runs.ipynb + streamable: false + type: string + input_5: + default: states-daily.json + streamable: false + type: string + input_6: + default: states-metadata.json + streamable: false + type: string +outputs: + output_0: + outputSource: step_1/output_0 + streamable: false + type: File + output_1: + outputSource: step_1/output_1 + streamable: false + type: Directory +requirements: [] +steps: + step_1: + in: + input_1: input_1 + input_2: input_2 + input_3: input_3 + input_4: input_4 + out: + - output_1 + - output_0 + run: a17d560c41a54f5aa307ce5f3c5effe5_papermill.cwl + step_2: + in: + filename: input_5 + input_directory: step_1/output_1 + out: + - output_file + run: + arguments: [] + baseCommand: + - 'true' + class: CommandLineTool + cwlVersion: v1.0 + hints: [] + inputs: + filename: + default: states-daily.json + streamable: false + type: string + input_directory: + streamable: false + type: Directory + outputs: + output_file: + outputBinding: + glob: $(inputs.filename) + streamable: false + type: File + permanentFailCodes: [] + requirements: + - &id001 + class: InlineJavascriptRequirement + - &id002 + class: InitialWorkDirRequirement + listing: $(inputs.input_directory.listing) + successCodes: [] + temporaryFailCodes: [] + step_3: + in: + filename: input_6 + input_directory: step_1/output_1 + out: + - output_file + run: + arguments: [] + baseCommand: + - 'true' + class: CommandLineTool + cwlVersion: v1.0 + hints: [] + inputs: + filename: + default: states-metadata.json + streamable: false + type: string + input_directory: + streamable: false + type: Directory + outputs: + output_file: + outputBinding: + glob: $(inputs.filename) + streamable: false + type: File + permanentFailCodes: [] + requirements: + - *id001 + - *id002 + successCodes: [] + temporaryFailCodes: [] diff --git a/data/covidtracking/states-daily.json b/data/covidtracking/states-daily.json index 79108d0ddc56b64fd90e76fe08bc702e9649c7cc..edf218b9674dd9f8fda10926290c721d9ea04d14 100644 --- a/data/covidtracking/states-daily.json +++ b/data/covidtracking/states-daily.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bdad962f55521d67f534b2aeb1badaf6b703e76057653c269428a9e327f46b25 -size 20485516 +oid sha256:bb2ad9c5ece75da5d24bcf21eb89b62878125c949f6af859c2897479a4eceb6b +size 20562632 diff --git a/data/covidtracking/states-metadata.json b/data/covidtracking/states-metadata.json index 3ae8e969bb56dd18b12fb5df9fea5fbbe6b8694b..4c46c9342a30977aa9dd58edea1a01d40add3f7d 100644 --- a/data/covidtracking/states-metadata.json +++ b/data/covidtracking/states-metadata.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1d3ae035cdae441dea198f8a30c79af627e67e76952a06595f266a56428c44cc -size 132306 +oid sha256:85f4353ea432c3e807ec92687176e5236a3bf67cd894566ffdbe3f3ab7464111 +size 137048 diff --git a/runs/download-covidtracking-data.runs.ipynb b/runs/download-covidtracking-data.runs.ipynb index b71ede25110f09d17878b684980a6aac9770fc2f..470b96d9c911399b980e68c33695f3b0ed095f5c 100644 --- a/runs/download-covidtracking-data.runs.ipynb +++ b/runs/download-covidtracking-data.runs.ipynb @@ -5,10 +5,10 @@ "execution_count": 1, "metadata": { "papermill": { - "duration": 6.475913, - "end_time": "2020-11-26T07:58:35.675162", + "duration": 5.337619, + "end_time": "2020-11-27T07:36:46.605067", "exception": false, - "start_time": "2020-11-26T07:58:29.199249", + "start_time": "2020-11-27T07:36:41.267448", "status": "completed" }, "tags": [] @@ -25,10 +25,10 @@ "execution_count": 2, "metadata": { "papermill": { - "duration": 0.020822, - "end_time": "2020-11-26T07:58:35.708619", + "duration": 0.01986, + "end_time": "2020-11-27T07:36:46.637566", "exception": false, - "start_time": "2020-11-26T07:58:35.687797", + "start_time": "2020-11-27T07:36:46.617706", "status": "completed" }, "tags": [ @@ -46,10 +46,10 @@ "execution_count": 3, "metadata": { "papermill": { - "duration": 0.017946, - "end_time": "2020-11-26T07:58:35.734541", + "duration": 0.018416, + "end_time": "2020-11-27T07:36:46.663773", "exception": false, - "start_time": "2020-11-26T07:58:35.716595", + "start_time": "2020-11-27T07:36:46.645357", "status": "completed" }, "tags": [ @@ -59,7 +59,7 @@ "outputs": [], "source": [ "# Parameters\n", - "PAPERMILL_INPUT_PATH = \"/tmp/p4r5vl68/notebooks/process/download-covidtracking-data.ipynb\"\n", + "PAPERMILL_INPUT_PATH = \"/tmp/rqwp5r7w/notebooks/process/download-covidtracking-data.ipynb\"\n", "PAPERMILL_OUTPUT_PATH = \"runs/download-covidtracking-data.runs.ipynb\"\n", "out_folder = \"data/covidtracking\"\n" ] @@ -68,10 +68,10 @@ "cell_type": "markdown", "metadata": { "papermill": { - "duration": 0.005967, - "end_time": "2020-11-26T07:58:35.746416", + "duration": 0.00507, + "end_time": "2020-11-27T07:36:46.675456", "exception": false, - "start_time": "2020-11-26T07:58:35.740449", + "start_time": "2020-11-27T07:36:46.670386", "status": "completed" }, "tags": [] @@ -87,10 +87,10 @@ "execution_count": 4, "metadata": { "papermill": { - "duration": 10.821161, - "end_time": "2020-11-26T07:58:46.572554", + "duration": 0.385069, + "end_time": "2020-11-27T07:36:47.064880", "exception": false, - "start_time": "2020-11-26T07:58:35.751393", + "start_time": "2020-11-27T07:36:46.679811", "status": "completed" }, "tags": [] @@ -107,10 +107,10 @@ "execution_count": 5, "metadata": { "papermill": { - "duration": 0.029661, - "end_time": "2020-11-26T07:58:46.614568", + "duration": 0.023918, + "end_time": "2020-11-27T07:36:47.102050", "exception": false, - "start_time": "2020-11-26T07:58:46.584907", + "start_time": "2020-11-27T07:36:47.078132", "status": "completed" }, "tags": [] @@ -129,10 +129,10 @@ "execution_count": 6, "metadata": { "papermill": { - "duration": 0.063953, - "end_time": "2020-11-26T07:58:46.690388", + "duration": 0.070892, + "end_time": "2020-11-27T07:36:47.180661", "exception": false, - "start_time": "2020-11-26T07:58:46.626435", + "start_time": "2020-11-27T07:36:47.109769", "status": "completed" }, "tags": [] @@ -284,10 +284,10 @@ "cell_type": "markdown", "metadata": { "papermill": { - "duration": 0.00631, - "end_time": "2020-11-26T07:58:46.707816", + "duration": 0.008123, + "end_time": "2020-11-27T07:36:47.201689", "exception": false, - "start_time": "2020-11-26T07:58:46.701506", + "start_time": "2020-11-27T07:36:47.193566", "status": "completed" }, "tags": [] @@ -301,10 +301,10 @@ "execution_count": 7, "metadata": { "papermill": { - "duration": 10.615746, - "end_time": "2020-11-26T07:58:57.330443", + "duration": 0.646562, + "end_time": "2020-11-27T07:36:47.854170", "exception": false, - "start_time": "2020-11-26T07:58:46.714697", + "start_time": "2020-11-27T07:36:47.207608", "status": "completed" }, "tags": [] @@ -321,10 +321,10 @@ "execution_count": 8, "metadata": { "papermill": { - "duration": 0.035601, - "end_time": "2020-11-26T07:58:57.378913", + "duration": 0.050376, + "end_time": "2020-11-27T07:36:47.919674", "exception": false, - "start_time": "2020-11-26T07:58:57.343312", + "start_time": "2020-11-27T07:36:47.869298", "status": "completed" }, "tags": [] @@ -343,10 +343,10 @@ "execution_count": 9, "metadata": { "papermill": { - "duration": 0.515161, - "end_time": "2020-11-26T07:58:57.904857", + "duration": 0.559813, + "end_time": "2020-11-27T07:36:48.493390", "exception": false, - "start_time": "2020-11-26T07:58:57.389696", + "start_time": "2020-11-27T07:36:47.933577", "status": "completed" }, "tags": [] @@ -356,7 +356,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "15017 data points\n" + "15073 data points\n" ] }, { @@ -406,21 +406,21 @@ " <tbody>\n", " <tr>\n", " <th>0</th>\n", - " <td>20201125</td>\n", + " <td>20201126</td>\n", " <td>AK</td>\n", - " <td>28339.0</td>\n", + " <td>28892.0</td>\n", " <td>NaN</td>\n", - " <td>925937.0</td>\n", + " <td>940681.0</td>\n", " <td>NaN</td>\n", " <td>totalTestsViral</td>\n", - " <td>954276.0</td>\n", + " <td>969573.0</td>\n", " <td>145.0</td>\n", - " <td>663.0</td>\n", + " <td>688.0</td>\n", " <td>...</td>\n", - " <td>954276</td>\n", - " <td>0</td>\n", - " <td>32</td>\n", - " <td>e4015d41f79fe8f9552517702ee27996c0d86b6a</td>\n", + " <td>969573</td>\n", + " <td>3</td>\n", + " <td>25</td>\n", + " <td>dcdef309762dffbb3f252251698f060c4c11e56f</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>0</td>\n", @@ -430,21 +430,21 @@ " </tr>\n", " <tr>\n", " <th>1</th>\n", - " <td>20201125</td>\n", + " <td>20201126</td>\n", " <td>AL</td>\n", - " <td>239318.0</td>\n", - " <td>39692.0</td>\n", - " <td>1353961.0</td>\n", + " <td>241957.0</td>\n", + " <td>40202.0</td>\n", + " <td>1361187.0</td>\n", " <td>NaN</td>\n", " <td>totalTestsViral</td>\n", - " <td>1553587.0</td>\n", - " <td>1483.0</td>\n", - " <td>24376.0</td>\n", + " <td>1562942.0</td>\n", + " <td>1434.0</td>\n", + " <td>24401.0</td>\n", " <td>...</td>\n", - " <td>1593279</td>\n", - " <td>60</td>\n", - " <td>216</td>\n", - " <td>cfbf3932514b39bd3f684d0fc235d8daa8009616</td>\n", + " <td>1603144</td>\n", + " <td>40</td>\n", + " <td>25</td>\n", + " <td>751d7219f69c39f0970b03836d9448ceec5db281</td>\n", " <td>0</td>\n", " <td>0</td>\n", " <td>0</td>\n", @@ -459,20 +459,20 @@ ], "text/plain": [ " date state positive probableCases negative pending \\\n", - "0 20201125 AK 28339.0 NaN 925937.0 NaN \n", - "1 20201125 AL 239318.0 39692.0 1353961.0 NaN \n", + "0 20201126 AK 28892.0 NaN 940681.0 NaN \n", + "1 20201126 AL 241957.0 40202.0 1361187.0 NaN \n", "\n", " totalTestResultsSource totalTestResults hospitalizedCurrently \\\n", - "0 totalTestsViral 954276.0 145.0 \n", - "1 totalTestsViral 1553587.0 1483.0 \n", + "0 totalTestsViral 969573.0 145.0 \n", + "1 totalTestsViral 1562942.0 1434.0 \n", "\n", " hospitalizedCumulative ... posNeg deathIncrease hospitalizedIncrease \\\n", - "0 663.0 ... 954276 0 32 \n", - "1 24376.0 ... 1593279 60 216 \n", + "0 688.0 ... 969573 3 25 \n", + "1 24401.0 ... 1603144 40 25 \n", "\n", " hash commercialScore \\\n", - "0 e4015d41f79fe8f9552517702ee27996c0d86b6a 0 \n", - "1 cfbf3932514b39bd3f684d0fc235d8daa8009616 0 \n", + "0 dcdef309762dffbb3f252251698f060c4c11e56f 0 \n", + "1 751d7219f69c39f0970b03836d9448ceec5db281 0 \n", "\n", " negativeRegularScore negativeScore positiveScore score grade \n", "0 0 0 0 0 \n", @@ -512,18 +512,18 @@ "version": "3.7.3" }, "papermill": { - "duration": 31.109234, - "end_time": "2020-11-26T07:58:58.230145", + "duration": 9.421571, + "end_time": "2020-11-27T07:36:48.817125", "environment_variables": {}, "exception": null, - "input_path": "/tmp/p4r5vl68/notebooks/process/download-covidtracking-data.ipynb", + "input_path": "/tmp/rqwp5r7w/notebooks/process/download-covidtracking-data.ipynb", "output_path": "runs/download-covidtracking-data.runs.ipynb", "parameters": { - "PAPERMILL_INPUT_PATH": "/tmp/p4r5vl68/notebooks/process/download-covidtracking-data.ipynb", + "PAPERMILL_INPUT_PATH": "/tmp/rqwp5r7w/notebooks/process/download-covidtracking-data.ipynb", "PAPERMILL_OUTPUT_PATH": "runs/download-covidtracking-data.runs.ipynb", "out_folder": "data/covidtracking" }, - "start_time": "2020-11-26T07:58:27.120911", + "start_time": "2020-11-27T07:36:39.395554", "version": "1.1.0" } },