diff --git a/.renku/workflow/c602368708e545f383bf6f9821b44bce.cwl b/.renku/workflow/c602368708e545f383bf6f9821b44bce.cwl new file mode 100644 index 0000000000000000000000000000000000000000..4105b2e4b7864a8c984c0fb6a1ce3eb1cd63e3e3 --- /dev/null +++ b/.renku/workflow/c602368708e545f383bf6f9821b44bce.cwl @@ -0,0 +1,120 @@ +class: Workflow +cwlVersion: v1.0 +hints: [] +inputs: + input_1: + default: states-metadata.json + streamable: false + type: string + input_2: + default: out_folder + streamable: false + type: string + input_3: + default: data/covidtracking + streamable: false + type: string + input_4: + default: + class: File + path: ../../notebooks/process/download-covidtracking-data.ipynb + streamable: false + type: File + input_5: + default: runs/download-covidtracking-data.runs.ipynb + streamable: false + type: string + input_6: + default: states-daily.json + streamable: false + type: string +outputs: + output_1: + outputSource: step_2/output_1 + streamable: false + type: Directory + output_3: + outputSource: step_2/output_0 + streamable: false + type: File +requirements: [] +steps: + step_1: + in: + filename: input_1 + input_directory: step_2/output_1 + out: + - output_file + run: + arguments: [] + baseCommand: + - 'true' + class: CommandLineTool + cwlVersion: v1.0 + hints: [] + inputs: + filename: + default: states-metadata.json + streamable: false + type: string + input_directory: + streamable: false + type: Directory + outputs: + output_file: + outputBinding: + glob: $(inputs.filename) + streamable: false + type: File + permanentFailCodes: [] + requirements: + - &id001 + class: InlineJavascriptRequirement + - &id002 + class: InitialWorkDirRequirement + listing: $(inputs.input_directory.listing) + successCodes: [] + temporaryFailCodes: [] + step_2: + in: + input_1: input_2 + input_2: input_3 + input_3: input_4 + input_4: input_5 + out: + - output_0 + - output_1 + run: a17d560c41a54f5aa307ce5f3c5effe5_papermill.cwl + step_3: + in: + filename: input_6 + input_directory: step_2/output_1 + out: + - output_file + run: + arguments: [] + baseCommand: + - 'true' + class: CommandLineTool + cwlVersion: v1.0 + hints: [] + inputs: + filename: + default: states-daily.json + streamable: false + type: string + input_directory: + streamable: false + type: Directory + outputs: + output_file: + outputBinding: + glob: $(inputs.filename) + streamable: false + type: File + permanentFailCodes: [] + requirements: + - *id001 + - *id002 + successCodes: [] + temporaryFailCodes: [] diff --git a/data/covidtracking/states-daily.json b/data/covidtracking/states-daily.json index 477b54e1d286a4e68004c182791b3dd9187523b1..0fa2e34bfea8be31486cec0146fe430a21c8f1f7 100644 --- a/data/covidtracking/states-daily.json +++ b/data/covidtracking/states-daily.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5e87f93ee9862eb047539a22da2e3e6556a9bfa833b0752eb374ea4e492e9416 -size 887669 +oid sha256:b6e3407e8bbdb4e7337536b97780656d4d89bec4f478fbf4a2d28088f55182b9 +size 921293 diff --git a/data/covidtracking/states-metadata.json b/data/covidtracking/states-metadata.json index 35bc6258dca4d5b8fe0ca881d0e13351296b85aa..b3d23a03d08cc75a08ec7a7a9d0a303d6fa4e05c 100644 --- a/data/covidtracking/states-metadata.json +++ b/data/covidtracking/states-metadata.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c64df10b6938f71ba5b9a6a8a7ace894a1c39490db19da83197867961e1796b2 -size 25883 +oid sha256:c8b0e452e664c4aaee2adeffff45577197bcb86c669992b5aacfb89be1c2adca +size 26023 diff --git a/runs/download-covidtracking-data.runs.ipynb b/runs/download-covidtracking-data.runs.ipynb index 88ceef3b886ddb502bb0cb8f3cca66cdf012528f..861714872f6d334cce7e663b623c594efef4544e 100644 --- a/runs/download-covidtracking-data.runs.ipynb +++ b/runs/download-covidtracking-data.runs.ipynb @@ -5,10 +5,10 @@ "execution_count": 1, "metadata": { "papermill": { - "duration": 4.202528, - "end_time": "2020-04-09T07:23:34.956443", + "duration": 0.658092, + "end_time": "2020-04-10T11:26:07.273010", "exception": false, - "start_time": "2020-04-09T07:23:30.753915", + "start_time": "2020-04-10T11:26:06.614918", "status": "completed" }, "tags": [] @@ -25,10 +25,10 @@ "execution_count": 2, "metadata": { "papermill": { - "duration": 0.017913, - "end_time": "2020-04-09T07:23:34.987901", + "duration": 0.020612, + "end_time": "2020-04-10T11:26:07.303953", "exception": false, - "start_time": "2020-04-09T07:23:34.969988", + "start_time": "2020-04-10T11:26:07.283341", "status": "completed" }, "tags": [ @@ -46,10 +46,10 @@ "execution_count": 3, "metadata": { "papermill": { - "duration": 0.019593, - "end_time": "2020-04-09T07:23:35.014482", + "duration": 0.018549, + "end_time": "2020-04-10T11:26:07.334871", "exception": false, - "start_time": "2020-04-09T07:23:34.994889", + "start_time": "2020-04-10T11:26:07.316322", "status": "completed" }, "tags": [ @@ -59,7 +59,7 @@ "outputs": [], "source": [ "# Parameters\n", - "PAPERMILL_INPUT_PATH = \"/tmp/hlryh8jc/notebooks/process/download-covidtracking-data.ipynb\"\n", + "PAPERMILL_INPUT_PATH = \"/tmp/n4f_867t/notebooks/process/download-covidtracking-data.ipynb\"\n", "PAPERMILL_OUTPUT_PATH = \"runs/download-covidtracking-data.runs.ipynb\"\n", "out_folder = \"data/covidtracking\"\n" ] @@ -68,10 +68,10 @@ "cell_type": "markdown", "metadata": { "papermill": { - "duration": 0.006856, - "end_time": "2020-04-09T07:23:35.031803", + "duration": 0.008027, + "end_time": "2020-04-10T11:26:07.350497", "exception": false, - "start_time": "2020-04-09T07:23:35.024947", + "start_time": "2020-04-10T11:26:07.342470", "status": "completed" }, "tags": [] @@ -87,10 +87,10 @@ "execution_count": 4, "metadata": { "papermill": { - "duration": 0.170755, - "end_time": "2020-04-09T07:23:35.209942", + "duration": 0.138051, + "end_time": "2020-04-10T11:26:07.495832", "exception": false, - "start_time": "2020-04-09T07:23:35.039187", + "start_time": "2020-04-10T11:26:07.357781", "status": "completed" }, "tags": [] @@ -107,10 +107,10 @@ "execution_count": 5, "metadata": { "papermill": { - "duration": 0.02125, - "end_time": "2020-04-09T07:23:35.245223", + "duration": 0.028556, + "end_time": "2020-04-10T11:26:07.539023", "exception": false, - "start_time": "2020-04-09T07:23:35.223973", + "start_time": "2020-04-10T11:26:07.510467", "status": "completed" }, "tags": [] @@ -129,10 +129,10 @@ "execution_count": 6, "metadata": { "papermill": { - "duration": 0.065282, - "end_time": "2020-04-09T07:23:35.319713", + "duration": 0.070746, + "end_time": "2020-04-10T11:26:07.623783", "exception": false, - "start_time": "2020-04-09T07:23:35.254431", + "start_time": "2020-04-10T11:26:07.553037", "status": "completed" }, "tags": [] @@ -246,10 +246,10 @@ "cell_type": "markdown", "metadata": { "papermill": { - "duration": 0.008302, - "end_time": "2020-04-09T07:23:35.337790", + "duration": 0.014199, + "end_time": "2020-04-10T11:26:07.655008", "exception": false, - "start_time": "2020-04-09T07:23:35.329488", + "start_time": "2020-04-10T11:26:07.640809", "status": "completed" }, "tags": [] @@ -263,10 +263,10 @@ "execution_count": 7, "metadata": { "papermill": { - "duration": 0.189186, - "end_time": "2020-04-09T07:23:35.534942", + "duration": 0.240592, + "end_time": "2020-04-10T11:26:07.910062", "exception": false, - "start_time": "2020-04-09T07:23:35.345756", + "start_time": "2020-04-10T11:26:07.669470", "status": "completed" }, "tags": [] @@ -283,10 +283,10 @@ "execution_count": 8, "metadata": { "papermill": { - "duration": 0.027995, - "end_time": "2020-04-09T07:23:35.573749", + "duration": 0.021919, + "end_time": "2020-04-10T11:26:07.940064", "exception": false, - "start_time": "2020-04-09T07:23:35.545754", + "start_time": "2020-04-10T11:26:07.918145", "status": "completed" }, "tags": [] @@ -305,10 +305,10 @@ "execution_count": 9, "metadata": { "papermill": { - "duration": 0.105936, - "end_time": "2020-04-09T07:23:35.690696", + "duration": 0.090075, + "end_time": "2020-04-10T11:26:08.038142", "exception": false, - "start_time": "2020-04-09T07:23:35.584760", + "start_time": "2020-04-10T11:26:07.948067", "status": "completed" }, "tags": [] @@ -318,7 +318,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "1877 data points\n" + "1944 data points\n" ] }, { @@ -368,10 +368,10 @@ " <tbody>\n", " <tr>\n", " <th>0</th>\n", - " <td>20200408</td>\n", + " <td>20200409</td>\n", " <td>AK</td>\n", - " <td>226.0</td>\n", - " <td>6842.0</td>\n", + " <td>235.0</td>\n", + " <td>6988.0</td>\n", " <td>NaN</td>\n", " <td>NaN</td>\n", " <td>27.0</td>\n", @@ -380,39 +380,39 @@ " <td>NaN</td>\n", " <td>...</td>\n", " <td>27.0</td>\n", - " <td>7068</td>\n", - " <td>7068</td>\n", - " <td>7068</td>\n", + " <td>7223</td>\n", + " <td>7223</td>\n", + " <td>7223</td>\n", " <td>2</td>\n", - " <td>1.0</td>\n", - " <td>4.0</td>\n", - " <td>142.0</td>\n", - " <td>13.0</td>\n", + " <td>0.0</td>\n", + " <td>0.0</td>\n", + " <td>146.0</td>\n", + " <td>9.0</td>\n", " <td>155.0</td>\n", " </tr>\n", " <tr>\n", " <th>1</th>\n", - " <td>20200408</td>\n", + " <td>20200409</td>\n", " <td>AL</td>\n", - " <td>2369.0</td>\n", - " <td>16753.0</td>\n", + " <td>2769.0</td>\n", + " <td>18058.0</td>\n", " <td>NaN</td>\n", " <td>NaN</td>\n", - " <td>314.0</td>\n", + " <td>333.0</td>\n", " <td>NaN</td>\n", " <td>NaN</td>\n", " <td>NaN</td>\n", " <td>...</td>\n", - " <td>314.0</td>\n", - " <td>19122</td>\n", - " <td>19122</td>\n", - " <td>19122</td>\n", + " <td>333.0</td>\n", + " <td>20827</td>\n", + " <td>20827</td>\n", + " <td>20827</td>\n", " <td>1</td>\n", - " <td>10.0</td>\n", - " <td>43.0</td>\n", - " <td>3956.0</td>\n", - " <td>250.0</td>\n", - " <td>4206.0</td>\n", + " <td>8.0</td>\n", + " <td>19.0</td>\n", + " <td>1305.0</td>\n", + " <td>400.0</td>\n", + " <td>1705.0</td>\n", " </tr>\n", " </tbody>\n", "</table>\n", @@ -421,24 +421,24 @@ ], "text/plain": [ " date state positive negative pending hospitalizedCurrently \\\n", - "0 20200408 AK 226.0 6842.0 NaN NaN \n", - "1 20200408 AL 2369.0 16753.0 NaN NaN \n", + "0 20200409 AK 235.0 6988.0 NaN NaN \n", + "1 20200409 AL 2769.0 18058.0 NaN NaN \n", "\n", " hospitalizedCumulative inIcuCurrently inIcuCumulative \\\n", "0 27.0 NaN NaN \n", - "1 314.0 NaN NaN \n", + "1 333.0 NaN NaN \n", "\n", " onVentilatorCurrently ... hospitalized total totalTestResults posNeg \\\n", - "0 NaN ... 27.0 7068 7068 7068 \n", - "1 NaN ... 314.0 19122 19122 19122 \n", + "0 NaN ... 27.0 7223 7223 7223 \n", + "1 NaN ... 333.0 20827 20827 20827 \n", "\n", " fips deathIncrease hospitalizedIncrease negativeIncrease \\\n", - "0 2 1.0 4.0 142.0 \n", - "1 1 10.0 43.0 3956.0 \n", + "0 2 0.0 0.0 146.0 \n", + "1 1 8.0 19.0 1305.0 \n", "\n", " positiveIncrease totalTestResultsIncrease \n", - "0 13.0 155.0 \n", - "1 250.0 4206.0 \n", + "0 9.0 155.0 \n", + "1 400.0 1705.0 \n", "\n", "[2 rows x 25 columns]" ] @@ -474,18 +474,18 @@ "version": "3.7.3" }, "papermill": { - "duration": 6.894233, - "end_time": "2020-04-09T07:23:36.011265", + "duration": 2.829674, + "end_time": "2020-04-10T11:26:08.460913", "environment_variables": {}, "exception": null, - "input_path": "/tmp/hlryh8jc/notebooks/process/download-covidtracking-data.ipynb", + "input_path": "/tmp/n4f_867t/notebooks/process/download-covidtracking-data.ipynb", "output_path": "runs/download-covidtracking-data.runs.ipynb", "parameters": { - "PAPERMILL_INPUT_PATH": "/tmp/hlryh8jc/notebooks/process/download-covidtracking-data.ipynb", + "PAPERMILL_INPUT_PATH": "/tmp/n4f_867t/notebooks/process/download-covidtracking-data.ipynb", "PAPERMILL_OUTPUT_PATH": "runs/download-covidtracking-data.runs.ipynb", "out_folder": "data/covidtracking" }, - "start_time": "2020-04-09T07:23:29.117032", + "start_time": "2020-04-10T11:26:05.631239", "version": "1.1.0" } },