171171
172172<h1 class="title toc-ignore">Coronavirus Dataset Data Pipeline</h1>
173173<h4 class="author">Rami Krispin</h4>
174- <h4 class="date">05 January, 2023</h4>
174+ <h4 class="date">06 January, 2023</h4>
175175
176176</div>
177177
@@ -306,8 +306,8 @@ <h4 class="tbl-info">Table Info - conf_df</h4>
306306<br/>
307307Duplicated rows: 0
308308</div>
309- <div id="htmlwidget-90cd9f0dbf4815300b10 " class="reactable html-widget" style="width:auto;height:auto;"></div>
310- <script type="application/json" data-for="htmlwidget-90cd9f0dbf4815300b10">{"x":{"tag":{"name":"Reactable","attribs":{"data":{"cols_name":["Province.State","Country.Region","Lat","Long","date","cases","type"],"cols_class":["character","character","numeric","numeric","Date","integer","character"],"cols_NAs":[213642,0,2158,2158,0,0,0],"cols_min":["NA","NA",-71.9499,-178.1165,"NA",-349116,"NA"],"cols_max":["NA","NA",71.7069,178.065,"NA",1355241,"NA"],"cols_unique":[92,201,284,285,1079,19185,1]},"columns":[{"accessor":"cols_name","name":"cols_name","type":"character"},{"accessor":"cols_class","name":"cols_class","type":"character"},{"accessor":"cols_NAs","name":"cols_NAs","type":"numeric"},{"accessor":"cols_min","name":"cols_min","type":"numeric"},{"accessor":"cols_max","name":"cols_max","type":"numeric"},{"accessor":"cols_unique","name":"cols_unique","type":"numeric"}],"defaultPageSize":7,"paginationType":"numbers","showPageInfo":true,"minRows":1,"dataKey":"45a75d264c28acfe8e18b19e0ac7274b","key":"45a75d264c28acfe8e18b19e0ac7274b"},"children":[]},"class":"reactR_markup"},"evals":[],"jsHooks":[]}</script>
309+ <div id="htmlwidget-0e5aa2ba646be0737c64 " class="reactable html-widget" style="width:auto;height:auto;"></div>
310+ <script type="application/json" data-for="htmlwidget-0e5aa2ba646be0737c64">{"x":{"tag":{"name":"Reactable","attribs":{"data":{"cols_name":["Province.State","Country.Region","Lat","Long","date","cases","type"],"cols_class":["character","character","numeric","numeric","Date","integer","character"],"cols_NAs":[213642,0,2158,2158,0,0,0],"cols_min":["NA","NA",-71.9499,-178.1165,"NA",-349116,"NA"],"cols_max":["NA","NA",71.7069,178.065,"NA",1355241,"NA"],"cols_unique":[92,201,284,285,1079,19185,1]},"columns":[{"accessor":"cols_name","name":"cols_name","type":"character"},{"accessor":"cols_class","name":"cols_class","type":"character"},{"accessor":"cols_NAs","name":"cols_NAs","type":"numeric"},{"accessor":"cols_min","name":"cols_min","type":"numeric"},{"accessor":"cols_max","name":"cols_max","type":"numeric"},{"accessor":"cols_unique","name":"cols_unique","type":"numeric"}],"defaultPageSize":7,"paginationType":"numbers","showPageInfo":true,"minRows":1,"dataKey":"45a75d264c28acfe8e18b19e0ac7274b","key":"45a75d264c28acfe8e18b19e0ac7274b"},"children":[]},"class":"reactR_markup"},"evals":[],"jsHooks":[]}</script>
311311</div>
312312</div>
313313<div id="death-cases" class="section level3">
@@ -335,8 +335,8 @@ <h4 class="tbl-info">Table Info - death_df</h4>
335335<br/>
336336Duplicated rows: 0
337337</div>
338- <div id="htmlwidget-0c8f8bf439bfba8d9400 " class="reactable html-widget" style="width:auto;height:auto;"></div>
339- <script type="application/json" data-for="htmlwidget-0c8f8bf439bfba8d9400">{"x":{"tag":{"name":"Reactable","attribs":{"data":{"cols_name":["Province.State","Country.Region","Lat","Long","date","cases","type"],"cols_class":["character","character","numeric","numeric","Date","integer","character"],"cols_NAs":[213642,0,2158,2158,0,0,0],"cols_min":["NA","NA",-71.9499,-178.1165,"NA",-1918,"NA"],"cols_max":["NA","NA",71.7069,178.065,"NA",11447,"NA"],"cols_unique":[92,201,284,285,1079,1761,1]},"columns":[{"accessor":"cols_name","name":"cols_name","type":"character"},{"accessor":"cols_class","name":"cols_class","type":"character"},{"accessor":"cols_NAs","name":"cols_NAs","type":"numeric"},{"accessor":"cols_min","name":"cols_min","type":"numeric"},{"accessor":"cols_max","name":"cols_max","type":"numeric"},{"accessor":"cols_unique","name":"cols_unique","type":"numeric"}],"defaultPageSize":7,"paginationType":"numbers","showPageInfo":true,"minRows":1,"dataKey":"7f012f099faf74c6156efc5e6e8bf1a6","key":"7f012f099faf74c6156efc5e6e8bf1a6"},"children":[]},"class":"reactR_markup"},"evals":[],"jsHooks":[]}</script>
338+ <div id="htmlwidget-399993bd43f02d57b452 " class="reactable html-widget" style="width:auto;height:auto;"></div>
339+ <script type="application/json" data-for="htmlwidget-399993bd43f02d57b452">{"x":{"tag":{"name":"Reactable","attribs":{"data":{"cols_name":["Province.State","Country.Region","Lat","Long","date","cases","type"],"cols_class":["character","character","numeric","numeric","Date","integer","character"],"cols_NAs":[213642,0,2158,2158,0,0,0],"cols_min":["NA","NA",-71.9499,-178.1165,"NA",-1918,"NA"],"cols_max":["NA","NA",71.7069,178.065,"NA",11447,"NA"],"cols_unique":[92,201,284,285,1079,1761,1]},"columns":[{"accessor":"cols_name","name":"cols_name","type":"character"},{"accessor":"cols_class","name":"cols_class","type":"character"},{"accessor":"cols_NAs","name":"cols_NAs","type":"numeric"},{"accessor":"cols_min","name":"cols_min","type":"numeric"},{"accessor":"cols_max","name":"cols_max","type":"numeric"},{"accessor":"cols_unique","name":"cols_unique","type":"numeric"}],"defaultPageSize":7,"paginationType":"numbers","showPageInfo":true,"minRows":1,"dataKey":"7f012f099faf74c6156efc5e6e8bf1a6","key":"7f012f099faf74c6156efc5e6e8bf1a6"},"children":[]},"class":"reactR_markup"},"evals":[],"jsHooks":[]}</script>
340340</div>
341341</div>
342342<div id="recovery-cases" class="section level3">
@@ -364,8 +364,8 @@ <h4 class="tbl-info">Table Info - rec_df</h4>
364364<br/>
365365Duplicated rows: 0
366366</div>
367- <div id="htmlwidget-85f0fa5f4364eceffbe7 " class="reactable html-widget" style="width:auto;height:auto;"></div>
368- <script type="application/json" data-for="htmlwidget-85f0fa5f4364eceffbe7">{"x":{"tag":{"name":"Reactable","attribs":{"data":{"cols_name":["Province.State","Country.Region","Lat","Long","date","cases","type"],"cols_class":["character","character","numeric","numeric","Date","integer","character"],"cols_NAs":[214721,0,1079,1079,0,0,0],"cols_min":["NA","NA",-71.9499,-178.1165,"NA",-30974748,"NA"],"cols_max":["NA","NA",71.7069,178.065,"NA",1123456,"NA"],"cols_unique":[76,201,273,273,1079,9190,1]},"columns":[{"accessor":"cols_name","name":"cols_name","type":"character"},{"accessor":"cols_class","name":"cols_class","type":"character"},{"accessor":"cols_NAs","name":"cols_NAs","type":"numeric"},{"accessor":"cols_min","name":"cols_min","type":"numeric"},{"accessor":"cols_max","name":"cols_max","type":"numeric"},{"accessor":"cols_unique","name":"cols_unique","type":"numeric"}],"defaultPageSize":7,"paginationType":"numbers","showPageInfo":true,"minRows":1,"dataKey":"5dc2193b0cdb1328df8fd318082ea936","key":"5dc2193b0cdb1328df8fd318082ea936"},"children":[]},"class":"reactR_markup"},"evals":[],"jsHooks":[]}</script>
367+ <div id="htmlwidget-591521d54649f48997fe " class="reactable html-widget" style="width:auto;height:auto;"></div>
368+ <script type="application/json" data-for="htmlwidget-591521d54649f48997fe">{"x":{"tag":{"name":"Reactable","attribs":{"data":{"cols_name":["Province.State","Country.Region","Lat","Long","date","cases","type"],"cols_class":["character","character","numeric","numeric","Date","integer","character"],"cols_NAs":[214721,0,1079,1079,0,0,0],"cols_min":["NA","NA",-71.9499,-178.1165,"NA",-30974748,"NA"],"cols_max":["NA","NA",71.7069,178.065,"NA",1123456,"NA"],"cols_unique":[76,201,273,273,1079,9190,1]},"columns":[{"accessor":"cols_name","name":"cols_name","type":"character"},{"accessor":"cols_class","name":"cols_class","type":"character"},{"accessor":"cols_NAs","name":"cols_NAs","type":"numeric"},{"accessor":"cols_min","name":"cols_min","type":"numeric"},{"accessor":"cols_max","name":"cols_max","type":"numeric"},{"accessor":"cols_unique","name":"cols_unique","type":"numeric"}],"defaultPageSize":7,"paginationType":"numbers","showPageInfo":true,"minRows":1,"dataKey":"5dc2193b0cdb1328df8fd318082ea936","key":"5dc2193b0cdb1328df8fd318082ea936"},"children":[]},"class":"reactR_markup"},"evals":[],"jsHooks":[]}</script>
369369</div>
370370</div>
371371<div id="append-the-data" class="section level3">
@@ -384,8 +384,8 @@ <h4 class="tbl-info">Table Info - coronavirus_temp</h4>
384384<br/>
385385Duplicated rows: 0
386386</div>
387- <div id="htmlwidget-5779b6cf7e1e01b9d0f8 " class="reactable html-widget" style="width:auto;height:auto;"></div>
388- <script type="application/json" data-for="htmlwidget-5779b6cf7e1e01b9d0f8">{"x":{"tag":{"name":"Reactable","attribs":{"data":{"cols_name":["date","province","country","lat","long","type","cases"],"cols_class":["Date","character","character","numeric","numeric","character","integer"],"cols_NAs":[0,642005,0,5395,5395,0,0],"cols_min":["NA","NA","NA",-71.9499,-178.1165,"NA",-30974748],"cols_max":["NA","NA","NA",71.7069,178.065,"NA",1355241],"cols_unique":[1079,92,201,289,290,3,21904]},"columns":[{"accessor":"cols_name","name":"cols_name","type":"character"},{"accessor":"cols_class","name":"cols_class","type":"character"},{"accessor":"cols_NAs","name":"cols_NAs","type":"numeric"},{"accessor":"cols_min","name":"cols_min","type":"numeric"},{"accessor":"cols_max","name":"cols_max","type":"numeric"},{"accessor":"cols_unique","name":"cols_unique","type":"numeric"}],"defaultPageSize":7,"paginationType":"numbers","showPageInfo":true,"minRows":1,"dataKey":"9d3b6cf74fadb70ad62a610e77d248a9","key":"9d3b6cf74fadb70ad62a610e77d248a9"},"children":[]},"class":"reactR_markup"},"evals":[],"jsHooks":[]}</script>
387+ <div id="htmlwidget-ed7227249f966915b2c6 " class="reactable html-widget" style="width:auto;height:auto;"></div>
388+ <script type="application/json" data-for="htmlwidget-ed7227249f966915b2c6">{"x":{"tag":{"name":"Reactable","attribs":{"data":{"cols_name":["date","province","country","lat","long","type","cases"],"cols_class":["Date","character","character","numeric","numeric","character","integer"],"cols_NAs":[0,642005,0,5395,5395,0,0],"cols_min":["NA","NA","NA",-71.9499,-178.1165,"NA",-30974748],"cols_max":["NA","NA","NA",71.7069,178.065,"NA",1355241],"cols_unique":[1079,92,201,289,290,3,21904]},"columns":[{"accessor":"cols_name","name":"cols_name","type":"character"},{"accessor":"cols_class","name":"cols_class","type":"character"},{"accessor":"cols_NAs","name":"cols_NAs","type":"numeric"},{"accessor":"cols_min","name":"cols_min","type":"numeric"},{"accessor":"cols_max","name":"cols_max","type":"numeric"},{"accessor":"cols_unique","name":"cols_unique","type":"numeric"}],"defaultPageSize":7,"paginationType":"numbers","showPageInfo":true,"minRows":1,"dataKey":"9d3b6cf74fadb70ad62a610e77d248a9","key":"9d3b6cf74fadb70ad62a610e77d248a9"},"children":[]},"class":"reactR_markup"},"evals":[],"jsHooks":[]}</script>
389389</div>
390390</div>
391391<div id="add-gis-codes" class="section level3">
@@ -458,8 +458,8 @@ <h4 class="tbl-info">Table Info - coronavirus</h4>
458458<br/>
459459Duplicated rows: 0
460460</div>
461- <div id="htmlwidget-b2de69cc5cf40ee43430 " class="reactable html-widget" style="width:auto;height:auto;"></div>
462- <script type="application/json" data-for="htmlwidget-b2de69cc5cf40ee43430">{"x":{"tag":{"name":"Reactable","attribs":{"data":{"cols_name":["date","province","country","lat","long","type","cases","uid","iso2","iso3","code3","combined_key","population","continent_name","continent_code"],"cols_class":["Date","character","character","numeric","numeric","character","integer","numeric","character","character","numeric","character","numeric","character","character"],"cols_NAs":[0,642005,0,5395,5395,0,0,34528,44239,44239,44239,34528,51792,44239,44239],"cols_min":["NA","NA","NA",-71.9499,-178.1165,"NA",-30974748,4,"NA","NA",4,"NA",809,"NA","NA"],"cols_max":["NA","NA","NA",71.7069,178.065,"NA",1355241,15699,"NA","NA",894,"NA",1380004385,"NA","NA"],"cols_unique":[1079,92,201,289,290,3,21904,280,223,223,222,280,274,7,7]},"columns":[{"accessor":"cols_name","name":"cols_name","type":"character"},{"accessor":"cols_class","name":"cols_class","type":"character"},{"accessor":"cols_NAs","name":"cols_NAs","type":"numeric"},{"accessor":"cols_min","name":"cols_min","type":"numeric"},{"accessor":"cols_max","name":"cols_max","type":"numeric"},{"accessor":"cols_unique","name":"cols_unique","type":"numeric"}],"defaultPageSize":15,"paginationType":"numbers","showPageInfo":true,"minRows":1,"dataKey":"8ffa406aa4e087ec12f646d72b73b04f","key":"8ffa406aa4e087ec12f646d72b73b04f"},"children":[]},"class":"reactR_markup"},"evals":[],"jsHooks":[]}</script>
461+ <div id="htmlwidget-f2cd0f2990e3459d0bbf " class="reactable html-widget" style="width:auto;height:auto;"></div>
462+ <script type="application/json" data-for="htmlwidget-f2cd0f2990e3459d0bbf">{"x":{"tag":{"name":"Reactable","attribs":{"data":{"cols_name":["date","province","country","lat","long","type","cases","uid","iso2","iso3","code3","combined_key","population","continent_name","continent_code"],"cols_class":["Date","character","character","numeric","numeric","character","integer","numeric","character","character","numeric","character","numeric","character","character"],"cols_NAs":[0,642005,0,5395,5395,0,0,34528,44239,44239,44239,34528,51792,44239,44239],"cols_min":["NA","NA","NA",-71.9499,-178.1165,"NA",-30974748,4,"NA","NA",4,"NA",809,"NA","NA"],"cols_max":["NA","NA","NA",71.7069,178.065,"NA",1355241,15699,"NA","NA",894,"NA",1380004385,"NA","NA"],"cols_unique":[1079,92,201,289,290,3,21904,280,223,223,222,280,274,7,7]},"columns":[{"accessor":"cols_name","name":"cols_name","type":"character"},{"accessor":"cols_class","name":"cols_class","type":"character"},{"accessor":"cols_NAs","name":"cols_NAs","type":"numeric"},{"accessor":"cols_min","name":"cols_min","type":"numeric"},{"accessor":"cols_max","name":"cols_max","type":"numeric"},{"accessor":"cols_unique","name":"cols_unique","type":"numeric"}],"defaultPageSize":15,"paginationType":"numbers","showPageInfo":true,"minRows":1,"dataKey":"8ffa406aa4e087ec12f646d72b73b04f","key":"8ffa406aa4e087ec12f646d72b73b04f"},"children":[]},"class":"reactR_markup"},"evals":[],"jsHooks":[]}</script>
463463</div>
464464</div>
465465<div id="data-validation" class="section level3">
@@ -492,12 +492,12 @@ <h3>Saving the data</h3>
492492load(sprintf("../data_pipelines/log_%s.RData", branch))
493493tail(log)</code></pre>
494494<pre><code>## time dataset nrows last_date update success branch
495- ## 2141 2023-01-03 16:18:32 coronavirus 917604 2023-01-02 FALSE TRUE master
496495## 2142 2023-01-04 01:02:38 coronavirus 917604 2023-01-02 FALSE TRUE master
497496## 2143 2023-01-04 08:17:18 coronavirus 918456 2023-01-03 TRUE TRUE master
498497## 2144 2023-01-04 16:23:02 coronavirus 918456 2023-01-03 FALSE TRUE master
499498## 2145 2023-01-05 01:05:09 coronavirus 918456 2023-01-03 FALSE TRUE master
500- ## 2146 2023-01-05 08:17:50 coronavirus 919308 2023-01-04 TRUE TRUE master</code></pre>
499+ ## 2146 2023-01-05 08:17:50 coronavirus 919308 2023-01-04 TRUE TRUE master
500+ ## 2147 2023-01-05 16:20:51 coronavirus 919308 2023-01-04 FALSE TRUE master</code></pre>
501501<pre class="r"><code>log_last <- log %>% dplyr::filter(update == TRUE & success == TRUE, dataset == "coronavirus") %>%
502502 dplyr::filter(time == max(time))
503503if(s && nrow(coronavirus) > log_last$nrows){
0 commit comments