From ffcda64fd18fbcec440648635b590749534a70b1 Mon Sep 17 00:00:00 2001
From: Joshua Smith
Date: Tue, 2 Mar 2021 15:13:50 -0700
Subject: [PATCH] fix lockup on errs on every row (#151)

* fix lockup on errs on every row

* add default support and unit tests

* fix globreader file stats and misc errors
---
 .gitignore                                    |   2 +-
 apps/taskmasters/flowlord/flowlord.drawio.svg |  57 +++---
 apps/workers/sql-load/main.go                 |  10 +-
 apps/workers/sql-load/worker.go               | 129 ++++++-------
 apps/workers/sql-load/worker_test.go          | 173 ++++++++++++++----
 file/file_test.go                             |   1 -
 file/globreader.go                            |  15 +-
 7 files changed, 236 insertions(+), 151 deletions(-)

diff --git a/.gitignore b/.gitignore
index 6aeeb921..89761305 100644
--- a/.gitignore
+++ b/.gitignore
@@ -13,7 +13,7 @@ apps/workers/deduper/deduper
 apps/workers/sort2file/sort2file
 apps/utils/file-watcher/file-watcher
 */stats/stats
-*/sql-load/sql-load
+apps/workers/sql-load/sql-load
 build
 coverage
\ No newline at end of file
diff --git a/apps/taskmasters/flowlord/flowlord.drawio.svg b/apps/taskmasters/flowlord/flowlord.drawio.svg
index c0682c10..7b69e646 100644
--- a/apps/taskmasters/flowlord/flowlord.drawio.svg
+++ b/apps/taskmasters/flowlord/flowlord.drawio.svg
[SVG diagram diff omitted: repositions the "cron" element and the "workflows/" label in the flowlord drawio diagram; no textual or behavioral change]
diff --git a/apps/workers/sql-load/main.go b/apps/workers/sql-load/main.go
index 292cb400..a6cf4da5 100644
--- a/apps/workers/sql-load/main.go
+++ b/apps/workers/sql-load/main.go
@@ -19,7 +19,6 @@ type options struct {
 	MySQL bootstrap.DBOptions `toml:"mysql"`
 
 	sqlDB *sql.DB
-	// sqlxDB *sqlx.DB // used for running direct exec command
 
 	producer bus.Producer
 	fileOpts *file.Options
@@ -38,14 +37,15 @@ delete  : allows insert into pre-existing data by deleting previous data.
 	- "?delete=date:2020-07-01|id:7"
 truncate: allows insert into pre-existing table by truncating before insertion
 fields  : allows mapping different json key values to different database column names
-	- provide a list of field name mapping {json key name}:{DB column name} to be mapped
-	- ?fields=jsonKey:dbColumnName
-
+	- provide a list of field name mappings {DB column name}:{json key name}
+	- ?fields=dbColumnName:jsonKey
+cached_insert: improves insert times by caching data into a temp table
+batch_size: (default: 1000) number of rows to insert at a time (a higher number increases memory usage)
 
 Example task:
 
 {"type":"sql_load","info":"gs://bucket/path/to/file.json?table=schema.table_name&delete=date:2020-07-01|id:7"}
 {"type":"sql_load","info":"gs://bucket/path/of/files/to/load/?table=schema.table_name"}
-{"type":"sql_load","info":"gs://bucket/path/to/file.json?table=schema.table_name&delete=date:2020-07-01|id:7&fields=jsonKeyValue:dbColumnName"}`
+{"type":"sql_load","info":"gs://bucket/path/to/file.json?table=schema.table_name&delete=date:2020-07-01|id:7&fields=dbColumnName:jsonKeyValue"}`
 )
 
 func init() {
diff --git a/apps/workers/sql-load/worker.go b/apps/workers/sql-load/worker.go
index f8c52577..5692266a 100644
--- a/apps/workers/sql-load/worker.go
+++ b/apps/workers/sql-load/worker.go
@@ -11,7 +11,6 @@ import (
 	"sort"
 	"strconv"
 	"strings"
-	"sync"
 	"sync/atomic"
 	"time"
 
@@ -40,7 +39,8 @@ type worker struct {
 
 	Params InfoURI
 
-	flist []string // list of full path file(s)
+	//flist []string // list of full path file(s)
+	fReader file.Reader
 
 	ds       *DataSet // the processing data for loading
 	delQuery string   // query statement built from DeleteMap
@@ -77,7 +77,6 @@ func (o *options) newWorker(info string) task.Worker {
 	w := &worker{
 		options: *o,
 		Meta:    task.NewMeta(),
-		flist:   make([]string, 0),
 		ds:      NewDataSet(),
 	}
 
@@ -85,23 +84,12 @@ func (o *options) newWorker(info string) task.Worker {
 		return task.InvalidWorker("params uri.unmarshal: %v", err)
 	}
 
-	f, err := file.Stat(w.Params.FilePath, w.fileOpts)
+	r, err := file.NewGlobReader(w.Params.FilePath, w.fileOpts)
 	if err != nil {
-		return task.InvalidWorker("filepath os: %v", err)
-	}
-	// app will load one file or a directory of files (only one folder deep)
-	if f.IsDir {
-		list, _ := file.List(w.Params.FilePath, w.fileOpts)
-		for i := range list {
-			w.flist = append(w.flist, list[i].Path)
-		}
-	} else {
-		w.flist = append(w.flist, w.Params.FilePath)
+		return task.InvalidWorker("%v", err)
 	}
+	w.fReader = r
 
-	if len(w.flist) == 0 {
-		return task.InvalidWorker("no files found in path %s", w.Params.FilePath)
-	}
 	if len(w.Params.DeleteMap) > 0 && w.Params.Truncate {
 		return task.InvalidWorker("truncate can not be used with delete fields")
 	}
@@ -125,7 +113,7 @@ func (w *worker) DoTask(ctx context.Context) (task.Result, string) {
 	rowChan := make(chan Row, 100)
 	w.ds.dbSchema, w.ds.insertCols = PrepareMeta(w.ds.dbSchema, w.Params.FieldsMap)
 
-	go w.ds.ReadFiles(ctx, w.flist, w.fileOpts, rowChan, w.Params.SkipErr)
+	go w.ds.ReadFiles(ctx, w.fReader, rowChan, w.Params.SkipErr)
 	retry := 0
 	if w.Params.CachedInsert && w.dbDriver == "postgres" {
@@ -310,14 +298,14 @@ func (w *worker) QuerySchema() (err error) {
 
 // ReadFiles uses a files list and file.Options to read files and process data into a Dataset
 // it will build the cols and rows for each file
-func (ds *DataSet) ReadFiles(ctx context.Context, files []string, fOpts *file.Options, rowChan chan Row, skipErrors bool) {
+func (ds *DataSet) ReadFiles(ctx context.Context, files file.Reader, rowChan chan Row, skipErrors bool) {
 	errChan := make(chan error, 20)
 	dataIn := make(chan []byte, 20)
-	var wg sync.WaitGroup
+	var activeThreads int32
 	for i := 0; i < 20; i++ {
-		wg.Add(1)
+		activeThreads++
 		go func() { // unmarshaler
-			defer wg.Done()
+			defer func() { atomic.AddInt32(&activeThreads, -1) }()
 			for b := range dataIn {
 				var j Jsondata
 				if e := json.Unmarshal(b, &j); e != nil {
@@ -335,59 +323,51 @@ func (ds *DataSet) ReadFiles(ctx context.Context, files []string, fOpts *file.Op
 		}()
 	}
 
-	// read each file
-	for i := range files {
-		r, err := file.NewReader(files[i], fOpts) // create a new file reader
-		if err != nil {
-			ds.err = fmt.Errorf("new reader error %w", err)
-			break
-		}
-
-		// read the lines of the file
-	loop:
-		for {
-			select {
-			case <-ctx.Done():
+	// read the lines of the file
+loop:
+	for {
+		select {
+		case <-ctx.Done():
+			break loop
+		case err := <-errChan:
+			if skipErrors {
+				ds.skipCount++
+				log.Println(err)
+			} else {
+				ds.err = err
 				break loop
-			case e := <-errChan:
-				if skipErrors {
-					ds.skipCount++
-					log.Println(e)
-				} else {
-					ds.err = e
+			}
+		default:
+			line, err := files.ReadLine()
+			if err != nil {
+				if err == io.EOF {
 					break loop
 				}
-			default:
-				line, e := r.ReadLine()
-				if e != nil {
-					if e == io.EOF {
-						break loop
-					}
-					errChan <- fmt.Errorf("readline error %v - %w", r.Stats().Path, err)
-					continue
-				}
-				dataIn <- line
+				errChan <- fmt.Errorf("readline error %v - %w", files.Stats().Path, err)
+				continue
 			}
+			dataIn <- line
 		}
-
-		log.Println("processed file", r.Stats().Path)
-		r.Close() // close the reader
-		if ds.err != nil {
-			break
-		} // readline
-	} // read file
+	}
+	files.Close() // close the reader
+	sts := files.Stats()
+	log.Printf("processed %d files at %s", sts.Files, sts.Path)
 
 	close(dataIn)
-	wg.Wait()
-	select {
-	case e := <-errChan:
-		if skipErrors {
-			log.Println(e)
-			ds.skipCount++
-		} else {
-			ds.err = e
+	for {
+		select {
+		case e := <-errChan:
+			if skipErrors {
+				log.Println(e)
+				ds.skipCount++
+			} else {
+				ds.err = e
+			}
+		default:
+		}
+		if i := atomic.LoadInt32(&activeThreads); i == 0 {
+			break
 		}
-	default:
 	}
 	close(rowChan)
 	close(errChan)
@@ -411,6 +391,16 @@ func PrepareMeta(dbSchema []DbColumn, fieldMap map[string]string) (meta []DbColu
 		jKey := k.Name
 		if v := fieldMap[k.Name]; v != "" {
 			jKey = v
+			if k.Default == nil && !k.Nullable {
+				var s string
+				switch k.TypeName {
+				case "int":
+					s = "0"
+				case "float":
+					s = "0.0"
+				}
+				k.Default = &s
+			}
 		}
 		// skip designated fields
 		if jKey == "-" {
@@ -436,7 +426,10 @@ func MakeRow(dbSchema []DbColumn, j Jsondata) (row Row, err error) {
 	for k, f := range dbSchema {
 		v, found := j[f.JsonKey]
 		if !found && !f.Nullable {
-			return nil, fmt.Errorf("%v is required", f.JsonKey)
+			if f.Default == nil {
+				return nil, fmt.Errorf("%v is required", f.JsonKey)
+			}
+			j[f.JsonKey] = *f.Default
 		}
 		switch x := v.(type) {
 		case string:
diff --git a/apps/workers/sql-load/worker_test.go b/apps/workers/sql-load/worker_test.go
index f3632863..7d0edc90 100644
--- a/apps/workers/sql-load/worker_test.go
+++ b/apps/workers/sql-load/worker_test.go
@@ -1,6 +1,7 @@
 package main
 
 import (
+	"context"
 	"errors"
 	"os"
 	"path/filepath"
@@ -11,6 +12,7 @@ import (
 	"github.com/hydronica/trial"
 	"github.com/pcelvng/task"
 	"github.com/pcelvng/task-tools/file"
+	"github.com/pcelvng/task-tools/file/mock"
 )
 
 func TestDefaultUpdate(t *testing.T) {
@@ -64,8 +66,8 @@ func TestPrepareMeta(t *testing.T) {
 			},
 			Expected: output{
 				schema: []DbColumn{
-					{Name: "C1", JsonKey: "J1"},
-					{Name: "C2", JsonKey: "J2"},
+					{Name: "C1", JsonKey: "J1", Default: trial.StringP("")},
+					{Name: "C2", JsonKey: "J2", Default: trial.StringP("")},
 				},
 				columns: []string{"C1", "C2"},
 			},
@@ -73,14 +75,14 @@ func TestPrepareMeta(t *testing.T) {
 		"Partial json mapping": {
 			Input: input{
 				schema: []DbColumn{
-					{Name: "C1"}, {Name: "C2"},
+					{Name: "C1", Nullable: true}, {Name: "C2", Nullable: true},
 				},
 				fields: map[string]string{"C1": "J1", "C3": "J2"},
 			},
 			Expected: output{
 				schema: []DbColumn{
-					{Name: "C1", JsonKey: "J1"},
-					{Name: "C2", JsonKey: "C2"},
+					{Name: "C1", JsonKey: "J1", Nullable: true},
+					{Name: "C2", JsonKey: "C2", Nullable: true},
 				},
 				columns: []string{"C1", "C2"},
 			},
@@ -113,6 +115,24 @@ func TestPrepareMeta(t *testing.T) {
 				columns: []string{"C1", "C3"},
 			},
 		},
+		"add defaults when in fieldMap": {
+			Input: input{
+				schema: []DbColumn{
+					{Name: "id", Nullable: false, TypeName: "int"},
+					{Name: "name", Nullable: false, TypeName: "string"},
+					{Name: "value", Nullable: false, TypeName: "float"},
+				},
+				fields: map[string]string{"id": "json_id", "name": "jName", "value": "jvalue"},
+			},
+			Expected: output{
+				schema: []DbColumn{
+					{Name: "id", JsonKey: "json_id", Default: trial.StringP("0"), Nullable: false, TypeName: "int"},
+					{Name: "name", JsonKey: "jName", Default: trial.StringP(""), Nullable: false, TypeName: "string"},
+					{Name: "value", JsonKey: "jvalue", Default: trial.StringP("0.0"), Nullable: false, TypeName: "float"},
+				},
+				columns: []string{"id", "name", "value"},
+			},
+		},
 	}
 
 	trial.New(fn, cases).Test(t)
@@ -122,7 +142,7 @@ func TestMakeRow(t *testing.T) {
 	schema := []DbColumn{
 		{Name: "id", JsonKey: "id"},
 		{Name: "name", JsonKey: "name", Nullable: true},
-		{Name: "count", JsonKey: "count", TypeName: "int", Nullable: true},
+		{Name: "count", JsonKey: "count", TypeName: "int", Default: trial.StringP("0")},
 		{Name: "percent", JsonKey: "percent", TypeName: "float", Nullable: true},
 		{Name: "num", JsonKey: "num", TypeName: "int", Nullable: true},
 	}
@@ -162,9 +182,10 @@ func TestMakeRow(t *testing.T) {
 		},
 		"nulls": {
 			Input: map[string]interface{}{
-				"id": "1234",
+				"id":    "1234",
+				"count": "10",
 			},
-			Expected: Row{"1234", nil, nil, nil, nil},
+			Expected: Row{"1234", nil, int64(10), nil, nil},
 		},
 		"missing required": {
 			Input:       map[string]interface{}{},
@@ -177,6 +198,12 @@ func TestMakeRow(t *testing.T) {
 			},
 			ExpectedErr: errors.New("cannot convert number"),
 		},
+		"defaults": {
+			Input: map[string]interface{}{
+				"id": "1234",
+			},
+			Expected: Row{"1234", nil, "0", nil, nil},
+		},
 	}
 	trial.New(fn, cases).SubTest(t)
 }
@@ -189,8 +216,6 @@ func TestNewWorker(t *testing.T) {
 
 	type output struct {
 		Params     InfoURI
-		Invalid    bool
-		Msg        string
 		Count      int
 		DeleteStmt string
 	}
@@ -206,7 +231,9 @@ func TestNewWorker(t *testing.T) {
 	w.WriteLine([]byte(`{"test":"value1","testing":"value2","number":123}`))
 	w.Close()
 
-	d1, _ := filepath.Abs(f2)
+	s, _ := filepath.Abs(f2)
+	d1, _ := filepath.Split(s)
+	d1 += "*"
 
 	f3 := "./tmp1"
 	os.Mkdir(f3, 0755)
@@ -218,19 +245,20 @@ func TestNewWorker(t *testing.T) {
 		wrkr := i.options.newWorker(i.Info)
 		o := output{} // if task is invalid set values
-		o.Invalid, o.Msg = task.IsInvalidWorker(wrkr)
+		if invalid, msg := task.IsInvalidWorker(wrkr); invalid {
+			return nil, errors.New(msg)
+		}
 
 		// if the test isn't for an invalid worker set count and params
-		if !o.Invalid {
-			myw := wrkr.(*worker)
-			o.Params = myw.Params
-			o.Count = len(myw.flist)
-			o.DeleteStmt = myw.delQuery
+		myw := wrkr.(*worker)
+		o.Params = myw.Params
+		if myw.fReader != nil {
+			o.Count = int(myw.fReader.Stats().Files)
 		}
+		o.DeleteStmt = myw.delQuery
 
 		return o, nil
 	}
-	// testing cases
 	cases := trial.Cases{
 		"valid_worker": {
 			Input: input{options: &options{}, Info: d1 + "?table=schema.table_name"},
 			Expected: output{
 				Params: InfoURI{
 					FilePath:  d1,
 					Table:     "schema.table_name",
 					BatchSize: 1000,
 				},
-				Invalid: false,
-				Msg:     "",
-				Count:   1,
+				Count: 2,
 			},
 		},
 		"table_required": {
-			Input: input{options: &options{}, Info: "nothing"},
-			Expected: output{
-				Invalid: true,
-				Msg:     "params uri.unmarshal: table is required",
-			},
+			Input:       input{options: &options{}, Info: "nothing"},
+			ExpectedErr: errors.New("params uri.unmarshal: table is required"),
 		},
 		"invalid_path": {
-			Input: input{options: &options{}, Info: "missingfile.json?table=schema.table_name"},
-			Expected: output{
-				Invalid: true,
-				Msg:     "filepath os: stat missingfile.json: no such file or directory",
-			},
+			Input:       input{options: &options{}, Info: "missingfile.json?table=schema.table_name"},
+			ExpectedErr: errors.New("no files found for missingfile.json"),
 		},
 		"invalid_worker": {
-			Input: input{options: &options{}, Info: d2 + "?table=schema.table_name"},
-			Expected: output{
-				Params:  InfoURI{},
-				Invalid: true,
-				Msg:     "no files found in path " + d2,
-				Count:   0,
-			},
+			Input:       input{options: &options{}, Info: d2 + "?table=schema.table_name"},
+			ExpectedErr: errors.New("no files found for " + d2),
 		},
 		"valid_path_with_delete": {
@@ -283,8 +298,7 @@ func TestNewWorker(t *testing.T) {
 					DeleteMap: map[string]string{"date(hour_utc)": "2020-07-09", "id": "1572", "amt": "65.2154"},
 				},
 				DeleteStmt: "delete from schema.table_name where amt = 65.2154 and date(hour_utc) = '2020-07-09' and id = 1572",
-				Invalid:    false,
-				Count:      1,
+				Count:      2,
 			},
 		},
 	}
@@ -375,3 +389,82 @@ func TestCreateInserts(t *testing.T) {
 	}
 	trial.New(fn, cases).Timeout(5 * time.Second).SubTest(t)
 }
+
+func TestReadFiles(t *testing.T) {
+	c := trial.CaptureLog()
+	defer c.ReadAll()
+
+	type input struct {
+		lines      []string
+		skipErrors bool
+	}
+	type out struct {
+		rowCount  int32
+		skipCount int
+	}
+	fn := func(in trial.Input) (interface{}, error) {
+		i := in.Interface().(input)
+		ds := DataSet{
+			dbSchema: []DbColumn{
+				{Name: "id", JsonKey: "id"},
+				{Name: "name", JsonKey: "name", Nullable: true},
+				{Name: "count", JsonKey: "count", TypeName: "int", Nullable: true}},
+		}
+		reader := mock.NewReader("nop").AddLines(i.lines...)
+
+		rowChan := make(chan Row)
+		doneChan := make(chan struct{})
+		go func() {
+			for range rowChan {
+			}
+			close(doneChan)
+		}()
+		ds.ReadFiles(context.Background(), reader, rowChan, i.skipErrors)
+		<-doneChan
+		return out{rowCount: ds.rowCount, skipCount: ds.skipCount}, ds.err // number of rows or error
+	}
+	cases := trial.Cases{
+		"valid data": {
+			Input: input{
+				lines: []string{
+					`{"id":1, "name":"apple", "count":10}`,
+					`{"id":1, "name":"banana", "count":3}`,
+				},
+			},
+			Expected: out{rowCount: 2},
+		},
+		"invalid row": {
+			Input: input{
+				lines: []string{
+					`"id":1, "name":"apple", "count":10}`,
+					`{"id":1, "name":"banana", "count":3}`,
+				},
+			},
+			ShouldErr: true,
+		},
+		"all invalid": {
+			Input: input{
+				lines: []string{
+					`{`, `{`, `{`, `{`, `{`, `{`, `{`, `{`, `{`, `{`,
+					`{`, `{`, `{`, `{`, `{`, `{`, `{`, `{`, `{`, `{`,
+					`{`, `{`, `{`, `{`, `{`, `{`, `{`, `{`, `{`, `{`,
+				},
+			},
+			ShouldErr: true,
+		},
+		"skip invalids": {
+			Input: input{
+				lines: []string{
+					`{`, `{`, `{`, `{`, `{`,
+					`{"id":1, "name":"apple", "count":10}`,
+					`{"id":1, "name":"banana", "count":3}`,
+					`{"id":1, "name":"apple", "count":10}`,
+					`{"id":1, "name":"banana", "count":3}`,
+				},
+				skipErrors: true,
+			},
+			Expected: out{skipCount: 5, rowCount: 4},
+		},
+	}
+	trial.New(fn, cases).Timeout(5 * time.Second).SubTest(t)
+}
diff --git a/file/file_test.go b/file/file_test.go
index 149a9a29..8f450faf 100644
--- a/file/file_test.go
+++ b/file/file_test.go
@@ -121,7 +121,6 @@ func TestGlob_Local(t *testing.T) {
 		},
 	}
 	trial.New(fn, cases).SubTest(t)
-
 }
 
 func TestGlob_S3(t *testing.T) {
diff --git a/file/globreader.go b/file/globreader.go
index 73d32f97..4a3d5c1b 100644
--- a/file/globreader.go
+++ b/file/globreader.go
@@ -11,18 +11,20 @@ import (
 func NewGlobReader(path string, opts *Options) (_ Reader, err error) {
 	r := &GlobReader{
 		path: path,
-		opts: *opts,
 		sts: stat.Stats{
 			Path: path,
 		},
 	}
+	if opts != nil {
+		r.opts = *opts
+	}
 	if r.files, err = Glob(path, opts); err != nil {
 		return nil, err
 	}
 	if err := r.nextFile(); err != nil {
-		return nil, fmt.Errorf("no files (%d) found for %s", len(r.files), path)
+		return nil, fmt.Errorf("no files found for %s", path)
 	}
-
+	r.sts.Files = int64(len(r.files))
 	return r, nil
 }
 
@@ -54,7 +56,6 @@ func (g *GlobReader) nextFile() (err error) {
 	}
 	g.reader, err = NewReader(g.files[g.fileIndex].Path, &g.opts)
 	g.fileIndex++
-	g.sts.Files = int64(g.fileIndex)
 
 	return err
 }
@@ -75,7 +76,10 @@ func (g *GlobReader) Read(p []byte) (n int, err error) {
 }
 
 func (g *GlobReader) Close() error {
-	return g.reader.Close()
+	if g.reader != nil {
+		return g.reader.Close()
+	}
+	return nil
 }
 
 func (g *GlobReader) ReadLine() (b []byte, err error) {
@@ -100,7 +104,6 @@ func (g *GlobReader) Stats() stat.Stats {
 		sts.ByteCnt += s.ByteCnt
 		sts.LineCnt += s.LineCnt
 		sts.Size += s.Size
-		sts.Files++
 	}
 	return sts
}
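
A note for reviewers on the lockup itself: in the old ReadFiles, the reading goroutine blocked on wg.Wait() while the 20 unmarshal goroutines blocked sending to the bounded errChan (capacity 20). When every row errors, errChan fills before the workers can exit, so wg.Wait() never returns. The fix swaps the WaitGroup for an atomic counter so the consumer can keep draining errChan until every worker has exited. A minimal standalone sketch of the pattern; the jobs/errCh names and sizes are illustrative, not taken from the codebase:

```go
package main

import (
	"fmt"
	"sync/atomic"
)

func main() {
	const workers = 4
	jobs := make(chan int, 16)
	errCh := make(chan error, 2) // deliberately small, like the bounded errChan in the patch

	// track live workers with an atomic counter instead of a WaitGroup
	var active int32 = workers
	for i := 0; i < workers; i++ {
		go func() {
			defer atomic.AddInt32(&active, -1)
			for j := range jobs {
				// every job "fails", mirroring the errs-on-every-row case
				errCh <- fmt.Errorf("row %d: bad json", j)
			}
		}()
	}

	for i := 0; i < 20; i++ {
		jobs <- i
	}
	close(jobs)

	// Keep draining errors while any worker is still running. A plain
	// wg.Wait() here would deadlock once errCh filled up, because the
	// workers would all be stuck on their sends.
	skipped := 0
	for {
		select {
		case <-errCh:
			skipped++
		default:
			if atomic.LoadInt32(&active) == 0 {
				fmt.Println("skipped rows:", skipped)
				return
			}
		}
	}
}
```

The drain loop spins between checks, which is tolerable here because it only runs while the unmarshal pool is shutting down.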
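On the default support: PrepareMeta now assigns a type-based zero value ("0", "0.0", or "") as the default for any non-nullable column that is explicitly remapped via the fields param, and MakeRow substitutes that default when the json key is missing instead of failing the row. A simplified sketch of the idea, using a trimmed-down stand-in for the package's DbColumn type rather than the real one:

```go
package main

import "fmt"

// DbColumn is a cut-down stand-in for the package's column metadata.
type DbColumn struct {
	Name     string
	JsonKey  string
	TypeName string
	Nullable bool
	Default  *string
}

// addDefaults mirrors the PrepareMeta change: a non-nullable column that is
// explicitly mapped gets a zero-value default so rows missing the key load
// instead of erroring.
func addDefaults(cols []DbColumn, mapped map[string]string) []DbColumn {
	for i, c := range cols {
		if jKey, ok := mapped[c.Name]; ok {
			cols[i].JsonKey = jKey
			if c.Default == nil && !c.Nullable {
				s := "" // string default
				switch c.TypeName {
				case "int":
					s = "0"
				case "float":
					s = "0.0"
				}
				cols[i].Default = &s
			}
		}
	}
	return cols
}

func main() {
	cols := []DbColumn{
		{Name: "id", TypeName: "int"},
		{Name: "value", TypeName: "float"},
		{Name: "name", TypeName: "string"},
	}
	cols = addDefaults(cols, map[string]string{"id": "json_id", "value": "jvalue", "name": "jName"})
	for _, c := range cols {
		fmt.Printf("%s -> %s, default %q\n", c.Name, c.JsonKey, *c.Default)
	}
}
```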
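On the globreader changes: the worker no longer stats the path and branches on file versus directory; NewGlobReader accepts a file, directory, or glob pattern, tolerates nil Options, sets Stats().Files once from the match count instead of incrementing it per open, and survives Close before any file was opened. Assuming ReadLine keeps advancing through the matched files until io.EOF, which is how the worker consumes it after this patch, usage looks roughly like the following; the ./data/*.json path is illustrative:

```go
package main

import (
	"fmt"
	"io"
	"log"

	"github.com/pcelvng/task-tools/file"
)

func main() {
	// nil options fall back to defaults now that NewGlobReader guards
	// against a nil *Options instead of dereferencing it.
	r, err := file.NewGlobReader("./data/*.json", nil)
	if err != nil {
		log.Fatal(err) // e.g. "no files found for ./data/*.json"
	}
	defer r.Close()

	for {
		line, err := r.ReadLine()
		if err == io.EOF {
			break
		}
		if err != nil {
			log.Fatal(err)
		}
		fmt.Println(string(line))
	}

	sts := r.Stats()
	fmt.Printf("read %d lines from %d files\n", sts.LineCnt, sts.Files)
}
```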