Index: NOTES
==================================================================
--- NOTES
+++ NOTES
@@ -158,5 +158,9 @@
 INFO: (0) Server shutdown complete. Exiting
 
 Start: 0 at Sun Apr 28 22:18:25 MST 2013
 Max:  52 at Sun Apr 28 23:06:59 MST 2013
 End:   6 at Sun Apr 28 23:47:51 MST 2013
+
+========================================================================
+
+

Index: archive.scm
==================================================================
--- archive.scm
+++ archive.scm
@@ -185,13 +185,11 @@
 						partial-path-index)
 				     #f))
 	      ;; we need our archive dir checked for every test to enable folks who want to store other ways.
 	      (archive-info (archive:allocate-new-archive-block blockid-cache *toppath* tsname min-space target run-name test-name))
 	      (archive-dir  (if archive-info (cdr archive-info) #f))
-	      (archive-id   (if archive-info (car archive-info) -1))
-
-	      )
+	      (archive-id   (if archive-info (car archive-info) -1)))
 	 
 	 (if (not archive-dir) ;; no archive disk found, this is fatal
 	     (begin
 	       (debug:print 0 *default-log-port* "FATAL: No archive disks found. Please add disks with at least "
 			    min-space " MB space to the [archive-disks] section of megatest.config")
@@ -312,12 +310,14 @@
 	   (for-each
 	    (lambda (test-dat)
 	      (let ((test-id           (db:test-get-id        test-dat))
 		    (run-id            (db:test-get-run_id    test-dat)))
 		(rmt:test-set-archive-block-id run-id test-id archive-id)
-		(if (member archive-command '("save-remove"))
-		    (runs:remove-test-directory test-dat 'archive-remove))))
+		(if (member (symbol->string archive-command) '("save-remove"))
+                    (begin 
+                     (debug:print-info 0 *default-log-port* "remove testdat")
+		    (runs:remove-test-directory test-dat 'archive-remove)))))
 	    (hash-table-ref test-groups test-base)))))
        (hash-table-keys disk-groups))
     #t))
 
 (define (archive:bup-restore archive-command run-id run-name tests rp-mutex bup-mutex)  ;; move the getting of archive space down into the below block so that a single run can 

Index: common.scm
==================================================================
--- common.scm
+++ common.scm
@@ -716,14 +716,18 @@
 ;; dot-locking egg seems not to work, using this for now
 ;; if lock is older than expire-time then remove it and try again
 ;; to get the lock
 ;;
 (define (common:simple-file-lock fname #!key (expire-time 300))
+  (let ((fmod-time (handle-exceptions
+		       ext
+		     (current-seconds)
+		     (file-modification-time fname))))
     (if (common:file-exists? fname)
-	(if (> (- (current-seconds)(file-modification-time fname)) expire-time)
+	(if (> (- (current-seconds) fmod-time) expire-time)
 	    (begin
-              (handle-exceptions exn #f (delete-file* fname))	
+	      (handle-exceptions exn #f (delete-file* fname))	
 	      (common:simple-file-lock fname expire-time: expire-time))
 	    #f)
 	(let ((key-string (conc (get-host-name) "-" (current-process-id))))
 	  (with-output-to-file fname
 	    (lambda ()
@@ -733,11 +737,11 @@
 	      (handle-exceptions exn
                 #f 
                 (with-input-from-file fname
 	  	  (lambda ()
 		    (equal? key-string (read-line)))))
-	      #f))))
+	      #f)))))
 
 (define (common:simple-file-lock-and-wait fname #!key (expire-time 300))
   (let ((end-time (+ expire-time (current-seconds))))
     (let loop ((got-lock (common:simple-file-lock fname expire-time: expire-time)))
       (if got-lock
@@ -1733,11 +1737,17 @@
 	     exn
 	     #f
 	     (debug:print 2 *default-log-port* "reading file " fullpath)
 	     (let ((real-age (- (current-seconds)(file-change-time fullpath)))) 
 	       (if (< real-age age)
-		   (with-input-from-file fullpath read)
+		   (handle-exceptions
+		       exn
+		     (begin
+		       (debug:print-info 1 *default-log-port* " removing bad file " fullpath)
+		       (delete-file* fullpath)
+		       #f)
+		     (with-input-from-file fullpath read))
 		   (begin
 		     (debug:print-info 2 *default-log-port* "file " fullpath " is too old (" real-age" seconds) to trust, skipping reading it")
 		     #f))))
 	    (begin
 	      (debug:print 2 *default-log-port* "not reading file " fullpath)
@@ -2044,11 +2054,13 @@
 	 (numcpus (if (<= 1 numcpus-in) ;; not possible to have zero.  If we get 1, it's possible that we got the previous default, and we should check again
 		      (common:get-num-cpus remote-host)
 		      numcpus-in))
 	 (maxload (if force-maxload
 		      maxload-in
-		      (max maxload-in 0.5))) ;; so maxload must be greater than 0.5 for now BUG - FIXME?
+		      (if (number? maxload-in)
+			  (max maxload-in 0.5)
+			  0.5))) ;; so maxload must be greater than 0.5 for now BUG - FIXME?
 	 (first   (car loadavg))
 	 (next    (cadr loadavg))
 	 (adjmaxload (* maxload (max 1 numcpus))) ;; possible bug where
 					       ;; numcpus (or could be
 					       ;; maxload) is zero,

Index: db.scm
==================================================================
--- db.scm
+++ db.scm
@@ -1698,11 +1698,11 @@
               (begin
                 (debug:print-info 0 *default-log-port* "Found old test in REMOTEHOSTSTART state, test-id=" test-id" exceeded running-deadtime "running-deadtime" now="(current-seconds)" event-time="event-time" run-duration="run-duration)
                 (set! incompleted (cons (list test-id run-dir uname testname item-path run-id) incompleted)))))
         db
         "SELECT id,rundir,uname,testname,item_path,event_time,run_duration FROM tests WHERE run_id=? AND (strftime('%s','now') - event_time) > (run_duration + ?) AND state IN ('REMOTEHOSTSTART');"
-        run-id remotehoststart-deadtime) ;; default time 230 seconds.
+        run-id remotehoststart-deadtime) ;; default time 230 seconds
 
        ;; in LAUNCHED for more than one day. Could be long due to job queues TODO/BUG: Need override for this in config
        ;;
        ;; (db:delay-if-busy dbdat)
        (sqlite3:for-each-row
@@ -1732,36 +1732,37 @@
               ;;      		    incompleted))
               (min-incompleted-ids (map car incompleted)) ;; do 'em all
               (all-ids             (append min-incompleted-ids (map car oldlaunched))))
          (if (> (length all-ids) 0)
              (begin
+	       ;; (launch:is-test-alive "localhost" 435)
                (debug:print 0 *default-log-port* "WARNING: Marking test(s); " (string-intersperse (map conc all-ids) ", ") " as DEAD")
                (for-each
                   (lambda (test-id)
-                    (let* (
-                      (run-dir (db:test-get-rundir-from-test-id dbstruct run-id test-id))
-                      (result (db:get-status-from-final-status-file run-dir)))
-                    (if (and (list? result) (> (length result) 1) (equal? "PASS" (cadr result)) (equal? "COMPLETED" (car result))) 
-                      (begin
-                        (debug:print 0 *default-log-port* "INFO: test " test-id " actually passed, so marking PASS not DEAD")
-                        (db:set-state-status-and-roll-up-items dbstruct run-id test-id 'foo "COMPLETED" "PASS" "Test stopped responding but it has PASSED; marking it PASS in the DB.")
-                      )
-                      (begin
-                      (debug:print 0 *default-log-port* "INFO: test " test-id " final state/status is not COMPLETED/PASS. It is " result)
-                      (db:set-state-status-and-roll-up-items dbstruct run-id test-id 'foo "COMPLETED" "DEAD" "Test stopped responding while in RUNNING or REMOTEHOSTSTART; presumed dead.")
-                      )
-                     )
-                    )
-                  )
-                  all-ids)
-             )
-         )
-       )
-     )
-   )
- )
-)
+                    (let* (;; (run-dir (db:test-get-rundir-from-test-id dbstruct run-id test-id))
+			   (tinfo   (db:get-test-info-by-id dbstruct run-id test-id))
+			   (run-dir (db:test-get-rundir     tinfo))
+			   (host    (db:test-get-host       tinfo))
+			   (pid     (db:test-get-process_id tinfo))
+			   (result (db:get-status-from-final-status-file run-dir)))
+		      (if (and (list? result) (> (length result) 1) (equal? "PASS" (cadr result)) (equal? "COMPLETED" (car result))) 
+			  (begin
+			    (debug:print 0 *default-log-port* "INFO: test " test-id " actually passed, so marking PASS not DEAD")
+			    (db:set-state-status-and-roll-up-items dbstruct run-id test-id 'foo "COMPLETED" "PASS"
+								   "Test stopped responding but it has PASSED; marking it PASS in the DB."))
+			  (let ((is-alive (launch:is-test-alive host pid)))
+			    (if is-alive
+				(debug:print 0 *default-log-port* "INFO: test " test-id " on host " host " has a process on pid " pid ", NOT setting to DEAD.")
+				(begin
+				  (debug:print 0 *default-log-port* "INFO: test " test-id " final state/status is not COMPLETED/PASS. It is " result)
+				  (db:set-state-status-and-roll-up-items dbstruct run-id test-id 'foo "COMPLETED" "DEAD"
+									 "Test stopped responding while in RUNNING or REMOTEHOSTSTART; presumed dead.")))))))
+		  all-ids)
+	       ;; call end-of-run detection so the post hook can be triggered
+	       (launch:end-of-run-check run-id)
+	       )))))))
+
 
 ;; ALL REPLACED BY THE BLOCK ABOVE
 ;;
 ;; 	    (sqlite3:execute 
 ;; 	     db

Index: docs/manual/megatest_manual.html
==================================================================
--- docs/manual/megatest_manual.html
+++ docs/manual/megatest_manual.html
@@ -769,13 +769,13 @@
 <h1>The Megatest Users Manual</h1>
 <span id="author">Matt Welland</span><br>
 <span id="email" class="monospaced">&lt;<a href="mailto:matt@kiatoa.com">matt@kiatoa.com</a>&gt;</span><br>
 <span id="revnumber">version 1.5,</span>
 <span id="revdate">June 2020</span>
-<div id="toc">
-  <div id="toctitle">Table of Contents</div>
-  <noscript><p><b>JavaScript must be enabled in your browser to display the table of contents.</b></p></noscript>
+<div id="toc">
+  <div id="toctitle">Table of Contents</div>
+  <noscript><p><b>JavaScript must be enabled in your browser to display the table of contents.</b></p></noscript>
 </div>
 </div>
 <div id="content">
 <div class="sect1">
 <h2 id="_preface">Preface</h2>
@@ -2588,10 +2588,32 @@
 A x y
 B 1 2
 
 # Yields x/1 y/2</pre>
 </div></div>
+<div class="listingblock">
+<div class="title">Or use files</div>
+<div class="content monospaced">
+<pre>[itemopts]
+slash path/to/file/with/items
+# or
+space path/to/file/with/items</pre>
+</div></div>
+<div class="listingblock">
+<div class="title">File format for / delimited</div>
+<div class="content monospaced">
+<pre>key1/key2/key3
+val1/val2/val3
+...</pre>
+</div></div>
+<div class="listingblock">
+<div class="title">File format for space delimited</div>
+<div class="content monospaced">
+<pre>key1 key2 key3
+val1 val2 val2
+...</pre>
+</div></div>
 </div>
 <div class="sect2">
 <h3 id="_requirements_section">Requirements section</h3>
 <div class="listingblock">
 <div class="title">Header</div>
@@ -3380,11 +3402,11 @@
 </div>
 <div id="footnotes"><hr></div>
 <div id="footer">
 <div id="footer-text">
 Version 1.5<br>
-Last updated
+Last updated 2020-07-22 14:21:46 PDT
  2020-06-16 23:02:26 MST
 </div>
 </div>
 </body>
 </html>

Index: docs/manual/reference.txt
==================================================================
--- docs/manual/reference.txt
+++ docs/manual/reference.txt
@@ -324,10 +324,31 @@
 B 1 2
 
 # Yields x/1 y/2
 ------------------
 
+.Or use files
+------------------
+[itemopts]
+slash path/to/file/with/items
+# or
+space path/to/file/with/items
+------------------
+
+.File format for / delimited
+------------------
+key1/key2/key3
+val1/val2/val3
+...
+------------------
+
+.File format for space delimited
+------------------
+key1 key2 key3
+val1 val2 val3
+...
+------------------
 
 Requirements section
 ~~~~~~~~~~~~~~~~~~~~
 
 .Header

Index: items.scm
==================================================================
--- items.scm
+++ items.scm
@@ -123,13 +123,63 @@
 			(if s (string-split s) #f))))
     (if valid-values
 	(if (member item valid-values)
 	    item #f)
 	item)))
+
+;;  '(("k1" "k2" "k3")
+;;    ("a" "b" "c")
+;;    ("d" "e" "f"))
+;;
+;;    => '((("k1" "a")("k2" "b")("k3" "c"))
+;;         (("k1" "d")("k2" "e")("k3" "f")))
+;;
+(define (items:first-row-intersperse data) ;; data: list of rows; the first row holds the keys, each later row holds one item's values
+  (if (< (length data) 2) ;; a header alone (or nothing at all) yields no items
+      '()
+      (let ((header (car data))
+	    (rows   (cdr data)))
+	(map (lambda (row)
+	       (map list header row)) ;; pair each key with the value in the same column: ("k1" "a") ("k2" "b") ...
+	     rows))))
+
+;; k1/k2/k3
+;; a/b/c
+;; d/e/f
+;;    => '(("k1" "k2" "k3")
+;;         ("a" "b" "c")
+;;         ("d" "e" "f"))
+;;
+;;    => '((("k1" "a")("k2" "b")("k3" "c"))
+;;         (("k1" "d")("k2" "e")("k3" "f")))
+;;
+(define (items:read-items-file fname ftype) ;; ftype: 'sxml 'slash or 'space; returns a list of items, '() when fname is #f, missing or of unknown type
+  (if (and fname (file-exists? fname))
+      (items:first-row-intersperse (case ftype
+				     ((slash space)
+				      (let ((splitter (case ftype
+							((slash) (lambda (x)(string-split x "/")))
+							(else    string-split)))) ;; 'space: split on whitespace
+					(debug:print 0 *default-log-port* "Reading " fname " of type " ftype)
+					(with-input-from-file fname
+					  (lambda ()
+					    (let loop ((inl (read-line))
+						       (res '()))
+					      (if (eof-object? inl)
+						  (reverse res) ;; rows are consed on newest-first; restore file order so the header row is first
+						  (loop (read-line)(cons (splitter inl) res))))))))
+				     ((sxml)(with-input-from-file fname read)) ;; file holds a single s-expression: header row followed by value rows
+				     (else (debug:print 0 *default-log-port* "items file type " ftype " not recognised") '()))) ;; hand back a list so the caller's (length data) is safe
+      (begin
+	(if fname (debug:print 0 *default-log-port* "no items file " fname " found"))
+	'())))
 
 (define (items:get-items-from-config tconfig)
-  (let* ((have-items  (hash-table-ref/default tconfig "items"      #f))
+  (let* ((slashf      (configf:lookup tconfig "itemopts" "slash")) ;; a/b/c\nd/e/f\n ...
+	 (sxmlf       (configf:lookup tconfig "itemopts" "sxml"))  ;; '(("a" "b" "c")("d" "e" "f") ...)
+	 (spacef      (configf:lookup tconfig "itemopts" "space")) ;; a b c\nd e f\n ...
+	 (have-items  (hash-table-ref/default tconfig "items"      #f))
 	 (have-itable (hash-table-ref/default tconfig "itemstable" #f))
 	 (items       (hash-table-ref/default tconfig "items"      '()))
 	 (itemstable  (hash-table-ref/default tconfig "itemstable" '())))
     (debug:print 5 *default-log-port* "items: " items " itemstable: " itemstable)
     (set! items (map (lambda (item)
@@ -142,14 +192,21 @@
 				(list (car item)((cadr item)))  ;; evaluate the proc
 				item))
 			  itemstable))
     (if (and have-items  (null? items))     (debug:print 0 *default-log-port* "WARNING:[items] section in testconfig but no entries defined"))
     (if (and have-itable (null? itemstable))(debug:print 0 *default-log-port* "WARNNG:[itemstable] section in testconfig but no entries defined"))
-    (if (or (not (null? items))(not (null? itemstable)))
+    (if (or (not (null? items))
+	    (not (null? itemstable))
+	    slashf
+	    sxmlf
+	    spacef)
 	(append (item-assoc->item-list items)
-		(item-table->item-list itemstable))
+		(item-table->item-list itemstable)
+		(items:read-items-file slashf 'slash)
+		(items:read-items-file sxmlf  'sxml)
+		(items:read-items-file spacef 'space))
 	'(()))))
 
 ;; (pp (item-assoc->item-list itemdat))
 
 
 	

Index: launch.scm
==================================================================
--- launch.scm
+++ launch.scm
@@ -909,17 +909,25 @@
            (running-cnt (rmt:get-count-tests-running-for-run-id run-id))
            (all-test-launched (rmt:get-var (conc "lunch-complete-" run-id)))
            (current-state (rmt:get-run-state run-id))
            (current-status (rmt:get-run-status run-id)))
      ;;get-vars run-id to query metadata table to check if all completed. if all-test-launched = yes then only not-completed-cnt = 0 means everyting is completed if no entry found in the table do nothing 
-     (debug:print 0 *default-log-port* "rollup run state/status")                      
+     (debug:print 0 *default-log-port* "Running test cnt :" running-cnt)                      
      (rmt:set-state-status-and-roll-up-run  run-id current-state current-status)
      (runs:update-junit-test-reporter-xml run-id) 
      (cond 
        ((and all-test-launched (eq? not-completed-cnt 0) (equal? all-test-launched "yes" ))
-           	(debug:print 0 *default-log-port* "look for  post hook.")
-          	(runs:run-post-hook run-id))
+                (if (and (equal? (rmt:get-var (conc "end-of-run-" run-id)) "no") (common:simple-lock (conc "endOfRun" run-id)))
+                (begin
+           	(debug:print 4 *default-log-port* "look for  post hook. currseconds: " (current-seconds) " EOR " (rmt:get-var (conc "end-of-run-" run-id)))
+                (debug:print 0 *default-log-port* "End of Run Detected.")
+                (rmt:set-var (conc "end-of-run-" run-id) "yes")
+                ;(thread-sleep! 10)
+          	(runs:run-post-hook run-id)
+                (debug:print 4 *default-log-port* "currseconds: " (current-seconds)" eor: " (rmt:get-var (conc "end-of-run-" run-id)))
+                (common:simple-unlock (conc "endOfRun" run-id)))
+                 (debug:print 0 *default-log-port* "End of Run Detected but not running post hook. This should happen when eor is set to yes. This will happen only when 2 tests exit at smae time. eor= " (rmt:get-var (conc "end-of-run-" run-id)))))
         ((> running-cnt 3) 
         	  (debug:print 0 *default-log-port* "There are " running-cnt " tests running." ))
         ((> running-cnt 0)
             (debug:print 0 *default-log-port* "running cnt > 0 but <= 3 kill-running-tests-if-dead" )
    				  (let ((kill-cnt (launch:kill-tests-if-dead run-id)))
@@ -935,18 +943,18 @@
 			       	(debug:print 0 *default-log-port* "test " test-name "/" item-path " not completed")
               (if (not (null? tal))
 				  (loop (car tal) (cdr tal)))))))))))        
  
 (define (launch:is-test-alive host pid)
-(if (and host pid (not (equal? host "n/a")))
-(let* ((cmd (conc "ssh " host " pstree -A " pid))
-      (output (with-input-from-pipe cmd read-lines)))
-  (print "cmd: " cmd "\n op: " output )
-  (if(eq? (length output) 0)
-     #f
-     #t))
-#t))
+  (if (and host pid (not (equal? host "n/a")))
+      (let* ((cmd (conc "ssh " host " pstree -A " pid))
+	     (output (with-input-from-pipe cmd read-lines)))
+	(debug:print 2 *default-log-port* "Running " cmd " received " output)
+	(if (eq? (length output) 0)
+	   #f
+	   #t))
+      #t))
  
 (define (launch:kill-tests-if-dead run-id)
   (let* ((running-tests (rmt:get-tests-for-run run-id "%" `("RUNNING" "LAUNCHED" "REMOTEHOSTSTART") `() #f #f #f #f #f #f #f #f)))
        (let loop ((running-test (car running-tests))
 			     (tal    (cdr running-tests))
@@ -1399,29 +1407,29 @@
 	(let ((iterated-parent  (pathname-directory (conc lnkpath "/" item-path))))
 	  (debug:print-info 2 *default-log-port* "Creating iterated parent " iterated-parent)
 	  (handle-exceptions
 	   exn
 	   (begin
-	     (debug:print-error 0 *default-log-port* " Failed to create directory " iterated-parent ((condition-property-accessor 'exn 'message) exn) ", exiting")
-	     (exit 1))
+	     (debug:print-error 0 *default-log-port* " Failed to create directory " iterated-parent ((condition-property-accessor 'exn 'message) exn) ", continuing but link tree may be corrupted")
+	     #;(exit 1))
 	   (create-directory iterated-parent #t))))
 
     (if (symbolic-link? lnkpath) 
 	(handle-exceptions
 	 exn
 	 (begin
-	   (debug:print-error 0 *default-log-port* " Failed to remove symlink " lnkpath ((condition-property-accessor 'exn 'message) exn) ", exiting")
-	   (exit 1))
+	   (debug:print-error 0 *default-log-port* " Failed to remove symlink " lnkpath ((condition-property-accessor 'exn 'message) exn) ", continuing but link tree may be corrupted.")
+	   #;(exit 1))
 	 (delete-file lnkpath)))
 
     (if (not (or (common:file-exists? lnkpath)
 		 (symbolic-link? lnkpath)))
 	(handle-exceptions
 	 exn
 	 (begin
-	   (debug:print-error 0 *default-log-port* " Failed to create symlink " lnkpath ((condition-property-accessor 'exn 'message) exn) ", exiting")
-	   (exit 1))
+	   (debug:print-error 0 *default-log-port* " Failed to create symlink " lnkpath ((condition-property-accessor 'exn 'message) exn) ", continuing but link tree may be corrupted.")
+	   #;(exit 1))
 	 (create-symbolic-link toptest-path lnkpath)))
     
     ;; NB - This was not working right - some top tests are not getting the path set!!!
     ;;
     ;; Do the setting of this record after the paths are created so that the shortdir can 

Index: megatest.scm
==================================================================
--- megatest.scm
+++ megatest.scm
@@ -1805,16 +1805,13 @@
 	       (for-each (lambda (spec) 
 			   (let* ((precmd     (if (args:get-arg "-precmd")(conc (args:get-arg "-precmd") " ") ""))
 				  (newcmdline (conc
 					       precmd
 					       (string-substitute
-						(conc "target " target)
-						(conc "target " (simple-run-target spec))
-						(string-substitute
-						 (conc "runname " runname)
-						 (conc "runname " (simple-run-runname spec))
-						 orig-cmdline)))))
+						(conc "runname " runname)
+						(conc "runname " (simple-run-runname spec))
+						orig-cmdline))))
 			     (debug:print 0 *default-log-port* "ORIG: " orig-cmdline)
 			     (debug:print 0 *default-log-port* "NEW:  " newcmdline)
 			     (system newcmdline)))
 			 run-specs))
 	     (handle-run-requests target runname keys keyvals need-clean))))))

Index: mtut.scm
==================================================================
--- mtut.scm
+++ mtut.scm
@@ -23,10 +23,11 @@
 (define (toplevel-command . a) #f)
 
 (use srfi-1 posix srfi-69 readline ;;  regex regex-case srfi-69 apropos json http-client directory-utils rpc typed-records;; (srfi 18) extras)
    srfi-19  srfi-18 extras format regex regex-case
      (prefix dbi dbi:)
+     (prefix sqlite3 sqlite3:)
      nanomsg)
 
 (declare (uses common))
 (declare (uses megatest-version))
 (declare (uses margs))
@@ -230,10 +231,11 @@
     ("-msg"             . M)
     ("-start-dir"       . S)
     ("-set-vars"        . v)
     ("-config"          . h)
     ("-time-out"        . u)
+    ("-archive"         . b)
     ))
 (define *switch-keys*
   '(
     ("-h"               . #f)
     ("-help"            . #f)
@@ -257,11 +259,11 @@
     (kill-run    . "-kill-runs")
     (kill-rerun  . "-kill-rerun")
     (lock        . "-lock")
     (unlock      . "-unlock")
     (sync        . "")
-    (archive     . "-archive")
+    (archive     . "")
     (set-ss      . "-set-state-status")
     (remove      . "-remove-runs")))
 
 ;; manually keep this list updated from the keys to
 ;; the case *action* near the end of this file.
@@ -841,12 +843,11 @@
 	      (contours  (configf:get-section mtconf "contours"))
 	      (torun     (make-hash-table)) ;; target => ( ... info ... )
 	      (rgentargs (hash-table-keys rgconf))) ;; these are the targets registered for automatically triggering
 
 	 ;;(print "rgentargs: " rgentargs)
-	 
-	 (for-each
+	  (for-each
 	  (lambda (runkey)
 	    (let* ((keydats   (configf:get-section rgconf runkey)))
 	      (for-each
 	       (lambda (sense) ;; these are the sense rules
 		 (let* ((key        (car sense))
@@ -1429,10 +1430,11 @@
 	      (areas     (configf:get-section mtconf "areas"))
 	      (contours  (configf:get-section mtconf "contours"))
 	      (pkts      (find-pkts pdb '(cmd) '()))
 	      (torun     (make-hash-table)) ;; target => ( ... info ... )
 	      (rgentargs (hash-table-keys rgconf))) ;; these are the targets registered for automatically triggering
+         (sqlite3:set-busy-handler! (dbi:db-conn pdb) (sqlite3:make-busy-timeout 10000))
 	 (for-each
 	  (lambda (pktdat)
 	    (let* ((pkta    (alist-ref 'apkt pktdat))
 		   (action  (alist-ref 'A pkta))
 		   (cmdline (pkt->cmdline pkta))

Index: rmt.scm
==================================================================
--- rmt.scm
+++ rmt.scm
@@ -253,11 +253,11 @@
 (define (extras-case-11 *default-log-port* runremote cmd params attemptnum rid)
   ;; (mutex-unlock! *rmt-mutex*)
   (debug:print-info 12 *default-log-port* "rmt:send-receive, case  9")
   ;; (mutex-lock! *rmt-mutex*)
   (let* ((conninfo (remote-conndat runremote))
-	 (dat      (case (remote-transport runremote)
+	 (dat-in      (case (remote-transport runremote)
 		     ((http) (condition-case ;; handling here has
 					     ;; caused a lot of
 					     ;; problems. However it
 					     ;; is needed to deal with
 					     ;; attemtped
@@ -268,10 +268,37 @@
 			      ((commfail)(vector #f "communications fail"))
 			      ((exn)(vector #f "other fail" (print-call-chain)))))
 		     (else
 		      (debug:print 0 *default-log-port* "ERROR: transport " (remote-transport runremote) " not supported")
 		      (exit))))
+
+;; No Title 
+;; Error: (vector-ref) out of range
+;; #(#<condition: (exn type)> (#("db.scm:3740: regex#regexp" #f #f) #("db.scm:3739: regex#string-substitute" #f #f) #("db.scm:3738: base64#base64-decode" #f #f) #("db.scm:3737: z3#z3:decode-buffer" #f #f) #("db.scm:3736: with-input-from-string" #f #f) #("db.scm:3741: s11n#deserialize" #f #f) #("api.scm:374: api:execute-requests" #f #f) #("api.scm:139: call-with-current-continuation" #f #f) #("api.scm:139: with-exception-handler" #f #f) #("api.scm:139: ##sys#call-with-values" #f #f) #("api.scm:158: string->symbol" #f #f) #("api.scm:160: current-milliseconds" #f #f) #("api.scm:161: dbr:dbstruct-read-only" #f #f) #("api.scm:139: k15" #f #f) #("api.scm:139: g19" #f #f) #("api.scm:142: get-call-chain" #f #f)) #("get-test-info-by-id" (1102 507299)))
+;; 6
+;; 
+;; 	Call history:
+;; 
+;; 	http-transport.scm:306: thread-terminate!	  
+;; 	http-transport.scm:307: debug:print-info	  
+;; 	common_records.scm:235: debug:debug-mode	  
+;; 	rmt.scm:259: k587	  
+;; 	rmt.scm:259: g591	  
+;; 	rmt.scm:276: http-transport:server-dat-update-last-access	  
+;; 	http-transport.scm:364: current-seconds	  
+;; 	rmt.scm:282: debug:print-info	  
+;; 	common_records.scm:235: debug:debug-mode	  
+;; 	rmt.scm:283: mutex-unlock!	  
+;; 	rmt.scm:287: extras-transport-succeded	  	<--
+;; +-----------------------------------------------------------------------------+
+;; | Exit Status    : 70  
+;;  
+
+	 (dat      (if (and (vector? dat-in) ;; ... check it is a correct size
+			    (> (vector-length dat-in) 1))
+		       dat-in
+		       (vector #f (conc "communications fail (type 2), dat-in=" dat-in))))
 	 (success  (if (vector? dat) (vector-ref dat 0) #f))
 	 (res      (if (vector? dat) (vector-ref dat 1) #f)))
     (if (and (vector? conninfo) (< 5 (vector-length conninfo)))
 	(http-transport:server-dat-update-last-access conninfo) ;; refresh access time
 	(begin

Index: runs.scm
==================================================================
--- runs.scm
+++ runs.scm
@@ -532,10 +532,19 @@
     ;; run the run prehook if there are no tests yet run for this run:
     ;;
     (runs:run-pre-hook run-id)
     ;; mark all test launced flag as false in the meta table 
     (rmt:set-var (conc "lunch-complete-" run-id) "no")
+    (debug:print-info 1 *default-log-port* "Setting end-of-run to no")
+    (let* ((config-reruns      (let ((x (configf:lookup *configdat* "setup" "reruns")))
+			       (if x (string->number x) #f)))
+	  (config-rerun-cnt (if config-reruns
+			config-reruns
+			1)))
+    (if (eq? config-rerun-cnt run-count)
+      (rmt:set-var (conc "end-of-run-" run-id) "no")))
+
     (rmt:set-run-state-status run-id "new" "n/a")
     ;; now add non-directly referenced dependencies (i.e. waiton)
     ;;======================================================================
     ;; refactoring this block into tests:get-full-data
     ;;
@@ -685,21 +694,21 @@
 		  (if (not (hash-table-ref/default flags "-preclean" #f))
 		      (hash-table-set! flags "-preclean" #t))
 		  (if (not (hash-table-ref/default flags "-rerun" #f))
 		      (hash-table-set! flags "-rerun" "STUCK/DEAD,n/a,ZERO_ITEMS"))
 		  ;; recursive call to self
-      (runs:run-tests target runname test-patts user flags run-count: (- run-count 1)))))
+      (runs:run-tests target runname test-patts user flags run-count: (- run-count 1)))
+                  (launch:end-of-run-check run-id)))
 	  (debug:print-info 0 *default-log-port* "No tests to run")))
     (debug:print-info 4 *default-log-port* "All done by here")
     ;; TODO: try putting post hook call here
-    ;(if (eq? run-count 0)
-    ; (begin  
-    ;  (debug:print-info 0 *default-log-port* "Calling Post Hook")  
+      
     ;  (debug:print-info 2 *default-log-port* " run-count " run-count)
     ;  (runs:run-post-hook run-id))
     ;  (debug:print-info 2 *default-log-port* "Not calling post hook runcount = " run-count ))   
     (rmt:tasks-set-state-given-param-key task-key "done")
+     
     ;; (sqlite3:finalize! tasks-db)
     ))
 
 
 ;; loop logic. These are used in runs:run-tests-queue to make it a bit more readable.
@@ -1678,12 +1687,12 @@
 	 (else
           (debug:print-info 4 *default-log-port* "cond branch - "  "rtq-9")
 	  (debug:print-info 4 *default-log-port* "Exiting loop with...\n  hed=" hed "\n  tal=" tal "\n  reruns=" reruns))
 	 ))) ;; end loop on sorted test names
     ;; this is the point where everything is launched and now you can mark the run in metadata table as all launched 
-    (rmt:set-var (conc "lunch-complete-" run-id) "yes")
-  
+    (rmt:set-var (conc "lunch-complete-" run-id) "yes")  
+        
     ;; now *if* -run-wait we wait for all tests to be done
     ;; Now wait for any RUNNING tests to complete (if in run-wait mode)
     (thread-sleep! 10) ;; I think there is a race condition here. Let states/statuses settle
     (let wait-loop ((num-running      (rmt:get-count-tests-running-for-run-id run-id))
 		    (prev-num-running 0))
@@ -2365,10 +2374,16 @@
                                             (debug:print 2 *default-log-port* "Not removing directory " rundir " because either it doesn't exist or has a bad name")
                                             (debug:print 2 *default-log-port* "Is /tmp/badname: " (string=  rundir "/tmp/badname"))
                                             (debug:print 2 *default-log-port* "Exists: " (file-exists? rundir))
                                             (debug:print 2 *default-log-port* "Has run-name: " (substring-index run-name rundir))
                                             (debug:print 2 *default-log-port* "Has target: " (substring-index target rundir))
+                                            ;;PJH remove record from db no need to cleanup directory
+                                            (case mode
+                                               ((remove-data-only)(mt:test-set-state-status-by-id (db:test-get-run_id test)(db:test-get-id test) (db:test-get-state test)(db:test-get-status test) #f))
+                                               ((archive-remove)  (mt:test-set-state-status-by-id (db:test-get-run_id test)(db:test-get-id test) "ARCHIVED" #f #f))
+                                               (else (rmt:delete-test-records (db:test-get-run_id test) (db:test-get-id test))))
+
                                           )
                                         )
                                       )
 
                                       (if (not (null? tal))
@@ -2459,12 +2474,14 @@
                       (begin
                         (debug:print 1 *default-log-port* "Removing DB records for the run.")
                         (rmt:delete-run run-id)
                         (rmt:delete-old-deleted-test-records))
                     )
-	           (debug:print 1 *default-log-port* "Recursively removing links dir " linkspath)
-                   (runs:recursive-delete-with-error-msg linkspath)
+                    (if (not (equal?  linkspath "/does/not/exist/I"))
+	               (begin 
+                         (debug:print 1 *default-log-port* "Recursively removing links dir " linkspath)
+                         (runs:recursive-delete-with-error-msg linkspath)))
 
                    (for-each (lambda(runpath)
                        (debug:print 1 *default-log-port* "Recursively removing runs dir " runpath)
                        (runs:recursive-delete-with-error-msg runpath)
                      )
@@ -2735,23 +2752,21 @@
     (*PI* xml "version='1.0'")
     (testsuite)))
 
 (define (runs:update-junit-test-reporter-xml run-id)
   (let*	(
-	 (junit-test-reporter	 (configf:lookup *configdat* "runs" "junit-test-reporter-xml"))
+	 (junit-test-reporter	(configf:lookup *configdat* "runs" "junit-test-reporter-xml"))
 	 (junit-test-report-dir  (configf:lookup *configdat* "runs" "junit-test-report-dir"))
-	 (xml-dir		 (if (and junit-test-reporter (equal? junit-test-reporter "yes" ))
-				     (if junit-test-report-dir
-					 junit-test-report-dir
-					 (conc (getenv "MT_LINKTREE") "/" (getenv "MT_TARGET") "/" (getenv "MT_RUNNAME")))
-				     #f))
+	 (xml-dir		(if (and junit-test-reporter (equal? junit-test-reporter "yes" ))
+				    (if junit-test-report-dir
+					junit-test-report-dir
+					(conc (getenv "MT_LINKTREE") "/" (getenv "MT_TARGET") "/" (getenv "MT_RUNNAME")))
+				    #f))
 	 (xml-ts-name		(if xml-dir
 				    (conc (getenv "MT_TESTSUITENAME")"."(string-translate (getenv "MT_TARGET") "/" ".") "." (getenv "MT_RUNNAME"))
 				    #f))
-         (keyname               (if xml-ts-name
-				    (common:get-signature xml-ts-name)
-				    #f))
+         (keyname               (if xml-ts-name (common:get-signature xml-ts-name) #f))
 	 (xml-path		(if xml-dir
 				    (conc xml-dir "/" keyname ".xml")
 				    #f))
 
 	 (test-data		(if xml-dir
@@ -2781,13 +2796,13 @@
 			 (comment	(vector-ref test 14))   
 			 (test-status	(vector-ref test 4))
 			 (exc-msg	(conc "No bucket for State " test-state " Status " test-status))
 			 (new-doc	(cond 
 						((member test-state (list "RUNNING" ))
-							((sxml-modify `("testsuite" insert-into (testcase (@ (name ,tc-name)) (inProgress (@ (type "inProgress")))))) doc))
+							((sxml-modify `("testsuite" insert-into (testcase (@ (name ,tc-name)) (inProgress)))) doc))
 						((member test-state (list "LAUNCHED" "REMOTEHOSTSTART"  "NOT_STARTED"))
-							((sxml-modify `("testsuite" insert-into (testcase (@ (name ,tc-name)) (inProgress (@ (type "inQueue")))))) doc))
+							((sxml-modify `("testsuite" insert-into (testcase (@ (name ,tc-name)) (inQueue)))) doc))
 						((member test-status (list "PASS" "WARN" "WAIVED"))
 							((sxml-modify `("testsuite" insert-into (testcase (@ (name ,tc-name))))) doc))
 						((member test-status (list "FAIL" "CHECK"))
 							((sxml-modify `("testsuite" insert-into (testcase (@ (name ,tc-name)) (failure (@ (message ,comment) (type "failure")))))) doc)) 
 						((member test-status (list "DEAD" "KILLED" "ABORT" "PREQ_FAIL" "PREQ_DISCARDED"))

Index: utils/mtrunner
==================================================================
--- utils/mtrunner
+++ utils/mtrunner
@@ -26,6 +26,6 @@
 cd $1
 shift
 export PATH="$1:$PATH"
 shift 
 
-"$@"
+exec "$@"