Index: codescanlib.scm
==================================================================
--- codescanlib.scm
+++ codescanlib.scm
@@ -46,11 +46,11 @@
                          #f)]
                     [else #f] ) scm-tree))))
     procs))
 
 
-;; given a sexp, return a flat lost of atoms in that sexp
+;; given a sexp, return a flat list of atoms in that sexp
 (define (get-atoms-in-body body)
   (cond
    ((null? body) '())
    ((atom? body) (list body))
    (else

Index: common.scm
==================================================================
--- common.scm
+++ common.scm
@@ -531,11 +531,12 @@
     (5 "WAIVED")
     (6 "CHECK")
     (7 "STUCK/DEAD")
     (8 "DEAD")
     (9 "FAIL")
-    (10 "ABORT")))
+    (10 "PREQ_FAIL")
+    (11 "ABORT")))
 
 (define *common:ended-states*       ;; states which indicate the test is stopped and will not proceed
   '("COMPLETED" "ARCHIVED" "KILLED" "KILLREQ" "STUCK" "INCOMPLETE"))
 
 (define *common:badly-ended-states* ;; these roll up as CHECK, i.e. results need to be checked

Index: common_records.scm
==================================================================
--- common_records.scm
+++ common_records.scm
@@ -147,15 +147,17 @@
               (temp     (string-split (->string this-loc) " "))
               (this-func (if (and (list? temp) (> (length temp) 1)) (cadr temp) "???")))
          (if (equal? this-func "BB>")
              (set! location this-loc))))
      stack)
-    (let ((dp-args
-           (append
-            (list 0 *default-log-port*
-                  (conc location "@"(/ (- (current-milliseconds) *BB-process-starttime*) 1000)"   ")  )
-            in-args)))
+    (let* ((color-on "\x1b[1m")
+           (color-off "\x1b[0m")
+           (dp-args
+            (append
+             (list 0 *default-log-port*
+                   (conc color-on location "@"(/ (- (current-milliseconds) *BB-process-starttime*) 1000) color-off "   ")  )
+             in-args)))
       (apply debug:print dp-args))))
 
 (define *BBpp_custom_expanders_list* (make-hash-table))
 
 

Index: db.scm
==================================================================
--- db.scm
+++ db.scm
@@ -1,6 +1,6 @@
-;;======================================================================
+;;======================================================================
 ;; Copyright 2006-2016, Matthew Welland.
 ;; 
 ;;  This program is made available under the GNU GPL version 2.0 or
 ;;  greater. See the accompanying file COPYING for details.
 ;; 
@@ -198,21 +198,21 @@
 
 ;; open an sql database inside a file lock
 ;; returns: db existed-prior-to-opening
 ;; RA => Returns a db handler; sets the lock if opened in writable mode
 ;;
-;;(define *db-open-mutex* (make-mutex))
+;; (define *db-open-mutex* (make-mutex))
 
 (define (db:lock-create-open fname initproc)
   (let* ((parent-dir   (or (pathname-directory fname)(current-directory))) ;; no parent? go local
          (raw-fname    (pathname-file fname))
 	 (dir-writable (file-write-access? parent-dir))
 	 (file-exists  (common:file-exists? fname))
 	 (file-write   (if file-exists
 			   (file-write-access? fname)
 			   dir-writable )))
-    ;;(mutex-lock! *db-open-mutex*) ;; tried this mutex, not clear it helped.
+    ;; (mutex-lock! *db-open-mutex*) ;; tried this mutex, not clear it helped.
     (if file-write ;; dir-writable
 	(condition-case
          (let* ((lockfname   (conc fname ".lock"))
                 (readyfname  (conc parent-dir "/.ready-" raw-fname))
                 (readyexists (common:file-exists? readyfname)))
@@ -246,11 +246,11 @@
         
 	(condition-case
          (begin
            (debug:print 2 *default-log-port* "WARNING: opening db in non-writable dir " fname)
            (let ((db (sqlite3:open-database fname)))
-             ;;(mutex-unlock! *db-open-mutex*)
+             ;; (mutex-unlock! *db-open-mutex*)
              db))
          (exn (io-error)  (debug:print 0 *default-log-port* "ERROR: i/o error with " fname ". Check permissions, disk space etc. and try again."))
          (exn (corrupt)   (debug:print 0 *default-log-port* "ERROR: database " fname " is corrupt. Repair it to proceed."))
          (exn (busy)      (debug:print 0 *default-log-port* "ERROR: database " fname " is locked. Try copying to another location, remove original and copy back."))
          (exn (permission)(debug:print 0 *default-log-port* "ERROR: database " fname " has some permissions problem."))
@@ -1581,17 +1581,17 @@
   
 
 ;;  select end_time-now from
 ;;      (select testname,item_path,event_time+run_duration as
 ;;                          end_time,strftime('%s','now') as now from tests where state in
-;;      ('RUNNING','REMOTEHOSTSTART','LAUNCED'));
+;;      ('RUNNING','REMOTEHOSTSTART','LAUNCHED'));
 
 (define (db:find-and-mark-incomplete dbstruct run-id ovr-deadtime)
   (let* ((incompleted '())
 	 (oldlaunched '())
 	 (toplevels   '())
-	 (deadtime-str (configf:lookup *configdat* "setup" "deadtime"))
+	 (deadtime-str (configf:lookup *configdat* "setup" "deadtime")) ;; FIXME suspect test run time & deadtime are not well matched; resulting in COMPLETED/DEAD status of an a-ok running test
 	 (deadtime     (if (and deadtime-str
 				(string->number deadtime-str))
 			   (string->number deadtime-str)
 			   7200))) ;; two hours
     (db:with-db 
@@ -1650,11 +1650,12 @@
          (if (> (length all-ids) 0)
              (begin
                (debug:print 0 *default-log-port* "WARNING: Marking test(s); " (string-intersperse (map conc all-ids) ", ") " as INCOMPLETE")
                (for-each
                 (lambda (test-id)
-                  (db:test-set-state-status dbstruct run-id test-id "COMPLETED" "DEAD" "Test failed to complete")) ;; fix for one aspect of Randy's ticket 1405717332
+                  (db:test-set-state-status dbstruct run-id test-id "COMPLETED" "DEAD" "Test failed to complete")) ;; fix for one aspect of Randy's ticket 1405717332 ;; TODO - fix problem where test goes to COMPLETED/DEAD while in progress, only later to go to COMPLETED/PASS.  ref ticket 220546828
+
                 all-ids))))))))
 
 ;; ALL REPLACED BY THE BLOCK ABOVE
 ;;
 ;; 	    (sqlite3:execute 
@@ -3492,37 +3493,51 @@
                                                         (map dbr:counts-status state-status-counts)))
                                                    *common:std-statuses* >))
 			    (non-completes     (filter (lambda (x)
 							 (not (equal? x "COMPLETED")))
 						       all-curr-states))
-			    (num-non-completes (length non-completes))
-                            
+			    (preq-fails        (filter (lambda (x)
+							 (equal? x "PREQ_FAIL"))
+						       all-curr-statuses))
+                            (num-non-completes (length non-completes))
                             (newstate          (cond
-						((> running 0)
-						 "RUNNING") ;; anything running, call the situation running
-						((> bad-not-started 0)  ;; we have an ugly situation, it is completed in the sense we cannot do more.
-						 "COMPLETED") 
-						((> num-non-completes 0) ;;
-						 (car non-completes))  ;;  (remove (lambda (x)(equal? "COMPLETED" x)) all-curr-states)))
-                                                ;; only rollup DELETED if all DELETED
-						(else
-						 (car all-curr-states))))
+						((> running 0)           "RUNNING")            ;; anything running, call the situation running
+                                                ((> (length preq-fails) 0)
+                                                 "NOT_STARTED")
+						((> bad-not-started 0)   "COMPLETED")          ;; we have an ugly situation, it is completed in the sense we cannot do more.
+						((> num-non-completes 0) (car non-completes))  ;;  (remove (lambda (x)(equal? "COMPLETED" x)) all-curr-states))) ;; only rollup DELETED if all DELETED
+						(else                    (car all-curr-states))))
 			                       ;; (if (> running 0)
                                                ;;     "RUNNING"
                                                ;;     (if (> bad-not-started 0)
                                                ;;         "COMPLETED"
                                                ;;         (car all-curr-states))))
-                            (newstatus            (if (or (> bad-not-started 0)
-							  (and (equal? newstate "NOT_STARTED")
-							       (> num-non-completes 0)))
-						      "STARTED"
-                                                      (car all-curr-statuses))))
+                            (newstatus         (cond
+                                                ((> (length preq-fails) 0)
+                                                 "PREQ_FAIL")
+                                                ((or (> bad-not-started 0)
+                                                     (and (equal? newstate "NOT_STARTED")
+                                                          (> num-non-completes 0)))
+                                                 "STARTED")
+                                                (else
+                                                 (car all-curr-statuses)))))
+
                        ;; (print "bad-not-supported: " bad-not-support " all-curr-states: " all-curr-states " all-curr-statuses: " all-curr-states)
                        ;;      " newstate: " newstate " newstatus: " newstatus)
                        ;; NB// Pass the db so it is part of the transaction
+
+                       ;; (debug:print 4 *default-log-port* "BB> tl-test-id="tl-test-id" ; "test-name":"item-path"> bad-not-started="bad-not-started" newstate="newstate" newstatus="newstatus" num-non-completes="num-non-completes" non-completes="non-completes "len(sscs)="(length state-status-counts)  " state-status-counts: "
+                       ;;              (apply conc
+                       ;;                     (map (lambda (x)
+                       ;;                            (conc
+                       ;;                             (with-output-to-string (lambda () (pp (dbr:counts->alist x)))) " | "))
+                       ;;                          state-status-counts))
+                                    
+                       ;;              ); end debug:print
                        (if tl-test-id
-			   (db:test-set-state-status db run-id tl-test-id newstate newstatus #f))))))))
+			   (db:test-set-state-status db run-id tl-test-id newstate newstatus #f)) ;; we are still in the transaction - must access the db and not the dbstruct
+		       ))))))
          (mutex-unlock! *db-transaction-mutex*)
          (if (and test-id state status (equal? status "AUTO")) 
              (db:test-data-rollup dbstruct run-id test-id status))
          tr-res)))))
 ;; BBnote: db:get-all-state-status-counts-for-test returns dbr:counts object aggregating state and status of items of a given test, *not including rollup state/status*
@@ -4047,103 +4062,141 @@
 ;;       mode 'toplevel means that tests must be COMPLETED only
 ;;       mode 'itemmatch or 'itemwait means that tests items must be COMPLETED and (PASS|WARN|WAIVED|CHECK) [[ NB// NOT IMPLEMENTED YET ]]
 ;;       mode 'exclusive means this test/item cannot run if the same test/item is LAUNCHED,REMOTEHOSTSTART or RUNNING
 ;; 
 ;; (define (db:get-prereqs-not-met dbstruct run-id waitons ref-item-path mode)
+
+
 (define (db:get-prereqs-not-met dbstruct run-id waitons ref-test-name ref-item-path mode itemmaps) ;; #!key (mode '(normal))(itemmap #f))
   ;; BBnote - rollup of an itemized test's overall state/status done in db:set-state-status-and-roll-up-items
-  (append
-   (if (member 'exclusive mode)
-       (let ((running-tests (db:get-tests-for-run dbstruct
-						  #f  ;; run-id of #f means for all runs. 
-						  (if (string=? ref-item-path "")   ;; testpatt
-						      ref-test-name
-						      (conc ref-test-name "/" ref-item-path))
-						  '("LAUNCHED" "REMOTEHOSTSTART" "RUNNING") ;; states
-						  '()          ;; statuses
-						  #f           ;; offset
-						  #f           ;; limit
-						  #f           ;; not-in
-						  #f           ;; sort by
-						  #f           ;; sort order
-						  'shortlist   ;; query type
-						  0            ;; last update, beginning of time ....
-						  #f           ;; mode
-						  )))
-	;;(map (lambda (testdat)
-	;;	(if (equal? (db:test-get-item-path testdat) "")
-	;;	    (db:test-get-testname testdat)
-	;;	    (conc (db:test-get-testname testdat)
-	;;		  "/"
-	;;		  (db:test-get-item-path testdat))))
-	 running-tests) ;; calling functions want the entire data
-       '())
-   (if (or (not waitons)
-	   (null? waitons))
-       '()
-       (let* ((unmet-pre-reqs '())
-	      (result         '()))
-	 (for-each 
-	  (lambda (waitontest-name)
-	    ;; by getting the tests with matching name we are looking only at the matching test 
-	    ;; and related sub items
-	    ;; next should be using mt:get-tests-for-run?
-	    (let ((tests             (db:get-tests-for-run-state-status dbstruct run-id waitontest-name))
-		  (ever-seen         #f)
-		  (parent-waiton-met #f)
-		  (item-waiton-met   #f))
-	      (for-each 
-	       (lambda (test) ;; BB- this is the upstream test
-		 ;; (if (equal? waitontest-name (db:test-get-testname test)) ;; by defintion this had better be true ...
-		 (let* ((state             (db:test-get-state test))
-			(status            (db:test-get-status test))
-			(item-path         (db:test-get-item-path test)) ;; BB- this is the upstream itempath
-			(is-completed      (equal? state "COMPLETED"))
-			(is-running        (equal? state "RUNNING"))
-			(is-killed         (equal? state "KILLED"))
-			(is-ok             (member status '("PASS" "WARN" "CHECK" "WAIVED" "SKIP")))
-			;;                                       testname-b    path-a    path-b
-			(same-itempath     (db:compare-itempaths ref-test-name item-path ref-item-path itemmaps))) ;; (equal? ref-item-path item-path)))
-		   (set! ever-seen #t)
-		   (cond
-		    ;; case 1, non-item (parent test) is 
-		    ((and (equal? item-path "") ;; this is the parent test of the waiton being examined
-			  is-completed
-			  (or is-ok (not (null? (lset-intersection eq? mode '(toplevel)))))) ;;  itemmatch itemwait))))))
-		     (set! parent-waiton-met #t))
-		    ;; Special case for toplevel and KILLED
-		    ((and (equal? item-path "") ;; this is the parent test
-			  is-killed
-			  (member 'toplevel mode))
-		     (set! parent-waiton-met #t))
-		    ;; For itemwait mode IFF the previous matching item is good the set parent-waiton-met
-		    ((and (not (null? (lset-intersection eq? mode '(itemmatch itemwait)))) ;; how is that different from (member mode '(itemmatch itemwait)) ?????
-			  ;; (not (equal? item-path "")) ;; this applies to both top level (to allow launching of next batch) and items
-			  same-itempath)
-		     (if (and is-completed is-ok)
-			 (set! item-waiton-met #t))
-		     (if (and (equal? item-path "") ;; if upstream rollup test is completed, parent-waiton-met is set
-			      (or is-completed is-running));; this is the parent, set it to run if completed or running ;; BB1
-			 (set! parent-waiton-met #t)))
-		    ;; normal checking of parent items, any parent or parent item not ok blocks running
-		    ((and is-completed
-			  (or is-ok 
-			      (member 'toplevel mode))              ;; toplevel does not block on FAIL
-			  (and is-ok (member 'itemmatch mode))) ;; itemmatch blocks on not ok
-		     (set! item-waiton-met #t)))))
-	       tests)
-	      ;; both requirements, parent and item-waiton must be met to NOT add item to
-	      ;; prereq's not met list
-	      (if (not (or parent-waiton-met item-waiton-met))
-		  (set! result (append (if (null? tests) (list waitontest-name) tests) result))) ;; appends the string if the full record is not available
-	      ;; if the test is not found then clearly the waiton is not met...
-	      ;; (if (not ever-seen)(set! result (cons waitontest-name result)))))
-	      (if (not ever-seen)
-		  (set! result (append (if (null? tests)(list waitontest-name) tests) result)))))
-	  waitons)
-	 (delete-duplicates result)))))
-
+  (let* ((ok-statuses '("PASS" "WARN" "CHECK" "WAIVED" "SKIP"))
+         (have-itemized (not (null? (lset-intersection eq? mode '(itemmatch itemwait))))))
+    (append
+     (if (member 'exclusive mode)
+         (let ((running-tests (db:get-tests-for-run dbstruct
+                                                    #f  ;; run-id of #f means for all runs. 
+                                                    (if (string=? ref-item-path "")   ;; testpatt
+                                                        ref-test-name
+                                                        (conc ref-test-name "/" ref-item-path))
+                                                    '("LAUNCHED" "REMOTEHOSTSTART" "RUNNING") ;; states
+                                                    '()          ;; statuses
+                                                    #f           ;; offset
+                                                    #f           ;; limit
+                                                    #f           ;; not-in
+                                                    #f           ;; sort by
+                                                    #f           ;; sort order
+                                                    'shortlist   ;; query type
+                                                    0            ;; last update, beginning of time ....
+                                                    #f           ;; mode
+                                                    )))
+           ;;(map (lambda (testdat)
+           ;;	(if (equal? (db:test-get-item-path testdat) "")
+           ;;	    (db:test-get-testname testdat)
+           ;;	    (conc (db:test-get-testname testdat)
+           ;;		  "/"
+           ;;		  (db:test-get-item-path testdat))))
+           running-tests) ;; calling functions want the entire data
+         '())
+     (if (or (not waitons)
+             (null? waitons))
+         '()
+         (let* ((unmet-pre-reqs '())
+                (result         '()))
+           (for-each ;; waitons
+            (lambda (waitontest-name)
+              ;; by getting the tests with matching name we are looking only at the matching test 
+              ;; and related sub items
+              ;; next should be using mt:get-tests-for-run?
+              (let ((tests             (db:get-tests-for-run-state-status dbstruct run-id waitontest-name))
+                    (ever-seen         #f)
+                    (parent-waiton-met #f)
+                    (item-waiton-met   #f))
+                (for-each ;; item (test record) in waiton
+                 (lambda (test) ;; BB- this is the upstream test
+                   ;; (if (equal? waitontest-name (db:test-get-testname test)) ;; by definition this had better be true ...
+                   (let* ((state             (db:test-get-state test))
+                          (status            (db:test-get-status test))
+                          (item-path         (db:test-get-item-path test)) ;; BB- this is the upstream itempath
+                          (is-completed      (equal? state "COMPLETED"))
+                          (is-running        (member state '("LAUNCHED" "REMOTEHOSTSTART" "RUNNING")))
+                          (is-killed         (member state '("KILLREQ" "KILLING" "KILLED")))
+                          (is-ok             (member status ok-statuses))
+                          ;;                                       testname-b    path-a    path-b
+                          (same-itempath     (db:compare-itempaths ref-test-name item-path ref-item-path itemmaps))) ;; (equal? ref-item-path item-path)))
+                     (set! ever-seen #t)
+                     (cond
+                      ;; case 1, non-item (parent test) is COMPLETED and either has an ok status or mode includes toplevel
+                      ((and (equal? item-path "") ;; this is the parent test of the waiton being examined
+                            is-completed
+                            (or is-ok (not (null? (lset-intersection eq? mode '(toplevel)))))) ;;  itemmatch itemwait))))))
+                       (set! parent-waiton-met #t))
+                      ;; Special case for toplevel and KILLED
+                      ((and (equal? item-path "") ;; this is the parent test
+                            is-killed
+                            (member 'toplevel mode))
+                       (set! parent-waiton-met #t))
+                      ;; For itemmatch/itemwait modes: a matching item that is completed and ok sets item-waiton-met; a completed or running parent sets parent-waiton-met
+                      ((and have-itemized ;; i.e. mode contains itemmatch or itemwait
+                            ;; (not (equal? item-path "")) ;; this applies to both top level (to allow launching of next batch) and items
+                            same-itempath)
+                       (if (and is-completed is-ok)
+                           (set! item-waiton-met #t))
+                       (if (and (equal? item-path "") ;; if upstream rollup test is completed, parent-waiton-met is set
+                                (or is-completed is-running));; this is the parent, set it to run if completed or running ;; BB1
+                           (set! parent-waiton-met #t)))
+                      ;; normal checking of parent items, any parent or parent item not ok blocks running
+                      ((and is-completed
+                            (or is-ok 
+                                (member 'toplevel mode))              ;; toplevel does not block on FAIL
+                            (and is-ok (member 'itemmatch mode))) ;; itemmatch blocks on not ok
+                       (set! item-waiton-met #t)))))
+                 tests) ;; end of item for-each
+
+
+                ;; the waiton counts as met if item-waiton-met is set, or if the reference test is not an item
+                ;; (ref-item-path is "") and parent-waiton-met is set; otherwise it is added to the prereqs-not-met list
+
+                ;; is:
+                (if (not (or
+                          (and (equal? ref-item-path "") parent-waiton-met)
+                          item-waiton-met))
+                    (set! result (append (if (null? tests) (list waitontest-name) tests) result))) ;; appends the string if the full record is not available
+                ;; was briefly:
+                ;; (if (not
+                ;;      (and
+                ;;       item-waiton-met
+                ;;       (or parent-waiton-met (not (equal? ref-item-path "")))))
+                ;;     ;;add to list
+                ;;     (set! result (append (if (null? tests) (list waitontest-name) tests) result))) ;; appends the string if the full record is not available
+
+
+                ;; if the test is not found then clearly the waiton is not met...
+                ;; (if (not ever-seen)(set! result (cons waitontest-name result)))))
+                (if (not ever-seen)
+                    (set! result (append (if (null? tests)(list waitontest-name) tests) result)))))
+            waitons)
+
+           ;; TODO: for itemwait and itemmatch mode, filter out failed toplevel prereq test if any items passed.
+           
+           ;; a rewrite might help understanding, but quick fix is just remove tests from result which are completed/pass. -BB
+           ;;(pp result)
+           ;; (let ((prereq-tests-some-items-passed-list '(ref-test-name))) ;; seed with ref-test-name; do not wait on self.
+
+           ;;   (for-each (lambda (test)
+           ;;               (if (vector? test)
+           ;;                   (if (and
+           ;;                        (equal? (db:test-get-state test) "COMPLETED")
+           ;;                        (member (db:test-get-status test) ok-statuses)
+           ;;                        (not (equal? (db:test-get-item-path test) "")))
+           ;;                       (set! prereq-tests-some-items-passed-list (cons (db:test-get-testname test) prereq-tests-some-items-passed-list)))))
+           ;;             result)
+           ;;   (set! prereq-tests-some-items-passed-list (delete-duplicates prereq-tests-some-items-passed-list))
+                                               
+
+           (delete-duplicates result)
+           )))))
+  
 ;;======================================================================
 ;; Just for sync, procedures to make sync easy
 ;;======================================================================
 
 ;; get an alist of record ids changed since time since-time

Index: gutils.scm
==================================================================
--- gutils.scm
+++ gutils.scm
@@ -23,10 +23,11 @@
     (null? (filter (lambda (x)(> x 3)) delta))))
 
 (define gutils:colors
   '((PASS . "70 249 73")
     (FAIL . "253 33 49")
+    (PREQ_FAIL . "255 127 127")
     (SKIP . "230 230 0")))
 
 (define (gutils:get-color-spec effective-state)
   (or (alist-ref effective-state gutils:colors)
       (alist-ref 'FAIL gutils:colors)))
@@ -59,10 +60,11 @@
     ((REMOTEHOSTSTART)  (list "50 130 195"   state))
     ((RUNNING STARTED)          (list "9 131 232"    state))
     ((KILLREQ)          (list "39 82 206"    state))
     ((KILLED)           (list "234 101 17"   state))
     ((NOT_STARTED)      (case (string->symbol status)
+                          ((PREQ_FAIL)(list (gutils:get-color-spec 'PREQ_FAIL) status))
 			  ((CHECK STARTED)(list (gutils:get-color-spec 'SKIP) state))
 			  (else   (list "240 240 240"                 state))))
     ;; for xor mode below
     ;;
     ((CLEAN)

Index: launch.scm
==================================================================
--- launch.scm
+++ launch.scm
@@ -1297,10 +1297,11 @@
 ;;    - could be ssh to host from hosts table (update regularly with load)
 ;;    - could be netbatch
 ;;      (launch-test db (cadr status) test-conf))
 (define (launch-test test-id run-id run-info keyvals runname test-conf test-name test-path itemdat params)
   (mutex-lock! *launch-setup-mutex*) ;; setting variables and processing the testconfig is NOT thread-safe, reuse the launch-setup mutex
+  (BB> "entered launch-test")
   (let* ( ;; (lock-key        (conc "test-" test-id))
 	;; (got-lock        (let loop ((lock        (rmt:no-sync-get-lock lock-key))
 	;; 			     (expire-time (+ (current-seconds) 15))) ;; give up on getting the lock and steal it after 15 seconds
 	;; 		    (if (car lock)
 	;; 			#t
@@ -1331,10 +1332,11 @@
        (list "MT_RUNNAME"   runname)
        (list "MT_ITEMPATH"  item-path)
        (list "MT_CONTOUR"   contour)
        )
       itemdat))
+    (BB> "set env vars")
     (let* ((tregistry       (tests:get-all)) ;; third param (below) is system-allowed
            ;; for tconfig, why do we allow fallback to test-conf?
 	   (tconfig         (or (tests:get-testconfig test-name item-path tregistry #t force-create: #t)
 				(begin
                                   (debug:print 0 *default-log-port* "WARNING: falling back to pre-calculated testconfig. This is likely not desired.")
@@ -1376,10 +1378,11 @@
 	   (mt-bindir-path #f)
 	   (testinfo   (rmt:get-test-info-by-id run-id test-id))
 	   (mt_target  (string-intersperse (map cadr keyvals) "/"))
 	   (debug-param (append (if (args:get-arg "-debug")  (list "-debug" (args:get-arg "-debug")) '())
 				(if (args:get-arg "-logging")(list "-logging") '()))))
+      (BB> "entered let 1")
       ;; (if hosts (set! hosts (string-split hosts)))
       ;; set the megatest to be called on the remote host
       (if (not remote-megatest)(set! remote-megatest local-megatest)) ;; "megatest"))
       (set! mt-bindir-path (pathname-directory remote-megatest))
       (if launcher (set! launcher (string-split launcher)))
@@ -1387,27 +1390,30 @@
       (if (and (args:get-arg "-preclean") ;; user has requested to preclean for this run
 	       (not (member (db:test-get-rundir testinfo)(list "n/a" "/tmp/badname")))) ;; n/a is a placeholder and thus not a read dir
 	  (begin
 	    (debug:print-info 0 *default-log-port* "attempting to preclean directory " (db:test-get-rundir testinfo) " for test " test-name "/" item-path)
 	    (runs:remove-test-directory testinfo 'remove-data-only))) ;; remove data only, do not perturb the record
-      
+
+      (BB> "after launcher set")
       ;; prevent overlapping actions - set to LAUNCHED as early as possible
       ;;
       ;; the following call handles waiver propogation. cannot yet condense into roll-up-pass-fail
       (tests:test-set-status! run-id test-id "LAUNCHED" "n/a" #f #f) ;; (if launch-results launch-results "FAILED"))
       (rmt:set-state-status-and-roll-up-items run-id test-name item-path #f "LAUNCHED" #f)
       ;; (pp (hash-table->alist tconfig))
       (set! diskpath (get-best-disk *configdat* tconfig))
+      (BB> "after launch state set")
       (if diskpath
 	  (let ((dat  (create-work-area run-id run-info keyvals test-id test-path diskpath test-name itemdat)))
 	    (set! work-area (car dat))
 	    (set! toptest-work-area (cadr dat))
 	    (debug:print-info 2 *default-log-port* "Using work area " work-area))
 	  (begin
 	    (set! work-area (conc test-path "/tmp_run"))
 	    (create-directory work-area #t)
 	    (debug:print 0 *default-log-port* "WARNING: No disk work area specified - running in the test directory under tmp_run")))
+      (BB> "after disk path set")
       (set! cmdparms (base64:base64-encode 
 		      (z3:encode-buffer 
 		       (with-output-to-string
 			 (lambda () ;; (list 'hosts     hosts)
 			   (write (list (list 'testpath  test-path)
@@ -1436,11 +1442,11 @@
 					(list 'runtlim   (if run-time-limit (common:hms-string->seconds run-time-limit) #f))
 					(list 'env-ovrd  (hash-table-ref/default *configdat* "env-override" '())) 
 					(list 'set-vars  (if params (hash-table-ref/default params "-setvars" #f)))
 					(list 'runname   runname)
 					(list 'mt-bindir-path mt-bindir-path))))))))
-      
+      (BB> "after cmdparams set")
       ;; clean out step records from previous run if they exist
       ;; (rmt:delete-test-step-records run-id test-id)
       ;; if the dir does not exist we may have a itempath where individual variables are a path, launch anyway
       (if (common:file-exists? work-area)
 	  (change-directory work-area)) ;; so that log files from the launch process don't clutter the test dir
@@ -1458,11 +1464,12 @@
       (if (args:get-arg "-xterm")(set! fullcmd (append fullcmd (list "-xterm"))))
       (debug:print 1 *default-log-port* "Launching " work-area)
       ;; set pre-launch-env-vars before launching, keep the vars in prevvals and put the envionment back when done
       (debug:print 4 *default-log-port* "fullcmd: " fullcmd)
       (set! *last-launch* (current-seconds)) ;; all that junk above takes time, set this as late as possible.
-      (let* ((commonprevvals (alist->env-vars
+      (BB> "after set *last-launch*")
+      (let* ((commonprevvals (alist->env-vars ;; observed this let can be very slow. (>5 sec)
 			      (hash-table-ref/default *configdat* "env-override" '())))
 	     (miscprevvals   (alist->env-vars ;; consolidate this code with the code in megatest.scm for "-execute"
 			      (append (list (list "MT_TEST_RUN_DIR" work-area)
 					    (list "MT_TEST_NAME" test-name)
 					    (list "MT_ITEM_INFO" (conc itemdat)) 
@@ -1485,10 +1492,11 @@
 					      (conc cmdstr " >> mt_launch.log 2>&1 &")))
 					(car fullcmd))
 				    (if useshell
 					'()
 					(cdr fullcmd)))))
+        (BB> "let depth 2 entered")
         (mutex-unlock! *launch-setup-mutex*) ;; yes, really should mutex all the way to here. Need to put this entire process into a fork.
 	;; (rmt:no-sync-del! lock-key)         ;; release the lock for starting this test
 	(if (not launchwait) ;; give the OS a little time to allow the process to start
 	    (thread-sleep! 0.01))
 	(with-output-to-file "mt_launch.log"

Index: megatest-version.scm
==================================================================
--- megatest-version.scm
+++ megatest-version.scm
@@ -1,7 +1,7 @@
 ;; Always use two or four digit decimal
 ;; 1.01, 1.02...1.10,1.11,1.1101 ... 1.99,2.00..
 
 (declare (unit megatest-version))
 
-(define megatest-version 1.6429)
+(define megatest-version 1.6431)
 

Index: runs.scm
==================================================================
--- runs.scm
+++ runs.scm
@@ -204,11 +204,11 @@
 					jobg-count))))
     (if (> (+ num-running num-running-in-jobgroup) 0)
 	(runs:inc-can-run-more-tests-count runsdat)) ;; (set! *runs:can-run-more-tests-count* (+ *runs:can-run-more-tests-count* 1)))
     (if (not (eq? *last-num-running-tests* num-running))
 	(begin
-	  (debug:print 2 *default-log-port* "max-concurrent-jobs: " max-concurrent-jobs ", num-running: " num-running)
+	  (debug:print 1 *default-log-port* "max-concurrent-jobs: " max-concurrent-jobs ", num-running: " num-running)
 	  (set! *last-num-running-tests* num-running)))
     (if (not (eq? 0 *globalexitstatus*))
 	(list #f num-running num-running-in-jobgroup max-concurrent-jobs job-group-limit)
 	(let ((can-not-run-more (cond
 				 ;; if max-concurrent-jobs is set and the number running is greater 
@@ -465,11 +465,11 @@
     ;;
     ;; What happended, this code is now duplicated in tests!?
     ;;
     ;;======================================================================
     
-    (if (not (null? test-names))
+    (if (not (null? test-names)) ;; BEGIN test-names loop
 	(let loop ((hed (car test-names))   ;; NOTE: This is the main loop that iterates over the test-names
 		   (tal (cdr test-names)))         ;; 'return-procs tells the config reader to prep running system but return a proc
 	  (change-directory *toppath*) ;; PLEASE OPTIMIZE ME!!! I think this should be a no-op but there are several places where change-directories could be happening.
 	  (setenv "MT_TEST_NAME" hed) ;; 
 	  (let*-values (((waitons waitors config)(tests:get-waitons hed all-tests-registry)))
@@ -483,16 +483,16 @@
 		  (set! waitons (filter (lambda (x)(not (equal? x hed))) waitons))
 		  (set! waitors (filter (lambda (x)(not (equal? x hed))) waitors))))
 	    
 	    ;; (items   (items:get-items-from-config config)))
 	    (if (not (hash-table-ref/default test-records hed #f))
-		(hash-table-set! test-records
-				 hed (vector hed     ;; 0
-					     config  ;; 1
-					     waitons ;; 2
+		(hash-table-set! test-records ;; BB: we are doing a manual make-tests:testqueue
+				 hed (vector hed     ;; 0 ;; testname
+					     config  ;; 1 
+					     waitons ;; 2 
 					     (config-lookup config "requirements" "priority")     ;; priority 3
-					     (tests:get-items config) ;; expand the [items] and or [itemstable] into explict items
+					     (tests:get-items config) ;; 4 ;; expand the [items] and or [itemstable] into explict items
 					     #f      ;; itemsdat 5
 					     #f      ;; spare - used for item-path
 					     waitors ;; 
 					     )))
 	    (for-each 
@@ -502,11 +502,11 @@
 			  (waiton-tconfig  (if waiton-record (vector-ref waiton-record 1) #f))
 			  (waiton-itemized (and waiton-tconfig
 						(or (hash-table-ref/default waiton-tconfig "items" #f)
 						    (hash-table-ref/default waiton-tconfig "itemstable" #f))))
 			  (itemmaps        (tests:get-itemmaps config))  ;; (configf:lookup config "requirements" "itemmap"))
-			  (new-test-patts  (tests:extend-test-patts test-patts hed waiton itemmaps)))
+			  (new-test-patts  (tests:extend-test-patts test-patts hed waiton itemmaps)))   ;; BB:  items expanded here.
 		     (debug:print-info 0 *default-log-port* "Test " waiton " has " (if waiton-record "a" "no") " waiton-record and" (if waiton-itemized " " " no ") "items")
 		     ;; need to account for test-patt here, if I am test "a", selected with a test-patt of "hed/b%"
 		     ;; and we are waiting on "waiton" we need to add "waiton/,waiton/b%" to test-patt
 		     ;; is this satisfied by merely appending "/" to the waiton name added to the list?
 		     ;;
@@ -542,11 +542,11 @@
 	     (delete-duplicates (append waitons waitors)))
 	    (let ((remtests (delete-duplicates (append waitons tal))))
 	      (if (not (null? remtests))
 		  (begin
 		    ;; (debug:print-info 0 *default-log-port* "Preprocessing continues for " (string-intersperse remtests ", "))
-		    (loop (car remtests)(cdr remtests))))))))
+		    (loop (car remtests)(cdr remtests)))))))) ;; END test-names loop
 
     (if (not (null? required-tests))
 	(debug:print-info 1 *default-log-port* "Adding \"" (string-intersperse required-tests " ") "\" to the run queue"))
     ;; NOTE: these are all parent tests, items are not expanded yet.
     (debug:print-info 4 *default-log-port* "test-records=" (hash-table->alist test-records))
@@ -561,19 +561,19 @@
 						  (print-call-chain)
 						  (print " message: " ((condition-property-accessor 'exn 'message) exn)))
 					      (runs:run-tests-queue run-id runname test-records keyvals flags test-patts required-tests
 								    (any->number reglen) all-tests-registry)))
 					  "runs:run-tests-queue"))
-		 (th2        (make-thread (lambda ()				    
+		 (th2        (make-thread (lambda ()			 ;; BBQ: why are we visiting ALL runs here?	    
 					    ;; (rmt:find-and-mark-incomplete-all-runs))))) CAN'T INTERRUPT IT ...
 					    (let ((run-ids (rmt:get-all-run-ids)))
 					      (for-each (lambda (run-id)
 							  (if keep-going
 							      (handle-exceptions
 							       exn
 							       (debug:print 0 *default-log-port* "error in calling find-and-mark-incomplete for run-id " run-id)
-							       (rmt:find-and-mark-incomplete run-id #f)))) ;; ovr-deadtime)))
+							       (rmt:find-and-mark-incomplete run-id #f)))) ;; ovr-deadtime))) ;; could be root of https://hsdes.intel.com/appstore/article/#/220546828/main -- Title: Megatest jobs show DEAD even though they are still running (1.64/27)
 							run-ids)))
 					  "runs: mark-incompletes")))
 	    (thread-start! th1)
 	    (thread-start! th2)
 	    (thread-join! th1)
@@ -630,176 +630,291 @@
 (define (runs:loop-values tal reg reglen regfull reruns)
   (list (runs:queue-next-hed tal reg reglen regfull)      ;; hed
         (runs:queue-next-tal tal reg reglen regfull)      ;; tal
         (runs:queue-next-reg tal reg reglen regfull)      ;; reg
         reruns))                                          ;; reruns
+
+;; objective - iterate through the tests
+;;    => want to prioritize tests we haven't seen before
+;;    => sometimes need to squeeze things in (added to reg)
+;;    => review of a previously seen test has higher priority than a never-visited test
+;; reg - list of previously visited tests
+;; tal - list of never-visited tests
+;;   prefer taking the next hed from reg rather than from tal.
+
+
 
 (define runs:nothing-left-in-queue-count 0)
 
-;; BB: for future reference - suspect target vars are not expanded to env vars at this point (item expansion using [items]\nwhatever [system echo $TARGETVAR] doesnt work right whereas [system echo #{targetvar}] does.. Tal and Randy have tix on this.  on first pass, var not set, on second pass, ok.  
+;; BB: for future reference - suspect target vars are not expanded to env vars at this point (item expansion using [items]\nwhatever [system echo $TARGETVAR] doesnt work right whereas [system echo #{targetvar}] does.. Tal and Randy have tix on this.  on first pass, var not set, on second pass, ok.
+
+;; The return value of runs:expand-items is passed back to runs:run-tests-queue and is fed to a named loop with this signature:
+;;    (let loop ((hed         (car sorted-test-names))
+;;	         (tal         (cdr sorted-test-names))
+;;	         (reg         '()) ;; registered, put these at the head of tal 
+;;	         (reruns      '()))
+
+;; runs:expand-items: for a given test, expand its items into real tests ready to be processed at this time.
+;;  This procedure's operation only makes sense in the context of runs:run-tests-queue.
 (define (runs:expand-items hed tal reg reruns regfull newtal jobgroup max-concurrent-jobs run-id waitons item-path testmode test-record can-run-more items runname tconfig reglen test-registry test-records itemmaps)
   (let* ((loop-list       (list hed tal reg reruns))
-	 (prereqs-not-met (let ((res (rmt:get-prereqs-not-met run-id waitons hed item-path mode: testmode itemmaps: itemmaps)))
+	 (prereqs (let ((res (rmt:get-prereqs-not-met run-id waitons hed item-path mode: testmode itemmaps: itemmaps)))
 			    (if (list? res)
 				res
 				(begin
 				  (debug:print 0 *default-log-port*
 					       "ERROR: rmt:get-prereqs-not-met returned non-list!\n"
 					       "  res=" res " run-id=" run-id " waitons=" waitons " hed=" hed " item-path=" item-path " testmode=" testmode " itemmaps=" itemmaps)
 				  '()))))
+         (have-itemized (not (null? (lset-intersection eq? testmode '(itemmatch itemwait)))))
+         (ok-statuses '("PASS" "WARN" "CHECK" "WAIVED" "SKIP"))
+
+         ;; (prereqs-not-met
+         ;;  (filter (lambda (test)
+         ;;               (if (vector? test)  ;; BB: result may be a collection of strings or test vectors-- why not just test vectors?
+         ;;                   (let ((testname (db:test-get-testname test))
+         ;;                         (itempath (db:test-get-item-path test))
+         ;;                         (state (db:test-get-state test) )
+         ;;                         (status (db:test-get-status test)))
+         ;;                     (cond
+         ;;                      ((and (equal? state "COMPLETED") (member status ok-statuses)) #f)
+         ;;                      ((and have-itemized (equal? "" itempath) (member testname prereq-tests-some-items-passed-list)) #f)
+         ;;                      (else #t)))
+         ;;                   test))
+         ;;             (delete-duplicates prereqs)))
+
+         (prereq-items-completed
+          (filter (lambda (test)
+                       (if (vector? test)  ;; BB: result may be a collection of strings or test vectors-- why not just test vectors?
+                           (let ((testname (db:test-get-testname test))
+                                 (itempath (db:test-get-item-path test))
+                                 (state (db:test-get-state test) )
+                                 (status (db:test-get-status test)))
+                             (cond
+                              ((equal? state "COMPLETED") #t)
+                              ((not (equal? "" itempath))  #f)
+                              (else #f)))
+                           #f))
+                       prereqs))
+
+          
 	 ;; (prereqs-not-met (mt:lazy-get-prereqs-not-met run-id waitons item-path mode: testmode itemmap: itemmap))
-	 (fails           (runs:calc-fails prereqs-not-met))
-	 (prereq-fails    (runs:calc-prereq-fail prereqs-not-met))
-	 (non-completed   (runs:calc-not-completed prereqs-not-met))
-	 (runnables       (runs:calc-runnable prereqs-not-met)))
-    (debug:print-info 4 *default-log-port* "START OF INNER COND #2 "
-		      "\n can-run-more:    " can-run-more
-		      "\n testname:        " hed
-		      "\n prereqs-not-met: " (runs:pretty-string prereqs-not-met)
-		      "\n non-completed:   " (runs:pretty-string non-completed) 
-		      "\n prereq-fails:    " (runs:pretty-string prereq-fails)
-		      "\n fails:           " (runs:pretty-string fails)
-		      "\n testmode:        " testmode
+	 (fails           (runs:calc-fails prereqs)) ;; prereqs 
+	 (prereq-fails    (runs:calc-prereq-fail prereqs)) ;; filter - get NOT_STARTED's which are not status n/a or KEEP_TRYING
+	 (non-completed   (runs:calc-not-completed prereqs))
+	 (runnable-prereqs       (runs:calc-runnable prereqs))
+         
+         (unexpanded-prereqs
+          (filter (lambda (testname)
+                    (let* ((test-rec (hash-table-ref test-records testname))
+                           (items       (tests:testqueue-get-items  test-rec)))
+                      ;;(BB> "HEY " testname "=>"items)
+                      (or (procedure? items)(eq? items 'have-procedure))))
+                  waitons))
+         (completed-prereq-items
+          ;; Entries of prereqs that are test records (vectors), belong to an
+          ;; individual item (non-empty item-path) and are in state COMPLETED.
+          ;; Non-vector entries are skipped.  The itemmatch/itemwait branch of
+          ;; the cond below expands hed's items only when this list is non-empty.
+          (filter (lambda (test)
+                    ;;(BB> "foo - "test)
+                    (and (vector? test)
+                         (equal? "COMPLETED" (db:test-get-state test))
+                         (not (equal? "" (db:test-get-item-path test)))))
+                  prereqs))
+
+         )
+    (debug:print-info 1 *default-log-port* "START OF INNER COND #2 "
+		      "\n can-run-more:            " can-run-more
+		      "\n testname:                " hed
+		      "\n prereqs:                 " (runs:pretty-string prereqs)
+                      "\n completed-prereq-items:  " (runs:pretty-string completed-prereq-items)
+		      "\n non-completed:           " (runs:pretty-string non-completed) 
+		      "\n prereq-fails:            " (runs:pretty-string prereq-fails)
+                      "\n runnable-prereqs:        " (runs:pretty-string runnable-prereqs)
+		      "\n fails:                   " (runs:pretty-string fails)
+		      "\n testmode:                " testmode
 		      "\n (member 'toplevel testmode): " (member 'toplevel testmode)
-		      "\n (null? non-completed):    " (null? non-completed)
-		      "\n reruns:          " reruns
-		      "\n items:           " items
-		      "\n can-run-more:    " can-run-more)
-
-   (cond
-     ;; all prereqs met, fire off the test
-     ;; or, if it is a 'toplevel test and all prereqs not met are COMPLETED then launch
-
-     ((and (not (member 'toplevel testmode))
-	   (member (hash-table-ref/default test-registry (db:test-make-full-name hed item-path) 'n/a)
-		   '(DONOTRUN removed CANNOTRUN))) ;; *common:cant-run-states-sym*) ;; '(COMPLETED KILLED WAIVED UNKNOWN INCOMPLETE)) ;; try to catch repeat processing of COMPLETED tests here
-      (debug:print-info 1 *default-log-port* "Test " hed " set to \"" (hash-table-ref test-registry (db:test-make-full-name hed item-path)) "\". Removing it from the queue")
-      (if (or (not (null? tal))
-	      (not (null? reg)))
-          (runs:loop-values tal reg reglen regfull reruns)
-	  (begin
-	    (debug:print-info 0 *default-log-port* "Nothing left in the queue!")
-	    ;; If get here twice then we know we've tried to expand all items
-	    ;; since there must be a logic issue with the handling of loops in the 
-	    ;; items expand phase we will brute force an exit here.
-	    (if (> runs:nothing-left-in-queue-count 2)
-		(begin
-		  (debug:print 0 *default-log-port* "WARNING: this condition is triggered when there were no items to expand and nothing to run. Please check your run for completeness")
-		  (exit 0))
-		(set! runs:nothing-left-in-queue-count (+ runs:nothing-left-in-queue-count 1)))
-	    #f)))
-
-     ;; 
-     ((or (null? prereqs-not-met)
-	  (and (member 'toplevel testmode)
-	       (null? non-completed)))
-      (debug:print-info 4 *default-log-port* "runs:expand-items: (or (null? prereqs-not-met) (and (member 'toplevel testmode)(null? non-completed)))")
-      (let ((test-name (tests:testqueue-get-testname test-record)))
-	(setenv "MT_TEST_NAME" test-name) ;; 
-	(setenv "MT_RUNNAME"   runname)
-	(runs:set-megatest-env-vars run-id inrunname: runname) ;; these may be needed by the launching process
-	(let ((items-list (items:get-items-from-config tconfig)))
-	  (if (list? items-list)
-	      (begin
-		(if (null? items-list)
-		    (let ((test-id   (rmt:get-test-id run-id test-name ""))
-			  (num-items (rmt:test-toplevel-num-items run-id test-name)))
-		      (if (and test-id
-			       (not (> num-items 0)))
-			  (mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "ZERO_ITEMS" "Failed to run due to failed prerequisites"))))
-		(tests:testqueue-set-items! test-record items-list)
-		(list hed tal reg reruns))
-	      (begin
-		(debug:print-error 0 *default-log-port* "The proc from reading the items table did not yield a list - please report this")
-		(exit 1))))))
-
-     ((and (null? fails)
-	   (null? prereq-fails)
-	   (not (null? non-completed)))
-      (let* ((allinqueue (map (lambda (x)(if (string? x) x (db:test-get-testname x)))
-        		      (append newtal reruns)))
-	     ;; prereqstrs is a list of test names as strings that are prereqs for hed
-             (prereqstrs (delete-duplicates (map (lambda (x)(if (string? x) x (db:test-get-testname x)))
-						 prereqs-not-met)))
-	     ;; a prereq that is not found in allinqueue will be put in the notinqueue list
-	     ;; 
-             ;; (notinqueue (filter (lambda (x)
-             ;;    		   (not (member x allinqueue)))
-             ;;    		 prereqstrs))
-	     (give-up    #f))
-
-	;; We can get here when a prereq has not been run due to *it* having a prereq that failed.
-	;; We need to use this to dequeue this item as CANNOTRUN
-	;; 
-	(if (member 'toplevel testmode) ;; '(toplevel)) ;; NOTE: this probably should be (member 'toplevel testmode)
-	    (for-each (lambda (prereq)
-			(if (eq? (hash-table-ref/default test-registry prereq 'justfine) 'CANNOTRUN)
-			    (set! give-up #t)))
-		      prereqstrs))
-
-	(if (and give-up
-		 (not (and (null? tal)(null? reg))))
-	    (let ((trimmed-tal (mt:discard-blocked-tests run-id hed tal test-records))
-		  (trimmed-reg (mt:discard-blocked-tests run-id hed reg test-records)))
-	      (debug:print 1 *default-log-port* "WARNING: test " hed " has discarded prerequisites, removing it from the queue")
-
-	      (let ((test-id (rmt:get-test-id run-id hed "")))
-		(if test-id (mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "PREQ_DISCARDED" "Failed to run due to discarded prerequisites")))
-	      
-	      (if (and (null? trimmed-tal)
-		       (null? trimmed-reg))
-		  #f
-                  (runs:loop-values trimmed-tal trimmed-reg reglen regfull reruns)
-                  ))
-	      (list (car newtal)(append (cdr newtal) reg) '() reruns))))
-
-     ((and (null? fails)
-	   (null? prereq-fails)
-	   (null? non-completed))
-      (if  (runs:can-keep-running? hed 20)
-	  (begin
-	    (runs:inc-cant-run-tests hed)
-	    (debug:print-info 1 *default-log-port* "no fails in prerequisites for " hed " but also none running, keeping " hed " for now. Try count: " (hash-table-ref/default *seen-cant-run-tests* hed 0))
-	    ;; getting here likely means the system is way overloaded, kill a full minute before continuing
-	    (thread-sleep! 60)
-	    ;; num-retries code was here
-	    ;; we use this opportunity to move contents of reg to tal
-	    (list (car newtal)(append (cdr newtal) reg) '() reruns)) ;; an issue with prereqs not yet met?
-	  (begin
-	    (debug:print-info 1 *default-log-port* "no fails in prerequisites for " hed " but nothing seen running in a while, dropping test " hed " from the run queue")
-	    (let ((test-id (rmt:get-test-id run-id hed "")))
-	      (if test-id (mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "TIMED_OUT" "Nothing seen running in a while.")))
-            (runs:loop-values tal reg reglen regfull reruns)
-            )))
-
-     ((and 
-       (or (not (null? fails))
-	   (not (null? prereq-fails)))
-       (member 'normal testmode))
-      (debug:print-info 1 *default-log-port* "test "  hed " (mode=" testmode ") has failed prerequisite(s); "
-			(string-intersperse (map (lambda (t)(conc (db:test-get-testname t) ":" (db:test-get-state t)"/"(db:test-get-status t))) fails) ", ")
-			", removing it from to-do list")
-      (let ((test-id (rmt:get-test-id run-id hed "")))
-	(if test-id
-	    (if (not (null? prereq-fails))
-		(mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "PREQ_DISCARDED" "Failed to run due to prior failed prerequisites")
-		(mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "PREQ_FAIL"      "Failed to run due to failed prerequisites"))))
-      (if (or (not (null? reg))(not (null? tal)))
-	  (begin
-	    (hash-table-set! test-registry hed 'CANNOTRUN)
-            (runs:loop-values tal reg reglen regfull (cons hed reruns))
-            )
-	  #f)) ;; #f flags do not loop
-
-     ((and (not (null? fails))(member 'toplevel testmode))
-      (if (or (not (null? reg))(not (null? tal)))
-	   (list (car newtal)(append (cdr newtal) reg) '() reruns)
-	  #f)) 
-     ((null? runnables) #f) ;; if we get here and non-completed is null then it is all over.
-     (else
-      (debug:print 0 *default-log-port* "WARNING: FAILS or incomplete tests maybe preventing completion of this run. Watch for issues with test " hed ", continuing for now")
-      (list (car newtal)(cdr newtal) reg reruns)))))
+		      "\n (null? non-completed):      " (null? non-completed)
+		      "\n reruns:                  " reruns
+		      "\n items:                   " items
+		      "\n unexpanded-prereqs:      " unexpanded-prereqs ;;all-prereqs-expanded
+                      "\n completed-prereq-items:  " completed-prereq-items
+                      "\n have-itemized:           " have-itemized
+		      "\n can-run-more:            " can-run-more)
+    
+    ;;(BB> "before runs:expand-items cond")
+    (let ((res
+           (cond
+            ;; all prereqs met, fire off the test
+            ;; or, if it is a 'toplevel test and all prereqs not met are COMPLETED then launch
+            ;; runs:expand-items case: test of interest not toplevel and IS blackballed -> ???
+            ((and (not (member 'toplevel testmode)) ;; test has been blackballed elsewhere
+                  (member (hash-table-ref/default test-registry (db:test-make-full-name hed item-path) 'n/a)
+                          '(DONOTRUN removed CANNOTRUN))) ;; *common:cant-run-states-sym*) ;; '(COMPLETED KILLED WAIVED UNKNOWN INCOMPLETE)) ;; try to catch repeat processing of COMPLETED tests here
+             ;;(BB> "cb1")
+             
+             (debug:print-info 1 *default-log-port* "Test " hed " set to \"" (hash-table-ref test-registry (db:test-make-full-name hed item-path)) "\". Removing it from the queue")
+             (if (or (not (null? tal))
+                     (not (null? reg))) 
+                 (runs:loop-values tal reg reglen regfull reruns) ;; blackballed test - throw it away
+                 (begin
+                   (debug:print-info 0 *default-log-port* "Nothing left in the queue!")
+                   ;; If get here twice then we know we've tried to expand all items
+                   ;; since there must be a logic issue with the handling of loops in the 
+                   ;; items expand phase we will brute force an exit here.
+                   (if (> runs:nothing-left-in-queue-count 2)
+                       (begin
+                         (debug:print 0 *default-log-port* "WARNING: this condition is triggered when there were no items to expand and nothing to run. Please check your run for completeness")
+                         (exit 0))
+                       (set! runs:nothing-left-in-queue-count (+ runs:nothing-left-in-queue-count 1)))
+                   #f)))
+
+            ;;; desired result of below cond branch:
+            ;;   we want to expand items in our test of interest (hed) in the following cases:
+            ;;    case 1 - mode is itemmatch or itemwait: (DONE)
+            ;;       - all prereq tests have been expanded
+            ;;       - at least one prereq's items have completed
+            ;;    case 2 - mode is toplevel   (PARTIAL)
+            ;;       - prereqs are completed.
+            ;;       - or no prereqs can complete (TODO)
+            ;;    case 3 - mode not specified (DONE)
+            ;;       - prereqs are completed and passed (we could consider removing "and passed" -- it would change behavior from current)          
+                   
+            ;; runs:expand-items case: toplevel or else no dangling prerequisites -- expand items now.
+            ((or
+              (and have-itemized (null? unexpanded-prereqs) (not (null? completed-prereq-items)))
+              (null? prereqs)            ;; nothing is in our way to proceed (need to expand this to an item level check.)
+              (and (member 'toplevel testmode)   ;; for toplevel test - proceed (nothing in our way)
+                   (null? non-completed)))
+             ;;(BB> "cb2")
+
+             (debug:print-info 4 *default-log-port* "runs:expand-items: (or (null? prereqs) (and (member 'toplevel testmode)(null? non-completed)))")
+             (let ((test-name (tests:testqueue-get-testname test-record)))
+               (setenv "MT_TEST_NAME" test-name) ;; hack to give context to get-items-from-config TODO: call-with-environment-variables
+               (setenv "MT_RUNNAME"   runname)   
+               (runs:set-megatest-env-vars run-id inrunname: runname) ;; these may be needed by the launching process
+               (let ((items-list (items:get-items-from-config tconfig))) ;; BB: RIGHT HERE is where item expansion occurs..  target vars are not expanded to env vars at this point (item expansion using [items]\nwhatever [system echo $TARGETVAR] doesnt work right whereas [system echo #{targetvar}] does.. Tal and Randy have tix on this.
+                 (if (list? items-list)
+                     (begin                      ;; we have discovered we have items we need to process, so stuff them into test list and recur
+                       (if (null? items-list)
+                           (let ((test-id   (rmt:get-test-id run-id test-name ""))
+                                 (num-items (rmt:test-toplevel-num-items run-id test-name)))
+                             (if (and test-id
+                                      (not (> num-items 0)))
+                                 (mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "ZERO_ITEMS" "Failed to run due to failed prerequisites"))))
+                       (tests:testqueue-set-items! test-record items-list) ; stuffing happens here
+                       (list hed tal reg reruns)) ;; return value..
+                     (begin
+                       (debug:print-error 0 *default-log-port* "The proc from reading the items table did not yield a list - please report this")
+                       (exit 1))))))
+
+            ;; runs:expand-items case: no fails, no prereq-fails, some non-completed
+            ((and (null? fails)
+                  (null? prereq-fails)
+                  (not (null? non-completed)))
+             ;;(BB> "cb3")
+             (let* ((allinqueue (map (lambda (x)(if (string? x) x (db:test-get-testname x)))
+                                     (append newtal reruns)))
+                    ;; prereqstrs is a list of test names as strings that are prereqs for hed
+                    (prereqstrs (delete-duplicates (map (lambda (x)(if (string? x) x (db:test-get-testname x)))
+                                                        prereqs)))
+                    ;; a prereq that is not found in allinqueue will be put in the notinqueue list
+                    ;; 
+                    ;; (notinqueue (filter (lambda (x)
+                    ;;    		   (not (member x allinqueue)))
+                    ;;    		 prereqstrs))
+                    (give-up    #f))
+
+               ;; We can get here when a prereq has not been run due to *it* having a prereq that failed.
+               ;; We need to use this to dequeue this item as CANNOTRUN
+               ;; 
+               (if (member 'toplevel testmode) ;; '(toplevel)) ;; NOTE: this probably should be (member 'toplevel testmode)
+                   (for-each (lambda (prereq)
+                               (if (eq? (hash-table-ref/default test-registry prereq 'justfine) 'CANNOTRUN)
+                                   (set! give-up #t)))
+                             prereqstrs))
+
+               (if (and give-up
+                        (not (and (null? tal)(null? reg))))
+                   (let ((trimmed-tal (mt:discard-blocked-tests run-id hed tal test-records))
+                         (trimmed-reg (mt:discard-blocked-tests run-id hed reg test-records)))
+                     (debug:print 1 *default-log-port* "WARNING: test " hed " has discarded prerequisites, removing it from the queue")
+
+                     (let ((test-id (rmt:get-test-id run-id hed "")))
+                       (if test-id (mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "PREQ_DISCARDED" "Failed to run due to discarded prerequisites")))
+                     
+                     (if (and (null? trimmed-tal)
+                              (null? trimmed-reg))
+                         #f
+                         (runs:loop-values trimmed-tal trimmed-reg reglen regfull reruns)
+                         ))
+                   (list (car newtal)(append (cdr newtal) reg) '() reruns))))
+
+            ((and (null? fails) ;; have not-started tests, but unable to run them.  everything looks completed with no prospect of unsticking something that is stuck.  we should mark hed as moribund and exit or continue if there are more tests to consider
+                  (null? prereq-fails)
+                  (null? non-completed))
+             ;;(BB> "cb4")
+             (if  (runs:can-keep-running? hed 20)
+                  (begin
+                    (runs:inc-cant-run-tests hed)
+                    (debug:print-info 0 *default-log-port* "no fails in prerequisites for " hed " but also none running, keeping " hed " for now. Try count: " (hash-table-ref/default *seen-cant-run-tests* hed 0)) ;; 
+                    ;; getting here likely means the system is way overloaded, kill a full minute before continuing
+                    (thread-sleep! 60) ;; TODO: gate by normalized server load > 1.0 (maxload config thing)
+                    ;; num-retries code was here
+                    ;; we use this opportunity to move contents of reg to tal
+                    (list (car newtal)(append (cdr newtal) reg) '() reruns)) ;; an issue with prereqs not yet met?
+                  (begin
+                    (debug:print-info 1 *default-log-port* "no fails in prerequisites for " hed " but nothing seen running in a while, dropping test " hed " from the run queue")
+                    (let ((test-id (rmt:get-test-id run-id hed "")))
+                      (if test-id (mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "TIMED_OUT" "Nothing seen running in a while.")))
+                    (runs:loop-values tal reg reglen regfull reruns)
+                    )))
+
+            ((and 
+              (or (not (null? fails))
+                  (not (null? prereq-fails)))
+              (member 'normal testmode))
+             ;;(BB> "cb5")
+             (debug:print-info 1 *default-log-port* "test "  hed " (mode=" testmode ") has failed prerequisite(s); "
+                               (string-intersperse (map (lambda (t)(conc (db:test-get-testname t) ":" (db:test-get-state t)"/"(db:test-get-status t))) fails) ", ")
+                               ", removing it from to-do list")
+             (let ((test-id (rmt:get-test-id run-id hed "")))
+               (if test-id
+                   (if (not (null? prereq-fails))
+                       ;;was: (mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "PREQ_DISCARDED" "Failed to run due to prior failed prerequisites")
+                       (rmt:set-state-status-and-roll-up-items run-id test-id #f "NOT_STARTED" "PREQ_DISCARDED" "Failed to run due to prior failed prerequisites")
+                       (begin
+                         ;;(debug:print 4 *default-log-port*"BB> set PREQ_FAIL on "hed)
+
+                         
+                         ;;was: (mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "PREQ_FAIL" "Failed to run due to failed prerequisites")
+                         (rmt:set-state-status-and-roll-up-items run-id test-id #f "NOT_STARTED" "PREQ_FAIL" "Failed to run due to failed prerequisites")
+                         )))) 
+             (if (or (not (null? reg))(not (null? tal)))
+                 (begin
+                   (hash-table-set! test-registry hed 'CANNOTRUN)
+                   (runs:loop-values tal reg reglen regfull (cons hed reruns))
+                   )
+                 #f)) ;; #f flags do not loop
+
+            ((and (not (null? fails))(member 'toplevel testmode))
+             ;;(BB> "cb6")
+             (if (or (not (null? reg))(not (null? tal)))
+                 (list (car newtal)(append (cdr newtal) reg) '() reruns)
+                 #f))
+            
+            ((null? runnable-prereqs)
+             ;;(BB> "cb7")
+             #f) ;; if we get here and non-completed is null then it is all over.
+            
+            (else
+             ;;(BB> "cb8")
+             (debug:print 0 *default-log-port* "WARNING: FAILS or incomplete tests maybe preventing completion of this run. Watch for issues with test " hed ", continuing for now")
+             (list (car newtal)(cdr newtal) reg reruns)))))
+      ;;(BB> "after runs:expand-items big cond")
+      res)))
 
 (define (runs:mixed-list-testname-and-testrec->list-of-strings inlst)
   (if (null? inlst)
       '()
       (map (lambda (t)
@@ -818,10 +933,13 @@
 
 
 ;;  hed tal reg reruns reglen regfull test-record runname test-name item-path jobgroup max-concurrent-jobs run-id waitons item-path testmode test-patts required-tests test-registry registry-mutex flags keyvals run-info newtal all-tests-registry itemmaps)
 (define (runs:process-expanded-tests runsdat testdat)
   ;; unroll the contents of runsdat and testdat (due to ongoing refactoring).
+  (debug:print 2 *default-log-port* "runs:process-expanded-tests; testdat:" )
+  (debug:print 2 *default-log-port* (with-output-to-string
+                                            (lambda () (pp (runs:testdat->alist testdat) ))))
   (let* ((hed                    (runs:testdat-hed testdat))
 	 (tal                    (runs:testdat-tal testdat))
 	 (reg                    (runs:testdat-reg testdat))
 	 (reruns                 (runs:testdat-reruns testdat))
 	 (test-name              (runs:testdat-test-name testdat))
@@ -889,11 +1007,11 @@
 
     ;; Don't know at this time if the test have been launched at some time in the past
     ;; i.e. is this a re-launch?
     (debug:print-info 4 *default-log-port* "run-limits-info = " run-limits-info)
     
-    (cond
+    (cond ; cond 894- 1067
      
      ;; Check item path against item-patts, 
      ;;
      ((not (tests:match test-patts (tests:testqueue-get-testname test-record) item-path required: required-tests)) ;; This test/itempath is not to be run
       ;; else the run is stuck, temporarily or permanently
@@ -1005,30 +1123,39 @@
 		 (debug:print-info 0 *default-log-port* "Waiting for more work to do..."))
 	    (thread-sleep! 1)
 	    (list (car newtal)(cdr newtal) reg reruns))
 	  ;; the waiton is FAIL so no point in trying to run hed ever again
 	  (if (or (not (null? reg))(not (null? tal)))
-	      (if (vector? hed)
+	      (if (or (vector? hed)  (not (null? fails))) ;; BB: why do we need a vector?  in my case, fails is populated (prereq failed), reg is not nul, and we really want to drop this one
 		  (begin
 		    (debug:print 1 *default-log-port* "WARNING: Dropping test " test-name "/" item-path
 				 " from the launch list as it has prerequistes that are FAIL")
 		    (let ((test-id (rmt:get-test-id run-id hed "")))
-		      (if test-id (mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "PREQ_FAIL" "Failed to run due to failed prerequisites")))
-		    (runs:shrink-can-run-more-tests-count runsdat) ;; DELAY TWEAKER (still needed?)
+		      (if test-id
+                          ;; was: ;(mt:test-set-state-status-by-id run-id test-id "NOT_STARTED" "PREQ_FAIL" "Failed to run due to failed prerequisites")))
+                          (rmt:set-state-status-and-roll-up-items run-id test-id #f "NOT_STARTED"  "PREQ_FAIL" "Failed to run due to failed prerequisites")))
+                                        
+                    (runs:shrink-can-run-more-tests-count runsdat) ;; DELAY TWEAKER (still needed?)
 		    ;; (thread-sleep! *global-delta*)
 		    ;; This next is for the items
-		    (mt:test-set-state-status-by-testname run-id test-name item-path "NOT_STARTED" "BLOCKED" #f)
+
+                    (if (not (null? fails))
+                        ;;(mt:test-set-state-status-by-testname run-id test-name item-path "NOT_STARTED" "PREQ_FAIL" #f)
+                        (rmt:set-state-status-and-roll-up-items run-id test-name item-path "NOT_STARTED" "PREQ_FAIL" #f) 
+                        ;;(mt:test-set-state-status-by-testname run-id test-name item-path "NOT_STARTED" "BLOCKED" #f)
+                        (rmt:set-state-status-and-roll-up-items run-id test-name item-path "NOT_STARTED" "BLOCKED" #f) )
 		    (hash-table-set! test-registry (db:test-make-full-name test-name item-path) 'removed)
 		    (runs:loop-values tal reg reglen regfull reruns))
-		  (let ((nth-try (hash-table-ref/default test-registry hed 0)))
+		  (let ((nth-try (hash-table-ref/default test-registry hed 0))) ;; hed not a vector...
+                    (debug:print 2 *default-log-port* "nth-try("hed")="nth-try)
 		    (cond
 		     ((member "RUNNING" (map db:test-get-state prereqs-not-met))
 		      (if (runs:lownoise (conc "possible RUNNING prerequistes " hed) 60)
 			  (debug:print 0 *default-log-port* "WARNING: test " hed " has possible RUNNING prerequisites, don't give up on it yet."))
 		      (thread-sleep! 4)
 		      (runs:loop-values tal reg reglen regfull reruns))
-		     ((or (not nth-try)
+		     ((or (not nth-try) ;; BB: condition on subsequent tries, condition below fires on first try 
 			  (and (number? nth-try)
 			       (< nth-try 10)))
 		      (hash-table-set! test-registry hed (if (number? nth-try)
 							     (+ nth-try 1)
 							     0))
@@ -1035,18 +1162,18 @@
 		      (if (runs:lownoise (conc "not removing test " hed) 60)
 			  (debug:print 1 *default-log-port* "WARNING: not removing test " hed " from queue although it may not be runnable due to FAILED prerequisites"))
 		      ;; may not have processed correctly. Could be a race condition in your test implementation? Dropping test " hed) ;;  " as it has prerequistes that are FAIL. (NOTE: hed is not a vector)")
 		      (runs:shrink-can-run-more-tests-count runsdat) ;; DELAY TWEAKER (still needed?)
 		      (runs:loop-values newtal reg reglen regfull reruns))
-		     ((symbol? nth-try)
+		     ((symbol? nth-try) ;; BB: 'done matches here in one case where prereq itemwait failed.  This is first "try"
 		      (if (eq? nth-try 'removed) ;; removed is removed - drop it NOW
 			  (if (null? tal)
 			      #f ;; yes, really
 			      (list (car tal)(cdr tal) reg reruns))
 			  (begin
 			    (if (runs:lownoise (conc "FAILED prerequisites or other issue" hed) 60)
-				(debug:print 0 *default-log-port* "WARNING: test " hed " has FAILED prerequisites or other issue. Internal state " nth-try " will be overridden and we'll retry."))
+				(debug:print 0 *default-log-port* "WARNING: test " hed " has FAILED prerequisites or other issue. Internal state >" nth-try "< will be overridden and we'll retry."))
 			    (mt:test-set-state-status-by-testname run-id test-name item-path "NOT_STARTED" "KEEP_TRYING" #f)
 			    (hash-table-set! test-registry hed 0)
 			    (runs:loop-values newtal reg reglen regfull))))
 		     (else
 		      (if (runs:lownoise (conc "FAILED prerequitests and we tried" hed) 60)
@@ -1166,50 +1293,50 @@
   ;; Do mark-and-find clean up of db before starting runing of quue
   ;;
   ;; (rmt:find-and-mark-incomplete)
 
   (let* ((run-info             (rmt:get-run-info run-id))
-	(tests-info            (mt:get-tests-for-run run-id #f '() '())) ;;  qryvals: "id,testname,item_path"))
-	(sorted-test-names     (tests:sort-by-priority-and-waiton test-records))
-	(test-registry         (make-hash-table))
-	(registry-mutex        (make-mutex))
-	(num-retries           0)
-	(max-retries           (config-lookup *configdat* "setup" "maxretries"))
-	(max-concurrent-jobs   (configf:lookup-number *configdat* "setup" "max_concurrent_jobs" default: 50))
-        (reglen                (if (number? reglen-in) reglen-in 1))
-	(last-time-incomplete  (- (current-seconds) 900)) ;; force at least one clean up cycle
-	(last-time-some-running (current-seconds))
-	;; (tdbdat                (tasks:open-db))
-	(runsdat (make-runs:dat
-		  ;; hed: hed
-		  ;; tal: tal
-		  ;; reg: reg
-		  ;; reruns: reruns
-		  reglen: reglen
-		  regfull: #f ;; regfull
-		  ;; test-record: test-record
-		  runname: runname
-		  ;; test-name: test-name
-		  ;; item-path: item-path
-		  ;; jobgroup: jobgroup
-		  max-concurrent-jobs: max-concurrent-jobs
-		  run-id: run-id
-		  ;; waitons: waitons
-		  ;; testmode: testmode
-		  test-patts: test-patts
-		  required-tests: required-tests
-		  test-registry: test-registry
-		  registry-mutex: registry-mutex
-		  flags: flags
-		  keyvals: keyvals
-		  run-info: run-info
-		  ;; newtal: newtal
-		  all-tests-registry: all-tests-registry
-		  ;; itemmaps: itemmaps
-		  ;; prereqs-not-met: (rmt:get-prereqs-not-met run-id waitons hed item-path mode: testmode itemmaps: itemmaps)
-		  ;; can-run-more-tests: (runs:can-run-more-tests run-id jobgroup max-concurrent-jobs) ;; look at the test jobgroup and tot jobs running
-		  )))
+         (tests-info            (mt:get-tests-for-run run-id #f '() '())) ;;  qryvals: "id,testname,item_path"))
+         (sorted-test-names     (tests:sort-by-priority-and-waiton test-records))
+         (test-registry         (make-hash-table))
+         (registry-mutex        (make-mutex))
+         (num-retries           0)
+         (max-retries           (config-lookup *configdat* "setup" "maxretries"))
+         (max-concurrent-jobs   (configf:lookup-number *configdat* "setup" "max_concurrent_jobs" default: 50))
+         (reglen                (if (number? reglen-in) reglen-in 1))
+         (last-time-incomplete  (- (current-seconds) 900)) ;; force at least one clean up cycle
+         (last-time-some-running (current-seconds))
+         ;; (tdbdat                (tasks:open-db))
+         (runsdat (make-runs:dat
+                   ;; hed: hed
+                   ;; tal: tal
+                   ;; reg: reg
+                   ;; reruns: reruns
+                   reglen: reglen
+                   regfull: #f ;; regfull
+                   ;; test-record: test-record
+                   runname: runname
+                   ;; test-name: test-name
+                   ;; item-path: item-path
+                   ;; jobgroup: jobgroup
+                   max-concurrent-jobs: max-concurrent-jobs
+                   run-id: run-id
+                   ;; waitons: waitons
+                   ;; testmode: testmode
+                   test-patts: test-patts
+                   required-tests: required-tests
+                   test-registry: test-registry
+                   registry-mutex: registry-mutex
+                   flags: flags
+                   keyvals: keyvals
+                   run-info: run-info
+                   ;; newtal: newtal
+                   all-tests-registry: all-tests-registry
+                   ;; itemmaps: itemmaps
+                   ;; prereqs-not-met: (rmt:get-prereqs-not-met run-id waitons hed item-path mode: testmode itemmaps: itemmaps)
+                   ;; can-run-more-tests: (runs:can-run-more-tests run-id jobgroup max-concurrent-jobs) ;; look at the test jobgroup and tot jobs running
+                   )))
 
     ;; Initialize the test-registery hash with tests that already have a record
     ;; convert state to symbol and use that as the hash value
     (for-each (lambda (trec)
 		(let ((id (db:test-get-id        trec))
@@ -1283,12 +1410,12 @@
 	;;     (server:kind-run *toppath*))
 	
 	(if (> num-running 0)
 	  (set! last-time-some-running (current-seconds)))
 
-      (if (> (current-seconds)(+ last-time-some-running (or (configf:lookup *configdat* "setup" "give-up-waiting") 36000)))
-	  (hash-table-set! *max-tries-hash* tfullname (+ (hash-table-ref/default *max-tries-hash* tfullname 0) 1)))
+        (if (> (current-seconds)(+ last-time-some-running (or (configf:lookup *configdat* "setup" "give-up-waiting") 36000)))
+            (hash-table-set! *max-tries-hash* tfullname (+ (hash-table-ref/default *max-tries-hash* tfullname 0) 1)))
 	;; (debug:print 0 *default-log-port* "max-tries-hash: " (hash-table->alist *max-tries-hash*))
 
 	;; Ensure all top level tests get registered. This way they show up as "NOT_STARTED" on the dashboard
 	;; and it is clear they *should* have run but did not.
 	(if (not (hash-table-ref/default test-registry (db:test-make-full-name test-name "") #f))
@@ -1309,11 +1436,11 @@
 			(runs:queue-next-reg tal reg reglen regfull)
 			reruns))))
 		  ;; (loop (car tal)(cdr tal) reg reruns))))
 
 	(runs:incremental-print-results run-id)
-	(debug:print 4 *default-log-port* "TOP OF LOOP => "
+	(debug:print 1 *default-log-port* "TOP OF LOOP => "
 		     "test-name: " test-name
 		     "\n  test-record  " test-record
 		     "\n  hed:         " hed
 		     "\n  itemdat:     " itemdat
 		     "\n  items:       " items
@@ -1350,10 +1477,17 @@
 				       #f))
 				 waitons))))) ;; could do this more elegantly with a marker....
 	  (debug:print 0 *default-log-port* "WARNING: Marking test " tfullname " as not runnable. It is waiting on tests that cannot be run. Giving up now.")
 	  (hash-table-set! test-registry tfullname 'removed))
 
+
+         ; BB - a possibility for preqfail propagation
+         ;; ((and (not items) (string? item-path) (not (equal? item-path ""))
+         ;;       (lset-intersection testmode '(itemmatch itemwait)))
+
+         ;;  )
+
 	 ;; items is #f then the test is ok to be handed off to launch (but not before)
 	 ;; 
 	 ((not items)
 	  (debug:print-info 4 *default-log-port* "OUTER COND: (not items)")
 	  (if (and (not (tests:match test-patts (tests:testqueue-get-testname test-record) item-path required: required-tests))
@@ -1410,10 +1544,12 @@
 	      (loop (car tal)(cdr tal) reg reruns)))
 	    
 	 ;; if items is a proc then need to run items:get-items-from-config, get the list and loop 
 	 ;;    - but only do that if resources exist to kick off the job
 	 ;; EXPAND ITEMS
+         ;; 
+         ;; * the condition for (eq? items 'have-procedure) below ensures that runs:expand-items is not called on the same test twice -- expand-items will flatten the procedure to an actual list of items.
 	 ((or (procedure? items)(eq? items 'have-procedure)) ;; BB - target vars are env vars here? to allow expansion of [items]\nsomething [system echo $SOMETARGVAR], which is wonky
 	  (let ((can-run-more    (runs:can-run-more-tests runsdat run-id jobgroup max-concurrent-jobs)))
 	    (if (and (list? can-run-more)
 		     (car can-run-more))
 		(let ((loop-list (runs:expand-items hed tal reg reruns regfull newtal jobgroup max-concurrent-jobs run-id waitons item-path testmode test-record can-run-more items runname tconfig reglen test-registry test-records itemmaps)))
@@ -1442,11 +1578,12 @@
 	 ((not (null? reg)) ;; could we get here with leftovers?
 	  (debug:print-info 0 *default-log-port* "Have leftovers!")
 	  (loop (car reg)(cdr reg) '() reruns))
 	 (else
 	  (debug:print-info 4 *default-log-port* "Exiting loop with...\n  hed=" hed "\n  tal=" tal "\n  reruns=" reruns))
-	 )))
+	 ))) ;; end loop on sorted test names
+    
     ;; now *if* -run-wait we wait for all tests to be done
     ;; Now wait for any RUNNING tests to complete (if in run-wait mode)
     (thread-sleep! 5) ;; I think there is a race condition here. Let states/statuses settle
     (let wait-loop ((num-running      (rmt:get-count-tests-running-for-run-id run-id))
 		    (prev-num-running 0))
@@ -1470,30 +1607,34 @@
     ;; LET* ((test-record
     ;; we get here on "drop through". All done!
     (runs:run-post-hook run-id)
     (debug:print-info 1 *default-log-port* "All tests launched")))
 
-(define (runs:calc-fails prereqs-not-met)
+(define (runs:calc-fails prereqs-not-met) ;; BB is this redundant with runs:runable-tests ?
   (filter (lambda (test)
-	    (and (vector? test) ;; not (string? test))
-		 (member (db:test-get-state test) '("INCOMPLETE" "COMPLETED"))
-		 (not (member (db:test-get-status test)
-			      '("PASS" "WARN" "CHECK" "WAIVED" "SKIP")))))
+            ;; keep only test records (vectors) that either carry one of the blocking statuses
+            ;; or have ended (INCOMPLETE/COMPLETED) without an acceptable status
+            (and (vector? test) ;; not (string? test))
+                 (let ((status (db:test-get-status test)))
+                   (or (member status '("TEN_STRIKES" "BLOCKED" "PREQ_FAIL" "ZERO_ITEMS" "PREQ_DISCARDED" "TIMED_OUT" "KILLED"))
+                       (and (member (db:test-get-state test) '("INCOMPLETE" "COMPLETED"))
+                            (not (member status '("PASS" "WARN" "CHECK" "WAIVED" "SKIP"))))))))
 	  prereqs-not-met))
 
 (define (runs:calc-prereq-fail prereqs-not-met)
   (filter (lambda (test)
 	    (and (vector? test) ;; not (string? test))
 		 (equal? (db:test-get-state test) "NOT_STARTED")
-		 (not (member (db:test-get-status test)
+                 (not (member (db:test-get-status test) ;; keeps NOT_STARTED records whose status is anything other than the two listed on the next line
 			      '("n/a" "KEEP_TRYING")))))
 	  prereqs-not-met))
 
-(define (runs:calc-not-completed prereqs-not-met)
-  (filter
+(define (runs:calc-not-completed prereqs-not-met) ;; filter out tests which have reached a ground state -- they are done one way or another. Non-vector entries are always kept.
+  (filter 
    (lambda (t)
      (or (not (vector? t))
-	 (not (member (db:test-get-state t) '("INCOMPLETE" "COMPLETED")))))
+         (and (not (member (db:test-get-status t) '("TEN_STRIKES" "BLOCKED" "PREQ_FAIL" "ZERO_ITEMS" "PREQ_DISCARDED" "TIMED_OUT" "KILLED"))) ;; a record is kept only if its status is not a ground status ...
+              (not (member (db:test-get-state t) '("INCOMPLETE" "COMPLETED")))))) ;; ... AND its state is not an ended state (as a plain `or` arm the status test could never drop anything)
    prereqs-not-met))
 
 ;; (define (runs:calc-not-completed prereqs-not-met)
 ;;   (filter
@@ -1507,18 +1648,18 @@
    (lambda (t)
      (or (not (vector? t))
 	 (and (equal? "NOT_STARTED" (db:test-get-state t))
 	      (member (db:test-get-status t)
 		      '("n/a" "KEEP_TRYING")))
-	 (and (equal? "RUNNING" (db:test-get-state t))))) ;; account for a test that is running
+	 (and (member (db:test-get-state t) '("RUNNING" "LAUNCHED" "REMOTEHOSTSTART" ))))) ;; account for a test that is running
    prereqs-not-met))
 
 (define (runs:pretty-string lst)
   (map (lambda (t)
 	 (if (not (vector? t))
 	     (conc t)
-	     (conc (db:test-get-testname t) ":" (db:test-get-state t) "/" (db:test-get-status t))))
+	     (conc (db:test-get-testname t)"/"(db:test-get-item-path t) ":" (db:test-get-state t) "/" (db:test-get-status t)))) ;; vectors render as testname/item-path:state/status; anything else is passed through conc unchanged
        lst))
 
 ;; parent-test is there as a placeholder for when parent-tests can be run as a setup step
 ;;
 (define (run:test run-id run-info keyvals runname test-record flags parent-test test-registry all-tests-registry)

Index: server.scm
==================================================================
--- server.scm
+++ server.scm
@@ -458,14 +458,15 @@
         (sync-stale-seconds (configf:lookup-number *configdat* "server" "sync-stale-seconds" default: 300))
 	(debug-mode   (debug:debug-mode 1))
 	(last-time    (current-seconds))
 	(no-sync-db   (db:open-no-sync-db))
         (sync-duration 0) ;; run time of the sync in milliseconds
-        (this-wd-num  (begin (mutex-lock! *wdnum*mutex) (let ((x *wdnum*)) (set! *wdnum* (add1 *wdnum*)) (mutex-unlock! *wdnum*mutex) x))))
+        ;;(this-wd-num  (begin (mutex-lock! *wdnum*mutex) (let ((x *wdnum*)) (set! *wdnum* (add1 *wdnum*)) (mutex-unlock! *wdnum*mutex) x)))
+        )
     (set! *no-sync-db* no-sync-db) ;; make the no sync db available to api calls
     (debug:print-info 2 *default-log-port* "Periodic sync thread started.")
-    (debug:print-info 3 *default-log-port* "watchdog starting. legacy-sync is " legacy-sync" pid="(current-process-id)" this-wd-num="this-wd-num)
+    (debug:print-info 3 *default-log-port* "watchdog starting. legacy-sync is " legacy-sync" pid="(current-process-id)  );;  " this-wd-num="this-wd-num)
     (if (and legacy-sync (not *time-to-exit*))
 	(let* (;;(dbstruct (db:setup))
 	       (mtdb       (dbr:dbstruct-mtdb dbstruct))
 	       (mtpath     (db:dbdat-get-path mtdb))
 	       (tmp-area   (common:get-db-tmp-area))
@@ -579,7 +580,7 @@
 			(delay-loop (+ count 1))))
 		  (if (not *time-to-exit*) (loop))))
 	    ;; time to exit, close the no-sync db here
 	    (db:no-sync-close-db no-sync-db)
 	    (if (common:low-noise-print 30)
-		(debug:print-info 0 *default-log-port* "Exiting watchdog timer, *time-to-exit* = " *time-to-exit*" pid="(current-process-id)" this-wd-num="this-wd-num)))))))
+		(debug:print-info 0 *default-log-port* "Exiting watchdog timer, *time-to-exit* = " *time-to-exit*" pid="(current-process-id) ))))))) ;;" this-wd-num="this-wd-num)))))))